efi.c 24.8 KB
Newer Older
H
Huang, Ying 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 * Common EFI (Extensible Firmware Interface) support functions
 * Based on Extensible Firmware Interface Specification version 1.0
 *
 * Copyright (C) 1999 VA Linux Systems
 * Copyright (C) 1999 Walt Drummond <drummond@valinux.com>
 * Copyright (C) 1999-2002 Hewlett-Packard Co.
 *	David Mosberger-Tang <davidm@hpl.hp.com>
 *	Stephane Eranian <eranian@hpl.hp.com>
 * Copyright (C) 2005-2008 Intel Co.
 *	Fenghua Yu <fenghua.yu@intel.com>
 *	Bibo Mao <bibo.mao@intel.com>
 *	Chandramouli Narayanan <mouli@linux.intel.com>
 *	Huang Ying <ying.huang@intel.com>
 *
 * Copied from efi_32.c to eliminate the duplicated code between EFI
 * 32/64 support code. --ying 2007-10-26
 *
 * All EFI Runtime Services are not implemented yet as EFI only
 * supports physical mode addressing on SoftSDV. This is to be fixed
 * in a future version.  --drummond 1999-07-20
 *
 * Implemented EFI runtime services and virtual mode calls.  --davidm
 *
 * Goutham Rao: <goutham.rao@intel.com>
 *	Skip non-WB memory and ignore empty memory ranges.
 */

29 30
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt

H
Huang, Ying 已提交
31 32 33
#include <linux/kernel.h>
#include <linux/init.h>
#include <linux/efi.h>
34
#include <linux/efi-bgrt.h>
35
#include <linux/export.h>
H
Huang, Ying 已提交
36
#include <linux/bootmem.h>
37
#include <linux/memblock.h>
H
Huang, Ying 已提交
38 39 40 41 42 43 44 45 46 47
#include <linux/spinlock.h>
#include <linux/uaccess.h>
#include <linux/time.h>
#include <linux/io.h>
#include <linux/reboot.h>
#include <linux/bcd.h>

#include <asm/setup.h>
#include <asm/efi.h>
#include <asm/time.h>
48 49
#include <asm/cacheflush.h>
#include <asm/tlbflush.h>
50
#include <asm/x86_init.h>
H
Huang, Ying 已提交
51 52 53 54 55 56

/* Non-zero enables the boot-time memory map dump (print_efi_memmap()). */
#define EFI_DEBUG	1

/*
 * Global EFI on/off switch.  Cleared by the "noefi" early parameter and by
 * efi_init() whenever one of its setup steps fails.
 */
int efi_enabled;
EXPORT_SYMBOL(efi_enabled);

57 58 59 60 61 62 63 64 65 66 67
/*
 * Global EFI state.  Every configuration-table address starts out as
 * EFI_INVALID_TABLE_ADDR; efi_config_init() overwrites the entries for the
 * tables the firmware actually provides.
 */
struct efi __read_mostly efi = {
	.mps        = EFI_INVALID_TABLE_ADDR,
	.acpi       = EFI_INVALID_TABLE_ADDR,
	.acpi20     = EFI_INVALID_TABLE_ADDR,
	.smbios     = EFI_INVALID_TABLE_ADDR,
	.sal_systab = EFI_INVALID_TABLE_ADDR,
	.boot_info  = EFI_INVALID_TABLE_ADDR,
	.hcdp       = EFI_INVALID_TABLE_ADDR,
	.uga        = EFI_INVALID_TABLE_ADDR,
	.uv_systab  = EFI_INVALID_TABLE_ADDR,
};
H
Huang, Ying 已提交
68 69 70 71
EXPORT_SYMBOL(efi);

/*
 * The firmware memory map: physical location, early mapping, descriptor
 * size/version and entry count, as filled in by
 * efi_memblock_x86_reserve_range() and efi_memmap_init().
 */
struct efi_memory_map memmap;

72 73 74
/* Selects the 64-bit system/config table layouts when parsing firmware data. */
bool efi_64bit;
/* Set by efi_init(): true when the firmware bitness matches the kernel's. */
static bool efi_native;

H
Harvey Harrison 已提交
75
/*
 * Physical-mode view of EFI: the system table's physical address plus the
 * physical entry points of get_time and set_virtual_address_map.
 */
static struct efi efi_phys __initdata;
H
Huang, Ying 已提交
76 77
/* Kernel-side copy of the firmware system table, filled by efi_systab_init(). */
static efi_system_table_t efi_systab __initdata;

78 79 80 81 82 83 84
/*
 * Early handler for the "noefi" kernel parameter: switches EFI support off.
 * The parameter value (@arg) is ignored.  Always returns 0.
 */
static int __init setup_noefi(char *arg)
{
	efi_enabled = 0;
	return 0;
}
early_param("noefi", setup_noefi);

85 86 87 88 89 90 91 92 93 94 95
/*
 * When non-zero, efi_memmap_init() feeds the EFI memory map into the e820
 * table via do_add_efi_memmap().
 */
int add_efi_memmap;
EXPORT_SYMBOL(add_efi_memmap);

/*
 * Early handler for the "add_efi_memmap" kernel parameter: requests that the
 * EFI memory map be added to e820.  The parameter value (@arg) is ignored.
 * Always returns 0.
 */
static int __init setup_add_efi_memmap(char *arg)
{
	add_efi_memmap = 1;
	return 0;
}
early_param("add_efi_memmap", setup_add_efi_memmap);


H
Huang, Ying 已提交
96 97
/*
 * Virtual-mode wrapper for the get_time runtime service.  The firmware
 * call is made with rtc_lock held (irqsave) and its status is returned
 * unchanged.
 */
static efi_status_t virt_efi_get_time(efi_time_t *tm, efi_time_cap_t *tc)
{
	efi_status_t ret;
	unsigned long irqflags;

	spin_lock_irqsave(&rtc_lock, irqflags);
	ret = efi_call_virt2(get_time, tm, tc);
	spin_unlock_irqrestore(&rtc_lock, irqflags);

	return ret;
}

/*
 * Virtual-mode wrapper for the set_time runtime service.  The firmware
 * call is made with rtc_lock held (irqsave) and its status is returned
 * unchanged.
 */
static efi_status_t virt_efi_set_time(efi_time_t *tm)
{
	efi_status_t ret;
	unsigned long irqflags;

	spin_lock_irqsave(&rtc_lock, irqflags);
	ret = efi_call_virt1(set_time, tm);
	spin_unlock_irqrestore(&rtc_lock, irqflags);

	return ret;
}

/*
 * Virtual-mode wrapper for the get_wakeup_time runtime service.  The
 * firmware call is made with rtc_lock held (irqsave) and its status is
 * returned unchanged.
 */
static efi_status_t virt_efi_get_wakeup_time(efi_bool_t *enabled,
					     efi_bool_t *pending,
					     efi_time_t *tm)
{
	efi_status_t ret;
	unsigned long irqflags;

	spin_lock_irqsave(&rtc_lock, irqflags);
	ret = efi_call_virt3(get_wakeup_time, enabled, pending, tm);
	spin_unlock_irqrestore(&rtc_lock, irqflags);

	return ret;
}

/*
 * Virtual-mode wrapper for the set_wakeup_time runtime service.  The
 * firmware call is made with rtc_lock held (irqsave) and its status is
 * returned unchanged.
 */
static efi_status_t virt_efi_set_wakeup_time(efi_bool_t enabled, efi_time_t *tm)
{
	efi_status_t ret;
	unsigned long irqflags;

	spin_lock_irqsave(&rtc_lock, irqflags);
	ret = efi_call_virt2(set_wakeup_time, enabled, tm);
	spin_unlock_irqrestore(&rtc_lock, irqflags);

	return ret;
}

/*
 * Virtual-mode wrapper for the get_variable runtime service; all
 * arguments are passed through and the firmware status is returned.
 */
static efi_status_t virt_efi_get_variable(efi_char16_t *name,
					  efi_guid_t *vendor,
					  u32 *attr,
					  unsigned long *data_size,
					  void *data)
{
	efi_status_t ret;

	ret = efi_call_virt5(get_variable, name, vendor, attr, data_size, data);

	return ret;
}

/*
 * Virtual-mode wrapper for the get_next_variable runtime service; all
 * arguments are passed through and the firmware status is returned.
 */
static efi_status_t virt_efi_get_next_variable(unsigned long *name_size,
					       efi_char16_t *name,
					       efi_guid_t *vendor)
{
	efi_status_t ret;

	ret = efi_call_virt3(get_next_variable, name_size, name, vendor);

	return ret;
}

static efi_status_t virt_efi_set_variable(efi_char16_t *name,
					  efi_guid_t *vendor,
165
					  u32 attr,
H
Huang, Ying 已提交
166 167 168 169 170 171 172 173
					  unsigned long data_size,
					  void *data)
{
	return efi_call_virt5(set_variable,
			      name, vendor, attr,
			      data_size, data);
}

174 175 176 177 178 179 180 181 182 183 184 185
/*
 * Virtual-mode wrapper for the query_variable_info runtime service.
 * Returns EFI_UNSUPPORTED without calling the firmware when
 * efi.runtime_version is below EFI_2_00_SYSTEM_TABLE_REVISION.
 */
static efi_status_t virt_efi_query_variable_info(u32 attr,
						 u64 *storage_space,
						 u64 *remaining_space,
						 u64 *max_variable_size)
{
	if (efi.runtime_version >= EFI_2_00_SYSTEM_TABLE_REVISION)
		return efi_call_virt4(query_variable_info, attr,
				      storage_space, remaining_space,
				      max_variable_size);

	return EFI_UNSUPPORTED;
}

H
Huang, Ying 已提交
186 187 188 189 190 191 192 193 194 195 196 197 198 199
/*
 * Virtual-mode wrapper for the get_next_high_mono_count runtime service;
 * returns the firmware status.
 */
static efi_status_t virt_efi_get_next_high_mono_count(u32 *count)
{
	efi_status_t ret;

	ret = efi_call_virt1(get_next_high_mono_count, count);

	return ret;
}

/*
 * Virtual-mode wrapper for the reset_system runtime service; all
 * arguments are passed through.  Nothing is returned to the caller.
 */
static void virt_efi_reset_system(int reset_type,
				  efi_status_t status,
				  unsigned long data_size,
				  efi_char16_t *data)
{
	efi_call_virt4(reset_system, reset_type, status, data_size, data);
}

200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221
/*
 * Virtual-mode wrapper for the update_capsule runtime service.
 * Returns EFI_UNSUPPORTED without calling the firmware when
 * efi.runtime_version is below EFI_2_00_SYSTEM_TABLE_REVISION.
 */
static efi_status_t virt_efi_update_capsule(efi_capsule_header_t **capsules,
					    unsigned long count,
					    unsigned long sg_list)
{
	if (efi.runtime_version >= EFI_2_00_SYSTEM_TABLE_REVISION)
		return efi_call_virt3(update_capsule, capsules, count,
				      sg_list);

	return EFI_UNSUPPORTED;
}

/*
 * Virtual-mode wrapper for the query_capsule_caps runtime service.
 * Returns EFI_UNSUPPORTED without calling the firmware when
 * efi.runtime_version is below EFI_2_00_SYSTEM_TABLE_REVISION.
 */
static efi_status_t virt_efi_query_capsule_caps(efi_capsule_header_t **capsules,
						unsigned long count,
						u64 *max_size,
						int *reset_type)
{
	if (efi.runtime_version >= EFI_2_00_SYSTEM_TABLE_REVISION)
		return efi_call_virt4(query_capsule_caps, capsules, count,
				      max_size, reset_type);

	return EFI_UNSUPPORTED;
}

H
Huang, Ying 已提交
222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237
/*
 * Call the firmware's set_virtual_address_map service through its
 * physical-mode entry point (efi_phys), bracketed by the physical-call
 * prolog/epilog.  Returns the firmware status.
 */
static efi_status_t __init phys_efi_set_virtual_address_map(
	unsigned long memory_map_size,
	unsigned long descriptor_size,
	u32 descriptor_version,
	efi_memory_desc_t *virtual_map)
{
	efi_status_t ret;

	efi_call_phys_prelog();
	ret = efi_call_phys4(efi_phys.set_virtual_address_map,
			     memory_map_size, descriptor_size,
			     descriptor_version, virtual_map);
	efi_call_phys_epilog();

	return ret;
}

238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253
/*
 * Physical-mode get_time: used as efi.get_time before the switch to
 * virtual mode.  The output buffers are handed to the firmware by
 * physical address, and the call is made with rtc_lock held (irqsave).
 */
static efi_status_t __init phys_efi_get_time(efi_time_t *tm,
					     efi_time_cap_t *tc)
{
	efi_status_t ret;
	unsigned long irqflags;

	spin_lock_irqsave(&rtc_lock, irqflags);

	efi_call_phys_prelog();
	ret = efi_call_phys2(efi_phys.get_time, virt_to_phys(tm),
			     virt_to_phys(tc));
	efi_call_phys_epilog();

	spin_unlock_irqrestore(&rtc_lock, irqflags);

	return ret;
}

int efi_set_rtc_mmss(unsigned long nowtime)
H
Huang, Ying 已提交
254 255 256 257 258 259 260 261
{
	int real_seconds, real_minutes;
	efi_status_t 	status;
	efi_time_t 	eft;
	efi_time_cap_t 	cap;

	status = efi.get_time(&eft, &cap);
	if (status != EFI_SUCCESS) {
262
		pr_err("Oops: efitime: can't read time!\n");
H
Huang, Ying 已提交
263 264 265 266 267 268 269 270 271 272 273 274 275
		return -1;
	}

	real_seconds = nowtime % 60;
	real_minutes = nowtime / 60;
	if (((abs(real_minutes - eft.minute) + 15)/30) & 1)
		real_minutes += 30;
	real_minutes %= 60;
	eft.minute = real_minutes;
	eft.second = real_seconds;

	status = efi.set_time(&eft);
	if (status != EFI_SUCCESS) {
276
		pr_err("Oops: efitime: can't write time!\n");
H
Huang, Ying 已提交
277 278 279 280 281
		return -1;
	}
	return 0;
}

282
unsigned long efi_get_time(void)
H
Huang, Ying 已提交
283 284 285 286 287 288 289
{
	efi_status_t status;
	efi_time_t eft;
	efi_time_cap_t cap;

	status = efi.get_time(&eft, &cap);
	if (status != EFI_SUCCESS)
290
		pr_err("Oops: efitime: can't read time!\n");
H
Huang, Ying 已提交
291 292 293 294 295

	return mktime(eft.year, eft.month, eft.day, eft.hour,
		      eft.minute, eft.second);
}

296 297 298 299 300 301
/*
 * Tell the kernel about the EFI memory map.  This might include
 * more than the max 128 entries that can fit in the e820 legacy
 * (zeropage) memory map.
 */

302
static void __init do_add_efi_memmap(void)
303 304 305 306 307 308 309 310 311
{
	void *p;

	for (p = memmap.map; p < memmap.map_end; p += memmap.desc_size) {
		efi_memory_desc_t *md = p;
		unsigned long long start = md->phys_addr;
		unsigned long long size = md->num_pages << EFI_PAGE_SHIFT;
		int e820_type;

312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337
		switch (md->type) {
		case EFI_LOADER_CODE:
		case EFI_LOADER_DATA:
		case EFI_BOOT_SERVICES_CODE:
		case EFI_BOOT_SERVICES_DATA:
		case EFI_CONVENTIONAL_MEMORY:
			if (md->attribute & EFI_MEMORY_WB)
				e820_type = E820_RAM;
			else
				e820_type = E820_RESERVED;
			break;
		case EFI_ACPI_RECLAIM_MEMORY:
			e820_type = E820_ACPI;
			break;
		case EFI_ACPI_MEMORY_NVS:
			e820_type = E820_NVS;
			break;
		case EFI_UNUSABLE_MEMORY:
			e820_type = E820_UNUSABLE;
			break;
		default:
			/*
			 * EFI_RESERVED_TYPE EFI_RUNTIME_SERVICES_CODE
			 * EFI_RUNTIME_SERVICES_DATA EFI_MEMORY_MAPPED_IO
			 * EFI_MEMORY_MAPPED_IO_PORT_SPACE EFI_PAL_CODE
			 */
338
			e820_type = E820_RESERVED;
339 340
			break;
		}
341
		e820_add_region(start, size, e820_type);
342 343 344 345
	}
	sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map);
}

346
/*
 * Record where the boot loader left the EFI memory map (from
 * boot_params.efi_info) in the global memmap and reserve that range in
 * memblock.
 *
 * Returns 0 on success, or -EINVAL on 32-bit kernels when the map lies
 * above 4GB.
 */
int __init efi_memblock_x86_reserve_range(void)
{
	struct efi_info *info = &boot_params.efi_info;
	unsigned long map_phys;

#ifdef CONFIG_X86_32
	/* Can't handle data above 4GB at this time */
	if (info->efi_memmap_hi) {
		pr_err("Memory map is above 4GB, disabling EFI.\n");
		return -EINVAL;
	}
	map_phys = info->efi_memmap;
#else
	map_phys = (info->efi_memmap |
		    ((__u64)info->efi_memmap_hi << 32));
#endif

	memmap.phys_map = (void *)map_phys;
	memmap.desc_size = info->efi_memdesc_size;
	memmap.desc_version = info->efi_memdesc_version;
	memmap.nr_map = info->efi_memmap_size / info->efi_memdesc_size;

	memblock_reserve(map_phys, memmap.nr_map * memmap.desc_size);

	return 0;
}

H
Huang, Ying 已提交
371 372 373 374 375 376 377 378 379 380 381
#if EFI_DEBUG
/*
 * Log one line per EFI memory descriptor: index, type, attributes,
 * physical range and size in megabytes.
 */
static void __init print_efi_memmap(void)
{
	void *cur = memmap.map;
	int idx = 0;

	while (cur < memmap.map_end) {
		efi_memory_desc_t *desc = cur;

		pr_info("mem%02u: type=%u, attr=0x%llx, "
			"range=[0x%016llx-0x%016llx) (%lluMB)\n",
			idx, desc->type, desc->attribute, desc->phys_addr,
			desc->phys_addr + (desc->num_pages << EFI_PAGE_SHIFT),
			(desc->num_pages >> (20 - EFI_PAGE_SHIFT)));

		cur += memmap.desc_size;
		idx++;
	}
}
#endif  /*  EFI_DEBUG  */

391 392 393 394 395 396
/*
 * Reserve every EFI boot-services code/data region in memblock.
 *
 * A region is skipped, and its num_pages zeroed so that
 * efi_free_boot_services() ignores it later, when it
 *  - touches the kernel image (_text.._end),
 *  - is not entirely E820_RAM, or
 *  - overlaps a range that is already reserved.
 */
void __init efi_reserve_boot_services(void)
{
	void *cur;

	for (cur = memmap.map; cur < memmap.map_end; cur += memmap.desc_size) {
		efi_memory_desc_t *desc = cur;
		u64 base = desc->phys_addr;
		u64 len = desc->num_pages << EFI_PAGE_SHIFT;

		if (desc->type != EFI_BOOT_SERVICES_CODE &&
		    desc->type != EFI_BOOT_SERVICES_DATA)
			continue;

		if ((base + len >= virt_to_phys(_text) &&
		     base <= virt_to_phys(_end)) ||
		    !e820_all_mapped(base, base + len, E820_RAM) ||
		    memblock_is_region_reserved(base, len)) {
			/* Could not reserve, skip it */
			desc->num_pages = 0;
			memblock_dbg("Could not reserve boot range "
					"[0x%010llx-0x%010llx]\n",
						base, base + len - 1);
			continue;
		}

		memblock_reserve(base, len);
	}
}

423 424 425 426 427 428 429 430 431
/*
 * Drop the early mapping of the EFI memory map, if there is one, and
 * clear memmap.map so later users can tell it is gone.
 */
static void __init efi_unmap_memmap(void)
{
	if (!memmap.map)
		return;

	early_iounmap(memmap.map, memmap.nr_map * memmap.desc_size);
	memmap.map = NULL;
}

/*
 * Hand the boot-services regions back to the page allocator and unmap
 * the EFI memory map.  Does nothing on non-native EFI.  Regions whose
 * size is zero (those efi_reserve_boot_services() could not reserve)
 * are skipped.
 */
void __init efi_free_boot_services(void)
{
	void *cur;

	if (!efi_native)
		return;

	for (cur = memmap.map; cur < memmap.map_end; cur += memmap.desc_size) {
		efi_memory_desc_t *desc = cur;
		unsigned long long base = desc->phys_addr;
		unsigned long long len = desc->num_pages << EFI_PAGE_SHIFT;
		bool boot_services = desc->type == EFI_BOOT_SERVICES_CODE ||
				     desc->type == EFI_BOOT_SERVICES_DATA;

		/* A zero length means the area could not be reserved. */
		if (!boot_services || !len)
			continue;

		free_bootmem_late(base, len);
	}

	efi_unmap_memmap();
}

457
/*
 * Copy the firmware system table found at physical address @phys into
 * the kernel's own efi_systab, using the 32- or 64-bit layout selected
 * by efi_64bit, then point efi.systab at the copy and check its
 * signature.
 *
 * Returns 0 on success, -ENOMEM if the table cannot be mapped, or
 * -EINVAL if the signature is wrong or (32-bit kernels only) a 64-bit
 * table refers to memory above 4GB.  A major revision of 0 only
 * produces a warning.
 */
static int __init efi_systab_init(void *phys)
{
	if (!efi_64bit) {
		efi_system_table_32_t *st32;

		st32 = early_ioremap((unsigned long)phys, sizeof(*st32));
		if (!st32) {
			pr_err("Couldn't map the system table!\n");
			return -ENOMEM;
		}

		efi_systab.hdr = st32->hdr;
		efi_systab.fw_vendor = st32->fw_vendor;
		efi_systab.fw_revision = st32->fw_revision;
		efi_systab.con_in_handle = st32->con_in_handle;
		efi_systab.con_in = st32->con_in;
		efi_systab.con_out_handle = st32->con_out_handle;
		efi_systab.con_out = st32->con_out;
		efi_systab.stderr_handle = st32->stderr_handle;
		efi_systab.stderr = st32->stderr;
		efi_systab.runtime = (void *)(unsigned long)st32->runtime;
		efi_systab.boottime = (void *)(unsigned long)st32->boottime;
		efi_systab.nr_tables = st32->nr_tables;
		efi_systab.tables = st32->tables;

		early_iounmap(st32, sizeof(*st32));
	} else {
		efi_system_table_64_t *st64;
		u64 addr_bits;

		st64 = early_ioremap((unsigned long)phys, sizeof(*st64));
		if (!st64) {
			pr_err("Couldn't map the system table!\n");
			return -ENOMEM;
		}

		efi_systab.hdr = st64->hdr;
		efi_systab.fw_vendor = st64->fw_vendor;
		efi_systab.fw_revision = st64->fw_revision;
		efi_systab.con_in_handle = st64->con_in_handle;
		efi_systab.con_in = st64->con_in;
		efi_systab.con_out_handle = st64->con_out_handle;
		efi_systab.con_out = st64->con_out;
		efi_systab.stderr_handle = st64->stderr_handle;
		efi_systab.stderr = st64->stderr;
		efi_systab.runtime = (void *)(unsigned long)st64->runtime;
		efi_systab.boottime = (void *)(unsigned long)st64->boottime;
		efi_systab.nr_tables = st64->nr_tables;
		efi_systab.tables = st64->tables;

		/*
		 * OR together every address-carrying field so a single
		 * test below can tell whether any of them is above 4GB.
		 */
		addr_bits = st64->fw_vendor |
			    st64->con_in_handle | st64->con_in |
			    st64->con_out_handle | st64->con_out |
			    st64->stderr_handle | st64->stderr |
			    st64->runtime | st64->boottime |
			    st64->tables;

		early_iounmap(st64, sizeof(*st64));
#ifdef CONFIG_X86_32
		if (addr_bits >> 32) {
			pr_err("EFI data located above 4GB, disabling EFI.\n");
			return -EINVAL;
		}
#endif
	}

	efi.systab = &efi_systab;

	/* Sanity-check the copied table. */
	if (efi.systab->hdr.signature != EFI_SYSTEM_TABLE_SIGNATURE) {
		pr_err("System table signature incorrect!\n");
		return -EINVAL;
	}

	if (!(efi.systab->hdr.revision >> 16))
		pr_err("Warning: System table version "
		       "%d.%02d, expected 1.00 or greater!\n",
		       efi.systab->hdr.revision >> 16,
		       efi.systab->hdr.revision & 0xffff);

	return 0;
}
H
Huang, Ying 已提交
545

546
/*
 * Walk the firmware configuration table array and record the addresses
 * of the tables the kernel knows about (MPS, ACPI, SMBIOS, UV, HCDP,
 * UGA) in the global efi structure.
 *
 * @tables:    physical address of the configuration table array
 * @nr_tables: number of entries in that array
 *
 * The array is mapped, iterated and unmapped using @nr_tables
 * throughout, so the range that is read always matches the range that
 * was mapped.
 *
 * Returns 0 on success, -ENOMEM if the array cannot be mapped, or
 * -EINVAL on a 32-bit kernel when a 64-bit entry points above 4GB.
 */
static int __init efi_config_init(u64 tables, int nr_tables)
{
	void *config_tables, *tablep;
	int i, sz;

	/* Entry size depends on the firmware's bitness, not the kernel's. */
	if (efi_64bit)
		sz = sizeof(efi_config_table_64_t);
	else
		sz = sizeof(efi_config_table_32_t);

	/*
	 * Let's see what config tables the firmware passed to us.
	 */
	config_tables = early_ioremap(tables, nr_tables * sz);
	if (config_tables == NULL) {
		pr_err("Could not map Configuration table!\n");
		return -ENOMEM;
	}

	tablep = config_tables;
	/* Start the log line; the table addresses follow via pr_cont(). */
	pr_info("");
	for (i = 0; i < nr_tables; i++) {
		efi_guid_t guid;
		unsigned long table;

		if (efi_64bit) {
			u64 table64;
			guid = ((efi_config_table_64_t *)tablep)->guid;
			table64 = ((efi_config_table_64_t *)tablep)->table;
			table = table64;
#ifdef CONFIG_X86_32
			if (table64 >> 32) {
				pr_cont("\n");
				pr_err("Table located above 4GB, disabling EFI.\n");
				early_iounmap(config_tables,
					      nr_tables * sz);
				return -EINVAL;
			}
#endif
		} else {
			guid = ((efi_config_table_32_t *)tablep)->guid;
			table = ((efi_config_table_32_t *)tablep)->table;
		}
		if (!efi_guidcmp(guid, MPS_TABLE_GUID)) {
			efi.mps = table;
			pr_cont(" MPS=0x%lx ", table);
		} else if (!efi_guidcmp(guid, ACPI_20_TABLE_GUID)) {
			efi.acpi20 = table;
			pr_cont(" ACPI 2.0=0x%lx ", table);
		} else if (!efi_guidcmp(guid, ACPI_TABLE_GUID)) {
			efi.acpi = table;
			pr_cont(" ACPI=0x%lx ", table);
		} else if (!efi_guidcmp(guid, SMBIOS_TABLE_GUID)) {
			efi.smbios = table;
			pr_cont(" SMBIOS=0x%lx ", table);
#ifdef CONFIG_X86_UV
		} else if (!efi_guidcmp(guid, UV_SYSTEM_TABLE_GUID)) {
			efi.uv_systab = table;
			pr_cont(" UVsystab=0x%lx ", table);
#endif
		} else if (!efi_guidcmp(guid, HCDP_TABLE_GUID)) {
			efi.hcdp = table;
			pr_cont(" HCDP=0x%lx ", table);
		} else if (!efi_guidcmp(guid, UGA_IO_PROTOCOL_GUID)) {
			efi.uga = table;
			pr_cont(" UGA=0x%lx ", table);
		}
		tablep += sz;
	}
	pr_cont("\n");
	early_iounmap(config_tables, nr_tables * sz);
	return 0;
}

620
/*
 * Temporarily map the firmware's runtime services table and save the
 * physical entry points of the two services needed before virtual mode
 * is entered: get_time and set_virtual_address_map.  efi.get_time is
 * pointed at the physical-mode wrapper so that efi_get_time() works
 * early.
 *
 * Returns 0 on success or -ENOMEM if the table cannot be mapped.
 */
static int __init efi_runtime_init(void)
{
	efi_runtime_services_t *rt_svc;

	rt_svc = early_ioremap((unsigned long)efi.systab->runtime,
			       sizeof(efi_runtime_services_t));
	if (rt_svc == NULL) {
		pr_err("Could not map the runtime service table!\n");
		return -ENOMEM;
	}

	/* Only these two services are needed this early. */
	efi_phys.get_time = (efi_get_time_t *)rt_svc->get_time;
	efi_phys.set_virtual_address_map =
		(efi_set_virtual_address_map_t *)
		rt_svc->set_virtual_address_map;

	/* Allow efi_get_time() to be called before virtual mode. */
	efi.get_time = phys_efi_get_time;

	early_iounmap(rt_svc, sizeof(efi_runtime_services_t));

	return 0;
}
H
Huang, Ying 已提交
654

655
/*
 * Create the early mapping of the EFI memory map and, when the
 * add_efi_memmap option is set, merge the map into e820.
 *
 * Returns 0 on success or -ENOMEM if the map cannot be mapped.
 */
static int __init efi_memmap_init(void)
{
	unsigned long map_bytes = memmap.nr_map * memmap.desc_size;

	/* Map the EFI memory map */
	memmap.map = early_ioremap((unsigned long)memmap.phys_map, map_bytes);
	if (!memmap.map) {
		pr_err("Could not map the memory map!\n");
		return -ENOMEM;
	}
	memmap.map_end = memmap.map + map_bytes;

	if (add_efi_memmap)
		do_add_efi_memmap();

	return 0;
}

/*
 * Early EFI bring-up: locate and copy the system table, print the
 * firmware vendor and revision, parse the configuration tables, save
 * the early runtime service entry points (native firmware only) and map
 * the memory map.  Any failing step clears efi_enabled and aborts.
 */
void __init efi_init(void)
{
	efi_char16_t *c16;
	char vendor[100] = "unknown";
	int i = 0;
	void *tmp;

#ifdef CONFIG_X86_32
	if (boot_params.efi_info.efi_systab_hi ||
	    boot_params.efi_info.efi_memmap_hi) {
		pr_info("Table located above 4GB, disabling EFI.\n");
		efi_enabled = 0;
		return;
	}
	efi_phys.systab = (efi_system_table_t *)boot_params.efi_info.efi_systab;
	efi_native = !efi_64bit;
#else
	efi_phys.systab = (efi_system_table_t *)
			  (boot_params.efi_info.efi_systab |
			  ((__u64)boot_params.efi_info.efi_systab_hi<<32));
	efi_native = efi_64bit;
#endif

	if (efi_systab_init(efi_phys.systab)) {
		efi_enabled = 0;
		return;
	}

	/*
	 * Show what we know for posterity.
	 *
	 * Map enough of the UTF-16 vendor string to cover everything the
	 * copy loop below may read (at most sizeof(vendor) - 1 characters),
	 * and only unmap when the mapping actually succeeded.
	 */
	c16 = tmp = early_ioremap(efi.systab->fw_vendor,
				  sizeof(vendor) * sizeof(efi_char16_t));
	if (c16) {
		/* Narrow each UTF-16 code unit to a char. */
		for (i = 0; i < sizeof(vendor) - 1 && *c16; ++i)
			vendor[i] = *c16++;
		vendor[i] = '\0';
		early_iounmap(tmp, sizeof(vendor) * sizeof(efi_char16_t));
	} else
		pr_err("Could not map the firmware vendor!\n");

	pr_info("EFI v%u.%.02u by %s\n",
		efi.systab->hdr.revision >> 16,
		efi.systab->hdr.revision & 0xffff, vendor);

	if (efi_config_init(efi.systab->tables, efi.systab->nr_tables)) {
		efi_enabled = 0;
		return;
	}

	/*
	 * Note: We currently don't support runtime services on an EFI
	 * that doesn't match the kernel 32/64-bit mode.
	 */

	if (!efi_native)
		pr_info("No EFI runtime due to 32/64-bit mismatch with kernel\n");
	else if (efi_runtime_init()) {
		efi_enabled = 0;
		return;
	}

	if (efi_memmap_init()) {
		efi_enabled = 0;
		return;
	}
#ifdef CONFIG_X86_32
	/* Use the EFI clock as wall clock on native 32-bit firmware. */
	if (efi_native) {
		x86_platform.get_wallclock = efi_get_time;
		x86_platform.set_wallclock = efi_set_rtc_mmss;
	}
#endif

#if EFI_DEBUG
	print_efi_memmap();
#endif
}

749 750 751 752 753
/* Late EFI initialisation hook: currently only runs efi_bgrt_init(). */
void __init efi_late_init(void)
{
	efi_bgrt_init();
}

754 755 756 757 758 759 760 761 762 763 764 765 766 767 768
/*
 * Mark the virtual range described by @md executable (@executable true)
 * or non-executable (@executable false).  The EFI address and page
 * count are converted with memrange_efi_to_native() first.
 */
void __init efi_set_executable(efi_memory_desc_t *md, bool executable)
{
	u64 vaddr = md->virt_addr;
	u64 pages = md->num_pages;

	memrange_efi_to_native(&vaddr, &pages);

	if (!executable)
		set_memory_nx(vaddr, pages);
	else
		set_memory_x(vaddr, pages);
}

769 770 771 772 773 774 775 776
/* Make every EFI runtime services code region executable. */
static void __init runtime_code_page_mkexec(void)
{
	void *cur;

	for (cur = memmap.map; cur < memmap.map_end; cur += memmap.desc_size) {
		efi_memory_desc_t *desc = cur;

		if (desc->type == EFI_RUNTIME_SERVICES_CODE)
			efi_set_executable(desc, true);
	}
}

785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812
/*
 * Translate @phys_addr to the virtual address it already has in the EFI
 * memory map.  Data in EFI boot services RAM cannot be ioremap()ed
 * because it is already mapped as RAM, so the existing mapping is
 * looked up instead.  Only runtime and boot-services regions that have
 * a virtual address are considered.
 *
 * Only callable after efi_enter_virtual_mode() and before
 * efi_free_boot_services().  Returns NULL (with a warning) if the
 * memory map is no longer mapped, or NULL if no region matches.
 */
void __iomem *efi_lookup_mapped_addr(u64 phys_addr)
{
	void *cur;

	if (WARN_ON(!memmap.map))
		return NULL;

	for (cur = memmap.map; cur < memmap.map_end; cur += memmap.desc_size) {
		efi_memory_desc_t *desc = cur;
		u64 len = desc->num_pages << EFI_PAGE_SHIFT;
		u64 limit = desc->phys_addr + len;
		bool boot_services = desc->type == EFI_BOOT_SERVICES_CODE ||
				     desc->type == EFI_BOOT_SERVICES_DATA;

		if (!(desc->attribute & EFI_MEMORY_RUNTIME) && !boot_services)
			continue;
		if (!desc->virt_addr)
			continue;
		if (phys_addr < desc->phys_addr || phys_addr >= limit)
			continue;

		phys_addr += desc->virt_addr - desc->phys_addr;
		return (__force void __iomem *)(unsigned long)phys_addr;
	}

	return NULL;
}

H
Huang, Ying 已提交
813 814 815 816 817 818 819 820 821 822
/*
 * This function will switch the EFI runtime services to virtual mode.
 * Essentially, look through the EFI memmap and map every region that
 * has the runtime attribute bit set in its memory descriptor and update
 * that memory descriptor with the virtual address obtained from ioremap().
 * This enables the runtime services to be called without having to
 * thunk back into physical mode for every invocation.
 *
 * Boot services code/data regions are mapped as well.  On non-native
 * firmware nothing is mapped and the memory map is simply unmapped.
 *
 * If the descriptor array handed to SetVirtualAddressMap() cannot be
 * allocated, an error is logged and the function returns without
 * installing the virtual-mode service pointers.  A failing
 * SetVirtualAddressMap() call panics.
 */
void __init efi_enter_virtual_mode(void)
{
	efi_memory_desc_t *md, *prev_md = NULL;
	efi_status_t status;
	unsigned long size;
	u64 end, systab, addr, npages, end_pfn;
	void *p, *va, *new_memmap = NULL;
	void *grown;
	int count = 0;

	efi.systab = NULL;

	/*
	 * We don't do virtual mode, since we don't do runtime services, on
	 * non-native EFI
	 */

	if (!efi_native) {
		efi_unmap_memmap();
		return;
	}

	/* Merge contiguous regions of the same type and attribute */
	for (p = memmap.map; p < memmap.map_end; p += memmap.desc_size) {
		u64 prev_size;
		md = p;

		if (!prev_md) {
			prev_md = md;
			continue;
		}

		if (prev_md->type != md->type ||
		    prev_md->attribute != md->attribute) {
			prev_md = md;
			continue;
		}

		prev_size = prev_md->num_pages << EFI_PAGE_SHIFT;

		if (md->phys_addr == (prev_md->phys_addr + prev_size)) {
			/*
			 * Fold this entry into its predecessor and neutralise
			 * it so the mapping loop below skips it.
			 */
			prev_md->num_pages += md->num_pages;
			md->type = EFI_RESERVED_TYPE;
			md->attribute = 0;
			continue;
		}
		prev_md = md;
	}

	for (p = memmap.map; p < memmap.map_end; p += memmap.desc_size) {
		md = p;
		if (!(md->attribute & EFI_MEMORY_RUNTIME) &&
		    md->type != EFI_BOOT_SERVICES_CODE &&
		    md->type != EFI_BOOT_SERVICES_DATA)
			continue;

		size = md->num_pages << EFI_PAGE_SHIFT;
		end = md->phys_addr + size;

		/*
		 * Reuse the kernel direct mapping when the region is already
		 * covered by it; otherwise create a new mapping.
		 */
		end_pfn = PFN_UP(end);
		if (end_pfn <= max_low_pfn_mapped
		    || (end_pfn > (1UL << (32 - PAGE_SHIFT))
			&& end_pfn <= max_pfn_mapped))
			va = __va(md->phys_addr);
		else
			va = efi_ioremap(md->phys_addr, size, md->type);

		md->virt_addr = (u64) (unsigned long) va;

		if (!va) {
			pr_err("ioremap of 0x%llX failed!\n",
			       (unsigned long long)md->phys_addr);
			continue;
		}

		if (!(md->attribute & EFI_MEMORY_WB)) {
			addr = md->virt_addr;
			npages = md->num_pages;
			memrange_efi_to_native(&addr, &npages);
			set_memory_uc(addr, npages);
		}

		/* Remember the virtual address of the system table. */
		systab = (u64) (unsigned long) efi_phys.systab;
		if (md->phys_addr <= systab && systab < end) {
			systab += md->virt_addr - md->phys_addr;
			efi.systab = (efi_system_table_t *) (unsigned long) systab;
		}

		/*
		 * Append this descriptor to the array passed to the firmware.
		 * krealloc() leaves the old buffer intact on failure, so keep
		 * the old pointer until the new one is known to be valid.
		 */
		grown = krealloc(new_memmap,
				 (count + 1) * memmap.desc_size,
				 GFP_KERNEL);
		if (!grown) {
			kfree(new_memmap);
			pr_err("Error reallocating memory, EFI runtime non-functional!\n");
			return;
		}
		new_memmap = grown;
		memcpy(new_memmap + (count * memmap.desc_size), md,
		       memmap.desc_size);
		count++;
	}

	BUG_ON(!efi.systab);

	status = phys_efi_set_virtual_address_map(
		memmap.desc_size * count,
		memmap.desc_size,
		memmap.desc_version,
		(efi_memory_desc_t *)__pa(new_memmap));

	if (status != EFI_SUCCESS) {
		pr_alert("Unable to switch EFI into virtual mode "
			 "(status=%lx)!\n", status);
		panic("EFI call to SetVirtualAddressMap() failed!");
	}

	/*
	 * Now that EFI is in virtual mode, update the function
	 * pointers in the runtime service table to the new virtual addresses.
	 *
	 * Call EFI services through wrapper functions.
	 *
	 * runtime_version is compared against EFI_2_00_SYSTEM_TABLE_REVISION
	 * by the wrappers, so it must hold the specification revision from
	 * the table header, not the vendor's firmware revision.
	 */
	efi.runtime_version = efi_systab.hdr.revision;
	efi.get_time = virt_efi_get_time;
	efi.set_time = virt_efi_set_time;
	efi.get_wakeup_time = virt_efi_get_wakeup_time;
	efi.set_wakeup_time = virt_efi_set_wakeup_time;
	efi.get_variable = virt_efi_get_variable;
	efi.get_next_variable = virt_efi_get_next_variable;
	efi.set_variable = virt_efi_set_variable;
	efi.get_next_high_mono_count = virt_efi_get_next_high_mono_count;
	efi.reset_system = virt_efi_reset_system;
	efi.set_virtual_address_map = NULL;
	efi.query_variable_info = virt_efi_query_variable_info;
	efi.update_capsule = virt_efi_update_capsule;
	efi.query_capsule_caps = virt_efi_query_capsule_caps;
	if (__supported_pte_mask & _PAGE_NX)
		runtime_code_page_mkexec();

	kfree(new_memmap);
}

/*
 * Convenience functions to obtain memory types and attributes
 */
u32 efi_mem_type(unsigned long phys_addr)
{
	efi_memory_desc_t *md;
	void *p;

	for (p = memmap.map; p < memmap.map_end; p += memmap.desc_size) {
		md = p;
		if ((md->phys_addr <= phys_addr) &&
		    (phys_addr < (md->phys_addr +
				  (md->num_pages << EFI_PAGE_SHIFT))))
			return md->type;
	}
	return 0;
}

/*
 * Return the EFI attribute bits of the region containing @phys_addr, or
 * 0 if no descriptor in the memory map covers it.
 */
u64 efi_mem_attributes(unsigned long phys_addr)
{
	void *cur;

	for (cur = memmap.map; cur < memmap.map_end; cur += memmap.desc_size) {
		efi_memory_desc_t *desc = cur;
		u64 limit = desc->phys_addr +
			    (desc->num_pages << EFI_PAGE_SHIFT);

		if (phys_addr >= desc->phys_addr && phys_addr < limit)
			return desc->attribute;
	}

	return 0;
}