setup.c 33.4 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 *  Copyright (C) 1995  Linus Torvalds
 *
 *  Support of BIGMEM added by Gerhard Wichert, Siemens AG, July 1999
 *
 *  Memory region support
 *	David Parsons <orc@pell.chi.il.us>, July-August 1999
 *
 *  Added E820 sanitization routine (removes overlapping memory regions);
 *  Brian Moyle <bmoyle@mvista.com>, February 2001
 *
 * Moved CPU detection code to cpu/${cpu}.c
 *    Patrick Mochel <mochel@osdl.org>, March 2002
 *
 *  Provisions for empty E820 memory regions (reported by certain BIOSes).
 *  Alex Achenbach <xela@slit.de>, December 2002.
 *
 */

/*
 * This file handles the architecture-dependent parts of initialization
 */

#include <linux/sched.h>
#include <linux/mm.h>
26
#include <linux/mmzone.h>
27
#include <linux/screen_info.h>
L
Linus Torvalds 已提交
28 29
#include <linux/ioport.h>
#include <linux/acpi.h>
F
Feng Tang 已提交
30
#include <linux/sfi.h>
L
Linus Torvalds 已提交
31 32 33
#include <linux/apm_bios.h>
#include <linux/initrd.h>
#include <linux/bootmem.h>
34
#include <linux/memblock.h>
L
Linus Torvalds 已提交
35 36 37 38
#include <linux/seq_file.h>
#include <linux/console.h>
#include <linux/root_dev.h>
#include <linux/highmem.h>
39
#include <linux/export.h>
L
Linus Torvalds 已提交
40 41 42
#include <linux/efi.h>
#include <linux/init.h>
#include <linux/edd.h>
43
#include <linux/iscsi_ibft.h>
L
Linus Torvalds 已提交
44
#include <linux/nodemask.h>
45
#include <linux/kexec.h>
46
#include <linux/dmi.h>
D
Dave Hansen 已提交
47
#include <linux/pfn.h>
48
#include <linux/pci.h>
49
#include <asm/pci-direct.h>
50
#include <linux/init_ohci1394_dma.h>
51
#include <linux/kvm_para.h>
52
#include <linux/dma-contiguous.h>
53

54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
#include <linux/errno.h>
#include <linux/kernel.h>
#include <linux/stddef.h>
#include <linux/unistd.h>
#include <linux/ptrace.h>
#include <linux/user.h>
#include <linux/delay.h>

#include <linux/kallsyms.h>
#include <linux/cpufreq.h>
#include <linux/dma-mapping.h>
#include <linux/ctype.h>
#include <linux/uaccess.h>

#include <linux/percpu.h>
#include <linux/crash_dump.h>
70
#include <linux/tboot.h>
71
#include <linux/jiffies.h>
72
#include <linux/mem_encrypt.h>
73

74
#include <linux/usb/xhci-dbgp.h>
L
Linus Torvalds 已提交
75
#include <video/edid.h>
76

77
#include <asm/mtrr.h>
78
#include <asm/apic.h>
79
#include <asm/realmode.h>
80
#include <asm/e820/api.h>
L
Linus Torvalds 已提交
81 82
#include <asm/mpspec.h>
#include <asm/setup.h>
Y
Yinghai Lu 已提交
83
#include <asm/efi.h>
I
Ingo Molnar 已提交
84 85
#include <asm/timer.h>
#include <asm/i8259.h>
L
Linus Torvalds 已提交
86 87 88
#include <asm/sections.h>
#include <asm/io_apic.h>
#include <asm/ist.h>
89
#include <asm/setup_arch.h>
90
#include <asm/bios_ebda.h>
B
Bernhard Walle 已提交
91
#include <asm/cacheflush.h>
92
#include <asm/processor.h>
Y
Yinghai Lu 已提交
93
#include <asm/bugs.h>
A
Andrey Ryabinin 已提交
94
#include <asm/kasan.h>
L
Linus Torvalds 已提交
95

96
#include <asm/vsyscall.h>
97
#include <asm/cpu.h>
98 99
#include <asm/desc.h>
#include <asm/dma.h>
100
#include <asm/iommu.h>
101
#include <asm/gart.h>
102 103 104 105
#include <asm/mmu_context.h>
#include <asm/proto.h>

#include <asm/paravirt.h>
106
#include <asm/hypervisor.h>
107
#include <asm/olpc_ofw.h>
108 109 110 111

#include <asm/percpu.h>
#include <asm/topology.h>
#include <asm/apicdef.h>
112
#include <asm/amd_nb.h>
113
#include <asm/mce.h>
114
#include <asm/alternative.h>
115
#include <asm/prom.h>
116
#include <asm/microcode.h>
117
#include <asm/mmu_context.h>
118
#include <asm/kaslr.h>
119

120
/*
121 122 123
 * max_low_pfn_mapped: highest direct mapped pfn under 4GB
 * max_pfn_mapped:     highest direct mapped pfn over 4GB
 *
124
 * The direct mapping only covers E820_TYPE_RAM regions, so the ranges and gaps are
125
 * represented by pfn_mapped
126 127 128 129
 */
unsigned long max_low_pfn_mapped;
unsigned long max_pfn_mapped;

130
#ifdef CONFIG_DMI
131
RESERVE_BRK(dmi_alloc, 65536);
132
#endif
133

I
Ingo Molnar 已提交
134

135 136 137
static __initdata unsigned long _brk_start = (unsigned long)__brk_base;
unsigned long _brk_end = (unsigned long)__brk_base;

I
Ingo Molnar 已提交
138 139 140 141 142 143
#ifdef CONFIG_X86_64
/*
 * Non-inline entry point that forwards @mps_cpu unchanged to
 * __default_cpu_present_to_apicid() and returns its result.
 * Only built when CONFIG_X86_64 is set.
 */
int default_cpu_present_to_apicid(int mps_cpu)
{
	return __default_cpu_present_to_apicid(mps_cpu);
}

T
Thomas Gleixner 已提交
144
/*
 * Non-inline entry point that forwards @phys_apicid unchanged to
 * __default_check_phys_apicid_present() and returns its result.
 */
int default_check_phys_apicid_present(int phys_apicid)
I
Ingo Molnar 已提交
145
{
T
Thomas Gleixner 已提交
146
	return __default_check_phys_apicid_present(phys_apicid);
I
Ingo Molnar 已提交
147 148 149
}
#endif

150 151
struct boot_params boot_params;

152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176
/*
 * Machine setup..
 *
 * Resource descriptors for the kernel image's data, code and bss ranges.
 * All three start out with .start/.end of 0 and are flagged as busy system
 * RAM; setup_arch() fills in the bounds from the linker symbols and inserts
 * them into iomem_resource.
 */
static struct resource data_resource = {
	.name	= "Kernel data",
	.start	= 0,
	.end	= 0,
	.flags	= IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM
};

/* Kernel text range; see the note above data_resource. */
static struct resource code_resource = {
	.name	= "Kernel code",
	.start	= 0,
	.end	= 0,
	.flags	= IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM
};

/* Kernel bss range; see the note above data_resource. */
static struct resource bss_resource = {
	.name	= "Kernel bss",
	.start	= 0,
	.end	= 0,
	.flags	= IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM
};


177
#ifdef CONFIG_X86_32
178 179 180
/* cpu data as detected by the assembly code in head_32.S */
struct cpuinfo_x86 new_cpu_data;

L
Linus Torvalds 已提交
181
/* common cpu data for all cpus */
182
struct cpuinfo_x86 boot_cpu_data __read_mostly;
183
EXPORT_SYMBOL(boot_cpu_data);
L
Linus Torvalds 已提交
184

185 186
unsigned int def_to_bigsmp;

L
Linus Torvalds 已提交
187 188 189 190 191
/* for MCA, but anyone else can use it if they want */
unsigned int machine_id;
unsigned int machine_submodel_id;
unsigned int BIOS_revision;

192 193 194 195 196 197 198 199 200 201 202 203
struct apm_info apm_info;
EXPORT_SYMBOL(apm_info);

#if defined(CONFIG_X86_SPEEDSTEP_SMI) || \
	defined(CONFIG_X86_SPEEDSTEP_SMI_MODULE)
struct ist_info ist_info;
EXPORT_SYMBOL(ist_info);
#else
struct ist_info ist_info;
#endif

#else
204 205 206
struct cpuinfo_x86 boot_cpu_data __read_mostly = {
	.x86_phys_bits = MAX_PHYSMEM_BITS,
};
207 208 209 210 211
EXPORT_SYMBOL(boot_cpu_data);
#endif


#if !defined(CONFIG_X86_PAE) || defined(CONFIG_X86_64)
212
__visible unsigned long mmu_cr4_features __ro_after_init;
213
#else
214
__visible unsigned long mmu_cr4_features __ro_after_init = X86_CR4_PAE;
215 216
#endif

217 218
/* Boot loader ID and version as integers, for the benefit of proc_dointvec */
int bootloader_type, bootloader_version;
L
Linus Torvalds 已提交
219 220 221 222 223

/*
 * Setup options
 */
struct screen_info screen_info;
224
EXPORT_SYMBOL(screen_info);
L
Linus Torvalds 已提交
225
struct edid_info edid_info;
226
EXPORT_SYMBOL_GPL(edid_info);
L
Linus Torvalds 已提交
227 228 229

extern int root_mountflags;

230
unsigned long saved_video_mode;
L
Linus Torvalds 已提交
231

232
#define RAMDISK_IMAGE_START_MASK	0x07FF
L
Linus Torvalds 已提交
233
#define RAMDISK_PROMPT_FLAG		0x8000
234
#define RAMDISK_LOAD_FLAG		0x4000
L
Linus Torvalds 已提交
235

236
static char __initdata command_line[COMMAND_LINE_SIZE];
237 238 239
#ifdef CONFIG_CMDLINE_BOOL
static char __initdata builtin_cmdline[COMMAND_LINE_SIZE] = CONFIG_CMDLINE;
#endif
L
Linus Torvalds 已提交
240 241 242 243 244 245 246 247 248 249 250

#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
struct edd edd;
#ifdef CONFIG_EDD_MODULE
EXPORT_SYMBOL(edd);
#endif
/**
 * copy_edd() - Copy the BIOS EDD information
 *              from boot_params into a safe place.
 *
 */
251
static inline void __init copy_edd(void)
L
Linus Torvalds 已提交
252
{
253 254 255 256 257
     memcpy(edd.mbr_signature, boot_params.edd_mbr_sig_buffer,
	    sizeof(edd.mbr_signature));
     memcpy(edd.edd_info, boot_params.eddbuf, sizeof(edd.edd_info));
     edd.mbr_signature_nr = boot_params.edd_mbr_sig_buf_entries;
     edd.edd_info_nr = boot_params.eddbuf_entries;
L
Linus Torvalds 已提交
258 259
}
#else
260
/* No-op variant used when neither CONFIG_EDD nor CONFIG_EDD_MODULE is set. */
static inline void __init copy_edd(void)
L
Linus Torvalds 已提交
261 262 263 264
{
}
#endif

265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283
/*
 * extend_brk - carve a zero-filled chunk out of the early brk area
 * @size:  number of bytes to allocate
 * @align: alignment of the returned address; must be a non-zero power of two
 *
 * Rounds _brk_end up to @align, advances it by @size and returns a pointer
 * to the zeroed region in between.
 *
 * BUGs if the brk area has already been locked down (_brk_start == 0, which
 * is what reserve_brk() sets), if @align is not a non-zero power of two, or
 * if the request does not fit below __brk_limit.
 */
void * __init extend_brk(size_t size, size_t align)
{
	size_t mask = align - 1;
	void *ret;

	BUG_ON(_brk_start == 0);

	/*
	 * align == 0 must be rejected explicitly: mask wraps to all ones, so
	 * (align & mask) is 0 and the rounding below would set _brk_end to 0.
	 */
	BUG_ON(!align || (align & mask));

	_brk_end = (_brk_end + mask) & ~mask;

	/*
	 * Compare the request against the space that is left instead of
	 * computing _brk_end + size, which could wrap for a huge size.
	 */
	BUG_ON((char *)_brk_end > __brk_limit);
	BUG_ON(size > (size_t)(__brk_limit - (char *)_brk_end));

	ret = (void *)_brk_end;
	_brk_end += size;

	memset(ret, 0, size);

	return ret;
}

284
#ifdef CONFIG_X86_32
285
/* Empty variant compiled when CONFIG_X86_32 is set; it does nothing. */
static void __init cleanup_highmap(void)
286 287
{
}
288 289
#endif

290 291 292
/*
 * Hand whatever has been allocated from the brk area over to memblock as
 * reserved memory, then close the brk area for further allocations.
 */
static void __init reserve_brk(void)
{
	unsigned long used = 0;

	if (_brk_end > _brk_start)
		used = _brk_end - _brk_start;

	if (used)
		memblock_reserve(__pa_symbol(_brk_start), used);

	/*
	 * A zero _brk_start marks the brk area as locked down: extend_brk()
	 * BUGs on it, so no new allocations can be taken from here on.
	 */
	_brk_start = 0;
}

301 302
u64 relocated_ramdisk;

303 304
#ifdef CONFIG_BLK_DEV_INITRD

Y
Yinghai Lu 已提交
305 306 307 308
/*
 * Build the 64-bit ramdisk address from boot_params: hdr.ramdisk_image
 * OR-ed with ext_ramdisk_image shifted up by 32 bits.
 */
static u64 __init get_ramdisk_image(void)
{
	u64 low = boot_params.hdr.ramdisk_image;
	u64 high = boot_params.ext_ramdisk_image;

	return low | (high << 32);
}
/*
 * Build the 64-bit ramdisk size from boot_params: hdr.ramdisk_size
 * OR-ed with ext_ramdisk_size shifted up by 32 bits.
 */
static u64 __init get_ramdisk_size(void)
{
	u64 low = boot_params.hdr.ramdisk_size;
	u64 high = boot_params.ext_ramdisk_size;

	return low | (high << 32);
}

322
/*
 * Move the initrd into a freshly reserved area below max_pfn_mapped.
 *
 * Finds and reserves a page-aligned area large enough for the image, points
 * initrd_start/initrd_end at it (offset by PAGE_OFFSET), records the chosen
 * physical address in relocated_ramdisk and copies the image across with
 * copy_from_early_mem().  Panics if no area can be found.
 */
static void __init relocate_initrd(void)
{
	/* Only the end of the image is assumed not to be page aligned. */
	u64 src = get_ramdisk_image();
	u64 len = get_ramdisk_size();
	u64 span = PAGE_ALIGN(len);
	u64 dst;

	/* The new home has to lie inside directly mapped memory. */
	dst = memblock_find_in_range(0, PFN_PHYS(max_pfn_mapped),
				     span, PAGE_SIZE);
	relocated_ramdisk = dst;

	if (!dst)
		panic("Cannot find place for new RAMDISK of size %lld\n",
		      len);

	/*
	 * Carried over from the original note: this includes all the memory
	 * currently occupied by the initrd, and that fact is relied on to
	 * keep the data intact.
	 */
	memblock_reserve(dst, span);
	initrd_start = dst + PAGE_OFFSET;
	initrd_end   = initrd_start + len;
	printk(KERN_INFO "Allocated new RAMDISK: [mem %#010llx-%#010llx]\n",
	       dst, dst + len - 1);

	copy_from_early_mem((void *)initrd_start, src, len);

	printk(KERN_INFO "Move RAMDISK from [mem %#010llx-%#010llx] to [mem %#010llx-%#010llx]\n",
	       src, src + len - 1,
	       dst, dst + len - 1);
}
Y
Yinghai Lu 已提交
352

353 354 355
/*
 * Reserve the memory holding the boot loader supplied initrd in memblock.
 * Does nothing when type_of_loader, the image address or the image size
 * is zero.
 */
static void __init early_reserve_initrd(void)
{
	/* Only the end of the image is assumed not to be page aligned. */
	u64 start = get_ramdisk_image();
	u64 len = get_ramdisk_size();
	u64 end = PAGE_ALIGN(start + len);

	/* Any of these being zero means no initrd came from the boot loader. */
	if (boot_params.hdr.type_of_loader && start && len)
		memblock_reserve(start, end - start);
}
366 367
/*
 * Set up initrd_start/initrd_end for the boot loader supplied initrd.
 *
 * If the whole image already lies in mapped memory it is used in place;
 * otherwise it is moved with relocate_initrd() and the old range is freed.
 * Panics when the image is at least half the size of mapped memory.
 * Does nothing when type_of_loader, the image address or the image size
 * is zero.
 */
static void __init reserve_initrd(void)
{
	/* Only the end of the image is assumed not to be page aligned. */
	u64 start = get_ramdisk_image();
	u64 len = get_ramdisk_size();
	u64 end = PAGE_ALIGN(start + len);
	u64 half_mapped;

	/* No initrd provided by bootloader */
	if (!(boot_params.hdr.type_of_loader && start && len))
		return;

	/*
	 * With SME active the kernel treats this memory as encrypted whenever
	 * it touches it (relocation included), but the boot loader stored the
	 * image decrypted - so encrypt it before the first access.
	 */
	sme_early_encrypt(start, end - start);

	initrd_start = 0;

	half_mapped = memblock_mem_size(max_pfn_mapped) >> 1;
	if (len >= half_mapped)
		panic("initrd too large to handle, disabling initrd (%lld needed, %lld available)\n",
		      len, half_mapped);

	printk(KERN_INFO "RAMDISK: [mem %#010llx-%#010llx]\n", start, end - 1);

	if (!pfn_range_is_mapped(PFN_DOWN(start), PFN_DOWN(end))) {
		/* Not fully mapped: move it and release the old location. */
		relocate_initrd();
		memblock_free(start, end - start);
		return;
	}

	/* All are mapped, easy case */
	initrd_start = start + PAGE_OFFSET;
	initrd_end = initrd_start + len;
}
409

Y
Yinghai Lu 已提交
410
#else
411 412 413
/* No-op variant used when CONFIG_BLK_DEV_INITRD is not set. */
static void __init early_reserve_initrd(void)
{
}
414
/* No-op variant used when CONFIG_BLK_DEV_INITRD is not set. */
static void __init reserve_initrd(void)
Y
Yinghai Lu 已提交
415 416
{
}
417 418
#endif /* CONFIG_BLK_DEV_INITRD */

419
/*
 * Walk the chain of setup_data entries that starts at
 * boot_params.hdr.setup_data and hand each recognised entry type to its
 * handler.  Entries of any other type are skipped.
 */
static void __init parse_setup_data(void)
{
	u64 pa, pa_following;

	for (pa = boot_params.hdr.setup_data; pa; pa = pa_following) {
		struct setup_data *hdr;
		u32 total_len, kind;

		/*
		 * Map only the header, copy out what is needed and unmap it
		 * again before calling any handler.
		 */
		hdr = early_memremap(pa, sizeof(*hdr));
		total_len = hdr->len + sizeof(struct setup_data);
		kind = hdr->type;
		pa_following = hdr->next;
		early_memunmap(hdr, sizeof(*hdr));

		switch (kind) {
		case SETUP_E820_EXT:
			e820__memory_setup_extended(pa, total_len);
			break;
		case SETUP_DTB:
			add_dtb(pa);
			break;
		case SETUP_EFI:
			parse_efi_setup(pa, total_len);
			break;
		default:
			break;
		}
	}
}

451
/*
 * Reserve every setup_data entry (header plus payload) in memblock by
 * walking the chain that starts at boot_params.hdr.setup_data.
 */
static void __init memblock_x86_reserve_range_setup_data(void)
{
	u64 pa = boot_params.hdr.setup_data;

	while (pa) {
		struct setup_data *hdr = early_memremap(pa, sizeof(*hdr));
		u64 pa_following = hdr->next;

		memblock_reserve(pa, sizeof(*hdr) + hdr->len);
		early_memunmap(hdr, sizeof(*hdr));

		pa = pa_following;
	}
}

465 466 467 468
/*
 * --------- Crashkernel reservation ------------------------------
 */

469
#ifdef CONFIG_KEXEC_CORE
470

471 472 473
/* 16M alignment for crash kernel regions */
#define CRASH_ALIGN		(16 << 20)

474 475 476
/*
 * Keep the crash kernel below this limit.  On 32 bits earlier kernels
 * would limit the kernel to the low 512 MiB due to mapping restrictions.
477
 * On 64bit, old kexec-tools need the crash kernel to be under 896MiB.
478 479
 */
#ifdef CONFIG_X86_32
480 481
# define CRASH_ADDR_LOW_MAX	(512 << 20)
# define CRASH_ADDR_HIGH_MAX	(512 << 20)
482
#else
483 484
# define CRASH_ADDR_LOW_MAX	(896UL << 20)
# define CRASH_ADDR_HIGH_MAX	MAXMEM
485 486
#endif

487
/*
 * Reserve a crash kernel region below 4G.  reserve_crashkernel() calls this
 * when the main crash kernel region starts at or above 4G.  All of the work
 * is inside CONFIG_X86_64; without it the function just returns 0.
 *
 * Returns 0 on success or when the requested low size parsed as 0, -ENOMEM
 * when no suitable range is found, or the error from memblock_reserve().
 */
static int __init reserve_crashkernel_low(void)
{
#ifdef CONFIG_X86_64
	unsigned long long ignored_base, lo_start = 0, lo_bytes = 0;
	unsigned long lo_ram;
	int err;

	lo_ram = memblock_mem_size(1UL << (32 - PAGE_SHIFT));

	/* crashkernel=Y,low */
	err = parse_crashkernel_low(boot_command_line, lo_ram, &lo_bytes,
				    &ignored_base);

	/* Parsed fine but with a zero size - passed with crashkernel=0,low ? */
	if (!err && !lo_bytes)
		return 0;

	if (err) {
		/*
		 * Parsing failed, so pick a size here.  It is made of two
		 * parts from lib/swiotlb.c:
		 * - the swiotlb size: user-specified with swiotlb= or the
		 *   default;
		 * - 8M on top of that (the swiotlb overflow buffer is
		 *   hardcoded to 32k, rounded up for other buffers that may
		 *   need to stay low too).
		 * The result is never smaller than 256M, so that enough extra
		 * low memory is available for the DMA buffers of 32-bit
		 * devices.
		 */
		lo_bytes = max(swiotlb_size_or_default() + (8UL << 20),
			       256UL << 20);
	}

	lo_start = memblock_find_in_range(0, 1ULL << 32, lo_bytes, CRASH_ALIGN);
	if (!lo_start) {
		pr_err("Cannot reserve %ldMB crashkernel low memory, please try smaller size.\n",
		       (unsigned long)(lo_bytes >> 20));
		return -ENOMEM;
	}

	err = memblock_reserve(lo_start, lo_bytes);
	if (err) {
		pr_err("%s: Error reserving crashkernel low memblock.\n", __func__);
		return err;
	}

	pr_info("Reserving %ldMB of low memory at %ldMB for crashkernel (System low RAM: %ldMB)\n",
		(unsigned long)(lo_bytes >> 20),
		(unsigned long)(lo_start >> 20),
		(unsigned long)(lo_ram >> 20));

	crashk_low_res.start = lo_start;
	crashk_low_res.end   = lo_start + lo_bytes - 1;
	insert_resource(&iomem_resource, &crashk_low_res);
#endif
	return 0;
}
539

540
/*
 * Reserve memory for the crash kernel as requested on the command line.
 *
 * Tries "crashkernel=XM" first and falls back to "crashkernel=X,high".
 * With no base address given, a CRASH_ALIGN aligned range is searched for;
 * with an explicit base, exactly that range must be free.  When the region
 * ends up at or above 4G, an extra low region is reserved through
 * reserve_crashkernel_low(), and the main reservation is undone if that
 * fails.  On success the range is published as crashk_res.
 */
static void __init reserve_crashkernel(void)
{
	unsigned long long size, base, ram_total;
	bool want_high = false;
	int err;

	ram_total = memblock_phys_mem_size();

	/* crashkernel=XM */
	err = parse_crashkernel(boot_command_line, ram_total, &size, &base);
	if (err || !size) {
		/* crashkernel=X,high */
		err = parse_crashkernel_high(boot_command_line, ram_total,
					     &size, &base);
		if (err || !size)
			return;
		want_high = true;
	}

	if (!base) {
		/*
		 * A base of 0 means: find the address automatically.
		 *
		 * CRASH_ADDR_LOW_MAX is the upper bound for crash memory, as
		 * old kexec-tools loads bzImage below that, unless
		 * "crashkernel=size[KMG],high" is specified.
		 */
		base = memblock_find_in_range(CRASH_ALIGN,
					      want_high ? CRASH_ADDR_HIGH_MAX
							: CRASH_ADDR_LOW_MAX,
					      size, CRASH_ALIGN);
		if (!base) {
			pr_info("crashkernel reservation failed - No suitable area found.\n");
			return;
		}
	} else {
		/* Explicit base: the search must land exactly on it. */
		unsigned long long found;

		found = memblock_find_in_range(base, base + size,
					       size, 1 << 20);
		if (found != base) {
			pr_info("crashkernel reservation failed - memory is in use.\n");
			return;
		}
	}

	err = memblock_reserve(base, size);
	if (err) {
		pr_err("%s: Error reserving crashkernel memblock.\n", __func__);
		return;
	}

	/* A region at or above 4G also needs some low memory reserved. */
	if (base >= (1ULL << 32) && reserve_crashkernel_low()) {
		memblock_free(base, size);
		return;
	}

	pr_info("Reserving %ldMB of memory at %ldMB for crashkernel (System RAM: %ldMB)\n",
		(unsigned long)(size >> 20),
		(unsigned long)(base >> 20),
		(unsigned long)(ram_total >> 20));

	crashk_res.start = base;
	crashk_res.end   = base + size - 1;
	insert_resource(&iomem_resource, &crashk_res);
}
#else
607
/* No-op variant used when CONFIG_KEXEC_CORE is not set. */
static void __init reserve_crashkernel(void)
608 609 610 611
{
}
#endif

612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634
/*
 * I/O port ranges that reserve_standard_io_resources() requests from
 * ioport_resource.  Every entry is flagged IORESOURCE_BUSY | IORESOURCE_IO;
 * .start and .end are both inclusive port numbers as written here.
 */
static struct resource standard_io_resources[] = {
	{ .name = "dma1", .start = 0x00, .end = 0x1f,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "pic1", .start = 0x20, .end = 0x21,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "timer0", .start = 0x40, .end = 0x43,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "timer1", .start = 0x50, .end = 0x53,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	/* Two separate single-port "keyboard" entries: 0x60 and 0x64. */
	{ .name = "keyboard", .start = 0x60, .end = 0x60,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "keyboard", .start = 0x64, .end = 0x64,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "dma page reg", .start = 0x80, .end = 0x8f,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "pic2", .start = 0xa0, .end = 0xa1,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "dma2", .start = 0xc0, .end = 0xdf,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO },
	{ .name = "fpu", .start = 0xf0, .end = 0xff,
		.flags = IORESOURCE_BUSY | IORESOURCE_IO }
};

635
/*
 * Request every entry of standard_io_resources[] from ioport_resource.
 * The return value of request_resource() is not checked.
 */
void __init reserve_standard_io_resources(void)
{
	struct resource *res = standard_io_resources;
	struct resource *end = res + ARRAY_SIZE(standard_io_resources);

	/* request I/O space for devices used on all i[345]86 PCs */
	for (; res < end; res++)
		request_resource(&ioport_resource, res);
}

645 646 647 648 649 650 651
/*
 * Reserve the region reported by find_ibft_region() in memblock.
 * Nothing is reserved when the reported size is 0.
 */
static __init void reserve_ibft_region(void)
{
	unsigned long size = 0;
	unsigned long addr = find_ibft_region(&size);

	if (!size)
		return;

	memblock_reserve(addr, size);
}

655 656
/*
 * Decide whether the Sandy Bridge graphics memory workaround applies.
 *
 * Returns true when early PCI access is allowed and the device read at
 * (0, 2, 0) has vendor ID 0x8086 and one of the device IDs in snb_ids[].
 * Always returns false when CONFIG_PCI is not set.
 */
static bool __init snb_gfx_workaround_needed(void)
{
#ifdef CONFIG_PCI
	static const __initconst u16 snb_ids[] = {
		0x0102,
		0x0112,
		0x0122,
		0x0106,
		0x0116,
		0x0126,
		0x010a,
	};
	u16 vendor_id, device_id;
	int idx;

	/* Assume no if something weird is going on with PCI */
	if (!early_pci_allowed())
		return false;

	vendor_id = read_pci_config_16(0, 2, 0, PCI_VENDOR_ID);
	if (vendor_id != 0x8086)
		return false;

	device_id = read_pci_config_16(0, 2, 0, PCI_DEVICE_ID);
	for (idx = 0; idx < ARRAY_SIZE(snb_ids); idx++) {
		if (snb_ids[idx] == device_id)
			return true;
	}
#endif

	return false;
}

/*
 * Sandy Bridge graphics has trouble with certain ranges, so keep them out
 * of the allocator: when snb_gfx_workaround_needed() says so, reserve the
 * first 1 MB and each page listed in bad_pages[].
 */
static void __init trim_snb_memory(void)
{
	static const __initconst unsigned long bad_pages[] = {
		0x20050000,
		0x20110000,
		0x20130000,
		0x20138000,
		0x40004000,
	};
	const unsigned long *page;

	if (!snb_gfx_workaround_needed())
		return;

	printk(KERN_DEBUG "reserving inaccessible SNB gfx pages\n");

	/* Reserve everything below the 1 MB mark. */
	memblock_reserve(0, 1<<20);

	for (page = bad_pages; page < bad_pages + ARRAY_SIZE(bad_pages); page++) {
		/* memblock_reserve() returning non-zero is reported below. */
		if (!memblock_reserve(*page, PAGE_SIZE))
			continue;

		printk(KERN_WARNING "failed to reserve 0x%08lx\n", *page);
	}
}

/*
 * Collection point for platform-specific memory range workarounds, i.e.
 * memory that is known to be corrupt or that otherwise needs to be
 * reserved on specific platforms.  At present the only workaround called
 * from here is trim_snb_memory().
 *
 * If this gets used more widely it could use a real dispatch mechanism.
 */
static void __init trim_platform_memory_ranges(void)
{
	trim_snb_memory();
}

732 733 734 735 736 737
/*
 * Adjust the e820 table for low-memory areas owned by the BIOS, then run
 * e820__update_table() over the result.
 */
static void __init trim_bios_range(void)
{
	u64 bios_len = BIOS_END - BIOS_BEGIN;

	/*
	 * The first 4Kb of memory is a special case: it is a BIOS owned
	 * area, not kernel RAM, but generally not listed as such in the
	 * E820 table, so retype it here.
	 *
	 * NOTE(review): the previous comment also described a larger
	 * X86_RESERVE_LOW reservation (64KiB by default) against BIOSes
	 * that corrupt low memory.  Only PAGE_SIZE is handled in this
	 * function; reserve_low is applied by trim_low_memory_range().
	 */
	e820__range_update(0, PAGE_SIZE, E820_TYPE_RAM, E820_TYPE_RESERVED);

	/*
	 * Some BIOSes report the PC BIOS area (640->1Mb) as RAM even though
	 * it is not; take that range out.
	 */
	e820__range_remove(BIOS_BEGIN, bios_len, E820_TYPE_RAM, 1);

	e820__update_table(e820_table);
}

755 756 757 758 759 760 761
/*
 * Make sure the range from _text to _end is typed E820_TYPE_RAM.
 * Called before trim_bios_range() to spare an extra sanitize pass.
 */
static void __init e820_add_kernel_range(void)
{
	u64 start = __pa_symbol(_text);
	u64 end = __pa_symbol(_end);

	/*
	 * Complain if .text .data and .bss are not marked as E820_TYPE_RAM
	 * and attempt to fix it by adding the range.  We may have a confused
	 * BIOS, or the user may have used memmap=exactmap or memmap=xxM$yyM
	 * to exclude the kernel range.  If we really are running on top of
	 * non-RAM, we will crash later anyway.
	 */
	if (!e820__mapped_all(start, end, E820_TYPE_RAM)) {
		u64 size = end - start;

		pr_warn(".text .data .bss are not marked as E820_TYPE_RAM!\n");
		e820__range_remove(start, size, E820_TYPE_RAM, 0);
		e820__range_add(start, size, E820_TYPE_RAM);
	}
}

776 777
static unsigned reserve_low = CONFIG_X86_RESERVE_LOW << 10;

778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799
/*
 * Handler for the "reservelow" early parameter.
 *
 * Parses @p with memparse(), clamps the result to the range
 * [4096, 640*1024] and stores it in reserve_low.
 *
 * Returns 0 on success, -EINVAL when @p is NULL.
 */
static int __init parse_reservelow(char *p)
{
	unsigned long long bytes;

	if (p == NULL)
		return -EINVAL;

	bytes = memparse(p, &p);

	/* The two bounds cannot both apply, so an else-if chain is enough. */
	if (bytes < 4096)
		bytes = 4096;
	else if (bytes > 640*1024)
		bytes = 640*1024;

	reserve_low = bytes;

	return 0;
}

early_param("reservelow", parse_reservelow);

800 801 802 803 804
/*
 * Reserve the lowest reserve_low bytes of memory in memblock, with the size
 * rounded up to a multiple of PAGE_SIZE.  reserve_low starts out as
 * CONFIG_X86_RESERVE_LOW << 10 and can be changed with "reservelow=".
 */
static void __init trim_low_memory_range(void)
{
	memblock_reserve(0, ALIGN(reserve_low, PAGE_SIZE));
}
	
805 806 807 808 809 810
/*
 * Dump out kernel offset information on panic.
 */
static int
dump_kernel_offset(struct notifier_block *self, unsigned long v, void *p)
{
811 812
	if (kaslr_enabled()) {
		pr_emerg("Kernel Offset: 0x%lx from 0x%lx (relocation range: 0x%lx-0x%lx)\n",
J
Jiri Kosina 已提交
813
			 kaslr_offset(),
814 815 816 817 818 819
			 __START_KERNEL,
			 __START_KERNEL_map,
			 MODULES_VADDR-1);
	} else {
		pr_emerg("Kernel Offset: disabled\n");
	}
820 821 822 823

	return 0;
}

824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843
/*
 * Seed loops_per_jiffy from the calibrated TSC (or CPU) frequency.
 *
 * Does nothing when the boot CPU has no TSC or when both calibration
 * callbacks return 0.  Otherwise loops_per_jiffy is set to
 * frequency_in_kHz * 1000 / HZ, with the TSC frequency preferred over the
 * CPU frequency.
 */
static void __init simple_udelay_calibration(void)
{
	unsigned int tsc_khz, cpu_khz;
	u64 lpj;

	if (!boot_cpu_has(X86_FEATURE_TSC))
		return;

	cpu_khz = x86_platform.calibrate_cpu();
	tsc_khz = x86_platform.calibrate_tsc();

	/* Fall back to the CPU frequency when TSC calibration gave 0. */
	tsc_khz = tsc_khz ? : cpu_khz;
	if (!tsc_khz)
		return;

	/*
	 * Widen before multiplying: tsc_khz is an unsigned int, so
	 * tsc_khz * 1000 would wrap at 32 bits for anything above roughly
	 * 4.29 GHz.  A u64 is also the dividend type do_div() expects.
	 */
	lpj = (u64)tsc_khz * 1000;
	do_div(lpj, HZ);
	loops_per_jiffy = lpj;
}

L
Linus Torvalds 已提交
844 845 846 847 848 849 850
/*
 * Determine if we were loaded by an EFI loader.  If so, then we have also been
 * passed the efi memmap, systab, etc., so we should use these data structures
 * for initialization.  Note, the efi init code path is determined by the
 * global efi_enabled. This allows the same kernel image to be used on existing
 * systems (with a traditional BIOS) as well as on EFI systems.
 */
851 852 853 854 855 856
/*
 * setup_arch - architecture-specific boot-time initializations
 *
 * Note: On x86_64, fixmaps are ready for use even before this is called.
 */

L
Linus Torvalds 已提交
857 858
void __init setup_arch(char **cmdline_p)
{
859 860 861
	memblock_reserve(__pa_symbol(_text),
			 (unsigned long)__bss_stop - (unsigned long)_text);

862 863
	early_reserve_initrd();

864 865 866 867 868 869
	/*
	 * At this point everything still needed from the boot loader
	 * or BIOS or kernel text should be early reserved or marked not
	 * RAM in e820. All other memory is free game.
	 */

870
#ifdef CONFIG_X86_32
L
Linus Torvalds 已提交
871
	memcpy(&boot_cpu_data, &new_cpu_data, sizeof(new_cpu_data));
872 873 874 875 876 877 878 879 880 881

	/*
	 * copy kernel address range established so far and switch
	 * to the proper swapper page table
	 */
	clone_pgd_range(swapper_pg_dir     + KERNEL_PGD_BOUNDARY,
			initial_page_table + KERNEL_PGD_BOUNDARY,
			KERNEL_PGD_PTRS);

	load_cr3(swapper_pg_dir);
882 883 884 885 886 887 888 889 890
	/*
	 * Note: Quark X1000 CPUs advertise PGE incorrectly and require
	 * a cr3 based tlb flush, so the following __flush_tlb_all()
	 * will not flush anything because the cpu quirk which clears
	 * X86_FEATURE_PGE has not been invoked yet. Though due to the
	 * load_cr3() above the TLB has been flushed already. The
	 * quirk is invoked before subsequent calls to __flush_tlb_all()
	 * so proper operation is guaranteed.
	 */
891
	__flush_tlb_all();
892 893 894
#else
	printk(KERN_INFO "Command line: %s\n", boot_command_line);
#endif
L
Linus Torvalds 已提交
895

896 897 898 899
	/*
	 * If we have OLPC OFW, we might end up relocating the fixmap due to
	 * reserve_top(), so do this before touching the ioremap area.
	 */
900 901
	olpc_ofw_detect();

902
	early_trap_init();
903
	early_cpu_init();
904 905
	early_ioremap_init();

906 907
	setup_olpc_ofw_pgd();

908 909 910
	ROOT_DEV = old_decode_dev(boot_params.hdr.root_dev);
	screen_info = boot_params.screen_info;
	edid_info = boot_params.edid_info;
911
#ifdef CONFIG_X86_32
912 913
	apm_info.bios = boot_params.apm_bios_info;
	ist_info = boot_params.ist_info;
914 915
#endif
	saved_video_mode = boot_params.hdr.vid_mode;
916
	bootloader_type = boot_params.hdr.type_of_loader;
917 918 919 920 921 922
	if ((bootloader_type >> 4) == 0xe) {
		bootloader_type &= 0xf;
		bootloader_type |= (boot_params.hdr.ext_loader_type+0x10) << 4;
	}
	bootloader_version  = bootloader_type & 0xf;
	bootloader_version |= boot_params.hdr.ext_loader_ver << 4;
L
Linus Torvalds 已提交
923 924

#ifdef CONFIG_BLK_DEV_RAM
925 926 927
	rd_image_start = boot_params.hdr.ram_size & RAMDISK_IMAGE_START_MASK;
	rd_prompt = ((boot_params.hdr.ram_size & RAMDISK_PROMPT_FLAG) != 0);
	rd_doload = ((boot_params.hdr.ram_size & RAMDISK_LOAD_FLAG) != 0);
L
Linus Torvalds 已提交
928
#endif
929 930
#ifdef CONFIG_EFI
	if (!strncmp((char *)&boot_params.efi_info.efi_loader_signature,
931
		     EFI32_LOADER_SIGNATURE, 4)) {
932
		set_bit(EFI_BOOT, &efi.flags);
933
	} else if (!strncmp((char *)&boot_params.efi_info.efi_loader_signature,
934
		     EFI64_LOADER_SIGNATURE, 4)) {
935 936
		set_bit(EFI_BOOT, &efi.flags);
		set_bit(EFI_64BIT, &efi.flags);
937
	}
938 939 940

	if (efi_enabled(EFI_BOOT))
		efi_memblock_x86_reserve_range();
941 942
#endif

943
	x86_init.oem.arch_setup();
944

945
	iomem_resource.end = (1ULL << boot_cpu_data.x86_phys_bits) - 1;
946
	e820__memory_setup();
947 948
	parse_setup_data();

L
Linus Torvalds 已提交
949 950
	copy_edd();

951
	if (!boot_params.hdr.root_flags)
L
Linus Torvalds 已提交
952 953 954 955
		root_mountflags &= ~MS_RDONLY;
	init_mm.start_code = (unsigned long) _text;
	init_mm.end_code = (unsigned long) _etext;
	init_mm.end_data = (unsigned long) _edata;
956
	init_mm.brk = _brk_end;
957 958

	mpx_mm_init(&init_mm);
L
Linus Torvalds 已提交
959

960 961 962 963 964 965 966
	code_resource.start = __pa_symbol(_text);
	code_resource.end = __pa_symbol(_etext)-1;
	data_resource.start = __pa_symbol(_etext);
	data_resource.end = __pa_symbol(_edata)-1;
	bss_resource.start = __pa_symbol(__bss_start);
	bss_resource.end = __pa_symbol(__bss_stop)-1;

967 968 969 970 971 972 973 974 975 976 977 978 979
#ifdef CONFIG_CMDLINE_BOOL
#ifdef CONFIG_CMDLINE_OVERRIDE
	strlcpy(boot_command_line, builtin_cmdline, COMMAND_LINE_SIZE);
#else
	if (builtin_cmdline[0]) {
		/* append boot loader cmdline to builtin */
		strlcat(builtin_cmdline, " ", COMMAND_LINE_SIZE);
		strlcat(builtin_cmdline, boot_command_line, COMMAND_LINE_SIZE);
		strlcpy(boot_command_line, builtin_cmdline, COMMAND_LINE_SIZE);
	}
#endif
#endif

980 981 982 983
	strlcpy(command_line, boot_command_line, COMMAND_LINE_SIZE);
	*cmdline_p = command_line;

	/*
984 985 986 987 988
	 * x86_configure_nx() is called before parse_early_param() to detect
	 * whether hardware doesn't support NX (so that the early EHCI debug
	 * console setup can safely call set_fixmap()). It may then be called
	 * again from within noexec_setup() during parsing early parameters
	 * to honor the respective command line option.
989
	 */
990
	x86_configure_nx();
991 992 993

	parse_early_param();

994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017
#ifdef CONFIG_MEMORY_HOTPLUG
	/*
	 * Memory used by the kernel cannot be hot-removed because Linux
	 * cannot migrate the kernel pages. When memory hotplug is
	 * enabled, we should prevent memblock from allocating memory
	 * for the kernel.
	 *
	 * ACPI SRAT records all hotpluggable memory ranges. But before
	 * SRAT is parsed, we don't know about it.
	 *
	 * The kernel image is loaded into memory at very early time. We
	 * cannot prevent this anyway. So on NUMA system, we set any
	 * node the kernel resides in as un-hotpluggable.
	 *
	 * Since on modern servers, one node could have double-digit
	 * gigabytes memory, we can assume the memory around the kernel
	 * image is also un-hotpluggable. So before SRAT is parsed, just
	 * allocate memory near the kernel image to try the best to keep
	 * the kernel away from hotpluggable memory.
	 */
	if (movable_node_is_enabled())
		memblock_set_bottom_up(true);
#endif

1018
	x86_report_nx();
1019

1020
	/* after early param, so could get panic from serial */
1021
	memblock_x86_reserve_range_setup_data();
1022

1023
	if (acpi_mps_check()) {
I
Ingo Molnar 已提交
1024
#ifdef CONFIG_X86_LOCAL_APIC
1025
		disable_apic = 1;
I
Ingo Molnar 已提交
1026
#endif
1027
		setup_clear_cpu_cap(X86_FEATURE_APIC);
1028 1029
	}

1030 1031 1032 1033 1034
#ifdef CONFIG_PCI
	if (pci_early_dump_regs)
		early_dump_pci_devices();
#endif

1035
	e820__reserve_setup_data();
1036
	e820__finish_early_params();
1037

1038
	if (efi_enabled(EFI_BOOT))
B
Brian Maly 已提交
1039 1040
		efi_init();

1041
	dmi_scan_machine();
1042
	dmi_memdev_walk();
1043
	dmi_set_dump_stack_arch_desc();
1044

1045 1046 1047 1048
	/*
	 * VMware detection requires dmi to be available, so this
	 * needs to be done after dmi_scan_machine, for the BP.
	 */
1049
	init_hypervisor_platform();
1050

1051 1052
	simple_udelay_calibration();

1053
	x86_init.resources.probe_roms();
1054

1055 1056 1057 1058 1059
	/* after parse_early_param, so could debug it */
	insert_resource(&iomem_resource, &code_resource);
	insert_resource(&iomem_resource, &data_resource);
	insert_resource(&iomem_resource, &bss_resource);

1060
	e820_add_kernel_range();
1061
	trim_bios_range();
1062
#ifdef CONFIG_X86_32
Y
Yinghai Lu 已提交
1063
	if (ppro_with_ram_bug()) {
1064 1065
		e820__range_update(0x70000000ULL, 0x40000ULL, E820_TYPE_RAM,
				  E820_TYPE_RESERVED);
1066
		e820__update_table(e820_table);
Y
Yinghai Lu 已提交
1067
		printk(KERN_INFO "fixed physical RAM map:\n");
1068
		e820__print_table("bad_ppro");
Y
Yinghai Lu 已提交
1069
	}
1070 1071 1072
#else
	early_gart_iommu_check();
#endif
Y
Yinghai Lu 已提交
1073

1074 1075 1076 1077
	/*
	 * partially used pages are not usable - thus
	 * we are rounding upwards:
	 */
1078
	max_pfn = e820__end_of_ram_pfn();
1079

1080 1081
	/* update e820 for memory not covered by WB MTRRs */
	mtrr_bp_init();
1082
	if (mtrr_trim_uncached_memory(max_pfn))
1083
		max_pfn = e820__end_of_ram_pfn();
1084

I
Igor Mammedov 已提交
1085 1086
	max_possible_pfn = max_pfn;

1087 1088 1089 1090 1091 1092 1093
	/*
	 * This call is required when the CPU does not support PAT. If
	 * mtrr_bp_init() invoked it already via pat_init() the call has no
	 * effect.
	 */
	init_cache_modes();

1094 1095 1096 1097 1098 1099
	/*
	 * Define random base addresses for memory sections after max_pfn is
	 * defined and before each memory section base is used.
	 */
	kernel_randomize_memory();

1100
#ifdef CONFIG_X86_32
1101
	/* max_low_pfn gets updated here */
1102
	find_low_pfn_range();
1103
#else
Y
Yinghai Lu 已提交
1104
	check_x2apic();
1105 1106 1107

	/* How many end-of-memory variables you have, grandma! */
	/* need this before calling reserve_initrd */
1108
	if (max_pfn > (1UL<<(32 - PAGE_SHIFT)))
1109
		max_low_pfn = e820__end_of_low_ram_pfn();
1110 1111 1112
	else
		max_low_pfn = max_pfn;

1113
	high_memory = (void *)__va(max_pfn * PAGE_SIZE - 1) + 1;
1114 1115
#endif

1116 1117 1118 1119 1120
	/*
	 * Find and reserve possible boot-time SMP configuration:
	 */
	find_smp_config();

1121 1122
	reserve_ibft_region();

Y
Yinghai Lu 已提交
1123 1124
	early_alloc_pgt_buf();

1125
	/*
1126
	 * Need to conclude brk, before e820__memblock_setup()
1127 1128 1129 1130 1131
	 *  it could use memblock_find_in_range, could overlap with
	 *  brk area.
	 */
	reserve_brk();

1132 1133
	cleanup_highmap();

1134
	memblock_set_current_limit(ISA_END_ADDRESS);
1135
	e820__memblock_setup();
1136

1137 1138 1139
	if (!early_xdbc_setup_hardware())
		early_xdbc_register_console();

1140 1141 1142
	reserve_bios_regions();

	if (efi_enabled(EFI_MEMMAP)) {
T
Taku Izumi 已提交
1143
		efi_fake_memmap();
1144
		efi_find_mirror();
1145
		efi_esrt_init();
1146

1147 1148 1149 1150
		/*
		 * The EFI specification says that boot service code won't be
		 * called after ExitBootServices(). This is, in fact, a lie.
		 */
1151
		efi_reserve_boot_services();
1152
	}
1153

1154
	/* preallocate 4k for mptable mpc */
1155
	e820__memblock_alloc_reserved_mpc_new();
1156 1157 1158 1159 1160

#ifdef CONFIG_X86_CHECK_BIOS_CORRUPTION
	setup_bios_corruption_check();
#endif

1161
#ifdef CONFIG_X86_32
1162 1163
	printk(KERN_DEBUG "initial memory mapped: [mem 0x00000000-%#010lx]\n",
			(max_pfn_mapped<<PAGE_SHIFT) - 1);
1164
#endif
1165

1166
	reserve_real_mode();
1167

1168
	trim_platform_memory_ranges();
1169
	trim_low_memory_range();
1170

1171
	init_mem_mapping();
1172

1173
	early_trap_pf_init();
1174

1175 1176 1177 1178 1179 1180
	/*
	 * Update mmu_cr4_features (and, indirectly, trampoline_cr4_features)
	 * with the current CR4 value.  This may not be necessary, but
	 * auditing all the early-boot CR4 manipulation would be needed to
	 * rule it out.
	 */
1181
	mmu_cr4_features = __read_cr4();
1182

1183
	memblock_set_current_limit(get_max_mapped());
1184

1185 1186 1187 1188 1189 1190 1191 1192
	/*
	 * NOTE: On x86-32, only from this point on, fixmaps are ready for use.
	 */

#ifdef CONFIG_PROVIDE_OHCI1394_DMA_INIT
	if (init_ohci1394_dma_early)
		init_ohci1394_dma_on_all_controllers();
#endif
1193 1194
	/* Allocate bigger log buffer */
	setup_log_buf(1);
1195

1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209
	if (efi_enabled(EFI_BOOT)) {
		switch (boot_params.secure_boot) {
		case efi_secureboot_mode_disabled:
			pr_info("Secure boot disabled\n");
			break;
		case efi_secureboot_mode_enabled:
			pr_info("Secure boot enabled\n");
			break;
		default:
			pr_info("Secure boot could not be determined\n");
			break;
		}
	}

1210 1211
	reserve_initrd();

1212
	acpi_table_upgrade();
1213

1214 1215
	vsmp_init();

1216 1217 1218 1219 1220
	io_delay_init();

	/*
	 * Parse the ACPI tables for possible boot-time SMP configuration.
	 */
1221 1222 1223 1224
	acpi_boot_table_init();

	early_acpi_boot_init();

1225
	initmem_init();
1226
	dma_contiguous_reserve(max_pfn_mapped << PAGE_SHIFT);
1227 1228 1229 1230 1231 1232 1233

	/*
	 * Reserve memory for crash kernel after SRAT is parsed so that it
	 * won't consume hotpluggable memory.
	 */
	reserve_crashkernel();

1234
	memblock_find_dma_reserve();
1235

1236
#ifdef CONFIG_KVM_GUEST
1237 1238 1239
	kvmclock_init();
#endif

1240
	x86_init.paging.pagetable_init();
1241

A
Andrey Ryabinin 已提交
1242 1243
	kasan_init();

1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258
#ifdef CONFIG_X86_32
	/* sync back kernel address range */
	clone_pgd_range(initial_page_table + KERNEL_PGD_BOUNDARY,
			swapper_pg_dir     + KERNEL_PGD_BOUNDARY,
			KERNEL_PGD_PTRS);

	/*
	 * sync back low identity map too.  It is used for example
	 * in the 32-bit EFI stub.
	 */
	clone_pgd_range(initial_page_table,
			swapper_pg_dir     + KERNEL_PGD_BOUNDARY,
			min(KERNEL_PGD_PTRS, KERNEL_PGD_BOUNDARY));
#endif

1259 1260
	tboot_probe();

1261 1262
	map_vsyscall();

1263
	generic_apic_probe();
L
Linus Torvalds 已提交
1264

1265
	early_quirks();
1266

1267 1268 1269
	/*
	 * Read APIC and some other early information from ACPI tables.
	 */
L
Linus Torvalds 已提交
1270
	acpi_boot_init();
F
Feng Tang 已提交
1271
	sfi_init();
1272
	x86_dtb_init();
1273

1274 1275 1276
	/*
	 * get boot-time SMP configuration:
	 */
1277
	get_smp_config();
1278

1279 1280 1281 1282 1283 1284
	/*
	 * Systems w/o ACPI and mptables might not have mapped the local
	 * APIC yet, but prefill_possible_map() might need to access it.
	 */
	init_apic_mappings();

1285
	prefill_possible_map();
Y
Yinghai Lu 已提交
1286

1287 1288
	init_cpu_to_node();

1289
	io_apic_init_mappings();
1290

1291
	kvm_guest_init();
L
Linus Torvalds 已提交
1292

1293
	e820__reserve_resources();
1294
	e820__register_nosave_regions(max_low_pfn);
L
Linus Torvalds 已提交
1295

1296
	x86_init.resources.reserve_resources();
1297

1298
	e820__setup_pci_gap();
1299

L
Linus Torvalds 已提交
1300 1301
#ifdef CONFIG_VT
#if defined(CONFIG_VGA_CONSOLE)
1302
	if (!efi_enabled(EFI_BOOT) || (efi_mem_type(0xa0000) != EFI_CONVENTIONAL_MEMORY))
L
Linus Torvalds 已提交
1303 1304 1305 1306 1307
		conswitchp = &vga_con;
#elif defined(CONFIG_DUMMY_CONSOLE)
	conswitchp = &dummy_con;
#endif
#endif
1308
	x86_init.oem.banner();
1309

1310 1311
	x86_init.timers.wallclock_init();

1312
	mcheck_init();
1313

1314
	arch_init_ideal_nops();
1315 1316

	register_refined_jiffies(CLOCK_TICK_RATE);
1317 1318

#ifdef CONFIG_EFI
B
Borislav Petkov 已提交
1319 1320
	if (efi_enabled(EFI_BOOT))
		efi_apply_memmap_quirks();
1321
#endif
L
Linus Torvalds 已提交
1322
}
1323

1324 1325
#ifdef CONFIG_X86_32

1326 1327 1328 1329 1330
/*
 * Resource descriptor for the "Video RAM area" window covering
 * 0xa0000-0xbffff, flagged as busy memory. It is claimed from
 * iomem_resource by i386_reserve_resources().
 */
static struct resource video_ram_resource = {
	.name	= "Video RAM area",
	.start	= 0xa0000,
	.end	= 0xbffff,
	.flags	= IORESOURCE_BUSY | IORESOURCE_MEM
};

1333
/*
 * Claim video_ram_resource from iomem_resource, then reserve the
 * standard I/O resources.
 *
 * The result of request_resource() is not checked here.
 */
void __init i386_reserve_resources(void)
{
	request_resource(&iomem_resource, &video_ram_resource);
	reserve_standard_io_resources();
}

#endif /* CONFIG_X86_32 */
1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351

/*
 * Notifier block whose callback is dump_kernel_offset(); it is added to
 * the panic notifier chain by register_kernel_offset_dumper().
 */
static struct notifier_block kernel_offset_notifier = {
	.notifier_call	= dump_kernel_offset,
};

/*
 * Initcall: add kernel_offset_notifier to panic_notifier_list.
 *
 * Always returns 0; the result of the registration call is not inspected.
 */
static int __init register_kernel_offset_dumper(void)
{
	struct notifier_block *nb = &kernel_offset_notifier;

	atomic_notifier_chain_register(&panic_notifier_list, nb);

	return 0;
}
__initcall(register_kernel_offset_dumper);
1352 1353 1354 1355 1356 1357 1358 1359

/*
 * Emit the "ProtectionKey:" line for @vma into seq_file @m.
 *
 * Nothing is printed unless the boot CPU reports X86_FEATURE_OSPKE.
 */
void arch_show_smap(struct seq_file *m, struct vm_area_struct *vma)
{
	if (boot_cpu_has(X86_FEATURE_OSPKE))
		seq_printf(m, "ProtectionKey:  %8u\n", vma_pkey(vma));
}