head_32.S 18.3 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10
/*
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *
 *  Enhanced CPU detection and feature setting code by Mike Jagdis
 *  and Martin Mares, November 1997.
 */

.text
#include <linux/threads.h>
11
#include <linux/init.h>
L
Linus Torvalds 已提交
12 13
#include <linux/linkage.h>
#include <asm/segment.h>
14 15
#include <asm/page_types.h>
#include <asm/pgtable_types.h>
L
Linus Torvalds 已提交
16 17
#include <asm/cache.h>
#include <asm/thread_info.h>
18
#include <asm/asm-offsets.h>
L
Linus Torvalds 已提交
19
#include <asm/setup.h>
20
#include <asm/processor-flags.h>
21
#include <asm/msr-index.h>
22
#include <asm/cpufeatures.h>
23
#include <asm/percpu.h>
24
#include <asm/nops.h>
25
#include <asm/bootparam.h>
26
#include <asm/export.h>
27 28 29

/* Physical address */
#define pa(X) ((X) - __PAGE_OFFSET)
L
Linus Torvalds 已提交
30 31 32 33 34 35 36 37 38 39 40 41 42 43 44

/*
 * References to members of the new_cpu_data structure.
 */

#define X86		new_cpu_data+CPUINFO_x86
#define X86_VENDOR	new_cpu_data+CPUINFO_x86_vendor
#define X86_MODEL	new_cpu_data+CPUINFO_x86_model
#define X86_MASK	new_cpu_data+CPUINFO_x86_mask
#define X86_HARD_MATH	new_cpu_data+CPUINFO_hard_math
#define X86_CPUID	new_cpu_data+CPUINFO_cpuid_level
#define X86_CAPABILITY	new_cpu_data+CPUINFO_x86_capability
#define X86_VENDOR_ID	new_cpu_data+CPUINFO_x86_vendor_id

/*
45 46
 * This is how much memory in addition to the memory covered up to
 * and including _end we need mapped initially.
47
 * We need:
48 49
 *     (KERNEL_IMAGE_SIZE/4096) / 1024 pages (worst case, non PAE)
 *     (KERNEL_IMAGE_SIZE/4096) / 512 + 4 pages (worst case for PAE)
L
Linus Torvalds 已提交
50 51 52 53 54
 *
 * Modulo rounding, each megabyte assigned here requires a kilobyte of
 * memory, which is currently unreclaimed.
 *
 * This should be a multiple of a page.
55 56 57
 *
 * KERNEL_IMAGE_SIZE should be greater than pa(_end)
 * and smaller than max_low_pfn, otherwise some page table entries are wasted
L
Linus Torvalds 已提交
58 59
 */

60
#if PTRS_PER_PMD > 1
61
#define PAGE_TABLE_SIZE(pages) (((pages) / PTRS_PER_PMD) + PTRS_PER_PGD)
62
#else
63
#define PAGE_TABLE_SIZE(pages) ((pages) / PTRS_PER_PGD)
64 65
#endif

66 67 68 69 70 71 72 73 74 75
/*
 * Number of possible pages in the lowmem region.
 *
 * We shift 2 by 31 instead of 1 by 32 to the left in order to avoid a
 * gas warning about overflowing shift count when gas has been compiled
 * with only a host target support using a 32-bit type for internal
 * representation.
 */
LOWMEM_PAGES = (((2<<31) - __PAGE_OFFSET) >> PAGE_SHIFT)

76
/* Enough space to fit pagetables for the low memory linear map */
77
MAPPING_BEYOND_END = PAGE_TABLE_SIZE(LOWMEM_PAGES) << PAGE_SHIFT
78 79 80

/*
 * Worst-case size of the kernel mapping we need to make:
81 82
 * a relocatable kernel can live anywhere in lowmem, so we need to be able
 * to map all of lowmem.
83
 */
84
KERNEL_PAGES = LOWMEM_PAGES
85

86
INIT_MAP_SIZE = PAGE_TABLE_SIZE(KERNEL_PAGES) * PAGE_SIZE
87
RESERVE_BRK(pagetables, INIT_MAP_SIZE)
88

L
Linus Torvalds 已提交
89 90 91 92 93 94 95
/*
 * 32-bit kernel entrypoint; only used by the boot CPU.  On entry,
 * %esi points to the real-mode code as a 32-bit pointer.
 * CS and DS must be 4 GB flat segments, but we don't depend on
 * any particular GDT layout, because we load our own as soon as we
 * can.
 */
96
__HEAD
L
Linus Torvalds 已提交
97
ENTRY(startup_32)
98
	movl pa(initial_stack),%ecx
99
	
R
Rusty Russell 已提交
100 101
	/* test KEEP_SEGMENTS flag to see if the bootloader is asking
		us to not reload segments */
102
	testb $KEEP_SEGMENTS, BP_loadflags(%esi)
R
Rusty Russell 已提交
103
	jnz 2f
L
Linus Torvalds 已提交
104 105 106 107

/*
 * Set segments to known values.
 */
108
	lgdt pa(boot_gdt_descr)
L
Linus Torvalds 已提交
109 110 111 112 113
	movl $(__BOOT_DS),%eax
	movl %eax,%ds
	movl %eax,%es
	movl %eax,%fs
	movl %eax,%gs
114
	movl %eax,%ss
R
Rusty Russell 已提交
115
2:
116
	leal -__PAGE_OFFSET(%ecx),%esp
L
Linus Torvalds 已提交
117 118 119 120

/*
 * Clear BSS first so that there are no surprises...
 */
R
Rusty Russell 已提交
121
	cld
L
Linus Torvalds 已提交
122
	xorl %eax,%eax
123 124
	movl $pa(__bss_start),%edi
	movl $pa(__bss_stop),%ecx
L
Linus Torvalds 已提交
125 126 127
	subl %edi,%ecx
	shrl $2,%ecx
	rep ; stosl
128 129 130 131 132 133 134 135
/*
 * Copy bootup parameters out of the way.
 * Note: %esi still has the pointer to the real-mode data.
 * With the kexec as boot loader, parameter segment might be loaded beyond
 * kernel image and might not even be addressable by early boot page tables.
 * (kexec on panic case). Hence copy out the parameters before initializing
 * page tables.
 */
136
	movl $pa(boot_params),%edi
137 138 139 140
	movl $(PARAM_SIZE/4),%ecx
	cld
	rep
	movsl
141
	movl pa(boot_params) + NEW_CL_POINTER,%esi
142
	andl %esi,%esi
143
	jz 1f			# No command line
144
	movl $pa(boot_command_line),%edi
145 146 147 148
	movl $(COMMAND_LINE_SIZE/4),%ecx
	rep
	movsl
1:
L
Linus Torvalds 已提交
149

150
#ifdef CONFIG_OLPC
151 152 153 154 155
	/* save OFW's pgdir table for later use when calling into OFW */
	movl %cr3, %eax
	movl %eax, pa(olpc_ofw_pgd)
#endif

156
#ifdef CONFIG_MICROCODE
157 158 159 160
	/* Early load ucode on BSP. */
	call load_ucode_bsp
#endif

L
Linus Torvalds 已提交
161 162
/*
 * Initialize page tables.  This creates a PDE and a set of page
163
 * tables, which are located immediately beyond __brk_base.  The variable
164
 * _brk_end is set up to point to the first "safe" location.
L
Linus Torvalds 已提交
165
 * Mappings are created both at virtual address 0 (identity mapping)
166
 * and PAGE_OFFSET for up to _end.
L
Linus Torvalds 已提交
167
 */
168 169 170
#ifdef CONFIG_X86_PAE

	/*
171 172 173 174
	 * In PAE mode initial_page_table is statically defined to contain
	 * enough entries to cover the VMSPLIT option (that is the top 1, 2 or 3
	 * entries). The identity mapping is handled by pointing two PGD entries
	 * to the first kernel PMD.
175
	 *
176
	 * Note the upper half of each PMD or PTE are always zero at this stage.
177 178
	 */

J
Joe Korty 已提交
179
#define KPMDS (((-__PAGE_OFFSET) >> 30) & 3) /* Number of kernel PMDs */
180 181 182

	xorl %ebx,%ebx				/* %ebx is kept at zero */

183
	movl $pa(__brk_base), %edi
184
	movl $pa(initial_pg_pmd), %edx
185
	movl $PTE_IDENT_ATTR, %eax
186
10:
187
	leal PDE_IDENT_ATTR(%edi),%ecx		/* Create PMD entry */
188 189 190 191 192 193 194 195 196 197 198 199 200
	movl %ecx,(%edx)			/* Store PMD entry */
						/* Upper half already zero */
	addl $8,%edx				/* Advance to the next 8-byte PMD slot */
	movl $512,%ecx				/* Loop count: 512 entries of 8 bytes each */
11:
	/*
	 * Each entry is written as two 32-bit stores: the low half comes
	 * from the running value in %eax, the high half from %ebx (kept at
	 * zero).  The xchgl pair swaps the zero into %eax for the second
	 * stosl and then restores the running value.
	 */
	stosl					/* Low 32 bits of the entry */
	xchgl %eax,%ebx				/* %eax = 0, running value parked in %ebx */
	stosl					/* High 32 bits of the entry (zero) */
	xchgl %eax,%ebx				/* Restore running value, %ebx = 0 again */
	addl $0x1000,%eax			/* Step to the next 4 KiB page frame */
	loop 11b

	/*
201
	 * End condition: we must map up to the end + MAPPING_BEYOND_END.
202
	 */
203
	movl $pa(_end) + MAPPING_BEYOND_END + PTE_IDENT_ATTR, %ebp
204 205 206
	cmpl %ebp,%eax
	jb 10b
1:
207 208
	addl $__PAGE_OFFSET, %edi
	movl %edi, pa(_brk_end)
209 210
	shrl $12, %eax
	movl %eax, pa(max_pfn_mapped)
211 212

	/* Do early initialization of the fixmap area */
213 214
	movl $pa(initial_pg_fixmap)+PDE_IDENT_ATTR,%eax
	movl %eax,pa(initial_pg_pmd+0x1000*KPMDS-8)
215 216 217 218
#else	/* Not PAE */

page_pde_offset = (__PAGE_OFFSET >> 20);

219
	movl $pa(__brk_base), %edi
220
	movl $pa(initial_page_table), %edx
221
	movl $PTE_IDENT_ATTR, %eax
L
Linus Torvalds 已提交
222
10:
223
	leal PDE_IDENT_ATTR(%edi),%ecx		/* Create PDE entry */
L
Linus Torvalds 已提交
224 225 226 227 228 229 230 231
	/*
	 * The same page-table address is installed twice: once in the slot
	 * at %edx and once page_pde_offset bytes further on, so the table is
	 * reachable through both the identity and the kernel mapping.
	 */
	movl %ecx,(%edx)			/* Store identity PDE entry */
	movl %ecx,page_pde_offset(%edx)		/* Store kernel PDE entry */
	addl $4,%edx				/* Advance to the next 4-byte PDE slot */
	movl $1024, %ecx			/* Loop count: 1024 entries of 4 bytes each */
11:
	stosl					/* Write one entry from %eax at (%edi), %edi += 4 */
	addl $0x1000,%eax			/* Step to the next 4 KiB page frame */
	loop 11b
232
	/*
233
	 * End condition: we must map up to the end + MAPPING_BEYOND_END.
234
	 */
235
	movl $pa(_end) + MAPPING_BEYOND_END + PTE_IDENT_ATTR, %ebp
L
Linus Torvalds 已提交
236 237
	cmpl %ebp,%eax
	jb 10b
238 239
	addl $__PAGE_OFFSET, %edi
	movl %edi, pa(_brk_end)
240 241
	shrl $12, %eax
	movl %eax, pa(max_pfn_mapped)
242

243
	/* Do early initialization of the fixmap area */
244 245
	movl $pa(initial_pg_fixmap)+PDE_IDENT_ATTR,%eax
	movl %eax,pa(initial_page_table+0xffc)
246
#endif
247 248 249 250

#ifdef CONFIG_PARAVIRT
	/* This can only trip for a broken bootloader... */
	cmpw $0x207, pa(boot_params + BP_version)
251
	jb .Ldefault_entry
252 253 254 255 256

	/* Paravirt-compatible boot parameters.  Look to see what architecture
		we're booting under. */
	movl pa(boot_params + BP_hardware_subarch), %eax
	cmpl $num_subarch_entries, %eax
257
	jae .Lbad_subarch
258 259 260 261 262

	movl pa(subarch_entries)(,%eax,4), %eax
	subl $__PAGE_OFFSET, %eax
	jmp *%eax

263
.Lbad_subarch:
264 265 266 267 268 269 270 271 272
WEAK(lguest_entry)
WEAK(xen_entry)
	/* Unknown implementation; there's really
	   nothing we can do at this point. */
	ud2a

	__INITDATA

subarch_entries:
273
	.long .Ldefault_entry		/* normal x86/PC */
274 275
	.long lguest_entry		/* lguest hypervisor */
	.long xen_entry			/* Xen hypervisor */
276
	.long .Ldefault_entry		/* Moorestown MID */
277 278 279
num_subarch_entries = (. - subarch_entries) / 4
.previous
#else
280
	jmp .Ldefault_entry
281 282
#endif /* CONFIG_PARAVIRT */

283 284 285 286 287 288 289
#ifdef CONFIG_HOTPLUG_CPU
/*
 * Boot CPU0 entry point. It's called from play_dead(). Everything has been set
 * up already except stack. We just set up stack here. Then call
 * start_secondary().
 */
ENTRY(start_cpu0)
290
	movl initial_stack, %ecx
291 292 293 294 295
	movl %ecx, %esp
	jmp  *(initial_code)
ENDPROC(start_cpu0)
#endif

L
Linus Torvalds 已提交
296 297 298
/*
 * Non-boot CPU entry point; entered from trampoline.S
 * We can't lgdt here, because lgdt itself uses a data segment, but
299
 * we know the trampoline has already loaded the boot_gdt for us.
300 301 302
 *
 * If cpu hotplug is not supported then this code can go in init section
 * which will be freed later
L
Linus Torvalds 已提交
303 304 305 306 307 308 309 310
 */
ENTRY(startup_32_smp)
	cld
	movl $(__BOOT_DS),%eax
	movl %eax,%ds
	movl %eax,%es
	movl %eax,%fs
	movl %eax,%gs
311
	movl pa(initial_stack),%ecx
312 313
	movl %eax,%ss
	leal -__PAGE_OFFSET(%ecx),%esp
314

315
#ifdef CONFIG_MICROCODE
316 317 318 319
	/* Early load ucode on AP. */
	call load_ucode_ap
#endif

320
.Ldefault_entry:
321 322 323 324 325 326
/* CR0 value used by this entry path; PG is included and masked off where needed. */
#define CR0_STATE	(X86_CR0_PE | X86_CR0_MP | X86_CR0_ET | \
			 X86_CR0_NE | X86_CR0_WP | X86_CR0_AM | \
			 X86_CR0_PG)
	/*
	 * Load CR0 without the PG bit for now: the full CR0_STATE (with PG)
	 * is written later, after %cr3 has been pointed at initial_page_table.
	 */
	movl $(CR0_STATE & ~X86_CR0_PG),%eax
	movl %eax,%cr0

L
Linus Torvalds 已提交
327
/*
328 329 330 331 332 333 334 335 336 337 338
 * We want to start out with EFLAGS unambiguously cleared. Some BIOSes leave
 * bits like NT set. This would confuse the debugger if this code is traced. So
 * initialize them properly now before switching to protected mode. That means
 * DF in particular (even though we have cleared it earlier after copying the
 * command line) because GCC expects it.
 */
	pushl $0
	popfl

/*
 * New page tables may be in 4Mbyte page mode and may be using the global pages.
L
Linus Torvalds 已提交
339
 *
340 341
 * NOTE! If we are on a 486 we may have no cr4 at all! Specifically, cr4 exists
 * if and only if CPUID exists and has flags other than the FPU flag set.
L
Linus Torvalds 已提交
342
 */
343
	movl $-1,pa(X86_CPUID)		# preset CPUID level
344 345
	movl $X86_EFLAGS_ID,%ecx
	pushl %ecx
346
	popfl				# set EFLAGS=ID
347
	pushfl
348 349
	popl %eax			# get EFLAGS
	testl $X86_EFLAGS_ID,%eax	# did EFLAGS.ID remain set?
350
	jz .Lenable_paging		# hw disallowed setting of ID bit
351 352 353 354 355
					# which means no CPUID and no CR4

	xorl %eax,%eax
	cpuid
	movl %eax,pa(X86_CPUID)		# save largest std CPUID function
356

357 358
	movl $1,%eax
	cpuid
359
	andl $~1,%edx			# Ignore CPUID.FPU
360
	jz .Lenable_paging		# No flags or only CPUID.FPU = no CR4
361

362
	movl pa(mmu_cr4_features),%eax
L
Linus Torvalds 已提交
363 364
	movl %eax,%cr4

365
	testb $X86_CR4_PAE, %al		# check if PAE is enabled
366
	jz .Lenable_paging
L
Linus Torvalds 已提交
367 368 369 370

	/* Check if extended functions are implemented */
	movl $0x80000000, %eax
	cpuid
371 372 373
	/* Value must be in the range 0x80000001 to 0x8000ffff */
	subl $0x80000001, %eax
	cmpl $(0x8000ffff-0x80000001), %eax
374
	ja .Lenable_paging
375 376 377 378

	/* Clear bogus XD_DISABLE bits */
	call verify_cpu

L
Linus Torvalds 已提交
379 380 381
	mov $0x80000001, %eax
	cpuid
	/* Execute Disable bit supported? */
382
	btl $(X86_FEATURE_NX & 31), %edx
383
	jnc .Lenable_paging
L
Linus Torvalds 已提交
384 385

	/* Setup EFER (Extended Feature Enable Register) */
386
	movl $MSR_EFER, %ecx
L
Linus Torvalds 已提交
387 388
	rdmsr

389
	btsl $_EFER_NX, %eax
L
Linus Torvalds 已提交
390 391 392
	/* Make changes effective */
	wrmsr

393
.Lenable_paging:
L
Linus Torvalds 已提交
394 395 396 397

/*
 * Enable paging
 */
398
	movl $pa(initial_page_table), %eax
L
Linus Torvalds 已提交
399
	movl %eax,%cr3		/* set the page table pointer.. */
400
	movl $CR0_STATE,%eax
L
Linus Torvalds 已提交
401 402 403
	movl %eax,%cr0		/* ..and set paging (PG) bit */
	ljmp $__BOOT_CS,$1f	/* Clear prefetch and normalize %eip */
1:
404 405
	/* Shift the stack pointer to a virtual address */
	addl $__PAGE_OFFSET, %esp
L
Linus Torvalds 已提交
406 407 408 409 410

/*
 * start system 32-bit setup. We need to re-do some of the things done
 * in 16-bit mode for the "real" operations.
 */
411 412 413 414 415
	movl setup_once_ref,%eax
	andl %eax,%eax
	jz 1f				# Did we do this already?
	call *%eax
1:
416

L
Linus Torvalds 已提交
417
/*
418
 * Check if it is 486
L
Linus Torvalds 已提交
419
 */
420
	movb $4,X86			# at least 486
421
	cmpl $-1,X86_CPUID
422
	je .Lis486
L
Linus Torvalds 已提交
423 424 425 426 427 428 429 430 431 432

	/* get vendor info */
	xorl %eax,%eax			# call CPUID with 0 -> return vendor ID
	cpuid
	movl %eax,X86_CPUID		# save CPUID level
	movl %ebx,X86_VENDOR_ID		# lo 4 chars
	movl %edx,X86_VENDOR_ID+4	# next 4 chars
	movl %ecx,X86_VENDOR_ID+8	# last 4 chars

	orl %eax,%eax			# do we have processor info as well?
433
	je .Lis486
L
Linus Torvalds 已提交
434 435 436 437 438 439 440 441 442 443 444 445 446

	/*
	 * CPUID leaf 1.  From the returned %eax this code extracts:
	 *   %al bits 3:0 -> X86_MASK  (revision)
	 *   %al bits 7:4 -> X86_MODEL
	 *   %ah bits 3:0 -> X86       (family)
	 * and stores %edx unchanged into X86_CAPABILITY.
	 */
	movl $1,%eax		# Use the CPUID instruction to get CPU type
	cpuid
	movb %al,%cl		# keep a copy of %al; %al itself is masked and shifted below
	andb $0x0f,%ah		# mask processor family
	movb %ah,X86
	andb $0xf0,%al		# mask model
	shrb $4,%al		# move model down into the low nibble
	movb %al,X86_MODEL
	andb $0x0f,%cl		# mask revision (low nibble of the saved %al)
	movb %cl,X86_MASK
	movl %edx,X86_CAPABILITY

447
.Lis486:
448
	movl $0x50022,%ecx	# set AM, WP, NE and MP
449
	movl %cr0,%eax
L
Linus Torvalds 已提交
450 451 452 453
	andl $0x80000011,%eax	# Save PG,PE,ET
	orl %ecx,%eax
	movl %eax,%cr0

454
	lgdt early_gdt_descr
L
Linus Torvalds 已提交
455 456 457 458 459 460 461 462 463
	lidt idt_descr
	ljmp $(__KERNEL_CS),$1f
1:	movl $(__KERNEL_DS),%eax	# reload all the segment registers
	movl %eax,%ss			# after changing gdt.

	movl $(__USER_DS),%eax		# DS/ES contains default USER segment
	movl %eax,%ds
	movl %eax,%es

464 465 466
	movl $(__KERNEL_PERCPU), %eax
	movl %eax,%fs			# set this cpu's percpu

467
	movl $(__KERNEL_STACK_CANARY),%eax
468
	movl %eax,%gs
469 470

	xorl %eax,%eax			# Clear LDT
L
Linus Torvalds 已提交
471
	lldt %ax
472

473
	pushl $0		# fake return address for unwinder
G
Glauber Costa 已提交
474
	jmp *(initial_code)
L
Linus Torvalds 已提交
475

476 477
#include "verify_cpu.S"

L
Linus Torvalds 已提交
478
/*
479
 *  setup_once
L
Linus Torvalds 已提交
480
 *
481
 *  The setup work we only want to run on the BSP.
L
Linus Torvalds 已提交
482 483 484
 *
 *  Warning: %esi is live across this function.
 */
485 486 487
__INIT
setup_once:
	/*
488 489 490 491 492
	 * Set up an idt with 256 interrupt gates that push zero if there
	 * is no error code and then jump to early_idt_handler_common.
	 * It doesn't actually load the idt - that needs to be done on
	 * each CPU. Interrupts are enabled elsewhere, when we can be
	 * relatively sure everything is ok.
493
	 */
L
Linus Torvalds 已提交
494

495
	movl $idt_table,%edi
496
	movl $early_idt_handler_array,%eax
497 498
	movl $NUM_EXCEPTION_VECTORS,%ecx
1:
L
Linus Torvalds 已提交
499
	movl %eax,(%edi)
500 501 502
	movl %eax,4(%edi)
	/* interrupt gate, dpl=0, present */
	movl $(0x8E000000 + __KERNEL_CS),2(%edi)
503
	addl $EARLY_IDT_HANDLER_SIZE,%eax
L
Linus Torvalds 已提交
504
	addl $8,%edi
505
	loop 1b
506

507 508
	movl $256 - NUM_EXCEPTION_VECTORS,%ecx
	movl $ignore_int,%edx
509
	movl $(__KERNEL_CS << 16),%eax
510
	movw %dx,%ax		/* selector = 0x0010 = cs */
511
	movw $0x8E00,%dx	/* interrupt gate - dpl=0, present */
512 513 514 515 516
2:
	movl %eax,(%edi)
	movl %edx,4(%edi)
	addl $8,%edi
	loop 2b
517

518 519 520 521 522 523 524 525 526 527 528 529 530
#ifdef CONFIG_CC_STACKPROTECTOR
	/*
	 * Configure the stack canary. The linker can't handle this by
	 * relocation.  Manually set base address in stack canary
	 * segment descriptor.
	 *
	 * The 32-bit base of an x86 segment descriptor is not contiguous:
	 * bits 15:0 live at byte offset 2, bits 23:16 at byte offset 4 and
	 * bits 31:24 at byte offset 7 of the 8-byte descriptor, hence the
	 * three separate stores below.
	 */
	movl $gdt_page,%eax		/* %eax = address of gdt_page */
	movl $stack_canary,%ecx		/* %ecx = address to install as the segment base */
	movw %cx, 8 * GDT_ENTRY_STACK_CANARY + 2(%eax)	/* base bits 15:0 */
	shrl $16, %ecx			/* bring base bits 31:16 down into %cx */
	movb %cl, 8 * GDT_ENTRY_STACK_CANARY + 4(%eax)	/* base bits 23:16 */
	movb %ch, 8 * GDT_ENTRY_STACK_CANARY + 7(%eax)	/* base bits 31:24 */
#endif
531

532
	andl $0,setup_once_ref	/* Once is enough, thanks */
L
Linus Torvalds 已提交
533 534
	ret

535
ENTRY(early_idt_handler_array)
536 537 538 539 540 541
	# 36(%esp) %eflags
	# 32(%esp) %cs
	# 28(%esp) %eip
	# 24(%esp) error code
	i = 0
	.rept NUM_EXCEPTION_VECTORS
542
	.ifeq (EXCEPTION_ERRCODE_MASK >> i) & 1
543 544 545
	pushl $0		# Dummy error code, to make stack frame uniform
	.endif
	pushl $i		# 20(%esp) Vector number
546
	jmp early_idt_handler_common
547
	i = i + 1
548
	.fill early_idt_handler_array + i*EARLY_IDT_HANDLER_SIZE - ., 1, 0xcc
549
	.endr
550
ENDPROC(early_idt_handler_array)
551
	
552 553 554 555 556
early_idt_handler_common:
	/*
	 * The stack is the hardware frame, an error code or zero, and the
	 * vector number.
	 */
557
	cld
558

559
	incl %ss:early_recursion_flag
560

561
	/* The vector number is in pt_regs->gs */
562

563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606
	/*
	 * Push the remaining registers below the vector number and error
	 * code, pass the resulting frame to early_fixup_exception(), then
	 * pop everything in exact reverse order and return with iret.
	 *
	 * NOTE(review): the direction flag was already cleared by the cld at
	 * the top of this handler, so the cld below looks redundant - confirm
	 * before removing.
	 */
	cld
	pushl	%fs		/* pt_regs->fs */
	movw	$0, 2(%esp)	/* clear high bits (some CPUs leave garbage) */
	pushl	%es		/* pt_regs->es */
	movw	$0, 2(%esp)	/* clear high bits (some CPUs leave garbage) */
	pushl	%ds		/* pt_regs->ds */
	movw	$0, 2(%esp)	/* clear high bits (some CPUs leave garbage) */
	pushl	%eax		/* pt_regs->ax */
	pushl	%ebp		/* pt_regs->bp */
	pushl	%edi		/* pt_regs->di */
	pushl	%esi		/* pt_regs->si */
	pushl	%edx		/* pt_regs->dx */
	pushl	%ecx		/* pt_regs->cx */
	pushl	%ebx		/* pt_regs->bx */

	/* Fix up DS and ES */
	movl	$(__KERNEL_DS), %ecx
	movl	%ecx, %ds
	movl	%ecx, %es

	/*
	 * Load the vector number into EDX.  It must be read before the next
	 * two stores, which overwrite the same PT_GS slot with %gs.
	 */
	movl	PT_GS(%esp), %edx

	/* Load GS into pt_regs->gs and clear high bits */
	movw	%gs, PT_GS(%esp)
	movw	$0, PT_GS+2(%esp)

	movl	%esp, %eax	/* args are pt_regs (EAX), trapnr (EDX) */
	call	early_fixup_exception

	/* Restore registers in the reverse order of the pushes above. */
	popl	%ebx		/* pt_regs->bx */
	popl	%ecx		/* pt_regs->cx */
	popl	%edx		/* pt_regs->dx */
	popl	%esi		/* pt_regs->si */
	popl	%edi		/* pt_regs->di */
	popl	%ebp		/* pt_regs->bp */
	popl	%eax		/* pt_regs->ax */
	popl	%ds		/* pt_regs->ds */
	popl	%es		/* pt_regs->es */
	popl	%fs		/* pt_regs->fs */
	popl	%gs		/* pt_regs->gs (slot was rewritten with %gs above) */
	decl	%ss:early_recursion_flag	/* balances the incl at handler entry */
	addl	$4, %esp	/* pop pt_regs->orig_ax */
	iret
607
ENDPROC(early_idt_handler_common)
608

L
Linus Torvalds 已提交
609 610 611 612
/* This is the default interrupt "handler" :-) */
	ALIGN
ignore_int:
	cld
M
Matt Mackall 已提交
613
#ifdef CONFIG_PRINTK
L
Linus Torvalds 已提交
614 615 616 617 618 619 620 621
	pushl %eax
	pushl %ecx
	pushl %edx
	pushl %es
	pushl %ds
	movl $(__KERNEL_DS),%eax
	movl %eax,%ds
	movl %eax,%es
622 623 624
	cmpl $2,early_recursion_flag
	je hlt_loop
	incl early_recursion_flag
L
Linus Torvalds 已提交
625 626 627 628 629 630
	pushl 16(%esp)
	pushl 24(%esp)
	pushl 32(%esp)
	pushl 40(%esp)
	pushl $int_msg
	call printk
631 632 633

	call dump_stack

L
Linus Torvalds 已提交
634 635 636 637 638 639
	addl $(5*4),%esp
	popl %ds
	popl %es
	popl %edx
	popl %ecx
	popl %eax
M
Matt Mackall 已提交
640
#endif
L
Linus Torvalds 已提交
641
	iret
642 643 644 645

hlt_loop:
	hlt
	jmp hlt_loop
646 647 648
ENDPROC(ignore_int)
__INITDATA
	.align 4
649
GLOBAL(early_recursion_flag)
650
	.long 0
L
Linus Torvalds 已提交
651

652 653
__REFDATA
	.align 4
T
Thomas Gleixner 已提交
654 655
ENTRY(initial_code)
	.long i386_start_kernel
656 657
ENTRY(setup_once_ref)
	.long setup_once
T
Thomas Gleixner 已提交
658

L
Linus Torvalds 已提交
659 660 661
/*
 * BSS section
 */
662
__PAGE_ALIGNED_BSS
663
	.align PAGE_SIZE
664
#ifdef CONFIG_X86_PAE
665
initial_pg_pmd:
666 667
	.fill 1024*KPMDS,4,0
#else
668
ENTRY(initial_page_table)
L
Linus Torvalds 已提交
669
	.fill 1024,4,0
670
#endif
671
initial_pg_fixmap:
E
Eric W. Biderman 已提交
672
	.fill 1024,4,0
L
Linus Torvalds 已提交
673 674
ENTRY(empty_zero_page)
	.fill 4096,1,0
675 676
ENTRY(swapper_pg_dir)
	.fill 1024,4,0
677
EXPORT_SYMBOL(empty_zero_page)
678

L
Linus Torvalds 已提交
679 680 681
/*
 * This starts the data section.
 */
682
#ifdef CONFIG_X86_PAE
683
__PAGE_ALIGNED_DATA
684
	/* Page-aligned for the benefit of paravirt? */
685
	.align PAGE_SIZE
686 687
ENTRY(initial_page_table)
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0	/* low identity map */
688
# if KPMDS == 3
689 690 691
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR+0x1000),0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR+0x2000),0
692 693
# elif KPMDS == 2
	.long	0,0
694 695
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR+0x1000),0
696 697 698
# elif KPMDS == 1
	.long	0,0
	.long	0,0
699
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0
700 701 702
# else
#  error "Kernel PMDs should be 1, 2 or 3"
# endif
703
	.align PAGE_SIZE		/* needs to be page-sized too */
704 705
#endif

L
Linus Torvalds 已提交
706
.data
707
.balign 4
708
ENTRY(initial_stack)
L
Linus Torvalds 已提交
709 710
	.long init_thread_union+THREAD_SIZE

711
__INITRODATA
L
Linus Torvalds 已提交
712
int_msg:
713
	.asciz "Unknown interrupt or fault at: %p %p %p\n"
L
Linus Torvalds 已提交
714

T
Thomas Gleixner 已提交
715
#include "../../x86/xen/xen-head.S"
716

L
Linus Torvalds 已提交
717 718 719 720 721 722 723
/*
 * The IDT and GDT 'descriptors' are a strange 48-bit object
 * only used by the lidt and lgdt instructions. They are not
 * like usual segment descriptors - they consist of a 16-bit
 * segment size, and 32-bit linear address value:
 */

724
	.data
L
Linus Torvalds 已提交
725 726 727 728 729 730 731 732
.globl boot_gdt_descr
.globl idt_descr

	ALIGN
# early boot GDT descriptor (must use 1:1 address mapping)
	.word 0				# 32 bit align gdt_desc.address
boot_gdt_descr:
	.word __BOOT_DS+7
733
	.long boot_gdt - __PAGE_OFFSET
L
Linus Torvalds 已提交
734 735 736 737 738 739 740 741

	.word 0				# 32-bit align idt_desc.address
idt_descr:
	.word IDT_ENTRIES*8-1		# idt contains 256 entries
	.long idt_table

# boot GDT descriptor (later on used by CPU#0):
	.word 0				# 32 bit align gdt_desc.address
742
ENTRY(early_gdt_descr)
L
Linus Torvalds 已提交
743
	.word GDT_ENTRIES*8-1
R
Rusty Russell 已提交
744
	.long gdt_page			/* Overwritten for secondary CPUs */
L
Linus Torvalds 已提交
745 746

/*
747
 * The boot_gdt must mirror the equivalent in setup.S and is
L
Linus Torvalds 已提交
748 749 750
 * used only for booting.
 */
	.align L1_CACHE_BYTES
751
ENTRY(boot_gdt)
L
Linus Torvalds 已提交
752 753 754
	.fill GDT_ENTRY_BOOT_CS,8,0
	.quad 0x00cf9a000000ffff	/* kernel 4GB code at 0x00000000 */
	.quad 0x00cf92000000ffff	/* kernel 4GB data at 0x00000000 */