head_64.S 7.7 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
/*
 *  linux/boot/head.S
 *
 *  Copyright (C) 1991, 1992, 1993  Linus Torvalds
 */

/*
 *  head.S contains the 32-bit startup code.
 *
 * NOTE!!! Startup happens at absolute address 0x00001000, which is also where
 * the page directory will exist. The startup code will be overwritten by
 * the page directory. [According to comments etc elsewhere on a compressed
 * kernel it will end up at 0x1000 + 1Mb I hope so as I assume this. - AC]
 *
 * Page 0 is deliberately kept safe, since System Management Mode code in 
 * laptops may need to access the BIOS data stored there.  This is also
 * useful for future device drivers that access the BIOS via VM86
 * mode.
 */

/*
22
 * High loaded stuff by Hans Lermen & Werner Almesberger, Feb. 1996
L
Linus Torvalds 已提交
23
 */
24 25
	.code32
	.text
L
Linus Torvalds 已提交
26 27 28

#include <linux/linkage.h>
#include <asm/segment.h>
29 30
#include <asm/pgtable_types.h>
#include <asm/page_types.h>
31
#include <asm/boot.h>
32
#include <asm/msr.h>
33
#include <asm/processor-flags.h>
34
#include <asm/asm-offsets.h>
L
Linus Torvalds 已提交
35

36
	.section ".text.head"
L
Linus Torvalds 已提交
37
	.code32
38
ENTRY(startup_32)
L
Linus Torvalds 已提交
39
	cld
40 41 42 43
	/*
	 * Test KEEP_SEGMENTS flag to see if the bootloader is asking
	 * us to not reload segments
	 */
44 45 46
	testb $(1<<6), BP_loadflags(%esi)
	jnz 1f

L
Linus Torvalds 已提交
47
	cli
48 49 50 51
	movl	$(__KERNEL_DS), %eax
	movl	%eax, %ds
	movl	%eax, %es
	movl	%eax, %ss
52
1:
53

54 55
/*
 * Calculate the delta between where we were compiled to run
56 57 58
 * at and where we were actually loaded at.  This can only be done
 * with a short local call on x86.  Nothing  else will tell us what
 * address we are running at.  The reserved chunk of the real-mode
59 60
 * data at 0x1e4 (defined as a scratch field) is used as the stack
 * for this calculation. Only 4 bytes are needed.
61
 */
62
	leal	(BP_scratch+4)(%esi), %esp
63 64 65 66
	/*
	 * call pushes the address the CPU is really executing label 1 at;
	 * popping it and subtracting the link-time address of the same label
	 * leaves the load delta in %ebp.
	 */
	call	1f
1:	popl	%ebp
	subl	$1b, %ebp

67
/* setup a stack and make sure cpu supports long mode. */
68
	movl	$boot_stack_end, %eax
69 70 71 72 73 74 75
	/*
	 * %eax holds the link-time address of boot_stack_end; adding the
	 * load delta in %ebp turns it into the address it really lives at.
	 */
	addl	%ebp, %eax
	movl	%eax, %esp

	/* A nonzero %eax on return from verify_cpu diverts to no_longmode. */
	call	verify_cpu
	testl	%eax, %eax
	jnz	no_longmode

76 77
/*
 * Compute the delta between where we were compiled to run at
78
 * and where the code will actually run at.
79 80
 *
 * %ebp contains the address we are loaded at by the boot loader and %ebx
81 82 83 84 85 86
 * contains the address where we should move the kernel image temporarily
 * for safe in-place decompression.
 */

#ifdef CONFIG_RELOCATABLE
	movl	%ebp, %ebx
87 88
	addl	$(PMD_PAGE_SIZE -1), %ebx
	andl	$PMD_PAGE_MASK, %ebx
89 90 91 92 93 94 95 96 97 98 99 100 101 102
#else
	movl	$CONFIG_PHYSICAL_START, %ebx
#endif

	/*
	 * Replace the compressed data size with the uncompressed size:
	 * %ebx = %ebx - input_len + output_len.  Both lengths are read
	 * relative to %ebp, the load delta computed earlier.
	 */
	subl	input_len(%ebp), %ebx
	movl	output_len(%ebp), %eax
	addl	%eax, %ebx
	/*
	 * Add 8 bytes for every 32K input block.  The count is derived from
	 * output_len, which %eax still holds: output_len >> 12 is 8 bytes
	 * per 32K of output_len.
	 */
	shrl	$12, %eax
	addl	%eax, %ebx
	/*
	 * Add 32K + 18 bytes of extra slack and align on a 4K boundary
	 * (adding 4095 before masking rounds up rather than down).
	 */
	addl	$(32768 + 18 + 4095), %ebx
	andl	$~4095, %ebx
L
Linus Torvalds 已提交
103 104

/*
105
 * Prepare for entering 64 bit mode
L
Linus Torvalds 已提交
106
 */
107 108 109 110 111 112 113 114

	/*
	 * Load new GDT with the 64bit segments using 32bit descriptor.
	 *
	 * The table at gdt starts with a 16-bit limit followed by a 32-bit
	 * base.  The base (at gdt+2) is overwritten here with the address the
	 * table really sits at (link address + load delta in %ebp) before
	 * lgdt reads limit and base from the same location.
	 */
	leal	gdt(%ebp), %eax
	movl	%eax, gdt+2(%ebp)
	lgdt	gdt(%ebp)

	/* Enable PAE mode */
	xorl	%eax, %eax
115
	orl	$(X86_CR4_PAE), %eax
116 117 118 119 120
	movl	%eax, %cr4

 /*
  * Build early 4G boot pagetable
  */
121
	/* Initialize Page tables to 0 */
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161
	/*
	 * The tables are built at pgtable + %ebx, i.e. relative to the
	 * relocation target computed above.  All six 4K pages are cleared
	 * first with dword stores ((4096*6)/4 of them); the .pgtable section
	 * is not part of .bss and is not zeroed by anyone else.
	 */
	leal	pgtable(%ebx), %edi
	xorl	%eax, %eax
	movl	$((4096*6)/4), %ecx
	rep	stosl

	/*
	 * Build Level 4: entry 0 of the first page points at the second page
	 * (pgtable + 0x1000).  The low bits 0x7 are the entry flags (present,
	 * writable, user in the x86 paging-entry format).
	 */
	leal	pgtable + 0(%ebx), %edi
	leal	0x1007 (%edi), %eax
	movl	%eax, 0(%edi)

	/*
	 * Build Level 3: four consecutive 8-byte entries in the second page,
	 * pointing at the pages pgtable + 0x2000 .. pgtable + 0x5000, again
	 * with flags 0x7.  Only the low dword of each entry is written; the
	 * high dword is still zero from the clear above.
	 */
	leal	pgtable + 0x1000(%ebx), %edi
	leal	0x1007(%edi), %eax
	movl	$4, %ecx
1:	movl	%eax, 0x00(%edi)
	addl	$0x00001000, %eax
	addl	$8, %edi
	decl	%ecx
	jnz	1b

	/*
	 * Build Level 2: 2048 consecutive 8-byte entries filling the four
	 * pages from pgtable + 0x2000.  The mapped address starts at 0 and
	 * advances by 0x00200000 (2M) per entry, so 2048 entries identity-map
	 * the first 4G.  Flags 0x183 = present | writable | page-size (bit 7)
	 * | global (bit 8) in the x86 paging-entry format.
	 */
	leal	pgtable + 0x2000(%ebx), %edi
	movl	$0x00000183, %eax
	movl	$2048, %ecx
1:	movl	%eax, 0(%edi)
	addl	$0x00200000, %eax
	addl	$8, %edi
	decl	%ecx
	jnz	1b

	/* Enable the boot page tables: CR3 = address of the Level 4 page */
	leal	pgtable(%ebx), %eax
	movl	%eax, %cr3

	/*
	 * Enable Long mode in EFER (Extended Feature Enable Register):
	 * read the MSR selected by %ecx, set the LME bit in the low half
	 * (%eax) and write it back.  Paging is not turned on here.
	 */
	movl	$MSR_EFER, %ecx
	rdmsr
	btsl	$_EFER_LME, %eax
	wrmsr

162 163
	/*
	 * Setup for the jump to 64bit mode
164 165 166 167 168 169 170 171 172 173 174 175 176
	 *
	 * When the jump is performed we will be in long mode but
	 * in 32bit compatibility mode with EFER.LME = 1, CS.L = 0, CS.D = 1
	 * (and in turn EFER.LMA = 1).	To jump into 64bit mode we use
	 * the new gdt/idt that has __KERNEL_CS with CS.L = 1.
	 * We place all of the values on our mini stack so lret can
	 * be used to perform that far jump.
	 */
	/*
	 * Build the frame lret will consume: the code segment selector is
	 * pushed first, then the offset, so the offset ends up on top of the
	 * stack.  startup_64 is adjusted by the load delta in %ebp to get the
	 * address it really sits at.
	 */
	pushl	$__KERNEL_CS
	leal	startup_64(%ebp), %eax
	pushl	%eax

	/* Enter paged protected Mode, activating Long Mode */
177
	movl	$(X86_CR0_PG | X86_CR0_PE), %eax /* Enable Paging and Protected mode */
178 179 180 181
	/* Write the value prepared in %eax (paging + protected mode) to CR0. */
	movl	%eax, %cr0

	/*
	 * Jump from 32bit compatibility mode into 64bit mode.
	 * lret pops the startup_64 address and the __KERNEL_CS selector that
	 * were pushed above.
	 */
	lret
182
ENDPROC(startup_32)
183

184 185 186 187 188 189
no_longmode:
	/*
	 * Reached from startup_32 when verify_cpu hands back a nonzero
	 * result: this isn't an x86-64 CPU, so there is nothing left to do
	 * but hang.  The loop re-issues hlt every time the CPU comes back
	 * out of the halt.
	 */
.Lno_longmode_halt:
	hlt
	jmp	.Lno_longmode_halt

T
Thomas Gleixner 已提交
190
#include "../../kernel/verify_cpu_64.S"
191

192 193
	/*
	 * Be careful here startup_64 needs to be at a predictable
194 195 196 197 198
	 * address so I can export it in an ELF header.  Bootloaders
	 * should look at the ELF header to find this address, as
	 * it may change in the future.
	 */
	.code64
199
	.org 0x200
200
ENTRY(startup_64)
201 202
	/*
	 * We come here either from startup_32 or directly from a
203 204 205 206 207 208 209 210 211 212
	 * 64bit bootloader.  If we come here from a bootloader we depend on
	 * an identity mapped page table being provided that maps our
	 * entire text+data+bss and hopefully all of memory.
	 */

	/* Setup data segments. */
	xorl	%eax, %eax
	movl	%eax, %ds
	movl	%eax, %es
	movl	%eax, %ss
213 214 215 216 217
	/*
	 * %eax is still zero here (it was cleared before the %ds load), so
	 * %fs, %gs and the LDT register are all loaded with the null selector.
	 */
	movl	%eax, %fs
	movl	%eax, %gs
	lldt	%ax
	/*
	 * 0x20 is the byte offset of the "TS descriptor" entry in the gdt
	 * table defined at the end of this file; load it into the task
	 * register.
	 */
	movl    $0x20, %eax
	ltr	%ax
218

219 220
	/*
	 * Compute the decompressed kernel start address.  It is where
221 222 223 224 225 226 227 228 229 230 231
	 * we were loaded at aligned to a 2M boundary. %rbp contains the
	 * decompressed kernel start address.
	 *
	 * If it is a relocatable kernel then decompress and run the kernel
	 * from load address aligned to 2MB addr, otherwise decompress and
	 * run the kernel from CONFIG_PHYSICAL_START
	 */

	/* Start with the delta to where the kernel will run at. */
#ifdef CONFIG_RELOCATABLE
	leaq	startup_32(%rip) /* - $startup_32 */, %rbp
232 233
	addq	$(PMD_PAGE_SIZE - 1), %rbp
	andq	$PMD_PAGE_MASK, %rbp
234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251
	movq	%rbp, %rbx
#else
	movq	$CONFIG_PHYSICAL_START, %rbp
	movq	%rbp, %rbx
#endif

	/*
	 * Replace the compressed data size with the uncompressed size:
	 * %rbx = %rbx - input_len + output_len.  The 32-bit loads into %eax
	 * zero the upper half of %rax, so the 64-bit arithmetic on %rax that
	 * follows sees the unsigned 32-bit lengths.
	 */
	movl	input_len(%rip), %eax
	subq	%rax, %rbx
	movl	output_len(%rip), %eax
	addq	%rax, %rbx
	/*
	 * Add 8 bytes for every 32K input block.  The count is derived from
	 * output_len, which %rax still holds: output_len >> 12 is 8 bytes
	 * per 32K of output_len.
	 */
	shrq	$12, %rax
	addq	%rax, %rbx
	/*
	 * Add 32K + 18 bytes of extra slack and align on a 4K boundary
	 * (adding 4095 before masking rounds up rather than down).
	 */
	addq	$(32768 + 18 + 4095), %rbx
	andq	$~4095, %rbx

252 253 254 255 256 257 258
	/*
	 * Set up the stack: boot_stack_end offset by %rbx, the relocation
	 * target computed just above, so the stack lives in the copy of the
	 * image that the code below creates.
	 */
	leaq	boot_stack_end(%rbx), %rsp

	/* Zero EFLAGS by pushing a zero and popping it into the flags register */
	pushq	$0
	popfq

259 260
/*
 * Copy the compressed kernel to the end of our buffer
261 262
 * where decompression in place becomes safe.
 */
263 264 265
	pushq	%rsi
	leaq	(_bss-8)(%rip), %rsi
	leaq	(_bss-8)(%rbx), %rdi
266
	movq	$_bss /* - $startup_32 */, %rcx
267 268 269 270 271
	/* %rcx was loaded with a byte count; turn it into a count of 8-byte words. */
	shrq	$3, %rcx
	/*
	 * Copy with the direction flag set, i.e. from the highest address
	 * downwards: %rsi and %rdi were pointed at the last quadword
	 * (_bss - 8) of source and destination.
	 */
	std
	rep	movsq
	/* Restore the forward direction for everything that follows. */
	cld
	/* Get back the %rsi value that was pushed before the copy borrowed the register. */
	popq	%rsi
272 273 274 275 276 277 278

/*
 * Jump to the relocated address.
 *
 * The target is formed as relocated + %rbx, the same symbol + %rbx form
 * that was used for the destination of the copy above, so execution
 * continues in the copy rather than in the image we are running from now.
 * The indirect jump through %rax makes the absolute target explicit.
 */
	leaq	relocated(%rbx), %rax
	jmp	*%rax

279
	.text
280 281
relocated:

L
Linus Torvalds 已提交
282
/*
283
 * Clear BSS (stack is currently empty)
L
Linus Torvalds 已提交
284
 */
285 286 287
	xorl	%eax, %eax
	leaq    _bss(%rip), %rdi
	leaq    _ebss(%rip), %rcx
288
	subq	%rdi, %rcx
289 290
	shrq	$3, %rcx
	rep	stosq
291

L
Linus Torvalds 已提交
292 293 294
/*
 * Do the decompression, and jump to the new kernel..
 */
295 296
	pushq	%rsi			# Save the real mode argument
	movq	%rsi, %rdi		# real mode address
297
	leaq	boot_heap(%rip), %rsi	# malloc area for uncompression
298 299 300 301 302 303
	leaq	input_data(%rip), %rdx  # input_data: address of the compressed payload
	/* 32-bit load: the upper half of %rax is zeroed before the copy to %rcx */
	movl	input_len(%rip), %eax
	movq	%rax, %rcx		# input_len
	movq	%rbp, %r8		# output: decompressed kernel start address
	call	decompress_kernel
	/* Restore the real mode argument that was pushed before the call */
	popq	%rsi
L
Linus Torvalds 已提交
304 305

/*
306
 * Jump to the decompressed kernel.
L
Linus Torvalds 已提交
307
 */
308
	jmp	*%rbp
L
Linus Torvalds 已提交
309

310 311 312 313 314 315 316 317
	.data
/*
 * Boot GDT used for the switch to 64-bit mode.
 *
 * The first 8 bytes double as the operand for lgdt: a 16-bit limit
 * followed by a 32-bit base (and 2 bytes of padding).  They occupy the
 * first 8-byte slot of the table itself.  startup_32 overwrites the
 * base field at gdt+2 with the address the table is really loaded at
 * before executing lgdt.
 *
 * The limit is the offset of the last valid byte of the table, so it is
 * the table size minus one, not the size.
 */
gdt:
	.word	gdt_end - gdt - 1
	.long	gdt
	.word	0
	.quad	0x0000000000000000	/* NULL descriptor */
	.quad	0x00af9a000000ffff	/* __KERNEL_CS */
	.quad	0x00cf92000000ffff	/* __KERNEL_DS */
318 319
	.quad	0x0080890000000000	/* TS descriptor */
	.quad   0x0000000000000000	/* TS continued */
320
gdt_end:
321

322 323 324 325 326
/*
 * Stack and heap for uncompression
 */
	.bss
	.balign 4
327 328 329 330 331
/* Heap: its address is passed to decompress_kernel as the malloc area. */
boot_heap:
	.fill BOOT_HEAP_SIZE, 1, 0
/*
 * Stack: startup_32 and startup_64 both point the stack pointer at
 * boot_stack_end, the address just past the BOOT_STACK_SIZE bytes
 * reserved at boot_stack.
 */
boot_stack:
	.fill BOOT_STACK_SIZE, 1, 0
boot_stack_end:
332 333 334 335 336 337 338 339

/*
 * Space for page tables (not in .bss so not zeroed)
 *
 * Six 4K pages, 4K aligned.  startup_32 clears them itself and then uses
 * the first page for the Level 4 table, the second for the Level 3 table
 * and the remaining four for the Level 2 tables.
 */
	.section ".pgtable","a",@nobits
	.balign 4096
pgtable:
	.fill 6*4096, 1, 0