/*
 *  linux/arch/i386/entry.S
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 */

/*
 * entry.S contains the system-call and fault low-level handling routines.
 * This also contains the timer-interrupt handler, as well as all interrupts
 * and faults that can result in a task-switch.
 *
 * NOTE: This code handles signal-recognition, which happens every time
 * after a timer-interrupt and after each system call.
 *
 * I changed all the .align's to 4 (16 byte alignment), as that's faster
 * on a 486.
 *
 * Stack layout in 'ret_from_system_call':
 * 	ptrace needs to have all regs on the stack.
 *	if the order here is changed, it needs to be
 *	updated in fork.c:copy_process, signal.c:do_signal,
 *	ptrace.c and ptrace.h
 *
 *	 0(%esp) - %ebx
 *	 4(%esp) - %ecx
 *	 8(%esp) - %edx
 *       C(%esp) - %esi
 *	10(%esp) - %edi
 *	14(%esp) - %ebp
 *	18(%esp) - %eax
 *	1C(%esp) - %ds
 *	20(%esp) - %es
 *	24(%esp) - orig_eax
 *	28(%esp) - %eip
 *	2C(%esp) - %cs
 *	30(%esp) - %eflags
 *	34(%esp) - %oldesp
 *	38(%esp) - %oldss
 *
 * "current" is in register %ebx during any slow entries.
 */

#include <linux/linkage.h>
#include <asm/thread_info.h>
#include <asm/irqflags.h>
#include <asm/errno.h>
#include <asm/segment.h>
#include <asm/smp.h>
#include <asm/page.h>
#include <asm/desc.h>
#include <asm/dwarf2.h>
#include "irq_vectors.h"

/*
 * Number of entries in sys_call_table: the table size in bytes divided
 * by the 4-byte entry size (the table is indexed with a scale of 4).
 */
#define nr_syscalls ((syscall_table_size)/4)

/*
 * Byte offsets of the saved registers relative to %esp.  They mirror the
 * "Stack layout" table in the comment at the top of this file.
 */
EBX		= 0x00
ECX		= 0x04
EDX		= 0x08
ESI		= 0x0C
EDI		= 0x10
EBP		= 0x14
EAX		= 0x18
DS		= 0x1C
ES		= 0x20
ORIG_EAX	= 0x24
EIP		= 0x28
CS		= 0x2C
EFLAGS		= 0x30
OLDESP		= 0x34
OLDSS		= 0x38

/* Masks for individual bits of the saved EFLAGS image. */
CF_MASK		= 0x00000001
TF_MASK		= 0x00000100
IF_MASK		= 0x00000200
DF_MASK		= 0x00000400
NT_MASK		= 0x00004000
VM_MASK		= 0x00020000

/*
 * Native versions of the privileged operations used in this file.
 * These are the definitions that get replaced for paravirtualization.
 */
#define DISABLE_INTERRUPTS		cli
#define ENABLE_INTERRUPTS		sti
#define ENABLE_INTERRUPTS_SYSEXIT	sti; sysexit
#define INTERRUPT_RETURN		iret
#define GET_CR0_INTO_EAX		movl %cr0, %eax

/*
 * preempt_stop: with CONFIG_PREEMPT it disables interrupts (and tells the
 * irq-flags tracer); without it, it expands to nothing.
 * Without CONFIG_PREEMPT there is also no separate resume_kernel routine,
 * so that name is aliased to restore_nocheck.
 */
#ifdef CONFIG_PREEMPT
#define preempt_stop		DISABLE_INTERRUPTS; TRACE_IRQS_OFF
#else
#define preempt_stop
#define resume_kernel		restore_nocheck
#endif

/*
 * TRACE_IRQS_IRET: for use before returning through the saved frame.
 * If the EFLAGS image on the stack has IF set, emit TRACE_IRQS_ON;
 * otherwise skip it.  Expands to nothing unless CONFIG_TRACE_IRQFLAGS
 * is defined.  Expects %esp to point at the register frame so that
 * EFLAGS(%esp) is valid.
 */
.macro TRACE_IRQS_IRET
#ifdef CONFIG_TRACE_IRQFLAGS
	testl $IF_MASK,EFLAGS(%esp)     # interrupts off?
	jz 1f
	TRACE_IRQS_ON
1:
#endif
.endm

/*
 * Where the signal-delivery paths jump after do_notify_resume returns:
 * with CONFIG_VM86 the EFLAGS/CS check at check_userspace is repeated,
 * otherwise control goes straight to resume_userspace.
 */
#ifdef CONFIG_VM86
#define resume_userspace_sig	check_userspace
#else
#define resume_userspace_sig	resume_userspace
#endif

/*
 * SAVE_ALL: clear the direction flag and push %es, %ds, %eax, %ebp, %edi,
 * %esi, %edx, %ecx, %ebx, in that order, so that the resulting frame
 * matches the EBX..ES offsets defined above.  Each push is followed by
 * the matching CFI annotation (the segment-register ones are commented
 * out).  Finally %ds and %es are loaded with __USER_DS.
 * Clobbers: %edx (used to load the segment registers) and DF.
 */
#define SAVE_ALL \
	cld; \
	pushl %es; \
	CFI_ADJUST_CFA_OFFSET 4;\
	/*CFI_REL_OFFSET es, 0;*/\
	pushl %ds; \
	CFI_ADJUST_CFA_OFFSET 4;\
	/*CFI_REL_OFFSET ds, 0;*/\
	pushl %eax; \
	CFI_ADJUST_CFA_OFFSET 4;\
	CFI_REL_OFFSET eax, 0;\
	pushl %ebp; \
	CFI_ADJUST_CFA_OFFSET 4;\
	CFI_REL_OFFSET ebp, 0;\
	pushl %edi; \
	CFI_ADJUST_CFA_OFFSET 4;\
	CFI_REL_OFFSET edi, 0;\
	pushl %esi; \
	CFI_ADJUST_CFA_OFFSET 4;\
	CFI_REL_OFFSET esi, 0;\
	pushl %edx; \
	CFI_ADJUST_CFA_OFFSET 4;\
	CFI_REL_OFFSET edx, 0;\
	pushl %ecx; \
	CFI_ADJUST_CFA_OFFSET 4;\
	CFI_REL_OFFSET ecx, 0;\
	pushl %ebx; \
	CFI_ADJUST_CFA_OFFSET 4;\
	CFI_REL_OFFSET ebx, 0;\
	movl $(__USER_DS), %edx; \
	movl %edx, %ds; \
	movl %edx, %es;

/*
 * RESTORE_INT_REGS: pop the seven general-purpose registers saved by
 * SAVE_ALL (%ebx, %ecx, %edx, %esi, %edi, %ebp, %eax), updating the CFI
 * state after each pop.  The segment registers are left on the stack.
 */
#define RESTORE_INT_REGS \
	popl %ebx;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	CFI_RESTORE ebx;\
	popl %ecx;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	CFI_RESTORE ecx;\
	popl %edx;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	CFI_RESTORE edx;\
	popl %esi;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	CFI_RESTORE esi;\
	popl %edi;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	CFI_RESTORE edi;\
	popl %ebp;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	CFI_RESTORE ebp;\
	popl %eax;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	CFI_RESTORE eax

/*
 * RESTORE_REGS: RESTORE_INT_REGS followed by popping %ds and %es.
 * Both segment pops are registered in __ex_table: if a pop faults, the
 * fixup code overwrites the offending stack slot with 0 and retries the
 * same pop.
 */
#define RESTORE_REGS	\
	RESTORE_INT_REGS; \
1:	popl %ds;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	/*CFI_RESTORE ds;*/\
2:	popl %es;	\
	CFI_ADJUST_CFA_OFFSET -4;\
	/*CFI_RESTORE es;*/\
.section .fixup,"ax";	\
3:	movl $0,(%esp);	\
	jmp 1b;		\
4:	movl $0,(%esp);	\
	jmp 2b;		\
.previous;		\
.section __ex_table,"a";\
	.align 4;	\
	.long 1b,3b;	\
	.long 2b,4b;	\
.previous

/*
 * CFI prologues describing the stack at the various entry points.
 *
 * RING0_INT_FRAME:    three words are on the stack; the CFA is %esp+3*4
 *                     and the return %eip is at CFA-3*4.
 * RING0_EC_FRAME:     as above but with one extra word on the stack
 *                     (used by the entry points that do not push a
 *                     dummy error code themselves); CFA is %esp+4*4.
 * RING0_PTREGS_FRAME: a full register frame laid out per the EBX..OLDSS
 *                     offsets is on the stack; every saved register is
 *                     described relative to the OLDESP slot.
 */
#define RING0_INT_FRAME \
	CFI_STARTPROC simple;\
	CFI_DEF_CFA esp, 3*4;\
	/*CFI_OFFSET cs, -2*4;*/\
	CFI_OFFSET eip, -3*4

#define RING0_EC_FRAME \
	CFI_STARTPROC simple;\
	CFI_DEF_CFA esp, 4*4;\
	/*CFI_OFFSET cs, -2*4;*/\
	CFI_OFFSET eip, -3*4

#define RING0_PTREGS_FRAME \
	CFI_STARTPROC simple;\
	CFI_DEF_CFA esp, OLDESP-EBX;\
	/*CFI_OFFSET cs, CS-OLDESP;*/\
	CFI_OFFSET eip, EIP-OLDESP;\
	/*CFI_OFFSET es, ES-OLDESP;*/\
	/*CFI_OFFSET ds, DS-OLDESP;*/\
	CFI_OFFSET eax, EAX-OLDESP;\
	CFI_OFFSET ebp, EBP-OLDESP;\
	CFI_OFFSET edi, EDI-OLDESP;\
	CFI_OFFSET esi, ESI-OLDESP;\
	CFI_OFFSET edx, EDX-OLDESP;\
	CFI_OFFSET ecx, ECX-OLDESP;\
	CFI_OFFSET ebx, EBX-OLDESP

/*
 * ret_from_fork: calls schedule_tail with %eax preserved across the call
 * (it is pushed before and popped after), loads the thread_info pointer
 * into %ebp, resets EFLAGS to 0x0202 and joins the normal system-call
 * exit path at syscall_exit.
 */
ENTRY(ret_from_fork)
	CFI_STARTPROC
	pushl %eax
	CFI_ADJUST_CFA_OFFSET 4
	call schedule_tail
	GET_THREAD_INFO(%ebp)
	popl %eax
	CFI_ADJUST_CFA_OFFSET -4
	pushl $0x0202			# Reset kernel eflags
	CFI_ADJUST_CFA_OFFSET 4
	popfl
	CFI_ADJUST_CFA_OFFSET -4
	jmp syscall_exit
	CFI_ENDPROC

/*
 * Return to user mode is not as complex as all this looks,
 * but we want the default path for a system call return to
 * go as quickly as possible which is why some of this is
 * less clear than it otherwise should be.
 */

/*
 * Common return path for exceptions (ret_from_exception) and interrupts
 * (ret_from_intr).  %ebp is loaded with the thread_info pointer, then the
 * saved EFLAGS.VM bit and the RPL bits of the saved CS decide whether we
 * are going back to the kernel (resume_kernel) or to user/v8086 mode
 * (resume_userspace).  resume_userspace branches to work_pending when any
 * _TIF_WORK_MASK flag is set and otherwise to restore_all.
 *
 * With CONFIG_PREEMPT, resume_kernel loops calling preempt_schedule_irq
 * while preempt_count is zero, _TIF_NEED_RESCHED is set and the
 * interrupted context had interrupts enabled.
 */
	# userspace resumption stub bypassing syscall exit tracing
	ALIGN
	RING0_PTREGS_FRAME
ret_from_exception:
	preempt_stop
ret_from_intr:
	GET_THREAD_INFO(%ebp)
check_userspace:
	movl EFLAGS(%esp), %eax		# mix EFLAGS and CS
	movb CS(%esp), %al
	andl $(VM_MASK | SEGMENT_RPL_MASK), %eax
	cmpl $USER_RPL, %eax
	jb resume_kernel		# not returning to v8086 or userspace
ENTRY(resume_userspace)
	DISABLE_INTERRUPTS		# make sure we don't miss an interrupt
					# setting need_resched or sigpending
					# between sampling and the iret
	movl TI_flags(%ebp), %ecx
	andl $_TIF_WORK_MASK, %ecx	# is there any work to be done on
					# int/exception return?
	jne work_pending
	jmp restore_all

#ifdef CONFIG_PREEMPT
ENTRY(resume_kernel)
	DISABLE_INTERRUPTS
	cmpl $0,TI_preempt_count(%ebp)	# non-zero preempt_count ?
	jnz restore_nocheck
need_resched:
	movl TI_flags(%ebp), %ecx	# need_resched set ?
	testb $_TIF_NEED_RESCHED, %cl
	jz restore_all
	testl $IF_MASK,EFLAGS(%esp)     # interrupts off (exception path) ?
	jz restore_all
	call preempt_schedule_irq
	jmp need_resched
#endif
	CFI_ENDPROC

/* SYSENTER_RETURN points to after the "sysenter" instruction in
   the vsyscall page.  See vsyscall-sysenter.S, which defines the symbol.  */

/*
 * sysenter_entry: the stack pointer is first replaced with the value
 * stored at TSS_sysenter_esp0(%esp).  A frame in the usual layout is then
 * built by hand: __USER_DS, %ebp (recorded in the CFI as the saved %esp),
 * EFLAGS, __USER_CS and thread_info->sysenter_return as the return
 * address.  The sixth argument is fetched from the address in %ebp, with
 * a range check and an __ex_table entry that both divert to
 * syscall_fault.  After the system call, if no _TIF_ALLWORK_MASK flag is
 * set, the return goes through ENABLE_INTERRUPTS_SYSEXIT with %edx = saved
 * EIP and %ecx = saved ESP; otherwise through syscall_exit_work.
 */
	# sysenter call handler stub
ENTRY(sysenter_entry)
	CFI_STARTPROC simple
	CFI_DEF_CFA esp, 0
	CFI_REGISTER esp, ebp
	movl TSS_sysenter_esp0(%esp),%esp
sysenter_past_esp:
	/*
	 * No need to follow this irqs on/off section: the syscall
	 * disabled irqs and here we enable it straight after entry:
	 */
	ENABLE_INTERRUPTS
	pushl $(__USER_DS)
	CFI_ADJUST_CFA_OFFSET 4
	/*CFI_REL_OFFSET ss, 0*/
	pushl %ebp
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET esp, 0
	pushfl
	CFI_ADJUST_CFA_OFFSET 4
	pushl $(__USER_CS)
	CFI_ADJUST_CFA_OFFSET 4
	/*CFI_REL_OFFSET cs, 0*/
	/*
	 * Push current_thread_info()->sysenter_return to the stack.
	 * A tiny bit of offset fixup is necessary - 4*4 means the 4 words
	 * pushed above; +8 corresponds to copy_thread's esp0 setting.
	 */
	pushl (TI_sysenter_return-THREAD_SIZE+8+4*4)(%esp)
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET eip, 0

/*
 * Load the potential sixth argument from user stack.
 * Careful about security.
 */
	cmpl $__PAGE_OFFSET-3,%ebp
	jae syscall_fault
1:	movl (%ebp),%ebp
.section __ex_table,"a"
	.align 4
	.long 1b,syscall_fault
.previous

	pushl %eax
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	GET_THREAD_INFO(%ebp)

	/* Note, _TIF_SECCOMP is bit number 8, and so it needs testw and not testb */
	testw $(_TIF_SYSCALL_EMU|_TIF_SYSCALL_TRACE|_TIF_SECCOMP|_TIF_SYSCALL_AUDIT),TI_flags(%ebp)
	jnz syscall_trace_entry
	cmpl $(nr_syscalls), %eax
	jae syscall_badsys
	call *sys_call_table(,%eax,4)
	movl %eax,EAX(%esp)
	DISABLE_INTERRUPTS
	TRACE_IRQS_OFF
	movl TI_flags(%ebp), %ecx
	testw $_TIF_ALLWORK_MASK, %cx
	jne syscall_exit_work
/* if something modifies registers it must also disable sysexit */
	movl EIP(%esp), %edx
	movl OLDESP(%esp), %ecx
	xorl %ebp,%ebp
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS_SYSEXIT
	CFI_ENDPROC


	# system call handler stub
/*
 * system_call: saves the system call number as orig_eax, builds the
 * register frame with SAVE_ALL and loads thread_info into %ebp.  If the
 * saved EFLAGS has TF set, _TIF_SINGLESTEP is recorded in TI_flags.
 * Traced/emulated/seccomp/audited calls divert to syscall_trace_entry;
 * out-of-range numbers divert to syscall_badsys.  The handler's return
 * value is stored into the EAX slot of the frame.
 *
 * restore_all inspects saved EFLAGS.VM, the TI bit of the saved SS and
 * the RPL of the saved CS; only the "user mode with an LDT stack segment"
 * combination takes the ldt_ss path, everything else returns through
 * restore_nocheck.  A fault on either INTERRUPT_RETURN is redirected via
 * __ex_table to iret_exc, which enters error_code with do_iret_error as
 * the handler.
 */
ENTRY(system_call)
	RING0_INT_FRAME			# can't unwind into user space anyway
	pushl %eax			# save orig_eax
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	GET_THREAD_INFO(%ebp)
	testl $TF_MASK,EFLAGS(%esp)
	jz no_singlestep
	orl $_TIF_SINGLESTEP,TI_flags(%ebp)
no_singlestep:
					# system call tracing in operation / emulation
	/* Note, _TIF_SECCOMP is bit number 8, and so it needs testw and not testb */
	testw $(_TIF_SYSCALL_EMU|_TIF_SYSCALL_TRACE|_TIF_SECCOMP|_TIF_SYSCALL_AUDIT),TI_flags(%ebp)
	jnz syscall_trace_entry
	cmpl $(nr_syscalls), %eax
	jae syscall_badsys
syscall_call:
	call *sys_call_table(,%eax,4)
	movl %eax,EAX(%esp)		# store the return value
syscall_exit:
	DISABLE_INTERRUPTS		# make sure we don't miss an interrupt
					# setting need_resched or sigpending
					# between sampling and the iret
	TRACE_IRQS_OFF
	movl TI_flags(%ebp), %ecx
	testw $_TIF_ALLWORK_MASK, %cx	# current->work
	jne syscall_exit_work

restore_all:
	movl EFLAGS(%esp), %eax		# mix EFLAGS, SS and CS
	# Warning: OLDSS(%esp) contains the wrong/random values if we
	# are returning to the kernel.
	# See comments in process.c:copy_thread() for details.
	movb OLDSS(%esp), %ah
	movb CS(%esp), %al
	andl $(VM_MASK | (SEGMENT_TI_MASK << 8) | SEGMENT_RPL_MASK), %eax
	cmpl $((SEGMENT_LDT << 8) | USER_RPL), %eax
	CFI_REMEMBER_STATE
	je ldt_ss			# returning to user-space with LDT SS
restore_nocheck:
	TRACE_IRQS_IRET
restore_nocheck_notrace:
	RESTORE_REGS
	addl $4, %esp
	CFI_ADJUST_CFA_OFFSET -4
1:	INTERRUPT_RETURN
.section .fixup,"ax"
iret_exc:
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS
	pushl $0			# no error code
	pushl $do_iret_error
	jmp error_code
.previous
.section __ex_table,"a"
	.align 4
	.long 1b,iret_exc
.previous

	CFI_RESTORE_STATE
ldt_ss:
	larl OLDSS(%esp), %eax
	jnz restore_nocheck
	testl $0x00400000, %eax		# returning to 32bit stack?
	jnz restore_nocheck		# all right, normal return
	/* If returning to userspace with 16bit stack,
	 * try to fix the higher word of ESP, as the CPU
	 * won't restore it.
	 * This is an "official" bug of all the x86-compatible
	 * CPUs, which we can try to work around to make
	 * dosemu and wine happy. */
	subl $8, %esp		# reserve space for switch16 pointer
	CFI_ADJUST_CFA_OFFSET 8
	DISABLE_INTERRUPTS
	TRACE_IRQS_OFF
	movl %esp, %eax
	/* Set up the 16bit stack frame with switch32 pointer on top,
	 * and a switch16 pointer on top of the current frame. */
	call setup_x86_bogus_stack
	CFI_ADJUST_CFA_OFFSET -8	# frame has moved
	TRACE_IRQS_IRET
	RESTORE_REGS
	lss 20+4(%esp), %esp	# switch to 16bit stack
1:	INTERRUPT_RETURN
.section __ex_table,"a"
	.align 4
	.long 1b,iret_exc
.previous
	CFI_ENDPROC

	# perform work that needs to be done immediately before resumption
/*
 * Entered with the (masked) TI_flags in %ecx and thread_info in %ebp.
 *
 * work_pending/work_resched: call schedule while _TIF_NEED_RESCHED is
 *	set, re-reading TI_flags with interrupts disabled after each call.
 * work_notifysig: call do_notify_resume with %eax = frame pointer and
 *	%edx = 0; a frame with EFLAGS.VM set is first passed through
 *	save_v86_state (CONFIG_VM86 only), whose return value becomes the
 *	new %esp.
 * syscall_trace_entry: do_syscall_trace with %edx = 0 before the call is
 *	dispatched; the EAX slot is preset to -ENOSYS.
 * syscall_exit_work: do_syscall_trace with %edx = 1 after the call, when
 *	trace/audit/singlestep flags are set; otherwise falls back to
 *	work_pending.
 */
	ALIGN
	RING0_PTREGS_FRAME		# can't unwind into user space anyway
work_pending:
	testb $_TIF_NEED_RESCHED, %cl
	jz work_notifysig
work_resched:
	call schedule
	DISABLE_INTERRUPTS		# make sure we don't miss an interrupt
					# setting need_resched or sigpending
					# between sampling and the iret
	TRACE_IRQS_OFF
	movl TI_flags(%ebp), %ecx
	andl $_TIF_WORK_MASK, %ecx	# is there any work to be done other
					# than syscall tracing?
	jz restore_all
	testb $_TIF_NEED_RESCHED, %cl
	jnz work_resched

work_notifysig:				# deal with pending signals and
					# notify-resume requests
	testl $VM_MASK, EFLAGS(%esp)
	movl %esp, %eax
	jne work_notifysig_v86		# returning to kernel-space or
					# vm86-space
	xorl %edx, %edx
	call do_notify_resume
	jmp resume_userspace_sig

	ALIGN
work_notifysig_v86:
#ifdef CONFIG_VM86
	pushl %ecx			# save ti_flags for do_notify_resume
	CFI_ADJUST_CFA_OFFSET 4
	call save_v86_state		# %eax contains pt_regs pointer
	popl %ecx
	CFI_ADJUST_CFA_OFFSET -4
	movl %eax, %esp
	xorl %edx, %edx
	call do_notify_resume
	jmp resume_userspace_sig
#endif

	# perform syscall entry tracing
	ALIGN
syscall_trace_entry:
	movl $-ENOSYS,EAX(%esp)
	movl %esp, %eax
	xorl %edx,%edx
	call do_syscall_trace
	cmpl $0, %eax
	jne resume_userspace		# ret != 0 -> running under PTRACE_SYSEMU,
					# so must skip actual syscall
	movl ORIG_EAX(%esp), %eax
	cmpl $(nr_syscalls), %eax
	jnae syscall_call
	jmp syscall_exit

	# perform syscall exit tracing
	ALIGN
syscall_exit_work:
	testb $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SINGLESTEP), %cl
	jz work_pending
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS		# could let do_syscall_trace() call
					# schedule() instead
	movl %esp, %eax
	movl $1, %edx
	call do_syscall_trace
	jmp resume_userspace
	CFI_ENDPROC

	/*
	 * syscall_fault: reached from sysenter_entry when the sixth
	 * argument cannot be read; it builds the register frame itself and
	 * returns -EFAULT.
	 * syscall_badsys: reached with the frame already built when the
	 * system call number is out of range; returns -ENOSYS.
	 * Both store the error in the EAX slot and leave via
	 * resume_userspace.
	 */
	RING0_INT_FRAME			# can't unwind into user space anyway
syscall_fault:
	pushl %eax			# save orig_eax
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	GET_THREAD_INFO(%ebp)
	movl $-EFAULT,EAX(%esp)
	jmp resume_userspace

syscall_badsys:
	movl $-ENOSYS,EAX(%esp)
	jmp resume_userspace
	CFI_ENDPROC

/*
 * FIXUP_ESPFIX_STACK: leave the 16bit stack.  The current %esp is passed
 * in %eax, %ss:%esp is reloaded from the far pointer stored at
 * %ss:CPU_16BIT_STACK_SIZE-8, fixup_x86_bogus_stack is called, and its
 * return value in %eax becomes the new %esp.  Clobbers %eax.
 *
 * UNWIND_ESPFIX_STACK: if %ss is __ESPFIX_SS, load __KERNEL_DS into %ds
 * and %es and run FIXUP_ESPFIX_STACK (placed out of line in .fixup);
 * otherwise do nothing.  A temporary copy of %eax is pushed around the
 * check and popped again at label 27.
 */
#define FIXUP_ESPFIX_STACK \
	movl %esp, %eax; \
	/* switch to 32bit stack using the pointer on top of 16bit stack */ \
	lss %ss:CPU_16BIT_STACK_SIZE-8, %esp; \
	/* copy data from 16bit stack to 32bit stack */ \
	call fixup_x86_bogus_stack; \
	/* put ESP to the proper location */ \
	movl %eax, %esp;
#define UNWIND_ESPFIX_STACK \
	pushl %eax; \
	CFI_ADJUST_CFA_OFFSET 4; \
	movl %ss, %eax; \
	/* see if on 16bit stack */ \
	cmpw $__ESPFIX_SS, %ax; \
	je 28f; \
27:	popl %eax; \
	CFI_ADJUST_CFA_OFFSET -4; \
.section .fixup,"ax"; \
28:	movl $__KERNEL_DS, %eax; \
	movl %eax, %ds; \
	movl %eax, %es; \
	/* switch to 32bit stack */ \
	FIXUP_ESPFIX_STACK; \
	jmp 27b; \
.previous

/*
 * Build the entry stubs and pointer table with
 * some assembler magic.
 *
 * For each of the NR_IRQS vectors the .rept body emits a stub in .text
 * that pushes ~vector and jumps to common_interrupt, and appends the
 * stub's address to the "interrupt" table in .data.  The conditional
 * CFI_ADJUST_CFA_OFFSET -4 undoes the previous stub's +4 so that every
 * stub starts from the same CFI state.
 */
.data
ENTRY(interrupt)
.text

vector=0
ENTRY(irq_entries_start)
	RING0_INT_FRAME
.rept NR_IRQS
	ALIGN
 .if vector
	CFI_ADJUST_CFA_OFFSET -4
 .endif
1:	pushl $~(vector)
	CFI_ADJUST_CFA_OFFSET 4
	jmp common_interrupt
.data
	.long 1b
.text
vector=vector+1
.endr

/*
 * the CPU automatically disables interrupts when executing an IRQ vector,
 * so IRQ-flags tracing has to follow that:
 */
	ALIGN
common_interrupt:
	SAVE_ALL
	TRACE_IRQS_OFF
	movl %esp,%eax
	call do_IRQ
	jmp ret_from_intr
	CFI_ENDPROC

/*
 * BUILD_INTERRUPT(name, nr): emit a global entry point "name" that pushes
 * ~nr, saves all registers, and calls smp_<name> with %eax pointing at
 * the saved register frame, then returns through ret_from_intr.
 *
 * The "smp_" and "name" tokens are joined with an empty comment.
 * NOTE(review): this relies on the preprocessor mode used for this file -
 * confirm before changing build flags.
 *
 * TRACE_IRQS_OFF is followed by an explicit ';' so the next instruction
 * is a separate statement whatever TRACE_IRQS_OFF expands to.
 */
#define BUILD_INTERRUPT(name, nr)	\
ENTRY(name)				\
	RING0_INT_FRAME;		\
	pushl $~(nr);			\
	CFI_ADJUST_CFA_OFFSET 4;	\
	SAVE_ALL;			\
	TRACE_IRQS_OFF;			\
	movl %esp,%eax;			\
	call smp_/**/name;		\
	jmp ret_from_intr;		\
	CFI_ENDPROC

/* The include is where all of the SMP etc. interrupts come from */
#include "entry_arch.h"

/*
 * page_fault pushes the address of do_page_fault and falls into
 * error_code, the common tail shared by the exception stubs in this file.
 *
 * On entry to error_code the top of the stack holds the handler address
 * and, below it, the error code.  The registers are pushed so that the
 * frame matches the EBX..OLDSS layout: the handler address ends up in the
 * ES slot and the error code in the ORIG_EAX slot.  They are read out
 * into %edi and %edx, after which ORIG_EAX is overwritten with -1 and
 * the ES slot with the real %es value.  %ds and %es are loaded with
 * __USER_DS and the handler is called with %eax = frame pointer and
 * %edx = error code.  Return is through ret_from_exception.
 */
KPROBE_ENTRY(page_fault)
	RING0_EC_FRAME
	pushl $do_page_fault
	CFI_ADJUST_CFA_OFFSET 4
	ALIGN
error_code:
	pushl %ds
	CFI_ADJUST_CFA_OFFSET 4
	/*CFI_REL_OFFSET ds, 0*/
	pushl %eax
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET eax, 0
	xorl %eax, %eax
	pushl %ebp
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET ebp, 0
	pushl %edi
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET edi, 0
	pushl %esi
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET esi, 0
	pushl %edx
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET edx, 0
	decl %eax			# eax = -1
	pushl %ecx
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET ecx, 0
	pushl %ebx
	CFI_ADJUST_CFA_OFFSET 4
	CFI_REL_OFFSET ebx, 0
	cld
	pushl %es
	CFI_ADJUST_CFA_OFFSET 4
	/*CFI_REL_OFFSET es, 0*/
	UNWIND_ESPFIX_STACK
	popl %ecx
	CFI_ADJUST_CFA_OFFSET -4
	/*CFI_REGISTER es, ecx*/
	movl ES(%esp), %edi		# get the function address
	movl ORIG_EAX(%esp), %edx	# get the error code
	movl %eax, ORIG_EAX(%esp)
	movl %ecx, ES(%esp)
	/*CFI_REL_OFFSET es, ES*/
	movl $(__USER_DS), %ecx
	movl %ecx, %ds
	movl %ecx, %es
	movl %esp,%eax			# pt_regs pointer
	call *%edi
	jmp ret_from_exception
	CFI_ENDPROC
KPROBE_END(page_fault)

/*
 * Entry stub: push a zero error code and the address of
 * do_coprocessor_error, then join the common error_code path.
 */
ENTRY(coprocessor_error)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_coprocessor_error
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub: push a zero error code and the address of
 * do_simd_coprocessor_error, then join the common error_code path.
 */
ENTRY(simd_coprocessor_error)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_simd_coprocessor_error
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * device_not_available: builds a full register frame with -1 in the
 * orig_eax slot, then tests bit 2 (EM) of CR0.  With EM clear it calls
 * math_state_restore; with EM set it calls math_emulate with one extra
 * zero word pushed on the stack, which is discarded afterwards.  Both
 * paths return through ret_from_exception.
 */
ENTRY(device_not_available)
	RING0_INT_FRAME
	pushl $-1			# mark this as an int
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	GET_CR0_INTO_EAX
	testl $0x4, %eax		# EM (math emulation bit)
	jne device_not_available_emulate
	preempt_stop
	call math_state_restore
	jmp ret_from_exception
device_not_available_emulate:
	pushl $0			# temporary storage for ORIG_EIP
	CFI_ADJUST_CFA_OFFSET 4
	call math_emulate
	addl $4, %esp
	CFI_ADJUST_CFA_OFFSET -4
	jmp ret_from_exception
	CFI_ENDPROC

/*
 * Debug traps and NMI can happen at the one SYSENTER instruction
 * that sets up the real kernel stack. Check here, since we can't
 * allow the wrong stack to be used.
 *
 * "TSS_sysenter_esp0+12" is because the NMI/debug handler will have
 * already pushed 3 words if it hits on the sysenter instruction:
 * eflags, cs and eip.
 *
 * We just load the right stack, and push the three (known) values
 * by hand onto the new stack - while updating the return eip past
 * the instruction that would have done it for sysenter.
 *
 * Macro arguments:
 *   offset - number of bytes already pushed on the wrong stack, added
 *            to TSS_sysenter_esp0 when locating the real stack pointer
 *   ok     - label to branch to when the saved CS is not __KERNEL_CS
 *            (nothing to fix)
 *   label  - label emitted on the instruction that switches stacks
 */
#define FIX_STACK(offset, ok, label)		\
	cmpw $__KERNEL_CS,4(%esp);		\
	jne ok;					\
label:						\
	movl TSS_sysenter_esp0+offset(%esp),%esp;	\
	CFI_DEF_CFA esp, 0;			\
	CFI_UNDEFINED eip;			\
	pushfl;					\
	CFI_ADJUST_CFA_OFFSET 4;		\
	pushl $__KERNEL_CS;			\
	CFI_ADJUST_CFA_OFFSET 4;		\
	pushl $sysenter_past_esp;		\
	CFI_ADJUST_CFA_OFFSET 4;		\
	CFI_REL_OFFSET eip, 0

/*
 * debug: if the saved return address is exactly sysenter_entry, the stack
 * is first repaired with FIX_STACK (the stack-switching instruction gets
 * the label debug_esp_fix_insn, which the NMI handler compares against).
 * Then a full frame with -1 in the orig_eax slot is built and do_debug is
 * called with %eax = frame pointer and %edx = 0.
 */
KPROBE_ENTRY(debug)
	RING0_INT_FRAME
	cmpl $sysenter_entry,(%esp)
	jne debug_stack_correct
	FIX_STACK(12, debug_stack_correct, debug_esp_fix_insn)
debug_stack_correct:
	pushl $-1			# mark this as an int
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	xorl %edx,%edx			# error code 0
	movl %esp,%eax			# pt_regs pointer
	call do_debug
	jmp ret_from_exception
	CFI_ENDPROC
KPROBE_END(debug)

/*
 * NMI is doubly nasty. It can happen _while_ we're handling
 * a debug fault, and the debug fault hasn't yet been able to
 * clear up the stack. So we first check whether we got an
 * NMI on the sysenter entry path, but after that we need to
 * check whether we got an NMI on the debug path where the debug
 * fault happened on the sysenter path.
 *
 * Paths below:
 *   nmi_16bit_stack       - %ss is __ESPFIX_SS: build a far pointer back
 *                           to the 16bit stack, copy the 12-byte iret
 *                           frame, handle the NMI and return with lss+iret.
 *   nmi_stack_fixup       - return address is sysenter_entry: FIX_STACK
 *                           with 12 bytes already pushed.
 *   nmi_debug_stack_check - a second frame whose return address is
 *                           sysenter_entry lies 12 bytes up and the NMI hit
 *                           between debug and debug_esp_fix_insn:
 *                           FIX_STACK with 24 bytes already pushed.
 *   nmi_stack_correct     - normal case: build the frame, call do_nmi and
 *                           return via restore_nocheck_notrace.
 */
KPROBE_ENTRY(nmi)
	RING0_INT_FRAME
	pushl %eax
	CFI_ADJUST_CFA_OFFSET 4
	movl %ss, %eax
	cmpw $__ESPFIX_SS, %ax
	popl %eax
	CFI_ADJUST_CFA_OFFSET -4
	je nmi_16bit_stack
	cmpl $sysenter_entry,(%esp)
	je nmi_stack_fixup
	pushl %eax
	CFI_ADJUST_CFA_OFFSET 4
	movl %esp,%eax
	/* Do not access memory above the end of our stack page,
	 * it might not exist.
	 */
	andl $(THREAD_SIZE-1),%eax
	cmpl $(THREAD_SIZE-20),%eax
	popl %eax
	CFI_ADJUST_CFA_OFFSET -4
	jae nmi_stack_correct
	cmpl $sysenter_entry,12(%esp)
	je nmi_debug_stack_check
nmi_stack_correct:
	/* We have a RING0_INT_FRAME here */
	pushl %eax
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	xorl %edx,%edx		# zero error code
	movl %esp,%eax		# pt_regs pointer
	call do_nmi
	jmp restore_nocheck_notrace
	CFI_ENDPROC

nmi_stack_fixup:
	RING0_INT_FRAME
	FIX_STACK(12,nmi_stack_correct, 1)
	jmp nmi_stack_correct

nmi_debug_stack_check:
	/* We have a RING0_INT_FRAME here */
	cmpw $__KERNEL_CS,16(%esp)
	jne nmi_stack_correct
	cmpl $debug,(%esp)
	jb nmi_stack_correct
	cmpl $debug_esp_fix_insn,(%esp)
	ja nmi_stack_correct
	FIX_STACK(24,nmi_stack_correct, 1)
	jmp nmi_stack_correct

nmi_16bit_stack:
	/* We have a RING0_INT_FRAME here.
	 *
	 * create the pointer to lss back
	 */
	pushl %ss
	CFI_ADJUST_CFA_OFFSET 4
	pushl %esp
	CFI_ADJUST_CFA_OFFSET 4
	movzwl %sp, %esp
	addw $4, (%esp)
	/* copy the iret frame of 12 bytes */
	.rept 3
	pushl 16(%esp)
	CFI_ADJUST_CFA_OFFSET 4
	.endr
	pushl %eax
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	FIXUP_ESPFIX_STACK		# %eax == %esp
	CFI_ADJUST_CFA_OFFSET -20	# the frame has now moved
	xorl %edx,%edx			# zero error code
	call do_nmi
	RESTORE_REGS
	lss 12+4(%esp), %esp		# back to 16bit stack
1:	INTERRUPT_RETURN
	CFI_ENDPROC
.section __ex_table,"a"
	.align 4
	.long 1b,iret_exc
.previous
KPROBE_END(nmi)

/*
 * int3: build a full frame with -1 in the orig_eax slot and call do_int3
 * with %eax = frame pointer and %edx = 0; return via ret_from_exception.
 */
KPROBE_ENTRY(int3)
	RING0_INT_FRAME
	pushl $-1			# mark this as an int
	CFI_ADJUST_CFA_OFFSET 4
	SAVE_ALL
	xorl %edx,%edx		# zero error code
	movl %esp,%eax		# pt_regs pointer
	call do_int3
	jmp ret_from_exception
	CFI_ENDPROC
KPROBE_END(int3)

/*
 * Entry stub: push a zero error code and the address of do_overflow,
 * then join the common error_code path.
 */
ENTRY(overflow)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_overflow
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub: push a zero error code and the address of do_bounds,
 * then join the common error_code path.
 */
ENTRY(bounds)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_bounds
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub: push a zero error code and the address of do_invalid_op,
 * then join the common error_code path.
 */
ENTRY(invalid_op)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_invalid_op
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub: push a zero error code and the address of
 * do_coprocessor_segment_overrun, then join the common error_code path.
 */
ENTRY(coprocessor_segment_overrun)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_coprocessor_segment_overrun
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub using RING0_EC_FRAME (no dummy error code is pushed here):
 * push the address of do_invalid_TSS and join the common error_code path.
 */
ENTRY(invalid_TSS)
	RING0_EC_FRAME
	pushl $do_invalid_TSS
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub using RING0_EC_FRAME (no dummy error code is pushed here):
 * push the address of do_segment_not_present and join the common
 * error_code path.
 */
ENTRY(segment_not_present)
	RING0_EC_FRAME
	pushl $do_segment_not_present
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub using RING0_EC_FRAME (no dummy error code is pushed here):
 * push the address of do_stack_segment and join the common error_code
 * path.
 */
ENTRY(stack_segment)
	RING0_EC_FRAME
	pushl $do_stack_segment
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub using RING0_EC_FRAME (no dummy error code is pushed here):
 * push the address of do_general_protection and join the common
 * error_code path.
 */
KPROBE_ENTRY(general_protection)
	RING0_EC_FRAME
	pushl $do_general_protection
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC
KPROBE_END(general_protection)

/*
 * Entry stub using RING0_EC_FRAME (no dummy error code is pushed here):
 * push the address of do_alignment_check and join the common error_code
 * path.
 */
ENTRY(alignment_check)
	RING0_EC_FRAME
	pushl $do_alignment_check
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub: push a zero error code and the address of do_divide_error,
 * then join the common error_code path.
 */
ENTRY(divide_error)
	RING0_INT_FRAME
	pushl $0			# no error code
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_divide_error
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * Entry stub (CONFIG_X86_MCE only): push a zero error code and then the
 * value stored in machine_check_vector - a memory operand, not the
 * address of a fixed handler - and join the common error_code path.
 */
#ifdef CONFIG_X86_MCE
ENTRY(machine_check)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl machine_check_vector
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC
#endif

/*
 * Entry stub: push a zero error code and the address of
 * do_spurious_interrupt_bug, then join the common error_code path.
 */
ENTRY(spurious_interrupt_bug)
	RING0_INT_FRAME
	pushl $0
	CFI_ADJUST_CFA_OFFSET 4
	pushl $do_spurious_interrupt_bug
	CFI_ADJUST_CFA_OFFSET 4
	jmp error_code
	CFI_ENDPROC

/*
 * arch_unwind_init_running (CONFIG_STACK_UNWIND only).
 *
 * Stack on entry: (%esp) return address, 4(%esp) pointer to a register
 * save area laid out per the EBX..OLDSS offsets, 8(%esp) address to jump
 * to, 12(%esp) one further word.
 * NOTE(review): presumably these are the C arguments (regs, callback,
 * arg) - confirm against the prototype.
 *
 * The save area is filled so that it describes the caller's state:
 * %ebx, %esi, %edi and %ebp are stored as they are; ECX, EDX, EAX,
 * ORIG_EAX and EFLAGS are zeroed; EIP is the return address; OLDESP is
 * the address of 4(%esp); DS/ES are __USER_DS, CS is __KERNEL_CS and
 * OLDSS is __KERNEL_DS.  Finally the word at 12(%esp) is moved down to
 * 8(%esp), %ebx is reloaded and control is transferred with a jump (not
 * a call) to the address originally at 8(%esp).
 */
#ifdef CONFIG_STACK_UNWIND
ENTRY(arch_unwind_init_running)
	CFI_STARTPROC
	movl	4(%esp), %edx
	movl	(%esp), %ecx
	leal	4(%esp), %eax
	movl	%ebx, EBX(%edx)
	xorl	%ebx, %ebx
	movl	%ebx, ECX(%edx)
	movl	%ebx, EDX(%edx)
	movl	%esi, ESI(%edx)
	movl	%edi, EDI(%edx)
	movl	%ebp, EBP(%edx)
	movl	%ebx, EAX(%edx)
	movl	$__USER_DS, DS(%edx)
	movl	$__USER_DS, ES(%edx)
	movl	%ebx, ORIG_EAX(%edx)
	movl	%ecx, EIP(%edx)
	movl	12(%esp), %ecx
	movl	$__KERNEL_CS, CS(%edx)
	movl	%ebx, EFLAGS(%edx)
	movl	%eax, OLDESP(%edx)
	movl	8(%esp), %eax
	movl	%ecx, 8(%esp)
	movl	EBX(%edx), %ebx
	movl	$__KERNEL_DS, OLDSS(%edx)
	jmpl	*%eax
	CFI_ENDPROC
ENDPROC(arch_unwind_init_running)
#endif

/*
 * kernel_thread_helper: entered with a function pointer in %ebx and its
 * argument in %edx.  A zero is pushed as a fake return address for the
 * unwinder, the argument is placed both in %eax and on the stack, and the
 * function is called.  Its return value is then pushed and do_exit is
 * called.  No code follows that call, so do_exit is presumably expected
 * not to return.
 */
ENTRY(kernel_thread_helper)
	pushl $0		# fake return address for unwinder
	CFI_STARTPROC
	movl %edx,%eax
	push %edx
	CFI_ADJUST_CFA_OFFSET 4
	call *%ebx
	push %eax
	CFI_ADJUST_CFA_OFFSET 4
	call do_exit
	CFI_ENDPROC
ENDPROC(kernel_thread_helper)

/*
 * The system call table is pulled in from syscall_table.S and placed in
 * .rodata.  syscall_table_size is the distance in bytes from
 * sys_call_table to the end of the included table; nr_syscalls divides
 * it by 4.
 */
.section .rodata,"a"
#include "syscall_table.S"

syscall_table_size=(.-sys_call_table)