blob: 6aa6932e21b172283e0a604d2391782776ed7629 [file] [log] [blame]
/*
 *  linux/arch/x86_64/entry.S
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *  Copyright (C) 2000, 2001, 2002  Andi Kleen SuSE Labs
 *  Copyright (C) 2000  Pavel Machek <pavel@suse.cz>
 */
8
/*
 * entry.S contains the system-call and fault low-level handling routines.
 *
 * NOTE: This code handles signal-recognition, which happens every time
 * after an interrupt and after each system call.
 *
 * Normal syscalls and interrupts don't save a full stack frame, this is
 * only done for syscall tracing, signals or fork/exec et al.
 *
 * A note on terminology:
 * - top of stack: Architecture defined interrupt frame from SS to RIP
 *   at the top of the kernel process stack.
 * - partial stack frame: partially saved registers up to R11.
 * - full stack frame: Like partial stack frame, but all registers saved.
 *
 * Some macro usage:
 * - CFI macros are used to generate dwarf2 unwind information for better
 *   backtraces. They don't change any code.
 * - SAVE_ALL/RESTORE_ALL - Save/restore all registers
 * - SAVE_ARGS/RESTORE_ARGS - Save/restore registers that C functions modify.
 *   There are unfortunately lots of special cases where some registers
 *   are not touched. The macro is a big mess that should be cleaned up.
 * - SAVE_REST/RESTORE_REST - Handle the registers not saved by SAVE_ARGS.
 *   Gives a full stack frame.
 * - ENTRY/END Define functions in the symbol table.
 * - FIXUP_TOP_OF_STACK/RESTORE_TOP_OF_STACK - Fix up the hardware stack
 *   frame that is otherwise undefined after a SYSCALL
 * - TRACE_IRQ_* - Trace hard interrupt state for lock debugging.
 * - errorentry/paranoidentry/zeroentry - Define exception entry points.
 */
39
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#include <linux/linkage.h>
41#include <asm/segment.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#include <asm/cache.h>
43#include <asm/errno.h>
44#include <asm/dwarf2.h>
45#include <asm/calling.h>
Sam Ravnborge2d5df92005-09-09 21:28:48 +020046#include <asm/asm-offsets.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070047#include <asm/msr.h>
48#include <asm/unistd.h>
49#include <asm/thread_info.h>
50#include <asm/hw_irq.h>
Andi Kleen5f8efbb2006-01-16 01:56:39 +010051#include <asm/page.h>
Ingo Molnar2601e642006-07-03 00:24:45 -070052#include <asm/irqflags.h>
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +010053#include <asm/paravirt.h>
Abhishek Sagar395a59d2008-06-21 23:47:27 +053054#include <asm/ftrace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070055
56 .code64
57
Arnaldo Carvalho de Melo16444a82008-05-12 21:20:42 +020058#ifdef CONFIG_FTRACE
Steven Rostedtd61f82d2008-05-12 21:20:43 +020059#ifdef CONFIG_DYNAMIC_FTRACE
/*
 * mcount (CONFIG_DYNAMIC_FTRACE variant).
 *
 * Spills rax, rcx, rdx, rsi, rdi, r8 and r9 into a 0x38-byte stack area,
 * makes the call at mcount_call, reloads the same registers and returns.
 *
 * Arg to the callee:
 *   rdi = return address of this mcount call (found at 0x38(%rsp) once the
 *         save area has been carved out) minus MCOUNT_INSN_SIZE.
 *
 * mcount_call is exported; presumably so the call target can be rewritten
 * at run time -- NOTE(review): confirm against the ftrace C code.
 */
ENTRY(mcount)

	/* carve out the save area: 7 registers * 8 bytes */
	subq	$0x38, %rsp
	movq	%rax, (%rsp)
	movq	%rcx, 8(%rsp)
	movq	%rdx, 16(%rsp)
	movq	%rsi, 24(%rsp)
	movq	%rdi, 32(%rsp)
	movq	%r8, 40(%rsp)
	movq	%r9, 48(%rsp)

	/* rdi = our own return address, backed up by MCOUNT_INSN_SIZE */
	movq	0x38(%rsp), %rdi
	subq	$MCOUNT_INSN_SIZE, %rdi

.globl mcount_call
mcount_call:
	call	ftrace_stub

	/* reload everything spilled above and release the save area */
	movq	48(%rsp), %r9
	movq	40(%rsp), %r8
	movq	32(%rsp), %rdi
	movq	24(%rsp), %rsi
	movq	16(%rsp), %rdx
	movq	8(%rsp), %rcx
	movq	(%rsp), %rax
	addq	$0x38, %rsp

	retq
END(mcount)
89
/*
 * ftrace_caller (CONFIG_DYNAMIC_FTRACE).
 *
 * Same register spill/reload sequence as mcount, but passes two arguments
 * to the call at ftrace_call:
 *   rdi = our return address (0x38(%rsp)) minus MCOUNT_INSN_SIZE
 *   rsi = the quadword at 8(%rbp); presumably the traced function's own
 *         return address, assuming %rbp is a frame pointer -- TODO confirm.
 *
 * ftrace_stub is the bare "retq" at the tail and is also exported.
 */
ENTRY(ftrace_caller)

	/* register save sequence taken from glibc */
	subq	$0x38, %rsp
	movq	%rax, (%rsp)
	movq	%rcx, 8(%rsp)
	movq	%rdx, 16(%rsp)
	movq	%rsi, 24(%rsp)
	movq	%rdi, 32(%rsp)
	movq	%r8, 40(%rsp)
	movq	%r9, 48(%rsp)

	/* build the two arguments */
	movq	0x38(%rsp), %rdi
	movq	8(%rbp), %rsi
	subq	$MCOUNT_INSN_SIZE, %rdi

.globl ftrace_call
ftrace_call:
	call	ftrace_stub

	/* reload everything spilled above and release the save area */
	movq	48(%rsp), %r9
	movq	40(%rsp), %r8
	movq	32(%rsp), %rdi
	movq	24(%rsp), %rsi
	movq	16(%rsp), %rdx
	movq	8(%rsp), %rcx
	movq	(%rsp), %rax
	addq	$0x38, %rsp

	/* execution falls through into the stub, which just returns */
.globl ftrace_stub
ftrace_stub:
	retq
END(ftrace_caller)
123
124#else /* ! CONFIG_DYNAMIC_FTRACE */
/*
 * mcount (static ftrace, !CONFIG_DYNAMIC_FTRACE).
 *
 * Fast path: when ftrace_trace_function still holds the address of
 * ftrace_stub, return immediately through the stub.
 *
 * Slow path (label "trace"): spill rax, rcx, rdx, rsi, rdi, r8, r9, call
 * through ftrace_trace_function with
 *   rdi = our return address (0x38(%rsp)) minus MCOUNT_INSN_SIZE
 *   rsi = the quadword at 8(%rbp); presumably the traced function's own
 *         return address, assuming %rbp is a frame pointer -- TODO confirm
 * then reload the registers and leave through ftrace_stub.
 */
ENTRY(mcount)
	cmpq	$ftrace_stub, ftrace_trace_function
	jnz	trace
.globl ftrace_stub
ftrace_stub:
	retq

trace:
	/* register save sequence taken from glibc */
	subq	$0x38, %rsp
	movq	%rax, (%rsp)
	movq	%rcx, 8(%rsp)
	movq	%rdx, 16(%rsp)
	movq	%rsi, 24(%rsp)
	movq	%rdi, 32(%rsp)
	movq	%r8, 40(%rsp)
	movq	%r9, 48(%rsp)

	/* build the two arguments */
	movq	0x38(%rsp), %rdi
	movq	8(%rbp), %rsi
	subq	$MCOUNT_INSN_SIZE, %rdi

	call	*ftrace_trace_function

	/* reload everything spilled above and release the save area */
	movq	48(%rsp), %r9
	movq	40(%rsp), %r8
	movq	32(%rsp), %rdi
	movq	24(%rsp), %rsi
	movq	16(%rsp), %rdx
	movq	8(%rsp), %rcx
	movq	(%rsp), %rax
	addq	$0x38, %rsp

	jmp	ftrace_stub
END(mcount)
Steven Rostedtd61f82d2008-05-12 21:20:43 +0200160#endif /* CONFIG_DYNAMIC_FTRACE */
161#endif /* CONFIG_FTRACE */
Arnaldo Carvalho de Melo16444a82008-05-12 21:20:42 +0200162
/*
 * Without CONFIG_PREEMPT there is no separate retint_kernel code path in
 * this file; the name is aliased to retint_restore_args instead.
 */
#if !defined(CONFIG_PREEMPT)
#define retint_kernel retint_restore_args
#endif
Ingo Molnar2601e642006-07-03 00:24:45 -0700166
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100167#ifdef CONFIG_PARAVIRT
/*
 * native_usergs_sysret64: swap the GS base with swapgs, then return with
 * sysretq.  Only built under CONFIG_PARAVIRT.
 *
 * Control never falls out of the bottom: sysretq does not return here.
 * The symbol is closed with END() like every other ENTRY() in this file,
 * so that it gets a size in the symbol table.
 */
ENTRY(native_usergs_sysret64)
	swapgs
	sysretq
END(native_usergs_sysret64)
171#endif /* CONFIG_PARAVIRT */
172
Ingo Molnar2601e642006-07-03 00:24:45 -0700173
/*
 * TRACE_IRQS_IRETQ offset=ARGOFFSET
 *
 * Expands to nothing unless CONFIG_TRACE_IRQFLAGS is set.  Otherwise it
 * tests bit 9 of the saved EFLAGS image at EFLAGS-\offset(%rsp) and runs
 * TRACE_IRQS_ON only when that bit is set; with the bit clear the branch
 * skips it.  The bt instruction modifies the flags register.
 */
.macro TRACE_IRQS_IRETQ offset=ARGOFFSET
#ifdef CONFIG_TRACE_IRQFLAGS
	bt	$9,EFLAGS-\offset(%rsp)		/* interrupts off? */
	jnc	1f
	TRACE_IRQS_ON
1:
#endif
.endm
182
/*
 * C code is not supposed to know about undefined top of stack. Every time
 * a C function with a pt_regs argument is called from the SYSCALL based
 * fast path FIXUP_TOP_OF_STACK is needed.
 * RESTORE_TOP_OF_STACK syncs the syscall state after any possible ptregs
 * manipulation.
 */

/*
 * FIXUP_TOP_OF_STACK tmp
 *
 * %rsp: at FRAMEEND.  \tmp is a scratch register and is overwritten.
 * Fills in the frame slots as follows:
 *   RSP    <- %gs:pda_oldrsp
 *   SS     <- __USER_DS
 *   CS     <- __USER_CS
 *   RCX    <- -1
 *   EFLAGS <- copy of the R11 slot
 */
	.macro FIXUP_TOP_OF_STACK tmp
	movq	%gs:pda_oldrsp,\tmp
	movq	\tmp,RSP(%rsp)
	movq	$__USER_DS,SS(%rsp)
	movq	$__USER_CS,CS(%rsp)
	movq	$-1,RCX(%rsp)
	movq	R11(%rsp),\tmp		/* get eflags */
	movq	\tmp,EFLAGS(%rsp)
	.endm
201
/*
 * RESTORE_TOP_OF_STACK tmp,offset=0
 *
 * Copies two frame slots back out, using \tmp as scratch:
 *   %gs:pda_oldrsp <- RSP slot
 *   R11 slot       <- EFLAGS slot
 * \offset is subtracted from every slot offset, for callers whose %rsp is
 * not at the start of the frame.
 */
	.macro RESTORE_TOP_OF_STACK tmp,offset=0
	movq	RSP-\offset(%rsp),\tmp
	movq	\tmp,%gs:pda_oldrsp
	movq	EFLAGS-\offset(%rsp),\tmp
	movq	\tmp,R11-\offset(%rsp)
	.endm
208
/*
 * FAKE_STACK_FRAME child_rip
 *
 * Pushes six quadwords, in this order: ss, rsp, eflags, cs, rip, orig rax.
 * %eax is zeroed first and supplies the rsp and orig-rax values; eflags is
 * pushed with only bit 9 set; rip is \child_rip.  Clobbers %rax and the
 * flags.  Each push is matched by a CFI adjustment of 8.
 */
	.macro FAKE_STACK_FRAME child_rip
	xorl	%eax, %eax
	pushq	$__KERNEL_DS		/* ss */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	ss,0*/
	pushq	%rax			/* rsp */
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET	rsp,0
	pushq	$(1<<9)			/* eflags - interrupts on */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	rflags,0*/
	pushq	$__KERNEL_CS		/* cs */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	cs,0*/
	pushq	\child_rip		/* rip */
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET	rip,0
	pushq	%rax			/* orig rax */
	CFI_ADJUST_CFA_OFFSET	8
	.endm
230
/*
 * UNFAKE_STACK_FRAME
 *
 * Drops six quadwords (48 bytes) from the stack and moves the CFA offset
 * back by the same amount.
 */
	.macro UNFAKE_STACK_FRAME
	addq	$8*6, %rsp
	CFI_ADJUST_CFA_OFFSET	-(6*8)
	.endm
235
/*
 * CFI_DEFAULT_STACK start=1
 *
 * Emits unwind annotations only, no instructions.
 *   start != 0: opens a new "simple" signal-frame CFI region with the CFA
 *               at rsp + SS+8.
 *   start == 0: only resets the CFA offset to SS+8 in the current region.
 * In both cases every general register, plus rip and rsp, is then declared
 * as saved at its own frame offset.  cs, rflags and ss stay commented out.
 */
	.macro CFI_DEFAULT_STACK start=1
	.if \start
	CFI_STARTPROC	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,SS+8
	.else
	CFI_DEF_CFA_OFFSET SS+8
	.endif
	CFI_REL_OFFSET	r15,R15
	CFI_REL_OFFSET	r14,R14
	CFI_REL_OFFSET	r13,R13
	CFI_REL_OFFSET	r12,R12
	CFI_REL_OFFSET	rbp,RBP
	CFI_REL_OFFSET	rbx,RBX
	CFI_REL_OFFSET	r11,R11
	CFI_REL_OFFSET	r10,R10
	CFI_REL_OFFSET	r9,R9
	CFI_REL_OFFSET	r8,R8
	CFI_REL_OFFSET	rax,RAX
	CFI_REL_OFFSET	rcx,RCX
	CFI_REL_OFFSET	rdx,RDX
	CFI_REL_OFFSET	rsi,RSI
	CFI_REL_OFFSET	rdi,RDI
	CFI_REL_OFFSET	rip,RIP
	/*CFI_REL_OFFSET	cs,CS*/
	/*CFI_REL_OFFSET	rflags,EFLAGS*/
	CFI_REL_OFFSET	rsp,RSP
	/*CFI_REL_OFFSET	ss,SS*/
	.endm
/*
 * A newly forked process directly context switches into this.
 *
 * In:  rdi = prev (handed straight on to schedule_tail)
 *
 * Flow:
 *   1. reload the flags register from kernel_eflags
 *   2. call schedule_tail
 *   3. if _TIF_SYSCALL_TRACE or _TIF_SYSCALL_AUDIT is set, call
 *      syscall_trace_leave with %rsp as its argument (rff_trace)
 *   4. RESTORE_REST, then choose the exit:
 *        saved CS has ring bits 0 (kernel_thread) -> int_ret_from_sys_call
 *        _TIF_IA32 set                             -> int_ret_from_sys_call
 *        otherwise RESTORE_TOP_OF_STACK            -> ret_from_sys_call
 */
ENTRY(ret_from_fork)
	CFI_DEFAULT_STACK
	/*
	 * A push/pop in 64-bit mode always moves %rsp by 8 bytes, so the
	 * CFA has to be adjusted by 8 (not 4) for the unwind information
	 * to stay correct between the two instructions.
	 */
	pushq	kernel_eflags(%rip)
	CFI_ADJUST_CFA_OFFSET 8
	popfq				/* reset kernel eflags */
	CFI_ADJUST_CFA_OFFSET -8
	call	schedule_tail
	GET_THREAD_INFO(%rcx)
	testl	$(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT),TI_flags(%rcx)
	jnz	rff_trace
rff_action:
	RESTORE_REST
	testl	$3,CS-ARGOFFSET(%rsp)	/* from kernel_thread? */
	je	int_ret_from_sys_call
	testl	$_TIF_IA32,TI_flags(%rcx)
	jnz	int_ret_from_sys_call
	RESTORE_TOP_OF_STACK %rdi,ARGOFFSET
	jmp	ret_from_sys_call
rff_trace:
	movq	%rsp,%rdi
	call	syscall_trace_leave
	/* thread info is fetched again for the tests at rff_action */
	GET_THREAD_INFO(%rcx)
	jmp	rff_action
	CFI_ENDPROC
END(ret_from_fork)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294
/*
 * System call entry. Up to 6 arguments in registers are supported.
 *
 * SYSCALL does not save anything on the stack and does not change the
 * stack pointer.
 */

/*
 * Register setup:
 * rax  system call number
 * rdi  arg0
 * rcx  return address for syscall/sysret, C arg3
 * rsi  arg1
 * rdx  arg2
 * r10  arg3	(--> moved to rcx for C)
 * r8   arg4
 * r9   arg5
 * r11  eflags for syscall/sysret, temporary for C
 * r12-r15,rbp,rbx saved by C code, not touched.
 *
 * Interrupts are off on entry.
 * Only called from user space.
 *
 * XXX	if we had a free scratch register we could save the RSP into the
 *	stack frame and report it properly in ps. Unfortunately we don't.
 *
 * When the user can change the frames always force IRET. That is because
 * it deals with uncanonical addresses better. SYSRET has trouble
 * with them due to bugs in both AMD and Intel CPUs.
 */

ENTRY(system_call)
	CFI_STARTPROC	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,PDA_STACKOFFSET
	CFI_REGISTER	rip,rcx
	/*CFI_REGISTER	rflags,r11*/
	SWAPGS_UNSAFE_STACK
	/*
	 * A hypervisor implementation might want to use a label
	 * after the swapgs, so that it can do the swapgs
	 * for the guest and jump here on syscall.
	 */
ENTRY(system_call_after_swapgs)

	/* park the user stack pointer in the PDA, switch to the kernel stack */
	movq	%rsp,%gs:pda_oldrsp
	movq	%gs:pda_kernelstack,%rsp
	/*
	 * No need to follow this irqs off/on section - it's straight
	 * and short:
	 */
	ENABLE_INTERRUPTS(CLBR_NONE)
	SAVE_ARGS 8,1
	movq	%rax,ORIG_RAX-ARGOFFSET(%rsp)
	movq	%rcx,RIP-ARGOFFSET(%rsp)
	CFI_REL_OFFSET rip,RIP-ARGOFFSET
	GET_THREAD_INFO(%rcx)
	/* trace, audit or seccomp pending: take the slow path */
	testl	$(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SECCOMP),TI_flags(%rcx)
	jnz	tracesys
	/* unsigned range check of the syscall number */
	cmpq	$__NR_syscall_max,%rax
	ja	badsys
	movq	%r10,%rcx			/* arg3: r10 -> rcx for C */
	call	*sys_call_table(,%rax,8)	/* XXX: rip relative */
	movq	%rax,RAX-ARGOFFSET(%rsp)
/*
 * Syscall return path ending with SYSRET (fast path)
 * Has incomplete stack frame and undefined top of stack.
 */
ret_from_sys_call:
	movl	$_TIF_ALLWORK_MASK,%edi
	/* edi: flagmask */
sysret_check:
	LOCKDEP_SYS_EXIT
	GET_THREAD_INFO(%rcx)
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	/* edx = thread flags filtered through the mask in edi */
	movl	TI_flags(%rcx),%edx
	andl	%edi,%edx
	jnz	sysret_careful
	CFI_REMEMBER_STATE
	/*
	 * sysretq will re-enable interrupts:
	 */
	TRACE_IRQS_ON
	movq	RIP-ARGOFFSET(%rsp),%rcx
	CFI_REGISTER	rip,rcx
	RESTORE_ARGS 0,-ARG_SKIP,1
	/*CFI_REGISTER	rflags,r11*/
	movq	%gs:pda_oldrsp, %rsp
	USERGS_SYSRET64

	CFI_RESTORE_STATE
	/* Handle reschedules */
	/* edx: work, edi: workmask */
sysret_careful:
	bt	$TIF_NEED_RESCHED,%edx
	jnc	sysret_signal
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	pushq	%rdi			/* keep the workmask across schedule */
	CFI_ADJUST_CFA_OFFSET 8
	call	schedule
	popq	%rdi
	CFI_ADJUST_CFA_OFFSET -8
	jmp	sysret_check

	/* Handle a signal */
sysret_signal:
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	testl	$_TIF_DO_NOTIFY_MASK,%edx
	jz	1f

	/* Really a signal */
	/* edx: work flags (arg3) */
	leaq	do_notify_resume(%rip),%rax
	leaq	-ARGOFFSET(%rsp),%rdi	/* &pt_regs -> arg1 */
	xorl	%esi,%esi		/* oldset -> arg2 */
	call	ptregscall_common
1:	movl	$_TIF_WORK_MASK,%edi
	/* Use IRET because user could have changed frame. This
	   works because ptregscall_common has called FIXUP_TOP_OF_STACK. */
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp	int_with_check

	/* syscall number out of range: report -ENOSYS */
badsys:
	movq	$-ENOSYS,RAX-ARGOFFSET(%rsp)
	jmp	ret_from_sys_call

	/* Do syscall tracing */
tracesys:
	SAVE_REST
	movq	$-ENOSYS,RAX(%rsp)	/* ptrace can change this for a bad syscall */
	FIXUP_TOP_OF_STACK %rdi
	movq	%rsp,%rdi
	call	syscall_trace_enter
	LOAD_ARGS ARGOFFSET	/* reload args from stack in case ptrace changed it */
	RESTORE_REST
	cmpq	$__NR_syscall_max,%rax
	ja	int_ret_from_sys_call	/* RAX(%rsp) set to -ENOSYS above */
	movq	%r10,%rcx		/* fixup for C */
	call	*sys_call_table(,%rax,8)
	movq	%rax,RAX-ARGOFFSET(%rsp)
	/* Use IRET because user could have changed frame */

/*
 * Syscall return path ending with IRET.
 * Has correct top of stack, but partial stack frame.
 */
	.globl int_ret_from_sys_call
int_ret_from_sys_call:
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	/* saved CS with ring bits 0: returning to kernel mode */
	testl	$3,CS-ARGOFFSET(%rsp)
	je	retint_restore_args
	movl	$_TIF_ALLWORK_MASK,%edi
	/* edi: mask to check */
int_with_check:
	LOCKDEP_SYS_EXIT_IRQ
	GET_THREAD_INFO(%rcx)
	movl	TI_flags(%rcx),%edx
	andl	%edi,%edx
	jnz	int_careful
	andl	$~TS_COMPAT,TI_status(%rcx)
	jmp	retint_swapgs

	/* Either reschedule or signal or syscall exit tracking needed. */
	/* First do a reschedule test. */
	/* edx: work, edi: workmask */
int_careful:
	bt	$TIF_NEED_RESCHED,%edx
	jnc	int_very_careful
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	pushq	%rdi			/* keep the workmask across schedule */
	CFI_ADJUST_CFA_OFFSET 8
	call	schedule
	popq	%rdi
	CFI_ADJUST_CFA_OFFSET -8
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp	int_with_check

	/* handle signals and tracing -- both require a full stack frame */
int_very_careful:
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	SAVE_REST
	/* Check for syscall exit trace */
	testl	$(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SINGLESTEP),%edx
	jz	int_signal
	pushq	%rdi
	CFI_ADJUST_CFA_OFFSET 8
	leaq	8(%rsp),%rdi		/* &ptregs -> arg1 (skip the pushed rdi) */
	call	syscall_trace_leave
	popq	%rdi
	CFI_ADJUST_CFA_OFFSET -8
	/* remove the trace bits from the workmask before re-checking */
	andl	$~(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SINGLESTEP),%edi
	jmp	int_restore_rest

int_signal:
	testl	$_TIF_DO_NOTIFY_MASK,%edx
	jz	1f
	movq	%rsp,%rdi		/* &ptregs -> arg1 */
	xorl	%esi,%esi		/* oldset -> arg2 */
	call	do_notify_resume
1:	movl	$_TIF_WORK_MASK,%edi
int_restore_rest:
	RESTORE_REST
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp	int_with_check
	CFI_ENDPROC
END(system_call)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511
/*
 * Certain special system calls that need to save a complete full stack frame.
 */

/*
 * PTREGSCALL label,func,arg
 *
 * Defines the global stub \label, which
 *   - loads the address of \func into %rax,
 *   - loads the pt_regs address into \arg (%rsp - ARGOFFSET, plus 8 to
 *     step over the return address sitting on the stack),
 *   - jumps to ptregscall_common.
 */
	.macro PTREGSCALL label,func,arg
	.globl \label
\label:
	leaq	\func(%rip),%rax
	leaq	-ARGOFFSET+8(%rsp),\arg		/* 8 for return address */
	jmp	ptregscall_common
END(\label)
	.endm
524
Jan Beulich7effaa82005-09-12 18:49:24 +0200525 CFI_STARTPROC
526
Linus Torvalds1da177e2005-04-16 15:20:36 -0700527 PTREGSCALL stub_clone, sys_clone, %r8
528 PTREGSCALL stub_fork, sys_fork, %rdi
529 PTREGSCALL stub_vfork, sys_vfork, %rdi
Linus Torvalds1da177e2005-04-16 15:20:36 -0700530 PTREGSCALL stub_sigaltstack, sys_sigaltstack, %rdx
531 PTREGSCALL stub_iopl, sys_iopl, %rsi
532
533ENTRY(ptregscall_common)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 popq %r11
Jan Beulich7effaa82005-09-12 18:49:24 +0200535 CFI_ADJUST_CFA_OFFSET -8
536 CFI_REGISTER rip, r11
Linus Torvalds1da177e2005-04-16 15:20:36 -0700537 SAVE_REST
538 movq %r11, %r15
Jan Beulich7effaa82005-09-12 18:49:24 +0200539 CFI_REGISTER rip, r15
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540 FIXUP_TOP_OF_STACK %r11
541 call *%rax
542 RESTORE_TOP_OF_STACK %r11
543 movq %r15, %r11
Jan Beulich7effaa82005-09-12 18:49:24 +0200544 CFI_REGISTER rip, r11
Linus Torvalds1da177e2005-04-16 15:20:36 -0700545 RESTORE_REST
546 pushq %r11
Jan Beulich7effaa82005-09-12 18:49:24 +0200547 CFI_ADJUST_CFA_OFFSET 8
548 CFI_REL_OFFSET rip, 0
Linus Torvalds1da177e2005-04-16 15:20:36 -0700549 ret
550 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200551END(ptregscall_common)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700552
/*
 * stub_execve
 *
 * Discards its own return address (popped into %r11, which is then reused
 * as scratch), builds a full frame, and calls sys_execve with %rcx pointing
 * at that frame.  The result is stored in the RAX slot and the stub leaves
 * through int_ret_from_sys_call; it never returns to its caller.
 */
ENTRY(stub_execve)
	CFI_STARTPROC
	popq	%r11
	CFI_ADJUST_CFA_OFFSET -8
	CFI_REGISTER rip, r11
	SAVE_REST
	FIXUP_TOP_OF_STACK %r11
	movq	%rsp, %rcx
	call	sys_execve
	RESTORE_TOP_OF_STACK %r11
	movq	%rax,RAX(%rsp)
	RESTORE_REST
	jmp	int_ret_from_sys_call
	CFI_ENDPROC
END(stub_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568
/*
 * sigreturn is special because it needs to restore all registers on return.
 * This cannot be done with SYSRET, so use the IRET return path instead.
 *
 * The stub drops its own return address (addq $8), builds a full frame,
 * passes the frame address in %rdi to sys_rt_sigreturn, stores the result
 * in the RAX slot and leaves via int_ret_from_sys_call.  %r11 is scratch.
 */
ENTRY(stub_rt_sigreturn)
	CFI_STARTPROC
	addq	$8, %rsp
	CFI_ADJUST_CFA_OFFSET	-8
	SAVE_REST
	movq	%rsp,%rdi
	FIXUP_TOP_OF_STACK %r11
	call	sys_rt_sigreturn
	movq	%rax,RAX(%rsp)	/* fixme, this could be done at the higher layer */
	RESTORE_REST
	jmp	int_ret_from_sys_call
	CFI_ENDPROC
END(stub_rt_sigreturn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586
/*
 * initial frame state for interrupts and exceptions
 *
 * _frame ref
 *   Opens a "simple" signal-frame CFI region.  \ref is the frame slot that
 *   %rsp points at on entry: the CFA is rsp + SS+8-\ref, and rsp/rip are
 *   declared saved at their slot offsets relative to \ref.  Emits unwind
 *   annotations only; ss, rflags and cs stay commented out.
 */
	.macro _frame ref
	CFI_STARTPROC simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA rsp,SS+8-\ref
	/*CFI_REL_OFFSET ss,SS-\ref*/
	CFI_REL_OFFSET rsp,RSP-\ref
	/*CFI_REL_OFFSET rflags,EFLAGS-\ref*/
	/*CFI_REL_OFFSET cs,CS-\ref*/
	CFI_REL_OFFSET rip,RIP-\ref
	.endm
600
/*
 * INTR_FRAME: initial frame state for interrupts (and exceptions without
 * an error code); %rsp is at the RIP slot.
 */
#define INTR_FRAME _frame RIP
/*
 * XCPT_FRAME: initial frame state for exceptions with an error code (and
 * interrupts with the vector already pushed); %rsp is at the ORIG_RAX slot.
 */
#define XCPT_FRAME _frame ORIG_RAX
606
/*
 * Interrupt entry/exit.
 *
 * Interrupt entry points save only callee clobbered registers in fast path.
 *
 * Entry runs with interrupts off.
 */

/*
 * interrupt func
 *
 * In:   0(%rsp): interrupt number
 * Does: SAVE_ARGS; %rdi = %rsp - ARGOFFSET as arg1 for the handler; sets
 *       up an %rbp frame; SWAPGS when the saved CS has non-zero ring bits;
 *       bumps %gs:pda_irqcount and, when that increment produces zero,
 *       loads %rsp from %gs:pda_irqstackptr; pushes %rbp; calls \func.
 */
	.macro interrupt func
	cld
	SAVE_ARGS
	leaq	-ARGOFFSET(%rsp),%rdi	/* arg1 for handler */
	pushq	%rbp
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET		rbp, 0
	movq	%rsp,%rbp
	CFI_DEF_CFA_REGISTER	rbp
	testl	$3,CS(%rdi)
	je	1f
	SWAPGS
	/* irqcount is used to check if a CPU is already on an interrupt
	   stack or not. While this is essentially redundant with preempt_count
	   it is a little cheaper to use a separate counter in the PDA
	   (short of moving irq_enter into assembly, which would be too
	    much work) */
1:	incl	%gs:pda_irqcount
	/* ZF comes from the incl above */
	cmoveq	%gs:pda_irqstackptr,%rsp
	push	%rbp			/* backlink for old unwinder */
	/*
	 * We entered an interrupt context - irqs are off:
	 */
	TRACE_IRQS_OFF
	call	\func
	.endm
642
/*
 * common_interrupt
 *
 * Runs do_IRQ through the "interrupt" macro, then picks the return path:
 *   saved CS ring bits == 0 -> retint_kernel
 *   otherwise                -> check thread flags against a work mask,
 *                               handle reschedule / signal work, then
 *                               SWAPGS and return.
 * Both paths end at irq_return (INTERRUPT_RETURN).  irq_return and
 * native_iret each have an __ex_table entry pointing at bad_iret.
 */
ENTRY(common_interrupt)
	XCPT_FRAME
	interrupt do_IRQ
	/* 0(%rsp): oldrsp-ARGOFFSET */
ret_from_intr:
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	decl	%gs:pda_irqcount
	leaveq
	CFI_DEF_CFA_REGISTER	rsp
	CFI_ADJUST_CFA_OFFSET	-8
exit_intr:
	GET_THREAD_INFO(%rcx)
	testl	$3,CS-ARGOFFSET(%rsp)
	je	retint_kernel

	/* Interrupt came from user space */
	/*
	 * Has a correct top of stack, but a partial stack frame
	 * %rcx: thread info. Interrupts off.
	 */
retint_with_reschedule:
	movl	$_TIF_WORK_MASK,%edi
retint_check:
	LOCKDEP_SYS_EXIT_IRQ
	/* edx = thread flags filtered through the mask in edi */
	movl	TI_flags(%rcx),%edx
	andl	%edi,%edx
	CFI_REMEMBER_STATE
	jnz	retint_careful

retint_swapgs:		/* return to user-space */
	/*
	 * The iretq could re-enable interrupts:
	 */
	DISABLE_INTERRUPTS(CLBR_ANY)
	TRACE_IRQS_IRETQ
	SWAPGS
	jmp	restore_args

retint_restore_args:	/* return to kernel space */
	DISABLE_INTERRUPTS(CLBR_ANY)
	/*
	 * The iretq could re-enable interrupts:
	 */
	TRACE_IRQS_IRETQ
restore_args:
	RESTORE_ARGS 0,8,0

irq_return:
	INTERRUPT_RETURN

	/* a fault at irq_return is redirected to bad_iret */
	.section __ex_table, "a"
	.quad irq_return, bad_iret
	.previous

#ifdef CONFIG_PARAVIRT
ENTRY(native_iret)
	iretq

	/* a fault at native_iret is redirected to bad_iret */
	.section __ex_table,"a"
	.quad native_iret, bad_iret
	.previous
#endif

	.section .fixup,"ax"
bad_iret:
	/*
	 * The iret traps when the %cs or %ss being restored is bogus.
	 * We've lost the original trap vector and error code.
	 * #GPF is the most likely one to get for an invalid selector.
	 * So pretend we completed the iret and took the #GPF in user mode.
	 *
	 * We are now running with the kernel GS after exception recovery.
	 * But error_entry expects us to have user GS to match the user %cs,
	 * so swap back.
	 */
	pushq	$0

	SWAPGS
	jmp	general_protection

	.previous

	/* edi: workmask, edx: work */
retint_careful:
	CFI_RESTORE_STATE
	bt	$TIF_NEED_RESCHED,%edx
	jnc	retint_signal
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	pushq	%rdi			/* keep the workmask across schedule */
	CFI_ADJUST_CFA_OFFSET	8
	call	schedule
	popq	%rdi
	CFI_ADJUST_CFA_OFFSET	-8
	GET_THREAD_INFO(%rcx)
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp	retint_check

retint_signal:
	testl	$_TIF_DO_NOTIFY_MASK,%edx
	jz	retint_swapgs
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	SAVE_REST
	movq	$-1,ORIG_RAX(%rsp)
	xorl	%esi,%esi		/* oldset */
	movq	%rsp,%rdi		/* &pt_regs */
	call	do_notify_resume
	RESTORE_REST
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	GET_THREAD_INFO(%rcx)
	jmp	retint_with_reschedule

#ifdef CONFIG_PREEMPT
	/* Returning to kernel space. Check if we need preemption */
	/* rcx: threadinfo. interrupts off. */
ENTRY(retint_kernel)
	/* all three tests must pass before preempt_schedule_irq is called */
	cmpl	$0,TI_preempt_count(%rcx)
	jnz	retint_restore_args
	bt	$TIF_NEED_RESCHED,TI_flags(%rcx)
	jnc	retint_restore_args
	bt	$9,EFLAGS-ARGOFFSET(%rsp)	/* interrupts off? */
	jnc	retint_restore_args
	call	preempt_schedule_irq
	jmp	exit_intr
#endif

	CFI_ENDPROC
END(common_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775
776/*
777 * APIC interrupts.
778 */
/*
 * apicinterrupt num,func - shared body of an APIC interrupt entry stub.
 *
 *   num:  vector number; its bitwise complement (~num) is what gets pushed
 *         on the stack before the common interrupt code runs.
 *   func: handler name handed to the `interrupt` macro.
 *
 * The expansion always leaves through ret_from_intr, so it never falls
 * through into whatever follows it.  The ENTRY()/END() pair is supplied by
 * the user of the macro.
 */
	.macro apicinterrupt num,func
	INTR_FRAME
	pushq $~(\num)			/* complemented vector number */
	CFI_ADJUST_CFA_OFFSET 8		/* unwind info: account for the push */
	interrupt \func
	jmp ret_from_intr
	CFI_ENDPROC
	.endm
787
/* Entry stubs for the thermal and MCE-threshold APIC vectors. */
ENTRY(thermal_interrupt)
	apicinterrupt THERMAL_APIC_VECTOR,smp_thermal_interrupt
END(thermal_interrupt)

ENTRY(threshold_interrupt)
	apicinterrupt THRESHOLD_APIC_VECTOR,mce_threshold_interrupt
END(threshold_interrupt)
Jacob Shin89b831e2005-11-05 17:25:53 +0100795
#ifdef CONFIG_SMP
/* APIC entry stubs that are only built for CONFIG_SMP kernels. */
ENTRY(reschedule_interrupt)
	apicinterrupt RESCHEDULE_VECTOR,smp_reschedule_interrupt
END(reschedule_interrupt)

	/*
	 * INVALIDATE_ENTRY num - emit invalidate_interrupt<num>, bound to
	 * vector INVALIDATE_TLB_VECTOR_START+num.  All instances share the
	 * same handler, smp_invalidate_interrupt.
	 */
	.macro INVALIDATE_ENTRY num
ENTRY(invalidate_interrupt\num)
	apicinterrupt INVALIDATE_TLB_VECTOR_START+\num,smp_invalidate_interrupt
END(invalidate_interrupt\num)
	.endm

	/* Eight consecutive invalidate vectors: invalidate_interrupt0..7 */
	INVALIDATE_ENTRY 0
	INVALIDATE_ENTRY 1
	INVALIDATE_ENTRY 2
	INVALIDATE_ENTRY 3
	INVALIDATE_ENTRY 4
	INVALIDATE_ENTRY 5
	INVALIDATE_ENTRY 6
	INVALIDATE_ENTRY 7

ENTRY(call_function_interrupt)
	apicinterrupt CALL_FUNCTION_VECTOR,smp_call_function_interrupt
END(call_function_interrupt)
ENTRY(call_function_single_interrupt)
	apicinterrupt CALL_FUNCTION_SINGLE_VECTOR,smp_call_function_single_interrupt
END(call_function_single_interrupt)
ENTRY(irq_move_cleanup_interrupt)
	apicinterrupt IRQ_MOVE_CLEANUP_VECTOR,smp_irq_move_cleanup_interrupt
END(irq_move_cleanup_interrupt)
#endif
826
/* Entry stubs for the local timer, UV BAU message, APIC error and spurious vectors. */
ENTRY(apic_timer_interrupt)
	apicinterrupt LOCAL_TIMER_VECTOR,smp_apic_timer_interrupt
END(apic_timer_interrupt)

ENTRY(uv_bau_message_intr1)
	/*
	 * NOTE(review): 220 is a bare vector number, unlike the named
	 * *_VECTOR constants used by every other stub here -- confirm it
	 * matches the vector the UV BAU code registers.
	 */
	apicinterrupt 220,uv_bau_message_interrupt
END(uv_bau_message_intr1)

ENTRY(error_interrupt)
	apicinterrupt ERROR_APIC_VECTOR,smp_error_interrupt
END(error_interrupt)

ENTRY(spurious_interrupt)
	apicinterrupt SPURIOUS_APIC_VECTOR,smp_spurious_interrupt
END(spurious_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842
843/*
844 * Exception entry points.
845 */
/*
 * zeroentry sym - entry stub for an exception that arrives without an
 * error code on the stack.
 *
 * Pushes a zero in place of the error code so the stack has the shape
 * error_entry expects, saves the interrupted %rax in the next slot, loads
 * the address of the handler \sym into %rax and jumps to error_entry.
 */
	.macro zeroentry sym
	INTR_FRAME
	PARAVIRT_ADJUST_EXCEPTION_FRAME
	pushq $0	/* push error code/oldrax */
	CFI_ADJUST_CFA_OFFSET 8
	pushq %rax	/* push real oldrax to the rdi slot */
	CFI_ADJUST_CFA_OFFSET 8
	CFI_REL_OFFSET rax,0
	leaq  \sym(%rip),%rax	/* rax = handler, as error_entry expects */
	jmp error_entry
	CFI_ENDPROC
	.endm
858
/*
 * errorentry sym - entry stub for an exception whose error code is already
 * on the stack when the stub starts (hence no dummy push, in contrast to
 * zeroentry).
 *
 * Saves the interrupted %rax on the stack, loads the address of the
 * handler \sym into %rax and jumps to error_entry.
 */
	.macro errorentry sym
	XCPT_FRAME
	PARAVIRT_ADJUST_EXCEPTION_FRAME
	pushq %rax		/* saved rax; error_entry reloads it from here */
	CFI_ADJUST_CFA_OFFSET 8
	CFI_REL_OFFSET rax,0
	leaq  \sym(%rip),%rax	/* rax = handler, as error_entry expects */
	jmp error_entry
	CFI_ENDPROC
	.endm
869
/*
 * paranoidentry sym, ist=0, irqtrace=1
 *
 * Entry sequence for exceptions that can hit anywhere (see the notes
 * below).  Saves all registers, decides from MSR_GS_BASE whether a SWAPGS
 * is needed, then calls \sym with
 *	rdi = pointer to the saved register frame (current %rsp)
 *	rsi = the error code taken from the ORIG_RAX slot
 * and finally disables interrupts.
 *
 *   ist:      when non-zero, TSS IST slot (\ist - 1) is lowered by
 *             EXCEPTION_STKSZ for the duration of the call and restored
 *             afterwards.
 *   irqtrace: when non-zero, TRACE_IRQS_OFF is emitted after interrupts
 *             have been disabled.
 *
 * Output: ebx = 1 if no SWAPGS was done on entry, 0 if one was done.
 */
	/* error code is on the stack already */
	/* handle NMI like exceptions that can happen everywhere */
	.macro paranoidentry sym, ist=0, irqtrace=1
	SAVE_ALL
	cld
	movl $1,%ebx			/* assume no swapgs is needed */
	movl  $MSR_GS_BASE,%ecx
	rdmsr				/* edx:eax = current GS base */
	testl %edx,%edx
	js    1f			/* sign bit set in upper half: skip SWAPGS */
	SWAPGS
	xorl  %ebx,%ebx			/* record that we did swap */
1:
	.if \ist
	movq	%gs:pda_data_offset, %rbp	/* base for the per-cpu TSS access below */
	.endif
	movq %rsp,%rdi			/* arg1: register frame */
	movq ORIG_RAX(%rsp),%rsi	/* arg2: error code */
	movq $-1,ORIG_RAX(%rsp)		/* slot no longer holds an error code */
	.if \ist
	subq	$EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
	.endif
	call \sym
	.if \ist
	addq	$EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
	.endif
	DISABLE_INTERRUPTS(CLBR_NONE)
	.if \irqtrace
	TRACE_IRQS_OFF
	.endif
	.endm
Ingo Molnar2601e642006-07-03 00:24:45 -0700901
902 /*
903 * "Paranoid" exit path from exception stack.
904 * Paranoid because this is used by NMIs and cannot take
905 * any kernel state for granted.
906 * We don't do kernel preemption checks here, because only
907 * NMI should be common and it does not enable IRQs and
908 * cannot get reschedule ticks.
909 *
910 * "trace" is 0 for the NMI handler only, because irq-tracing
911 * is fundamentally NMI-unsafe. (we cannot change the soft and
912 * hard flags at once, atomically)
913 */
/*
 * paranoidexit trace=1 - emit the exit path that follows paranoidentry.
 *
 * Every label carries the \trace value as a suffix, so each distinct
 * \trace value produces its own set of labels (paranoid_exit1,
 * paranoid_exit0, ...).
 *
 * Input: ebx = "no swapgs" flag left by paranoidentry.
 *
 *   ebx != 0                  -> restore registers and iret, no SWAPGS
 *   returning to kernel CS    -> SWAPGS, restore, iret
 *   returning to user CS      -> loop handling _TIF_WORK_MASK work
 *                                (reschedule or do_notify_resume) until
 *                                none is pending, then SWAPGS/restore/iret
 */
	.macro paranoidexit trace=1
	/* ebx:	no swapgs flag */
paranoid_exit\trace:
	testl %ebx,%ebx				/* swapgs needed? */
	jnz paranoid_restore\trace
	testl $3,CS(%rsp)			/* low CS bits set: returning to user mode */
	jnz   paranoid_userspace\trace
paranoid_swapgs\trace:
	.if \trace
	TRACE_IRQS_IRETQ 0
	.endif
	SWAPGS_UNSAFE_STACK
paranoid_restore\trace:
	RESTORE_ALL 8
	jmp irq_return
paranoid_userspace\trace:
	GET_THREAD_INFO(%rcx)
	movl TI_flags(%rcx),%ebx
	andl $_TIF_WORK_MASK,%ebx		/* ebx = pending work bits */
	jz paranoid_swapgs\trace		/* nothing pending: leave */
	movq %rsp,%rdi			/* &pt_regs */
	call sync_regs
	movq %rax,%rsp			/* switch stack for scheduling */
	testl $_TIF_NEED_RESCHED,%ebx
	jnz paranoid_schedule\trace
	movl %ebx,%edx			/* arg3: thread flags */
	.if \trace
	TRACE_IRQS_ON
	.endif
	ENABLE_INTERRUPTS(CLBR_NONE)
	xorl %esi,%esi 			/* arg2: oldset */
	movq %rsp,%rdi 			/* arg1: &pt_regs */
	call do_notify_resume
	DISABLE_INTERRUPTS(CLBR_NONE)
	.if \trace
	TRACE_IRQS_OFF
	.endif
	jmp paranoid_userspace\trace	/* re-check the work flags */
paranoid_schedule\trace:
	.if \trace
	TRACE_IRQS_ON
	.endif
	ENABLE_INTERRUPTS(CLBR_ANY)
	call schedule
	DISABLE_INTERRUPTS(CLBR_ANY)
	.if \trace
	TRACE_IRQS_OFF
	.endif
	jmp paranoid_userspace\trace	/* re-check the work flags */
	CFI_ENDPROC
	.endm
965
Linus Torvalds1da177e2005-04-16 15:20:36 -0700966/*
967 * Exception entry point. This expects an error code/orig_rax on the stack
968 * and the exception handler in %rax.
969 */
KPROBE_ENTRY(error_entry)
	_frame RDI
	CFI_REL_OFFSET rax,0
	/* rdi slot contains rax, oldrax contains error code */
	cld
	/*
	 * Reserve 14 more slots and fill them in.  %rsi is saved first so it
	 * can be used as scratch to move the interrupted %rax from the rdi
	 * slot (where the entry stub pushed it) into its own slot.  %rdi
	 * itself is stored later, at error_sti.
	 */
	subq  $14*8,%rsp
	CFI_ADJUST_CFA_OFFSET	(14*8)
	movq %rsi,13*8(%rsp)
	CFI_REL_OFFSET	rsi,RSI
	movq 14*8(%rsp),%rsi	/* load rax from rdi slot */
	CFI_REGISTER	rax,rsi
	movq %rdx,12*8(%rsp)
	CFI_REL_OFFSET	rdx,RDX
	movq %rcx,11*8(%rsp)
	CFI_REL_OFFSET	rcx,RCX
	movq %rsi,10*8(%rsp)	/* store rax */
	CFI_REL_OFFSET	rax,RAX
	movq %r8, 9*8(%rsp)
	CFI_REL_OFFSET	r8,R8
	movq %r9, 8*8(%rsp)
	CFI_REL_OFFSET	r9,R9
	movq %r10,7*8(%rsp)
	CFI_REL_OFFSET	r10,R10
	movq %r11,6*8(%rsp)
	CFI_REL_OFFSET	r11,R11
	movq %rbx,5*8(%rsp)
	CFI_REL_OFFSET	rbx,RBX
	movq %rbp,4*8(%rsp)
	CFI_REL_OFFSET	rbp,RBP
	movq %r12,3*8(%rsp)
	CFI_REL_OFFSET	r12,R12
	movq %r13,2*8(%rsp)
	CFI_REL_OFFSET	r13,R13
	movq %r14,1*8(%rsp)
	CFI_REL_OFFSET	r14,R14
	movq %r15,(%rsp)
	CFI_REL_OFFSET	r15,R15
	xorl %ebx,%ebx		/* ebx = 0: swapgs will be needed on exit */
	testl $3,CS(%rsp)	/* low CS bits clear: fault came from kernel mode */
	je  error_kernelspace
error_swapgs:
	SWAPGS
error_sti:
	movq %rdi,RDI(%rsp)
	CFI_REL_OFFSET	rdi,RDI
	movq %rsp,%rdi		/* arg1: saved register frame */
	movq ORIG_RAX(%rsp),%rsi	/* get error code */
	movq $-1,ORIG_RAX(%rsp)
	call *%rax		/* handler address supplied by the entry stub */
	/* ebx:	no swapgs flag (1: don't need swapgs, 0: need it) */
error_exit:
	movl %ebx,%eax		/* keep the flag in eax across RESTORE_REST */
	RESTORE_REST
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	GET_THREAD_INFO(%rcx)
	testl %eax,%eax
	jne  retint_kernel	/* flag set: take the kernel return path */
	LOCKDEP_SYS_EXIT_IRQ
	movl  TI_flags(%rcx),%edx
	movl  $_TIF_WORK_MASK,%edi
	andl  %edi,%edx		/* edx = pending work, edi = work mask */
	jnz  retint_careful
	jmp retint_swapgs
	CFI_ENDPROC

error_kernelspace:
	incl %ebx
	/* There are two places in the kernel that can potentially fault with
	   usergs. Handle them here. The exception handlers after
	   iret run with kernel gs again, so don't set the user space flag.
	   B stepping K8s sometimes report a truncated RIP for IRET
	   exceptions returning to compat mode. Check for these here too. */
	leaq irq_return(%rip),%rcx
	cmpq %rcx,RIP(%rsp)
	je   error_swapgs
	movl %ecx,%ecx	/* zero extend */
	cmpq %rcx,RIP(%rsp)	/* same address with the upper 32 bits truncated */
	je   error_swapgs
	cmpq $gs_change,RIP(%rsp)
	je   error_swapgs
	jmp  error_sti
KPROBE_END(error_entry)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053
/*
 * native_load_gs_index - load a new selector into %gs, with exception
 * handling for a bad selector.
 *
 * In:  edi = new selector
 *
 * Interrupts are disabled (flags saved with pushf and restored with popf)
 * while GS is swapped around the segment load.  If the load at gs_change
 * faults, the __ex_table entry redirects to bad_gs, which loads a null
 * selector instead and resumes at label 2.
 */
	/* Reload gs selector with exception handling */
	/* edi:  new selector */
ENTRY(native_load_gs_index)
	CFI_STARTPROC
	pushf
	CFI_ADJUST_CFA_OFFSET 8
	/*
	 * %edi still holds the selector and is consumed at gs_change, so RDI
	 * must be left out of the clobber set.  The mask used to read
	 * "CLBR_ANY | ~(CLBR_RDI)", which ORs in every bit and therefore
	 * excludes nothing (assuming, as the name says, CLBR_ANY already
	 * covers CLBR_RDI).
	 */
	DISABLE_INTERRUPTS(CLBR_ANY & ~(CLBR_RDI))
	SWAPGS
gs_change:
	movl %edi,%gs
2:	mfence		/* workaround */
	SWAPGS
	popf
	CFI_ADJUST_CFA_OFFSET -8
	ret
	CFI_ENDPROC
ENDPROC(native_load_gs_index)

	/* A fault at gs_change is fixed up by continuing at bad_gs. */
	.section __ex_table,"a"
	.align 8
	.quad gs_change,bad_gs
	.previous
	.section .fixup,"ax"
	/* running with kernelgs */
bad_gs:
	SWAPGS			/* switch back to user gs */
	xorl %eax,%eax
	movl %eax,%gs		/* fall back to the null selector */
	jmp  2b
	.previous
1084
1085/*
1086 * Create a kernel thread.
1087 *
1088 * C extern interface:
1089 * extern long kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
1090 *
1091 * asm input arguments:
1092 * rdi: fn, rsi: arg, rdx: flags
1093 */
ENTRY(kernel_thread)
	CFI_STARTPROC
	/* Build a fake frame whose return address is child_rip, then save all registers. */
	FAKE_STACK_FRAME $child_rip
	SAVE_ALL

	# rdi: flags, rsi: usp, rdx: will be &pt_regs
	movq %rdx,%rdi
	orq  kernel_thread_flags(%rip),%rdi	# add the flags every kernel thread gets
	movq $-1, %rsi
	movq %rsp, %rdx

	xorl %r8d,%r8d			# remaining do_fork arguments are zero
	xorl %r9d,%r9d

	# clone now
	call do_fork
	movq %rax,RAX(%rsp)		# do_fork result goes into the saved rax slot
	# NOTE(review): %rdi appears to be reloaded by RESTORE_ALL below, which
	# would make this xorl dead code -- confirm before removing.
	xorl %edi,%edi

	/*
	 * It isn't worth checking for a reschedule here,
	 * so internally to the x86_64 port you can rely on kernel_thread()
	 * not to reschedule the child before returning, this avoids the need
	 * of hacks for example to fork off the per-CPU idle tasks.
	 * [Hopefully no generic code relies on the reschedule -AK]
	 */
	RESTORE_ALL
	UNFAKE_STACK_FRAME
	ret
	CFI_ENDPROC
ENDPROC(kernel_thread)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001125
/*
 * child_rip - address that kernel_thread places in its fake stack frame.
 *
 * In:  rdi = fn, rsi = arg (as passed to kernel_thread)
 *
 * Calls fn(arg) and passes its 32-bit return value to do_exit.
 */
child_rip:
	pushq $0		# fake return address
	CFI_STARTPROC
	/*
	 * Here we are in the child and the registers are set as they were
	 * at kernel_thread() invocation in the parent.
	 */
	movq %rdi, %rax		# rax = fn
	movq %rsi, %rdi		# arg1 = arg
	call *%rax
	# exit
	mov %eax, %edi		# exit code = fn's return value
	call do_exit
	CFI_ENDPROC
ENDPROC(child_rip)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001141
1142/*
1143 * execve(). This function needs to use IRET, not SYSRET, to set up all state properly.
1144 *
1145 * C extern interface:
1146 * extern long execve(char *name, char **argv, char **envp)
1147 *
1148 * asm input arguments:
1149 * rdi: name, rsi: argv, rdx: envp
1150 *
 * We want to fall back to:
 *	extern long sys_execve(char *name, char **argv,char **envp, struct pt_regs *regs)
 *
 * sys_execve asm fallback arguments:
 *	rdi: name, rsi: argv, rdx: envp, rcx: fake frame on the stack
Linus Torvalds1da177e2005-04-16 15:20:36 -07001156 */
ENTRY(kernel_execve)
	CFI_STARTPROC
	FAKE_STACK_FRAME $0
	SAVE_ALL
	movq %rsp,%rcx			# arg4: the register frame just built
	call sys_execve
	movq %rax, RAX(%rsp)		# result goes into the saved rax slot
	RESTORE_REST
	testq %rax,%rax
	je int_ret_from_sys_call	# rax == 0: leave through the syscall return path
	/* Non-zero result: unwind the fake frame and return it to the caller. */
	RESTORE_ARGS
	UNFAKE_STACK_FRAME
	ret
	CFI_ENDPROC
ENDPROC(kernel_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001172
/*
 * Exception entry stubs.  errorentry is used where the error code is
 * already on the stack, zeroentry where a zero is pushed in its place;
 * both hand the named C handler to error_entry.
 */
KPROBE_ENTRY(page_fault)
	errorentry do_page_fault
KPROBE_END(page_fault)

ENTRY(coprocessor_error)
	zeroentry do_coprocessor_error
END(coprocessor_error)

ENTRY(simd_coprocessor_error)
	zeroentry do_simd_coprocessor_error
END(simd_coprocessor_error)

ENTRY(device_not_available)
	zeroentry math_state_restore
END(device_not_available)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001188
/*
 * debug - entry for the debug exception.  Pushes a zero error code, runs
 * do_debug through paranoidentry with the DEBUG_STACK IST slot, and
 * expands paranoidexit with its default trace=1 here.  That expansion is
 * what defines the paranoid_exit1 label the other paranoid entries jump to.
 */
	/* runs on exception stack */
KPROBE_ENTRY(debug)
	INTR_FRAME
	pushq $0
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_debug, DEBUG_STACK
	paranoidexit
KPROBE_END(debug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001197
/*
 * nmi - NMI entry.  Pushes -1 into the error-code slot and runs do_nmi
 * through paranoidentry with ist=0 and irqtrace=0 (no irq tracing).
 * With CONFIG_TRACE_IRQFLAGS it gets its own non-tracing exit path
 * (paranoidexit 0); otherwise it shares paranoid_exit1.
 */
	/* runs on exception stack */
KPROBE_ENTRY(nmi)
	INTR_FRAME
	pushq $-1
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_nmi, 0, 0
#ifdef CONFIG_TRACE_IRQFLAGS
	paranoidexit 0
#else
	jmp paranoid_exit1
	CFI_ENDPROC
#endif
KPROBE_END(nmi)
Andi Kleen6fefb0d2005-04-16 15:25:03 -07001211
/*
 * int3 - breakpoint exception entry.  Pushes a zero error code, runs
 * do_int3 through paranoidentry with the DEBUG_STACK IST slot and leaves
 * through the shared paranoid_exit1 path.
 */
KPROBE_ENTRY(int3)
	INTR_FRAME
	pushq $0
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_int3, DEBUG_STACK
	jmp paranoid_exit1
	CFI_ENDPROC
KPROBE_END(int3)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001220
/*
 * More exception entry stubs.  zeroentry/errorentry stubs go through
 * error_entry; double_fault and stack_segment use paranoidentry and leave
 * through paranoid_exit1.
 */
ENTRY(overflow)
	zeroentry do_overflow
END(overflow)

ENTRY(bounds)
	zeroentry do_bounds
END(bounds)

ENTRY(invalid_op)
	zeroentry do_invalid_op
END(invalid_op)

ENTRY(coprocessor_segment_overrun)
	zeroentry do_coprocessor_segment_overrun
END(coprocessor_segment_overrun)

	/* runs on exception stack */
ENTRY(double_fault)
	XCPT_FRAME			/* error code already on the stack */
	paranoidentry do_double_fault
	jmp paranoid_exit1
	CFI_ENDPROC
END(double_fault)

ENTRY(invalid_TSS)
	errorentry do_invalid_TSS
END(invalid_TSS)

ENTRY(segment_not_present)
	errorentry do_segment_not_present
END(segment_not_present)

	/* runs on exception stack */
ENTRY(stack_segment)
	XCPT_FRAME			/* error code already on the stack */
	paranoidentry do_stack_segment
	jmp paranoid_exit1
	CFI_ENDPROC
END(stack_segment)

KPROBE_ENTRY(general_protection)
	errorentry do_general_protection
KPROBE_END(general_protection)

ENTRY(alignment_check)
	errorentry do_alignment_check
END(alignment_check)

ENTRY(divide_error)
	zeroentry do_divide_error
END(divide_error)

ENTRY(spurious_interrupt_bug)
	zeroentry do_spurious_interrupt_bug
END(spurious_interrupt_bug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001276
#ifdef CONFIG_X86_MCE
	/*
	 * machine_check - machine-check exception entry.  Pushes a zero error
	 * code, runs do_machine_check through paranoidentry and leaves through
	 * paranoid_exit1.
	 */
	/* runs on exception stack */
ENTRY(machine_check)
	INTR_FRAME
	pushq $0
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_machine_check
	jmp paranoid_exit1
	CFI_ENDPROC
END(machine_check)
#endif
1288
/*
 * Call softirq on interrupt stack. Interrupts are off.
 *
 * Runs __do_softirq with pda_irqcount raised.  The stack pointer is
 * switched to pda_irqstackptr only when the increment leaves
 * pda_irqcount at zero; the previous stack is recovered through %rbp.
 */
ENTRY(call_softirq)
	CFI_STARTPROC
	push %rbp
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET rbp,0
	mov  %rsp,%rbp			# rbp remembers the caller's stack
	CFI_DEF_CFA_REGISTER rbp
	incl %gs:pda_irqcount		# sets ZF when the count becomes 0
	cmove %gs:pda_irqstackptr,%rsp	# switch stacks only in that case
	push  %rbp			# backlink for old unwinder
	call __do_softirq
	leaveq				# rsp = rbp, then pop rbp: back on the old stack
	CFI_DEF_CFA_REGISTER	rsp
	CFI_ADJUST_CFA_OFFSET   -8
	decl %gs:pda_irqcount
	ret
	CFI_ENDPROC
ENDPROC(call_softirq)
Andi Kleen75154f42007-06-23 02:29:25 +02001308
/*
 * ignore_sysret - loads -ENOSYS into %eax and returns with sysret.
 *
 * The block is opened with KPROBE_ENTRY, so it is closed with the matching
 * KPROBE_END, exactly like every other KPROBE_ENTRY block in this file.
 * Closing it with ENDPROC left the KPROBE_ENTRY/KPROBE_END pairing
 * unbalanced for everything assembled after this point.
 */
KPROBE_ENTRY(ignore_sysret)
	CFI_STARTPROC
	mov $-ENOSYS,%eax
	sysret
	CFI_ENDPROC
KPROBE_END(ignore_sysret)
Jeremy Fitzhardinge3d75e1b2008-07-08 15:06:49 -07001315
1316#ifdef CONFIG_XEN
/*
 * xen_hypervisor_callback - entry stub that reaches
 * xen_do_hypervisor_callback through zeroentry/error_entry.
 */
ENTRY(xen_hypervisor_callback)
	zeroentry xen_do_hypervisor_callback
END(xen_hypervisor_callback)
1320
1321/*
1322# A note on the "critical region" in our callback handler.
1323# We want to avoid stacking callback handlers due to events occurring
1324# during handling of the last event. To do this, we keep events disabled
1325# until we've done all processing. HOWEVER, we must enable events before
1326# popping the stack frame (can't be done atomically) and so it would still
1327# be possible to get enough handler activations to overflow the stack.
1328# Although unlikely, bugs of that kind are hard to track down, so we'd
1329# like to avoid the possibility.
1330# So, on entry to the handler we detect whether we interrupted an
1331# existing activation in its critical region -- if so, we pop the current
1332# activation and restart the handler using the previous one.
1333*/
/*
 * xen_do_hypervisor_callback(struct pt_regs *regs)
 *
 * In:  rdi = pointer to the saved register frame
 *
 * Makes the register frame the stack, runs xen_evtchn_do_upcall with
 * pda_irqcount raised (switching to pda_irqstackptr only when the
 * increment leaves the count at zero), then leaves through error_exit.
 * This code does not return to its caller.
 */
ENTRY(xen_do_hypervisor_callback)   # do_hypervisor_callback(struct *pt_regs)
	CFI_STARTPROC
/* Since we don't modify %rdi, xen_evtchn_do_upcall(struct *pt_regs) will
   see the correct pointer to the pt_regs */
	movq %rdi, %rsp            # we don't return, adjust the stack frame
	CFI_ENDPROC
	CFI_DEFAULT_STACK
11:	incl %gs:pda_irqcount		# sets ZF when the count becomes 0
	movq %rsp,%rbp
	CFI_DEF_CFA_REGISTER rbp
	cmovzq %gs:pda_irqstackptr,%rsp	# switch stacks only in that case
	pushq %rbp			# backlink for old unwinder
	call xen_evtchn_do_upcall
	popq %rsp			# back to the stack saved by the pushq above
	CFI_DEF_CFA_REGISTER rsp
	decl %gs:pda_irqcount
	jmp  error_exit
	CFI_ENDPROC
	/* END() must name the symbol that ENTRY() opened above. */
END(xen_do_hypervisor_callback)
1353
1354/*
1355# Hypervisor uses this for application faults while it executes.
1356# We get here for two reasons:
1357# 1. Fault while reloading DS, ES, FS or GS
1358# 2. Fault while executing IRET
1359# Category 1 we do not need to fix up as Xen has already reloaded all segment
1360# registers that could be reloaded and zeroed the others.
1361# Category 2 we fix up by killing the current process. We cannot use the
1362# normal Linux return path in this case because if we use the IRET hypercall
1363# to pop the stack frame we end up in an infinite loop of failsafe callbacks.
1364# We distinguish between categories by comparing each saved segment register
# with its current contents: any discrepancy means we are in category 1.
1366*/
ENTRY(xen_failsafe_callback)
	framesz = (RIP-0x30)	/* workaround buggy gas */
	_frame framesz
	/*
	 * Layout at entry, as used below:
	 *   0x00 rcx, 0x08 r11, 0x10 ds, 0x18 es, 0x20 fs, 0x28 gs
	 * followed at 0x30 by the rest of the frame.
	 */
	CFI_REL_OFFSET rcx, 0
	CFI_REL_OFFSET r11, 8
	/* Compare each live segment register with its saved copy. */
	movw %ds,%cx
	cmpw %cx,0x10(%rsp)
	CFI_REMEMBER_STATE
	jne 1f
	movw %es,%cx
	cmpw %cx,0x18(%rsp)
	jne 1f
	movw %fs,%cx
	cmpw %cx,0x20(%rsp)
	jne 1f
	movw %gs,%cx
	cmpw %cx,0x28(%rsp)
	jne 1f
	/* All segments match their saved values => Category 2 (Bad IRET). */
	movq (%rsp),%rcx
	CFI_RESTORE rcx
	movq 8(%rsp),%r11
	CFI_RESTORE r11
	addq $0x30,%rsp			/* drop rcx, r11 and the four segment slots */
	CFI_ADJUST_CFA_OFFSET -0x30
	/* Push 0, then r11 and rcx again, and enter general_protection. */
	pushq $0
	CFI_ADJUST_CFA_OFFSET 8
	pushq %r11
	CFI_ADJUST_CFA_OFFSET 8
	pushq %rcx
	CFI_ADJUST_CFA_OFFSET 8
	jmp general_protection
	CFI_RESTORE_STATE
1:	/* Segment mismatch => Category 1 (Bad segment). Retry the IRET. */
	movq (%rsp),%rcx
	CFI_RESTORE rcx
	movq 8(%rsp),%r11
	CFI_RESTORE r11
	addq $0x30,%rsp			/* drop rcx, r11 and the four segment slots */
	CFI_ADJUST_CFA_OFFSET -0x30
	pushq $0			/* fills the error-code/orig_rax slot */
	CFI_ADJUST_CFA_OFFSET 8
	SAVE_ALL
	jmp error_exit
	CFI_ENDPROC
END(xen_failsafe_callback)
1413
1414#endif /* CONFIG_XEN */