blob: a169225869ccfe62ed5c6780d7098e11c6680002 [file] [log] [blame]
/*
 *  linux/arch/x86_64/entry.S
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *  Copyright (C) 2000, 2001, 2002  Andi Kleen SuSE Labs
 *  Copyright (C) 2000  Pavel Machek <pavel@suse.cz>
 */
8
/*
 * entry.S contains the system-call and fault low-level handling routines.
 *
 * NOTE: This code handles signal-recognition, which happens every time
 * after an interrupt and after each system call.
 *
 * Normal syscalls and interrupts don't save a full stack frame; this is
 * only done for syscall tracing, signals or fork/exec et al.
 *
 * A note on terminology:
 * - top of stack: Architecture defined interrupt frame from SS to RIP
 *   at the top of the kernel process stack.
 * - partial stack frame: partially saved registers up to R11.
 * - full stack frame: Like partial stack frame, but all registers saved.
 *
 * Some macro usage:
 * - CFI macros are used to generate dwarf2 unwind information for better
 *   backtraces. They don't change any code.
 * - SAVE_ALL/RESTORE_ALL - Save/restore all registers
 * - SAVE_ARGS/RESTORE_ARGS - Save/restore registers that C functions modify.
 *   There are unfortunately lots of special cases where some registers
 *   are not touched. The macro is a big mess that should be cleaned up.
 * - SAVE_REST/RESTORE_REST - Handle the registers not saved by SAVE_ARGS.
 *   Gives a full stack frame.
 * - ENTRY/END Define functions in the symbol table.
 * - FIXUP_TOP_OF_STACK/RESTORE_TOP_OF_STACK - Fix up the hardware stack
 *   frame that is otherwise undefined after a SYSCALL
 * - TRACE_IRQ_* - Trace hard interrupt state for lock debugging.
 * - errorentry/paranoidentry/zeroentry - Define exception entry points.
 */
39
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#include <linux/linkage.h>
41#include <asm/segment.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#include <asm/cache.h>
43#include <asm/errno.h>
44#include <asm/dwarf2.h>
45#include <asm/calling.h>
Sam Ravnborge2d5df92005-09-09 21:28:48 +020046#include <asm/asm-offsets.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070047#include <asm/msr.h>
48#include <asm/unistd.h>
49#include <asm/thread_info.h>
50#include <asm/hw_irq.h>
Andi Kleen5f8efbb2006-01-16 01:56:39 +010051#include <asm/page.h>
Ingo Molnar2601e642006-07-03 00:24:45 -070052#include <asm/irqflags.h>
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +010053#include <asm/paravirt.h>
Abhishek Sagar395a59d2008-06-21 23:47:27 +053054#include <asm/ftrace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070055
56 .code64
57
#ifdef CONFIG_FTRACE
#ifdef CONFIG_DYNAMIC_FTRACE
/*
 * mcount (CONFIG_DYNAMIC_FTRACE variant)
 *
 * Saves %rax, %rcx, %rdx, %rsi, %rdi, %r8 and %r9 in a 0x38-byte stack
 * area, loads the return address of the mcount call (found just above
 * that area) into %rdi, subtracts MCOUNT_INSN_SIZE from it and issues
 * the call at mcount_call.  The saved registers are then reloaded and
 * the save area is released before returning.
 *
 * As assembled here mcount_call targets ftrace_stub.
 * NOTE(review): mcount_call is exported, presumably so the call can be
 * rewritten at run time - confirm against the ftrace C code.
 */
ENTRY(mcount)

	subq $0x38, %rsp		/* 7 slots of 8 bytes */
	movq %rax, (%rsp)
	movq %rcx, 8(%rsp)
	movq %rdx, 16(%rsp)
	movq %rsi, 24(%rsp)
	movq %rdi, 32(%rsp)
	movq %r8, 40(%rsp)
	movq %r9, 48(%rsp)

	movq 0x38(%rsp), %rdi		/* return address of the mcount call */
	subq $MCOUNT_INSN_SIZE, %rdi

.globl mcount_call
mcount_call:
	call ftrace_stub

	movq 48(%rsp), %r9
	movq 40(%rsp), %r8
	movq 32(%rsp), %rdi
	movq 24(%rsp), %rsi
	movq 16(%rsp), %rdx
	movq 8(%rsp), %rcx
	movq (%rsp), %rax
	addq $0x38, %rsp

	retq
END(mcount)
89
/*
 * ftrace_caller
 *
 * Same register save/restore sequence as mcount, but two arguments are
 * set up for the call at ftrace_call:
 *   %rdi = return address of the call into this routine, minus
 *          MCOUNT_INSN_SIZE
 *   %rsi = the quadword at 8(%rbp)
 *          NOTE(review): presumably the return address of the traced
 *          function's caller, which assumes %rbp is a frame pointer.
 *
 * ftrace_stub, defined at the end, is a bare retq; ftrace_caller falls
 * through into it after restoring the registers.
 */
ENTRY(ftrace_caller)

	/* taken from glibc */
	subq $0x38, %rsp		/* 7 slots of 8 bytes */
	movq %rax, (%rsp)
	movq %rcx, 8(%rsp)
	movq %rdx, 16(%rsp)
	movq %rsi, 24(%rsp)
	movq %rdi, 32(%rsp)
	movq %r8, 40(%rsp)
	movq %r9, 48(%rsp)

	movq 0x38(%rsp), %rdi		/* our own return address */
	movq 8(%rbp), %rsi
	subq $MCOUNT_INSN_SIZE, %rdi

.globl ftrace_call
ftrace_call:
	call ftrace_stub

	movq 48(%rsp), %r9
	movq 40(%rsp), %r8
	movq 32(%rsp), %rdi
	movq 24(%rsp), %rsi
	movq 16(%rsp), %rdx
	movq 8(%rsp), %rcx
	movq (%rsp), %rax
	addq $0x38, %rsp

.globl ftrace_stub
ftrace_stub:
	retq
END(ftrace_caller)
123
#else /* ! CONFIG_DYNAMIC_FTRACE */
/*
 * mcount (static variant)
 *
 * Returns immediately through ftrace_stub while ftrace_trace_function
 * still holds the address of ftrace_stub.  Otherwise saves %rax, %rcx,
 * %rdx, %rsi, %rdi, %r8 and %r9, calls *ftrace_trace_function with
 *   %rdi = return address of the mcount call, minus MCOUNT_INSN_SIZE
 *   %rsi = the quadword at 8(%rbp)
 *          NOTE(review): presumably the parent's return address, which
 *          assumes %rbp is a frame pointer - confirm.
 * and restores the registers before returning through ftrace_stub.
 */
ENTRY(mcount)
	cmpq $ftrace_stub, ftrace_trace_function
	jnz trace
.globl ftrace_stub
ftrace_stub:
	retq

trace:
	/* taken from glibc */
	subq $0x38, %rsp		/* 7 slots of 8 bytes */
	movq %rax, (%rsp)
	movq %rcx, 8(%rsp)
	movq %rdx, 16(%rsp)
	movq %rsi, 24(%rsp)
	movq %rdi, 32(%rsp)
	movq %r8, 40(%rsp)
	movq %r9, 48(%rsp)

	movq 0x38(%rsp), %rdi		/* return address of the mcount call */
	movq 8(%rbp), %rsi
	subq $MCOUNT_INSN_SIZE, %rdi

	call   *ftrace_trace_function

	movq 48(%rsp), %r9
	movq 40(%rsp), %r8
	movq 32(%rsp), %rdi
	movq 24(%rsp), %rsi
	movq 16(%rsp), %rdx
	movq 8(%rsp), %rcx
	movq (%rsp), %rax
	addq $0x38, %rsp

	jmp ftrace_stub
END(mcount)
#endif /* CONFIG_DYNAMIC_FTRACE */
#endif /* CONFIG_FTRACE */
Arnaldo Carvalho de Melo16444a82008-05-12 21:20:42 +0200162
#ifndef CONFIG_PREEMPT
/* Without CONFIG_PREEMPT, retint_kernel is simply another name for retint_restore_args. */
#define retint_kernel retint_restore_args
#endif
Ingo Molnar2601e642006-07-03 00:24:45 -0700166
#ifdef CONFIG_PARAVIRT
/*
 * native_usergs_sysret64: the bare "swapgs; sysretq" sequence.
 * Never returns to its caller - sysretq leaves the kernel.
 */
ENTRY(native_usergs_sysret64)
	swapgs
	sysretq
END(native_usergs_sysret64)
#endif /* CONFIG_PARAVIRT */
172
Ingo Molnar2601e642006-07-03 00:24:45 -0700173
/*
 * TRACE_IRQS_IRETQ offset=ARGOFFSET
 *
 * Emits TRACE_IRQS_ON when bit 9 (the interrupt-enable flag) is set in
 * the EFLAGS image stored at EFLAGS-\offset(%rsp), i.e. when the frame
 * about to be returned to has interrupts enabled.
 * Expands to nothing unless CONFIG_TRACE_IRQFLAGS is defined.
 */
.macro TRACE_IRQS_IRETQ offset=ARGOFFSET
#ifdef CONFIG_TRACE_IRQFLAGS
	bt   $9,EFLAGS-\offset(%rsp)	/* interrupts off? */
	jnc  1f
	TRACE_IRQS_ON
1:
#endif
.endm
182
/*
 * C code is not supposed to know about undefined top of stack. Every time
 * a C function with a pt_regs argument is called from the SYSCALL based
 * fast path FIXUP_TOP_OF_STACK is needed.
 * RESTORE_TOP_OF_STACK syncs the syscall state after any possible ptregs
 * manipulation.
 *
 * FIXUP_TOP_OF_STACK tmp
 *   Fills in the RSP, SS, CS, RCX and EFLAGS slots of the frame at %rsp:
 *   RSP from %gs:pda_oldrsp, SS/CS with the user selectors, RCX with -1
 *   and EFLAGS from the frame's R11 slot.  Clobbers \tmp.
 */

	/* %rsp:at FRAMEEND */
	.macro FIXUP_TOP_OF_STACK tmp
	movq	%gs:pda_oldrsp,\tmp
	movq	\tmp,RSP(%rsp)
	movq	$__USER_DS,SS(%rsp)
	movq	$__USER_CS,CS(%rsp)
	movq	$-1,RCX(%rsp)
	movq	R11(%rsp),\tmp  /* get eflags */
	movq	\tmp,EFLAGS(%rsp)
	.endm
201
/*
 * RESTORE_TOP_OF_STACK tmp,offset=0
 *   Copies the frame's RSP slot back to %gs:pda_oldrsp and the frame's
 *   EFLAGS slot back into its R11 slot.  \offset is subtracted from every
 *   frame offset, for callers whose %rsp sits \offset bytes into the
 *   frame.  Clobbers \tmp.
 */
	.macro RESTORE_TOP_OF_STACK tmp,offset=0
	movq	RSP-\offset(%rsp),\tmp
	movq	\tmp,%gs:pda_oldrsp
	movq	EFLAGS-\offset(%rsp),\tmp
	movq	\tmp,R11-\offset(%rsp)
	.endm
208
/*
 * FAKE_STACK_FRAME child_rip
 *   Pushes six quadwords that mimic an interrupt frame followed by an
 *   orig_rax slot: ss = __KERNEL_DS, rsp = 0, eflags = 1<<9 (interrupts
 *   on), cs = __KERNEL_CS, rip = \child_rip, orig rax = 0.
 *   Zeroes %rax (used as the source of the two zero slots).
 */
	.macro FAKE_STACK_FRAME child_rip
	/* push in order ss, rsp, eflags, cs, rip */
	xorl %eax, %eax
	pushq $__KERNEL_DS /* ss */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	ss,0*/
	pushq %rax /* rsp */
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET	rsp,0
	pushq $(1<<9) /* eflags - interrupts on */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	rflags,0*/
	pushq $__KERNEL_CS /* cs */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	cs,0*/
	pushq \child_rip /* rip */
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET	rip,0
	pushq	%rax /* orig rax */
	CFI_ADJUST_CFA_OFFSET	8
	.endm
230
/*
 * UNFAKE_STACK_FRAME
 *   Drops the six quadwords pushed by FAKE_STACK_FRAME.
 */
	.macro UNFAKE_STACK_FRAME
	addq $8*6, %rsp
	CFI_ADJUST_CFA_OFFSET	-(6*8)
	.endm
235
/*
 * CFI_DEFAULT_STACK start=1
 *   Unwind annotations for a full register frame located at %rsp.
 *   With start != 0 a new "simple" signal-frame CFI procedure is opened
 *   and the CFA is defined as %rsp + SS+8; with start == 0 only the CFA
 *   offset of the already open procedure is reset to SS+8.
 *   Either way every general register, rip and rsp are then described at
 *   their frame offsets.  Generates no instructions.
 */
	.macro	CFI_DEFAULT_STACK start=1
	.if \start
	CFI_STARTPROC	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,SS+8
	.else
	CFI_DEF_CFA_OFFSET SS+8
	.endif
	CFI_REL_OFFSET	r15,R15
	CFI_REL_OFFSET	r14,R14
	CFI_REL_OFFSET	r13,R13
	CFI_REL_OFFSET	r12,R12
	CFI_REL_OFFSET	rbp,RBP
	CFI_REL_OFFSET	rbx,RBX
	CFI_REL_OFFSET	r11,R11
	CFI_REL_OFFSET	r10,R10
	CFI_REL_OFFSET	r9,R9
	CFI_REL_OFFSET	r8,R8
	CFI_REL_OFFSET	rax,RAX
	CFI_REL_OFFSET	rcx,RCX
	CFI_REL_OFFSET	rdx,RDX
	CFI_REL_OFFSET	rsi,RSI
	CFI_REL_OFFSET	rdi,RDI
	CFI_REL_OFFSET	rip,RIP
	/*CFI_REL_OFFSET	cs,CS*/
	/*CFI_REL_OFFSET	rflags,EFLAGS*/
	CFI_REL_OFFSET	rsp,RSP
	/*CFI_REL_OFFSET	ss,SS*/
	.endm
/*
 * A newly forked process directly context switches into this.
 *
 * Resets EFLAGS from kernel_eflags, calls schedule_tail, runs
 * syscall_trace_leave when _TIF_SYSCALL_TRACE or _TIF_SYSCALL_AUDIT is
 * set, and then leaves through one of the syscall return paths:
 *  - int_ret_from_sys_call when the saved CS has RPL 0 or the thread has
 *    _TIF_IA32 set,
 *  - ret_from_sys_call (after RESTORE_TOP_OF_STACK) otherwise.
 */
/* rdi:	prev */
ENTRY(ret_from_fork)
	CFI_DEFAULT_STACK
	/*
	 * In 64-bit mode push and popf each move %rsp by 8 bytes, so the
	 * CFA has to be adjusted by 8 (not 4) to stay correct in between.
	 */
	push kernel_eflags(%rip)
	CFI_ADJUST_CFA_OFFSET 8
	popf				# reset kernel eflags
	CFI_ADJUST_CFA_OFFSET -8
	call schedule_tail
	GET_THREAD_INFO(%rcx)
	testl $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT),TI_flags(%rcx)
	jnz rff_trace
rff_action:
	RESTORE_REST
	testl $3,CS-ARGOFFSET(%rsp)	# from kernel_thread?
	je   int_ret_from_sys_call
	testl $_TIF_IA32,TI_flags(%rcx)
	jnz  int_ret_from_sys_call
	RESTORE_TOP_OF_STACK %rdi,ARGOFFSET
	jmp ret_from_sys_call
rff_trace:
	movq %rsp,%rdi			# &pt_regs -> arg1
	call syscall_trace_leave
	GET_THREAD_INFO(%rcx)		# reload %rcx after the call
	jmp rff_action
	CFI_ENDPROC
END(ret_from_fork)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294
/*
 * System call entry. Up to 6 arguments in registers are supported.
 *
 * SYSCALL does not save anything on the stack and does not change the
 * stack pointer.
 */

/*
 * Register setup:
 * rax  system call number
 * rdi  arg0
 * rcx  return address for syscall/sysret, C arg3
 * rsi  arg1
 * rdx  arg2
 * r10  arg3 	(--> moved to rcx for C)
 * r8   arg4
 * r9   arg5
 * r11  eflags for syscall/sysret, temporary for C
 * r12-r15,rbp,rbx saved by C code, not touched.
 *
 * Interrupts are off on entry.
 * Only called from user space.
 *
 * XXX	if we had a free scratch register we could save the RSP into the stack frame
 *      and report it properly in ps. Unfortunately we haven't.
 *
 * When user can change the frames always force IRET. That is because
 * it deals with uncanonical addresses better. SYSRET has trouble
 * with them due to bugs in both AMD and Intel CPUs.
 */

ENTRY(system_call)
	CFI_STARTPROC	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,PDA_STACKOFFSET
	CFI_REGISTER	rip,rcx
	/*CFI_REGISTER	rflags,r11*/
	SWAPGS_UNSAFE_STACK
	/*
	 * A hypervisor implementation might want to use a label
	 * after the swapgs, so that it can do the swapgs
	 * for the guest and jump here on syscall.
	 */
ENTRY(system_call_after_swapgs)

	/* stash the user stack pointer and switch to the kernel stack */
	movq	%rsp,%gs:pda_oldrsp
	movq	%gs:pda_kernelstack,%rsp
	/*
	 * No need to follow this irqs off/on section - it's straight
	 * and short:
	 */
	ENABLE_INTERRUPTS(CLBR_NONE)
	SAVE_ARGS 8,1
	movq  %rax,ORIG_RAX-ARGOFFSET(%rsp)
	movq  %rcx,RIP-ARGOFFSET(%rsp)
	CFI_REL_OFFSET rip,RIP-ARGOFFSET
	GET_THREAD_INFO(%rcx)
	testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags(%rcx)
	jnz tracesys
	cmpq $__NR_syscall_max,%rax
	ja badsys
	movq %r10,%rcx			/* arg3: r10 -> rcx for C */
	call *sys_call_table(,%rax,8)  # XXX:	 rip relative
	movq %rax,RAX-ARGOFFSET(%rsp)
/*
 * Syscall return path ending with SYSRET (fast path)
 * Has incomplete stack frame and undefined top of stack.
 */
ret_from_sys_call:
	movl $_TIF_ALLWORK_MASK,%edi
	/* edi:	flagmask */
sysret_check:
	LOCKDEP_SYS_EXIT
	GET_THREAD_INFO(%rcx)
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	movl TI_flags(%rcx),%edx
	andl %edi,%edx
	jnz  sysret_careful
	CFI_REMEMBER_STATE
	/*
	 * sysretq will re-enable interrupts:
	 */
	TRACE_IRQS_ON
	movq RIP-ARGOFFSET(%rsp),%rcx
	CFI_REGISTER	rip,rcx
	RESTORE_ARGS 0,-ARG_SKIP,1
	/*CFI_REGISTER	rflags,r11*/
	movq	%gs:pda_oldrsp, %rsp
	USERGS_SYSRET64

	CFI_RESTORE_STATE
	/* Handle reschedules */
	/* edx:	work, edi: workmask */
sysret_careful:
	bt $TIF_NEED_RESCHED,%edx
	jnc sysret_signal
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	pushq %rdi			/* keep the work mask across schedule */
	CFI_ADJUST_CFA_OFFSET 8
	call schedule
	popq  %rdi
	CFI_ADJUST_CFA_OFFSET -8
	jmp sysret_check

	/* Handle a signal */
sysret_signal:
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	/* edx:	work flags (arg3) */
	leaq do_notify_resume(%rip),%rax
	leaq -ARGOFFSET(%rsp),%rdi # &pt_regs -> arg1
	xorl %esi,%esi # oldset -> arg2
	call ptregscall_common
	movl $_TIF_WORK_MASK,%edi
	/* Use IRET because user could have changed frame. This
	   works because ptregscall_common has called FIXUP_TOP_OF_STACK. */
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp int_with_check

badsys:
	movq $-ENOSYS,RAX-ARGOFFSET(%rsp)
	jmp ret_from_sys_call

	/* Do syscall tracing */
tracesys:
	SAVE_REST
	movq $-ENOSYS,RAX(%rsp) /* ptrace can change this for a bad syscall */
	FIXUP_TOP_OF_STACK %rdi
	movq %rsp,%rdi
	call syscall_trace_enter
	/*
	 * Reload arg registers from stack in case ptrace changed them.
	 * We don't reload %rax because syscall_trace_enter() returned
	 * the value it wants us to use in the table lookup.
	 */
	LOAD_ARGS ARGOFFSET, 1
	RESTORE_REST
	cmpq $__NR_syscall_max,%rax
	ja   int_ret_from_sys_call	/* RAX(%rsp) set to -ENOSYS above */
	movq %r10,%rcx	/* fixup for C */
	call *sys_call_table(,%rax,8)
	movq %rax,RAX-ARGOFFSET(%rsp)
	/* Use IRET because user could have changed frame */

/*
 * Syscall return path ending with IRET.
 * Has correct top of stack, but partial stack frame.
 */
	.globl int_ret_from_sys_call
int_ret_from_sys_call:
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	testl $3,CS-ARGOFFSET(%rsp)
	je retint_restore_args
	movl $_TIF_ALLWORK_MASK,%edi
	/* edi:	mask to check */
int_with_check:
	LOCKDEP_SYS_EXIT_IRQ
	GET_THREAD_INFO(%rcx)
	movl TI_flags(%rcx),%edx
	andl %edi,%edx
	jnz   int_careful
	andl    $~TS_COMPAT,TI_status(%rcx)
	jmp   retint_swapgs

	/* Either reschedule or signal or syscall exit tracking needed. */
	/* First do a reschedule test. */
	/* edx:	work, edi: workmask */
int_careful:
	bt $TIF_NEED_RESCHED,%edx
	jnc  int_very_careful
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	pushq %rdi			/* keep the work mask across schedule */
	CFI_ADJUST_CFA_OFFSET 8
	call schedule
	popq %rdi
	CFI_ADJUST_CFA_OFFSET -8
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp int_with_check

	/* handle signals and tracing -- both require a full stack frame */
int_very_careful:
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	SAVE_REST
	/* Check for syscall exit trace */
	testl $_TIF_WORK_SYSCALL_EXIT,%edx
	jz int_signal
	pushq %rdi
	CFI_ADJUST_CFA_OFFSET 8
	leaq 8(%rsp),%rdi	# &ptregs -> arg1
	call syscall_trace_leave
	popq %rdi
	CFI_ADJUST_CFA_OFFSET -8
	/* drop the exit-work and emulation bits from the mask for the re-check */
	andl $~(_TIF_WORK_SYSCALL_EXIT|_TIF_SYSCALL_EMU),%edi
	jmp int_restore_rest

int_signal:
	testl $_TIF_DO_NOTIFY_MASK,%edx
	jz 1f
	movq %rsp,%rdi		# &ptregs -> arg1
	xorl %esi,%esi		# oldset -> arg2
	call do_notify_resume
1:	movl $_TIF_WORK_MASK,%edi
int_restore_rest:
	RESTORE_REST
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp int_with_check
	CFI_ENDPROC
END(system_call)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511
/*
 * Certain special system calls that need to save a complete full stack frame.
 *
 * PTREGSCALL label,func,arg
 *   Defines the global stub \label, which loads the address of \func
 *   into %rax, points \arg at the register frame (-ARGOFFSET+8 from
 *   %rsp; the 8 skips the stub's own return address) and jumps to
 *   ptregscall_common.
 */

	.macro PTREGSCALL label,func,arg
	.globl \label
\label:
	leaq	\func(%rip),%rax
	leaq    -ARGOFFSET+8(%rsp),\arg /* 8 for return address */
	jmp	ptregscall_common
END(\label)
	.endm
524
/*
 * Stubs generated with PTREGSCALL, followed by their shared tail.
 * One CFI procedure spans the stubs and ptregscall_common.
 */
	CFI_STARTPROC

	PTREGSCALL stub_clone, sys_clone, %r8
	PTREGSCALL stub_fork, sys_fork, %rdi
	PTREGSCALL stub_vfork, sys_vfork, %rdi
	PTREGSCALL stub_sigaltstack, sys_sigaltstack, %rdx
	PTREGSCALL stub_iopl, sys_iopl, %rsi

/*
 * ptregscall_common
 *   In:  %rax = address of the function to call; argument registers
 *        already set up by the caller.
 *   Pops its own return address, completes the register frame with
 *   SAVE_REST and FIXUP_TOP_OF_STACK, calls *%rax, then undoes both and
 *   returns to the popped address.  The return address is parked in
 *   %r15 across the call; %r11 is used as scratch.
 */
ENTRY(ptregscall_common)
	popq %r11			/* return address */
	CFI_ADJUST_CFA_OFFSET -8
	CFI_REGISTER rip, r11
	SAVE_REST
	movq %r11, %r15			/* keep it across the call */
	CFI_REGISTER rip, r15
	FIXUP_TOP_OF_STACK %r11
	call *%rax
	RESTORE_TOP_OF_STACK %r11
	movq %r15, %r11
	CFI_REGISTER rip, r11
	RESTORE_REST
	pushq %r11			/* put the return address back for ret */
	CFI_ADJUST_CFA_OFFSET 8
	CFI_REL_OFFSET rip, 0
	ret
	CFI_ENDPROC
END(ptregscall_common)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700552
/*
 * stub_execve
 *   Discards its return address (popped into %r11), builds a full frame
 *   with SAVE_REST and FIXUP_TOP_OF_STACK, and calls sys_execve with the
 *   frame address in %rcx.  The result is stored in the frame's RAX slot
 *   and the stub leaves through int_ret_from_sys_call.
 */
ENTRY(stub_execve)
	CFI_STARTPROC
	popq %r11
	CFI_ADJUST_CFA_OFFSET -8
	CFI_REGISTER rip, r11
	SAVE_REST
	FIXUP_TOP_OF_STACK %r11
	movq %rsp, %rcx			/* frame address -> 4th C argument */
	call sys_execve
	RESTORE_TOP_OF_STACK %r11
	movq %rax,RAX(%rsp)
	RESTORE_REST
	jmp int_ret_from_sys_call
	CFI_ENDPROC
END(stub_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568
/*
 * sigreturn is special because it needs to restore all registers on return.
 * This cannot be done with SYSRET, so use the IRET return path instead.
 *
 * The stub drops its return address, builds a full frame, calls
 * sys_rt_sigreturn with the frame address in %rdi, stores the result in
 * the frame's RAX slot and leaves through int_ret_from_sys_call.
 */
ENTRY(stub_rt_sigreturn)
	CFI_STARTPROC
	addq $8, %rsp			/* drop the return address */
	CFI_ADJUST_CFA_OFFSET	-8
	SAVE_REST
	movq %rsp,%rdi
	FIXUP_TOP_OF_STACK %r11
	call sys_rt_sigreturn
	movq %rax,RAX(%rsp) # fixme, this could be done at the higher layer
	RESTORE_REST
	jmp int_ret_from_sys_call
	CFI_ENDPROC
END(stub_rt_sigreturn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586
/*
 * initial frame state for interrupts and exceptions
 *
 * _frame ref
 *   Opens a "simple" signal-frame CFI procedure whose CFA is
 *   %rsp + SS+8-\ref and records where rsp and rip are saved, with all
 *   offsets taken relative to the frame slot \ref that %rsp points at.
 *   Generates no instructions.
 */
	.macro _frame ref
	CFI_STARTPROC simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA rsp,SS+8-\ref
	/*CFI_REL_OFFSET ss,SS-\ref*/
	CFI_REL_OFFSET rsp,RSP-\ref
	/*CFI_REL_OFFSET rflags,EFLAGS-\ref*/
	/*CFI_REL_OFFSET cs,CS-\ref*/
	CFI_REL_OFFSET rip,RIP-\ref
	.endm

/* initial frame state for interrupts (and exceptions without error code) */
#define INTR_FRAME _frame RIP
/* initial frame state for exceptions with error code (and interrupts with
   vector already pushed) */
#define XCPT_FRAME _frame ORIG_RAX
606
/*
 * Interrupt entry/exit.
 *
 * Interrupt entry points save only callee clobbered registers in fast path.
 *
 * Entry runs with interrupts off.
 *
 * interrupt func
 *   Saves the argument registers, sets up %rbp as a frame pointer, does
 *   SWAPGS when the saved CS has a non-zero RPL, bumps pda_irqcount
 *   (switching %rsp to pda_irqstackptr when the count becomes zero) and
 *   calls \func with %rdi pointing ARGOFFSET bytes below the saved
 *   registers.
 */

/* 0(%rsp): interrupt number */
	.macro interrupt func
	cld
	SAVE_ARGS
	leaq -ARGOFFSET(%rsp),%rdi	# arg1 for handler
	pushq %rbp
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET		rbp, 0
	movq %rsp,%rbp
	CFI_DEF_CFA_REGISTER	rbp
	testl $3,CS(%rdi)
	je 1f
	SWAPGS
	/* irqcount is used to check if a CPU is already on an interrupt
	   stack or not. While this is essentially redundant with preempt_count
	   it is a little cheaper to use a separate counter in the PDA
	   (short of moving irq_enter into assembly, which would be too
	    much work) */
1:	incl	%gs:pda_irqcount
	/* ZF comes from the incl above: switch stacks only when the count hit zero */
	cmoveq %gs:pda_irqstackptr,%rsp
	push    %rbp			# backlink for old unwinder
	/*
	 * We entered an interrupt context - irqs are off:
	 */
	TRACE_IRQS_OFF
	call \func
	.endm
642
/*
 * common_interrupt
 *   Runs do_IRQ through the interrupt macro, then takes the interrupt
 *   return path starting at ret_from_intr.  When the saved CS has RPL 0
 *   the return goes through retint_kernel; otherwise pending work flags
 *   (reschedule, signal notification) are handled with interrupts
 *   re-enabled before finally returning with INTERRUPT_RETURN.
 */
ENTRY(common_interrupt)
	XCPT_FRAME
	interrupt do_IRQ
	/* 0(%rsp): oldrsp-ARGOFFSET */
ret_from_intr:
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	decl %gs:pda_irqcount
	leaveq				/* %rsp = %rbp, pop %rbp: undo the frame set up by "interrupt" */
	CFI_DEF_CFA_REGISTER	rsp
	CFI_ADJUST_CFA_OFFSET	-8
exit_intr:
	GET_THREAD_INFO(%rcx)
	testl $3,CS-ARGOFFSET(%rsp)
	je retint_kernel

	/* Interrupt came from user space */
	/*
	 * Has a correct top of stack, but a partial stack frame
	 * %rcx: thread info. Interrupts off.
	 */
retint_with_reschedule:
	movl $_TIF_WORK_MASK,%edi
retint_check:
	LOCKDEP_SYS_EXIT_IRQ
	movl TI_flags(%rcx),%edx
	andl %edi,%edx
	CFI_REMEMBER_STATE
	jnz  retint_careful

retint_swapgs:		/* return to user-space */
	/*
	 * The iretq could re-enable interrupts:
	 */
	DISABLE_INTERRUPTS(CLBR_ANY)
	TRACE_IRQS_IRETQ
	SWAPGS
	jmp restore_args

retint_restore_args:	/* return to kernel space */
	DISABLE_INTERRUPTS(CLBR_ANY)
	/*
	 * The iretq could re-enable interrupts:
	 */
	TRACE_IRQS_IRETQ
restore_args:
	RESTORE_ARGS 0,8,0

irq_return:
	INTERRUPT_RETURN

	/* a fault at irq_return is redirected to bad_iret */
	.section __ex_table, "a"
	.quad irq_return, bad_iret
	.previous

#ifdef CONFIG_PARAVIRT
ENTRY(native_iret)
	iretq

	.section __ex_table,"a"
	.quad native_iret, bad_iret
	.previous
#endif

	.section .fixup,"ax"
bad_iret:
	/*
	 * The iret traps when the %cs or %ss being restored is bogus.
	 * We've lost the original trap vector and error code.
	 * #GPF is the most likely one to get for an invalid selector.
	 * So pretend we completed the iret and took the #GPF in user mode.
	 *
	 * We are now running with the kernel GS after exception recovery.
	 * But error_entry expects us to have user GS to match the user %cs,
	 * so swap back.
	 */
	pushq $0			/* error code slot, see the note above */

	SWAPGS
	jmp general_protection

	.previous

	/* edi: workmask, edx: work */
retint_careful:
	CFI_RESTORE_STATE
	bt    $TIF_NEED_RESCHED,%edx
	jnc   retint_signal
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	pushq %rdi			/* keep the work mask across schedule */
	CFI_ADJUST_CFA_OFFSET	8
	call  schedule
	popq %rdi
	CFI_ADJUST_CFA_OFFSET	-8
	GET_THREAD_INFO(%rcx)
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	jmp retint_check

retint_signal:
	testl $_TIF_DO_NOTIFY_MASK,%edx
	jz    retint_swapgs
	TRACE_IRQS_ON
	ENABLE_INTERRUPTS(CLBR_NONE)
	SAVE_REST
	movq $-1,ORIG_RAX(%rsp)
	xorl %esi,%esi		# oldset
	movq %rsp,%rdi		# &pt_regs
	call do_notify_resume
	RESTORE_REST
	DISABLE_INTERRUPTS(CLBR_NONE)
	TRACE_IRQS_OFF
	GET_THREAD_INFO(%rcx)
	jmp retint_with_reschedule

#ifdef CONFIG_PREEMPT
	/* Returning to kernel space. Check if we need preemption */
	/* rcx:	 threadinfo. interrupts off. */
ENTRY(retint_kernel)
	cmpl $0,TI_preempt_count(%rcx)
	jnz  retint_restore_args
	bt  $TIF_NEED_RESCHED,TI_flags(%rcx)
	jnc  retint_restore_args
	bt   $9,EFLAGS-ARGOFFSET(%rsp)	/* interrupts off? */
	jnc  retint_restore_args
	call preempt_schedule_irq
	jmp exit_intr
#endif

	CFI_ENDPROC
END(common_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775
776/*
777 * APIC interrupts.
778 */
/*
 * apicinterrupt num,func - common body of the APIC interrupt entry points.
 *   num:  vector number; its bitwise complement (~num) is pushed on the
 *         stack before the `interrupt` macro runs.
 *   func: name handed to the `interrupt` macro (defined outside this part
 *         of the file; presumably it saves registers and calls func -
 *         TODO confirm).
 * Every expansion leaves through ret_from_intr.
 */
779 .macro apicinterrupt num,func
Jan Beulich7effaa82005-09-12 18:49:24 +0200780 INTR_FRAME
Rusty Russell19eadf92006-06-27 02:53:44 -0700781 pushq $~(\num)
Jan Beulich7effaa82005-09-12 18:49:24 +0200782 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700783 interrupt \func
784 jmp ret_from_intr
785 CFI_ENDPROC
786 .endm
787
788ENTRY(thermal_interrupt)
789 apicinterrupt THERMAL_APIC_VECTOR,smp_thermal_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200790END(thermal_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700791
Jacob Shin89b831e2005-11-05 17:25:53 +0100792ENTRY(threshold_interrupt)
793 apicinterrupt THRESHOLD_APIC_VECTOR,mce_threshold_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200794END(threshold_interrupt)
Jacob Shin89b831e2005-11-05 17:25:53 +0100795
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796#ifdef CONFIG_SMP
797ENTRY(reschedule_interrupt)
798 apicinterrupt RESCHEDULE_VECTOR,smp_reschedule_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200799END(reschedule_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700800
Andi Kleene5bc8b62005-09-12 18:49:24 +0200801 .macro INVALIDATE_ENTRY num
802ENTRY(invalidate_interrupt\num)
803 apicinterrupt INVALIDATE_TLB_VECTOR_START+\num,smp_invalidate_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200804END(invalidate_interrupt\num)
Andi Kleene5bc8b62005-09-12 18:49:24 +0200805 .endm
806
807 INVALIDATE_ENTRY 0
808 INVALIDATE_ENTRY 1
809 INVALIDATE_ENTRY 2
810 INVALIDATE_ENTRY 3
811 INVALIDATE_ENTRY 4
812 INVALIDATE_ENTRY 5
813 INVALIDATE_ENTRY 6
814 INVALIDATE_ENTRY 7
Linus Torvalds1da177e2005-04-16 15:20:36 -0700815
816ENTRY(call_function_interrupt)
817 apicinterrupt CALL_FUNCTION_VECTOR,smp_call_function_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200818END(call_function_interrupt)
Jens Axboe3b16cf82008-06-26 11:21:54 +0200819ENTRY(call_function_single_interrupt)
820 apicinterrupt CALL_FUNCTION_SINGLE_VECTOR,smp_call_function_single_interrupt
821END(call_function_single_interrupt)
Eric W. Biederman61014292007-02-23 04:40:58 -0700822ENTRY(irq_move_cleanup_interrupt)
823 apicinterrupt IRQ_MOVE_CLEANUP_VECTOR,smp_irq_move_cleanup_interrupt
824END(irq_move_cleanup_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700825#endif
826
Linus Torvalds1da177e2005-04-16 15:20:36 -0700827ENTRY(apic_timer_interrupt)
828 apicinterrupt LOCAL_TIMER_VECTOR,smp_apic_timer_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200829END(apic_timer_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700830
Cliff Wickman18129242008-06-02 08:56:14 -0500831ENTRY(uv_bau_message_intr1)
832 apicinterrupt 220,uv_bau_message_interrupt
833END(uv_bau_message_intr1)
834
Linus Torvalds1da177e2005-04-16 15:20:36 -0700835ENTRY(error_interrupt)
836 apicinterrupt ERROR_APIC_VECTOR,smp_error_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200837END(error_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700838
839ENTRY(spurious_interrupt)
840 apicinterrupt SPURIOUS_APIC_VECTOR,smp_spurious_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200841END(spurious_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842
843/*
844 * Exception entry points.
845 */
/*
 * zeroentry sym - entry stub for exceptions where this stub itself supplies
 * the error-code slot (it pushes 0).
 *   sym: handler whose address is loaded into %rax.
 * The interrupted %rax is pushed into the slot that error_entry treats as
 * the "rdi slot", then control is transferred to error_entry, which
 * expects the handler address in %rax.
 */
846 .macro zeroentry sym
Jan Beulich7effaa82005-09-12 18:49:24 +0200847 INTR_FRAME
Jeremy Fitzhardingefab58422008-06-25 00:19:31 -0400848 PARAVIRT_ADJUST_EXCEPTION_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -0700849 pushq $0 /* push error code/oldrax */
Jan Beulich7effaa82005-09-12 18:49:24 +0200850 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700851 pushq %rax /* push real oldrax to the rdi slot */
Jan Beulich7effaa82005-09-12 18:49:24 +0200852 CFI_ADJUST_CFA_OFFSET 8
Jan Beulich37550902007-05-02 19:27:05 +0200853 CFI_REL_OFFSET rax,0
/* %rax was saved above, so it is free to carry the handler address */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700854 leaq \sym(%rip),%rax
855 jmp error_entry
Jan Beulich7effaa82005-09-12 18:49:24 +0200856 CFI_ENDPROC
Linus Torvalds1da177e2005-04-16 15:20:36 -0700857 .endm
858
/*
 * errorentry sym - entry stub for exceptions where the error-code slot is
 * already on the stack when the stub starts (unlike zeroentry, nothing is
 * pushed in its place here; presumably the CPU pushed it - TODO confirm).
 *   sym: handler whose address is loaded into %rax.
 * The interrupted %rax is pushed into the slot that error_entry treats as
 * the "rdi slot", then control is transferred to error_entry.
 */
859 .macro errorentry sym
Jan Beulich7effaa82005-09-12 18:49:24 +0200860 XCPT_FRAME
Jeremy Fitzhardingefab58422008-06-25 00:19:31 -0400861 PARAVIRT_ADJUST_EXCEPTION_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -0700862 pushq %rax
Jan Beulich7effaa82005-09-12 18:49:24 +0200863 CFI_ADJUST_CFA_OFFSET 8
Jan Beulich37550902007-05-02 19:27:05 +0200864 CFI_REL_OFFSET rax,0
/* %rax was saved above, so it is free to carry the handler address */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700865 leaq \sym(%rip),%rax
866 jmp error_entry
Jan Beulich7effaa82005-09-12 18:49:24 +0200867 CFI_ENDPROC
Linus Torvalds1da177e2005-04-16 15:20:36 -0700868 .endm
869
870 /* error code is on the stack already */
871 /* handle NMI like exceptions that can happen everywhere */
/*
 * paranoidentry sym, ist=0, irqtrace=1
 *   sym:      C handler; called with %rdi = %rsp (the saved register frame)
 *             and %rsi = the value read from the ORIG_RAX slot.
 *   ist:      when non-zero, the (ist - 1)-th TSS_ist entry of
 *             per_cpu__init_tss is lowered by EXCEPTION_STKSZ for the
 *             duration of the call and raised again afterwards.
 *   irqtrace: when non-zero, TRACE_IRQS_OFF is emitted after interrupts
 *             are disabled at the end.
 * On exit %ebx is the "no swapgs" flag consumed by paranoidexit:
 * 1 = no SWAPGS was done here, 0 = SWAPGS was done and must be undone.
 */
Ingo Molnar2601e642006-07-03 00:24:45 -0700872 .macro paranoidentry sym, ist=0, irqtrace=1
Linus Torvalds1da177e2005-04-16 15:20:36 -0700873 SAVE_ALL
874 cld
/* start with ebx = 1 (no SWAPGS performed) */
875 movl $1,%ebx
/* rdmsr returns the MSR selected by %ecx in %edx:%eax; only the sign of the high half is tested */
876 movl $MSR_GS_BASE,%ecx
877 rdmsr
878 testl %edx,%edx
/* sign bit set: skip SWAPGS (presumably the GS base is already the kernel one - TODO confirm) */
879 js 1f
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100880 SWAPGS
Linus Torvalds1da177e2005-04-16 15:20:36 -0700881 xorl %ebx,%ebx
Jan Beulichb556b352006-01-11 22:43:00 +01008821:
883 .if \ist
/* %rbp = pda_data_offset, used below as the base for addressing per_cpu__init_tss */
884 movq %gs:pda_data_offset, %rbp
885 .endif
/* arg1 = pointer to the saved registers, arg2 = ORIG_RAX slot; the slot is then overwritten with -1 */
886 movq %rsp,%rdi
Linus Torvalds1da177e2005-04-16 15:20:36 -0700887 movq ORIG_RAX(%rsp),%rsi
888 movq $-1,ORIG_RAX(%rsp)
Jan Beulichb556b352006-01-11 22:43:00 +0100889 .if \ist
Andi Kleen5f8efbb2006-01-16 01:56:39 +0100890 subq $EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
Jan Beulichb556b352006-01-11 22:43:00 +0100891 .endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700892 call \sym
Jan Beulichb556b352006-01-11 22:43:00 +0100893 .if \ist
Andi Kleen5f8efbb2006-01-16 01:56:39 +0100894 addq $EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
Jan Beulichb556b352006-01-11 22:43:00 +0100895 .endif
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100896 DISABLE_INTERRUPTS(CLBR_NONE)
Ingo Molnar2601e642006-07-03 00:24:45 -0700897 .if \irqtrace
898 TRACE_IRQS_OFF
899 .endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700900 .endm
Ingo Molnar2601e642006-07-03 00:24:45 -0700901
902 /*
903 * "Paranoid" exit path from exception stack.
904 * Paranoid because this is used by NMIs and cannot take
905 * any kernel state for granted.
906 * We don't do kernel preemption checks here, because only
907 * NMI should be common and it does not enable IRQs and
908 * cannot get reschedule ticks.
909 *
910 * "trace" is 0 for the NMI handler only, because irq-tracing
911 * is fundamentally NMI-unsafe. (we cannot change the soft and
912 * hard flags at once, atomically)
913 */
/*
 * paranoidexit trace=1 - emits the exit path paired with paranoidentry.
 *   trace: appended to every label (paranoid_exit1, paranoid_exit0, ...)
 *          and, when non-zero, enables the TRACE_IRQS_* annotations.
 * In: %ebx = "no swapgs" flag left by paranoidentry.
 * The macro body ends with CFI_ENDPROC, so the expansion site must not
 * add its own.
 */
914 .macro paranoidexit trace=1
915 /* ebx: no swapgs flag */
916paranoid_exit\trace:
917 testl %ebx,%ebx /* swapgs needed? */
918 jnz paranoid_restore\trace
/* low two bits of the saved CS non-zero: take the user-space work path */
919 testl $3,CS(%rsp)
920 jnz paranoid_userspace\trace
921paranoid_swapgs\trace:
Andi Kleen7a0a2df2006-09-26 10:52:37 +0200922 .if \trace
Ingo Molnar2601e642006-07-03 00:24:45 -0700923 TRACE_IRQS_IRETQ 0
Andi Kleen7a0a2df2006-09-26 10:52:37 +0200924 .endif
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100925 SWAPGS_UNSAFE_STACK
Ingo Molnar2601e642006-07-03 00:24:45 -0700926paranoid_restore\trace:
927 RESTORE_ALL 8
Ingo Molnar3701d8632008-02-09 23:24:08 +0100928 jmp irq_return
Ingo Molnar2601e642006-07-03 00:24:45 -0700929paranoid_userspace\trace:
/* %ebx is reused from here on: it now holds the pending work bits (TI_flags & _TIF_WORK_MASK) */
930 GET_THREAD_INFO(%rcx)
Glauber Costa26ccb8a2008-06-24 11:19:35 -0300931 movl TI_flags(%rcx),%ebx
Ingo Molnar2601e642006-07-03 00:24:45 -0700932 andl $_TIF_WORK_MASK,%ebx
/* no work pending: go back and finish the exit with SWAPGS */
933 jz paranoid_swapgs\trace
934 movq %rsp,%rdi /* &pt_regs */
935 call sync_regs
936 movq %rax,%rsp /* switch stack for scheduling */
937 testl $_TIF_NEED_RESCHED,%ebx
938 jnz paranoid_schedule\trace
939 movl %ebx,%edx /* arg3: thread flags */
940 .if \trace
941 TRACE_IRQS_ON
942 .endif
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100943 ENABLE_INTERRUPTS(CLBR_NONE)
Ingo Molnar2601e642006-07-03 00:24:45 -0700944 xorl %esi,%esi /* arg2: oldset */
945 movq %rsp,%rdi /* arg1: &pt_regs */
946 call do_notify_resume
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100947 DISABLE_INTERRUPTS(CLBR_NONE)
Ingo Molnar2601e642006-07-03 00:24:45 -0700948 .if \trace
949 TRACE_IRQS_OFF
950 .endif
/* loop: re-read the thread flags until no work bits remain */
951 jmp paranoid_userspace\trace
952paranoid_schedule\trace:
953 .if \trace
954 TRACE_IRQS_ON
955 .endif
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100956 ENABLE_INTERRUPTS(CLBR_ANY)
Ingo Molnar2601e642006-07-03 00:24:45 -0700957 call schedule
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +0100958 DISABLE_INTERRUPTS(CLBR_ANY)
Ingo Molnar2601e642006-07-03 00:24:45 -0700959 .if \trace
960 TRACE_IRQS_OFF
961 .endif
962 jmp paranoid_userspace\trace
963 CFI_ENDPROC
964 .endm
965
Linus Torvalds1da177e2005-04-16 15:20:36 -0700966/*
967 * Exception entry point. This expects an error code/orig_rax on the stack
968 * and the exception handler in %rax.
969 */
/*
 * error_entry - common continuation of the zeroentry/errorentry stubs.
 * In:  %rax = address of the handler to call;
 *      top of stack = interrupted %rax (sitting in the "rdi slot"),
 *      next slot    = error code (ORIG_RAX).
 * The handler is called with %rdi = %rsp (the saved register frame) and
 * %rsi = error code; the ORIG_RAX slot is overwritten with -1 first.
 * %ebx carries the "no swapgs" flag across the handler call:
 * 0 = the saved CS had its low two bits set, 1 = it did not.
 */
Prasanna S.Pd28c4392006-09-26 10:52:34 +0200970KPROBE_ENTRY(error_entry)
Jan Beulich7effaa82005-09-12 18:49:24 +0200971 _frame RDI
Jan Beulich37550902007-05-02 19:27:05 +0200972 CFI_REL_OFFSET rax,0
Linus Torvalds1da177e2005-04-16 15:20:36 -0700973 /* rdi slot contains rax, oldrax contains error code */
974 cld
/* reserve 14 slots below the rdi slot and fill them from the top down */
975 subq $14*8,%rsp
976 CFI_ADJUST_CFA_OFFSET (14*8)
977 movq %rsi,13*8(%rsp)
978 CFI_REL_OFFSET rsi,RSI
979 movq 14*8(%rsp),%rsi /* load rax from rdi slot */
Jan Beulich37550902007-05-02 19:27:05 +0200980 CFI_REGISTER rax,rsi
Linus Torvalds1da177e2005-04-16 15:20:36 -0700981 movq %rdx,12*8(%rsp)
982 CFI_REL_OFFSET rdx,RDX
983 movq %rcx,11*8(%rsp)
984 CFI_REL_OFFSET rcx,RCX
985 movq %rsi,10*8(%rsp) /* store rax */
986 CFI_REL_OFFSET rax,RAX
987 movq %r8, 9*8(%rsp)
988 CFI_REL_OFFSET r8,R8
989 movq %r9, 8*8(%rsp)
990 CFI_REL_OFFSET r9,R9
991 movq %r10,7*8(%rsp)
992 CFI_REL_OFFSET r10,R10
993 movq %r11,6*8(%rsp)
994 CFI_REL_OFFSET r11,R11
995 movq %rbx,5*8(%rsp)
996 CFI_REL_OFFSET rbx,RBX
997 movq %rbp,4*8(%rsp)
998 CFI_REL_OFFSET rbp,RBP
999 movq %r12,3*8(%rsp)
1000 CFI_REL_OFFSET r12,R12
1001 movq %r13,2*8(%rsp)
1002 CFI_REL_OFFSET r13,R13
1003 movq %r14,1*8(%rsp)
1004 CFI_REL_OFFSET r14,R14
1005 movq %r15,(%rsp)
1006 CFI_REL_OFFSET r15,R15
/* ebx = 0 unless error_kernelspace below raises it to 1 */
1007 xorl %ebx,%ebx
1008 testl $3,CS(%rsp)
1009 je error_kernelspace
1010error_swapgs:
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +01001011 SWAPGS
Linus Torvalds1da177e2005-04-16 15:20:36 -07001012error_sti:
/* %rdi is saved last: its slot held the interrupted %rax until it was copied out above */
1013 movq %rdi,RDI(%rsp)
Jan Beulich37550902007-05-02 19:27:05 +02001014 CFI_REL_OFFSET rdi,RDI
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015 movq %rsp,%rdi
1016 movq ORIG_RAX(%rsp),%rsi /* get error code */
1017 movq $-1,ORIG_RAX(%rsp)
1018 call *%rax
Peter Zijlstra10cd7062007-10-11 22:11:12 +02001019 /* ebx: no swapgs flag (1: don't need swapgs, 0: need it) */
1020error_exit:
/* copy the flag to %eax before RESTORE_REST runs (presumably it reloads %rbx - TODO confirm) */
1021 movl %ebx,%eax
Linus Torvalds1da177e2005-04-16 15:20:36 -07001022 RESTORE_REST
Glauber de Oliveira Costa72fe4852008-01-30 13:32:08 +01001023 DISABLE_INTERRUPTS(CLBR_NONE)
Ingo Molnar2601e642006-07-03 00:24:45 -07001024 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -07001025 GET_THREAD_INFO(%rcx)
1026 testl %eax,%eax
1027 jne retint_kernel
Peter Zijlstra10cd7062007-10-11 22:11:12 +02001028 LOCKDEP_SYS_EXIT_IRQ
/* edx = pending work bits, edi = work mask: the register contract of retint_careful */
Glauber Costa26ccb8a2008-06-24 11:19:35 -03001029 movl TI_flags(%rcx),%edx
Linus Torvalds1da177e2005-04-16 15:20:36 -07001030 movl $_TIF_WORK_MASK,%edi
1031 andl %edi,%edx
1032 jnz retint_careful
Peter Zijlstra10cd7062007-10-11 22:11:12 +02001033 jmp retint_swapgs
Linus Torvalds1da177e2005-04-16 15:20:36 -07001034 CFI_ENDPROC
1035
1036error_kernelspace:
1037 incl %ebx
1038 /* There are two places in the kernel that can potentially fault with
1039 usergs. Handle them here. The exception handlers after
1040 iret run with kernel gs again, so don't set the user space flag.
1041 B stepping K8s sometimes report a truncated RIP for IRET
1042 exceptions returning to compat mode. Check for these here too. */
/* the saved RIP is compared against irq_return, its low 32 bits, and gs_change */
Vegard Nossum9d8ad5d2008-06-27 17:22:17 +02001043 leaq irq_return(%rip),%rcx
1044 cmpq %rcx,RIP(%rsp)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001045 je error_swapgs
Vegard Nossum9d8ad5d2008-06-27 17:22:17 +02001046 movl %ecx,%ecx /* zero extend */
1047 cmpq %rcx,RIP(%rsp)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001048 je error_swapgs
1049 cmpq $gs_change,RIP(%rsp)
1050 je error_swapgs
1051 jmp error_sti
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001052KPROBE_END(error_entry)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053
/*
 * native_load_gs_index - reload the %gs selector with exception handling.
 *
 * In:    %edi = new selector
 * Clobb: %eax is zeroed on the fixup path (bad_gs)
 *
 * The flags are saved with pushf and restored with popf, so the
 * interrupt-enable state seen by the caller is unchanged on return.
 * SWAPGS is executed on both sides of the segment load.
 *
 * An exception at gs_change is redirected through the __ex_table entry
 * to bad_gs, which loads a null selector instead and resumes at 2:.
 */
ENTRY(native_load_gs_index)
	CFI_STARTPROC
	pushf
	CFI_ADJUST_CFA_OFFSET 8
	/*
	 * %edi still holds the new selector and is consumed at gs_change,
	 * so %rdi must be excluded from the clobber set: mask it out with
	 * AND.  ORing in ~(CLBR_RDI) would set every bit, CLBR_RDI included.
	 * NOTE(review): assumes the CLBR_* values are per-register bit flags
	 * naming what the DISABLE_INTERRUPTS expansion may clobber - confirm.
	 */
	DISABLE_INTERRUPTS(CLBR_ANY & ~(CLBR_RDI))
	SWAPGS
gs_change:
	movl %edi,%gs
2:	mfence		/* workaround */
	SWAPGS
	popf
	CFI_ADJUST_CFA_OFFSET -8
	ret
	CFI_ENDPROC
ENDPROC(native_load_gs_index)

	.section __ex_table,"a"
	.align 8
	.quad gs_change,bad_gs
	.previous
	.section .fixup,"ax"
	/* running with kernelgs */
bad_gs:
	SWAPGS			/* switch back to user gs */
	xorl %eax,%eax
	movl %eax,%gs
	jmp  2b
	.previous
1084
1085/*
1086 * Create a kernel thread.
1087 *
1088 * C extern interface:
1089 * extern long kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
1090 *
1091 * asm input arguments:
1092 * rdi: fn, rsi: arg, rdx: flags
1093 */
/*
 * kernel_thread: builds a fake stack frame whose return slot is child_rip,
 * saves all registers, and calls do_fork with
 *   %rdi = caller's flags ORed with kernel_thread_flags,
 *   %rsi = -1, %rdx = %rsp (the saved registers), %r8 = %r9 = 0.
 * The value do_fork returns is written to the RAX slot of the frame before
 * the registers are restored.
 */
1094ENTRY(kernel_thread)
1095 CFI_STARTPROC
1096 FAKE_STACK_FRAME $child_rip
1097 SAVE_ALL
1098
1099 # rdi: flags, rsi: usp, rdx: will be &pt_regs
1100 movq %rdx,%rdi
1101 orq kernel_thread_flags(%rip),%rdi
1102 movq $-1, %rsi
1103 movq %rsp, %rdx
1104
1105 xorl %r8d,%r8d
1106 xorl %r9d,%r9d
1107
1108 # clone now
1109 call do_fork
1110 movq %rax,RAX(%rsp)
1111 xorl %edi,%edi
1112
1113 /*
1114 * It isn't worth checking for a reschedule here,
1115 * so internally to the x86_64 port you can rely on kernel_thread()
1116 * not to reschedule the child before returning, this avoids the need
1117 * of hacks for example to fork off the per-CPU idle tasks.
1118 * [Hopefully no generic code relies on the reschedule -AK]
1119 */
1120 RESTORE_ALL
1121 UNFAKE_STACK_FRAME
1122 ret
1123 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001124ENDPROC(kernel_thread)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001125
/*
 * child_rip: the address kernel_thread places in its fake stack frame.
 * In:  %rdi = fn, %rsi = arg (as passed to kernel_thread).
 * Calls fn(arg), then passes the low 32 bits of its return value to
 * do_exit. No instruction follows the do_exit call.
 */
1126child_rip:
Andi Kleenc05991e2006-08-30 19:37:08 +02001127 pushq $0 # fake return address
1128 CFI_STARTPROC
Linus Torvalds1da177e2005-04-16 15:20:36 -07001129 /*
1130 * Here we are in the child and the registers are set as they were
1131 * at kernel_thread() invocation in the parent.
1132 */
/* move fn out of %rdi so that arg can become the first argument */
1133 movq %rdi, %rax
1134 movq %rsi, %rdi
1135 call *%rax
1136 # exit
Andrey Mirkin1c5b5cf2007-10-17 18:04:33 +02001137 mov %eax, %edi
Linus Torvalds1da177e2005-04-16 15:20:36 -07001138 call do_exit
Andi Kleenc05991e2006-08-30 19:37:08 +02001139 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001140ENDPROC(child_rip)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001141
1142/*
1143 * execve(). This function needs to use IRET, not SYSRET, to set up all state properly.
1144 *
1145 * C extern interface:
1146 * extern long execve(char *name, char **argv, char **envp)
1147 *
1148 * asm input arguments:
1149 * rdi: name, rsi: argv, rdx: envp
1150 *
1151 * We want to fallback into:
Ingo Molnar5d119b22008-02-26 12:55:57 +01001152 * extern long sys_execve(char *name, char **argv,char **envp, struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001153 *
1154 * sys_execve asm fallback arguments:
Ingo Molnar5d119b22008-02-26 12:55:57 +01001155 * rdi: name, rsi: argv, rdx: envp, rcx: fake frame on the stack
Linus Torvalds1da177e2005-04-16 15:20:36 -07001156 */
/*
 * kernel_execve: builds a fake stack frame, saves all registers and calls
 * sys_execve with the caller's %rdi/%rsi/%rdx untouched and %rcx = %rsp
 * (the saved registers). The result is stored in the RAX slot of the frame.
 *   result == 0: leave through int_ret_from_sys_call.
 *   result != 0: restore the argument registers, drop the fake frame and
 *                return to the caller.
 */
Arnd Bergmann3db03b42006-10-02 02:18:31 -07001157ENTRY(kernel_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158 CFI_STARTPROC
1159 FAKE_STACK_FRAME $0
1160 SAVE_ALL
Ingo Molnar5d119b22008-02-26 12:55:57 +01001161 movq %rsp,%rcx
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 call sys_execve
1163 movq %rax, RAX(%rsp)
1164 RESTORE_REST
1165 testq %rax,%rax
1166 je int_ret_from_sys_call
1167 RESTORE_ARGS
1168 UNFAKE_STACK_FRAME
1169 ret
1170 CFI_ENDPROC
Arnd Bergmann3db03b42006-10-02 02:18:31 -07001171ENDPROC(kernel_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001172
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001173KPROBE_ENTRY(page_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001174 errorentry do_page_fault
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001175KPROBE_END(page_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001176
1177ENTRY(coprocessor_error)
1178 zeroentry do_coprocessor_error
Jan Beulich4b787e02006-06-26 13:56:55 +02001179END(coprocessor_error)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001180
1181ENTRY(simd_coprocessor_error)
1182 zeroentry do_simd_coprocessor_error
Jan Beulich4b787e02006-06-26 13:56:55 +02001183END(simd_coprocessor_error)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001184
1185ENTRY(device_not_available)
1186 zeroentry math_state_restore
Jan Beulich4b787e02006-06-26 13:56:55 +02001187END(device_not_available)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001188
1189 /* runs on exception stack */
/*
 * debug: pushes 0 into the error-code slot and calls do_debug through
 * paranoidentry with ist = DEBUG_STACK.
 * The paranoidexit expansion below uses the default trace=1, so this is
 * where the paranoid_exit1 / paranoid_swapgs1 / paranoid_restore1 /
 * paranoid_userspace1 / paranoid_schedule1 labels are emitted; other
 * handlers in this file jump to paranoid_exit1 instead of expanding the
 * macro again. paranoidexit also supplies the closing CFI_ENDPROC.
 */
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001190KPROBE_ENTRY(debug)
Jan Beulich7effaa82005-09-12 18:49:24 +02001191 INTR_FRAME
Jeremy Fitzhardinge09402942008-07-12 02:22:12 -07001192 PARAVIRT_ADJUST_EXCEPTION_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001193 pushq $0
1194 CFI_ADJUST_CFA_OFFSET 8
Andi Kleen5f8efbb2006-01-16 01:56:39 +01001195 paranoidentry do_debug, DEBUG_STACK
Ingo Molnar2601e642006-07-03 00:24:45 -07001196 paranoidexit
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001197KPROBE_END(debug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001198
1199 /* runs on exception stack */
/*
 * nmi: pushes -1 into the error-code slot and calls do_nmi through
 * paranoidentry with ist = 0 and irqtrace = 0 (no TRACE_IRQS_OFF).
 * With CONFIG_TRACE_IRQFLAGS a private, trace-free copy of the exit path
 * is expanded (labels paranoid_exit0, ...); it ends with its own
 * CFI_ENDPROC. Without it, the shared paranoid_exit1 path is used and
 * CFI_ENDPROC is emitted here.
 */
Andi Kleeneddb6fb2006-02-03 21:50:41 +01001200KPROBE_ENTRY(nmi)
Jan Beulich7effaa82005-09-12 18:49:24 +02001201 INTR_FRAME
Jeremy Fitzhardinge09402942008-07-12 02:22:12 -07001202 PARAVIRT_ADJUST_EXCEPTION_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001203 pushq $-1
Jan Beulich7effaa82005-09-12 18:49:24 +02001204 CFI_ADJUST_CFA_OFFSET 8
Ingo Molnar2601e642006-07-03 00:24:45 -07001205 paranoidentry do_nmi, 0, 0
1206#ifdef CONFIG_TRACE_IRQFLAGS
1207 paranoidexit 0
1208#else
1209 jmp paranoid_exit1
1210 CFI_ENDPROC
1211#endif
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001212KPROBE_END(nmi)
Andi Kleen6fefb0d2005-04-16 15:25:03 -07001213
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001214KPROBE_ENTRY(int3)
Jan Beulichb556b352006-01-11 22:43:00 +01001215 INTR_FRAME
Jeremy Fitzhardinge09402942008-07-12 02:22:12 -07001216 PARAVIRT_ADJUST_EXCEPTION_FRAME
Jan Beulichb556b352006-01-11 22:43:00 +01001217 pushq $0
1218 CFI_ADJUST_CFA_OFFSET 8
Andi Kleen5f8efbb2006-01-16 01:56:39 +01001219 paranoidentry do_int3, DEBUG_STACK
Ingo Molnar2601e642006-07-03 00:24:45 -07001220 jmp paranoid_exit1
Jan Beulichb556b352006-01-11 22:43:00 +01001221 CFI_ENDPROC
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001222KPROBE_END(int3)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001223
1224ENTRY(overflow)
1225 zeroentry do_overflow
Jan Beulich4b787e02006-06-26 13:56:55 +02001226END(overflow)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227
1228ENTRY(bounds)
1229 zeroentry do_bounds
Jan Beulich4b787e02006-06-26 13:56:55 +02001230END(bounds)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231
1232ENTRY(invalid_op)
1233 zeroentry do_invalid_op
Jan Beulich4b787e02006-06-26 13:56:55 +02001234END(invalid_op)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001235
1236ENTRY(coprocessor_segment_overrun)
1237 zeroentry do_coprocessor_segment_overrun
Jan Beulich4b787e02006-06-26 13:56:55 +02001238END(coprocessor_segment_overrun)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001239
Linus Torvalds1da177e2005-04-16 15:20:36 -07001240 /* runs on exception stack */
1241ENTRY(double_fault)
Jan Beulich7effaa82005-09-12 18:49:24 +02001242 XCPT_FRAME
Jeremy Fitzhardinge09402942008-07-12 02:22:12 -07001243 PARAVIRT_ADJUST_EXCEPTION_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244 paranoidentry do_double_fault
Ingo Molnar2601e642006-07-03 00:24:45 -07001245 jmp paranoid_exit1
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001247END(double_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001248
1249ENTRY(invalid_TSS)
1250 errorentry do_invalid_TSS
Jan Beulich4b787e02006-06-26 13:56:55 +02001251END(invalid_TSS)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001252
1253ENTRY(segment_not_present)
1254 errorentry do_segment_not_present
Jan Beulich4b787e02006-06-26 13:56:55 +02001255END(segment_not_present)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001256
1257 /* runs on exception stack */
1258ENTRY(stack_segment)
Jan Beulich7effaa82005-09-12 18:49:24 +02001259 XCPT_FRAME
Jeremy Fitzhardinge09402942008-07-12 02:22:12 -07001260 PARAVIRT_ADJUST_EXCEPTION_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261 paranoidentry do_stack_segment
Ingo Molnar2601e642006-07-03 00:24:45 -07001262 jmp paranoid_exit1
Linus Torvalds1da177e2005-04-16 15:20:36 -07001263 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001264END(stack_segment)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001266KPROBE_ENTRY(general_protection)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001267 errorentry do_general_protection
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001268KPROBE_END(general_protection)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001269
1270ENTRY(alignment_check)
1271 errorentry do_alignment_check
Jan Beulich4b787e02006-06-26 13:56:55 +02001272END(alignment_check)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001273
1274ENTRY(divide_error)
1275 zeroentry do_divide_error
Jan Beulich4b787e02006-06-26 13:56:55 +02001276END(divide_error)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001277
1278ENTRY(spurious_interrupt_bug)
1279 zeroentry do_spurious_interrupt_bug
Jan Beulich4b787e02006-06-26 13:56:55 +02001280END(spurious_interrupt_bug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
1282#ifdef CONFIG_X86_MCE
1283 /* runs on exception stack */
1284ENTRY(machine_check)
Jan Beulich7effaa82005-09-12 18:49:24 +02001285 INTR_FRAME
Jeremy Fitzhardinge09402942008-07-12 02:22:12 -07001286 PARAVIRT_ADJUST_EXCEPTION_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287 pushq $0
1288 CFI_ADJUST_CFA_OFFSET 8
1289 paranoidentry do_machine_check
Ingo Molnar2601e642006-07-03 00:24:45 -07001290 jmp paranoid_exit1
Linus Torvalds1da177e2005-04-16 15:20:36 -07001291 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001292END(machine_check)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293#endif
1294
Andi Kleen26995002006-08-02 22:37:28 +02001295/* Call softirq on interrupt stack. Interrupts are off. */
/*
 * call_softirq: calls __do_softirq, switching %rsp to pda_irqstackptr
 * when the increment of pda_irqcount yields zero. %rbp is used as the
 * frame pointer so that leaveq can restore the caller's stack either way.
 */
Andi Kleened6b6762005-07-28 21:15:49 -07001296ENTRY(call_softirq)
Jan Beulich7effaa82005-09-12 18:49:24 +02001297 CFI_STARTPROC
Andi Kleen26995002006-08-02 22:37:28 +02001298 push %rbp
1299 CFI_ADJUST_CFA_OFFSET 8
1300 CFI_REL_OFFSET rbp,0
1301 mov %rsp,%rbp
1302 CFI_DEF_CFA_REGISTER rbp
/* incl sets ZF when the counter becomes zero; cmove switches stacks only in that case */
Andi Kleened6b6762005-07-28 21:15:49 -07001303 incl %gs:pda_irqcount
Andi Kleen26995002006-08-02 22:37:28 +02001304 cmove %gs:pda_irqstackptr,%rsp
1305 push %rbp # backlink for old unwinder
Andi Kleened6b6762005-07-28 21:15:49 -07001306 call __do_softirq
/* leaveq: %rsp = %rbp, then pop %rbp - returns to the original stack */
Andi Kleen26995002006-08-02 22:37:28 +02001307 leaveq
Jan Beulich7effaa82005-09-12 18:49:24 +02001308 CFI_DEF_CFA_REGISTER rsp
Andi Kleen26995002006-08-02 22:37:28 +02001309 CFI_ADJUST_CFA_OFFSET -8
Andi Kleened6b6762005-07-28 21:15:49 -07001310 decl %gs:pda_irqcount
Andi Kleened6b6762005-07-28 21:15:49 -07001311 ret
Jan Beulich7effaa82005-09-12 18:49:24 +02001312 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001313ENDPROC(call_softirq)
Andi Kleen75154f42007-06-23 02:29:25 +02001314
/*
 * ignore_sysret - loads -ENOSYS into %eax and executes sysret.
 *
 * The block is opened with KPROBE_ENTRY, so it is closed with KPROBE_END
 * like every other KPROBE_ENTRY block in this file.
 * NOTE(review): assumes KPROBE_END undoes the section change made by
 * KPROBE_ENTRY (which ENDPROC would not) - confirm against the macro
 * definitions in <linux/linkage.h>.
 */
KPROBE_ENTRY(ignore_sysret)
	CFI_STARTPROC
	mov $-ENOSYS,%eax
	sysret
	CFI_ENDPROC
KPROBE_END(ignore_sysret)
Jeremy Fitzhardinge3d75e1b2008-07-08 15:06:49 -07001321
1322#ifdef CONFIG_XEN
1323ENTRY(xen_hypervisor_callback)
1324 zeroentry xen_do_hypervisor_callback
1325END(xen_hypervisor_callback)
1326
1327/*
1328# A note on the "critical region" in our callback handler.
1329# We want to avoid stacking callback handlers due to events occurring
1330# during handling of the last event. To do this, we keep events disabled
1331# until we've done all processing. HOWEVER, we must enable events before
1332# popping the stack frame (can't be done atomically) and so it would still
1333# be possible to get enough handler activations to overflow the stack.
1334# Although unlikely, bugs of that kind are hard to track down, so we'd
1335# like to avoid the possibility.
1336# So, on entry to the handler we detect whether we interrupted an
1337# existing activation in its critical region -- if so, we pop the current
1338# activation and restart the handler using the previous one.
1339*/
/*
 * xen_do_hypervisor_callback(struct pt_regs *regs)
 *
 * In:  %rdi = pointer to the saved register frame. It becomes the new
 *      stack pointer and is left untouched, so xen_evtchn_do_upcall()
 *      receives it as its first argument.
 * Out: does not return to its caller; leaves through error_exit.
 *
 * The upcall runs on pda_irqstackptr when the increment of pda_irqcount
 * yields zero, otherwise on the current stack.
 */
ENTRY(xen_do_hypervisor_callback)   # do_hypervisor_callback(struct *pt_regs)
	CFI_STARTPROC
/* Since we don't modify %rdi, xen_evtchn_do_upcall(struct *pt_regs) will
   see the correct pointer to the pt_regs */
	movq %rdi, %rsp            # we don't return, adjust the stack frame
	CFI_ENDPROC
	CFI_DEFAULT_STACK
	/*
	 * incl sets ZF when the counter becomes zero; the movq below leaves
	 * the flags alone, so cmovzq switches stacks only in that case.
	 */
11:	incl %gs:pda_irqcount
	movq %rsp,%rbp
	CFI_DEF_CFA_REGISTER rbp
	cmovzq %gs:pda_irqstackptr,%rsp
	pushq %rbp			# backlink for old unwinder
	call xen_evtchn_do_upcall
	/* reload the stack pointer that was pushed as the backlink */
	popq %rsp
	CFI_DEF_CFA_REGISTER rsp
	decl %gs:pda_irqcount
	jmp  error_exit
	CFI_ENDPROC
END(xen_do_hypervisor_callback)
1359
1360/*
1361# Hypervisor uses this for application faults while it executes.
1362# We get here for two reasons:
1363# 1. Fault while reloading DS, ES, FS or GS
1364# 2. Fault while executing IRET
1365# Category 1 we do not need to fix up as Xen has already reloaded all segment
1366# registers that could be reloaded and zeroed the others.
1367# Category 2 we fix up by killing the current process. We cannot use the
1368# normal Linux return path in this case because if we use the IRET hypercall
1369# to pop the stack frame we end up in an infinite loop of failsafe callbacks.
1370# We distinguish between categories by comparing each saved segment register
1371# with its current contents: any discrepancy means we are in category 1.
1372*/
/*
 * xen_failsafe_callback: stack layout as read by this code on entry:
 *   0x00(%rsp) saved %rcx      0x08(%rsp) saved %r11
 *   0x10(%rsp) saved %ds       0x18(%rsp) saved %es
 *   0x20(%rsp) saved %fs       0x28(%rsp) saved %gs
 * These 0x30 bytes are dropped on both paths below.
 * Each saved selector is compared with the live segment register, using
 * %cx as scratch.
 */
1373ENTRY(xen_failsafe_callback)
Jeremy Fitzhardinge4a5c3e72008-07-08 15:07:09 -07001374 framesz = (RIP-0x30) /* workaround buggy gas */
1375 _frame framesz
Jeremy Fitzhardinge3d75e1b2008-07-08 15:06:49 -07001376 CFI_REL_OFFSET rcx, 0
1377 CFI_REL_OFFSET r11, 8
1378 movw %ds,%cx
1379 cmpw %cx,0x10(%rsp)
1380 CFI_REMEMBER_STATE
1381 jne 1f
1382 movw %es,%cx
1383 cmpw %cx,0x18(%rsp)
1384 jne 1f
1385 movw %fs,%cx
1386 cmpw %cx,0x20(%rsp)
1387 jne 1f
1388 movw %gs,%cx
1389 cmpw %cx,0x28(%rsp)
1390 jne 1f
1391 /* All segments match their saved values => Category 2 (Bad IRET). */
1392 movq (%rsp),%rcx
1393 CFI_RESTORE rcx
1394 movq 8(%rsp),%r11
1395 CFI_RESTORE r11
1396 addq $0x30,%rsp
1397 CFI_ADJUST_CFA_OFFSET -0x30
/* push 0, then %r11 and %rcx again, and continue in general_protection */
Jeremy Fitzhardinge4a5c3e72008-07-08 15:07:09 -07001398 pushq $0
1399 CFI_ADJUST_CFA_OFFSET 8
1400 pushq %r11
1401 CFI_ADJUST_CFA_OFFSET 8
1402 pushq %rcx
1403 CFI_ADJUST_CFA_OFFSET 8
1404 jmp general_protection
Jeremy Fitzhardinge3d75e1b2008-07-08 15:06:49 -07001405 CFI_RESTORE_STATE
14061: /* Segment mismatch => Category 1 (Bad segment). Retry the IRET. */
1407 movq (%rsp),%rcx
1408 CFI_RESTORE rcx
1409 movq 8(%rsp),%r11
1410 CFI_RESTORE r11
1411 addq $0x30,%rsp
1412 CFI_ADJUST_CFA_OFFSET -0x30
/* push 0 into the error-code slot, save all registers, and leave through error_exit */
1413 pushq $0
1414 CFI_ADJUST_CFA_OFFSET 8
1415 SAVE_ALL
1416 jmp error_exit
1417 CFI_ENDPROC
Jeremy Fitzhardinge3d75e1b2008-07-08 15:06:49 -07001418END(xen_failsafe_callback)
1419
1420#endif /* CONFIG_XEN */