blob: 038dcf733a1b30f501dcbf4504ab026819b62e73 [file] [log] [blame]
/*
 *  linux/arch/x86_64/entry.S
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *  Copyright (C) 2000, 2001, 2002  Andi Kleen SuSE Labs
 *  Copyright (C) 2000  Pavel Machek <pavel@suse.cz>
 */
8
/*
 * entry.S contains the system-call and fault low-level handling routines.
 *
 * NOTE: This code handles signal-recognition, which happens every time
 * after an interrupt and after each system call.
 *
 * Normal syscalls and interrupts don't save a full stack frame, this is
 * only done for syscall tracing, signals or fork/exec et al.
 *
 * A note on terminology:
 * - top of stack: Architecture defined interrupt frame from SS to RIP
 *   at the top of the kernel process stack.
 * - partial stack frame: partially saved registers up to R11.
 * - full stack frame: Like partial stack frame, but all registers saved.
 *
 * Some macro usage:
 * - CFI macros are used to generate dwarf2 unwind information for better
 *   backtraces. They don't change any code.
 * - SAVE_ALL/RESTORE_ALL - Save/restore all registers
 * - SAVE_ARGS/RESTORE_ARGS - Save/restore registers that C functions modify.
 *   There are unfortunately lots of special cases where some registers
 *   are not touched. The macro is a big mess that should be cleaned up.
 * - SAVE_REST/RESTORE_REST - Handle the registers not saved by SAVE_ARGS.
 *   Gives a full stack frame.
 * - ENTRY/END - Define functions in the symbol table.
 * - FIXUP_TOP_OF_STACK/RESTORE_TOP_OF_STACK - Fix up the hardware stack
 *   frame that is otherwise undefined after a SYSCALL
 * - TRACE_IRQ_* - Trace hard interrupt state for lock debugging.
 * - errorentry/paranoidentry/zeroentry - Define exception entry points.
 */
39
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#include <linux/linkage.h>
41#include <asm/segment.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#include <asm/cache.h>
43#include <asm/errno.h>
44#include <asm/dwarf2.h>
45#include <asm/calling.h>
Sam Ravnborge2d5df92005-09-09 21:28:48 +020046#include <asm/asm-offsets.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070047#include <asm/msr.h>
48#include <asm/unistd.h>
49#include <asm/thread_info.h>
50#include <asm/hw_irq.h>
Andi Kleen5f8efbb2006-01-16 01:56:39 +010051#include <asm/page.h>
Ingo Molnar2601e642006-07-03 00:24:45 -070052#include <asm/irqflags.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
/* Everything below is assembled as 64-bit code. */
	.code64

/*
 * retint_kernel is only defined as a real label when CONFIG_PREEMPT is set
 * (see the CONFIG_PREEMPT section of common_interrupt).  Without it, a
 * return to kernel space goes straight to retint_restore_args.
 */
#ifndef CONFIG_PREEMPT
#define retint_kernel retint_restore_args
#endif
Ingo Molnar2601e642006-07-03 00:24:45 -070059
60
/*
 * TRACE_IRQS_IRETQ - irq-flags tracing hook for exit paths that end in iretq.
 *
 * \offset: bias subtracted from the EFLAGS frame offset so that the macro
 *          can be used with a partial frame (default ARGOFFSET) or with a
 *          full frame (0).
 *
 * Tests bit 9 of the saved EFLAGS image.  If the bit is set, the upcoming
 * iretq will turn interrupts back on, so TRACE_IRQS_ON is invoked; if it is
 * clear the macro does nothing.  Expands to no code at all unless
 * CONFIG_TRACE_IRQFLAGS is defined.
 */
.macro TRACE_IRQS_IRETQ offset=ARGOFFSET
#ifdef CONFIG_TRACE_IRQFLAGS
	bt   $9,EFLAGS-\offset(%rsp)	/* interrupts off? */
	jnc  1f				/* bit clear: nothing to trace */
	TRACE_IRQS_ON
1:
#endif
.endm
69
/*
 * C code is not supposed to know about undefined top of stack. Every time
 * a C function with a pt_regs argument is called from the SYSCALL based
 * fast path FIXUP_TOP_OF_STACK is needed.
 * RESTORE_TOP_OF_STACK syncs the syscall state after any possible ptregs
 * manipulation.
 */
77
/*
 * FIXUP_TOP_OF_STACK - fill in the top-of-stack slots of a full frame.
 *
 * \tmp: scratch register, clobbered.
 *
 * Writes the following pt_regs slots relative to %rsp:
 *   RSP    <- %gs:pda_oldrsp
 *   SS     <- __USER_DS
 *   CS     <- __USER_CS
 *   RCX    <- -1
 *   EFLAGS <- the value stored in the R11 slot
 */
	/* %rsp:at FRAMEEND */
	.macro FIXUP_TOP_OF_STACK tmp
	movq	%gs:pda_oldrsp,\tmp
	movq	\tmp,RSP(%rsp)
	movq	$__USER_DS,SS(%rsp)
	movq	$__USER_CS,CS(%rsp)
	movq	$-1,RCX(%rsp)
	movq	R11(%rsp),\tmp  /* get eflags */
	movq	\tmp,EFLAGS(%rsp)
	.endm
88
/*
 * RESTORE_TOP_OF_STACK - copy frame state back to where the SYSCALL return
 * path reads it.
 *
 * \tmp:    scratch register, clobbered.
 * \offset: bias subtracted from the pt_regs offsets (0 for a full frame,
 *          ARGOFFSET when %rsp points at a partial frame).
 *
 * Copies the RSP slot to %gs:pda_oldrsp and the EFLAGS slot to the R11 slot.
 */
	.macro RESTORE_TOP_OF_STACK tmp,offset=0
	movq   RSP-\offset(%rsp),\tmp
	movq   \tmp,%gs:pda_oldrsp
	movq   EFLAGS-\offset(%rsp),\tmp
	movq   \tmp,R11-\offset(%rsp)
	.endm
95
/*
 * FAKE_STACK_FRAME - push a synthetic six-word frame.
 *
 * \child_rip: operand pushed into the rip slot.
 *
 * Pushes, in order: ss = 0, rsp = 0, eflags = 1<<9 (interrupts on),
 * cs = __KERNEL_CS, rip = \child_rip, orig rax = 0.
 * Clobbers %rax (zeroed via %eax).  UNFAKE_STACK_FRAME removes the frame.
 */
	.macro FAKE_STACK_FRAME child_rip
	/* push in order ss, rsp, eflags, cs, rip */
	xorl %eax, %eax
	pushq %rax /* ss */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	ss,0*/
	pushq %rax /* rsp */
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET	rsp,0
	pushq $(1<<9) /* eflags - interrupts on */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	rflags,0*/
	pushq $__KERNEL_CS /* cs */
	CFI_ADJUST_CFA_OFFSET	8
	/*CFI_REL_OFFSET	cs,0*/
	pushq \child_rip /* rip */
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET	rip,0
	pushq	%rax /* orig rax */
	CFI_ADJUST_CFA_OFFSET	8
	.endm
117
/*
 * UNFAKE_STACK_FRAME - drop the six quadwords pushed by FAKE_STACK_FRAME
 * and adjust the CFA annotation to match.
 */
	.macro UNFAKE_STACK_FRAME
	addq $8*6, %rsp
	CFI_ADJUST_CFA_OFFSET	-(6*8)
	.endm
122
/*
 * CFI_DEFAULT_STACK - unwind annotations for a full pt_regs frame at %rsp.
 *
 * \start: when non-zero (the default) a new "simple" signal-frame CFI
 *         procedure is opened with the CFA at %rsp + SS+8; when zero only
 *         the CFA offset of the already open procedure is reset to SS+8.
 *
 * In both cases every general register, rip and rsp are described as saved
 * at their pt_regs offsets.  Emits unwind information only, no instructions.
 */
	.macro	CFI_DEFAULT_STACK start=1
	.if \start
	CFI_STARTPROC	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,SS+8
	.else
	CFI_DEF_CFA_OFFSET SS+8
	.endif
	CFI_REL_OFFSET	r15,R15
	CFI_REL_OFFSET	r14,R14
	CFI_REL_OFFSET	r13,R13
	CFI_REL_OFFSET	r12,R12
	CFI_REL_OFFSET	rbp,RBP
	CFI_REL_OFFSET	rbx,RBX
	CFI_REL_OFFSET	r11,R11
	CFI_REL_OFFSET	r10,R10
	CFI_REL_OFFSET	r9,R9
	CFI_REL_OFFSET	r8,R8
	CFI_REL_OFFSET	rax,RAX
	CFI_REL_OFFSET	rcx,RCX
	CFI_REL_OFFSET	rdx,RDX
	CFI_REL_OFFSET	rsi,RSI
	CFI_REL_OFFSET	rdi,RDI
	CFI_REL_OFFSET	rip,RIP
	/*CFI_REL_OFFSET	cs,CS*/
	/*CFI_REL_OFFSET	rflags,EFLAGS*/
	CFI_REL_OFFSET	rsp,RSP
	/*CFI_REL_OFFSET	ss,SS*/
	.endm
/*
 * A newly forked process directly context switches into this.
 *
 * Flow:
 *  - reload EFLAGS from kernel_eflags and call schedule_tail;
 *  - if _TIF_SYSCALL_TRACE or _TIF_SYSCALL_AUDIT is set, call
 *    syscall_trace_leave with %rsp (the full frame) as argument;
 *  - drop the callee-saved part of the frame (RESTORE_REST);
 *  - leave through int_ret_from_sys_call when the saved CS has no RPL bits
 *    (kernel_thread) or the task has _TIF_IA32 set, otherwise sync the
 *    top of stack and leave through ret_from_sys_call.
 */
/* rdi:	prev */
ENTRY(ret_from_fork)
	CFI_DEFAULT_STACK
	push kernel_eflags(%rip)
	/*
	 * In 64-bit mode push/popf transfer 8 bytes, so the CFA moves by 8
	 * (the annotation used to say 4, which mis-described the stack
	 * between the two instructions).
	 */
	CFI_ADJUST_CFA_OFFSET 8
	popf				# reset kernel eflags
	CFI_ADJUST_CFA_OFFSET -8
	call schedule_tail
	GET_THREAD_INFO(%rcx)
	testl $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT),threadinfo_flags(%rcx)
	jnz rff_trace
rff_action:
	RESTORE_REST
	testl $3,CS-ARGOFFSET(%rsp)	# from kernel_thread?
	je   int_ret_from_sys_call
	testl $_TIF_IA32,threadinfo_flags(%rcx)
	jnz  int_ret_from_sys_call
	RESTORE_TOP_OF_STACK %rdi,ARGOFFSET
	jmp ret_from_sys_call
rff_trace:
	movq %rsp,%rdi
	call syscall_trace_leave
	GET_THREAD_INFO(%rcx)		/* reload: %rcx is not preserved by the call */
	jmp rff_action
	CFI_ENDPROC
END(ret_from_fork)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181
/*
 * System call entry. Up to 6 arguments in registers are supported.
 *
 * SYSCALL does not save anything on the stack and does not change the
 * stack pointer.
 */
188
/*
 * Register setup:
 * rax  system call number
 * rdi  arg0
 * rcx  return address for syscall/sysret, C arg3
 * rsi  arg1
 * rdx  arg2
 * r10  arg3 	(--> moved to rcx for C)
 * r8   arg4
 * r9   arg5
 * r11  eflags for syscall/sysret, temporary for C
 * r12-r15,rbp,rbx saved by C code, not touched.
 *
 * Interrupts are off on entry.
 * Only called from user space.
 *
 * XXX	if we had a free scratch register we could save the RSP into the stack frame
 *      and report it properly in ps. Unfortunately we haven't.
 *
 * When the user can change the frames always force IRET. That is because
 * it deals with non-canonical addresses better. SYSRET has trouble
 * with them due to bugs in both AMD and Intel CPUs.
 */
212
/*
 * system_call - entry point for the SYSCALL instruction.
 *
 * On entry %rcx holds the return rip and %rsp is still the caller's stack
 * pointer.  The code switches to the kernel GS and the stack found in
 * %gs:pda_kernelstack, builds a partial frame, and dispatches through
 * sys_call_table.  Sub-paths in this procedure:
 *   ret_from_sys_call / sysret_check - fast exit ending in sysretq
 *   sysret_careful                   - reschedule, then re-check
 *   sysret_signal                    - signal / notify-resume work, then
 *                                      leaves via the IRET path
 *   badsys                           - syscall number above the table
 *   tracesys                         - entry with tracing/audit/seccomp
 */
ENTRY(system_call)
	CFI_STARTPROC	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,PDA_STACKOFFSET
	CFI_REGISTER	rip,rcx
	/*CFI_REGISTER	rflags,r11*/
	swapgs
	movq	%rsp,%gs:pda_oldrsp
	movq	%gs:pda_kernelstack,%rsp
	/*
	 * No need to follow this irqs off/on section - it's straight
	 * and short:
	 */
	sti
	SAVE_ARGS 8,1
	movq  %rax,ORIG_RAX-ARGOFFSET(%rsp)
	movq  %rcx,RIP-ARGOFFSET(%rsp)
	CFI_REL_OFFSET rip,RIP-ARGOFFSET
	GET_THREAD_INFO(%rcx)
	testl $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SECCOMP),threadinfo_flags(%rcx)
	CFI_REMEMBER_STATE
	jnz tracesys
	cmpq $__NR_syscall_max,%rax
	ja badsys			/* unsigned compare: number out of range */
	movq %r10,%rcx			/* arg3 arrives in r10, C expects rcx */
	call *sys_call_table(,%rax,8)  # XXX:	 rip relative
	movq %rax,RAX-ARGOFFSET(%rsp)
/*
 * Syscall return path ending with SYSRET (fast path)
 * Has incomplete stack frame and undefined top of stack.
 */
	.globl ret_from_sys_call
ret_from_sys_call:
	movl $_TIF_ALLWORK_MASK,%edi
	/* edi:	flagmask */
sysret_check:
	GET_THREAD_INFO(%rcx)
	cli
	TRACE_IRQS_OFF
	movl threadinfo_flags(%rcx),%edx
	andl %edi,%edx
	CFI_REMEMBER_STATE
	jnz  sysret_careful
	/*
	 * sysretq will re-enable interrupts:
	 */
	TRACE_IRQS_ON
	movq RIP-ARGOFFSET(%rsp),%rcx
	CFI_REGISTER	rip,rcx
	RESTORE_ARGS 0,-ARG_SKIP,1
	/*CFI_REGISTER	rflags,r11*/
	movq	%gs:pda_oldrsp,%rsp
	swapgs
	sysretq

	/* Handle reschedules */
	/* edx:	work, edi: workmask */
sysret_careful:
	CFI_RESTORE_STATE
	bt $TIF_NEED_RESCHED,%edx
	jnc sysret_signal
	TRACE_IRQS_ON
	sti
	pushq %rdi			/* keep the work mask across schedule */
	CFI_ADJUST_CFA_OFFSET 8
	call schedule
	popq  %rdi
	CFI_ADJUST_CFA_OFFSET -8
	jmp sysret_check

	/* Handle a signal */
sysret_signal:
	TRACE_IRQS_ON
	sti
	testl $(_TIF_SIGPENDING|_TIF_NOTIFY_RESUME|_TIF_SINGLESTEP),%edx
	jz    1f

	/* Really a signal */
	/* edx:	work flags (arg3) */
	leaq do_notify_resume(%rip),%rax
	leaq -ARGOFFSET(%rsp),%rdi # &pt_regs -> arg1
	xorl %esi,%esi # oldset -> arg2
	call ptregscall_common
1:	movl $_TIF_NEED_RESCHED,%edi
	/* Use IRET because user could have changed frame. This
	   works because ptregscall_common has called FIXUP_TOP_OF_STACK. */
	cli
	TRACE_IRQS_OFF
	jmp int_with_check

badsys:
	movq $-ENOSYS,RAX-ARGOFFSET(%rsp)
	jmp ret_from_sys_call

	/* Do syscall tracing */
tracesys:
	CFI_RESTORE_STATE
	SAVE_REST
	movq $-ENOSYS,RAX(%rsp)
	FIXUP_TOP_OF_STACK %rdi
	movq %rsp,%rdi
	call syscall_trace_enter
	LOAD_ARGS ARGOFFSET  /* reload args from stack in case ptrace changed it */
	RESTORE_REST
	cmpq $__NR_syscall_max,%rax
	movq $-ENOSYS,%rcx		/* mov/cmov leave the cmpq flags intact */
	cmova %rcx,%rax			/* out of range: result is -ENOSYS */
	ja  1f
	movq %r10,%rcx	/* fixup for C */
	call *sys_call_table(,%rax,8)
1:	movq %rax,RAX-ARGOFFSET(%rsp)
	/* Use IRET because user could have changed frame */
	jmp int_ret_from_sys_call
	CFI_ENDPROC
END(system_call)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328
/*
 * Syscall return path ending with IRET.
 * Has correct top of stack, but partial stack frame.
 *
 * Loops over the thread-info work flags selected by the mask in %edi:
 *   int_careful       - TIF_NEED_RESCHED: call schedule, re-check
 *   int_very_careful  - builds a full frame, then either syscall exit
 *                       tracing (syscall_trace_leave) or int_signal
 *   int_signal        - do_notify_resume for signal/notify/singlestep work
 * When no selected flag remains set, TS_COMPAT is cleared in the thread
 * status and control passes to retint_swapgs.  A saved CS without RPL
 * bits (return to kernel) goes straight to retint_restore_args.
 */
ENTRY(int_ret_from_sys_call)
	CFI_STARTPROC	simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA	rsp,SS+8-ARGOFFSET
	/*CFI_REL_OFFSET	ss,SS-ARGOFFSET*/
	CFI_REL_OFFSET	rsp,RSP-ARGOFFSET
	/*CFI_REL_OFFSET	rflags,EFLAGS-ARGOFFSET*/
	/*CFI_REL_OFFSET	cs,CS-ARGOFFSET*/
	CFI_REL_OFFSET	rip,RIP-ARGOFFSET
	CFI_REL_OFFSET	rdx,RDX-ARGOFFSET
	CFI_REL_OFFSET	rcx,RCX-ARGOFFSET
	CFI_REL_OFFSET	rax,RAX-ARGOFFSET
	CFI_REL_OFFSET	rdi,RDI-ARGOFFSET
	CFI_REL_OFFSET	rsi,RSI-ARGOFFSET
	CFI_REL_OFFSET	r8,R8-ARGOFFSET
	CFI_REL_OFFSET	r9,R9-ARGOFFSET
	CFI_REL_OFFSET	r10,R10-ARGOFFSET
	CFI_REL_OFFSET	r11,R11-ARGOFFSET
	cli
	TRACE_IRQS_OFF
	testl $3,CS-ARGOFFSET(%rsp)
	je retint_restore_args
	movl $_TIF_ALLWORK_MASK,%edi
	/* edi: mask to check */
int_with_check:
	GET_THREAD_INFO(%rcx)
	movl threadinfo_flags(%rcx),%edx
	andl %edi,%edx
	jnz   int_careful
	andl    $~TS_COMPAT,threadinfo_status(%rcx)
	jmp   retint_swapgs

	/* Either reschedule or signal or syscall exit tracking needed. */
	/* First do a reschedule test. */
	/* edx:	work, edi: workmask */
int_careful:
	bt $TIF_NEED_RESCHED,%edx
	jnc  int_very_careful
	TRACE_IRQS_ON
	sti
	pushq %rdi			/* keep the work mask across schedule */
	CFI_ADJUST_CFA_OFFSET 8
	call schedule
	popq %rdi
	CFI_ADJUST_CFA_OFFSET -8
	cli
	TRACE_IRQS_OFF
	jmp int_with_check

	/* handle signals and tracing -- both require a full stack frame */
int_very_careful:
	TRACE_IRQS_ON
	sti
	SAVE_REST
	/* Check for syscall exit trace */
	testl $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SINGLESTEP),%edx
	jz int_signal
	pushq %rdi
	CFI_ADJUST_CFA_OFFSET 8
	leaq 8(%rsp),%rdi	# &ptregs -> arg1
	call syscall_trace_leave
	popq %rdi
	CFI_ADJUST_CFA_OFFSET -8
	/* drop the trace bits from the mask so they are not handled again */
	andl $~(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SINGLESTEP),%edi
	cli
	TRACE_IRQS_OFF
	jmp int_restore_rest

int_signal:
	testl $(_TIF_NOTIFY_RESUME|_TIF_SIGPENDING|_TIF_SINGLESTEP),%edx
	jz 1f
	movq %rsp,%rdi		# &ptregs -> arg1
	xorl %esi,%esi		# oldset -> arg2
	call do_notify_resume
1:	movl $_TIF_NEED_RESCHED,%edi
int_restore_rest:
	RESTORE_REST
	cli
	TRACE_IRQS_OFF
	jmp int_with_check
	CFI_ENDPROC
END(int_ret_from_sys_call)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415
/*
 * Certain special system calls that need to save a complete full stack frame.
 *
 * PTREGSCALL label,func,arg - emit a global stub \label that loads the
 * address of \func into %rax, loads the address of the pt_regs area into
 * the register \arg, and jumps to ptregscall_common (which saves the rest
 * of the frame and calls through %rax).
 */

	.macro PTREGSCALL label,func,arg
	.globl \label
\label:
	leaq	\func(%rip),%rax
	leaq    -ARGOFFSET+8(%rsp),\arg /* 8 for return address */
	jmp	ptregscall_common
END(\label)
	.endm
428
/*
 * The PTREGSCALL stubs and ptregscall_common share a single CFI procedure,
 * opened here and closed at the end of ptregscall_common.
 */
	CFI_STARTPROC

	PTREGSCALL stub_clone, sys_clone, %r8
	PTREGSCALL stub_fork, sys_fork, %rdi
	PTREGSCALL stub_vfork, sys_vfork, %rdi
	PTREGSCALL stub_rt_sigsuspend, sys_rt_sigsuspend, %rdx
	PTREGSCALL stub_sigaltstack, sys_sigaltstack, %rdx
	PTREGSCALL stub_iopl, sys_iopl, %rsi

/*
 * ptregscall_common - call the handler in %rax with a full stack frame.
 *
 * In:  %rax = address of the C handler; return address on top of the stack.
 *
 * The return address is popped into %r11 and parked in %r15 (after
 * SAVE_REST has stored the original %r15) so that it survives the call;
 * it is pushed back before the final ret.  FIXUP_TOP_OF_STACK /
 * RESTORE_TOP_OF_STACK bracket the call, both using %r11 as scratch.
 */
ENTRY(ptregscall_common)
	popq %r11
	CFI_ADJUST_CFA_OFFSET -8
	CFI_REGISTER rip, r11
	SAVE_REST
	movq %r11, %r15
	CFI_REGISTER rip, r15
	FIXUP_TOP_OF_STACK %r11
	call *%rax
	RESTORE_TOP_OF_STACK %r11
	movq %r15, %r11
	CFI_REGISTER rip, r11
	RESTORE_REST
	pushq %r11
	CFI_ADJUST_CFA_OFFSET 8
	CFI_REL_OFFSET rip, 0
	ret
	CFI_ENDPROC
END(ptregscall_common)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457
/*
 * stub_execve - execve wrapper that runs sys_execve on a full stack frame.
 *
 * The return address is popped (into %r11, then overwritten as scratch) and
 * never pushed back: the stub stores the result in the RAX slot and leaves
 * through int_ret_from_sys_call instead of returning to its caller.
 */
ENTRY(stub_execve)
	CFI_STARTPROC
	popq %r11
	CFI_ADJUST_CFA_OFFSET -8
	CFI_REGISTER rip, r11
	SAVE_REST
	FIXUP_TOP_OF_STACK %r11
	call sys_execve
	RESTORE_TOP_OF_STACK %r11
	movq %rax,RAX(%rsp)
	RESTORE_REST
	jmp int_ret_from_sys_call
	CFI_ENDPROC
END(stub_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472
/*
 * sigreturn is special because it needs to restore all registers on return.
 * This cannot be done with SYSRET, so use the IRET return path instead.
 *
 * The return address is discarded (addq $8), a full frame is built, and
 * sys_rt_sigreturn is called with %rdi = %rsp (the frame).  Its result is
 * stored in the RAX slot before leaving via int_ret_from_sys_call.
 */
ENTRY(stub_rt_sigreturn)
	CFI_STARTPROC
	addq $8, %rsp
	CFI_ADJUST_CFA_OFFSET	-8
	SAVE_REST
	movq %rsp,%rdi
	FIXUP_TOP_OF_STACK %r11
	call sys_rt_sigreturn
	movq %rax,RAX(%rsp) # fixme, this could be done at the higher layer
	RESTORE_REST
	jmp int_ret_from_sys_call
	CFI_ENDPROC
END(stub_rt_sigreturn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490
/*
 * initial frame state for interrupts and exceptions
 *
 * _frame ref - open a "simple" signal-frame CFI procedure in which %rsp
 * points at the pt_regs slot \ref: the CFA is %rsp + SS+8-\ref and the
 * saved rsp/rip are described relative to that slot.  Emits unwind
 * information only.
 */
	.macro _frame ref
	CFI_STARTPROC simple
	CFI_SIGNAL_FRAME
	CFI_DEF_CFA rsp,SS+8-\ref
	/*CFI_REL_OFFSET ss,SS-\ref*/
	CFI_REL_OFFSET rsp,RSP-\ref
	/*CFI_REL_OFFSET rflags,EFLAGS-\ref*/
	/*CFI_REL_OFFSET cs,CS-\ref*/
	CFI_REL_OFFSET rip,RIP-\ref
	.endm

/* initial frame state for interrupts (and exceptions without error code) */
#define INTR_FRAME _frame RIP
/* initial frame state for exceptions with error code (and interrupts with
   vector already pushed) */
#define XCPT_FRAME _frame ORIG_RAX
510
/*
 * Interrupt entry/exit.
 *
 * Interrupt entry points save only callee clobbered registers in fast path.
 *
 * Entry runs with interrupts off.
 *
 * interrupt func - common interrupt prologue followed by "call \func".
 *   - saves the argument registers and passes %rsp-ARGOFFSET (the pt_regs
 *     base) to the handler in %rdi;
 *   - sets up %rbp as a frame pointer so that ret_from_intr can undo any
 *     stack switch with leaveq;
 *   - does swapgs when the saved CS has RPL bits set;
 *   - increments %gs:pda_irqcount and, when the increment yields zero,
 *     switches %rsp to %gs:pda_irqstackptr.
 */

/* 0(%rsp): interrupt number */
	.macro interrupt func
	cld
	SAVE_ARGS
	leaq -ARGOFFSET(%rsp),%rdi	# arg1 for handler
	pushq %rbp
	CFI_ADJUST_CFA_OFFSET	8
	CFI_REL_OFFSET		rbp, 0
	movq %rsp,%rbp
	CFI_DEF_CFA_REGISTER	rbp
	testl $3,CS(%rdi)
	je 1f
	swapgs
	/* irqcount is used to check if a CPU is already on an interrupt
	   stack or not. While this is essentially redundant with preempt_count
	   it is a little cheaper to use a separate counter in the PDA
	   (short of moving irq_enter into assembly, which would be too
	    much work) */
1:	incl	%gs:pda_irqcount
	cmoveq %gs:pda_irqstackptr,%rsp	/* uses ZF produced by the incl above */
	push    %rbp			# backlink for old unwinder
	CFI_ADJUST_CFA_OFFSET 8
	CFI_REL_OFFSET rbp,0
	/*
	 * We entered an interrupt context - irqs are off:
	 */
	TRACE_IRQS_OFF
	call \func
	.endm
548
/*
 * common_interrupt - device interrupt entry; runs do_IRQ via the interrupt
 * macro and then falls into the shared interrupt return code.
 *
 * Labels in this procedure:
 *   ret_from_intr          - undo the irq-stack switch, decrement irqcount
 *   exit_intr              - choose user or kernel return path from saved CS
 *   retint_with_reschedule / retint_check - test thread-info work flags
 *   retint_swapgs          - return to user space: swapgs, then restore_args
 *   retint_restore_args / restore_args / iret_label - restore and iretq
 *   bad_iret (.fixup)      - reached via __ex_table if the iretq faults;
 *                            calls do_exit with 11 (SIGSEGV) in %rdi
 *   retint_careful         - reschedule, then re-check
 *   retint_signal          - do_notify_resume on a full frame, then re-check
 *   retint_kernel          - CONFIG_PREEMPT only: kernel preemption check
 */
ENTRY(common_interrupt)
	XCPT_FRAME
	interrupt do_IRQ
	/* 0(%rsp): oldrsp-ARGOFFSET */
ret_from_intr:
	cli
	TRACE_IRQS_OFF
	decl %gs:pda_irqcount
	leaveq				/* back to the stack saved in %rbp */
	CFI_DEF_CFA_REGISTER	rsp
	CFI_ADJUST_CFA_OFFSET	-8
exit_intr:
	GET_THREAD_INFO(%rcx)
	testl $3,CS-ARGOFFSET(%rsp)
	je retint_kernel

	/* Interrupt came from user space */
	/*
	 * Has a correct top of stack, but a partial stack frame
	 * %rcx: thread info. Interrupts off.
	 */
retint_with_reschedule:
	movl $_TIF_WORK_MASK,%edi
retint_check:
	movl threadinfo_flags(%rcx),%edx
	andl %edi,%edx
	CFI_REMEMBER_STATE
	jnz  retint_careful
retint_swapgs:
	/*
	 * The iretq could re-enable interrupts:
	 */
	cli
	TRACE_IRQS_IRETQ
	swapgs
	jmp restore_args

retint_restore_args:
	cli
	/*
	 * The iretq could re-enable interrupts:
	 */
	TRACE_IRQS_IRETQ
restore_args:
	RESTORE_ARGS 0,8,0
iret_label:
	iretq

	.section __ex_table,"a"
	.quad iret_label,bad_iret
	.previous
	.section .fixup,"ax"
	/* force a signal here? this matches i386 behaviour */
	/* running with kernel gs */
bad_iret:
	movq $11,%rdi	/* SIGSEGV */
	TRACE_IRQS_ON
	sti
	jmp do_exit
	.previous

	/* edi: workmask, edx: work */
retint_careful:
	CFI_RESTORE_STATE
	bt    $TIF_NEED_RESCHED,%edx
	jnc   retint_signal
	TRACE_IRQS_ON
	sti
	pushq %rdi			/* keep the work mask across schedule */
	CFI_ADJUST_CFA_OFFSET	8
	call  schedule
	popq %rdi
	CFI_ADJUST_CFA_OFFSET	-8
	GET_THREAD_INFO(%rcx)
	cli
	TRACE_IRQS_OFF
	jmp retint_check

retint_signal:
	testl $(_TIF_SIGPENDING|_TIF_NOTIFY_RESUME|_TIF_SINGLESTEP),%edx
	jz    retint_swapgs
	TRACE_IRQS_ON
	sti
	SAVE_REST
	movq $-1,ORIG_RAX(%rsp)
	xorl %esi,%esi		# oldset
	movq %rsp,%rdi		# &pt_regs
	call do_notify_resume
	RESTORE_REST
	cli
	TRACE_IRQS_OFF
	movl $_TIF_NEED_RESCHED,%edi
	GET_THREAD_INFO(%rcx)
	jmp retint_check

#ifdef CONFIG_PREEMPT
	/* Returning to kernel space. Check if we need preemption */
	/* rcx:	 threadinfo. interrupts off. */
ENTRY(retint_kernel)
	cmpl $0,threadinfo_preempt_count(%rcx)
	jnz  retint_restore_args
	bt  $TIF_NEED_RESCHED,threadinfo_flags(%rcx)
	jnc  retint_restore_args
	bt   $9,EFLAGS-ARGOFFSET(%rsp)	/* interrupts off? */
	jnc  retint_restore_args
	call preempt_schedule_irq
	jmp exit_intr
#endif

	CFI_ENDPROC
END(common_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700660
/*
 * APIC interrupts.
 *
 * apicinterrupt num,func - body of an APIC interrupt entry point: pushes
 * the bitwise complement of the vector number \num into the slot where
 * common_interrupt expects the interrupt number, runs the interrupt
 * prologue calling \func, and finishes through ret_from_intr.
 */
	.macro apicinterrupt num,func
	INTR_FRAME
	pushq $~(\num)
	CFI_ADJUST_CFA_OFFSET 8
	interrupt \func
	jmp ret_from_intr
	CFI_ENDPROC
	.endm
672
/* APIC entry points for the thermal and MCE-threshold vectors. */
ENTRY(thermal_interrupt)
	apicinterrupt THERMAL_APIC_VECTOR,smp_thermal_interrupt
END(thermal_interrupt)

ENTRY(threshold_interrupt)
	apicinterrupt THRESHOLD_APIC_VECTOR,mce_threshold_interrupt
END(threshold_interrupt)
Jacob Shin89b831e2005-11-05 17:25:53 +0100680
/* Inter-processor interrupt entry points; only built with CONFIG_SMP. */
#ifdef CONFIG_SMP
ENTRY(reschedule_interrupt)
	apicinterrupt RESCHEDULE_VECTOR,smp_reschedule_interrupt
END(reschedule_interrupt)

	/*
	 * INVALIDATE_ENTRY num - define invalidate_interrupt<num> for vector
	 * INVALIDATE_TLB_VECTOR_START+num; all of them call
	 * smp_invalidate_interrupt.
	 */
	.macro INVALIDATE_ENTRY num
ENTRY(invalidate_interrupt\num)
	apicinterrupt INVALIDATE_TLB_VECTOR_START+\num,smp_invalidate_interrupt
END(invalidate_interrupt\num)
	.endm

	INVALIDATE_ENTRY 0
	INVALIDATE_ENTRY 1
	INVALIDATE_ENTRY 2
	INVALIDATE_ENTRY 3
	INVALIDATE_ENTRY 4
	INVALIDATE_ENTRY 5
	INVALIDATE_ENTRY 6
	INVALIDATE_ENTRY 7

ENTRY(call_function_interrupt)
	apicinterrupt CALL_FUNCTION_VECTOR,smp_call_function_interrupt
END(call_function_interrupt)
#endif
705
/* APIC entry points for the local timer, error and spurious vectors. */
ENTRY(apic_timer_interrupt)
	apicinterrupt LOCAL_TIMER_VECTOR,smp_apic_timer_interrupt
END(apic_timer_interrupt)

ENTRY(error_interrupt)
	apicinterrupt ERROR_APIC_VECTOR,smp_error_interrupt
END(error_interrupt)

ENTRY(spurious_interrupt)
	apicinterrupt SPURIOUS_APIC_VECTOR,smp_spurious_interrupt
END(spurious_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717
/*
 * Exception entry points.
 *
 * zeroentry sym - entry for an exception that arrives without an error
 * code: pushes 0 in its place, pushes the original %rax, loads the address
 * of the C handler \sym into %rax and jumps to error_entry.
 */
	.macro zeroentry sym
	INTR_FRAME
	pushq $0	/* push error code/oldrax */
	CFI_ADJUST_CFA_OFFSET 8
	pushq %rax	/* push real oldrax to the rdi slot */
	CFI_ADJUST_CFA_OFFSET 8
	leaq  \sym(%rip),%rax
	jmp error_entry
	CFI_ENDPROC
	.endm
731
/*
 * errorentry sym - entry for an exception whose error code is already on
 * the stack (XCPT_FRAME): pushes the original %rax, loads the address of
 * the C handler \sym into %rax and jumps to error_entry.
 */
	.macro errorentry sym
	XCPT_FRAME
	pushq %rax
	CFI_ADJUST_CFA_OFFSET 8
	leaq  \sym(%rip),%rax
	jmp error_entry
	CFI_ENDPROC
	.endm
740
/*
 * paranoidentry sym, ist=0, irqtrace=1
 *
 * \sym:      C handler, called with %rdi = pt_regs (%rsp) and
 *            %rsi = the value taken from the ORIG_RAX slot; that slot is
 *            then overwritten with -1.
 * \ist:      when non-zero, the (\ist - 1)th TSS IST entry of this CPU's
 *            init_tss is lowered by EXCEPTION_STKSZ for the duration of
 *            the call and raised again afterwards.
 * \irqtrace: when non-zero, TRACE_IRQS_OFF is invoked after the final cli.
 *
 * Leaves %ebx = 1 when no swapgs was performed here and %ebx = 0 when it
 * was; the paranoid exit path uses this as its "no swapgs" flag.  The
 * decision is made by reading MSR_GS_BASE and testing the sign of its
 * high half (%edx) — NOTE(review): presumably a negative value means the
 * kernel GS base is already active; confirm.
 */
	/* error code is on the stack already */
	/* handle NMI like exceptions that can happen everywhere */
	.macro paranoidentry sym, ist=0, irqtrace=1
	SAVE_ALL
	cld
	movl $1,%ebx
	movl  $MSR_GS_BASE,%ecx
	rdmsr
	testl %edx,%edx
	js    1f
	swapgs
	xorl  %ebx,%ebx
1:
	.if \ist
	movq	%gs:pda_data_offset, %rbp
	.endif
	movq %rsp,%rdi
	movq ORIG_RAX(%rsp),%rsi
	movq $-1,ORIG_RAX(%rsp)
	.if \ist
	subq	$EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
	.endif
	call \sym
	.if \ist
	addq	$EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
	.endif
	cli
	.if \irqtrace
	TRACE_IRQS_OFF
	.endif
	.endm
Ingo Molnar2601e642006-07-03 00:24:45 -0700772
773 /*
774 * "Paranoid" exit path from exception stack.
775 * Paranoid because this is used by NMIs and cannot take
776 * any kernel state for granted.
777 * We don't do kernel preemption checks here, because only
778 * NMI should be common and it does not enable IRQs and
779 * cannot get reschedule ticks.
780 *
781 * "trace" is 0 for the NMI handler only, because irq-tracing
782 * is fundamentally NMI-unsafe. (we cannot change the soft and
783 * hard flags at once, atomically)
784 */
/*
 * Every label below is suffixed with the value of \trace, so the default
 * instantiation (trace=1) defines paranoid_exit1, paranoid_swapgs1, ... and
 * an instantiation with trace=0 defines paranoid_exit0, ... The macro also
 * emits the closing CFI_ENDPROC for the entry point that expands it.
 */
785 .macro paranoidexit trace=1
786 /* ebx: no swapgs flag */
787paranoid_exit\trace:
788 testl %ebx,%ebx /* swapgs needed? */
789 jnz paranoid_restore\trace
	/* low two bits of the saved CS non-zero: check for pending work first */
790 testl $3,CS(%rsp)
791 jnz paranoid_userspace\trace
792paranoid_swapgs\trace:
Andi Kleen7a0a2df2006-09-26 10:52:37 +0200793 .if \trace
Ingo Molnar2601e642006-07-03 00:24:45 -0700794 TRACE_IRQS_IRETQ 0
Andi Kleen7a0a2df2006-09-26 10:52:37 +0200795 .endif
Ingo Molnar2601e642006-07-03 00:24:45 -0700796 swapgs
797paranoid_restore\trace:
	/* NOTE(review): the argument 8 presumably skips the error code slot - confirm against RESTORE_ALL */
798 RESTORE_ALL 8
799 iretq
800paranoid_userspace\trace:
	/* ebx = thread flags masked with _TIF_WORK_MASK; zero means nothing to do */
801 GET_THREAD_INFO(%rcx)
802 movl threadinfo_flags(%rcx),%ebx
803 andl $_TIF_WORK_MASK,%ebx
804 jz paranoid_swapgs\trace
805 movq %rsp,%rdi /* &pt_regs */
806 call sync_regs
807 movq %rax,%rsp /* switch stack for scheduling */
808 testl $_TIF_NEED_RESCHED,%ebx
809 jnz paranoid_schedule\trace
810 movl %ebx,%edx /* arg3: thread flags */
811 .if \trace
812 TRACE_IRQS_ON
813 .endif
	/* do_notify_resume is called with interrupts enabled */
814 sti
815 xorl %esi,%esi /* arg2: oldset */
816 movq %rsp,%rdi /* arg1: &pt_regs */
817 call do_notify_resume
818 cli
819 .if \trace
820 TRACE_IRQS_OFF
821 .endif
	/* re-read the thread flags and loop until no work is left */
822 jmp paranoid_userspace\trace
823paranoid_schedule\trace:
824 .if \trace
825 TRACE_IRQS_ON
826 .endif
	/* schedule is called with interrupts enabled */
827 sti
828 call schedule
829 cli
830 .if \trace
831 TRACE_IRQS_OFF
832 .endif
833 jmp paranoid_userspace\trace
834 CFI_ENDPROC
835 .endm
836
Linus Torvalds1da177e2005-04-16 15:20:36 -0700837/*
838 * Exception entry point. This expects an error code/orig_rax on the stack
839 * and the exception handler in %rax.
840 */
/*
 * Flow: save the remaining registers into a full frame, decide from the
 * saved CS whether swapgs is needed, call the handler with
 * rdi = frame pointer and rsi = error code, then leave through error_exit.
 * %ebx carries the "no swapgs" flag across the handler call.
 */
Prasanna S.Pd28c4392006-09-26 10:52:34 +0200841KPROBE_ENTRY(error_entry)
Jan Beulich7effaa82005-09-12 18:49:24 +0200842 _frame RDI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700843 /* rdi slot contains rax, oldrax contains error code */
844 cld
	/* reserve the 14 slots from rsi down to r15 that are filled below */
845 subq $14*8,%rsp
846 CFI_ADJUST_CFA_OFFSET (14*8)
847 movq %rsi,13*8(%rsp)
848 CFI_REL_OFFSET rsi,RSI
849 movq 14*8(%rsp),%rsi /* load rax from rdi slot */
850 movq %rdx,12*8(%rsp)
851 CFI_REL_OFFSET rdx,RDX
852 movq %rcx,11*8(%rsp)
853 CFI_REL_OFFSET rcx,RCX
854 movq %rsi,10*8(%rsp) /* store rax */
855 CFI_REL_OFFSET rax,RAX
856 movq %r8, 9*8(%rsp)
857 CFI_REL_OFFSET r8,R8
858 movq %r9, 8*8(%rsp)
859 CFI_REL_OFFSET r9,R9
860 movq %r10,7*8(%rsp)
861 CFI_REL_OFFSET r10,R10
862 movq %r11,6*8(%rsp)
863 CFI_REL_OFFSET r11,R11
864 movq %rbx,5*8(%rsp)
865 CFI_REL_OFFSET rbx,RBX
866 movq %rbp,4*8(%rsp)
867 CFI_REL_OFFSET rbp,RBP
868 movq %r12,3*8(%rsp)
869 CFI_REL_OFFSET r12,R12
870 movq %r13,2*8(%rsp)
871 CFI_REL_OFFSET r13,R13
872 movq %r14,1*8(%rsp)
873 CFI_REL_OFFSET r14,R14
874 movq %r15,(%rsp)
875 CFI_REL_OFFSET r15,R15
	/* ebx = 0: swapgs is needed on exit unless error_kernelspace says otherwise */
876 xorl %ebx,%ebx
	/* low two bits of the saved CS zero: take the kernel-space path */
877 testl $3,CS(%rsp)
878 je error_kernelspace
879error_swapgs:
880 swapgs
881error_sti:
	/* the rdi slot held rax until now; store the real rdi there */
882 movq %rdi,RDI(%rsp)
	/* arg1: pointer to the saved register frame */
883 movq %rsp,%rdi
884 movq ORIG_RAX(%rsp),%rsi /* get error code */
885 movq $-1,ORIG_RAX(%rsp)
	/* rax still holds the handler address loaded by the entry stub */
886 call *%rax
887 /* ebx: no swapgs flag (1: don't need swapgs, 0: need it) */
888error_exit:
	/* keep the flag in eax; RESTORE_REST runs next (it presumably reloads rbx - confirm) */
889 movl %ebx,%eax
890 RESTORE_REST
891 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700892 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700893 GET_THREAD_INFO(%rcx)
	/* flag set: no swapgs needed, leave through retint_kernel */
894 testl %eax,%eax
895 jne retint_kernel
	/* any _TIF_WORK_MASK bit pending: take the slow path */
896 movl threadinfo_flags(%rcx),%edx
897 movl $_TIF_WORK_MASK,%edi
898 andl %edi,%edx
899 jnz retint_careful
Ingo Molnar2601e642006-07-03 00:24:45 -0700900 /*
901 * The iret might restore flags:
902 */
903 TRACE_IRQS_IRETQ
Linus Torvalds1da177e2005-04-16 15:20:36 -0700904 swapgs
905 RESTORE_ARGS 0,8,0
Jan Beulich505cc4e2006-01-11 22:42:20 +0100906 jmp iret_label
Linus Torvalds1da177e2005-04-16 15:20:36 -0700907 CFI_ENDPROC
908
909error_kernelspace:
	/* ebx = 1: no swapgs on exit */
910 incl %ebx
911 /* There are two places in the kernel that can potentially fault with
912 usergs. Handle them here. The exception handlers after
913 iret run with kernel gs again, so don't set the user space flag.
914 B stepping K8s sometimes report a truncated RIP for IRET
915 exceptions returning to compat mode. Check for these here too. */
	/* fault at iret_label itself */
916 leaq iret_label(%rip),%rbp
917 cmpq %rbp,RIP(%rsp)
918 je error_swapgs
	/* fault reported with only the low 32 bits of the iret_label address */
919 movl %ebp,%ebp /* zero extend */
920 cmpq %rbp,RIP(%rsp)
921 je error_swapgs
	/* fault on the segment load at gs_change in load_gs_index */
922 cmpq $gs_change,RIP(%rsp)
923 je error_swapgs
924 jmp error_sti
Prasanna S.Pd28c4392006-09-26 10:52:34 +0200925KPROBE_END(error_entry)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700926
927 /* Reload gs selector with exception handling */
928 /* edi: new selector */
/*
 * The flags are saved and interrupts disabled around the sequence
 * swapgs / load %gs / swapgs. The load at gs_change is registered in
 * __ex_table with bad_gs as its fixup; bad_gs loads a zero selector
 * instead and resumes at local label 2.
 */
929ENTRY(load_gs_index)
Jan Beulich7effaa82005-09-12 18:49:24 +0200930 CFI_STARTPROC
	/* save the caller's flags; popf below restores them */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700931 pushf
Jan Beulich7effaa82005-09-12 18:49:24 +0200932 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700933 cli
934 swapgs
935gs_change:
	/* this load may fault; see the __ex_table entry below */
936 movl %edi,%gs
9372: mfence /* workaround */
938 swapgs
939 popf
Jan Beulich7effaa82005-09-12 18:49:24 +0200940 CFI_ADJUST_CFA_OFFSET -8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700941 ret
Jan Beulich7effaa82005-09-12 18:49:24 +0200942 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200943ENDPROC(load_gs_index)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944
	/* exception table entry: a fault at gs_change continues at bad_gs */
945 .section __ex_table,"a"
946 .align 8
947 .quad gs_change,bad_gs
948 .previous
949 .section .fixup,"ax"
950 /* running with kernelgs */
951bad_gs:
952 swapgs /* switch back to user gs */
	/* load a zero selector in place of the one that faulted */
953 xorl %eax,%eax
954 movl %eax,%gs
	/* resume in load_gs_index right after the faulting load */
955 jmp 2b
956 .previous
957
958/*
959 * Create a kernel thread.
960 *
961 * C extern interface:
962 * extern long kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
963 *
964 * asm input arguments:
965 * rdi: fn, rsi: arg, rdx: flags
966 */
/*
 * Builds a fake stack frame whose return address is child_rip, saves all
 * registers and calls do_fork with the argument registers set up below.
 * The value returned by do_fork is written to the RAX slot of the frame
 * before the registers are restored and the function returns.
 */
967ENTRY(kernel_thread)
968 CFI_STARTPROC
969 FAKE_STACK_FRAME $child_rip
970 SAVE_ALL
971
972 # rdi: flags, rsi: usp, rdx: will be &pt_regs
973 movq %rdx,%rdi
	/* OR in the flag bits stored in kernel_thread_flags */
974 orq kernel_thread_flags(%rip),%rdi
975 movq $-1, %rsi
976 movq %rsp, %rdx
977
	/* remaining do_fork arguments are zero */
978 xorl %r8d,%r8d
979 xorl %r9d,%r9d
980
981 # clone now
982 call do_fork
983 movq %rax,RAX(%rsp)
	/* rdi = 0, stored into the RIP slot below when do_fork returned 0 */
984 xorl %edi,%edi
Andi Kleen51ec28e2006-10-05 18:47:22 +0200985 test %rax,%rax
986 jnz 1f
987 /* terminate stack in child */
988 movq %rdi,RIP(%rsp)
9891:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700990
991 /*
992 * It isn't worth checking for reschedule here,
993 * so internally to the x86_64 port you can rely on kernel_thread()
994 * not to reschedule the child before returning, this avoids the need
995 * of hacks for example to fork off the per-CPU idle tasks.
996 * [Hopefully no generic code relies on the reschedule -AK]
997 */
998 RESTORE_ALL
999 UNFAKE_STACK_FRAME
1000 ret
1001 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001002ENDPROC(kernel_thread)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001003
/*
 * child_rip: address that kernel_thread places in its fake stack frame.
 * Calls fn(arg) using the register values described below, then calls
 * do_exit with a zero argument.
 */
1004child_rip:
Andi Kleenc05991e2006-08-30 19:37:08 +02001005 pushq $0 # fake return address
1006 CFI_STARTPROC
Linus Torvalds1da177e2005-04-16 15:20:36 -07001007 /*
1008 * Here we are in the child and the registers are set as they were
1009 * at kernel_thread() invocation in the parent.
1010 */
	/* rax = fn, rdi = arg (kernel_thread inputs were rdi: fn, rsi: arg) */
1011 movq %rdi, %rax
1012 movq %rsi, %rdi
1013 call *%rax
1014 # exit
	/* do_exit argument is zero */
Andi Kleen3829ee62005-07-28 21:15:48 -07001015 xorl %edi, %edi
Linus Torvalds1da177e2005-04-16 15:20:36 -07001016 call do_exit
Andi Kleenc05991e2006-08-30 19:37:08 +02001017 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001018ENDPROC(child_rip)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001019
1020/*
1021 * execve(). This function needs to use IRET, not SYSRET, to set up all state properly.
1022 *
1023 * C extern interface:
1024 * extern long execve(char *name, char **argv, char **envp)
1025 *
1026 * asm input arguments:
1027 * rdi: name, rsi: argv, rdx: envp
1028 *
1029 * We want to fallback into:
1030 * extern long sys_execve(char *name, char **argv,char **envp, struct pt_regs regs)
1031 *
1032 * do_sys_execve asm fallback arguments:
1033 * rdi: name, rsi: argv, rdx: envp, fake frame on the stack
1034 */
/*
 * A zero result from sys_execve leaves through int_ret_from_sys_call;
 * any other result unwinds the fake frame and returns to the caller.
 */
Arnd Bergmann3db03b42006-10-02 02:18:31 -07001035ENTRY(kernel_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036 CFI_STARTPROC
1037 FAKE_STACK_FRAME $0
1038 SAVE_ALL
1039 call sys_execve
	/* record the result in the RAX slot of the saved frame */
1040 movq %rax, RAX(%rsp)
1041 RESTORE_REST
	/* result == 0: leave through int_ret_from_sys_call instead of ret */
1042 testq %rax,%rax
1043 je int_ret_from_sys_call
1044 RESTORE_ARGS
1045 UNFAKE_STACK_FRAME
1046 ret
1047 CFI_ENDPROC
Arnd Bergmann3db03b42006-10-02 02:18:31 -07001048ENDPROC(kernel_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001049
/* Page fault entry: errorentry stub that hands do_page_fault to error_entry. */
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001050KPROBE_ENTRY(page_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001051 errorentry do_page_fault
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001052KPROBE_END(page_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053
/* zeroentry stub: dispatches to do_coprocessor_error via error_entry. */
1054ENTRY(coprocessor_error)
1055 zeroentry do_coprocessor_error
Jan Beulich4b787e02006-06-26 13:56:55 +02001056END(coprocessor_error)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001057
/* zeroentry stub: dispatches to do_simd_coprocessor_error via error_entry. */
1058ENTRY(simd_coprocessor_error)
1059 zeroentry do_simd_coprocessor_error
Jan Beulich4b787e02006-06-26 13:56:55 +02001060END(simd_coprocessor_error)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001061
/* zeroentry stub: the handler for this entry is math_state_restore. */
1062ENTRY(device_not_available)
1063 zeroentry math_state_restore
Jan Beulich4b787e02006-06-26 13:56:55 +02001064END(device_not_available)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001065
1066 /* runs on exception stack */
/*
 * Debug exception entry. Pushes 0 into the slot paranoidentry reads as
 * ORIG_RAX, calls do_debug with the DEBUG_STACK IST adjustment, and then
 * expands paranoidexit with its default trace=1. That expansion is what
 * defines the paranoid_exit1 label other entry points jump to.
 */
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001067KPROBE_ENTRY(debug)
Jan Beulich7effaa82005-09-12 18:49:24 +02001068 INTR_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069 pushq $0
1070 CFI_ADJUST_CFA_OFFSET 8
Andi Kleen5f8efbb2006-01-16 01:56:39 +01001071 paranoidentry do_debug, DEBUG_STACK
Ingo Molnar2601e642006-07-03 00:24:45 -07001072 paranoidexit
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001073KPROBE_END(debug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001074
1075 /* runs on exception stack */
/*
 * NMI entry. Pushes -1 into the slot paranoidentry reads as ORIG_RAX and
 * calls do_nmi with ist=0 and irqtrace=0. With CONFIG_TRACE_IRQFLAGS it
 * expands its own untraced exit path (paranoidexit 0); otherwise it shares
 * paranoid_exit1.
 */
Andi Kleeneddb6fb2006-02-03 21:50:41 +01001076KPROBE_ENTRY(nmi)
Jan Beulich7effaa82005-09-12 18:49:24 +02001077 INTR_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001078 pushq $-1
Jan Beulich7effaa82005-09-12 18:49:24 +02001079 CFI_ADJUST_CFA_OFFSET 8
Ingo Molnar2601e642006-07-03 00:24:45 -07001080 paranoidentry do_nmi, 0, 0
1081#ifdef CONFIG_TRACE_IRQFLAGS
1082 paranoidexit 0
1083#else
1084 jmp paranoid_exit1
1085 CFI_ENDPROC
1086#endif
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001087KPROBE_END(nmi)
Andi Kleen6fefb0d2005-04-16 15:25:03 -07001088
/*
 * int3 entry. Pushes 0 into the slot paranoidentry reads as ORIG_RAX,
 * calls do_int3 with the DEBUG_STACK IST adjustment and leaves through
 * paranoid_exit1.
 */
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001089KPROBE_ENTRY(int3)
Jan Beulichb556b352006-01-11 22:43:00 +01001090 INTR_FRAME
1091 pushq $0
1092 CFI_ADJUST_CFA_OFFSET 8
Andi Kleen5f8efbb2006-01-16 01:56:39 +01001093 paranoidentry do_int3, DEBUG_STACK
Ingo Molnar2601e642006-07-03 00:24:45 -07001094 jmp paranoid_exit1
Jan Beulichb556b352006-01-11 22:43:00 +01001095 CFI_ENDPROC
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001096KPROBE_END(int3)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001097
/* zeroentry stub: dispatches to do_overflow via error_entry. */
1098ENTRY(overflow)
1099 zeroentry do_overflow
Jan Beulich4b787e02006-06-26 13:56:55 +02001100END(overflow)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001101
/* zeroentry stub: dispatches to do_bounds via error_entry. */
1102ENTRY(bounds)
1103 zeroentry do_bounds
Jan Beulich4b787e02006-06-26 13:56:55 +02001104END(bounds)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001105
/* zeroentry stub: dispatches to do_invalid_op via error_entry. */
1106ENTRY(invalid_op)
1107 zeroentry do_invalid_op
Jan Beulich4b787e02006-06-26 13:56:55 +02001108END(invalid_op)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001109
/* zeroentry stub: dispatches to do_coprocessor_segment_overrun via error_entry. */
1110ENTRY(coprocessor_segment_overrun)
1111 zeroentry do_coprocessor_segment_overrun
Jan Beulich4b787e02006-06-26 13:56:55 +02001112END(coprocessor_segment_overrun)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001113
/* zeroentry stub: dispatches to do_reserved via error_entry. */
1114ENTRY(reserved)
1115 zeroentry do_reserved
Jan Beulich4b787e02006-06-26 13:56:55 +02001116END(reserved)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001117
1118 /* runs on exception stack */
/*
 * Double fault entry. Nothing is pushed here before paranoidentry, so the
 * ORIG_RAX slot it reads must already be on the stack on entry. Calls
 * do_double_fault (ist defaults to 0) and leaves through paranoid_exit1.
 */
1119ENTRY(double_fault)
Jan Beulich7effaa82005-09-12 18:49:24 +02001120 XCPT_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001121 paranoidentry do_double_fault
Ingo Molnar2601e642006-07-03 00:24:45 -07001122 jmp paranoid_exit1
Linus Torvalds1da177e2005-04-16 15:20:36 -07001123 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001124END(double_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001125
/* errorentry stub: dispatches to do_invalid_TSS via error_entry. */
1126ENTRY(invalid_TSS)
1127 errorentry do_invalid_TSS
Jan Beulich4b787e02006-06-26 13:56:55 +02001128END(invalid_TSS)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001129
/* errorentry stub: dispatches to do_segment_not_present via error_entry. */
1130ENTRY(segment_not_present)
1131 errorentry do_segment_not_present
Jan Beulich4b787e02006-06-26 13:56:55 +02001132END(segment_not_present)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001133
1134 /* runs on exception stack */
/*
 * Stack segment fault entry. Nothing is pushed here before paranoidentry,
 * so the ORIG_RAX slot it reads must already be on the stack on entry.
 * Calls do_stack_segment (ist defaults to 0) and leaves through
 * paranoid_exit1.
 */
1135ENTRY(stack_segment)
Jan Beulich7effaa82005-09-12 18:49:24 +02001136 XCPT_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001137 paranoidentry do_stack_segment
Ingo Molnar2601e642006-07-03 00:24:45 -07001138 jmp paranoid_exit1
Linus Torvalds1da177e2005-04-16 15:20:36 -07001139 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001140END(stack_segment)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001141
/* errorentry stub: dispatches to do_general_protection via error_entry. */
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -07001142KPROBE_ENTRY(general_protection)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001143 errorentry do_general_protection
Prasanna S.Pd28c4392006-09-26 10:52:34 +02001144KPROBE_END(general_protection)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001145
/* errorentry stub: dispatches to do_alignment_check via error_entry. */
1146ENTRY(alignment_check)
1147 errorentry do_alignment_check
Jan Beulich4b787e02006-06-26 13:56:55 +02001148END(alignment_check)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001149
/* zeroentry stub: dispatches to do_divide_error via error_entry. */
1150ENTRY(divide_error)
1151 zeroentry do_divide_error
Jan Beulich4b787e02006-06-26 13:56:55 +02001152END(divide_error)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001153
/* zeroentry stub: dispatches to do_spurious_interrupt_bug via error_entry. */
1154ENTRY(spurious_interrupt_bug)
1155 zeroentry do_spurious_interrupt_bug
Jan Beulich4b787e02006-06-26 13:56:55 +02001156END(spurious_interrupt_bug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001157
/*
 * Machine check entry, built only when CONFIG_X86_MCE is defined.
 * Pushes 0 into the slot paranoidentry reads as ORIG_RAX, calls
 * do_machine_check (ist defaults to 0) and leaves through paranoid_exit1.
 */
1158#ifdef CONFIG_X86_MCE
1159 /* runs on exception stack */
1160ENTRY(machine_check)
Jan Beulich7effaa82005-09-12 18:49:24 +02001161 INTR_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 pushq $0
1163 CFI_ADJUST_CFA_OFFSET 8
1164 paranoidentry do_machine_check
Ingo Molnar2601e642006-07-03 00:24:45 -07001165 jmp paranoid_exit1
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001167END(machine_check)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168#endif
1169
Andi Kleen26995002006-08-02 22:37:28 +02001170/* Call softirq on interrupt stack. Interrupts are off. */
/*
 * %rbp keeps the incoming stack pointer for the whole call, so leaveq
 * returns to the original stack whether or not the switch happened.
 * pda_irqcount is incremented before and decremented after __do_softirq.
 */
Andi Kleened6b6762005-07-28 21:15:49 -07001171ENTRY(call_softirq)
Jan Beulich7effaa82005-09-12 18:49:24 +02001172 CFI_STARTPROC
Andi Kleen26995002006-08-02 22:37:28 +02001173 push %rbp
1174 CFI_ADJUST_CFA_OFFSET 8
1175 CFI_REL_OFFSET rbp,0
1176 mov %rsp,%rbp
1177 CFI_DEF_CFA_REGISTER rbp
	/* switch to pda_irqstackptr only if the increment produced zero */
Andi Kleened6b6762005-07-28 21:15:49 -07001178 incl %gs:pda_irqcount
Andi Kleen26995002006-08-02 22:37:28 +02001179 cmove %gs:pda_irqstackptr,%rsp
1180 push %rbp # backlink for old unwinder
Andi Kleen7d0b0e82006-10-05 18:47:22 +02001181 CFI_ADJUST_CFA_OFFSET 8
Andi Kleened6b6762005-07-28 21:15:49 -07001182 call __do_softirq
	/* rsp = rbp, then pop rbp: back on the stack we entered with */
Andi Kleen26995002006-08-02 22:37:28 +02001183 leaveq
Jan Beulich7effaa82005-09-12 18:49:24 +02001184 CFI_DEF_CFA_REGISTER rsp
Andi Kleen26995002006-08-02 22:37:28 +02001185 CFI_ADJUST_CFA_OFFSET -8
Andi Kleened6b6762005-07-28 21:15:49 -07001186 decl %gs:pda_irqcount
Andi Kleened6b6762005-07-28 21:15:49 -07001187 ret
Jan Beulich7effaa82005-09-12 18:49:24 +02001188 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +02001189ENDPROC(call_softirq)
Jan Beulichb538ed22006-06-26 13:57:32 +02001190
/*
 * arch_unwind_init_running, built only when CONFIG_STACK_UNWIND is defined.
 *
 * In:  rdi = base of a register frame addressed with the R15..SS offsets
 *            (presumably a struct pt_regs - confirm against the C prototype)
 *      rsi = address that is jumped to at the end
 *      rdx = value handed on to that target in rsi
 *
 * Fills the frame with the current rbx, rbp and r12-r15, the return address
 * of this call as RIP, the stack pointer the caller will have after return
 * as RSP, __KERNEL_CS and __KERNEL_DS as CS and SS, and zero in every other
 * slot written here. It then tail-jumps to the target with rdi unchanged
 * and the original rsi and rdx exchanged.
 */
1191#ifdef CONFIG_STACK_UNWIND
1192ENTRY(arch_unwind_init_running)
1193 CFI_STARTPROC
1194 movq %r15, R15(%rdi)
1195 movq %r14, R14(%rdi)
	/* rdx = jump target (old rsi), rsi = old rdx */
1196 xchgq %rsi, %rdx
1197 movq %r13, R13(%rdi)
1198 movq %r12, R12(%rdi)
	/* rax = 0, the value stored into the remaining slots below */
1199 xorl %eax, %eax
1200 movq %rbp, RBP(%rdi)
1201 movq %rbx, RBX(%rdi)
	/* rcx = return address of this call */
1202 movq (%rsp), %rcx
1203 movq %rax, R11(%rdi)
1204 movq %rax, R10(%rdi)
1205 movq %rax, R9(%rdi)
1206 movq %rax, R8(%rdi)
1207 movq %rax, RAX(%rdi)
1208 movq %rax, RCX(%rdi)
1209 movq %rax, RDX(%rdi)
1210 movq %rax, RSI(%rdi)
1211 movq %rax, RDI(%rdi)
1212 movq %rax, ORIG_RAX(%rdi)
1213 movq %rcx, RIP(%rdi)
	/* rcx = stack pointer as it will be once the return address is popped */
1214 leaq 8(%rsp), %rcx
1215 movq $__KERNEL_CS, CS(%rdi)
1216 movq %rax, EFLAGS(%rdi)
1217 movq %rcx, RSP(%rdi)
1218 movq $__KERNEL_DS, SS(%rdi)
	/* tail call: the target returns directly to our caller */
1219 jmpq *%rdx
1220 CFI_ENDPROC
1221ENDPROC(arch_unwind_init_running)
1222#endif