blob: ea32688386fd85148e2d466290bd32ef69707d4d [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/x86_64/entry.S
3 *
4 * Copyright (C) 1991, 1992 Linus Torvalds
5 * Copyright (C) 2000, 2001, 2002 Andi Kleen SuSE Labs
6 * Copyright (C) 2000 Pavel Machek <pavel@suse.cz>
Linus Torvalds1da177e2005-04-16 15:20:36 -07007 */
8
9/*
10 * entry.S contains the system-call and fault low-level handling routines.
11 *
12 * NOTE: This code handles signal-recognition, which happens every time
13 * after an interrupt and after each system call.
14 *
15 * Normal syscalls and interrupts don't save a full stack frame, this is
16 * only done for syscall tracing, signals or fork/exec et.al.
17 *
18 * A note on terminology:
19 * - top of stack: Architecture defined interrupt frame from SS to RIP
20 * at the top of the kernel process stack.
21 * - partial stack frame: partially saved registers up to R11.
22 * - full stack frame: Like partial stack frame, but all registers saved.
Andi Kleen2e91a172006-09-26 10:52:29 +020023 *
24 * Some macro usage:
25 * - CFI macros are used to generate dwarf2 unwind information for better
26 * backtraces. They don't change any code.
27 * - SAVE_ALL/RESTORE_ALL - Save/restore all registers
28 * - SAVE_ARGS/RESTORE_ARGS - Save/restore registers that C functions modify.
29 * There are unfortunately lots of special cases where some registers
30 * are not touched. The macro is a big mess that should be cleaned up.
31 * - SAVE_REST/RESTORE_REST - Handle the registers not saved by SAVE_ARGS.
32 * Gives a full stack frame.
33 * - ENTRY/END Define functions in the symbol table.
34 * - FIXUP_TOP_OF_STACK/RESTORE_TOP_OF_STACK - Fix up the hardware stack
35 * frame that is otherwise undefined after a SYSCALL
36 * - TRACE_IRQ_* - Trace hard interrupt state for lock debugging.
37 * - errorentry/paranoidentry/zeroentry - Define exception entry points.
Linus Torvalds1da177e2005-04-16 15:20:36 -070038 */
39
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#include <linux/linkage.h>
41#include <asm/segment.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#include <asm/cache.h>
43#include <asm/errno.h>
44#include <asm/dwarf2.h>
45#include <asm/calling.h>
Sam Ravnborge2d5df92005-09-09 21:28:48 +020046#include <asm/asm-offsets.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070047#include <asm/msr.h>
48#include <asm/unistd.h>
49#include <asm/thread_info.h>
50#include <asm/hw_irq.h>
Andi Kleen5f8efbb2006-01-16 01:56:39 +010051#include <asm/page.h>
Ingo Molnar2601e642006-07-03 00:24:45 -070052#include <asm/irqflags.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
54 .code64
55
/*
 * Without CONFIG_PREEMPT this file defines no retint_kernel label of its
 * own (the label only exists inside the CONFIG_PREEMPT section further
 * down), so the name is mapped to retint_restore_args.
 */
Andi Kleendc37db42005-04-16 15:25:05 -070056#ifndef CONFIG_PREEMPT
Linus Torvalds1da177e2005-04-16 15:20:36 -070057#define retint_kernel retint_restore_args
58#endif
Ingo Molnar2601e642006-07-03 00:24:45 -070059
60
/*
 * TRACE_IRQS_IRETQ [offset]: used just before an iretq.
 * Under CONFIG_TRACE_IRQFLAGS it tests bit 9 of the saved EFLAGS slot at
 * EFLAGS-offset(%rsp) and invokes TRACE_IRQS_ON only when that bit is set.
 * Without CONFIG_TRACE_IRQFLAGS the macro expands to nothing.
 * offset defaults to ARGOFFSET. Modifies the flags register.
 */
61.macro TRACE_IRQS_IRETQ offset=ARGOFFSET
62#ifdef CONFIG_TRACE_IRQFLAGS
63 bt $9,EFLAGS-\offset(%rsp) /* interrupts off? */
64 jnc 1f
65 TRACE_IRQS_ON
661:
67#endif
68.endm
69
Linus Torvalds1da177e2005-04-16 15:20:36 -070070/*
71 * C code is not supposed to know about undefined top of stack. Every time
72 * a C function with a pt_regs argument is called from the SYSCALL based
73 * fast path FIXUP_TOP_OF_STACK is needed.
74 * RESTORE_TOP_OF_STACK syncs the syscall state after any possible ptregs
75 * manipulation.
76 */
77
/*
 * FIXUP_TOP_OF_STACK tmp
 * Fills in the top-of-stack slots of the frame at %rsp:
 *   RSP    <- %gs:pda_oldrsp
 *   SS     <- __USER_DS
 *   CS     <- __USER_CS
 *   RCX    <- -1
 *   EFLAGS <- value held in the R11 slot
 * tmp is a scratch register and is clobbered.
 */
78 /* %rsp:at FRAMEEND */
79 .macro FIXUP_TOP_OF_STACK tmp
80 movq %gs:pda_oldrsp,\tmp
81 movq \tmp,RSP(%rsp)
82 movq $__USER_DS,SS(%rsp)
83 movq $__USER_CS,CS(%rsp)
84 movq $-1,RCX(%rsp)
85 movq R11(%rsp),\tmp /* get eflags */
86 movq \tmp,EFLAGS(%rsp)
87 .endm
88
/*
 * RESTORE_TOP_OF_STACK tmp [,offset]
 * Copies the frame's RSP slot back to %gs:pda_oldrsp and the EFLAGS slot
 * back into the R11 slot. offset (default 0) is subtracted from every slot
 * offset, for callers whose %rsp does not point at the start of the frame.
 * tmp is a scratch register and is clobbered.
 */
89 .macro RESTORE_TOP_OF_STACK tmp,offset=0
90 movq RSP-\offset(%rsp),\tmp
91 movq \tmp,%gs:pda_oldrsp
92 movq EFLAGS-\offset(%rsp),\tmp
93 movq \tmp,R11-\offset(%rsp)
94 .endm
95
/*
 * FAKE_STACK_FRAME child_rip
 * Pushes six quadwords: ss = 0, rsp = 0, eflags = 1<<9, cs = __KERNEL_CS,
 * rip = child_rip, orig rax = 0. The CFA offset is adjusted by 8 after each
 * push. Clobbers %rax (zeroed by the xorl) and the flags.
 * UNFAKE_STACK_FRAME removes the same six quadwords.
 */
96 .macro FAKE_STACK_FRAME child_rip
97 /* push in order ss, rsp, eflags, cs, rip */
Andi Kleen3829ee62005-07-28 21:15:48 -070098 xorl %eax, %eax
Linus Torvalds1da177e2005-04-16 15:20:36 -070099 pushq %rax /* ss */
100 CFI_ADJUST_CFA_OFFSET 8
Jan Beulich7effaa82005-09-12 18:49:24 +0200101 /*CFI_REL_OFFSET ss,0*/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102 pushq %rax /* rsp */
103 CFI_ADJUST_CFA_OFFSET 8
Jan Beulich7effaa82005-09-12 18:49:24 +0200104 CFI_REL_OFFSET rsp,0
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105 pushq $(1<<9) /* eflags - interrupts on */
106 CFI_ADJUST_CFA_OFFSET 8
Jan Beulich7effaa82005-09-12 18:49:24 +0200107 /*CFI_REL_OFFSET rflags,0*/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700108 pushq $__KERNEL_CS /* cs */
109 CFI_ADJUST_CFA_OFFSET 8
Jan Beulich7effaa82005-09-12 18:49:24 +0200110 /*CFI_REL_OFFSET cs,0*/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 pushq \child_rip /* rip */
112 CFI_ADJUST_CFA_OFFSET 8
Jan Beulich7effaa82005-09-12 18:49:24 +0200113 CFI_REL_OFFSET rip,0
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 pushq %rax /* orig rax */
115 CFI_ADJUST_CFA_OFFSET 8
116 .endm
117
/*
 * UNFAKE_STACK_FRAME
 * Drops six quadwords (6*8 bytes) from the stack, matching the six pushes
 * done by FAKE_STACK_FRAME, and adjusts the CFA offset accordingly.
 */
118 .macro UNFAKE_STACK_FRAME
119 addq $8*6, %rsp
120 CFI_ADJUST_CFA_OFFSET -(6*8)
121 .endm
122
/*
 * CFI_DEFAULT_STACK [start]
 * Emits unwind annotations only (no instructions) describing a frame in
 * which every general register, plus rip and rsp, sits at its named slot
 * offset from %rsp.
 *   start=1 (default): open a new "simple" CFI procedure, CFA = rsp + SS+8.
 *   start=0:           only reset the CFA offset to SS+8.
 * The cs, rflags and ss annotations are commented out in the original.
 */
Jan Beulich7effaa82005-09-12 18:49:24 +0200123 .macro CFI_DEFAULT_STACK start=1
124 .if \start
125 CFI_STARTPROC simple
126 CFI_DEF_CFA rsp,SS+8
127 .else
128 CFI_DEF_CFA_OFFSET SS+8
129 .endif
130 CFI_REL_OFFSET r15,R15
131 CFI_REL_OFFSET r14,R14
132 CFI_REL_OFFSET r13,R13
133 CFI_REL_OFFSET r12,R12
134 CFI_REL_OFFSET rbp,RBP
135 CFI_REL_OFFSET rbx,RBX
136 CFI_REL_OFFSET r11,R11
137 CFI_REL_OFFSET r10,R10
138 CFI_REL_OFFSET r9,R9
139 CFI_REL_OFFSET r8,R8
140 CFI_REL_OFFSET rax,RAX
141 CFI_REL_OFFSET rcx,RCX
142 CFI_REL_OFFSET rdx,RDX
143 CFI_REL_OFFSET rsi,RSI
144 CFI_REL_OFFSET rdi,RDI
145 CFI_REL_OFFSET rip,RIP
146 /*CFI_REL_OFFSET cs,CS*/
147 /*CFI_REL_OFFSET rflags,EFLAGS*/
148 CFI_REL_OFFSET rsp,RSP
149 /*CFI_REL_OFFSET ss,SS*/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150 .endm
151/*
152 * A newly forked process directly context switches into this.
153 */
154/* rdi: prev */
/*
 * Flow:
 *  1. call schedule_tail.
 *  2. If _TIF_SYSCALL_TRACE or _TIF_SYSCALL_AUDIT is set, call
 *     syscall_trace_leave with %rsp as its argument (rff_trace).
 *  3. RESTORE_REST, then pick the exit path from the saved CS and flags:
 *       - privilege bits of CS clear (kernel thread): int_ret_from_sys_call
 *       - _TIF_IA32 set:                             int_ret_from_sys_call
 *       - otherwise: RESTORE_TOP_OF_STACK and leave via ret_from_sys_call.
 */
155ENTRY(ret_from_fork)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156 CFI_DEFAULT_STACK
157 call schedule_tail
158 GET_THREAD_INFO(%rcx)
159 testl $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT),threadinfo_flags(%rcx)
160 jnz rff_trace
161rff_action:
162 RESTORE_REST
163 testl $3,CS-ARGOFFSET(%rsp) # from kernel_thread?
164 je int_ret_from_sys_call
165 testl $_TIF_IA32,threadinfo_flags(%rcx)
166 jnz int_ret_from_sys_call
167 RESTORE_TOP_OF_STACK %rdi,ARGOFFSET
168 jmp ret_from_sys_call
169rff_trace:
 /* full frame is still on the stack here: %rsp is passed as the argument */
170 movq %rsp,%rdi
171 call syscall_trace_leave
 /* reload %rcx: rff_action reads threadinfo_flags(%rcx) after the call */
172 GET_THREAD_INFO(%rcx)
173 jmp rff_action
174 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200175END(ret_from_fork)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176
177/*
178 * System call entry. Up to 6 arguments in registers are supported.
179 *
180 * SYSCALL does not save anything on the stack and does not change the
181 * stack pointer.
182 */
183
184/*
185 * Register setup:
186 * rax system call number
187 * rdi arg0
188 * rcx return address for syscall/sysret, C arg3
189 * rsi arg1
190 * rdx arg2
191 * r10 arg3 (--> moved to rcx for C)
192 * r8 arg4
193 * r9 arg5
194 * r11 eflags for syscall/sysret, temporary for C
195 * r12-r15,rbp,rbx saved by C code, not touched.
196 *
197 * Interrupts are off on entry.
198 * Only called from user space.
199 *
200 * XXX if we had a free scratch register we could save the RSP into the stack frame
201 * and report it properly in ps. Unfortunately we haven't.
Andi Kleen7bf36bb2006-04-07 19:50:00 +0200202 *
203 * When user can change the frames always force IRET. That is because
204 * it deals with uncanonical addresses better. SYSRET has trouble
205 * with them due to bugs in both AMD and Intel CPUs.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206 */
207
208ENTRY(system_call)
Jan Beulich7effaa82005-09-12 18:49:24 +0200209 CFI_STARTPROC simple
Jan Beulichdffead42006-06-26 13:57:38 +0200210 CFI_DEF_CFA rsp,PDA_STACKOFFSET
Jan Beulich7effaa82005-09-12 18:49:24 +0200211 CFI_REGISTER rip,rcx
212 /*CFI_REGISTER rflags,r11*/
 /*
  * Switch to the kernel gs, stash the incoming %rsp in the PDA and load
  * the stack pointer kept in pda_kernelstack.
  */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213 swapgs
214 movq %rsp,%gs:pda_oldrsp
215 movq %gs:pda_kernelstack,%rsp
Ingo Molnar2601e642006-07-03 00:24:45 -0700216 /*
217 * No need to follow this irqs off/on section - it's straight
218 * and short:
219 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 sti
221 SAVE_ARGS 8,1
 /* record the syscall number in the orig_rax slot */
222 movq %rax,ORIG_RAX-ARGOFFSET(%rsp)
 /* %rcx carries the return address (see "Register setup" above) */
Jan Beulich7effaa82005-09-12 18:49:24 +0200223 movq %rcx,RIP-ARGOFFSET(%rsp)
224 CFI_REL_OFFSET rip,RIP-ARGOFFSET
Linus Torvalds1da177e2005-04-16 15:20:36 -0700225 GET_THREAD_INFO(%rcx)
 /* any trace/audit/seccomp flag set: take the tracesys path */
226 testl $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SECCOMP),threadinfo_flags(%rcx)
Jan Beulich7effaa82005-09-12 18:49:24 +0200227 CFI_REMEMBER_STATE
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 jnz tracesys
 /* unsigned compare: numbers above __NR_syscall_max go to badsys */
229 cmpq $__NR_syscall_max,%rax
230 ja badsys
 /* arg3 arrives in %r10; the C handlers expect it in %rcx */
231 movq %r10,%rcx
232 call *sys_call_table(,%rax,8) # XXX: rip relative
 /* store the handler's return value in the saved-rax slot */
233 movq %rax,RAX-ARGOFFSET(%rsp)
234/*
235 * Syscall return path ending with SYSRET (fast path)
236 * Has incomplete stack frame and undefined top of stack.
237 */
 /*
  * ret_from_sys_call loads the full work mask into %edi and falls into
  * sysret_check. sysret_check disables interrupts, reads the thread flags
  * and branches to sysret_careful when any bit in the mask is set.
  * Otherwise it reloads the return address into %rcx, restores the
  * argument registers, reloads %rsp from the PDA and executes sysretq.
  */
238 .globl ret_from_sys_call
239ret_from_sys_call:
Andi Kleen11b854b2005-04-16 15:25:02 -0700240 movl $_TIF_ALLWORK_MASK,%edi
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241 /* edi: flagmask */
242sysret_check:
243 GET_THREAD_INFO(%rcx)
244 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700245 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246 movl threadinfo_flags(%rcx),%edx
247 andl %edi,%edx
Jan Beulich7effaa82005-09-12 18:49:24 +0200248 CFI_REMEMBER_STATE
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 jnz sysret_careful
Ingo Molnar2601e642006-07-03 00:24:45 -0700250 /*
251 * sysretq will re-enable interrupts:
252 */
253 TRACE_IRQS_ON
 /* return address goes back into %rcx for sysretq */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254 movq RIP-ARGOFFSET(%rsp),%rcx
Jan Beulich7effaa82005-09-12 18:49:24 +0200255 CFI_REGISTER rip,rcx
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256 RESTORE_ARGS 0,-ARG_SKIP,1
Jan Beulich7effaa82005-09-12 18:49:24 +0200257 /*CFI_REGISTER rflags,r11*/
 /* reload the stack pointer stored in the PDA, then switch gs back */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258 movq %gs:pda_oldrsp,%rsp
259 swapgs
260 sysretq
261
 /*
  * Work is pending on the fast return path. If TIF_NEED_RESCHED is set,
  * enable interrupts and call schedule, keeping the work mask in %rdi
  * across the call via push/pop, then recheck at sysret_check.
  * Any other pending work is handled at sysret_signal.
  */
262 /* Handle reschedules */
263 /* edx: work, edi: workmask */
264sysret_careful:
Jan Beulich7effaa82005-09-12 18:49:24 +0200265 CFI_RESTORE_STATE
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 bt $TIF_NEED_RESCHED,%edx
267 jnc sysret_signal
Ingo Molnar2601e642006-07-03 00:24:45 -0700268 TRACE_IRQS_ON
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269 sti
270 pushq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200271 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272 call schedule
273 popq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200274 CFI_ADJUST_CFA_OFFSET -8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 jmp sysret_check
276
 /*
  * Reached from sysret_careful when TIF_NEED_RESCHED is not set.
  * With interrupts enabled: if any of SIGPENDING/NOTIFY_RESUME/SINGLESTEP
  * is pending, call do_notify_resume through ptregscall_common
  * (%rax = function, %rdi = &pt_regs, %esi = 0, %edx = work flags).
  * Afterwards the mask is reduced to _TIF_NEED_RESCHED and the return
  * continues on the IRET path at int_with_check with interrupts off.
  */
277 /* Handle a signal */
278sysret_signal:
Ingo Molnar2601e642006-07-03 00:24:45 -0700279 TRACE_IRQS_ON
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280 sti
Andi Kleen10ffdbb2005-05-16 21:53:19 -0700281 testl $(_TIF_SIGPENDING|_TIF_NOTIFY_RESUME|_TIF_SINGLESTEP),%edx
282 jz 1f
283
284 /* Really a signal */
285 /* edx: work flags (arg3) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286 leaq do_notify_resume(%rip),%rax
287 leaq -ARGOFFSET(%rsp),%rdi # &pt_regs -> arg1
288 xorl %esi,%esi # oldset -> arg2
289 call ptregscall_common
Andi Kleen10ffdbb2005-05-16 21:53:19 -07002901: movl $_TIF_NEED_RESCHED,%edi
Andi Kleen7bf36bb2006-04-07 19:50:00 +0200291 /* Use IRET because user could have changed frame. This
292 works because ptregscall_common has called FIXUP_TOP_OF_STACK. */
293 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700294 TRACE_IRQS_OFF
Andi Kleen7bf36bb2006-04-07 19:50:00 +0200295 jmp int_with_check
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296
 /*
  * Fast-path target for a syscall number above __NR_syscall_max: store
  * -ENOSYS in the saved-rax slot and take the normal return path.
  */
Jan Beulich7effaa82005-09-12 18:49:24 +0200297badsys:
298 movq $-ENOSYS,RAX-ARGOFFSET(%rsp)
299 jmp ret_from_sys_call
300
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301 /* Do syscall tracing */
 /*
  * Slow path taken from system_call when a trace/audit/seccomp flag is set.
  * Builds a full frame (SAVE_REST + FIXUP_TOP_OF_STACK), presets the
  * saved-rax slot to -ENOSYS and calls syscall_trace_enter(&pt_regs).
  * The argument registers and %rax are then reloaded from the frame, the
  * handler is dispatched through sys_call_table, and the result is stored
  * in the saved-rax slot. Always leaves through int_ret_from_sys_call.
  *
  * After LOAD_ARGS, %rax holds the (possibly tracer-modified) syscall
  * number. If it is out of range, %rax is replaced with -ENOSYS before
  * the store at 1:, so the raw number is never returned as the result.
  * This matches what badsys does on the fast path.
  */
302tracesys:
Jan Beulich7effaa82005-09-12 18:49:24 +0200303 CFI_RESTORE_STATE
Linus Torvalds1da177e2005-04-16 15:20:36 -0700304 SAVE_REST
305 movq $-ENOSYS,RAX(%rsp)
306 FIXUP_TOP_OF_STACK %rdi
307 movq %rsp,%rdi
308 call syscall_trace_enter
309 LOAD_ARGS ARGOFFSET /* reload args from stack in case ptrace changed it */
310 RESTORE_REST
311 cmpq $__NR_syscall_max,%rax
 /*
  * movq and cmova do not modify the flags, so the ja below still acts on
  * the cmpq result. %rcx is free here: it is reloaded from %r10 on the
  * valid path and by GET_THREAD_INFO on the return path.
  */
 movq $-ENOSYS,%rcx
 cmova %rcx,%rax /* out of range: result is -ENOSYS */
312 ja 1f
313 movq %r10,%rcx /* fixup for C */
314 call *sys_call_table(,%rax,8)
Andi Kleen822ff012006-05-30 22:48:03 +02003151: movq %rax,RAX-ARGOFFSET(%rsp)
Andi Kleen7bf36bb2006-04-07 19:50:00 +0200316 /* Use IRET because user could have changed frame */
317 jmp int_ret_from_sys_call
Jan Beulich7effaa82005-09-12 18:49:24 +0200318 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200319END(system_call)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321/*
322 * Syscall return path ending with IRET.
323 * Has correct top of stack, but partial stack frame.
324 */
 /*
  * Entry: partial frame on the stack, %rsp at ARGOFFSET into it.
  * Disables interrupts. A return to kernel mode (privilege bits of the
  * saved CS clear) goes straight to retint_restore_args.
  * Otherwise int_with_check tests the thread flags against the mask in
  * %edi: pending work goes to int_careful. With no work pending,
  * TS_COMPAT is cleared in the thread status and the return goes to
  * retint_swapgs.
  */
Jan Beulich7effaa82005-09-12 18:49:24 +0200325ENTRY(int_ret_from_sys_call)
326 CFI_STARTPROC simple
327 CFI_DEF_CFA rsp,SS+8-ARGOFFSET
328 /*CFI_REL_OFFSET ss,SS-ARGOFFSET*/
329 CFI_REL_OFFSET rsp,RSP-ARGOFFSET
330 /*CFI_REL_OFFSET rflags,EFLAGS-ARGOFFSET*/
331 /*CFI_REL_OFFSET cs,CS-ARGOFFSET*/
332 CFI_REL_OFFSET rip,RIP-ARGOFFSET
333 CFI_REL_OFFSET rdx,RDX-ARGOFFSET
334 CFI_REL_OFFSET rcx,RCX-ARGOFFSET
335 CFI_REL_OFFSET rax,RAX-ARGOFFSET
336 CFI_REL_OFFSET rdi,RDI-ARGOFFSET
337 CFI_REL_OFFSET rsi,RSI-ARGOFFSET
338 CFI_REL_OFFSET r8,R8-ARGOFFSET
339 CFI_REL_OFFSET r9,R9-ARGOFFSET
340 CFI_REL_OFFSET r10,R10-ARGOFFSET
341 CFI_REL_OFFSET r11,R11-ARGOFFSET
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700343 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344 testl $3,CS-ARGOFFSET(%rsp)
345 je retint_restore_args
346 movl $_TIF_ALLWORK_MASK,%edi
347 /* edi: mask to check */
348int_with_check:
349 GET_THREAD_INFO(%rcx)
350 movl threadinfo_flags(%rcx),%edx
351 andl %edi,%edx
352 jnz int_careful
Andi Kleenbf2fcc62006-01-11 22:44:06 +0100353 andl $~TS_COMPAT,threadinfo_status(%rcx)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 jmp retint_swapgs
355
 /*
  * If TIF_NEED_RESCHED is set: enable interrupts, call schedule with the
  * work mask in %rdi kept across the call via push/pop, disable interrupts
  * again and recheck at int_with_check. Otherwise go to int_very_careful.
  */
356 /* Either reschedule or signal or syscall exit tracking needed. */
357 /* First do a reschedule test. */
358 /* edx: work, edi: workmask */
359int_careful:
360 bt $TIF_NEED_RESCHED,%edx
361 jnc int_very_careful
Ingo Molnar2601e642006-07-03 00:24:45 -0700362 TRACE_IRQS_ON
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363 sti
364 pushq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200365 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700366 call schedule
367 popq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200368 CFI_ADJUST_CFA_OFFSET -8
Andi Kleencdd219c2005-04-16 15:25:04 -0700369 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700370 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700371 jmp int_with_check
372
 /*
  * Enables interrupts and completes the frame with SAVE_REST.
  * If a trace/audit/singlestep bit is pending, call
  * syscall_trace_leave(&pt_regs), then clear those bits from the work mask
  * in %edi and continue at int_restore_rest. Otherwise go to int_signal.
  */
373 /* handle signals and tracing -- both require a full stack frame */
374int_very_careful:
Ingo Molnar2601e642006-07-03 00:24:45 -0700375 TRACE_IRQS_ON
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 sti
377 SAVE_REST
378 /* Check for syscall exit trace */
379 testl $(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SINGLESTEP),%edx
380 jz int_signal
381 pushq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200382 CFI_ADJUST_CFA_OFFSET 8
 /* 8(%rsp): skip the %rdi just pushed to reach the frame */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383 leaq 8(%rsp),%rdi # &ptregs -> arg1
384 call syscall_trace_leave
385 popq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200386 CFI_ADJUST_CFA_OFFSET -8
Andi Kleen36c11042005-04-16 15:25:01 -0700387 andl $~(_TIF_SYSCALL_TRACE|_TIF_SYSCALL_AUDIT|_TIF_SINGLESTEP),%edi
Andi Kleenbe9e6872005-05-01 08:58:51 -0700388 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700389 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390 jmp int_restore_rest
391
 /*
  * Full frame is on the stack (SAVE_REST was done in int_very_careful).
  * If NOTIFY_RESUME/SIGPENDING/SINGLESTEP is pending, call
  * do_notify_resume(&pt_regs, 0) with the work flags still in %edx.
  * The mask is then reduced to _TIF_NEED_RESCHED. int_restore_rest undoes
  * SAVE_REST, disables interrupts and rechecks at int_with_check.
  */
392int_signal:
393 testl $(_TIF_NOTIFY_RESUME|_TIF_SIGPENDING|_TIF_SINGLESTEP),%edx
394 jz 1f
395 movq %rsp,%rdi # &ptregs -> arg1
396 xorl %esi,%esi # oldset -> arg2
397 call do_notify_resume
3981: movl $_TIF_NEED_RESCHED,%edi
399int_restore_rest:
400 RESTORE_REST
Andi Kleenbe9e6872005-05-01 08:58:51 -0700401 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700402 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700403 jmp int_with_check
404 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200405END(int_ret_from_sys_call)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406
407/*
408 * Certain special system calls that need to save a complete full stack frame.
409 */
410
/*
 * PTREGSCALL label,func,arg
 * Defines the global stub `label`. The stub loads the address of `func`
 * into %rax, points register `arg` at the pt_regs frame (the +8 skips the
 * return address on top of the stack) and jumps to ptregscall_common,
 * which performs the actual call.
 */
411 .macro PTREGSCALL label,func,arg
412 .globl \label
413\label:
414 leaq \func(%rip),%rax
415 leaq -ARGOFFSET+8(%rsp),\arg /* 8 for return address */
416 jmp ptregscall_common
Jan Beulich4b787e02006-06-26 13:56:55 +0200417END(\label)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700418 .endm
419
/*
 * Stub instantiations. The third operand is the register that receives
 * the pt_regs pointer for the named handler. The CFI procedure opened
 * here spans all the stubs and is closed at the end of ptregscall_common.
 */
Jan Beulich7effaa82005-09-12 18:49:24 +0200420 CFI_STARTPROC
421
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422 PTREGSCALL stub_clone, sys_clone, %r8
423 PTREGSCALL stub_fork, sys_fork, %rdi
424 PTREGSCALL stub_vfork, sys_vfork, %rdi
425 PTREGSCALL stub_rt_sigsuspend, sys_rt_sigsuspend, %rdx
426 PTREGSCALL stub_sigaltstack, sys_sigaltstack, %rdx
427 PTREGSCALL stub_iopl, sys_iopl, %rsi
428
/*
 * ptregscall_common
 * In:  %rax = address of the function to call; return address on top of
 *      the stack; argument registers already set up by the caller.
 * Pops the return address, completes the frame (SAVE_REST +
 * FIXUP_TOP_OF_STACK), calls *%rax, syncs the frame back with
 * RESTORE_TOP_OF_STACK, undoes SAVE_REST, then pushes the return address
 * back and returns to it.
 * The return address is parked in %r15 across the call.
 * NOTE(review): this relies on SAVE_REST/RESTORE_REST preserving the
 * caller's %r15 - confirm in asm/calling.h.
 */
429ENTRY(ptregscall_common)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700430 popq %r11
Jan Beulich7effaa82005-09-12 18:49:24 +0200431 CFI_ADJUST_CFA_OFFSET -8
432 CFI_REGISTER rip, r11
Linus Torvalds1da177e2005-04-16 15:20:36 -0700433 SAVE_REST
434 movq %r11, %r15
Jan Beulich7effaa82005-09-12 18:49:24 +0200435 CFI_REGISTER rip, r15
 /* %r11 is free to use as the scratch register now */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700436 FIXUP_TOP_OF_STACK %r11
437 call *%rax
438 RESTORE_TOP_OF_STACK %r11
439 movq %r15, %r11
Jan Beulich7effaa82005-09-12 18:49:24 +0200440 CFI_REGISTER rip, r11
Linus Torvalds1da177e2005-04-16 15:20:36 -0700441 RESTORE_REST
442 pushq %r11
Jan Beulich7effaa82005-09-12 18:49:24 +0200443 CFI_ADJUST_CFA_OFFSET 8
444 CFI_REL_OFFSET rip, 0
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445 ret
446 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200447END(ptregscall_common)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700448
/*
 * stub_execve
 * Pops the return address into %r11 and never pushes it back: the stub
 * does not return to its caller. It completes the frame, calls
 * sys_execve, stores the result in the saved-rax slot and leaves through
 * int_ret_from_sys_call.
 */
449ENTRY(stub_execve)
450 CFI_STARTPROC
451 popq %r11
Jan Beulich7effaa82005-09-12 18:49:24 +0200452 CFI_ADJUST_CFA_OFFSET -8
453 CFI_REGISTER rip, r11
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 SAVE_REST
Linus Torvalds1da177e2005-04-16 15:20:36 -0700455 FIXUP_TOP_OF_STACK %r11
456 call sys_execve
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 RESTORE_TOP_OF_STACK %r11
Linus Torvalds1da177e2005-04-16 15:20:36 -0700458 movq %rax,RAX(%rsp)
459 RESTORE_REST
460 jmp int_ret_from_sys_call
461 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200462END(stub_execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463
464/*
465 * sigreturn is special because it needs to restore all registers on return.
466 * This cannot be done with SYSRET, so use the IRET return path instead.
467 */
468ENTRY(stub_rt_sigreturn)
469 CFI_STARTPROC
 /* discard the return address: this stub leaves via the IRET path */
Jan Beulich7effaa82005-09-12 18:49:24 +0200470 addq $8, %rsp
471 CFI_ADJUST_CFA_OFFSET -8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472 SAVE_REST
 /* %rdi = %rsp (start of the full frame) is the argument to the handler */
473 movq %rsp,%rdi
474 FIXUP_TOP_OF_STACK %r11
475 call sys_rt_sigreturn
476 movq %rax,RAX(%rsp) # fixme, this could be done at the higher layer
477 RESTORE_REST
478 jmp int_ret_from_sys_call
479 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200480END(stub_rt_sigreturn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481
Jan Beulich7effaa82005-09-12 18:49:24 +0200482/*
483 * initial frame state for interrupts and exceptions
484 */
/*
 * _frame ref
 * Opens a "simple" CFI procedure for code entered with %rsp pointing at
 * the frame slot named by `ref`. The CFA and the saved rsp/rip locations
 * are expressed relative to that slot. Emits annotations only.
 */
485 .macro _frame ref
486 CFI_STARTPROC simple
487 CFI_DEF_CFA rsp,SS+8-\ref
488 /*CFI_REL_OFFSET ss,SS-\ref*/
489 CFI_REL_OFFSET rsp,RSP-\ref
490 /*CFI_REL_OFFSET rflags,EFLAGS-\ref*/
491 /*CFI_REL_OFFSET cs,CS-\ref*/
492 CFI_REL_OFFSET rip,RIP-\ref
493 .endm
494
495/* initial frame state for interrupts (and exceptions without error code) */
496#define INTR_FRAME _frame RIP
497/* initial frame state for exceptions with error code (and interrupts with
498 vector already pushed) */
499#define XCPT_FRAME _frame ORIG_RAX
500
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501/*
502 * Interrupt entry/exit.
503 *
504 * Interrupt entry points save only callee clobbered registers in fast path.
505 *
506 * Entry runs with interrupts off.
507 */
508
/*
 * interrupt func
 * Common interrupt prologue:
 *  - saves the argument registers (SAVE_ARGS) and sets %rdi to the start
 *    of the frame as the handler's first argument;
 *  - saves %rbp and makes it the frame pointer (and the CFA register);
 *  - executes swapgs when the saved CS has non-zero privilege bits;
 *  - increments pda_irqcount and switches to pda_irqstackptr if the
 *    incremented count is zero;
 *  - pushes %rbp as a backlink and calls func.
 * The matching epilogue is at ret_from_intr.
 */
509/* 0(%rsp): interrupt number */
510 .macro interrupt func
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 cld
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512 SAVE_ARGS
513 leaq -ARGOFFSET(%rsp),%rdi # arg1 for handler
Jan Beulich1de9c3f2006-06-26 13:57:35 +0200514 pushq %rbp
515 CFI_ADJUST_CFA_OFFSET 8
516 CFI_REL_OFFSET rbp, 0
517 movq %rsp,%rbp
518 CFI_DEF_CFA_REGISTER rbp
Linus Torvalds1da177e2005-04-16 15:20:36 -0700519 testl $3,CS(%rdi)
520 je 1f
521 swapgs
Andi Kleen96e54042006-09-26 10:52:39 +0200522 /* irqcount is used to check if a CPU is already on an interrupt
523 stack or not. While this is essentially redundant with preempt_count
524 it is a little cheaper to use a separate counter in the PDA
525 (short of moving irq_enter into assembly, which would be too
526 much work) */
5271: incl %gs:pda_irqcount
 /* cmoveq uses ZF from the incl: the move happens only when the count is now 0 */
Jan Beulich1de9c3f2006-06-26 13:57:35 +0200528 cmoveq %gs:pda_irqstackptr,%rsp
Andi Kleen26995002006-08-02 22:37:28 +0200529 push %rbp # backlink for old unwinder
Ingo Molnar2601e642006-07-03 00:24:45 -0700530 /*
531 * We entered an interrupt context - irqs are off:
532 */
533 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 call \func
535 .endm
536
/*
 * common_interrupt: runs the `interrupt` prologue with do_IRQ as handler.
 * ret_from_intr is the shared epilogue, also jumped to by the apicinterrupt
 * stubs. It disables interrupts, decrements pda_irqcount and executes
 * leaveq, which restores %rsp from %rbp and pops the %rbp saved by the
 * prologue.
 */
537ENTRY(common_interrupt)
Jan Beulich7effaa82005-09-12 18:49:24 +0200538 XCPT_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -0700539 interrupt do_IRQ
540 /* 0(%rsp): oldrsp-ARGOFFSET */
Jan Beulich7effaa82005-09-12 18:49:24 +0200541ret_from_intr:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700542 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700543 TRACE_IRQS_OFF
Andi Kleen3829ee62005-07-28 21:15:48 -0700544 decl %gs:pda_irqcount
Jan Beulich1de9c3f2006-06-26 13:57:35 +0200545 leaveq
Jan Beulich7effaa82005-09-12 18:49:24 +0200546 CFI_DEF_CFA_REGISTER rsp
Jan Beulich1de9c3f2006-06-26 13:57:35 +0200547 CFI_ADJUST_CFA_OFFSET -8
 /*
  * exit_intr: a saved CS with clear privilege bits means the interrupt hit
  * kernel mode and exits via retint_kernel. Otherwise the thread flags are
  * tested against the mask in %edi (_TIF_WORK_MASK by default). Pending
  * work goes to retint_careful; with none pending the code falls into
  * retint_swapgs, which switches gs back and jumps to restore_args.
  */
Jan Beulich7effaa82005-09-12 18:49:24 +0200548exit_intr:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700549 GET_THREAD_INFO(%rcx)
550 testl $3,CS-ARGOFFSET(%rsp)
551 je retint_kernel
552
553 /* Interrupt came from user space */
554 /*
555 * Has a correct top of stack, but a partial stack frame
556 * %rcx: thread info. Interrupts off.
557 */
558retint_with_reschedule:
559 movl $_TIF_WORK_MASK,%edi
Jan Beulich7effaa82005-09-12 18:49:24 +0200560retint_check:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561 movl threadinfo_flags(%rcx),%edx
562 andl %edi,%edx
Jan Beulich7effaa82005-09-12 18:49:24 +0200563 CFI_REMEMBER_STATE
Linus Torvalds1da177e2005-04-16 15:20:36 -0700564 jnz retint_careful
565retint_swapgs:
Ingo Molnar2601e642006-07-03 00:24:45 -0700566 /*
567 * The iretq could re-enable interrupts:
568 */
569 cli
570 TRACE_IRQS_IRETQ
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571 swapgs
Ingo Molnar2601e642006-07-03 00:24:45 -0700572 jmp restore_args
573
 /*
  * Exit path that performs no swapgs. Disables interrupts, restores the
  * argument registers and executes iretq. The iretq carries the label
  * iret_label so that an exception-table entry can refer to it.
  */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700574retint_restore_args:
575 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700576 /*
577 * The iretq could re-enable interrupts:
578 */
579 TRACE_IRQS_IRETQ
580restore_args:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700581 RESTORE_ARGS 0,8,0
582iret_label:
583 iretq
584
 /*
  * Exception-table entry pairing iret_label with the fixup bad_iret.
  * bad_iret loads 11 (SIGSEGV) into %rdi, enables interrupts and jumps
  * to do_exit.
  */
585 .section __ex_table,"a"
586 .quad iret_label,bad_iret
587 .previous
588 .section .fixup,"ax"
589 /* force a signal here? this matches i386 behaviour */
590 /* running with kernel gs */
591bad_iret:
Andi Kleen3076a492006-03-25 16:31:55 +0100592 movq $11,%rdi /* SIGSEGV */
Ingo Molnar2601e642006-07-03 00:24:45 -0700593 TRACE_IRQS_ON
Andi Kleen2391c4b2006-02-16 23:42:01 +0100594 sti
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595 jmp do_exit
596 .previous
597
 /*
  * Work pending on return from an interrupt. If TIF_NEED_RESCHED is set:
  * enable interrupts, call schedule with the mask in %rdi kept across the
  * call, reload the thread info pointer into %rcx, disable interrupts and
  * recheck at retint_check. Otherwise go to retint_signal.
  */
Jan Beulich7effaa82005-09-12 18:49:24 +0200598 /* edi: workmask, edx: work */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700599retint_careful:
Jan Beulich7effaa82005-09-12 18:49:24 +0200600 CFI_RESTORE_STATE
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601 bt $TIF_NEED_RESCHED,%edx
602 jnc retint_signal
Ingo Molnar2601e642006-07-03 00:24:45 -0700603 TRACE_IRQS_ON
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604 sti
605 pushq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200606 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700607 call schedule
608 popq %rdi
Jan Beulich7effaa82005-09-12 18:49:24 +0200609 CFI_ADJUST_CFA_OFFSET -8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700610 GET_THREAD_INFO(%rcx)
611 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700612 TRACE_IRQS_OFF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 jmp retint_check
614
 /*
  * If none of SIGPENDING/NOTIFY_RESUME/SINGLESTEP is pending, return via
  * retint_swapgs. Otherwise enable interrupts, complete the frame with
  * SAVE_REST, set the orig_rax slot to -1 and call
  * do_notify_resume(&pt_regs, 0) with the work flags still in %edx.
  * Afterwards: undo SAVE_REST, disable interrupts, reduce the mask to
  * _TIF_NEED_RESCHED, reload %rcx and recheck at retint_check.
  */
615retint_signal:
Andi Kleen10ffdbb2005-05-16 21:53:19 -0700616 testl $(_TIF_SIGPENDING|_TIF_NOTIFY_RESUME|_TIF_SINGLESTEP),%edx
617 jz retint_swapgs
Ingo Molnar2601e642006-07-03 00:24:45 -0700618 TRACE_IRQS_ON
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619 sti
620 SAVE_REST
621 movq $-1,ORIG_RAX(%rsp)
Andi Kleen3829ee62005-07-28 21:15:48 -0700622 xorl %esi,%esi # oldset
Linus Torvalds1da177e2005-04-16 15:20:36 -0700623 movq %rsp,%rdi # &pt_regs
624 call do_notify_resume
625 RESTORE_REST
626 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700627 TRACE_IRQS_OFF
Andi Kleen10ffdbb2005-05-16 21:53:19 -0700628 movl $_TIF_NEED_RESCHED,%edi
Andi Kleenbe9e6872005-05-01 08:58:51 -0700629 GET_THREAD_INFO(%rcx)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630 jmp retint_check
631
 /*
  * Kernel preemption check (CONFIG_PREEMPT only). preempt_schedule_irq is
  * called only when all three hold:
  *   - threadinfo_preempt_count is zero,
  *   - TIF_NEED_RESCHED is set,
  *   - bit 9 of the saved EFLAGS is set (interrupted code had interrupts
  *     enabled).
  * Otherwise the return goes straight to retint_restore_args. After
  * preempt_schedule_irq the exit is retried from exit_intr.
  */
632#ifdef CONFIG_PREEMPT
633 /* Returning to kernel space. Check if we need preemption */
634 /* rcx: threadinfo. interrupts off. */
Andi Kleenb06baba2006-09-26 10:52:29 +0200635ENTRY(retint_kernel)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700636 cmpl $0,threadinfo_preempt_count(%rcx)
637 jnz retint_restore_args
638 bt $TIF_NEED_RESCHED,threadinfo_flags(%rcx)
639 jnc retint_restore_args
640 bt $9,EFLAGS-ARGOFFSET(%rsp) /* interrupts off? */
641 jnc retint_restore_args
642 call preempt_schedule_irq
643 jmp exit_intr
644#endif
Jan Beulich4b787e02006-06-26 13:56:55 +0200645
Linus Torvalds1da177e2005-04-16 15:20:36 -0700646 CFI_ENDPROC
Jan Beulich4b787e02006-06-26 13:56:55 +0200647END(common_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700648
649/*
650 * APIC interrupts.
651 */
/*
 * apicinterrupt num,func
 * Body of an APIC interrupt entry point: pushes ~num (the bitwise
 * complement of the vector number), runs the common `interrupt` prologue
 * with func as the handler, and exits through ret_from_intr.
 * Opens and closes its own CFI procedure.
 */
652 .macro apicinterrupt num,func
Jan Beulich7effaa82005-09-12 18:49:24 +0200653 INTR_FRAME
Rusty Russell19eadf92006-06-27 02:53:44 -0700654 pushq $~(\num)
Jan Beulich7effaa82005-09-12 18:49:24 +0200655 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700656 interrupt \func
657 jmp ret_from_intr
658 CFI_ENDPROC
659 .endm
660
/* Entry points built from apicinterrupt: <vector constant>, <C handler>. */
661ENTRY(thermal_interrupt)
662 apicinterrupt THERMAL_APIC_VECTOR,smp_thermal_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200663END(thermal_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700664
Jacob Shin89b831e2005-11-05 17:25:53 +0100665ENTRY(threshold_interrupt)
666 apicinterrupt THRESHOLD_APIC_VECTOR,mce_threshold_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200667END(threshold_interrupt)
Jacob Shin89b831e2005-11-05 17:25:53 +0100668
Linus Torvalds1da177e2005-04-16 15:20:36 -0700669#ifdef CONFIG_SMP
/*
 * SMP-only entry points (this section sits inside #ifdef CONFIG_SMP).
 * INVALIDATE_ENTRY num defines invalidate_interrupt<num> for vector
 * INVALIDATE_TLB_VECTOR_START+num. All eight instances share the handler
 * smp_invalidate_interrupt.
 */
670ENTRY(reschedule_interrupt)
671 apicinterrupt RESCHEDULE_VECTOR,smp_reschedule_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200672END(reschedule_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700673
Andi Kleene5bc8b62005-09-12 18:49:24 +0200674 .macro INVALIDATE_ENTRY num
675ENTRY(invalidate_interrupt\num)
676 apicinterrupt INVALIDATE_TLB_VECTOR_START+\num,smp_invalidate_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200677END(invalidate_interrupt\num)
Andi Kleene5bc8b62005-09-12 18:49:24 +0200678 .endm
679
680 INVALIDATE_ENTRY 0
681 INVALIDATE_ENTRY 1
682 INVALIDATE_ENTRY 2
683 INVALIDATE_ENTRY 3
684 INVALIDATE_ENTRY 4
685 INVALIDATE_ENTRY 5
686 INVALIDATE_ENTRY 6
687 INVALIDATE_ENTRY 7
Linus Torvalds1da177e2005-04-16 15:20:36 -0700688
689ENTRY(call_function_interrupt)
690 apicinterrupt CALL_FUNCTION_VECTOR,smp_call_function_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200691END(call_function_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694ENTRY(apic_timer_interrupt)
695 apicinterrupt LOCAL_TIMER_VECTOR,smp_apic_timer_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200696END(apic_timer_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700697
698ENTRY(error_interrupt)
699 apicinterrupt ERROR_APIC_VECTOR,smp_error_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200700END(error_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700701
702ENTRY(spurious_interrupt)
703 apicinterrupt SPURIOUS_APIC_VECTOR,smp_spurious_interrupt
Jan Beulich4b787e02006-06-26 13:56:55 +0200704END(spurious_interrupt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700705
706/*
707 * Exception entry points.
708 */
/*
 * zeroentry sym
 * Entry stub that supplies its own error code: pushes 0 as the error code,
 * then pushes %rax, loads the address of sym into %rax and jumps to
 * error_entry (which expects the handler address in %rax).
 */
709 .macro zeroentry sym
Jan Beulich7effaa82005-09-12 18:49:24 +0200710 INTR_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -0700711 pushq $0 /* push error code/oldrax */
Jan Beulich7effaa82005-09-12 18:49:24 +0200712 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713 pushq %rax /* push real oldrax to the rdi slot */
Jan Beulich7effaa82005-09-12 18:49:24 +0200714 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715 leaq \sym(%rip),%rax
716 jmp error_entry
Jan Beulich7effaa82005-09-12 18:49:24 +0200717 CFI_ENDPROC
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 .endm
719
/*
 * errorentry sym
 * Same as zeroentry but for entries where an error code is already on the
 * stack (XCPT_FRAME): only %rax is pushed before loading the address of
 * sym into %rax and jumping to error_entry.
 */
720 .macro errorentry sym
Jan Beulich7effaa82005-09-12 18:49:24 +0200721 XCPT_FRAME
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722 pushq %rax
Jan Beulich7effaa82005-09-12 18:49:24 +0200723 CFI_ADJUST_CFA_OFFSET 8
Linus Torvalds1da177e2005-04-16 15:20:36 -0700724 leaq \sym(%rip),%rax
725 jmp error_entry
Jan Beulich7effaa82005-09-12 18:49:24 +0200726 CFI_ENDPROC
Linus Torvalds1da177e2005-04-16 15:20:36 -0700727 .endm
728
 /*
  * paranoidentry sym [,ist] [,irqtrace]
  *  - Saves all registers, then reads MSR_GS_BASE. If the high half
  *    (%edx) has its sign bit set, no swapgs is done and %ebx stays 1.
  *    Otherwise swapgs is executed and %ebx is cleared. paranoidexit
  *    consumes %ebx as its "no swapgs" flag.
  *  - Calls sym with %rdi = &pt_regs and %rsi = the value taken from the
  *    ORIG_RAX slot. That slot is then overwritten with -1.
  *  - If ist is non-zero, the TSS IST entry (ist-1) is lowered by
  *    EXCEPTION_STKSZ around the call and raised again afterwards. %rbp
  *    holds pda_data_offset as the base for that access.
  *  - Disables interrupts after the call. TRACE_IRQS_OFF is emitted only
  *    when irqtrace is non-zero.
  */
729 /* error code is on the stack already */
730 /* handle NMI like exceptions that can happen everywhere */
Ingo Molnar2601e642006-07-03 00:24:45 -0700731 .macro paranoidentry sym, ist=0, irqtrace=1
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732 SAVE_ALL
733 cld
734 movl $1,%ebx
735 movl $MSR_GS_BASE,%ecx
736 rdmsr
737 testl %edx,%edx
738 js 1f
739 swapgs
740 xorl %ebx,%ebx
Jan Beulichb556b352006-01-11 22:43:00 +01007411:
742 .if \ist
743 movq %gs:pda_data_offset, %rbp
744 .endif
745 movq %rsp,%rdi
Linus Torvalds1da177e2005-04-16 15:20:36 -0700746 movq ORIG_RAX(%rsp),%rsi
747 movq $-1,ORIG_RAX(%rsp)
Jan Beulichb556b352006-01-11 22:43:00 +0100748 .if \ist
Andi Kleen5f8efbb2006-01-16 01:56:39 +0100749 subq $EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
Jan Beulichb556b352006-01-11 22:43:00 +0100750 .endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751 call \sym
Jan Beulichb556b352006-01-11 22:43:00 +0100752 .if \ist
Andi Kleen5f8efbb2006-01-16 01:56:39 +0100753 addq $EXCEPTION_STKSZ, per_cpu__init_tss + TSS_ist + (\ist - 1) * 8(%rbp)
Jan Beulichb556b352006-01-11 22:43:00 +0100754 .endif
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700755 cli
Ingo Molnar2601e642006-07-03 00:24:45 -0700756 .if \irqtrace
757 TRACE_IRQS_OFF
758 .endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700759 .endm
Ingo Molnar2601e642006-07-03 00:24:45 -0700760
761 /*
762 * "Paranoid" exit path from exception stack.
763 * Paranoid because this is used by NMIs and cannot take
764 * any kernel state for granted.
765 * We don't do kernel preemption checks here, because only
766 * NMI should be common and it does not enable IRQs and
767 * cannot get reschedule ticks.
768 *
769 * "trace" is 0 for the NMI handler only, because irq-tracing
770 * is fundamentally NMI-unsafe. (we cannot change the soft and
771 * hard flags at once, atomically)
772 */
 /*
  * paranoidexit [trace]
  * Emits a set of labels suffixed with the value of `trace`:
  *   paranoid_exit      - %ebx != 0: restore registers and iretq without
  *                        swapgs. Otherwise, if the saved CS has privilege
  *                        bits set, go to paranoid_userspace.
  *   paranoid_swapgs    - swapgs, then fall into paranoid_restore.
  *   paranoid_restore   - RESTORE_ALL 8 and iretq.
  *   paranoid_userspace - loop while any _TIF_WORK_MASK bit is set: call
  *                        sync_regs(&pt_regs), switch %rsp to its return
  *                        value, then either schedule (TIF_NEED_RESCHED)
  *                        or do_notify_resume(&pt_regs, 0, flags), each
  *                        with interrupts enabled around the call.
  * The irq-tracing macros are emitted only when trace is non-zero.
  * Also closes the CFI procedure of the code that expands it.
  */
773 .macro paranoidexit trace=1
774 /* ebx: no swapgs flag */
775paranoid_exit\trace:
776 testl %ebx,%ebx /* swapgs needed? */
777 jnz paranoid_restore\trace
778 testl $3,CS(%rsp)
779 jnz paranoid_userspace\trace
780paranoid_swapgs\trace:
Andi Kleen7a0a2df2006-09-26 10:52:37 +0200781 .if \trace
Ingo Molnar2601e642006-07-03 00:24:45 -0700782 TRACE_IRQS_IRETQ 0
Andi Kleen7a0a2df2006-09-26 10:52:37 +0200783 .endif
Ingo Molnar2601e642006-07-03 00:24:45 -0700784 swapgs
785paranoid_restore\trace:
786 RESTORE_ALL 8
787 iretq
788paranoid_userspace\trace:
789 GET_THREAD_INFO(%rcx)
790 movl threadinfo_flags(%rcx),%ebx
791 andl $_TIF_WORK_MASK,%ebx
792 jz paranoid_swapgs\trace
793 movq %rsp,%rdi /* &pt_regs */
794 call sync_regs
795 movq %rax,%rsp /* switch stack for scheduling */
796 testl $_TIF_NEED_RESCHED,%ebx
797 jnz paranoid_schedule\trace
798 movl %ebx,%edx /* arg3: thread flags */
799 .if \trace
800 TRACE_IRQS_ON
801 .endif
802 sti
803 xorl %esi,%esi /* arg2: oldset */
804 movq %rsp,%rdi /* arg1: &pt_regs */
805 call do_notify_resume
806 cli
807 .if \trace
808 TRACE_IRQS_OFF
809 .endif
810 jmp paranoid_userspace\trace
811paranoid_schedule\trace:
812 .if \trace
813 TRACE_IRQS_ON
814 .endif
815 sti
816 call schedule
817 cli
818 .if \trace
819 TRACE_IRQS_OFF
820 .endif
821 jmp paranoid_userspace\trace
822 CFI_ENDPROC
823 .endm
824
/*
 * Exception entry point. This expects an error code/orig_rax on the stack
 * and the exception handler in %rax.
 *
 * The handler is called with %rdi = &pt_regs and %rsi = the error code.
 * %ebx is the "no swapgs" flag examined at error_exit
 * (1: don't need swapgs, 0: need it).
 */
KPROBE_ENTRY(error_entry)
	_frame RDI
	/* rdi slot contains rax, oldrax contains error code */
	cld
	subq $14*8,%rsp
	CFI_ADJUST_CFA_OFFSET (14*8)
	movq %rsi,13*8(%rsp)
	CFI_REL_OFFSET rsi,RSI
	movq 14*8(%rsp),%rsi		/* load rax from rdi slot */
	movq %rdx,12*8(%rsp)
	CFI_REL_OFFSET rdx,RDX
	movq %rcx,11*8(%rsp)
	CFI_REL_OFFSET rcx,RCX
	movq %rsi,10*8(%rsp)		/* store rax */
	CFI_REL_OFFSET rax,RAX
	movq %r8, 9*8(%rsp)
	CFI_REL_OFFSET r8,R8
	movq %r9, 8*8(%rsp)
	CFI_REL_OFFSET r9,R9
	movq %r10,7*8(%rsp)
	CFI_REL_OFFSET r10,R10
	movq %r11,6*8(%rsp)
	CFI_REL_OFFSET r11,R11
	movq %rbx,5*8(%rsp)
	CFI_REL_OFFSET rbx,RBX
	movq %rbp,4*8(%rsp)
	CFI_REL_OFFSET rbp,RBP
	movq %r12,3*8(%rsp)
	CFI_REL_OFFSET r12,R12
	movq %r13,2*8(%rsp)
	CFI_REL_OFFSET r13,R13
	movq %r14,1*8(%rsp)
	CFI_REL_OFFSET r14,R14
	movq %r15,(%rsp)
	CFI_REL_OFFSET r15,R15
	xorl %ebx,%ebx			/* flag = 0: swapgs needed on exit */
	testl $3,CS(%rsp)
	je error_kernelspace		/* low two CS bits clear */
error_swapgs:
	swapgs
error_sti:
	movq %rdi,RDI(%rsp)		/* rdi is saved last; its slot held rax */
	movq %rsp,%rdi			/* arg1: &pt_regs */
	movq ORIG_RAX(%rsp),%rsi	/* get error code */
	movq $-1,ORIG_RAX(%rsp)
	call *%rax
	/* ebx:	no swapgs flag (1: don't need swapgs, 0: need it) */
error_exit:
	/*
	 * Keep the flag in %eax across RESTORE_REST (which presumably
	 * reloads %rbx from the frame -- confirm in the macro definition).
	 */
	movl %ebx,%eax
	RESTORE_REST
	cli
	TRACE_IRQS_OFF
	GET_THREAD_INFO(%rcx)
	testl %eax,%eax
	jne retint_kernel
	movl threadinfo_flags(%rcx),%edx
	movl $_TIF_WORK_MASK,%edi
	andl %edi,%edx
	jnz retint_careful
	/*
	 * The iret might restore flags:
	 */
	TRACE_IRQS_IRETQ
	swapgs
	RESTORE_ARGS 0,8,0
	jmp iret_label
	CFI_ENDPROC

error_kernelspace:
	incl %ebx			/* flag = 1: no swapgs on exit */
	/*
	 * There are two places in the kernel that can potentially fault
	 * with usergs. Handle them here. The exception handlers after
	 * iret run with kernel gs again, so don't set the user space flag.
	 * B stepping K8s sometimes report a truncated RIP for IRET
	 * exceptions returning to compat mode. Check for these here too.
	 */
	leaq iret_label(%rip),%rbp
	cmpq %rbp,RIP(%rsp)
	je error_swapgs
	movl %ebp,%ebp			/* zero extend */
	cmpq %rbp,RIP(%rsp)
	je error_swapgs
	cmpq $gs_change,RIP(%rsp)
	je error_swapgs
	jmp error_sti
KPROBE_END(error_entry)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700914
/*
 * Reload gs selector with exception handling.
 *
 * In:  edi: new selector
 *
 * The flags are saved with pushf and restored with popf, so the cli
 * below only lasts for the duration of this function.  The selector
 * load at gs_change has an __ex_table entry: a fault there resumes at
 * bad_gs, which loads a zero selector instead and rejoins at label 2.
 */
ENTRY(load_gs_index)
	CFI_STARTPROC
	pushf
	CFI_ADJUST_CFA_OFFSET 8
	cli
	swapgs
gs_change:
	movl %edi,%gs
2:	mfence				/* workaround */
	swapgs
	popf
	CFI_ADJUST_CFA_OFFSET -8
	ret
	CFI_ENDPROC
ENDPROC(load_gs_index)

	/* exception table entry: fault at gs_change -> continue at bad_gs */
	.section __ex_table,"a"
	.align 8
	.quad gs_change,bad_gs
	.previous
	.section .fixup,"ax"
	/* running with kernelgs */
bad_gs:
	swapgs				/* switch back to user gs */
	xorl %eax,%eax
	movl %eax,%gs			/* load a zero selector instead */
	jmp 2b
	.previous
945
/*
 * Create a kernel thread.
 *
 * C extern interface:
 *	extern long kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
 *
 * asm input arguments:
 *	rdi: fn, rsi: arg, rdx: flags
 *
 * A fake stack frame whose return address is child_rip is built and all
 * registers are saved into it; that frame is handed to do_fork as the
 * pt_regs argument.  The value returned by do_fork is stored in the RAX
 * slot of the frame before the registers are restored.
 */
ENTRY(kernel_thread)
	CFI_STARTPROC
	FAKE_STACK_FRAME $child_rip
	SAVE_ALL

	/* rdi: flags, rsi: usp, rdx: will be &pt_regs */
	movq %rdx,%rdi
	orq  kernel_thread_flags(%rip),%rdi
	movq $-1, %rsi
	movq %rsp, %rdx

	xorl %r8d,%r8d
	xorl %r9d,%r9d

	/* clone now */
	call do_fork
	movq %rax,RAX(%rsp)
	xorl %edi,%edi

	/*
	 * It isn't worth checking for reschedule here,
	 * so internally to the x86_64 port you can rely on kernel_thread()
	 * not to reschedule the child before returning, this avoids the need
	 * of hacks for example to fork off the per-CPU idle tasks.
	 * [Hopefully no generic code relies on the reschedule -AK]
	 */
	RESTORE_ALL
	UNFAKE_STACK_FRAME
	ret
	CFI_ENDPROC
ENDPROC(kernel_thread)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700986
/*
 * Start address of a thread created by kernel_thread().
 * Calls fn(arg) and then do_exit(0); the value returned by fn is not
 * passed on to do_exit.
 */
child_rip:
	pushq $0			/* fake return address */
	CFI_STARTPROC
	/*
	 * Here we are in the child and the registers are set as they were
	 * at kernel_thread() invocation in the parent.
	 */
	movq %rdi, %rax			/* rax = fn */
	movq %rsi, %rdi			/* arg1 = arg */
	call *%rax
	/* exit */
	xorl %edi, %edi			/* exit code 0 */
	call do_exit
	CFI_ENDPROC
ENDPROC(child_rip)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001002
/*
 * execve(). This function needs to use IRET, not SYSRET, to set up all state properly.
 *
 * C extern interface:
 *	 extern long execve(char *name, char **argv, char **envp)
 *
 * asm input arguments:
 *	rdi: name, rsi: argv, rdx: envp
 *
 * We want to fallback into:
 *	extern long sys_execve(char *name, char **argv,char **envp, struct pt_regs regs)
 *
 * do_sys_execve asm fallback arguments:
 *	rdi: name, rsi: argv, rdx: envp, fake frame on the stack
 *
 * When sys_execve returns 0 the function leaves through
 * int_ret_from_sys_call; any other return value is handed back to the
 * caller with a plain ret.
 */
ENTRY(execve)
	CFI_STARTPROC
	FAKE_STACK_FRAME $0
	SAVE_ALL
	call sys_execve
	movq %rax, RAX(%rsp)		/* return value into the frame */
	RESTORE_REST
	testq %rax,%rax
	je int_ret_from_sys_call	/* success: leave via the frame */
	RESTORE_ARGS
	UNFAKE_STACK_FRAME
	ret
	CFI_ENDPROC
ENDPROC(execve)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001032
/*
 * Exception entry points generated by the errorentry/zeroentry macros;
 * the macro argument is the handler that ends up being called.
 */
KPROBE_ENTRY(page_fault)
	errorentry do_page_fault
KPROBE_END(page_fault)

ENTRY(coprocessor_error)
	zeroentry do_coprocessor_error
END(coprocessor_error)

ENTRY(simd_coprocessor_error)
	zeroentry do_simd_coprocessor_error
END(simd_coprocessor_error)

ENTRY(device_not_available)
	zeroentry math_state_restore
END(device_not_available)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001048
/*
 * Debug exception entry; runs on exception stack.
 * A zero is pushed into the error code slot before the paranoid entry
 * sequence.  The paranoidexit instantiation here (trace=1) defines
 * paranoid_exit1 and also closes the CFI procedure.
 */
KPROBE_ENTRY(debug)
	INTR_FRAME
	pushq $0
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_debug, DEBUG_STACK
	paranoidexit
KPROBE_END(debug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001057
/*
 * NMI entry; runs on exception stack.
 * -1 is pushed into the error code slot.  paranoidentry is used with
 * ist=0 and irqtrace=0.  With CONFIG_TRACE_IRQFLAGS the NMI gets its own
 * non-tracing exit path (paranoidexit 0); otherwise it shares
 * paranoid_exit1.
 */
KPROBE_ENTRY(nmi)
	INTR_FRAME
	pushq $-1
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_nmi, 0, 0
#ifdef CONFIG_TRACE_IRQFLAGS
	paranoidexit 0
#else
	jmp paranoid_exit1
	CFI_ENDPROC
#endif
KPROBE_END(nmi)
Andi Kleen6fefb0d2005-04-16 15:25:03 -07001071
/*
 * int3 entry.  A zero is pushed into the error code slot, do_int3 is
 * called through the paranoid entry sequence using the DEBUG_STACK IST
 * entry, and the exit goes through paranoid_exit1.
 */
KPROBE_ENTRY(int3)
	INTR_FRAME
	pushq $0
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_int3, DEBUG_STACK
	jmp paranoid_exit1
	CFI_ENDPROC
KPROBE_END(int3)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001080
/*
 * Exception entry points generated by the zeroentry macro; the macro
 * argument is the handler that ends up being called.
 */
ENTRY(overflow)
	zeroentry do_overflow
END(overflow)

ENTRY(bounds)
	zeroentry do_bounds
END(bounds)

ENTRY(invalid_op)
	zeroentry do_invalid_op
END(invalid_op)

ENTRY(coprocessor_segment_overrun)
	zeroentry do_coprocessor_segment_overrun
END(coprocessor_segment_overrun)

ENTRY(reserved)
	zeroentry do_reserved
END(reserved)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001100
/*
 * Double fault entry; runs on exception stack.
 * Nothing is pushed here: paranoidentry expects the error code to be
 * on the stack already.  Exit goes through paranoid_exit1.
 */
ENTRY(double_fault)
	XCPT_FRAME
	paranoidentry do_double_fault
	jmp paranoid_exit1
	CFI_ENDPROC
END(double_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001108
1109ENTRY(invalid_TSS)
1110 errorentry do_invalid_TSS
Jan Beulich4b787e02006-06-26 13:56:55 +02001111END(invalid_TSS)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001112
1113ENTRY(segment_not_present)
1114 errorentry do_segment_not_present
Jan Beulich4b787e02006-06-26 13:56:55 +02001115END(segment_not_present)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001116
/*
 * Stack segment fault entry; runs on exception stack.
 * Nothing is pushed here: paranoidentry expects the error code to be
 * on the stack already.  Exit goes through paranoid_exit1.
 */
ENTRY(stack_segment)
	XCPT_FRAME
	paranoidentry do_stack_segment
	jmp paranoid_exit1
	CFI_ENDPROC
END(stack_segment)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001124
/*
 * Exception entry points generated by the errorentry/zeroentry macros;
 * the macro argument is the handler that ends up being called.
 */
KPROBE_ENTRY(general_protection)
	errorentry do_general_protection
KPROBE_END(general_protection)

ENTRY(alignment_check)
	errorentry do_alignment_check
END(alignment_check)

ENTRY(divide_error)
	zeroentry do_divide_error
END(divide_error)

ENTRY(spurious_interrupt_bug)
	zeroentry do_spurious_interrupt_bug
END(spurious_interrupt_bug)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001140
#ifdef CONFIG_X86_MCE
/*
 * Machine check entry (only built with CONFIG_X86_MCE); runs on
 * exception stack.  A zero is pushed into the error code slot and the
 * exit goes through paranoid_exit1.
 */
ENTRY(machine_check)
	INTR_FRAME
	pushq $0
	CFI_ADJUST_CFA_OFFSET 8
	paranoidentry do_machine_check
	jmp paranoid_exit1
	CFI_ENDPROC
END(machine_check)
#endif
1152
/*
 * Call softirq on interrupt stack. Interrupts are off.
 *
 * %rbp is used as a frame pointer so that leaveq can return to the
 * caller's stack regardless of whether the stack was switched.
 */
ENTRY(call_softirq)
	CFI_STARTPROC
	push %rbp
	CFI_ADJUST_CFA_OFFSET 8
	CFI_REL_OFFSET rbp,0
	mov %rsp,%rbp
	CFI_DEF_CFA_REGISTER rbp
	incl %gs:pda_irqcount
	/*
	 * Switch to the stack in pda_irqstackptr only when the incremented
	 * count is zero (ZF from the incl above); otherwise stay on the
	 * current stack.
	 */
	cmove %gs:pda_irqstackptr,%rsp
	push %rbp			/* backlink for old unwinder */
	call __do_softirq
	leaveq				/* rsp = rbp, pop rbp: back on the caller's stack */
	CFI_DEF_CFA_REGISTER rsp
	CFI_ADJUST_CFA_OFFSET -8
	decl %gs:pda_irqcount
	ret
	CFI_ENDPROC
ENDPROC(call_softirq)
Jan Beulichb538ed22006-06-26 13:57:32 +02001172
#ifdef CONFIG_STACK_UNWIND
/*
 * Fill the register frame at %rdi with the state of the running
 * context as seen by this function's caller, then tail-jump to a
 * callback.
 *
 * In:  rdi: frame to fill (addressed with the pt_regs offsets R15..SS)
 *      rsi: callback to jump to
 *      rdx: value handed to the callback in %rsi
 *
 * %rbx, %rbp and %r12-%r15 are stored with their current values.
 * RIP is this function's return address and RSP is the stack pointer
 * the caller will have after the return.  All other general register
 * slots, ORIG_RAX and EFLAGS are zeroed; CS/SS are set to the kernel
 * selectors.  The callback is entered with %rdi unchanged.
 */
ENTRY(arch_unwind_init_running)
	CFI_STARTPROC
	movq	%r15, R15(%rdi)
	movq	%r14, R14(%rdi)
	xchgq	%rsi, %rdx		/* rdx = callback, rsi = its 2nd arg */
	movq	%r13, R13(%rdi)
	movq	%r12, R12(%rdi)
	xorl	%eax, %eax		/* rax = 0, used for the zeroed slots */
	movq	%rbp, RBP(%rdi)
	movq	%rbx, RBX(%rdi)
	movq	(%rsp), %rcx		/* rcx = return address */
	movq	%rax, R11(%rdi)
	movq	%rax, R10(%rdi)
	movq	%rax, R9(%rdi)
	movq	%rax, R8(%rdi)
	movq	%rax, RAX(%rdi)
	movq	%rax, RCX(%rdi)
	movq	%rax, RDX(%rdi)
	movq	%rax, RSI(%rdi)
	movq	%rax, RDI(%rdi)
	movq	%rax, ORIG_RAX(%rdi)
	movq	%rcx, RIP(%rdi)
	leaq	8(%rsp), %rcx		/* rcx = rsp after the return address is popped */
	movq	$__KERNEL_CS, CS(%rdi)
	movq	%rax, EFLAGS(%rdi)
	movq	%rcx, RSP(%rdi)
	movq	$__KERNEL_DS, SS(%rdi)
	jmpq	*%rdx			/* tail-call the callback */
	CFI_ENDPROC
ENDPROC(arch_unwind_init_running)
#endif