| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* | 
|  | 2 | *  linux/arch/x86_64/entry.S | 
|  | 3 | * | 
|  | 4 | *  Copyright (C) 1991, 1992  Linus Torvalds | 
|  | 5 | *  Copyright (C) 2000, 2001, 2002  Andi Kleen SuSE Labs | 
|  | 6 | *  Copyright (C) 2000  Pavel Machek <pavel@suse.cz> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 7 | */ | 
|  | 8 |  | 
|  | 9 | /* | 
|  | 10 | * entry.S contains the system-call and fault low-level handling routines. | 
|  | 11 | * | 
|  | 12 | * NOTE: This code handles signal-recognition, which happens every time | 
|  | 13 | * after an interrupt and after each system call. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 14 | * | 
|  | 15 | * Normal syscalls and interrupts don't save a full stack frame; this is | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 16 | * only done for syscall tracing, signals or fork/exec et al. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 17 | * | 
|  | 18 | * A note on terminology: | 
|  | 19 | * - top of stack: Architecture defined interrupt frame from SS to RIP | 
|  | 20 | * at the top of the kernel process stack. | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 21 | * - partial stack frame: partially saved registers up to R11. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 22 | * - full stack frame: Like partial stack frame, but all registers saved. | 
| Andi Kleen | 2e91a17 | 2006-09-26 10:52:29 +0200 | [diff] [blame] | 23 | * | 
|  | 24 | * Some macro usage: | 
|  | 25 | * - CFI macros are used to generate dwarf2 unwind information for better | 
|  | 26 | * backtraces. They don't change any code. | 
|  | 27 | * - SAVE_ALL/RESTORE_ALL - Save/restore all registers | 
|  | 28 | * - SAVE_ARGS/RESTORE_ARGS - Save/restore registers that C functions modify. | 
|  | 29 | * There are unfortunately lots of special cases where some registers | 
|  | 30 | * are not touched. The macro is a big mess that should be cleaned up. | 
|  | 31 | * - SAVE_REST/RESTORE_REST - Handle the registers not saved by SAVE_ARGS. | 
|  | 32 | * Gives a full stack frame. | 
|  | 33 | * - ENTRY/END Define functions in the symbol table. | 
|  | 34 | * - FIXUP_TOP_OF_STACK/RESTORE_TOP_OF_STACK - Fix up the hardware stack | 
|  | 35 | * frame that is otherwise undefined after a SYSCALL | 
|  | 36 | * - TRACE_IRQ_* - Trace hard interrupt state for lock debugging. | 
|  | 37 | * - errorentry/paranoidentry/zeroentry - Define exception entry points. | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 38 | */ | 
|  | 39 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 40 | #include <linux/linkage.h> | 
|  | 41 | #include <asm/segment.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 42 | #include <asm/cache.h> | 
|  | 43 | #include <asm/errno.h> | 
|  | 44 | #include <asm/dwarf2.h> | 
|  | 45 | #include <asm/calling.h> | 
| Sam Ravnborg | e2d5df9 | 2005-09-09 21:28:48 +0200 | [diff] [blame] | 46 | #include <asm/asm-offsets.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 47 | #include <asm/msr.h> | 
|  | 48 | #include <asm/unistd.h> | 
|  | 49 | #include <asm/thread_info.h> | 
|  | 50 | #include <asm/hw_irq.h> | 
| Jeremy Fitzhardinge | 0341c14 | 2009-02-13 11:14:01 -0800 | [diff] [blame] | 51 | #include <asm/page_types.h> | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 52 | #include <asm/irqflags.h> | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 53 | #include <asm/paravirt.h> | 
| Abhishek Sagar | 395a59d | 2008-06-21 23:47:27 +0530 | [diff] [blame] | 54 | #include <asm/ftrace.h> | 
| Tejun Heo | 9939dda | 2009-01-13 20:41:35 +0900 | [diff] [blame] | 55 | #include <asm/percpu.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 56 |  | 
| Roland McGrath | 86a1c34 | 2008-06-23 15:37:04 -0700 | [diff] [blame] | 57 | /* Avoid __ASSEMBLER__'ifying <linux/audit.h> just for this.  */ | 
|  | 58 | #include <linux/elf-em.h> | 
|  | 59 | #define AUDIT_ARCH_X86_64	(EM_X86_64|__AUDIT_ARCH_64BIT|__AUDIT_ARCH_LE) | 
|  | 60 | #define __AUDIT_ARCH_64BIT 0x80000000 | 
|  | 61 | #define __AUDIT_ARCH_LE	   0x40000000 | 
|  | 62 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 63 | .code64 | 
| Steven Rostedt | 606576c | 2008-10-06 19:06:12 -0400 | [diff] [blame] | 64 | #ifdef CONFIG_FUNCTION_TRACER | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 65 | #ifdef CONFIG_DYNAMIC_FTRACE | 
|  | 66 | ENTRY(mcount) | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 67 | retq /* CONFIG_DYNAMIC_FTRACE build: mcount itself is just a return */ | 
|  | 68 | END(mcount) | 
|  | 69 |  | 
|  | 70 | ENTRY(ftrace_caller) | 
| Steven Rostedt | 60a7ecf | 2008-11-05 16:05:44 -0500 | [diff] [blame] | 71 | cmpl $0, function_trace_stop | 
|  | 72 | jne  ftrace_stub /* tracing stopped: leave through ftrace_stub's retq */ | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 73 |  | 
| Cyrill Gorcunov | d680fe4 | 2008-12-13 00:09:08 +0300 | [diff] [blame] | 74 | MCOUNT_SAVE_FRAME | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 75 | /* Load the two arguments for the call below. */ | 
|  | 76 | movq 0x38(%rsp), %rdi /* arg1: presumably the return address into the traced function; slot layout comes from MCOUNT_SAVE_FRAME (not shown) -- confirm */ | 
|  | 77 | movq 8(%rbp), %rsi /* arg2: word above the saved %rbp, presumably the parent's return address -- confirm */ | 
| Abhishek Sagar | 395a59d | 2008-06-21 23:47:27 +0530 | [diff] [blame] | 78 | subq $MCOUNT_INSN_SIZE, %rdi /* step arg1 back by MCOUNT_INSN_SIZE */ | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 79 |  | 
| Cyrill Gorcunov | bc8b2b9 | 2009-02-23 22:57:01 +0300 | [diff] [blame] | 80 | GLOBAL(ftrace_call) | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 81 | call ftrace_stub /* NOTE(review): call site is exported as ftrace_call, presumably so it can be patched at run time -- confirm */ | 
|  | 82 |  | 
| Cyrill Gorcunov | d680fe4 | 2008-12-13 00:09:08 +0300 | [diff] [blame] | 83 | MCOUNT_RESTORE_FRAME | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 84 |  | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 85 | #ifdef CONFIG_FUNCTION_GRAPH_TRACER | 
| Cyrill Gorcunov | bc8b2b9 | 2009-02-23 22:57:01 +0300 | [diff] [blame] | 86 | GLOBAL(ftrace_graph_call) | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 87 | jmp ftrace_stub /* as written, jumps straight to the retq below */ | 
|  | 88 | #endif | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 89 |  | 
| Cyrill Gorcunov | bc8b2b9 | 2009-02-23 22:57:01 +0300 | [diff] [blame] | 90 | GLOBAL(ftrace_stub) | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 91 | retq /* shared return; also the default call/jump target above */ | 
|  | 92 | END(ftrace_caller) | 
|  | 93 |  | 
|  | 94 | #else /* ! CONFIG_DYNAMIC_FTRACE */ | 
| Arnaldo Carvalho de Melo | 16444a8 | 2008-05-12 21:20:42 +0200 | [diff] [blame] | 95 | ENTRY(mcount) | 
| Steven Rostedt | 60a7ecf | 2008-11-05 16:05:44 -0500 | [diff] [blame] | 96 | cmpl $0, function_trace_stop | 
|  | 97 | jne  ftrace_stub /* tracing stopped: return immediately */ | 
|  | 98 |  | 
| Arnaldo Carvalho de Melo | 16444a8 | 2008-05-12 21:20:42 +0200 | [diff] [blame] | 99 | cmpq $ftrace_stub, ftrace_trace_function | 
|  | 100 | jnz trace /* a tracer other than ftrace_stub is installed: call it */ | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 101 |  | 
|  | 102 | #ifdef CONFIG_FUNCTION_GRAPH_TRACER | 
|  | 103 | cmpq $ftrace_stub, ftrace_graph_return | 
|  | 104 | jnz ftrace_graph_caller /* graph return hook is not the stub */ | 
| Steven Rostedt | e49dc19 | 2008-12-02 23:50:05 -0500 | [diff] [blame] | 105 |  | 
|  | 106 | cmpq $ftrace_graph_entry_stub, ftrace_graph_entry | 
|  | 107 | jnz ftrace_graph_caller /* graph entry hook is not the stub */ | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 108 | #endif | 
|  | 109 |  | 
| Cyrill Gorcunov | bc8b2b9 | 2009-02-23 22:57:01 +0300 | [diff] [blame] | 110 | GLOBAL(ftrace_stub) | 
| Arnaldo Carvalho de Melo | 16444a8 | 2008-05-12 21:20:42 +0200 | [diff] [blame] | 111 | retq /* nothing to trace: plain return */ | 
|  | 112 |  | 
|  | 113 | trace: | 
| Cyrill Gorcunov | d680fe4 | 2008-12-13 00:09:08 +0300 | [diff] [blame] | 114 | MCOUNT_SAVE_FRAME | 
| Arnaldo Carvalho de Melo | 16444a8 | 2008-05-12 21:20:42 +0200 | [diff] [blame] | 115 |  | 
|  | 116 | movq 0x38(%rsp), %rdi /* arg1: presumably the return address into the traced function; layout comes from MCOUNT_SAVE_FRAME (not shown) -- confirm */ | 
|  | 117 | movq 8(%rbp), %rsi /* arg2: word above the saved %rbp, presumably the parent's return address -- confirm */ | 
| Abhishek Sagar | 395a59d | 2008-06-21 23:47:27 +0530 | [diff] [blame] | 118 | subq $MCOUNT_INSN_SIZE, %rdi /* step arg1 back by MCOUNT_INSN_SIZE */ | 
| Arnaldo Carvalho de Melo | 16444a8 | 2008-05-12 21:20:42 +0200 | [diff] [blame] | 119 |  | 
|  | 120 | call   *ftrace_trace_function /* indirect call through the installed tracer pointer */ | 
|  | 121 |  | 
| Cyrill Gorcunov | d680fe4 | 2008-12-13 00:09:08 +0300 | [diff] [blame] | 122 | MCOUNT_RESTORE_FRAME | 
| Arnaldo Carvalho de Melo | 16444a8 | 2008-05-12 21:20:42 +0200 | [diff] [blame] | 123 |  | 
|  | 124 | jmp ftrace_stub /* return via the shared retq */ | 
|  | 125 | END(mcount) | 
| Steven Rostedt | d61f82d | 2008-05-12 21:20:43 +0200 | [diff] [blame] | 126 | #endif /* CONFIG_DYNAMIC_FTRACE */ | 
| Steven Rostedt | 606576c | 2008-10-06 19:06:12 -0400 | [diff] [blame] | 127 | #endif /* CONFIG_FUNCTION_TRACER */ | 
| Arnaldo Carvalho de Melo | 16444a8 | 2008-05-12 21:20:42 +0200 | [diff] [blame] | 128 |  | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 129 | #ifdef CONFIG_FUNCTION_GRAPH_TRACER | 
|  | 130 | ENTRY(ftrace_graph_caller) | 
|  | 131 | cmpl $0, function_trace_stop | 
|  | 132 | jne ftrace_stub /* tracing stopped: return immediately */ | 
|  | 133 |  | 
| Cyrill Gorcunov | d680fe4 | 2008-12-13 00:09:08 +0300 | [diff] [blame] | 134 | MCOUNT_SAVE_FRAME | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 135 |  | 
|  | 136 | leaq 8(%rbp), %rdi /* arg1: ADDRESS of the slot at 8(%rbp), not its value */ | 
|  | 137 | movq 0x38(%rsp), %rsi /* arg2: word at 0x38(%rsp); layout comes from MCOUNT_SAVE_FRAME (not shown) */ | 
| Steven Rostedt | bb4304c | 2008-12-02 15:34:09 -0500 | [diff] [blame] | 138 | subq $MCOUNT_INSN_SIZE, %rsi /* step arg2 back by MCOUNT_INSN_SIZE */ | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 139 |  | 
|  | 140 | call	prepare_ftrace_return /* NOTE(review): presumably rewrites the slot passed in %rdi -- confirm in prepare_ftrace_return */ | 
|  | 141 |  | 
| Cyrill Gorcunov | d680fe4 | 2008-12-13 00:09:08 +0300 | [diff] [blame] | 142 | MCOUNT_RESTORE_FRAME | 
|  | 143 |  | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 144 | retq | 
|  | 145 | END(ftrace_graph_caller) | 
|  | 146 |  | 
| Cyrill Gorcunov | bc8b2b9 | 2009-02-23 22:57:01 +0300 | [diff] [blame] | 147 | GLOBAL(return_to_handler) | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 148 | subq  $80, %rsp /* reserve 80 bytes; the top 8 (72(%rsp)) become the return slot */ | 
|  | 149 |  | 
| Steven Rostedt | e71e99c | 2009-03-25 14:30:04 -0400 | [diff] [blame] | 150 | /* Save the return values */ | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 151 | movq %rax, (%rsp) | 
| Steven Rostedt | e71e99c | 2009-03-25 14:30:04 -0400 | [diff] [blame] | 152 | movq %rdx, 8(%rsp) | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 153 |  | 
|  | 154 | call ftrace_return_to_handler | 
|  | 155 |  | 
|  | 156 | movq %rax, 72(%rsp) /* value returned by the call goes into the top slot */ | 
| Steven Rostedt | e71e99c | 2009-03-25 14:30:04 -0400 | [diff] [blame] | 157 | movq 8(%rsp), %rdx /* restore the saved return values */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 158 | movq (%rsp), %rax | 
| Frederic Weisbecker | 48d68b2 | 2008-12-02 00:20:39 +0100 | [diff] [blame] | 159 | addq $72, %rsp /* release 72 of the 80 bytes: %rsp now points at the slot written above */ | 
|  | 160 | retq /* pops that slot, i.e. jumps to the address ftrace_return_to_handler returned */ | 
|  | 161 | #endif | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 162 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 163 |  | 
|  | 164 | #ifndef CONFIG_PREEMPT | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 165 | #define retint_kernel retint_restore_args | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 166 | #endif | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 167 |  | 
|  | 168 | #ifdef CONFIG_PARAVIRT | 
|  | 169 | ENTRY(native_usergs_sysret64) /* only built under CONFIG_PARAVIRT: swapgs followed by sysretq */ | 
|  | 170 | swapgs | 
|  | 171 | sysretq | 
| Cyrill Gorcunov | b3baaa1 | 2009-02-23 22:57:00 +0300 | [diff] [blame] | 172 | ENDPROC(native_usergs_sysret64) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 173 | #endif /* CONFIG_PARAVIRT */ | 
|  | 174 |  | 
|  | 175 |  | 
|  | 176 | .macro TRACE_IRQS_IRETQ offset=ARGOFFSET | 
|  | 177 | #ifdef CONFIG_TRACE_IRQFLAGS | 
|  | 178 | bt   $9,EFLAGS-\offset(%rsp)	/* test bit 9 (IF) of the saved EFLAGS: interrupts off? */ | 
|  | 179 | jnc  1f /* bit clear: skip TRACE_IRQS_ON */ | 
|  | 180 | TRACE_IRQS_ON | 
|  | 181 | 1: | 
|  | 182 | #endif | 
|  | 183 | .endm | 
|  | 184 |  | 
|  | 185 | /* | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 186 | * C code is not supposed to know about undefined top of stack. Every time | 
|  | 187 | * a C function with a pt_regs argument is called from the SYSCALL based | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 188 | * fast path, FIXUP_TOP_OF_STACK is needed. | 
|  | 189 | * RESTORE_TOP_OF_STACK syncs the syscall state after any possible ptregs | 
|  | 190 | * manipulation. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 191 | */ | 
|  | 192 |  | 
|  | 193 | /* %rsp:at FRAMEEND */ | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 194 | .macro FIXUP_TOP_OF_STACK tmp offset=0 | 
| Brian Gerst | 3d1e42a | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 195 | movq PER_CPU_VAR(old_rsp),\tmp /* per-cpu old_rsp: system_call stores the entry %rsp there */ | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 196 | movq \tmp,RSP+\offset(%rsp) | 
|  | 197 | movq $__USER_DS,SS+\offset(%rsp) | 
|  | 198 | movq $__USER_CS,CS+\offset(%rsp) | 
|  | 199 | movq $-1,RCX+\offset(%rsp) /* RCX slot is overwritten with -1 */ | 
|  | 200 | movq R11+\offset(%rsp),\tmp  /* get eflags */ | 
|  | 201 | movq \tmp,EFLAGS+\offset(%rsp) /* copy the R11 slot into the EFLAGS slot */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 202 | .endm | 
|  | 203 |  | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 204 | .macro RESTORE_TOP_OF_STACK tmp offset=0 | 
|  | 205 | movq RSP+\offset(%rsp),\tmp | 
| Brian Gerst | 3d1e42a | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 206 | movq \tmp,PER_CPU_VAR(old_rsp) /* frame's RSP slot -> per-cpu old_rsp */ | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 207 | movq EFLAGS+\offset(%rsp),\tmp | 
|  | 208 | movq \tmp,R11+\offset(%rsp) /* frame's EFLAGS slot -> R11 slot */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 209 | .endm | 
|  | 210 |  | 
|  | 211 | .macro FAKE_STACK_FRAME child_rip | 
|  | 212 | /* push in order ss, rsp, eflags, cs, rip */ | 
|  | 213 | xorl %eax, %eax /* %rax = 0; pushed below as the rsp and orig rax values */ | 
|  | 214 | pushq $__KERNEL_DS /* ss */ | 
|  | 215 | CFI_ADJUST_CFA_OFFSET	8 | 
|  | 216 | /*CFI_REL_OFFSET	ss,0*/ | 
|  | 217 | pushq %rax /* rsp */ | 
|  | 218 | CFI_ADJUST_CFA_OFFSET	8 | 
|  | 219 | CFI_REL_OFFSET	rsp,0 | 
| gorcunov@gmail.com | 3345453 | 2008-11-26 22:17:02 +0300 | [diff] [blame] | 220 | pushq $X86_EFLAGS_IF /* eflags - interrupts on */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 221 | CFI_ADJUST_CFA_OFFSET	8 | 
|  | 222 | /*CFI_REL_OFFSET	rflags,0*/ | 
|  | 223 | pushq $__KERNEL_CS /* cs */ | 
|  | 224 | CFI_ADJUST_CFA_OFFSET	8 | 
|  | 225 | /*CFI_REL_OFFSET	cs,0*/ | 
|  | 226 | pushq \child_rip /* rip */ | 
|  | 227 | CFI_ADJUST_CFA_OFFSET	8 | 
|  | 228 | CFI_REL_OFFSET	rip,0 | 
|  | 229 | pushq	%rax /* orig rax */ | 
|  | 230 | CFI_ADJUST_CFA_OFFSET	8 | 
|  | 231 | .endm /* six quadwords pushed in total */ | 
|  | 232 |  | 
|  | 233 | .macro UNFAKE_STACK_FRAME | 
|  | 234 | addq $8*6, %rsp /* drop the six quadwords pushed by FAKE_STACK_FRAME */ | 
|  | 235 | CFI_ADJUST_CFA_OFFSET	-(6*8) | 
|  | 236 | .endm | 
|  | 237 |  | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 238 | /* | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 239 | * initial frame state with only the CFA defined; base for the *_FRAME macros | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 240 | */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 241 | .macro EMPTY_FRAME start=1 offset=0 | 
|  | 242 | .if \start /* non-zero: open a new CFI procedure and define the CFA */ | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 243 | CFI_STARTPROC simple | 
|  | 244 | CFI_SIGNAL_FRAME | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 245 | CFI_DEF_CFA rsp,8+\offset | 
|  | 246 | .else /* zero: only reset the CFA offset inside the current procedure */ | 
|  | 247 | CFI_DEF_CFA_OFFSET 8+\offset | 
|  | 248 | .endif | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 249 | .endm | 
|  | 250 |  | 
|  | 251 | /* | 
|  | 252 | * initial frame state for interrupts (and exceptions without error code) | 
|  | 253 | */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 254 | .macro INTR_FRAME start=1 offset=0 | 
| Ingo Molnar | e8a0e27 | 2008-11-21 15:11:32 +0100 | [diff] [blame] | 255 | EMPTY_FRAME \start, SS+8+\offset-RIP /* all offsets here are relative to the RIP slot */ | 
|  | 256 | /*CFI_REL_OFFSET ss, SS+\offset-RIP*/ | 
|  | 257 | CFI_REL_OFFSET rsp, RSP+\offset-RIP | 
|  | 258 | /*CFI_REL_OFFSET rflags, EFLAGS+\offset-RIP*/ | 
|  | 259 | /*CFI_REL_OFFSET cs, CS+\offset-RIP*/ | 
|  | 260 | CFI_REL_OFFSET rip, RIP+\offset-RIP /* i.e. saved rip is at \offset(%rsp) */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 261 | .endm | 
|  | 262 |  | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 263 | /* | 
|  | 264 | * initial frame state for exceptions with error code (and interrupts | 
|  | 265 | * with vector already pushed) | 
|  | 266 | */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 267 | .macro XCPT_FRAME start=1 offset=0 | 
| Ingo Molnar | e8a0e27 | 2008-11-21 15:11:32 +0100 | [diff] [blame] | 268 | INTR_FRAME \start, RIP+\offset-ORIG_RAX /* INTR_FRAME rebased from the RIP slot to the ORIG_RAX slot */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 269 | /*CFI_REL_OFFSET orig_rax, ORIG_RAX-ORIG_RAX*/ | 
|  | 270 | .endm | 
|  | 271 |  | 
|  | 272 | /* | 
|  | 273 | * frame that enables calling into C. | 
|  | 274 | */ | 
|  | 275 | .macro PARTIAL_FRAME start=1 offset=0 | 
| Ingo Molnar | e8a0e27 | 2008-11-21 15:11:32 +0100 | [diff] [blame] | 276 | XCPT_FRAME \start, ORIG_RAX+\offset-ARGOFFSET /* XCPT_FRAME rebased to ARGOFFSET */ | 
|  | 277 | CFI_REL_OFFSET rdi, RDI+\offset-ARGOFFSET | 
|  | 278 | CFI_REL_OFFSET rsi, RSI+\offset-ARGOFFSET | 
|  | 279 | CFI_REL_OFFSET rdx, RDX+\offset-ARGOFFSET | 
|  | 280 | CFI_REL_OFFSET rcx, RCX+\offset-ARGOFFSET | 
|  | 281 | CFI_REL_OFFSET rax, RAX+\offset-ARGOFFSET | 
|  | 282 | CFI_REL_OFFSET r8, R8+\offset-ARGOFFSET | 
|  | 283 | CFI_REL_OFFSET r9, R9+\offset-ARGOFFSET | 
|  | 284 | CFI_REL_OFFSET r10, R10+\offset-ARGOFFSET | 
|  | 285 | CFI_REL_OFFSET r11, R11+\offset-ARGOFFSET /* last of the nine registers described at this level */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 286 | .endm | 
|  | 287 |  | 
|  | 288 | /* | 
|  | 289 | * frame that enables passing a complete pt_regs to a C function. | 
|  | 290 | */ | 
|  | 291 | .macro DEFAULT_FRAME start=1 offset=0 | 
| Ingo Molnar | e8a0e27 | 2008-11-21 15:11:32 +0100 | [diff] [blame] | 292 | PARTIAL_FRAME \start, R11+\offset-R15 /* NOTE(review): presumably R11 == ARGOFFSET and R15 == 0 in asm/calling.h -- confirm */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 293 | CFI_REL_OFFSET rbx, RBX+\offset /* the six registers PARTIAL_FRAME does not describe */ | 
|  | 294 | CFI_REL_OFFSET rbp, RBP+\offset | 
|  | 295 | CFI_REL_OFFSET r12, R12+\offset | 
|  | 296 | CFI_REL_OFFSET r13, R13+\offset | 
|  | 297 | CFI_REL_OFFSET r14, R14+\offset | 
|  | 298 | CFI_REL_OFFSET r15, R15+\offset | 
|  | 299 | .endm | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 300 |  | 
|  | 301 | /* save partial stack frame */ | 
|  | 302 | ENTRY(save_args) | 
|  | 303 | XCPT_FRAME | 
|  | 304 | cld | 
| Ingo Molnar | 14ae22b | 2008-11-21 15:20:47 +0100 | [diff] [blame] | 305 | movq_cfi rdi, RDI+16-ARGOFFSET | 
|  | 306 | movq_cfi rsi, RSI+16-ARGOFFSET | 
|  | 307 | movq_cfi rdx, RDX+16-ARGOFFSET | 
|  | 308 | movq_cfi rcx, RCX+16-ARGOFFSET | 
|  | 309 | movq_cfi rax, RAX+16-ARGOFFSET | 
|  | 310 | movq_cfi  r8,  R8+16-ARGOFFSET | 
|  | 311 | movq_cfi  r9,  R9+16-ARGOFFSET | 
|  | 312 | movq_cfi r10, R10+16-ARGOFFSET | 
|  | 313 | movq_cfi r11, R11+16-ARGOFFSET | 
|  | 314 |  | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 315 | leaq -ARGOFFSET+16(%rsp),%rdi	/* arg1 for handler */ | 
| Ingo Molnar | 14ae22b | 2008-11-21 15:20:47 +0100 | [diff] [blame] | 316 | movq_cfi rbp, 8		/* push %rbp */ | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 317 | leaq 8(%rsp), %rbp		/* mov %rsp, %rbp */ | 
|  | 318 | testl $3, CS(%rdi) /* low two bits of the saved CS: privilege level we came from */ | 
|  | 319 | je 1f /* zero: came from kernel mode, skip SWAPGS */ | 
|  | 320 | SWAPGS | 
|  | 321 | /* | 
| Brian Gerst | 5689553 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 322 | * irq_count is used to check if a CPU is already on an interrupt stack | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 323 | * or not. While this is essentially redundant with preempt_count it is | 
|  | 324 | * a little cheaper to use a separate per-cpu counter (short of | 
|  | 325 | * moving irq_enter into assembly, which would be too much work) | 
|  | 326 | */ | 
| Brian Gerst | 5689553 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 327 | 1:	incl PER_CPU_VAR(irq_count) | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 328 | jne 2f /* count did not become zero: keep the current stack */ | 
| Ingo Molnar | 14ae22b | 2008-11-21 15:20:47 +0100 | [diff] [blame] | 329 | popq_cfi %rax			/* move return address... */ | 
| Brian Gerst | 26f80bd | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 330 | mov PER_CPU_VAR(irq_stack_ptr),%rsp /* switch %rsp to the per-cpu irq stack */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 331 | EMPTY_FRAME 0 | 
| Martin Hicks | a67798c | 2009-01-30 10:50:54 -0600 | [diff] [blame] | 332 | pushq_cfi %rbp			/* backlink for unwinder */ | 
| Ingo Molnar | 14ae22b | 2008-11-21 15:20:47 +0100 | [diff] [blame] | 333 | pushq_cfi %rax			/* ... to the new stack */ | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 334 | /* | 
|  | 335 | * We entered an interrupt context - irqs are off: | 
|  | 336 | */ | 
|  | 337 | 2:	TRACE_IRQS_OFF | 
|  | 338 | ret | 
|  | 339 | CFI_ENDPROC | 
|  | 340 | END(save_args) | 
|  | 341 |  | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 342 | ENTRY(save_rest) | 
|  | 343 | PARTIAL_FRAME 1 REST_SKIP+8 | 
|  | 344 | movq 5*8+16(%rsp), %r11	/* save return address */ | 
|  | 345 | movq_cfi rbx, RBX+16 | 
|  | 346 | movq_cfi rbp, RBP+16 | 
|  | 347 | movq_cfi r12, R12+16 | 
|  | 348 | movq_cfi r13, R13+16 | 
|  | 349 | movq_cfi r14, R14+16 | 
|  | 350 | movq_cfi r15, R15+16 | 
|  | 351 | movq %r11, 8(%rsp)	/* return address */ | 
|  | 352 | FIXUP_TOP_OF_STACK %r11, 16 /* %r11 is scratch here; same +16 bias as the stores above */ | 
|  | 353 | ret | 
|  | 354 | CFI_ENDPROC | 
|  | 355 | END(save_rest) | 
|  | 356 |  | 
| Alexander van Heukelum | e2f6bc2 | 2008-11-21 16:43:18 +0100 | [diff] [blame] | 357 | /* save complete stack frame */ | 
| Jan Beulich | c281018 | 2009-03-12 10:38:55 +0000 | [diff] [blame] | 358 | .pushsection .kprobes.text, "ax" | 
| Alexander van Heukelum | e2f6bc2 | 2008-11-21 16:43:18 +0100 | [diff] [blame] | 359 | ENTRY(save_paranoid) | 
|  | 360 | XCPT_FRAME 1 RDI+8 | 
|  | 361 | cld | 
|  | 362 | movq_cfi rdi, RDI+8 | 
|  | 363 | movq_cfi rsi, RSI+8 | 
|  | 364 | movq_cfi rdx, RDX+8 | 
|  | 365 | movq_cfi rcx, RCX+8 | 
|  | 366 | movq_cfi rax, RAX+8 | 
|  | 367 | movq_cfi r8, R8+8 | 
|  | 368 | movq_cfi r9, R9+8 | 
|  | 369 | movq_cfi r10, R10+8 | 
|  | 370 | movq_cfi r11, R11+8 | 
|  | 371 | movq_cfi rbx, RBX+8 | 
|  | 372 | movq_cfi rbp, RBP+8 | 
|  | 373 | movq_cfi r12, R12+8 | 
|  | 374 | movq_cfi r13, R13+8 | 
|  | 375 | movq_cfi r14, R14+8 | 
|  | 376 | movq_cfi r15, R15+8 | 
|  | 377 | movl $1,%ebx /* %ebx = 1: no SWAPGS done (NOTE(review): presumably read by the paranoid exit path) */ | 
|  | 378 | movl $MSR_GS_BASE,%ecx | 
|  | 379 | rdmsr /* %edx:%eax = MSR_GS_BASE */ | 
|  | 380 | testl %edx,%edx /* sign of the high half of the GS base */ | 
|  | 381 | js 1f	/* negative -> in kernel */ | 
|  | 382 | SWAPGS | 
|  | 383 | xorl %ebx,%ebx /* %ebx = 0: SWAPGS was done here */ | 
|  | 384 | 1:	ret | 
|  | 385 | CFI_ENDPROC | 
|  | 386 | END(save_paranoid) | 
| Jan Beulich | c281018 | 2009-03-12 10:38:55 +0000 | [diff] [blame] | 387 | .popsection | 
| Alexander van Heukelum | e2f6bc2 | 2008-11-21 16:43:18 +0100 | [diff] [blame] | 388 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 389 | /* | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 390 | * A newly forked process directly context switches into this address. | 
|  | 391 | * | 
|  | 392 | * rdi: prev task we switched from | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 393 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 394 | ENTRY(ret_from_fork) | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 395 | DEFAULT_FRAME | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 396 | /* atomically clear TIF_FORK in TI_flags(%r8); NOTE(review): %r8 is set up by the caller, not visible here */ | 
| Benjamin LaHaise | 7106a5a | 2009-01-10 23:00:22 -0500 | [diff] [blame] | 397 | LOCK ; btr $TIF_FORK,TI_flags(%r8) | 
|  | 398 |  | 
| Andi Kleen | 658fdbe | 2006-09-26 10:52:41 +0200 | [diff] [blame] | 399 | push kernel_eflags(%rip) | 
| Alexander van Heukelum | e0a5a5d | 2008-07-22 18:14:16 +0200 | [diff] [blame] | 400 | CFI_ADJUST_CFA_OFFSET 8 | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 401 | popf					# reset kernel eflags | 
| Alexander van Heukelum | e0a5a5d | 2008-07-22 18:14:16 +0200 | [diff] [blame] | 402 | CFI_ADJUST_CFA_OFFSET -8 | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 403 |  | 
|  | 404 | call schedule_tail			# rdi: 'prev' task parameter | 
|  | 405 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 406 | GET_THREAD_INFO(%rcx) | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 407 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 408 | RESTORE_REST | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 409 |  | 
|  | 410 | testl $3, CS-ARGOFFSET(%rsp)		# from kernel_thread? | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 411 | je   int_ret_from_sys_call | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 412 |  | 
|  | 413 | testl $_TIF_IA32, TI_flags(%rcx)	# 32-bit compat task needs IRET | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 414 | jnz  int_ret_from_sys_call | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 415 | /* remaining case: sync old_rsp and the R11 slot from the frame, then use the SYSRET path */ | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 416 | RESTORE_TOP_OF_STACK %rdi, -ARGOFFSET | 
| Ingo Molnar | 5b3eec0 | 2008-11-27 14:41:21 +0100 | [diff] [blame] | 417 | jmp ret_from_sys_call			# go to the SYSRET fastpath | 
|  | 418 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 419 | CFI_ENDPROC | 
| Jan Beulich | 4b787e0 | 2006-06-26 13:56:55 +0200 | [diff] [blame] | 420 | END(ret_from_fork) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 421 |  | 
|  | 422 | /* | 
|  | 423 | * System call entry. Up to 6 arguments in registers are supported. | 
|  | 424 | * | 
|  | 425 | * SYSCALL does not save anything on the stack and does not change the | 
|  | 426 | * stack pointer. | 
|  | 427 | */ | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 428 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 429 | /* | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 430 | * Register setup: | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 431 | * rax  system call number | 
|  | 432 | * rdi  arg0 | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 433 | * rcx  return address for syscall/sysret, C arg3 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 434 | * rsi  arg1 | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 435 | * rdx  arg2 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 436 | * r10  arg3 	(--> moved to rcx for C) | 
|  | 437 | * r8   arg4 | 
|  | 438 | * r9   arg5 | 
|  | 439 | * r11  eflags for syscall/sysret, temporary for C | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 440 | * r12-r15,rbp,rbx saved by C code, not touched. | 
|  | 441 | * | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 442 | * Interrupts are off on entry. | 
|  | 443 | * Only called from user space. | 
|  | 444 | * | 
|  | 445 | * XXX	if we had a free scratch register we could save the RSP into the stack frame | 
|  | 446 | *      and report it properly in ps. Unfortunately we haven't. | 
| Andi Kleen | 7bf36bb | 2006-04-07 19:50:00 +0200 | [diff] [blame] | 447 | * | 
|  | 448 | * When the user can change the frames, always force IRET. That is because | 
|  | 449 | * it deals with non-canonical addresses better. SYSRET has trouble | 
|  | 450 | * with them due to bugs in both AMD and Intel CPUs. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 451 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 452 |  | 
|  | 453 | ENTRY(system_call) | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 454 | CFI_STARTPROC	simple | 
| Jan Beulich | adf1423 | 2006-09-26 10:52:41 +0200 | [diff] [blame] | 455 | CFI_SIGNAL_FRAME | 
| Brian Gerst | 9af4565 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 456 | CFI_DEF_CFA	rsp,KERNEL_STACK_OFFSET | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 457 | CFI_REGISTER	rip,rcx | 
|  | 458 | /*CFI_REGISTER	rflags,r11*/ | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 459 | SWAPGS_UNSAFE_STACK | 
|  | 460 | /* | 
|  | 461 | * A hypervisor implementation might want to use a label | 
|  | 462 | * after the swapgs, so that it can do the swapgs | 
|  | 463 | * for the guest and jump here on syscall. | 
|  | 464 | */ | 
|  | 465 | ENTRY(system_call_after_swapgs) | 
|  | 466 |  | 
| Brian Gerst | 3d1e42a | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 467 | movq	%rsp,PER_CPU_VAR(old_rsp) | 
| Brian Gerst | 9af4565 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 468 | movq	PER_CPU_VAR(kernel_stack),%rsp | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 469 | /* | 
|  | 470 | * No need to follow this irqs off/on section - it's straight | 
|  | 471 | * and short: | 
|  | 472 | */ | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 473 | ENABLE_INTERRUPTS(CLBR_NONE) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 474 | SAVE_ARGS 8,1 | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 475 | movq  %rax,ORIG_RAX-ARGOFFSET(%rsp) | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 476 | movq  %rcx,RIP-ARGOFFSET(%rsp) | 
|  | 477 | CFI_REL_OFFSET rip,RIP-ARGOFFSET | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 478 | GET_THREAD_INFO(%rcx) | 
| Roland McGrath | d4d6715 | 2008-07-09 02:38:07 -0700 | [diff] [blame] | 479 | testl $_TIF_WORK_SYSCALL_ENTRY,TI_flags(%rcx) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 480 | jnz tracesys | 
| Roland McGrath | 86a1c34 | 2008-06-23 15:37:04 -0700 | [diff] [blame] | 481 | system_call_fastpath: | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 482 | cmpq $__NR_syscall_max,%rax | 
|  | 483 | ja badsys | 
|  | 484 | movq %r10,%rcx | 
|  | 485 | call *sys_call_table(,%rax,8)  # XXX:	 rip relative | 
|  | 486 | movq %rax,RAX-ARGOFFSET(%rsp) | 
|  | 487 | /* | 
|  | 488 | * Syscall return path ending with SYSRET (fast path) | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 489 | * Has incomplete stack frame and undefined top of stack. | 
|  | 490 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 491 | ret_from_sys_call: | 
| Andi Kleen | 11b854b | 2005-04-16 15:25:02 -0700 | [diff] [blame] | 492 | movl $_TIF_ALLWORK_MASK,%edi | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 493 | /* edi:	flagmask */ | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 494 | sysret_check: | 
| Peter Zijlstra | 10cd706 | 2007-10-11 22:11:12 +0200 | [diff] [blame] | 495 | LOCKDEP_SYS_EXIT | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 496 | GET_THREAD_INFO(%rcx) | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 497 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 498 | TRACE_IRQS_OFF | 
| Glauber Costa | 26ccb8a | 2008-06-24 11:19:35 -0300 | [diff] [blame] | 499 | movl TI_flags(%rcx),%edx | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 500 | andl %edi,%edx | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 501 | jnz  sysret_careful | 
| Jan Beulich | bcddc01 | 2006-12-07 02:14:02 +0100 | [diff] [blame] | 502 | CFI_REMEMBER_STATE | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 503 | /* | 
|  | 504 | * sysretq will re-enable interrupts: | 
|  | 505 | */ | 
|  | 506 | TRACE_IRQS_ON | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 507 | movq RIP-ARGOFFSET(%rsp),%rcx | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 508 | CFI_REGISTER	rip,rcx | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 509 | RESTORE_ARGS 0,-ARG_SKIP,1 | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 510 | /*CFI_REGISTER	rflags,r11*/ | 
| Brian Gerst | 3d1e42a | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 511 | movq	PER_CPU_VAR(old_rsp), %rsp | 
| Jeremy Fitzhardinge | 2be2998 | 2008-06-25 00:19:28 -0400 | [diff] [blame] | 512 | USERGS_SYSRET64 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 513 |  | 
| Jan Beulich | bcddc01 | 2006-12-07 02:14:02 +0100 | [diff] [blame] | 514 | CFI_RESTORE_STATE | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 515 | /* Handle reschedules */ | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 516 | /* edx:	work, edi: workmask */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 517 | sysret_careful: | 
|  | 518 | bt $TIF_NEED_RESCHED,%edx | 
|  | 519 | jnc sysret_signal | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 520 | TRACE_IRQS_ON | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 521 | ENABLE_INTERRUPTS(CLBR_NONE) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 522 | pushq %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 523 | CFI_ADJUST_CFA_OFFSET 8 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 524 | call schedule | 
|  | 525 | popq  %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 526 | CFI_ADJUST_CFA_OFFSET -8 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 527 | jmp sysret_check | 
|  | 528 |  | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 529 | /* Handle a signal */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 530 | sysret_signal: | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 531 | TRACE_IRQS_ON | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 532 | ENABLE_INTERRUPTS(CLBR_NONE) | 
| Roland McGrath | 86a1c34 | 2008-06-23 15:37:04 -0700 | [diff] [blame] | 533 | #ifdef CONFIG_AUDITSYSCALL | 
|  | 534 | bt $TIF_SYSCALL_AUDIT,%edx | 
|  | 535 | jc sysret_audit | 
|  | 536 | #endif | 
| Andi Kleen | 10ffdbb | 2005-05-16 21:53:19 -0700 | [diff] [blame] | 537 | /* edx:	work flags (arg3) */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 538 | leaq -ARGOFFSET(%rsp),%rdi # &pt_regs -> arg1 | 
|  | 539 | xorl %esi,%esi # oldset -> arg2 | 
| Alexander van Heukelum | c810841 | 2008-11-21 22:59:52 +0100 | [diff] [blame] | 540 | SAVE_REST | 
|  | 541 | FIXUP_TOP_OF_STACK %r11 | 
|  | 542 | call do_notify_resume | 
|  | 543 | RESTORE_TOP_OF_STACK %r11 | 
|  | 544 | RESTORE_REST | 
| Roland McGrath | 15e8f34 | 2008-06-23 20:41:12 -0700 | [diff] [blame] | 545 | movl $_TIF_WORK_MASK,%edi | 
| Andi Kleen | 7bf36bb | 2006-04-07 19:50:00 +0200 | [diff] [blame] | 546 | /* Use IRET because user could have changed frame. This | 
|  | 547 | works because FIXUP_TOP_OF_STACK was run above, before do_notify_resume. */ | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 548 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 549 | TRACE_IRQS_OFF | 
| Andi Kleen | 7bf36bb | 2006-04-07 19:50:00 +0200 | [diff] [blame] | 550 | jmp int_with_check | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 551 |  | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 552 | badsys: | 
|  | 553 | movq $-ENOSYS,RAX-ARGOFFSET(%rsp) | 
|  | 554 | jmp ret_from_sys_call | 
|  | 555 |  | 
| Roland McGrath | 86a1c34 | 2008-06-23 15:37:04 -0700 | [diff] [blame] | 556 | #ifdef CONFIG_AUDITSYSCALL | 
|  | 557 | /* | 
|  | 558 | * Fast path for syscall audit without full syscall trace. | 
|  | 559 | * We just call audit_syscall_entry() directly, and then | 
|  | 560 | * jump back to the normal fast path. | 
|  | 561 | */ | 
|  | 562 | auditsys: | 
|  | 563 | movq %r10,%r9			/* 6th arg: 4th syscall arg */ | 
|  | 564 | movq %rdx,%r8			/* 5th arg: 3rd syscall arg */ | 
|  | 565 | movq %rsi,%rcx			/* 4th arg: 2nd syscall arg */ | 
|  | 566 | movq %rdi,%rdx			/* 3rd arg: 1st syscall arg */ | 
|  | 567 | movq %rax,%rsi			/* 2nd arg: syscall number */ | 
|  | 568 | movl $AUDIT_ARCH_X86_64,%edi	/* 1st arg: audit arch */ | 
|  | 569 | call audit_syscall_entry | 
|  | 570 | LOAD_ARGS 0		/* reload call-clobbered registers */ | 
|  | 571 | jmp system_call_fastpath | 
|  | 572 |  | 
|  | 573 | /* | 
|  | 574 | * Return fast path for syscall audit.  Call audit_syscall_exit() | 
|  | 575 | * directly and then jump back to the fast path with TIF_SYSCALL_AUDIT | 
|  | 576 | * masked off. | 
|  | 577 | */ | 
|  | 578 | sysret_audit: | 
|  | 579 | movq %rax,%rsi		/* second arg, syscall return value */ | 
|  | 580 | cmpq $0,%rax		/* is it < 0? */ | 
|  | 581 | setl %al		/* 1 if so, 0 if not */ | 
|  | 582 | movzbl %al,%edi		/* zero-extend that into %edi */ | 
|  | 583 | inc %edi /* first arg, 0->1(AUDITSC_SUCCESS), 1->2(AUDITSC_FAILURE) */ | 
|  | 584 | call audit_syscall_exit | 
|  | 585 | movl $(_TIF_ALLWORK_MASK & ~_TIF_SYSCALL_AUDIT),%edi | 
|  | 586 | jmp sysret_check | 
|  | 587 | #endif	/* CONFIG_AUDITSYSCALL */ | 
|  | 588 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 589 | /* Do syscall tracing */ | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 590 | tracesys: | 
| Roland McGrath | 86a1c34 | 2008-06-23 15:37:04 -0700 | [diff] [blame] | 591 | #ifdef CONFIG_AUDITSYSCALL | 
|  | 592 | testl $(_TIF_WORK_SYSCALL_ENTRY & ~_TIF_SYSCALL_AUDIT),TI_flags(%rcx) | 
|  | 593 | jz auditsys | 
|  | 594 | #endif | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 595 | SAVE_REST | 
| Roland McGrath | a31f8dd | 2008-03-16 21:59:11 -0700 | [diff] [blame] | 596 | movq $-ENOSYS,RAX(%rsp) /* ptrace can change this for a bad syscall */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 597 | FIXUP_TOP_OF_STACK %rdi | 
|  | 598 | movq %rsp,%rdi | 
|  | 599 | call syscall_trace_enter | 
| Roland McGrath | d4d6715 | 2008-07-09 02:38:07 -0700 | [diff] [blame] | 600 | /* | 
|  | 601 | * Reload arg registers from stack in case ptrace changed them. | 
|  | 602 | * We don't reload %rax because syscall_trace_enter() returned | 
|  | 603 | * the value it wants us to use in the table lookup. | 
|  | 604 | */ | 
|  | 605 | LOAD_ARGS ARGOFFSET, 1 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 606 | RESTORE_REST | 
|  | 607 | cmpq $__NR_syscall_max,%rax | 
| Roland McGrath | a31f8dd | 2008-03-16 21:59:11 -0700 | [diff] [blame] | 608 | ja   int_ret_from_sys_call	/* RAX(%rsp) set to -ENOSYS above */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 609 | movq %r10,%rcx	/* fixup for C */ | 
|  | 610 | call *sys_call_table(,%rax,8) | 
| Roland McGrath | a31f8dd | 2008-03-16 21:59:11 -0700 | [diff] [blame] | 611 | movq %rax,RAX-ARGOFFSET(%rsp) | 
| Andi Kleen | 7bf36bb | 2006-04-07 19:50:00 +0200 | [diff] [blame] | 612 | /* Use IRET because user could have changed frame */ | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 613 |  | 
|  | 614 | /* | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 615 | * Syscall return path ending with IRET. | 
|  | 616 | * Has correct top of stack, but partial stack frame. | 
| Jan Beulich | bcddc01 | 2006-12-07 02:14:02 +0100 | [diff] [blame] | 617 | */ | 
| Cyrill Gorcunov | bc8b2b9 | 2009-02-23 22:57:01 +0300 | [diff] [blame] | 618 | GLOBAL(int_ret_from_sys_call) | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 619 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 620 | TRACE_IRQS_OFF | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 621 | testl $3,CS-ARGOFFSET(%rsp) | 
|  | 622 | je retint_restore_args | 
|  | 623 | movl $_TIF_ALLWORK_MASK,%edi | 
|  | 624 | /* edi:	mask to check */ | 
| Cyrill Gorcunov | bc8b2b9 | 2009-02-23 22:57:01 +0300 | [diff] [blame] | 625 | GLOBAL(int_with_check) | 
| Peter Zijlstra | 10cd706 | 2007-10-11 22:11:12 +0200 | [diff] [blame] | 626 | LOCKDEP_SYS_EXIT_IRQ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 627 | GET_THREAD_INFO(%rcx) | 
| Glauber Costa | 26ccb8a | 2008-06-24 11:19:35 -0300 | [diff] [blame] | 628 | movl TI_flags(%rcx),%edx | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 629 | andl %edi,%edx | 
|  | 630 | jnz   int_careful | 
| Glauber Costa | 26ccb8a | 2008-06-24 11:19:35 -0300 | [diff] [blame] | 631 | andl    $~TS_COMPAT,TI_status(%rcx) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 632 | jmp   retint_swapgs | 
|  | 633 |  | 
|  | 634 | /* Either reschedule or signal or syscall exit tracking needed. */ | 
|  | 635 | /* First do a reschedule test. */ | 
|  | 636 | /* edx:	work, edi: workmask */ | 
|  | 637 | int_careful: | 
|  | 638 | bt $TIF_NEED_RESCHED,%edx | 
|  | 639 | jnc  int_very_careful | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 640 | TRACE_IRQS_ON | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 641 | ENABLE_INTERRUPTS(CLBR_NONE) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 642 | pushq %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 643 | CFI_ADJUST_CFA_OFFSET 8 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 644 | call schedule | 
|  | 645 | popq %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 646 | CFI_ADJUST_CFA_OFFSET -8 | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 647 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 648 | TRACE_IRQS_OFF | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 649 | jmp int_with_check | 
|  | 650 |  | 
|  | 651 | /* handle signals and tracing -- both require a full stack frame */ | 
|  | 652 | int_very_careful: | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 653 | TRACE_IRQS_ON | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 654 | ENABLE_INTERRUPTS(CLBR_NONE) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 655 | SAVE_REST | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 656 | /* Check for syscall exit trace */ | 
| Roland McGrath | d4d6715 | 2008-07-09 02:38:07 -0700 | [diff] [blame] | 657 | testl $_TIF_WORK_SYSCALL_EXIT,%edx | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 658 | jz int_signal | 
|  | 659 | pushq %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 660 | CFI_ADJUST_CFA_OFFSET 8 | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 661 | leaq 8(%rsp),%rdi	# &ptregs -> arg1 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 662 | call syscall_trace_leave | 
|  | 663 | popq %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 664 | CFI_ADJUST_CFA_OFFSET -8 | 
| Roland McGrath | d4d6715 | 2008-07-09 02:38:07 -0700 | [diff] [blame] | 665 | andl $~(_TIF_WORK_SYSCALL_EXIT|_TIF_SYSCALL_EMU),%edi | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 666 | jmp int_restore_rest | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 667 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 668 | int_signal: | 
| Peter Zijlstra | 8f4d37e | 2008-01-25 21:08:29 +0100 | [diff] [blame] | 669 | testl $_TIF_DO_NOTIFY_MASK,%edx | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 670 | jz 1f | 
|  | 671 | movq %rsp,%rdi		# &ptregs -> arg1 | 
|  | 672 | xorl %esi,%esi		# oldset -> arg2 | 
|  | 673 | call do_notify_resume | 
| Roland McGrath | eca91e7 | 2008-07-10 14:50:39 -0700 | [diff] [blame] | 674 | 1:	movl $_TIF_WORK_MASK,%edi | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 675 | int_restore_rest: | 
|  | 676 | RESTORE_REST | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 677 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 678 | TRACE_IRQS_OFF | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 679 | jmp int_with_check | 
|  | 680 | CFI_ENDPROC | 
| Jan Beulich | bcddc01 | 2006-12-07 02:14:02 +0100 | [diff] [blame] | 681 | END(system_call) | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 682 |  | 
|  | 683 | /* | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 684 | * Certain special system calls that need to save a complete full stack frame. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 685 | */ | 
/*
 * PTREGSCALL label,func,arg
 *   label - name of the entry stub that is emitted
 *   func  - C function called by the stub
 *   arg   - register that receives the pt_regs pointer for func
 *
 * The stub reserves REST_SKIP bytes of stack, calls save_rest, loads the
 * address 8(%rsp) into \arg, calls \func and then leaves through
 * ptregscall_common (a jmp, so the stub itself never executes a ret).
 * NOTE(review): save_rest is defined outside this chunk; presumably it
 * stores the registers that ptregscall_common reloads (rbx, rbp, r12-r15)
 * and leaves the return address at 0(%rsp) - confirm.
 */
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 686 | .macro PTREGSCALL label,func,arg | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 687 | ENTRY(\label) | 
|  | 688 | PARTIAL_FRAME 1 8		/* offset 8: return address */ | 
|  | 689 | subq $REST_SKIP, %rsp | 
|  | 690 | CFI_ADJUST_CFA_OFFSET REST_SKIP | 
|  | 691 | call save_rest | 
|  | 692 | DEFAULT_FRAME 0 8		/* offset 8: return address */ | 
|  | 693 | leaq 8(%rsp), \arg	/* pt_regs pointer */ | 
|  | 694 | call \func | 
|  | 695 | jmp ptregscall_common | 
|  | 696 | CFI_ENDPROC | 
| Jan Beulich | 4b787e0 | 2006-06-26 13:56:55 +0200 | [diff] [blame] | 697 | END(\label) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 698 | .endm | 
|  | 699 |  | 
/*
 * Instantiate the full-frame stubs. The third operand is the register that
 * the PTREGSCALL macro loads with the pt_regs pointer before calling the
 * C function.
 * NOTE(review): each register presumably corresponds to the position of the
 * pt_regs parameter in the C prototype (rdi, rsi, rdx, rcx, r8 = 1st..5th
 * argument) - confirm against the sys_* declarations.
 */
|  | 700 | PTREGSCALL stub_clone, sys_clone, %r8 | 
|  | 701 | PTREGSCALL stub_fork, sys_fork, %rdi | 
|  | 702 | PTREGSCALL stub_vfork, sys_vfork, %rdi | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 703 | PTREGSCALL stub_sigaltstack, sys_sigaltstack, %rdx | 
|  | 704 | PTREGSCALL stub_iopl, sys_iopl, %rsi | 
|  | 705 |  | 
/*
 * Common exit for the PTREGSCALL stubs, which jump here after their C
 * function has returned. Runs RESTORE_TOP_OF_STACK, reloads r15, r14, r13,
 * r12, rbp and rbx from their frame slots and returns, releasing the
 * REST_SKIP bytes the stub reserved. Every frame offset carries an extra
 * +8 because the return address is still on the stack below the frame.
 */
|  | 706 | ENTRY(ptregscall_common) | 
| Alexander van Heukelum | c002a1e | 2008-11-21 16:41:55 +0100 | [diff] [blame] | 707 | DEFAULT_FRAME 1 8	/* offset 8: return address */ | 
|  | 708 | RESTORE_TOP_OF_STACK %r11, 8 | 
|  | 709 | movq_cfi_restore R15+8, r15 | 
|  | 710 | movq_cfi_restore R14+8, r14 | 
|  | 711 | movq_cfi_restore R13+8, r13 | 
|  | 712 | movq_cfi_restore R12+8, r12 | 
|  | 713 | movq_cfi_restore RBP+8, rbp | 
|  | 714 | movq_cfi_restore RBX+8, rbx | 
/* ret with an immediate: pop the return address, then drop REST_SKIP more bytes */
|  | 715 | ret $REST_SKIP		/* pop extended registers */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 716 | CFI_ENDPROC | 
| Jan Beulich | 4b787e0 | 2006-06-26 13:56:55 +0200 | [diff] [blame] | 717 | END(ptregscall_common) | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 718 |  | 
/*
 * execve stub. Pops the return address off the stack, runs SAVE_REST and
 * FIXUP_TOP_OF_STACK, calls sys_execve with %rsp in %rcx, stores the
 * result in the RAX slot of the frame and leaves through
 * int_ret_from_sys_call. The popped return address is never pushed back:
 * this stub does not return to its caller.
 */
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 719 | ENTRY(stub_execve) | 
|  | 720 | CFI_STARTPROC | 
/* remove the return address; the CFI notes below tell the unwinder it is in r11 */
|  | 721 | popq %r11 | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 722 | CFI_ADJUST_CFA_OFFSET -8 | 
|  | 723 | CFI_REGISTER rip, r11 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 724 | SAVE_REST | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 725 | FIXUP_TOP_OF_STACK %r11 | 
/* NOTE(review): %rsp presumably is the pt_regs pointer, passed as the 4th C argument - confirm */
| Ingo Molnar | 5d119b2 | 2008-02-26 12:55:57 +0100 | [diff] [blame] | 726 | movq %rsp, %rcx | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 727 | call sys_execve | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 728 | RESTORE_TOP_OF_STACK %r11 | 
/* publish the return value in the saved frame before the registers are reloaded */
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 729 | movq %rax,RAX(%rsp) | 
|  | 730 | RESTORE_REST | 
|  | 731 | jmp int_ret_from_sys_call | 
|  | 732 | CFI_ENDPROC | 
| Jan Beulich | 4b787e0 | 2006-06-26 13:56:55 +0200 | [diff] [blame] | 733 | END(stub_execve) | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 734 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 735 | /* | 
|  | 736 | * sigreturn is special because it needs to restore all registers on return. | 
|  | 737 | * This cannot be done with SYSRET, so use the IRET return path instead. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 738 | */ | 
/*
 * rt_sigreturn stub. Discards 8 bytes of stack, runs SAVE_REST, passes
 * %rsp as the first argument to sys_rt_sigreturn, stores the result in the
 * RAX slot of the frame and leaves through int_ret_from_sys_call.
 */
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 739 | ENTRY(stub_rt_sigreturn) | 
|  | 740 | CFI_STARTPROC | 
/* NOTE(review): the 8 bytes dropped here are presumably the caller's return address, unused because the stub exits via jmp - confirm */
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 741 | addq $8, %rsp | 
|  | 742 | CFI_ADJUST_CFA_OFFSET	-8 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 743 | SAVE_REST | 
/* rdi (first C argument) = stack pointer after SAVE_REST */
|  | 744 | movq %rsp,%rdi | 
|  | 745 | FIXUP_TOP_OF_STACK %r11 | 
|  | 746 | call sys_rt_sigreturn | 
|  | 747 | movq %rax,RAX(%rsp) # fixme, this could be done at the higher layer | 
|  | 748 | RESTORE_REST | 
|  | 749 | jmp int_ret_from_sys_call | 
|  | 750 | CFI_ENDPROC | 
| Jan Beulich | 4b787e0 | 2006-06-26 13:56:55 +0200 | [diff] [blame] | 751 | END(stub_rt_sigreturn) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 752 |  | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 753 | /* | 
| H. Peter Anvin | 939b787 | 2008-11-11 13:51:52 -0800 | [diff] [blame] | 754 | * Build the entry stubs and pointer table with some assembler magic. | 
|  | 755 | * We pack 7 stubs into a single 32-byte chunk, which will fit in a | 
|  | 756 | * single cache line on all modern x86 implementations. | 
|  | 757 | */ | 
/*
 * Two sections are interleaved below. The stub code is emitted into .text,
 * and after each stub the sequence ".previous / .quad 1b / .text" switches
 * back to .init.rodata, appends the address of the stub just emitted to the
 * table that starts at the "interrupt" label, and returns to .text.
 */
|  | 758 | .section .init.rodata,"a" | 
|  | 759 | ENTRY(interrupt) | 
|  | 760 | .text | 
|  | 761 | .p2align 5 | 
|  | 762 | .p2align CONFIG_X86_L1_CACHE_SHIFT | 
|  | 763 | ENTRY(irq_entries_start) | 
|  | 764 | INTR_FRAME | 
|  | 765 | vector=FIRST_EXTERNAL_VECTOR | 
/* outer loop: one 32-byte-aligned chunk per group of 7 vectors, rounded up */
|  | 766 | .rept (NR_VECTORS-FIRST_EXTERNAL_VECTOR+6)/7 | 
|  | 767 | .balign 32 | 
|  | 768 | .rept	7 | 
|  | 769 | .if vector < NR_VECTORS | 
/* every stub is a separate entry point: cancel the +8 recorded for the previous stub's push */
| H. Peter Anvin | 8665596 | 2008-11-12 10:27:35 -0800 | [diff] [blame] | 770 | .if vector <> FIRST_EXTERNAL_VECTOR | 
| H. Peter Anvin | 939b787 | 2008-11-11 13:51:52 -0800 | [diff] [blame] | 771 | CFI_ADJUST_CFA_OFFSET -8 | 
|  | 772 | .endif | 
|  | 773 | 1:	pushq $(~vector+0x80)	/* Note: always in signed byte range */ | 
|  | 774 | CFI_ADJUST_CFA_OFFSET 8 | 
/* the 7th stub of a chunk needs no jump: it falls through to the shared "2:" jump */
| H. Peter Anvin | 8665596 | 2008-11-12 10:27:35 -0800 | [diff] [blame] | 775 | .if ((vector-FIRST_EXTERNAL_VECTOR)%7) <> 6 | 
| H. Peter Anvin | 939b787 | 2008-11-11 13:51:52 -0800 | [diff] [blame] | 776 | jmp 2f | 
|  | 777 | .endif | 
/* record the address of this stub in the pointer table, then resume emitting code */
|  | 778 | .previous | 
|  | 779 | .quad 1b | 
|  | 780 | .text | 
|  | 781 | vector=vector+1 | 
|  | 782 | .endif | 
|  | 783 | .endr | 
|  | 784 | 2:	jmp common_interrupt | 
|  | 785 | .endr | 
|  | 786 | CFI_ENDPROC | 
|  | 787 | END(irq_entries_start) | 
|  | 788 |  | 
/* switch back to the table section to close the "interrupt" symbol, then return to the code section */
|  | 789 | .previous | 
|  | 790 | END(interrupt) | 
|  | 791 | .previous | 
|  | 792 |  | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 793 | /* | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 794 | * Interrupt entry/exit. | 
|  | 795 | * | 
|  | 796 | * Interrupt entry points save only callee clobbered registers in fast path. | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 797 | * | 
|  | 798 | * Entry runs with interrupts off. | 
|  | 799 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 800 |  | 
/*
 * interrupt func: shared body of the interrupt entry points. Reserves
 * 10*8 bytes of stack below the value described in the next comment,
 * calls save_args and then calls \func.
 * NOTE(review): save_args is defined outside this chunk; the users of this
 * macro later undo its effects with "decl PER_CPU_VAR(irq_count)" and
 * "leaveq", so it presumably sets up %rbp and bumps irq_count - confirm.
 */
| Alexander van Heukelum | 722024d | 2008-11-13 13:50:20 +0100 | [diff] [blame] | 801 | /* 0(%rsp): ~(interrupt number) */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 802 | .macro interrupt func | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 803 | subq $10*8, %rsp | 
|  | 804 | CFI_ADJUST_CFA_OFFSET 10*8 | 
|  | 805 | call save_args | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 806 | PARTIAL_FRAME 0 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 807 | call \func | 
|  | 808 | .endm | 
|  | 809 |  | 
| Alexander van Heukelum | 722024d | 2008-11-13 13:50:20 +0100 | [diff] [blame] | 810 | /* | 
|  | 811 | * The interrupt stubs push (~vector+0x80) onto the stack and | 
|  | 812 | * then jump to common_interrupt. | 
|  | 813 | */ | 
/*
 * common_interrupt: target of every stub in irq_entries_start. Rebases the
 * value the stub pushed, calls do_IRQ through the interrupt macro, and then
 * picks a return path from the privilege bits of the saved CS:
 *   - interrupted user mode: process the work flags selected by %edi
 *     (reschedule, then signal delivery) and leave via retint_swapgs;
 *   - interrupted kernel mode: go to retint_kernel.
 * Both paths end at irq_return (INTERRUPT_RETURN).
 */
| H. Peter Anvin | 939b787 | 2008-11-11 13:51:52 -0800 | [diff] [blame] | 814 | .p2align CONFIG_X86_L1_CACHE_SHIFT | 
|  | 815 | common_interrupt: | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 816 | XCPT_FRAME | 
| Alexander van Heukelum | 722024d | 2008-11-13 13:50:20 +0100 | [diff] [blame] | 817 | addq $-0x80,(%rsp)		/* Adjust vector to [-256,-1] range */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 818 | interrupt do_IRQ | 
| Brian Gerst | 3d1e42a | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 819 | /* 0(%rsp): old_rsp-ARGOFFSET */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 820 | ret_from_intr: | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 821 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 822 | TRACE_IRQS_OFF | 
/* NOTE(review): presumably undoes an increment and frame setup done in save_args (not visible here) - confirm */
| Brian Gerst | 5689553 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 823 | decl PER_CPU_VAR(irq_count) | 
| Jan Beulich | 1de9c3f | 2006-06-26 13:57:35 +0200 | [diff] [blame] | 824 | leaveq | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 825 | CFI_DEF_CFA_REGISTER	rsp | 
| Jan Beulich | 1de9c3f | 2006-06-26 13:57:35 +0200 | [diff] [blame] | 826 | CFI_ADJUST_CFA_OFFSET	-8 | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 827 | exit_intr: | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 828 | GET_THREAD_INFO(%rcx) | 
/* the low two bits of the saved CS are the privilege level: zero means kernel code was interrupted */
|  | 829 | testl $3,CS-ARGOFFSET(%rsp) | 
|  | 830 | je retint_kernel | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 831 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 832 | /* Interrupt came from user space */ | 
|  | 833 | /* | 
|  | 834 | * Has a correct top of stack, but a partial stack frame | 
|  | 835 | * %rcx: thread info. Interrupts off. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 836 | */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 837 | retint_with_reschedule: | 
|  | 838 | movl $_TIF_WORK_MASK,%edi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 839 | retint_check: | 
| Peter Zijlstra | 10cd706 | 2007-10-11 22:11:12 +0200 | [diff] [blame] | 840 | LOCKDEP_SYS_EXIT_IRQ | 
/* edx = pending work: thread flags filtered by the mask in edi */
| Glauber Costa | 26ccb8a | 2008-06-24 11:19:35 -0300 | [diff] [blame] | 841 | movl TI_flags(%rcx),%edx | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 842 | andl %edi,%edx | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 843 | CFI_REMEMBER_STATE | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 844 | jnz  retint_careful | 
| Peter Zijlstra | 10cd706 | 2007-10-11 22:11:12 +0200 | [diff] [blame] | 845 |  | 
|  | 846 | retint_swapgs:		/* return to user-space */ | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 847 | /* | 
|  | 848 | * The iretq could re-enable interrupts: | 
|  | 849 | */ | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 850 | DISABLE_INTERRUPTS(CLBR_ANY) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 851 | TRACE_IRQS_IRETQ | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 852 | SWAPGS | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 853 | jmp restore_args | 
|  | 854 |  | 
| Peter Zijlstra | 10cd706 | 2007-10-11 22:11:12 +0200 | [diff] [blame] | 855 | retint_restore_args:	/* return to kernel space */ | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 856 | DISABLE_INTERRUPTS(CLBR_ANY) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 857 | /* | 
|  | 858 | * The iretq could re-enable interrupts: | 
|  | 859 | */ | 
|  | 860 | TRACE_IRQS_IRETQ | 
|  | 861 | restore_args: | 
| Ingo Molnar | 3701d863 | 2008-02-09 23:24:08 +0100 | [diff] [blame] | 862 | RESTORE_ARGS 0,8,0 | 
|  | 863 |  | 
| Adrian Bunk | f7f3d79 | 2008-02-13 23:29:53 +0200 | [diff] [blame] | 864 | irq_return: | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 865 | INTERRUPT_RETURN | 
| Ingo Molnar | 3701d863 | 2008-02-09 23:24:08 +0100 | [diff] [blame] | 866 |  | 
/* exception-table entry pairing the instruction at irq_return with the bad_iret fixup */
|  | 867 | .section __ex_table, "a" | 
|  | 868 | .quad irq_return, bad_iret | 
|  | 869 | .previous | 
|  | 870 |  | 
|  | 871 | #ifdef CONFIG_PARAVIRT | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 872 | ENTRY(native_iret) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 873 | iretq | 
|  | 874 |  | 
/* same fixup for the iretq in native_iret */
|  | 875 | .section __ex_table,"a" | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 876 | .quad native_iret, bad_iret | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 877 | .previous | 
| Ingo Molnar | 3701d863 | 2008-02-09 23:24:08 +0100 | [diff] [blame] | 878 | #endif | 
|  | 879 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 880 | .section .fixup,"ax" | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 881 | bad_iret: | 
| Roland McGrath | 3aa4b37 | 2008-02-06 22:39:43 +0100 | [diff] [blame] | 882 | /* | 
|  | 883 | * The iret traps when the %cs or %ss being restored is bogus. | 
|  | 884 | * We've lost the original trap vector and error code. | 
|  | 885 | * #GPF is the most likely one to get for an invalid selector. | 
|  | 886 | * So pretend we completed the iret and took the #GPF in user mode. | 
|  | 887 | * | 
|  | 888 | * We are now running with the kernel GS after exception recovery. | 
|  | 889 | * But error_entry expects us to have user GS to match the user %cs, | 
|  | 890 | * so swap back. | 
|  | 891 | */ | 
/* NOTE(review): presumably a zero error code for the simulated #GPF - confirm against general_protection */
|  | 892 | pushq $0 | 
|  | 893 |  | 
|  | 894 | SWAPGS | 
|  | 895 | jmp general_protection | 
|  | 896 |  | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 897 | .previous | 
|  | 898 |  | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 899 | /* edi: workmask, edx: work */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 900 | retint_careful: | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 901 | CFI_RESTORE_STATE | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 902 | bt    $TIF_NEED_RESCHED,%edx | 
|  | 903 | jnc   retint_signal | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 904 | TRACE_IRQS_ON | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 905 | ENABLE_INTERRUPTS(CLBR_NONE) | 
/* keep the work mask in edi alive across the call to schedule */
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 906 | pushq %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 907 | CFI_ADJUST_CFA_OFFSET	8 | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 908 | call  schedule | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 909 | popq %rdi | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 910 | CFI_ADJUST_CFA_OFFSET	-8 | 
/* reload rcx (thread info) after the call, then re-test the flags with interrupts off */
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 911 | GET_THREAD_INFO(%rcx) | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 912 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 913 | TRACE_IRQS_OFF | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 914 | jmp retint_check | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 915 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 916 | retint_signal: | 
| Peter Zijlstra | 8f4d37e | 2008-01-25 21:08:29 +0100 | [diff] [blame] | 917 | testl $_TIF_DO_NOTIFY_MASK,%edx | 
| Andi Kleen | 10ffdbb | 2005-05-16 21:53:19 -0700 | [diff] [blame] | 918 | jz    retint_swapgs | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 919 | TRACE_IRQS_ON | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 920 | ENABLE_INTERRUPTS(CLBR_NONE) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 921 | SAVE_REST | 
/* NOTE(review): -1 in ORIG_RAX presumably marks the frame as not coming from a system call - confirm */
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 922 | movq $-1,ORIG_RAX(%rsp) | 
| Andi Kleen | 3829ee6 | 2005-07-28 21:15:48 -0700 | [diff] [blame] | 923 | xorl %esi,%esi		# oldset | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 924 | movq %rsp,%rdi		# &pt_regs | 
|  | 925 | call do_notify_resume | 
|  | 926 | RESTORE_REST | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 927 | DISABLE_INTERRUPTS(CLBR_NONE) | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 928 | TRACE_IRQS_OFF | 
| Andi Kleen | be9e687 | 2005-05-01 08:58:51 -0700 | [diff] [blame] | 929 | GET_THREAD_INFO(%rcx) | 
| Roland McGrath | eca91e7 | 2008-07-10 14:50:39 -0700 | [diff] [blame] | 930 | jmp retint_with_reschedule | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 931 |  | 
/* NOTE(review): retint_kernel is only defined here under CONFIG_PREEMPT; the non-preempt definition is not visible in this chunk */
|  | 932 | #ifdef CONFIG_PREEMPT | 
|  | 933 | /* Returning to kernel space. Check if we need preemption */ | 
|  | 934 | /* rcx:	 threadinfo. interrupts off. */ | 
| Andi Kleen | b06baba | 2006-09-26 10:52:29 +0200 | [diff] [blame] | 935 | ENTRY(retint_kernel) | 
/* preempt only if preempt_count is zero, a reschedule is pending and the interrupted code had interrupts enabled */
| Glauber Costa | 26ccb8a | 2008-06-24 11:19:35 -0300 | [diff] [blame] | 936 | cmpl $0,TI_preempt_count(%rcx) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 937 | jnz  retint_restore_args | 
| Glauber Costa | 26ccb8a | 2008-06-24 11:19:35 -0300 | [diff] [blame] | 938 | bt  $TIF_NEED_RESCHED,TI_flags(%rcx) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 939 | jnc  retint_restore_args | 
|  | 940 | bt   $9,EFLAGS-ARGOFFSET(%rsp)	/* interrupts off? */ | 
|  | 941 | jnc  retint_restore_args | 
|  | 942 | call preempt_schedule_irq | 
|  | 943 | jmp exit_intr | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 944 | #endif | 
| Jan Beulich | 4b787e0 | 2006-06-26 13:56:55 +0200 | [diff] [blame] | 945 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 946 | CFI_ENDPROC | 
| Jan Beulich | 4b787e0 | 2006-06-26 13:56:55 +0200 | [diff] [blame] | 947 | END(common_interrupt) | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 948 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 949 | /* | 
|  | 950 | * APIC interrupts. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 951 | */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 952 | .macro apicinterrupt num sym do_sym | 
|  | 953 | ENTRY(\sym) /* emits entry stub sym: pushes ~num, runs do_sym through the interrupt macro, leaves via ret_from_intr */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 954 | INTR_FRAME | 
| Rusty Russell | 19eadf9 | 2006-06-27 02:53:44 -0700 | [diff] [blame] | 955 | pushq $~(\num) /* push the bitwise complement of the vector number */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 956 | CFI_ADJUST_CFA_OFFSET 8 /* unwind info: account for the 8-byte push above */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 957 | interrupt \do_sym /* interrupt macro is defined elsewhere in this file; presumably saves registers and calls do_sym - confirm */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 958 | jmp ret_from_intr | 
|  | 959 | CFI_ENDPROC | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 960 | END(\sym) | 
|  | 961 | .endm | 
| Jacob Shin | 89b831e | 2005-11-05 17:25:53 +0100 | [diff] [blame] | 962 |  | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 963 | #ifdef CONFIG_SMP | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 964 | apicinterrupt IRQ_MOVE_CLEANUP_VECTOR \ | 
|  | 965 | irq_move_cleanup_interrupt smp_irq_move_cleanup_interrupt | 
| Andi Kleen | 4ef702c | 2009-05-27 21:56:52 +0200 | [diff] [blame] | 966 | apicinterrupt REBOOT_VECTOR \ | 
|  | 967 | reboot_interrupt smp_reboot_interrupt | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 968 | #endif | 
|  | 969 |  | 
| Nick Piggin | 03b4863 | 2009-01-20 04:36:04 +0100 | [diff] [blame] | 970 | #ifdef CONFIG_X86_UV | 
| Cyrill Gorcunov | 5ae3a13 | 2008-11-27 00:02:10 +0300 | [diff] [blame] | 971 | apicinterrupt UV_BAU_MESSAGE \ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 972 | uv_bau_message_intr1 uv_bau_message_interrupt | 
| Nick Piggin | 03b4863 | 2009-01-20 04:36:04 +0100 | [diff] [blame] | 973 | #endif | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 974 | apicinterrupt LOCAL_TIMER_VECTOR \ | 
|  | 975 | apic_timer_interrupt smp_apic_timer_interrupt | 
| Dimitri Sivanich | acaabe7 | 2009-03-04 12:56:05 -0600 | [diff] [blame] | 976 | apicinterrupt GENERIC_INTERRUPT_VECTOR \ | 
|  | 977 | generic_interrupt smp_generic_interrupt | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 978 |  | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 979 | #ifdef CONFIG_SMP | 
|  | 980 | apicinterrupt INVALIDATE_TLB_VECTOR_START+0 \ | 
|  | 981 | invalidate_interrupt0 smp_invalidate_interrupt | 
|  | 982 | apicinterrupt INVALIDATE_TLB_VECTOR_START+1 \ | 
|  | 983 | invalidate_interrupt1 smp_invalidate_interrupt | 
|  | 984 | apicinterrupt INVALIDATE_TLB_VECTOR_START+2 \ | 
|  | 985 | invalidate_interrupt2 smp_invalidate_interrupt | 
|  | 986 | apicinterrupt INVALIDATE_TLB_VECTOR_START+3 \ | 
|  | 987 | invalidate_interrupt3 smp_invalidate_interrupt | 
|  | 988 | apicinterrupt INVALIDATE_TLB_VECTOR_START+4 \ | 
|  | 989 | invalidate_interrupt4 smp_invalidate_interrupt | 
|  | 990 | apicinterrupt INVALIDATE_TLB_VECTOR_START+5 \ | 
|  | 991 | invalidate_interrupt5 smp_invalidate_interrupt | 
|  | 992 | apicinterrupt INVALIDATE_TLB_VECTOR_START+6 \ | 
|  | 993 | invalidate_interrupt6 smp_invalidate_interrupt | 
|  | 994 | apicinterrupt INVALIDATE_TLB_VECTOR_START+7 \ | 
|  | 995 | invalidate_interrupt7 smp_invalidate_interrupt | 
|  | 996 | #endif | 
| Cliff Wickman | 1812924 | 2008-06-02 08:56:14 -0500 | [diff] [blame] | 997 |  | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 998 | apicinterrupt THRESHOLD_APIC_VECTOR \ | 
| Andi Kleen | 7856f6c | 2009-04-28 23:32:56 +0200 | [diff] [blame] | 999 | threshold_interrupt smp_threshold_interrupt | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1000 | apicinterrupt THERMAL_APIC_VECTOR \ | 
|  | 1001 | thermal_interrupt smp_thermal_interrupt | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1002 |  | 
| Andi Kleen | ccc3c31 | 2009-05-27 21:56:54 +0200 | [diff] [blame] | 1003 | #ifdef CONFIG_X86_MCE | 
|  | 1004 | apicinterrupt MCE_SELF_VECTOR \ | 
|  | 1005 | mce_self_interrupt smp_mce_self_interrupt | 
|  | 1006 | #endif | 
|  | 1007 |  | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1008 | #ifdef CONFIG_SMP | 
|  | 1009 | apicinterrupt CALL_FUNCTION_SINGLE_VECTOR \ | 
|  | 1010 | call_function_single_interrupt smp_call_function_single_interrupt | 
|  | 1011 | apicinterrupt CALL_FUNCTION_VECTOR \ | 
|  | 1012 | call_function_interrupt smp_call_function_interrupt | 
|  | 1013 | apicinterrupt RESCHEDULE_VECTOR \ | 
|  | 1014 | reschedule_interrupt smp_reschedule_interrupt | 
|  | 1015 | #endif | 
|  | 1016 |  | 
|  | 1017 | apicinterrupt ERROR_APIC_VECTOR \ | 
|  | 1018 | error_interrupt smp_error_interrupt | 
|  | 1019 | apicinterrupt SPURIOUS_APIC_VECTOR \ | 
|  | 1020 | spurious_interrupt smp_spurious_interrupt | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1021 |  | 
| Ingo Molnar | 241771e | 2008-12-03 10:39:53 +0100 | [diff] [blame] | 1022 | #ifdef CONFIG_PERF_COUNTERS | 
| Peter Zijlstra | b6276f3 | 2009-04-06 11:45:03 +0200 | [diff] [blame] | 1023 | apicinterrupt LOCAL_PENDING_VECTOR \ | 
|  | 1024 | perf_pending_interrupt smp_perf_pending_interrupt | 
| Ingo Molnar | 241771e | 2008-12-03 10:39:53 +0100 | [diff] [blame] | 1025 | #endif | 
|  | 1026 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1027 | /* | 
|  | 1028 | * Exception entry points. | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1029 | */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1030 | .macro zeroentry sym do_sym | 
|  | 1031 | ENTRY(\sym) /* emits exception stub sym that calls do_sym with %rdi = pt_regs pointer and %esi = 0 (no error code) */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1032 | INTR_FRAME | 
| Jeremy Fitzhardinge | fab5842 | 2008-06-25 00:19:31 -0400 | [diff] [blame] | 1033 | PARAVIRT_ADJUST_EXCEPTION_FRAME | 
| Ingo Molnar | 14ae22b | 2008-11-21 15:20:47 +0100 | [diff] [blame] | 1034 | pushq_cfi $-1		/* ORIG_RAX: no syscall to restart */ | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 1035 | subq $15*8,%rsp /* reserve 15 quadwords below the ORIG_RAX slot; presumably filled in by error_entry - confirm */ | 
|  | 1036 | CFI_ADJUST_CFA_OFFSET 15*8 /* unwind info: account for the subq above */ | 
|  | 1037 | call error_entry | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 1038 | DEFAULT_FRAME 0 | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 1039 | movq %rsp,%rdi		/* pt_regs pointer */ | 
|  | 1040 | xorl %esi,%esi		/* no error code */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1041 | call \do_sym /* do_sym(pt_regs, 0) */ | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 1042 | jmp error_exit		/* %ebx: no swapgs flag */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1043 | CFI_ENDPROC | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1044 | END(\sym) | 
|  | 1045 | .endm | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1046 |  | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1047 | .macro paranoidzeroentry sym do_sym | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1048 | ENTRY(\sym) /* like zeroentry, but saves state with save_paranoid and leaves via paranoid_exit */ | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1049 | INTR_FRAME | 
|  | 1050 | PARAVIRT_ADJUST_EXCEPTION_FRAME | 
|  | 1051 | pushq $-1		/* ORIG_RAX: no syscall to restart */ | 
|  | 1052 | CFI_ADJUST_CFA_OFFSET 8 | 
|  | 1053 | subq $15*8, %rsp /* NOTE(review): no CFI_ADJUST_CFA_OFFSET 15*8 follows, unlike zeroentry, errorentry and paranoiderrorentry - confirm the unwind info is intended */ | 
|  | 1054 | call save_paranoid | 
|  | 1055 | TRACE_IRQS_OFF | 
|  | 1056 | movq %rsp,%rdi		/* pt_regs pointer */ | 
|  | 1057 | xorl %esi,%esi		/* no error code */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1058 | call \do_sym /* do_sym may be an indirect operand, as in the machine_check instantiation */ | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1059 | jmp paranoid_exit	/* %ebx: no swapgs flag */ | 
|  | 1060 | CFI_ENDPROC | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1061 | END(\sym) | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1062 | .endm | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1063 |  | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1064 | .macro paranoidzeroentry_ist sym do_sym ist | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1065 | ENTRY(\sym) /* like paranoidzeroentry, but lowers TSS IST slot number ist by EXCEPTION_STKSZ around the handler call */ | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1066 | INTR_FRAME | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1067 | PARAVIRT_ADJUST_EXCEPTION_FRAME | 
|  | 1068 | pushq $-1		/* ORIG_RAX: no syscall to restart */ | 
|  | 1069 | CFI_ADJUST_CFA_OFFSET 8 | 
|  | 1070 | subq $15*8, %rsp /* NOTE(review): no CFI_ADJUST_CFA_OFFSET 15*8 follows, unlike zeroentry, errorentry and paranoiderrorentry - confirm the unwind info is intended */ | 
|  | 1071 | call save_paranoid | 
|  | 1072 | TRACE_IRQS_OFF | 
|  | 1073 | movq %rsp,%rdi		/* pt_regs pointer */ | 
|  | 1074 | xorl %esi,%esi		/* no error code */ | 
| Tejun Heo | 9939dda | 2009-01-13 20:41:35 +0900 | [diff] [blame] | 1075 | PER_CPU(init_tss, %rbp) /* %rbp = address of the per-cpu init_tss (presumably this CPU's copy - confirm against PER_CPU) */ | 
|  | 1076 | subq $EXCEPTION_STKSZ, TSS_ist + (\ist - 1) * 8(%rbp) /* move the IST entry down while the handler runs; presumably so a nested exception on this IST gets a separate stack area - confirm */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1077 | call \do_sym | 
| Tejun Heo | 9939dda | 2009-01-13 20:41:35 +0900 | [diff] [blame] | 1078 | addq $EXCEPTION_STKSZ, TSS_ist + (\ist - 1) * 8(%rbp) /* undo the adjustment; relies on %rbp being preserved across the call (callee-saved in the SysV ABI) */ | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1079 | jmp paranoid_exit	/* %ebx: no swapgs flag */ | 
|  | 1080 | CFI_ENDPROC | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1081 | END(\sym) | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1082 | .endm | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1083 |  | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1084 | .macro errorentry sym do_sym | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1085 | ENTRY(\sym) /* emits exception stub sym that calls do_sym with %rdi = pt_regs pointer and %rsi = the error code read from the ORIG_RAX slot */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1086 | XCPT_FRAME | 
| Jeremy Fitzhardinge | fab5842 | 2008-06-25 00:19:31 -0400 | [diff] [blame] | 1087 | PARAVIRT_ADJUST_EXCEPTION_FRAME | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 1088 | subq $15*8,%rsp /* reserve 15 quadwords below the error code; presumably filled in by error_entry - confirm */ | 
|  | 1089 | CFI_ADJUST_CFA_OFFSET 15*8 /* unwind info: account for the subq above */ | 
|  | 1090 | call error_entry | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 1091 | DEFAULT_FRAME 0 | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 1092 | movq %rsp,%rdi			/* pt_regs pointer */ | 
|  | 1093 | movq ORIG_RAX(%rsp),%rsi	/* get error code */ | 
|  | 1094 | movq $-1,ORIG_RAX(%rsp)		/* no syscall to restart */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1095 | call \do_sym /* do_sym(pt_regs, error_code) */ | 
| Alexander van Heukelum | d99015b | 2008-11-19 01:18:11 +0100 | [diff] [blame] | 1096 | jmp error_exit			/* %ebx: no swapgs flag */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1097 | CFI_ENDPROC | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1098 | END(\sym) | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1099 | .endm | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1100 |  | 
|  | 1101 | /* error code is on the stack already */ | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1102 | .macro paranoiderrorentry sym do_sym | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1103 | ENTRY(\sym) /* like errorentry, but saves state with save_paranoid and leaves via paranoid_exit */ | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1104 | XCPT_FRAME | 
|  | 1105 | PARAVIRT_ADJUST_EXCEPTION_FRAME | 
|  | 1106 | subq $15*8,%rsp /* reserve 15 quadwords below the error code; presumably filled in by save_paranoid - confirm */ | 
| Alexander van Heukelum | e2f6bc2 | 2008-11-21 16:43:18 +0100 | [diff] [blame] | 1107 | CFI_ADJUST_CFA_OFFSET 15*8 /* unwind info: account for the subq above */ | 
|  | 1108 | call save_paranoid | 
|  | 1109 | DEFAULT_FRAME 0 | 
| Alexander van Heukelum | 7e61a79 | 2008-09-26 14:03:03 +0200 | [diff] [blame] | 1110 | TRACE_IRQS_OFF | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1111 | movq %rsp,%rdi			/* pt_regs pointer */ | 
|  | 1112 | movq ORIG_RAX(%rsp),%rsi	/* get error code */ | 
|  | 1113 | movq $-1,ORIG_RAX(%rsp)		/* no syscall to restart */ | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1114 | call \do_sym /* do_sym(pt_regs, error_code) */ | 
| Alexander van Heukelum | b8b1d08 | 2008-11-21 16:44:28 +0100 | [diff] [blame] | 1115 | jmp paranoid_exit		/* %ebx: no swapgs flag */ | 
|  | 1116 | CFI_ENDPROC | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1117 | END(\sym) | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1118 | .endm | 
|  | 1119 |  | 
|  | 1120 | zeroentry divide_error do_divide_error | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1121 | zeroentry overflow do_overflow | 
|  | 1122 | zeroentry bounds do_bounds | 
|  | 1123 | zeroentry invalid_op do_invalid_op | 
|  | 1124 | zeroentry device_not_available do_device_not_available | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1125 | paranoiderrorentry double_fault do_double_fault | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1126 | zeroentry coprocessor_segment_overrun do_coprocessor_segment_overrun | 
|  | 1127 | errorentry invalid_TSS do_invalid_TSS | 
|  | 1128 | errorentry segment_not_present do_segment_not_present | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1129 | zeroentry spurious_interrupt_bug do_spurious_interrupt_bug | 
|  | 1130 | zeroentry coprocessor_error do_coprocessor_error | 
|  | 1131 | errorentry alignment_check do_alignment_check | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1132 | zeroentry simd_coprocessor_error do_simd_coprocessor_error | 
| Ingo Molnar | 2601e64 | 2006-07-03 00:24:45 -0700 | [diff] [blame] | 1133 |  | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1134 | /* Reload gs selector with exception handling */ | 
|  | 1135 | /* edi:  new selector */ | 
| Jeremy Fitzhardinge | 9f9d489 | 2008-06-25 00:19:32 -0400 | [diff] [blame] | 1136 | ENTRY(native_load_gs_index) /* loads the selector in %edi into %gs between two SWAPGS, with interrupts disabled; a faulting load is redirected to bad_gs */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1137 | CFI_STARTPROC | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1138 | pushf /* save the caller's flags; the popf below restores them */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1139 | CFI_ADJUST_CFA_OFFSET 8 | 
| Jeremy Fitzhardinge | b8aa287 | 2009-01-28 14:35:03 -0800 | [diff] [blame] | 1140 | DISABLE_INTERRUPTS(CLBR_ANY & ~CLBR_RDI) /* clobber mask excludes rdi, which still holds the new selector */ | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1141 | SWAPGS | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1142 | gs_change: | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1143 | movl %edi,%gs /* the __ex_table entry for gs_change sends a fault on this load to bad_gs */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1144 | 2:	mfence		/* workaround */ | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 1145 | SWAPGS | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1146 | popf | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1147 | CFI_ADJUST_CFA_OFFSET -8 | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1148 | ret | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1149 | CFI_ENDPROC | 
| Alexander van Heukelum | 6efdcfa | 2008-11-23 10:15:32 +0100 | [diff] [blame] | 1150 | END(native_load_gs_index) | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1151 |  | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1152 | .section __ex_table,"a" | 
|  | 1153 | .align 8 | 
|  | 1154 | .quad gs_change,bad_gs /* exception table pair: faulting address gs_change, fixup address bad_gs */ | 
|  | 1155 | .previous | 
|  | 1156 | .section .fixup,"ax" | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1157 | /* running with kernelgs */ | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1158 | bad_gs: | 
| Glauber de Oliveira Costa | 72fe485 | 2008-01-30 13:32:08 +0100 | [diff] [blame] | 1159 | SWAPGS			/* switch back to user gs */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1160 | xorl %eax,%eax /* eax = 0 */ | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1161 | movl %eax,%gs /* load selector 0 in place of the one that faulted */ | 
|  | 1162 | jmp  2b /* resume at the mfence in native_load_gs_index */ | 
|  | 1163 | .previous | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1164 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1165 | /* | 
|  | 1166 | * Create a kernel thread. | 
|  | 1167 | * | 
|  | 1168 | * C extern interface: | 
|  | 1169 | *	extern long kernel_thread(int (*fn)(void *), void * arg, unsigned long flags) | 
|  | 1170 | * | 
|  | 1171 | * asm input arguments: | 
|  | 1172 | *	rdi: fn, rsi: arg, rdx: flags | 
|  | 1173 | */ | 
|  | 1174 | ENTRY(kernel_thread) /* builds a fake frame naming child_rip, calls do_fork, and returns do_fork's result in %rax */ | 
|  | 1175 | CFI_STARTPROC | 
|  | 1176 | FAKE_STACK_FRAME $child_rip /* child_rip is presumably the saved RIP at which the child starts - confirm against FAKE_STACK_FRAME */ | 
|  | 1177 | SAVE_ALL | 
|  | 1178 |  | 
|  | 1179 | # rdi: flags, rsi: usp, rdx: will be &pt_regs | 
|  | 1180 | movq %rdx,%rdi /* caller's flags argument becomes the first do_fork argument */ | 
|  | 1181 | orq  kernel_thread_flags(%rip),%rdi /* OR in the flag bits stored at kernel_thread_flags */ | 
|  | 1182 | movq $-1, %rsi /* usp = -1 */ | 
|  | 1183 | movq %rsp, %rdx /* &pt_regs = the frame just saved */ | 
|  | 1184 |  | 
|  | 1185 | xorl %r8d,%r8d /* fifth argument = 0 */ | 
|  | 1186 | xorl %r9d,%r9d /* sixth argument = 0 */ | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1187 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1188 | # clone now | 
|  | 1189 | call do_fork | 
|  | 1190 | movq %rax,RAX(%rsp) /* store the result in the saved RAX slot so RESTORE_ALL reloads it into %rax */ | 
|  | 1191 | xorl %edi,%edi /* NOTE(review): looks redundant if RESTORE_ALL reloads %rdi - confirm */ | 
|  | 1192 |  | 
|  | 1193 | /* | 
|  | 1194 | * It isn't worth checking for reschedule here, | 
|  | 1195 | * so internally to the x86_64 port you can rely on kernel_thread() | 
|  | 1196 | * not to reschedule the child before returning, this avoids the need | 
|  | 1197 | * of hacks for example to fork off the per-CPU idle tasks. | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1198 | * [Hopefully no generic code relies on the reschedule -AK] | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1199 | */ | 
|  | 1200 | RESTORE_ALL | 
|  | 1201 | UNFAKE_STACK_FRAME | 
|  | 1202 | ret | 
|  | 1203 | CFI_ENDPROC | 
| Alexander van Heukelum | 6efdcfa | 2008-11-23 10:15:32 +0100 | [diff] [blame] | 1204 | END(kernel_thread) | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1205 |  | 
| Cyrill Gorcunov | c2c631e | 2008-11-26 22:17:00 +0300 | [diff] [blame] | 1206 | ENTRY(child_rip) /* calls fn(arg) with the values kernel_thread received, then passes the result to do_exit */ | 
| Andi Kleen | c05991e | 2006-08-30 19:37:08 +0200 | [diff] [blame] | 1207 | pushq $0		# fake return address | 
|  | 1208 | CFI_STARTPROC | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1209 | /* | 
|  | 1210 | * Here we are in the child and the registers are set as they were | 
|  | 1211 | * at kernel_thread() invocation in the parent. | 
|  | 1212 | */ | 
|  | 1213 | movq %rdi, %rax /* rax = fn */ | 
|  | 1214 | movq %rsi, %rdi /* first argument = arg */ | 
|  | 1215 | call *%rax /* fn(arg) */ | 
|  | 1216 | # exit | 
| Andrey Mirkin | 1c5b5cf | 2007-10-17 18:04:33 +0200 | [diff] [blame] | 1217 | mov %eax, %edi /* the int returned by fn becomes the do_exit argument */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1218 | call do_exit | 
| jia zhang | 5f5db59 | 2008-11-23 22:47:10 +0800 | [diff] [blame] | 1219 | ud2			# padding for call trace | 
| Andi Kleen | c05991e | 2006-08-30 19:37:08 +0200 | [diff] [blame] | 1220 | CFI_ENDPROC | 
| Alexander van Heukelum | 6efdcfa | 2008-11-23 10:15:32 +0100 | [diff] [blame] | 1221 | END(child_rip) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1222 |  | 
|  | 1223 | /* | 
|  | 1224 | * execve(). This function needs to use IRET, not SYSRET, to set up all state properly. | 
|  | 1225 | * | 
|  | 1226 | * C extern interface: | 
|  | 1227 | *	 extern long execve(char *name, char **argv, char **envp) | 
|  | 1228 | * | 
|  | 1229 | * asm input arguments: | 
|  | 1230 | *	rdi: name, rsi: argv, rdx: envp | 
|  | 1231 | * | 
|  | 1232 | * We want to fallback into: | 
| Ingo Molnar | 5d119b2 | 2008-02-26 12:55:57 +0100 | [diff] [blame] | 1233 | *	extern long sys_execve(char *name, char **argv,char **envp, struct pt_regs *regs) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1234 | * | 
|  | 1235 | * sys_execve asm fallback arguments: | 
| Ingo Molnar | 5d119b2 | 2008-02-26 12:55:57 +0100 | [diff] [blame] | 1236 | *	rdi: name, rsi: argv, rdx: envp, rcx: fake frame on the stack | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1237 | */ | 
| Arnd Bergmann | 3db03b4 | 2006-10-02 02:18:31 -0700 | [diff] [blame] | 1238 | ENTRY(kernel_execve) /* calls sys_execve with a fake frame as its pt_regs argument; a zero result leaves via int_ret_from_sys_call, any other result returns to the caller */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1239 | CFI_STARTPROC | 
|  | 1240 | FAKE_STACK_FRAME $0 | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1241 | SAVE_ALL | 
| Ingo Molnar | 5d119b2 | 2008-02-26 12:55:57 +0100 | [diff] [blame] | 1242 | movq %rsp,%rcx /* fourth argument: pointer to the fake frame on the stack */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1243 | call sys_execve | 
| Alexander van Heukelum | 0bd7b79 | 2008-11-16 15:29:00 +0100 | [diff] [blame] | 1244 | movq %rax, RAX(%rsp) /* store the result in the saved RAX slot of the frame */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1245 | RESTORE_REST | 
|  | 1246 | testq %rax,%rax /* the je below is taken when sys_execve returned 0 */ | 
|  | 1247 | je int_ret_from_sys_call | 
|  | 1248 | RESTORE_ARGS /* nonzero result: unwind the fake frame and return to the caller */ | 
|  | 1249 | UNFAKE_STACK_FRAME | 
|  | 1250 | ret | 
|  | 1251 | CFI_ENDPROC | 
| Alexander van Heukelum | 6efdcfa | 2008-11-23 10:15:32 +0100 | [diff] [blame] | 1252 | END(kernel_execve) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1253 |  | 
| Andi Kleen | 2699500 | 2006-08-02 22:37:28 +0200 | [diff] [blame] | 1254 | /* Call softirq on interrupt stack. Interrupts are off. */ | 
| Andi Kleen | ed6b676 | 2005-07-28 21:15:49 -0700 | [diff] [blame] | 1255 | ENTRY(call_softirq) /* runs __do_softirq, switching %rsp to irq_stack_ptr when the irq_count increment yields zero */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1256 | CFI_STARTPROC | 
| Andi Kleen | 2699500 | 2006-08-02 22:37:28 +0200 | [diff] [blame] | 1257 | push %rbp | 
|  | 1258 | CFI_ADJUST_CFA_OFFSET	8 | 
|  | 1259 | CFI_REL_OFFSET rbp,0 | 
|  | 1260 | mov  %rsp,%rbp /* rbp remembers the original stack pointer for leaveq below */ | 
|  | 1261 | CFI_DEF_CFA_REGISTER rbp | 
| Brian Gerst | 5689553 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 1262 | incl PER_CPU_VAR(irq_count) /* sets ZF when the incremented count is zero */ | 
| Brian Gerst | 26f80bd | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 1263 | cmove PER_CPU_VAR(irq_stack_ptr),%rsp /* only when ZF is set: switch to the stack at irq_stack_ptr */ | 
| Andi Kleen | 2699500 | 2006-08-02 22:37:28 +0200 | [diff] [blame] | 1264 | push  %rbp			# backlink for old unwinder | 
| Andi Kleen | ed6b676 | 2005-07-28 21:15:49 -0700 | [diff] [blame] | 1265 | call __do_softirq | 
| Andi Kleen | 2699500 | 2006-08-02 22:37:28 +0200 | [diff] [blame] | 1266 | leaveq /* rsp = rbp, then pop rbp: back on the original stack whether or not it was switched */ | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1267 | CFI_DEF_CFA_REGISTER	rsp | 
| Andi Kleen | 2699500 | 2006-08-02 22:37:28 +0200 | [diff] [blame] | 1268 | CFI_ADJUST_CFA_OFFSET   -8 | 
| Brian Gerst | 5689553 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 1269 | decl PER_CPU_VAR(irq_count) /* undo the increment above */ | 
| Andi Kleen | ed6b676 | 2005-07-28 21:15:49 -0700 | [diff] [blame] | 1270 | ret | 
| Jan Beulich | 7effaa8 | 2005-09-12 18:49:24 +0200 | [diff] [blame] | 1271 | CFI_ENDPROC | 
| Alexander van Heukelum | 6efdcfa | 2008-11-23 10:15:32 +0100 | [diff] [blame] | 1272 | END(call_softirq) | 
| Andi Kleen | 75154f4 | 2007-06-23 02:29:25 +0200 | [diff] [blame] | 1273 |  | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1274 | #ifdef CONFIG_XEN | 
| Alexander van Heukelum | 322648d | 2008-11-23 10:08:28 +0100 | [diff] [blame] | 1275 | zeroentry xen_hypervisor_callback xen_do_hypervisor_callback | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1276 |  | 
|  | 1277 | /* | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1278 | * A note on the "critical region" in our callback handler. | 
|  | 1279 | * We want to avoid stacking callback handlers due to events occurring | 
|  | 1280 | * during handling of the last event. To do this, we keep events disabled | 
|  | 1281 | * until we've done all processing. HOWEVER, we must enable events before | 
|  | 1282 | * popping the stack frame (can't be done atomically) and so it would still | 
|  | 1283 | * be possible to get enough handler activations to overflow the stack. | 
|  | 1284 | * Although unlikely, bugs of that kind are hard to track down, so we'd | 
|  | 1285 | * like to avoid the possibility. | 
|  | 1286 | * So, on entry to the handler we detect whether we interrupted an | 
|  | 1287 | * existing activation in its critical region -- if so, we pop the current | 
|  | 1288 | * activation and restart the handler using the previous one. | 
|  | 1289 | */ | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1290 | ENTRY(xen_do_hypervisor_callback)   # xen_do_hypervisor_callback(struct pt_regs *) | 
|  | 1291 | CFI_STARTPROC | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1292 | /* | 
|  | 1293 | * Since we don't modify %rdi, xen_evtchn_do_upcall(struct pt_regs *) will | 
|  | 1294 | * see the correct pointer to the pt_regs | 
|  | 1295 | */ | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1296 | movq %rdi, %rsp            # we don't return, adjust the stack frame | 
|  | 1297 | CFI_ENDPROC | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 1298 | DEFAULT_FRAME | 
| Brian Gerst | 5689553 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 1299 | 11:	incl PER_CPU_VAR(irq_count) /* sets ZF when the incremented count is zero */ | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1300 | movq %rsp,%rbp /* remember the pt_regs stack pointer; movq leaves ZF untouched */ | 
|  | 1301 | CFI_DEF_CFA_REGISTER rbp | 
| Brian Gerst | 26f80bd | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 1302 | cmovzq PER_CPU_VAR(irq_stack_ptr),%rsp /* only when ZF is set: switch to the stack at irq_stack_ptr */ | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1303 | pushq %rbp			# backlink for old unwinder | 
|  | 1304 | call xen_evtchn_do_upcall | 
|  | 1305 | popq %rsp /* pop the backlink: rsp is again the value saved in rbp above */ | 
|  | 1306 | CFI_DEF_CFA_REGISTER rsp | 
| Brian Gerst | 5689553 | 2009-01-19 00:38:58 +0900 | [diff] [blame] | 1307 | decl PER_CPU_VAR(irq_count) /* undo the increment above */ | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1308 | jmp  error_exit | 
|  | 1309 | CFI_ENDPROC | 
|  | 1310 | END(xen_do_hypervisor_callback) /* must name the same symbol as the ENTRY above so the size annotation lands on it */ | 
|  | 1311 |  | 
|  | 1312 | /* | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1313 | * Hypervisor uses this for application faults while it executes. | 
|  | 1314 | * We get here for two reasons: | 
|  | 1315 | *  1. Fault while reloading DS, ES, FS or GS | 
|  | 1316 | *  2. Fault while executing IRET | 
|  | 1317 | * Category 1 we do not need to fix up as Xen has already reloaded all segment | 
|  | 1318 | * registers that could be reloaded and zeroed the others. | 
|  | 1319 | * Category 2 we fix up by killing the current process. We cannot use the | 
|  | 1320 | * normal Linux return path in this case because if we use the IRET hypercall | 
|  | 1321 | * to pop the stack frame we end up in an infinite loop of failsafe callbacks. | 
|  | 1322 | * We distinguish between categories by comparing each saved segment register | 
|  | 1323 | * with its current contents: any discrepancy means we are in category 1. | 
|  | 1324 | */ | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1325 | ENTRY(xen_failsafe_callback) /* compares live ds, es, fs, gs with the copies saved at 0x10..0x28(%rsp); all equal goes to general_protection, any mismatch goes to error_exit */ | 
| Alexander van Heukelum | dcd072e | 2008-11-20 14:40:11 +0100 | [diff] [blame] | 1326 | INTR_FRAME 1 (6*8) | 
|  | 1327 | /*CFI_REL_OFFSET gs,GS*/ | 
|  | 1328 | /*CFI_REL_OFFSET fs,FS*/ | 
|  | 1329 | /*CFI_REL_OFFSET es,ES*/ | 
|  | 1330 | /*CFI_REL_OFFSET ds,DS*/ | 
|  | 1331 | CFI_REL_OFFSET r11,8 | 
|  | 1332 | CFI_REL_OFFSET rcx,0 | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1333 | movw %ds,%cx /* cx is scratch here; the saved rcx is reloaded from (%rsp) on both paths below */ | 
|  | 1334 | cmpw %cx,0x10(%rsp) /* saved ds */ | 
|  | 1335 | CFI_REMEMBER_STATE | 
|  | 1336 | jne 1f | 
|  | 1337 | movw %es,%cx | 
|  | 1338 | cmpw %cx,0x18(%rsp) /* saved es */ | 
|  | 1339 | jne 1f | 
|  | 1340 | movw %fs,%cx | 
|  | 1341 | cmpw %cx,0x20(%rsp) /* saved fs */ | 
|  | 1342 | jne 1f | 
|  | 1343 | movw %gs,%cx | 
|  | 1344 | cmpw %cx,0x28(%rsp) /* saved gs */ | 
|  | 1345 | jne 1f | 
|  | 1346 | /* All segments match their saved values => Category 2 (Bad IRET). */ | 
|  | 1347 | movq (%rsp),%rcx | 
|  | 1348 | CFI_RESTORE rcx | 
|  | 1349 | movq 8(%rsp),%r11 | 
|  | 1350 | CFI_RESTORE r11 | 
|  | 1351 | addq $0x30,%rsp /* drop the six saved quadwords: rcx, r11, ds, es, fs, gs */ | 
|  | 1352 | CFI_ADJUST_CFA_OFFSET -0x30 | 
| Ingo Molnar | 14ae22b | 2008-11-21 15:20:47 +0100 | [diff] [blame] | 1353 | pushq_cfi $0	/* RIP */ | 
|  | 1354 | pushq_cfi %r11 /* NOTE(review): r11 and rcx are pushed back, presumably to form the frame layout general_protection expects under Xen - confirm */ | 
|  | 1355 | pushq_cfi %rcx | 
| Jeremy Fitzhardinge | 4a5c3e7 | 2008-07-08 15:07:09 -0700 | [diff] [blame] | 1356 | jmp general_protection | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1357 | CFI_RESTORE_STATE | 
|  | 1358 | 1:	/* Segment mismatch => Category 1 (Bad segment). Retry the IRET. */ | 
|  | 1359 | movq (%rsp),%rcx | 
|  | 1360 | CFI_RESTORE rcx | 
|  | 1361 | movq 8(%rsp),%r11 | 
|  | 1362 | CFI_RESTORE r11 | 
|  | 1363 | addq $0x30,%rsp /* drop the six saved quadwords: rcx, r11, ds, es, fs, gs */ | 
|  | 1364 | CFI_ADJUST_CFA_OFFSET -0x30 | 
| Ingo Molnar | 14ae22b | 2008-11-21 15:20:47 +0100 | [diff] [blame] | 1365 | pushq_cfi $0 /* presumably the ORIG_RAX slot of the frame SAVE_ALL completes - confirm */ | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1366 | SAVE_ALL | 
|  | 1367 | jmp error_exit | 
|  | 1368 | CFI_ENDPROC | 
| Jeremy Fitzhardinge | 3d75e1b | 2008-07-08 15:06:49 -0700 | [diff] [blame] | 1369 | END(xen_failsafe_callback) | 
|  | 1370 |  | 
|  | 1371 | #endif /* CONFIG_XEN */ | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1372 |  | 
|  | 1373 | /* | 
|  | 1374 | * Some functions should be protected against kprobes: everything from here up to the matching .popsection is emitted into .kprobes.text | 
|  | 1375 | */ | 
|  | 1376 | .pushsection .kprobes.text, "ax" | 
|  | 1377 |  | 
|  | 1378 | paranoidzeroentry_ist debug do_debug DEBUG_STACK | 
|  | 1379 | paranoidzeroentry_ist int3 do_int3 DEBUG_STACK | 
|  | 1380 | paranoiderrorentry stack_segment do_stack_segment | 
| Jeremy Fitzhardinge | 6cac5a9 | 2009-03-29 19:56:29 -0700 | [diff] [blame] | 1381 | #ifdef CONFIG_XEN /* Xen variants: same C handlers, but built with zeroentry/errorentry instead of the paranoid* macros */ | 
|  | 1382 | zeroentry xen_debug do_debug | 
|  | 1383 | zeroentry xen_int3 do_int3 | 
|  | 1384 | errorentry xen_stack_segment do_stack_segment | 
|  | 1385 | #endif | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1386 | errorentry general_protection do_general_protection | 
|  | 1387 | errorentry page_fault do_page_fault | 
|  | 1388 | #ifdef CONFIG_X86_MCE /* handler operand is an indirect reference through machine_check_vector */ | 
| Andi Kleen | 5d72792 | 2009-04-27 19:25:48 +0200 | [diff] [blame] | 1389 | paranoidzeroentry machine_check *machine_check_vector(%rip) | 
|  | 1390 | #endif | 
|  | 1391 |  | 
|  | 1392 | /* | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1393 | * "Paranoid" exit path from exception stack. | 
|  | 1394 | * Paranoid because this is used by NMIs and cannot take | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1395 | * any kernel state for granted. | 
|  | 1396 | * We don't do kernel preemption checks here, because only | 
|  | 1397 | * NMI should be common and it does not enable IRQs and | 
|  | 1398 | * cannot get reschedule ticks. | 
|  | 1399 | * | 
|  | 1400 | * The NMI handler only jumps here when CONFIG_TRACE_IRQFLAGS is off; otherwise | 
|  | 1401 | * it open-codes this path without the TRACE_IRQS_* calls, because irq-tracing | 
|  | 1402 | * is fundamentally NMI-unsafe. (we cannot change the soft and hard flags at once, atomically) | 
|  | 1403 | */ | 
|  | 1404 |  | 
|  | 1405 | /* ebx:	no swapgs flag (nonzero: leave via paranoid_restore, which does no swapgs) */ | 
|  | 1406 | ENTRY(paranoid_exit) | 
|  | 1407 | INTR_FRAME | 
|  | 1408 | DISABLE_INTERRUPTS(CLBR_NONE) | 
|  | 1409 | TRACE_IRQS_OFF | 
|  | 1410 | testl %ebx,%ebx				/* swapgs needed? */ | 
|  | 1411 | jnz paranoid_restore | 
|  | 1412 | testl $3,CS(%rsp)	/* low two bits of the saved CS set => returning to user mode */ | 
|  | 1413 | jnz   paranoid_userspace | 
|  | 1414 | paranoid_swapgs:	/* swapgs, restore registers, then iret */ | 
|  | 1415 | TRACE_IRQS_IRETQ 0 | 
|  | 1416 | SWAPGS_UNSAFE_STACK | 
| Steven Rostedt | 0300e7f1 | 2009-04-17 08:33:52 -0400 | [diff] [blame] | 1417 | RESTORE_ALL 8 | 
|  | 1418 | jmp irq_return | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1419 | paranoid_restore:	/* same as paranoid_swapgs, minus the swapgs */ | 
| Steven Rostedt | 0300e7f1 | 2009-04-17 08:33:52 -0400 | [diff] [blame] | 1420 | TRACE_IRQS_IRETQ 0 | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1421 | RESTORE_ALL 8 | 
|  | 1422 | jmp irq_return | 
|  | 1423 | paranoid_userspace:	/* loop: handle pending work flags before returning to user mode */ | 
|  | 1424 | GET_THREAD_INFO(%rcx) | 
|  | 1425 | movl TI_flags(%rcx),%ebx | 
|  | 1426 | andl $_TIF_WORK_MASK,%ebx | 
|  | 1427 | jz paranoid_swapgs	/* no work flags set: plain exit */ | 
|  | 1428 | movq %rsp,%rdi			/* &pt_regs */ | 
|  | 1429 | call sync_regs | 
|  | 1430 | movq %rax,%rsp			/* switch stack for scheduling */ | 
|  | 1431 | testl $_TIF_NEED_RESCHED,%ebx | 
|  | 1432 | jnz paranoid_schedule | 
|  | 1433 | movl %ebx,%edx			/* arg3: thread flags */ | 
|  | 1434 | TRACE_IRQS_ON | 
|  | 1435 | ENABLE_INTERRUPTS(CLBR_NONE) | 
|  | 1436 | xorl %esi,%esi 			/* arg2: oldset */ | 
|  | 1437 | movq %rsp,%rdi 			/* arg1: &pt_regs */ | 
|  | 1438 | call do_notify_resume | 
|  | 1439 | DISABLE_INTERRUPTS(CLBR_NONE) | 
|  | 1440 | TRACE_IRQS_OFF | 
|  | 1441 | jmp paranoid_userspace	/* re-read and re-check the work flags */ | 
|  | 1442 | paranoid_schedule: | 
|  | 1443 | TRACE_IRQS_ON | 
|  | 1444 | ENABLE_INTERRUPTS(CLBR_ANY) | 
|  | 1445 | call schedule | 
|  | 1446 | DISABLE_INTERRUPTS(CLBR_ANY) | 
|  | 1447 | TRACE_IRQS_OFF | 
|  | 1448 | jmp paranoid_userspace	/* re-read and re-check the work flags */ | 
|  | 1449 | CFI_ENDPROC | 
|  | 1450 | END(paranoid_exit) | 
|  | 1451 |  | 
|  | 1452 | /* | 
|  | 1453 | * Exception entry point. This expects an error code/orig_rax on the stack. | 
|  | 1454 | * Returns the "no swapgs flag" in %ebx (0 when entered from user mode, 1 from kernel mode). | 
|  | 1455 | */ | 
|  | 1456 | ENTRY(error_entry) | 
|  | 1457 | XCPT_FRAME | 
|  | 1458 | CFI_ADJUST_CFA_OFFSET 15*8 | 
|  | 1459 | /* oldrax contains error code; the +8 in the offsets below presumably skips our own return address (this routine leaves via ret) */ | 
|  | 1460 | cld | 
|  | 1461 | movq_cfi rdi, RDI+8 | 
|  | 1462 | movq_cfi rsi, RSI+8 | 
|  | 1463 | movq_cfi rdx, RDX+8 | 
|  | 1464 | movq_cfi rcx, RCX+8 | 
|  | 1465 | movq_cfi rax, RAX+8 | 
|  | 1466 | movq_cfi  r8,  R8+8 | 
|  | 1467 | movq_cfi  r9,  R9+8 | 
|  | 1468 | movq_cfi r10, R10+8 | 
|  | 1469 | movq_cfi r11, R11+8 | 
|  | 1470 | movq_cfi rbx, RBX+8 | 
|  | 1471 | movq_cfi rbp, RBP+8 | 
|  | 1472 | movq_cfi r12, R12+8 | 
|  | 1473 | movq_cfi r13, R13+8 | 
|  | 1474 | movq_cfi r14, R14+8 | 
|  | 1475 | movq_cfi r15, R15+8 | 
|  | 1476 | xorl %ebx,%ebx	/* no swapgs flag = 0 */ | 
|  | 1477 | testl $3,CS+8(%rsp)	/* low two bits of the saved CS clear => fault came from kernel mode */ | 
|  | 1478 | je error_kernelspace | 
|  | 1479 | error_swapgs: | 
|  | 1480 | SWAPGS | 
|  | 1481 | error_sti: | 
|  | 1482 | TRACE_IRQS_OFF | 
|  | 1483 | ret | 
|  | 1484 | CFI_ENDPROC | 
|  | 1485 |  | 
|  | 1486 | /* | 
|  | 1487 | * There are two places in the kernel that can potentially fault with | 
|  | 1488 | * usergs. Handle them here. The exception handlers after iret run with | 
|  | 1489 | * kernel gs again, so don't set the user space flag. B stepping K8s | 
|  | 1490 | * sometimes report a truncated RIP for IRET exceptions returning to | 
|  | 1491 | * compat mode. Check for these here too. | 
|  | 1492 | */ | 
|  | 1493 | error_kernelspace: | 
|  | 1494 | incl %ebx	/* no swapgs flag = 1 (ebx was zeroed above) */ | 
|  | 1495 | leaq irq_return(%rip),%rcx | 
|  | 1496 | cmpq %rcx,RIP+8(%rsp)	/* faulted exactly at irq_return? */ | 
|  | 1497 | je error_swapgs | 
|  | 1498 | movl %ecx,%ecx	/* zero extend: also match irq_return's address truncated to 32 bits */ | 
|  | 1499 | cmpq %rcx,RIP+8(%rsp) | 
|  | 1500 | je error_swapgs | 
|  | 1501 | cmpq $gs_change,RIP+8(%rsp)	/* faulted at gs_change? */ | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1502 | je error_swapgs | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1503 | jmp error_sti	/* ordinary kernel fault: no swapgs */ | 
|  | 1504 | END(error_entry) | 
|  | 1505 |  | 
|  | 1506 |  | 
|  | 1507 | /* Exception exit path. ebx:	no swapgs flag (1: don't need swapgs, 0: need it) */ | 
|  | 1508 | ENTRY(error_exit) | 
|  | 1509 | DEFAULT_FRAME | 
|  | 1510 | movl %ebx,%eax	/* copy the flag: it is tested in eax after RESTORE_REST */ | 
|  | 1511 | RESTORE_REST | 
|  | 1512 | DISABLE_INTERRUPTS(CLBR_NONE) | 
|  | 1513 | TRACE_IRQS_OFF | 
|  | 1514 | GET_THREAD_INFO(%rcx) | 
|  | 1515 | testl %eax,%eax | 
|  | 1516 | jne retint_kernel	/* flag set: take the kernel return path */ | 
|  | 1517 | LOCKDEP_SYS_EXIT_IRQ | 
|  | 1518 | movl TI_flags(%rcx),%edx | 
|  | 1519 | movl $_TIF_WORK_MASK,%edi | 
|  | 1520 | andl %edi,%edx | 
|  | 1521 | jnz retint_careful	/* some work flag is set */ | 
|  | 1522 | jmp retint_swapgs | 
|  | 1523 | CFI_ENDPROC | 
|  | 1524 | END(error_exit) | 
|  | 1525 |  | 
|  | 1526 |  | 
|  | 1527 | /* NMI entry; runs on exception stack */ | 
|  | 1528 | ENTRY(nmi) | 
|  | 1529 | INTR_FRAME | 
|  | 1530 | PARAVIRT_ADJUST_EXCEPTION_FRAME | 
|  | 1531 | pushq_cfi $-1	/* presumably fills the error code/orig_rax slot - TODO confirm */ | 
|  | 1532 | subq $15*8, %rsp	/* reserve 15 quadword slots below it */ | 
|  | 1533 | CFI_ADJUST_CFA_OFFSET 15*8 | 
|  | 1534 | call save_paranoid	/* presumably sets the no swapgs flag in ebx, which is tested after do_nmi */ | 
|  | 1535 | DEFAULT_FRAME 0 | 
|  | 1536 | /* paranoidentry do_nmi, 0; without TRACE_IRQS_OFF */ | 
|  | 1537 | movq %rsp,%rdi	/* arg1: &pt_regs */ | 
|  | 1538 | movq $-1,%rsi	/* arg2: -1, the same value pushed above */ | 
|  | 1539 | call do_nmi | 
|  | 1540 | #ifdef CONFIG_TRACE_IRQFLAGS | 
|  | 1541 | /* paranoidexit; without TRACE_IRQS_OFF */ | 
|  | 1542 | /* ebx:	no swapgs flag */ | 
|  | 1543 | DISABLE_INTERRUPTS(CLBR_NONE) | 
|  | 1544 | testl %ebx,%ebx				/* swapgs needed? */ | 
|  | 1545 | jnz nmi_restore | 
|  | 1546 | testl $3,CS(%rsp)	/* low two bits of the saved CS set => returning to user mode */ | 
|  | 1547 | jnz nmi_userspace | 
|  | 1548 | nmi_swapgs: | 
|  | 1549 | SWAPGS_UNSAFE_STACK | 
|  | 1550 | nmi_restore: | 
|  | 1551 | RESTORE_ALL 8 | 
|  | 1552 | jmp irq_return | 
|  | 1553 | nmi_userspace:	/* loop: handle pending work flags before returning to user mode */ | 
|  | 1554 | GET_THREAD_INFO(%rcx) | 
|  | 1555 | movl TI_flags(%rcx),%ebx | 
|  | 1556 | andl $_TIF_WORK_MASK,%ebx | 
|  | 1557 | jz nmi_swapgs	/* no work flags set: plain exit */ | 
|  | 1558 | movq %rsp,%rdi			/* &pt_regs */ | 
|  | 1559 | call sync_regs | 
|  | 1560 | movq %rax,%rsp			/* switch stack for scheduling */ | 
|  | 1561 | testl $_TIF_NEED_RESCHED,%ebx | 
|  | 1562 | jnz nmi_schedule | 
|  | 1563 | movl %ebx,%edx			/* arg3: thread flags */ | 
|  | 1564 | ENABLE_INTERRUPTS(CLBR_NONE) | 
|  | 1565 | xorl %esi,%esi 			/* arg2: oldset */ | 
|  | 1566 | movq %rsp,%rdi 			/* arg1: &pt_regs */ | 
|  | 1567 | call do_notify_resume | 
|  | 1568 | DISABLE_INTERRUPTS(CLBR_NONE) | 
|  | 1569 | jmp nmi_userspace	/* re-read and re-check the work flags */ | 
|  | 1570 | nmi_schedule: | 
|  | 1571 | ENABLE_INTERRUPTS(CLBR_ANY) | 
|  | 1572 | call schedule | 
|  | 1573 | DISABLE_INTERRUPTS(CLBR_ANY) | 
|  | 1574 | jmp nmi_userspace	/* re-read and re-check the work flags */ | 
|  | 1575 | CFI_ENDPROC | 
|  | 1576 | #else | 
|  | 1577 | jmp paranoid_exit	/* without CONFIG_TRACE_IRQFLAGS, share the common paranoid exit path */ | 
| Cyrill Gorcunov | 9f1e87e | 2008-11-27 21:10:08 +0300 | [diff] [blame] | 1578 | CFI_ENDPROC | 
| Alexander van Heukelum | ddeb8f2 | 2008-11-24 13:24:28 +0100 | [diff] [blame] | 1579 | #endif | 
|  | 1580 | END(nmi) | 
|  | 1581 |  | 
|  | 1582 | ENTRY(ignore_sysret) | 
|  | 1583 | CFI_STARTPROC | 
|  | 1584 | mov $-ENOSYS,%eax	/* eax = -ENOSYS, then return immediately with sysret */ | 
|  | 1585 | sysret | 
|  | 1586 | CFI_ENDPROC | 
|  | 1587 | END(ignore_sysret) | 
|  | 1588 |  | 
|  | 1589 | /* | 
|  | 1590 | * End of kprobes section (closes the .pushsection .kprobes.text above) | 
|  | 1591 | */ | 
|  | 1592 | .popsection |