Jeremy Fitzhardinge | cdacc12 | 2008-07-08 15:06:46 -0700 | [diff] [blame] | 1 | /* |
| 2 | Asm versions of Xen pv-ops, suitable for either direct use or inlining. |
| 3 | The inline versions are the same as the direct-use versions, with the |
| 4 | pre- and post-amble chopped off. |
| 5 | |
| 6 | This code is encoded for size rather than absolute efficiency, |
| 7 | with a view to being able to inline as much as possible. |
| 8 | |
| 9 | We only bother with direct forms (ie, vcpu info in a per-cpu variable) of the operations |
| 10 | here; the indirect forms are better handled in C, since they're |
| 11 | generally too large to inline anyway. |
| 12 | */ |
| 13 | |
| 14 | #include <linux/linkage.h> |
| 15 | |
| 16 | #include <asm/asm-offsets.h> |
| 17 | #include <asm/processor-flags.h> |
Jeremy Fitzhardinge | 6fcac6d | 2008-07-08 15:07:14 -0700 | [diff] [blame] | 18 | #include <asm/errno.h> |
| 19 | #include <asm/segment.h> |
Brian Gerst | 9af4565 | 2009-01-19 00:38:58 +0900 | [diff] [blame^] | 20 | #include <asm/percpu.h> |
Jeremy Fitzhardinge | cdacc12 | 2008-07-08 15:06:46 -0700 | [diff] [blame] | 21 | |
| 22 | #include <xen/interface/xen.h> |
| 23 | |
/*
 * Bookkeeping symbols exported for each patchable sequence "x":
 *
 *   x_reloc - the value v given at the use site: either 0, or the
 *             address one byte past a labelled call/jmp inside the
 *             sequence
 *   x_end   - the address at which ENDPATCH(x) appears
 */
#define RELOC(x, v)	.globl x##_reloc; x##_reloc = v
#define ENDPATCH(x)	.globl x##_end; x##_end = .

/* Pseudo-flag reserved for virtual NMI, which is not implemented yet */
#define XEN_EFLAGS_NMI	0x80000000
| 29 | |
#if 1
/*
 * FIXME: x86_64 can now reach percpu variables directly through a
 * segment override, and the Xen code still has to be updated to
 * match.  Every routine below that starts with BUG executes ud2a
 * as its first instruction.
 */
#define BUG	ud2a
#endif
Jeremy Fitzhardinge | cdacc12 | 2008-07-08 15:06:46 -0700 | [diff] [blame] | 37 | |
/*
 * xen_irq_enable_direct: enable event delivery.
 *
 * Writes 0 to the event mask byte of xen_vcpu_info, then tests the
 * pending byte.  When something is pending, check_events is called
 * to enter the hypervisor and get it handled.
 *
 * ENDPATCH marks the end of the sequence (the trailing ret is outside
 * it); RELOC records the address one byte into the call instruction.
 */
ENTRY(xen_irq_enable_direct)
	BUG

	/* Unmask events. */
	movb	$0, PER_CPU_VAR(xen_vcpu_info) + XEN_vcpu_info_mask

	/*
	 * Being preempted at this point is harmless, because preemption
	 * itself deals with any pending interrupts.  At worst the
	 * pending test below runs on the wrong CPU, which does no harm.
	 */

	/* Anything pending? */
	testb	$0xff, PER_CPU_VAR(xen_vcpu_info) + XEN_vcpu_info_pending
	jz	1f

2:	call	check_events
1:
ENDPATCH(xen_irq_enable_direct)
	ret
	ENDPROC(xen_irq_enable_direct)
	RELOC(xen_irq_enable_direct, 2b+1)
| 63 | |
/*
 * xen_irq_disable_direct: disable event delivery.
 *
 * All that is needed is a non-zero event mask, so a single byte
 * store of 1 does the job.  Nothing in the sequence needs fixing up,
 * hence RELOC is 0.
 */
ENTRY(xen_irq_disable_direct)
	BUG

	movb	$1, PER_CPU_VAR(xen_vcpu_info) + XEN_vcpu_info_mask
ENDPATCH(xen_irq_disable_direct)
	ret
	ENDPROC(xen_irq_disable_direct)
	RELOC(xen_irq_disable_direct, 0)
| 76 | |
/*
 * xen_save_fl_direct: fetch the current interrupt-enable status.
 *
 * Callers look for the status in X86_EFLAGS_IF and tolerate other
 * bits being set in the return value.  That is exploited here: only
 * %ah is written, so X86_EFLAGS_IF is correct and the other bits of
 * that byte are 0, while the rest of the return value is undefined.
 *
 * Xen's mask has the opposite sense to the x86 enable bit, so the
 * state is inverted on the way out.
 */
ENTRY(xen_save_fl_direct)
	BUG

	testb	$0xff, PER_CPU_VAR(xen_vcpu_info) + XEN_vcpu_info_mask
	setz	%ah			/* %ah = 1 if unmasked, else 0 */
	addb	%ah, %ah		/* double it: 1 -> 2, 0 -> 0 */
ENDPATCH(xen_save_fl_direct)
	ret
	ENDPROC(xen_save_fl_direct)
	RELOC(xen_save_fl_direct, 0)
| 96 | |
/*
 * xen_restore_fl_direct: set the event mask from a saved flags value.
 *
 * In:  %rdi = flags value.  In principle this is something returned
 *      by xen_save_fl_direct, but for robustness only X86_EFLAGS_IF
 *      is examined.
 *
 * The mask byte is written as the inverse of X86_EFLAGS_IF.  After
 * that, if events are unmasked and one is pending, check_events is
 * called to enter the hypervisor and get it delivered.
 */
ENTRY(xen_restore_fl_direct)
	BUG

	/*
	 * The first integer argument arrives in %rdi on x86_64, so test
	 * the flag there rather than in %ah (which is where the 32-bit
	 * register calling convention would have put it).
	 */
	testw	$X86_EFLAGS_IF, %di
	setz	PER_CPU_VAR(xen_vcpu_info) + XEN_vcpu_info_mask

	/*
	 * Being preempted at this point is harmless, because preemption
	 * itself deals with any pending interrupts.  At worst the
	 * pending check below runs on the wrong CPU, which does no harm.
	 */

	/*
	 * Check for unmasked and pending with one 16-bit compare.  This
	 * relies on the mask byte directly following the pending byte,
	 * so that the word is 0x0001 only when pending == 1 and
	 * mask == 0.  In every other case there is nothing to deliver
	 * and the call is skipped.
	 */
	cmpw	$0x0001, PER_CPU_VAR(xen_vcpu_info) + XEN_vcpu_info_pending
	jnz	1f
2:	call	check_events
1:
ENDPATCH(xen_restore_fl_direct)
	ret
	ENDPROC(xen_restore_fl_direct)
	RELOC(xen_restore_fl_direct, 2b+1)
| 123 | |
| 124 | |
/*
 * check_events: force an event check by calling
 * xen_force_evtchn_callback.
 *
 * %rax, %rcx, %rdx, %rsi, %rdi and %r8-%r11 are saved before the call
 * and restored afterwards in the reverse order, so the caller sees
 * them unchanged.
 */
check_events:
	pushq	%rax
	pushq	%rcx
	pushq	%rdx
	pushq	%rsi
	pushq	%rdi
	pushq	%r8
	pushq	%r9
	pushq	%r10
	pushq	%r11

	call	xen_force_evtchn_callback

	popq	%r11
	popq	%r10
	popq	%r9
	popq	%r8
	popq	%rdi
	popq	%rsi
	popq	%rdx
	popq	%rcx
	popq	%rax
	ret
Jeremy Fitzhardinge | cdacc12 | 2008-07-08 15:06:46 -0700 | [diff] [blame] | 150 | |
/*
 * xen_adjust_exception_frame: strip the two extra words that sit
 * directly above the return address on the stack.
 *
 * On entry:
 *	 0(%rsp)  return address
 *	 8(%rsp)  value reloaded into %rcx
 *	16(%rsp)  value reloaded into %r11
 *
 * "ret $16" pops the return address and then discards those 16 bytes.
 */
ENTRY(xen_adjust_exception_frame)
	mov	8+0(%rsp), %rcx
	mov	8+8(%rsp), %r11
	ret	$16
ENDPROC(xen_adjust_exception_frame)
| 155 | |
/* Address of the iret entry: index __HYPERVISOR_iret, 32 bytes each */
hypercall_iret = hypercall_page + __HYPERVISOR_iret * 32

/*
 * Xen64 iret frame:
 *
 *	ss
 *	rsp
 *	rflags
 *	cs
 *	rip		<-- standard iret frame
 *
 *	flags
 *
 *	rcx		}
 *	r11		}<-- pushed by hypercall page
 * rsp->rax		}
 */

/*
 * xen_iret: the standard iret frame is expected to be on the stack
 * already; push a flags word of 0 beneath it and jump to the iret
 * hypercall.  RELOC records the address one byte into the jmp.
 */
ENTRY(xen_iret)
	pushq	$0			/* flags word */
1:	jmp	hypercall_iret
ENDPATCH(xen_iret)
RELOC(xen_iret, 1b+1)
Jeremy Fitzhardinge | cdacc12 | 2008-07-08 15:06:46 -0700 | [diff] [blame] | 177 | |
/*
 * xen_sysexit: sysexit is never used for 64-bit processes, so this
 * path only ever returns to 32-bit compat userspace.
 *
 * A Xen64 iret frame is built by hand and handed to the iret
 * hypercall:
 *	ss	= __USER32_DS
 *	rsp	= %rcx
 *	rflags	= X86_EFLAGS_IF
 *	cs	= __USER32_CS
 *	rip	= %rdx
 *	flags	= 0
 */
ENTRY(xen_sysexit)
	pushq	$__USER32_DS
	pushq	%rcx
	pushq	$X86_EFLAGS_IF
	pushq	$__USER32_CS
	pushq	%rdx

	pushq	$0			/* flags word */
1:	jmp	hypercall_iret
ENDPATCH(xen_sysexit)
RELOC(xen_sysexit, 1b+1)
| 193 | |
/*
 * xen_sysret64: return to userspace through the iret hypercall, using
 * __USER_DS/__USER_CS and a flags word of VGCF_in_syscall.
 */
ENTRY(xen_sysret64)
	/*
	 * %rsp already points at the usermode stack, but %gs is still
	 * the kernel one, which makes it easy to get back: stash the
	 * user %rsp and reload the kernel stack pointer.
	 */
	movq	%rsp, %gs:pda_oldrsp
	movq	PER_CPU_VAR(kernel_stack), %rsp

	/* Xen64 iret frame: ss, rsp, rflags, cs, rip */
	pushq	$__USER_DS
	pushq	%gs:pda_oldrsp
	pushq	%r11
	pushq	$__USER_CS
	pushq	%rcx

	pushq	$VGCF_in_syscall	/* flags word */
1:	jmp	hypercall_iret
ENDPATCH(xen_sysret64)
RELOC(xen_sysret64, 1b+1)
| 210 | |
/*
 * xen_sysret32: return to 32-bit userspace through the iret
 * hypercall, using __USER32_DS/__USER32_CS.
 */
ENTRY(xen_sysret32)
	/*
	 * %rsp already points at the usermode stack, but %gs is still
	 * the kernel one, which makes it easy to get back: stash the
	 * user %rsp and reload the kernel stack pointer.
	 */
	movq	%rsp, %gs:pda_oldrsp
	movq	PER_CPU_VAR(kernel_stack), %rsp

	/* Xen64 iret frame: ss, rsp, rflags, cs, rip */
	pushq	$__USER32_DS
	pushq	%gs:pda_oldrsp
	pushq	%r11
	pushq	$__USER32_CS
	pushq	%rcx

	/*
	 * Use a plain iret (flags word 0), the same as xen_sysexit does.
	 * With VGCF_in_syscall the hypervisor discards the saved CS/SS,
	 * so the 32-bit selectors pushed above would not be what decides
	 * the mode userspace is resumed in.
	 */
	pushq	$0
1:	jmp	hypercall_iret
ENDPATCH(xen_sysret32)
RELOC(xen_sysret32, 1b+1)
| 227 | |
/*
 * Xen delivers syscall callbacks much like ordinary exceptions, so on
 * entry we have:
 *  - kernel gs
 *  - kernel rsp
 *  - an iret-like frame on the stack, extended with rcx and r11:
 *		ss
 *		rsp
 *		rflags
 *		cs
 *		rip
 *		r11
 *	rsp->	rcx
 *
 * Every entry point below undoes all of that, so that things look
 * like a CPU-generated syscall/sysenter, and then jumps to the normal
 * entry point.
 */

/*
 * undo_xen_syscall: reload %rcx and %r11 from the two lowest slots of
 * the frame, then load %rsp from slot 5 (the saved rsp).
 */
.macro undo_xen_syscall
	mov	0*8(%rsp), %rcx
	mov	1*8(%rsp), %r11
	mov	5*8(%rsp), %rsp
.endm
| 252 | |
/*
 * Target for normal 64-bit system calls: undo the Xen frame, then
 * continue at system_call_after_swapgs.
 */
ENTRY(xen_syscall_target)
	undo_xen_syscall
	jmp	system_call_after_swapgs
ENDPROC(xen_syscall_target)
| 258 | |
| 259 | #ifdef CONFIG_IA32_EMULATION |
| 260 | |
/*
 * Target for 32-bit compat syscalls: undo the Xen frame, then
 * continue at ia32_cstar_target.
 */
ENTRY(xen_syscall32_target)
	undo_xen_syscall
	jmp	ia32_cstar_target
ENDPROC(xen_syscall32_target)
| 266 | |
/*
 * Target for 32-bit compat sysenter: undo the Xen frame, then
 * continue at ia32_sysenter_target.
 */
ENTRY(xen_sysenter_target)
	undo_xen_syscall
	jmp	ia32_sysenter_target
ENDPROC(xen_sysenter_target)
| 272 | |
| 273 | #else /* !CONFIG_IA32_EMULATION */ |
| 274 | |
/*
 * Without IA32 emulation both 32-bit entry points share one stub: it
 * drops the saved %rcx/%r11, sets %rax to -ENOSYS and returns through
 * the iret hypercall with a flags word of VGCF_in_syscall.
 */
ENTRY(xen_syscall32_target)
ENTRY(xen_sysenter_target)
	leaq	16(%rsp), %rsp		/* strip %rcx, %r11 */
	movq	$-ENOSYS, %rax
	pushq	$VGCF_in_syscall	/* flags word */
	jmp	hypercall_iret
ENDPROC(xen_syscall32_target)
ENDPROC(xen_sysenter_target)
| 283 | |
| 284 | #endif /* CONFIG_IA32_EMULATION */ |