blob: 74c607b37e873176e3e91c4cf5b3bf8e7ed18455 [file] [log] [blame]
Roland McGrath1eeaed72008-01-30 13:31:51 +01001/*
2 * Copyright (C) 1994 Linus Torvalds
3 *
4 * Pentium III FXSR, SSE support
5 * General FPU state handling cleanups
6 * Gareth Hughes <gareth@valinux.com>, May 2000
7 * x86-64 work by Andi Kleen 2002
8 */
9
H. Peter Anvin1965aae2008-10-22 22:26:29 -070010#ifndef _ASM_X86_I387_H
11#define _ASM_X86_I387_H
Roland McGrath1eeaed72008-01-30 13:31:51 +010012
Herbert Xu3b0d6592009-11-03 09:11:15 -050013#ifndef __ASSEMBLY__
14
Roland McGrath1eeaed72008-01-30 13:31:51 +010015#include <linux/sched.h>
16#include <linux/kernel_stat.h>
17#include <linux/regset.h>
Suresh Siddhae4914012008-08-13 22:02:26 +100018#include <linux/hardirq.h>
Avi Kivity86603282010-05-06 11:45:46 +030019#include <linux/slab.h>
H. Peter Anvin92c37fa2008-02-04 16:47:58 +010020#include <asm/asm.h>
H. Peter Anvinc9775b42010-05-11 17:49:54 -070021#include <asm/cpufeature.h>
Roland McGrath1eeaed72008-01-30 13:31:51 +010022#include <asm/processor.h>
23#include <asm/sigcontext.h>
24#include <asm/user.h>
25#include <asm/uaccess.h>
Suresh Siddhadc1e35c2008-07-29 10:29:19 -070026#include <asm/xsave.h>
Roland McGrath1eeaed72008-01-30 13:31:51 +010027
Suresh Siddha3c1c7f12008-07-29 10:29:21 -070028extern unsigned int sig_xstate_size;
Roland McGrath1eeaed72008-01-30 13:31:51 +010029extern void fpu_init(void);
Roland McGrath1eeaed72008-01-30 13:31:51 +010030extern void mxcsr_feature_mask_init(void);
Suresh Siddhaaa283f42008-03-10 15:28:05 -070031extern int init_fpu(struct task_struct *child);
Linus Torvaldsbe98c2c2012-02-13 13:47:25 -080032extern void math_state_restore(void);
Jaswinder Singh36454932008-07-21 22:31:57 +053033extern int dump_fpu(struct pt_regs *, struct user_i387_struct *);
Roland McGrath1eeaed72008-01-30 13:31:51 +010034
35extern user_regset_active_fn fpregs_active, xfpregs_active;
Suresh Siddha5b3efd52010-02-11 11:50:59 -080036extern user_regset_get_fn fpregs_get, xfpregs_get, fpregs_soft_get,
37 xstateregs_get;
38extern user_regset_set_fn fpregs_set, xfpregs_set, fpregs_soft_set,
39 xstateregs_set;
40
41/*
42 * xstateregs_active == fpregs_active. Please refer to the comment
43 * at the definition of fpregs_active.
44 */
45#define xstateregs_active fpregs_active
Roland McGrath1eeaed72008-01-30 13:31:51 +010046
Suresh Siddhac37b5ef2008-07-29 10:29:25 -070047extern struct _fpx_sw_bytes fx_sw_reserved;
Roland McGrath1eeaed72008-01-30 13:31:51 +010048#ifdef CONFIG_IA32_EMULATION
Suresh Siddha3c1c7f12008-07-29 10:29:21 -070049extern unsigned int sig_xstate_ia32_size;
Suresh Siddhac37b5ef2008-07-29 10:29:25 -070050extern struct _fpx_sw_bytes fx_sw_reserved_ia32;
Roland McGrath1eeaed72008-01-30 13:31:51 +010051struct _fpstate_ia32;
Suresh Siddhaab513702008-07-29 10:29:22 -070052struct _xstate_ia32;
53extern int save_i387_xstate_ia32(void __user *buf);
54extern int restore_i387_xstate_ia32(void __user *buf);
Roland McGrath1eeaed72008-01-30 13:31:51 +010055#endif
56
Brian Gerst8eb91a52010-09-03 21:17:16 -040057#ifdef CONFIG_MATH_EMULATION
58extern void finit_soft_fpu(struct i387_soft_struct *soft);
59#else
60static inline void finit_soft_fpu(struct i387_soft_struct *soft) {}
61#endif
62
Suresh Siddhab359e8a2008-07-29 10:29:20 -070063#define X87_FSW_ES (1 << 7) /* Exception Summary */
64
Suresh Siddha29104e12010-07-19 16:05:49 -070065static __always_inline __pure bool use_xsaveopt(void)
66{
Suresh Siddha6bad06b2010-07-19 16:05:52 -070067 return static_cpu_has(X86_FEATURE_XSAVEOPT);
Suresh Siddha29104e12010-07-19 16:05:49 -070068}
69
H. Peter Anvinc9775b42010-05-11 17:49:54 -070070static __always_inline __pure bool use_xsave(void)
Avi Kivityc9ad4882010-05-06 11:45:45 +030071{
H. Peter Anvinc9775b42010-05-11 17:49:54 -070072 return static_cpu_has(X86_FEATURE_XSAVE);
Avi Kivityc9ad4882010-05-06 11:45:45 +030073}
74
Brian Gerst58a992b2010-09-03 21:17:18 -040075static __always_inline __pure bool use_fxsr(void)
76{
77 return static_cpu_has(X86_FEATURE_FXSR);
78}
79
Suresh Siddha29104e12010-07-19 16:05:49 -070080extern void __sanitize_i387_state(struct task_struct *);
81
82static inline void sanitize_i387_state(struct task_struct *tsk)
83{
84 if (!use_xsaveopt())
85 return;
86 __sanitize_i387_state(tsk);
87}
88
Roland McGrath1eeaed72008-01-30 13:31:51 +010089#ifdef CONFIG_X86_64
Suresh Siddhab359e8a2008-07-29 10:29:20 -070090static inline int fxrstor_checking(struct i387_fxsave_struct *fx)
Roland McGrath1eeaed72008-01-30 13:31:51 +010091{
92 int err;
93
Brian Gerst82024132010-09-03 21:17:14 -040094 /* See comment in fxsave() below. */
H. Peter Anvinfd35fbc2010-10-22 15:33:38 -070095#ifdef CONFIG_AS_FXSAVEQ
96 asm volatile("1: fxrstorq %[fx]\n\t"
97 "2:\n"
98 ".section .fixup,\"ax\"\n"
99 "3: movl $-1,%[err]\n"
100 " jmp 2b\n"
101 ".previous\n"
102 _ASM_EXTABLE(1b, 3b)
103 : [err] "=r" (err)
104 : [fx] "m" (*fx), "0" (0));
105#else
Roland McGrath1eeaed72008-01-30 13:31:51 +0100106 asm volatile("1: rex64/fxrstor (%[fx])\n\t"
107 "2:\n"
108 ".section .fixup,\"ax\"\n"
109 "3: movl $-1,%[err]\n"
110 " jmp 2b\n"
111 ".previous\n"
Joe Perchesaffe6632008-03-23 01:02:18 -0700112 _ASM_EXTABLE(1b, 3b)
Roland McGrath1eeaed72008-01-30 13:31:51 +0100113 : [err] "=r" (err)
Brian Gerst82024132010-09-03 21:17:14 -0400114 : [fx] "R" (fx), "m" (*fx), "0" (0));
H. Peter Anvinfd35fbc2010-10-22 15:33:38 -0700115#endif
Roland McGrath1eeaed72008-01-30 13:31:51 +0100116 return err;
117}
118
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700119static inline int fxsave_user(struct i387_fxsave_struct __user *fx)
Roland McGrath1eeaed72008-01-30 13:31:51 +0100120{
121 int err;
122
Suresh Siddha8e221b62010-06-22 16:23:37 -0700123 /*
124 * Clear the bytes not touched by the fxsave and reserved
125 * for the SW usage.
126 */
127 err = __clear_user(&fx->sw_reserved,
128 sizeof(struct _fpx_sw_bytes));
129 if (unlikely(err))
130 return -EFAULT;
131
Brian Gerst82024132010-09-03 21:17:14 -0400132 /* See comment in fxsave() below. */
H. Peter Anvinfd35fbc2010-10-22 15:33:38 -0700133#ifdef CONFIG_AS_FXSAVEQ
134 asm volatile("1: fxsaveq %[fx]\n\t"
135 "2:\n"
136 ".section .fixup,\"ax\"\n"
137 "3: movl $-1,%[err]\n"
138 " jmp 2b\n"
139 ".previous\n"
140 _ASM_EXTABLE(1b, 3b)
141 : [err] "=r" (err), [fx] "=m" (*fx)
142 : "0" (0));
143#else
Roland McGrath1eeaed72008-01-30 13:31:51 +0100144 asm volatile("1: rex64/fxsave (%[fx])\n\t"
145 "2:\n"
146 ".section .fixup,\"ax\"\n"
147 "3: movl $-1,%[err]\n"
148 " jmp 2b\n"
149 ".previous\n"
Joe Perchesaffe6632008-03-23 01:02:18 -0700150 _ASM_EXTABLE(1b, 3b)
Roland McGrath1eeaed72008-01-30 13:31:51 +0100151 : [err] "=r" (err), "=m" (*fx)
Brian Gerst82024132010-09-03 21:17:14 -0400152 : [fx] "R" (fx), "0" (0));
H. Peter Anvinfd35fbc2010-10-22 15:33:38 -0700153#endif
Joe Perchesaffe6632008-03-23 01:02:18 -0700154 if (unlikely(err) &&
155 __clear_user(fx, sizeof(struct i387_fxsave_struct)))
Roland McGrath1eeaed72008-01-30 13:31:51 +0100156 err = -EFAULT;
157 /* No need to clear here because the caller clears USED_MATH */
158 return err;
159}
160
Avi Kivity86603282010-05-06 11:45:46 +0300161static inline void fpu_fxsave(struct fpu *fpu)
Roland McGrath1eeaed72008-01-30 13:31:51 +0100162{
163 /* Using "rex64; fxsave %0" is broken because, if the memory operand
164 uses any extended registers for addressing, a second REX prefix
165 will be generated (to the assembler, rex64 followed by semicolon
166 is a separate instruction), and hence the 64-bitness is lost. */
Linus Torvaldsb6f7e382010-10-21 13:34:32 -0700167
H. Peter Anvind7acb922010-10-13 16:00:29 -0700168#ifdef CONFIG_AS_FXSAVEQ
Roland McGrath1eeaed72008-01-30 13:31:51 +0100169 /* Using "fxsaveq %0" would be the ideal choice, but is only supported
170 starting with gas 2.16. */
171 __asm__ __volatile__("fxsaveq %0"
Avi Kivity86603282010-05-06 11:45:46 +0300172 : "=m" (fpu->state->fxsave));
Linus Torvaldsb6f7e382010-10-21 13:34:32 -0700173#else
Roland McGrath1eeaed72008-01-30 13:31:51 +0100174 /* Using, as a workaround, the properly prefixed form below isn't
175 accepted by any binutils version so far released, complaining that
176 the same type of prefix is used twice if an extended register is
Brian Gerst82024132010-09-03 21:17:14 -0400177 needed for addressing (fix submitted to mainline 2005-11-21).
178 asm volatile("rex64/fxsave %0"
179 : "=m" (fpu->state->fxsave));
180 This, however, we can work around by forcing the compiler to select
Roland McGrath1eeaed72008-01-30 13:31:51 +0100181 an addressing mode that doesn't require extended registers. */
Brian Gerst82024132010-09-03 21:17:14 -0400182 asm volatile("rex64/fxsave (%[fx])"
183 : "=m" (fpu->state->fxsave)
184 : [fx] "R" (&fpu->state->fxsave));
Roland McGrath1eeaed72008-01-30 13:31:51 +0100185#endif
Suresh Siddhab359e8a2008-07-29 10:29:20 -0700186}
187
Roland McGrath1eeaed72008-01-30 13:31:51 +0100188#else /* CONFIG_X86_32 */
189
Jiri Slaby34ba4762009-04-08 13:31:59 +0200190/* perform fxrstor iff the processor has extended states, otherwise frstor */
191static inline int fxrstor_checking(struct i387_fxsave_struct *fx)
Roland McGrath1eeaed72008-01-30 13:31:51 +0100192{
193 /*
194 * The "nop" is needed to make the instructions the same
195 * length.
196 */
197 alternative_input(
198 "nop ; frstor %1",
199 "fxrstor %1",
200 X86_FEATURE_FXSR,
Jiri Slaby34ba4762009-04-08 13:31:59 +0200201 "m" (*fx));
202
Jiri Slabyfcb2ac52009-04-08 13:31:58 +0200203 return 0;
Roland McGrath1eeaed72008-01-30 13:31:51 +0100204}
205
Brian Gerst58a992b2010-09-03 21:17:18 -0400206static inline void fpu_fxsave(struct fpu *fpu)
207{
208 asm volatile("fxsave %[fx]"
209 : [fx] "=m" (fpu->state->fxsave));
210}
211
Brian Gerstb2b57fe2010-09-03 21:17:19 -0400212#endif /* CONFIG_X86_64 */
213
Roland McGrath1eeaed72008-01-30 13:31:51 +0100214/*
Linus Torvalds34ddc812012-02-18 12:56:35 -0800215 * These must be called with preempt disabled. Returns
216 * 'true' if the FPU state is still intact.
Roland McGrath1eeaed72008-01-30 13:31:51 +0100217 */
Linus Torvalds34ddc812012-02-18 12:56:35 -0800218static inline int fpu_save_init(struct fpu *fpu)
Roland McGrath1eeaed72008-01-30 13:31:51 +0100219{
Avi Kivityc9ad4882010-05-06 11:45:45 +0300220 if (use_xsave()) {
Avi Kivity86603282010-05-06 11:45:46 +0300221 fpu_xsave(fpu);
Suresh Siddhab359e8a2008-07-29 10:29:20 -0700222
223 /*
224 * xsave header may indicate the init state of the FP.
225 */
Brian Gerst58a992b2010-09-03 21:17:18 -0400226 if (!(fpu->state->xsave.xsave_hdr.xstate_bv & XSTATE_FP))
Linus Torvalds34ddc812012-02-18 12:56:35 -0800227 return 1;
Brian Gerst58a992b2010-09-03 21:17:18 -0400228 } else if (use_fxsr()) {
229 fpu_fxsave(fpu);
230 } else {
Hans Rosenfeldf994d992011-04-06 18:06:43 +0200231 asm volatile("fnsave %[fx]; fwait"
Brian Gerst58a992b2010-09-03 21:17:18 -0400232 : [fx] "=m" (fpu->state->fsave));
Linus Torvalds34ddc812012-02-18 12:56:35 -0800233 return 0;
Suresh Siddhab359e8a2008-07-29 10:29:20 -0700234 }
235
Linus Torvalds34ddc812012-02-18 12:56:35 -0800236 /*
237 * If exceptions are pending, we need to clear them so
238 * that we don't randomly get exceptions later.
239 *
240 * FIXME! Is this perhaps only true for the old-style
241 * irq13 case? Maybe we could leave the x87 state
242 * intact otherwise?
243 */
244 if (unlikely(fpu->state->fxsave.swd & X87_FSW_ES)) {
Brian Gerst58a992b2010-09-03 21:17:18 -0400245 asm volatile("fnclex");
Linus Torvalds34ddc812012-02-18 12:56:35 -0800246 return 0;
247 }
248 return 1;
Avi Kivity86603282010-05-06 11:45:46 +0300249}
250
Linus Torvalds34ddc812012-02-18 12:56:35 -0800251static inline int __save_init_fpu(struct task_struct *tsk)
Avi Kivity86603282010-05-06 11:45:46 +0300252{
Linus Torvalds34ddc812012-02-18 12:56:35 -0800253 return fpu_save_init(&tsk->thread.fpu);
Roland McGrath1eeaed72008-01-30 13:31:51 +0100254}
255
Avi Kivity86603282010-05-06 11:45:46 +0300256static inline int fpu_fxrstor_checking(struct fpu *fpu)
257{
258 return fxrstor_checking(&fpu->state->fxsave);
259}
260
261static inline int fpu_restore_checking(struct fpu *fpu)
262{
263 if (use_xsave())
264 return fpu_xrstor_checking(fpu);
265 else
266 return fpu_fxrstor_checking(fpu);
267}
268
Jiri Slaby34ba4762009-04-08 13:31:59 +0200269static inline int restore_fpu_checking(struct task_struct *tsk)
270{
Linus Torvalds80ab6f12012-02-19 11:48:44 -0800271 /* AMD K7/K8 CPUs don't save/restore FDP/FIP/FOP unless an exception
272 is pending. Clear the x87 state here by setting it to fixed
273 values. "m" is a random variable that should be in L1 */
274 alternative_input(
275 ASM_NOP8 ASM_NOP2,
276 "emms\n\t" /* clear stack tags */
277 "fildl %P[addr]", /* set F?P to defined value */
278 X86_FEATURE_FXSAVE_LEAK,
279 [addr] "m" (tsk->thread.has_fpu));
280
Avi Kivity86603282010-05-06 11:45:46 +0300281 return fpu_restore_checking(&tsk->thread.fpu);
Jiri Slaby34ba4762009-04-08 13:31:59 +0200282}
283
Roland McGrath1eeaed72008-01-30 13:31:51 +0100284/*
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800285 * Software FPU state helpers. Careful: these need to
286 * be preemption protection *and* they need to be
287 * properly paired with the CR0.TS changes!
288 */
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800289static inline int __thread_has_fpu(struct task_struct *tsk)
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800290{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800291 return tsk->thread.has_fpu;
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800292}
293
294/* Must be paired with an 'stts' after! */
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800295static inline void __thread_clear_has_fpu(struct task_struct *tsk)
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800296{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800297 tsk->thread.has_fpu = 0;
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800298}
299
300/* Must be paired with a 'clts' before! */
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800301static inline void __thread_set_has_fpu(struct task_struct *tsk)
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800302{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800303 tsk->thread.has_fpu = 1;
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800304}
305
306/*
307 * Encapsulate the CR0.TS handling together with the
308 * software flag.
309 *
310 * These generally need preemption protection to work,
311 * do try to avoid using these on their own.
312 */
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800313static inline void __thread_fpu_end(struct task_struct *tsk)
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800314{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800315 __thread_clear_has_fpu(tsk);
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800316 stts();
317}
318
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800319static inline void __thread_fpu_begin(struct task_struct *tsk)
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800320{
321 clts();
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800322 __thread_set_has_fpu(tsk);
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800323}
324
325/*
Linus Torvalds34ddc812012-02-18 12:56:35 -0800326 * FPU state switching for scheduling.
327 *
328 * This is a two-stage process:
329 *
330 * - switch_fpu_prepare() saves the old state and
331 * sets the new state of the CR0.TS bit. This is
332 * done within the context of the old process.
333 *
334 * - switch_fpu_finish() restores the new state as
335 * necessary.
336 */
337typedef struct { int preload; } fpu_switch_t;
338
339/*
340 * FIXME! We could do a totally lazy restore, but we need to
341 * add a per-cpu "this was the task that last touched the FPU
342 * on this CPU" variable, and the task needs to have a "I last
343 * touched the FPU on this CPU" and check them.
344 *
345 * We don't do that yet, so "fpu_lazy_restore()" always returns
346 * false, but some day..
347 */
348#define fpu_lazy_restore(tsk) (0)
349#define fpu_lazy_state_intact(tsk) do { } while (0)
350
351static inline fpu_switch_t switch_fpu_prepare(struct task_struct *old, struct task_struct *new)
352{
353 fpu_switch_t fpu;
354
355 fpu.preload = tsk_used_math(new) && new->fpu_counter > 5;
356 if (__thread_has_fpu(old)) {
357 if (__save_init_fpu(old))
358 fpu_lazy_state_intact(old);
359 __thread_clear_has_fpu(old);
Linus Torvalds34ddc812012-02-18 12:56:35 -0800360
361 /* Don't change CR0.TS if we just switch! */
362 if (fpu.preload) {
Linus Torvaldscea20ca2012-02-20 10:24:09 -0800363 new->fpu_counter++;
Linus Torvalds34ddc812012-02-18 12:56:35 -0800364 __thread_set_has_fpu(new);
365 prefetch(new->thread.fpu.state);
366 } else
367 stts();
368 } else {
369 old->fpu_counter = 0;
370 if (fpu.preload) {
Linus Torvaldscea20ca2012-02-20 10:24:09 -0800371 new->fpu_counter++;
Linus Torvalds34ddc812012-02-18 12:56:35 -0800372 if (fpu_lazy_restore(new))
373 fpu.preload = 0;
374 else
375 prefetch(new->thread.fpu.state);
376 __thread_fpu_begin(new);
377 }
378 }
379 return fpu;
380}
381
382/*
383 * By the time this gets called, we've already cleared CR0.TS and
384 * given the process the FPU if we are going to preload the FPU
385 * state - all we need to do is to conditionally restore the register
386 * state itself.
387 */
388static inline void switch_fpu_finish(struct task_struct *new, fpu_switch_t fpu)
389{
Linus Torvalds80ab6f12012-02-19 11:48:44 -0800390 if (fpu.preload) {
391 if (unlikely(restore_fpu_checking(new)))
392 __thread_fpu_end(new);
393 }
Linus Torvalds34ddc812012-02-18 12:56:35 -0800394}
395
396/*
Roland McGrath1eeaed72008-01-30 13:31:51 +0100397 * Signal frame handlers...
398 */
Suresh Siddhaab513702008-07-29 10:29:22 -0700399extern int save_i387_xstate(void __user *buf);
400extern int restore_i387_xstate(void __user *buf);
Roland McGrath1eeaed72008-01-30 13:31:51 +0100401
Roland McGrath1eeaed72008-01-30 13:31:51 +0100402static inline void __clear_fpu(struct task_struct *tsk)
403{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800404 if (__thread_has_fpu(tsk)) {
Brian Gerst51115d42010-09-03 21:17:10 -0400405 /* Ignore delayed exceptions from user space */
406 asm volatile("1: fwait\n"
407 "2:\n"
408 _ASM_EXTABLE(1b, 2b));
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800409 __thread_fpu_end(tsk);
Roland McGrath1eeaed72008-01-30 13:31:51 +0100410 }
411}
412
Linus Torvalds5b1cbac2012-02-13 13:56:14 -0800413/*
414 * Were we in an interrupt that interrupted kernel mode?
415 *
416 * We can do a kernel_fpu_begin/end() pair *ONLY* if that
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800417 * pair does nothing at all: the thread must not have fpu (so
Linus Torvalds5b1cbac2012-02-13 13:56:14 -0800418 * that we don't try to save the FPU state), and TS must
419 * be set (so that the clts/stts pair does nothing that is
420 * visible in the interrupted kernel thread).
421 */
422static inline bool interrupted_kernel_fpu_idle(void)
423{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800424 return !__thread_has_fpu(current) &&
Linus Torvalds5b1cbac2012-02-13 13:56:14 -0800425 (read_cr0() & X86_CR0_TS);
426}
427
428/*
429 * Were we in user mode (or vm86 mode) when we were
430 * interrupted?
431 *
432 * Doing kernel_fpu_begin/end() is ok if we are running
433 * in an interrupt context from user mode - we'll just
434 * save the FPU state as required.
435 */
436static inline bool interrupted_user_mode(void)
437{
438 struct pt_regs *regs = get_irq_regs();
439 return regs && user_mode_vm(regs);
440}
441
442/*
443 * Can we use the FPU in kernel mode with the
444 * whole "kernel_fpu_begin/end()" sequence?
445 *
446 * It's always ok in process context (ie "not interrupt")
447 * but it is sometimes ok even from an irq.
448 */
449static inline bool irq_fpu_usable(void)
450{
451 return !in_interrupt() ||
452 interrupted_user_mode() ||
453 interrupted_kernel_fpu_idle();
454}
455
Roland McGrath1eeaed72008-01-30 13:31:51 +0100456static inline void kernel_fpu_begin(void)
457{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800458 struct task_struct *me = current;
Linus Torvalds5b1cbac2012-02-13 13:56:14 -0800459
460 WARN_ON_ONCE(!irq_fpu_usable());
Roland McGrath1eeaed72008-01-30 13:31:51 +0100461 preempt_disable();
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800462 if (__thread_has_fpu(me)) {
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800463 __save_init_fpu(me);
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800464 __thread_clear_has_fpu(me);
Linus Torvaldsb6c66412012-02-16 12:22:48 -0800465 /* We do 'stts()' in kernel_fpu_end() */
466 } else
Roland McGrath1eeaed72008-01-30 13:31:51 +0100467 clts();
468}
469
470static inline void kernel_fpu_end(void)
471{
472 stts();
473 preempt_enable();
474}
475
Suresh Siddhae4914012008-08-13 22:02:26 +1000476/*
477 * Some instructions like VIA's padlock instructions generate a spurious
478 * DNA fault but don't modify SSE registers. And these instructions
Chuck Ebbert0b8c3d52009-06-09 10:40:50 -0400479 * get used from interrupt context as well. To prevent these kernel instructions
480 * in interrupt context interacting wrongly with other user/kernel fpu usage, we
Suresh Siddhae4914012008-08-13 22:02:26 +1000481 * should use them only in the context of irq_ts_save/restore()
482 */
483static inline int irq_ts_save(void)
484{
485 /*
Chuck Ebbert0b8c3d52009-06-09 10:40:50 -0400486 * If in process context and not atomic, we can take a spurious DNA fault.
487 * Otherwise, doing clts() in process context requires disabling preemption
488 * or some heavy lifting like kernel_fpu_begin()
Suresh Siddhae4914012008-08-13 22:02:26 +1000489 */
Chuck Ebbert0b8c3d52009-06-09 10:40:50 -0400490 if (!in_atomic())
Suresh Siddhae4914012008-08-13 22:02:26 +1000491 return 0;
492
493 if (read_cr0() & X86_CR0_TS) {
494 clts();
495 return 1;
496 }
497
498 return 0;
499}
500
501static inline void irq_ts_restore(int TS_state)
502{
503 if (TS_state)
504 stts();
505}
506
Roland McGrath1eeaed72008-01-30 13:31:51 +0100507/*
Linus Torvalds15d87912012-02-16 09:15:04 -0800508 * The question "does this thread have fpu access?"
509 * is slightly racy, since preemption could come in
510 * and revoke it immediately after the test.
511 *
512 * However, even in that very unlikely scenario,
513 * we can just assume we have FPU access - typically
514 * to save the FP state - we'll just take a #NM
515 * fault and get the FPU access back.
516 *
517 * The actual user_fpu_begin/end() functions
518 * need to be preemption-safe, though.
519 *
520 * NOTE! user_fpu_end() must be used only after you
521 * have saved the FP state, and user_fpu_begin() must
522 * be used only immediately before restoring it.
523 * These functions do not do any save/restore on
524 * their own.
525 */
526static inline int user_has_fpu(void)
527{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800528 return __thread_has_fpu(current);
Linus Torvalds15d87912012-02-16 09:15:04 -0800529}
530
531static inline void user_fpu_end(void)
532{
533 preempt_disable();
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800534 __thread_fpu_end(current);
Linus Torvalds15d87912012-02-16 09:15:04 -0800535 preempt_enable();
536}
537
538static inline void user_fpu_begin(void)
539{
540 preempt_disable();
Linus Torvalds6d59d7a2012-02-16 13:33:12 -0800541 if (!user_has_fpu())
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800542 __thread_fpu_begin(current);
Linus Torvalds15d87912012-02-16 09:15:04 -0800543 preempt_enable();
544}
545
546/*
Roland McGrath1eeaed72008-01-30 13:31:51 +0100547 * These disable preemption on their own and are safe
548 */
549static inline void save_init_fpu(struct task_struct *tsk)
550{
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800551 WARN_ON_ONCE(!__thread_has_fpu(tsk));
Roland McGrath1eeaed72008-01-30 13:31:51 +0100552 preempt_disable();
553 __save_init_fpu(tsk);
Linus Torvaldsf94edac2012-02-17 21:48:54 -0800554 __thread_fpu_end(tsk);
Roland McGrath1eeaed72008-01-30 13:31:51 +0100555 preempt_enable();
556}
557
558static inline void unlazy_fpu(struct task_struct *tsk)
559{
560 preempt_disable();
Linus Torvalds34ddc812012-02-18 12:56:35 -0800561 if (__thread_has_fpu(tsk)) {
562 __save_init_fpu(tsk);
563 __thread_fpu_end(tsk);
564 } else
565 tsk->fpu_counter = 0;
Roland McGrath1eeaed72008-01-30 13:31:51 +0100566 preempt_enable();
567}
568
569static inline void clear_fpu(struct task_struct *tsk)
570{
571 preempt_disable();
572 __clear_fpu(tsk);
573 preempt_enable();
574}
575
Roland McGrath1eeaed72008-01-30 13:31:51 +0100576/*
Roland McGrath1eeaed72008-01-30 13:31:51 +0100577 * i387 state interaction
578 */
579static inline unsigned short get_fpu_cwd(struct task_struct *tsk)
580{
581 if (cpu_has_fxsr) {
Avi Kivity86603282010-05-06 11:45:46 +0300582 return tsk->thread.fpu.state->fxsave.cwd;
Roland McGrath1eeaed72008-01-30 13:31:51 +0100583 } else {
Avi Kivity86603282010-05-06 11:45:46 +0300584 return (unsigned short)tsk->thread.fpu.state->fsave.cwd;
Roland McGrath1eeaed72008-01-30 13:31:51 +0100585 }
586}
587
588static inline unsigned short get_fpu_swd(struct task_struct *tsk)
589{
590 if (cpu_has_fxsr) {
Avi Kivity86603282010-05-06 11:45:46 +0300591 return tsk->thread.fpu.state->fxsave.swd;
Roland McGrath1eeaed72008-01-30 13:31:51 +0100592 } else {
Avi Kivity86603282010-05-06 11:45:46 +0300593 return (unsigned short)tsk->thread.fpu.state->fsave.swd;
Roland McGrath1eeaed72008-01-30 13:31:51 +0100594 }
595}
596
597static inline unsigned short get_fpu_mxcsr(struct task_struct *tsk)
598{
599 if (cpu_has_xmm) {
Avi Kivity86603282010-05-06 11:45:46 +0300600 return tsk->thread.fpu.state->fxsave.mxcsr;
Roland McGrath1eeaed72008-01-30 13:31:51 +0100601 } else {
602 return MXCSR_DEFAULT;
603 }
604}
605
Avi Kivity86603282010-05-06 11:45:46 +0300606static bool fpu_allocated(struct fpu *fpu)
607{
608 return fpu->state != NULL;
609}
610
611static inline int fpu_alloc(struct fpu *fpu)
612{
613 if (fpu_allocated(fpu))
614 return 0;
615 fpu->state = kmem_cache_alloc(task_xstate_cachep, GFP_KERNEL);
616 if (!fpu->state)
617 return -ENOMEM;
618 WARN_ON((unsigned long)fpu->state & 15);
619 return 0;
620}
621
622static inline void fpu_free(struct fpu *fpu)
623{
624 if (fpu->state) {
625 kmem_cache_free(task_xstate_cachep, fpu->state);
626 fpu->state = NULL;
627 }
628}
629
630static inline void fpu_copy(struct fpu *dst, struct fpu *src)
631{
632 memcpy(dst->state, src->state, xstate_size);
633}
634
Sheng Yang5ee481d2010-05-17 17:22:23 +0800635extern void fpu_finit(struct fpu *fpu);
636
Herbert Xu3b0d6592009-11-03 09:11:15 -0500637#endif /* __ASSEMBLY__ */
638
H. Peter Anvin1965aae2008-10-22 22:26:29 -0700639#endif /* _ASM_X86_I387_H */