blob: 17b7549c4134f997289729bfeb17855c1cf62dad [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * Copyright (C) 1994 Linus Torvalds
3 *
4 * Pentium III FXSR, SSE support
5 * General FPU state handling cleanups
6 * Gareth Hughes <gareth@valinux.com>, May 2000
7 */
Alexey Dobriyan129f6942005-06-23 00:08:33 -07008#include <linux/module.h>
Roland McGrath44210112008-01-30 13:31:50 +01009#include <linux/regset.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010010#include <linux/sched.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090011#include <linux/slab.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010012
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <asm/sigcontext.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010014#include <asm/processor.h>
15#include <asm/math_emu.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <asm/uaccess.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010017#include <asm/ptrace.h>
18#include <asm/i387.h>
19#include <asm/user.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020
Roland McGrath44210112008-01-30 13:31:50 +010021#ifdef CONFIG_X86_64
Ingo Molnarf6689642008-03-05 15:37:32 +010022# include <asm/sigcontext32.h>
23# include <asm/user32.h>
Roland McGrath44210112008-01-30 13:31:50 +010024#else
Suresh Siddhaab513702008-07-29 10:29:22 -070025# define save_i387_xstate_ia32 save_i387_xstate
26# define restore_i387_xstate_ia32 restore_i387_xstate
Ingo Molnarf6689642008-03-05 15:37:32 +010027# define _fpstate_ia32 _fpstate
Suresh Siddhaab513702008-07-29 10:29:22 -070028# define _xstate_ia32 _xstate
Suresh Siddha3c1c7f12008-07-29 10:29:21 -070029# define sig_xstate_ia32_size sig_xstate_size
Suresh Siddhac37b5ef2008-07-29 10:29:25 -070030# define fx_sw_reserved_ia32 fx_sw_reserved
Ingo Molnarf6689642008-03-05 15:37:32 +010031# define user_i387_ia32_struct user_i387_struct
32# define user32_fxsr_struct user_fxsr_struct
Roland McGrath44210112008-01-30 13:31:50 +010033#endif
34
Linus Torvalds8546c002012-02-21 10:25:45 -080035/*
36 * Were we in an interrupt that interrupted kernel mode?
37 *
38 * We can do a kernel_fpu_begin/end() pair *ONLY* if that
39 * pair does nothing at all: the thread must not have fpu (so
40 * that we don't try to save the FPU state), and TS must
41 * be set (so that the clts/stts pair does nothing that is
42 * visible in the interrupted kernel thread).
43 */
44static inline bool interrupted_kernel_fpu_idle(void)
45{
46 return !__thread_has_fpu(current) &&
47 (read_cr0() & X86_CR0_TS);
48}
49
50/*
51 * Were we in user mode (or vm86 mode) when we were
52 * interrupted?
53 *
54 * Doing kernel_fpu_begin/end() is ok if we are running
55 * in an interrupt context from user mode - we'll just
56 * save the FPU state as required.
57 */
58static inline bool interrupted_user_mode(void)
59{
60 struct pt_regs *regs = get_irq_regs();
61 return regs && user_mode_vm(regs);
62}
63
64/*
65 * Can we use the FPU in kernel mode with the
66 * whole "kernel_fpu_begin/end()" sequence?
67 *
68 * It's always ok in process context (ie "not interrupt")
69 * but it is sometimes ok even from an irq.
70 */
71bool irq_fpu_usable(void)
72{
73 return !in_interrupt() ||
74 interrupted_user_mode() ||
75 interrupted_kernel_fpu_idle();
76}
77EXPORT_SYMBOL(irq_fpu_usable);
78
79void kernel_fpu_begin(void)
80{
81 struct task_struct *me = current;
82
83 WARN_ON_ONCE(!irq_fpu_usable());
84 preempt_disable();
85 if (__thread_has_fpu(me)) {
86 __save_init_fpu(me);
87 __thread_clear_has_fpu(me);
88 /* We do 'stts()' in kernel_fpu_end() */
89 } else {
90 percpu_write(fpu_owner_task, NULL);
91 clts();
92 }
93}
94EXPORT_SYMBOL(kernel_fpu_begin);
95
/*
 * End a section opened with kernel_fpu_begin(): issue stts() and then
 * re-enable the preemption that kernel_fpu_begin() disabled.
 */
void kernel_fpu_end(void)
{
	stts();

	preempt_enable();
}
EXPORT_SYMBOL(kernel_fpu_end);
102
103void unlazy_fpu(struct task_struct *tsk)
104{
105 preempt_disable();
106 if (__thread_has_fpu(tsk)) {
107 __save_init_fpu(tsk);
108 __thread_fpu_end(tsk);
109 } else
110 tsk->fpu_counter = 0;
111 preempt_enable();
112}
113EXPORT_SYMBOL(unlazy_fpu);
114
/*
 * HAVE_HWFP: with CONFIG_MATH_EMULATION this is read from
 * boot_cpu_data.hard_math; without it, it is the constant 1.
 */
#ifdef CONFIG_MATH_EMULATION
# define HAVE_HWFP		(boot_cpu_data.hard_math)
#else
# define HAVE_HWFP		1
#endif

/* ANDed into mxcsr values accepted from outside; narrowed by mxcsr_feature_mask_init() */
static unsigned int mxcsr_feature_mask __read_mostly = 0xffffffffu;
/* Size of the FPU state area; set in init_thread_xstate() */
unsigned int xstate_size;
EXPORT_SYMBOL_GPL(xstate_size);
/* Size checked with access_ok() for the ia32 signal-frame FPU area */
unsigned int sig_xstate_ia32_size = sizeof(struct _fpstate_ia32);
/* Scratch FXSAVE image used by mxcsr_feature_mask_init() */
static struct i387_fxsave_struct fx_scratch __cpuinitdata;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126
Suresh Siddha61c46282008-03-10 15:28:04 -0700127void __cpuinit mxcsr_feature_mask_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128{
129 unsigned long mask = 0;
Ingo Molnarf6689642008-03-05 15:37:32 +0100130
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131 clts();
132 if (cpu_has_fxsr) {
Suresh Siddha61c46282008-03-10 15:28:04 -0700133 memset(&fx_scratch, 0, sizeof(struct i387_fxsave_struct));
134 asm volatile("fxsave %0" : : "m" (fx_scratch));
135 mask = fx_scratch.mxcsr_mask;
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100136 if (mask == 0)
137 mask = 0x0000ffbf;
138 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 mxcsr_feature_mask &= mask;
140 stts();
141}
142
Robert Richter0e49bf62010-07-21 19:03:52 +0200143static void __cpuinit init_thread_xstate(void)
Suresh Siddha61c46282008-03-10 15:28:04 -0700144{
Robert Richter0e49bf62010-07-21 19:03:52 +0200145 /*
146 * Note that xstate_size might be overwriten later during
147 * xsave_init().
148 */
149
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700150 if (!HAVE_HWFP) {
Robert Richter1f999ab2010-07-21 19:03:57 +0200151 /*
152 * Disable xsave as we do not support it if i387
153 * emulation is enabled.
154 */
155 setup_clear_cpu_cap(X86_FEATURE_XSAVE);
156 setup_clear_cpu_cap(X86_FEATURE_XSAVEOPT);
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700157 xstate_size = sizeof(struct i387_soft_struct);
158 return;
159 }
160
Suresh Siddha61c46282008-03-10 15:28:04 -0700161 if (cpu_has_fxsr)
162 xstate_size = sizeof(struct i387_fxsave_struct);
Suresh Siddha61c46282008-03-10 15:28:04 -0700163 else
164 xstate_size = sizeof(struct i387_fsave_struct);
Suresh Siddha61c46282008-03-10 15:28:04 -0700165}
166
Roland McGrath44210112008-01-30 13:31:50 +0100167/*
168 * Called at bootup to set up the initial FPU state that is later cloned
169 * into all processes.
170 */
Robert Richter0e49bf62010-07-21 19:03:52 +0200171
Roland McGrath44210112008-01-30 13:31:50 +0100172void __cpuinit fpu_init(void)
173{
Brian Gerst6ac8bac2010-09-03 21:17:09 -0400174 unsigned long cr0;
175 unsigned long cr4_mask = 0;
Ingo Molnarf6689642008-03-05 15:37:32 +0100176
Brian Gerst6ac8bac2010-09-03 21:17:09 -0400177 if (cpu_has_fxsr)
178 cr4_mask |= X86_CR4_OSFXSR;
179 if (cpu_has_xmm)
180 cr4_mask |= X86_CR4_OSXMMEXCPT;
181 if (cr4_mask)
182 set_in_cr4(cr4_mask);
Roland McGrath44210112008-01-30 13:31:50 +0100183
Brian Gerst6ac8bac2010-09-03 21:17:09 -0400184 cr0 = read_cr0();
185 cr0 &= ~(X86_CR0_TS|X86_CR0_EM); /* clear TS and EM */
186 if (!HAVE_HWFP)
187 cr0 |= X86_CR0_EM;
188 write_cr0(cr0);
Roland McGrath44210112008-01-30 13:31:50 +0100189
Suresh Siddhadc1e35c2008-07-29 10:29:19 -0700190 if (!smp_processor_id())
191 init_thread_xstate();
Suresh Siddhadc1e35c2008-07-29 10:29:19 -0700192
Roland McGrath44210112008-01-30 13:31:50 +0100193 mxcsr_feature_mask_init();
194 /* clean state in init */
Avi Kivityc9ad4882010-05-06 11:45:45 +0300195 current_thread_info()->status = 0;
Roland McGrath44210112008-01-30 13:31:50 +0100196 clear_used_math();
197}
Robert Richter0e49bf62010-07-21 19:03:52 +0200198
Sheng Yang5ee481d2010-05-17 17:22:23 +0800199void fpu_finit(struct fpu *fpu)
Avi Kivity86603282010-05-06 11:45:46 +0300200{
Avi Kivity86603282010-05-06 11:45:46 +0300201 if (!HAVE_HWFP) {
202 finit_soft_fpu(&fpu->state->soft);
203 return;
204 }
Avi Kivity86603282010-05-06 11:45:46 +0300205
206 if (cpu_has_fxsr) {
207 struct i387_fxsave_struct *fx = &fpu->state->fxsave;
208
209 memset(fx, 0, xstate_size);
210 fx->cwd = 0x37f;
211 if (cpu_has_xmm)
212 fx->mxcsr = MXCSR_DEFAULT;
213 } else {
214 struct i387_fsave_struct *fp = &fpu->state->fsave;
215 memset(fp, 0, xstate_size);
216 fp->cwd = 0xffff037fu;
217 fp->swd = 0xffff0000u;
218 fp->twd = 0xffffffffu;
219 fp->fos = 0xffff0000u;
220 }
221}
Sheng Yang5ee481d2010-05-17 17:22:23 +0800222EXPORT_SYMBOL_GPL(fpu_finit);
Avi Kivity86603282010-05-06 11:45:46 +0300223
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224/*
225 * The _current_ task is using the FPU for the first time
226 * so initialize it and set the mxcsr to its default
227 * value at reset if we support XMM instructions and then
Lucas De Marchi0d2eb442011-03-17 16:24:16 -0300228 * remember the current task has used the FPU.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 */
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700230int init_fpu(struct task_struct *tsk)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231{
Avi Kivity86603282010-05-06 11:45:46 +0300232 int ret;
233
Roland McGrath44210112008-01-30 13:31:50 +0100234 if (tsk_used_math(tsk)) {
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700235 if (HAVE_HWFP && tsk == current)
Roland McGrath44210112008-01-30 13:31:50 +0100236 unlazy_fpu(tsk);
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700237 return 0;
238 }
239
240 /*
241 * Memory allocation at the first usage of the FPU and other state.
242 */
Avi Kivity86603282010-05-06 11:45:46 +0300243 ret = fpu_alloc(&tsk->thread.fpu);
244 if (ret)
245 return ret;
Roland McGrath44210112008-01-30 13:31:50 +0100246
Avi Kivity86603282010-05-06 11:45:46 +0300247 fpu_finit(&tsk->thread.fpu);
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700248
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 set_stopped_child_used_math(tsk);
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700250 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251}
Avi Kivitye5c30142011-01-11 12:15:54 +0200252EXPORT_SYMBOL_GPL(init_fpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800254/*
255 * The xstateregs_active() routine is the same as the fpregs_active() routine,
256 * as the "regset->n" for the xstate regset will be updated based on the feature
257 * capabilites supported by the xsave.
258 */
Roland McGrath44210112008-01-30 13:31:50 +0100259int fpregs_active(struct task_struct *target, const struct user_regset *regset)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260{
Roland McGrath44210112008-01-30 13:31:50 +0100261 return tsk_used_math(target) ? regset->n : 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262}
Roland McGrath44210112008-01-30 13:31:50 +0100263
264int xfpregs_active(struct task_struct *target, const struct user_regset *regset)
265{
266 return (cpu_has_fxsr && tsk_used_math(target)) ? regset->n : 0;
267}
268
269int xfpregs_get(struct task_struct *target, const struct user_regset *regset,
270 unsigned int pos, unsigned int count,
271 void *kbuf, void __user *ubuf)
272{
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700273 int ret;
274
Roland McGrath44210112008-01-30 13:31:50 +0100275 if (!cpu_has_fxsr)
276 return -ENODEV;
277
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700278 ret = init_fpu(target);
279 if (ret)
280 return ret;
Roland McGrath44210112008-01-30 13:31:50 +0100281
Suresh Siddha29104e12010-07-19 16:05:49 -0700282 sanitize_i387_state(target);
283
Roland McGrath44210112008-01-30 13:31:50 +0100284 return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300285 &target->thread.fpu.state->fxsave, 0, -1);
Roland McGrath44210112008-01-30 13:31:50 +0100286}
287
288int xfpregs_set(struct task_struct *target, const struct user_regset *regset,
289 unsigned int pos, unsigned int count,
290 const void *kbuf, const void __user *ubuf)
291{
292 int ret;
293
294 if (!cpu_has_fxsr)
295 return -ENODEV;
296
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700297 ret = init_fpu(target);
298 if (ret)
299 return ret;
300
Suresh Siddha29104e12010-07-19 16:05:49 -0700301 sanitize_i387_state(target);
302
Roland McGrath44210112008-01-30 13:31:50 +0100303 ret = user_regset_copyin(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300304 &target->thread.fpu.state->fxsave, 0, -1);
Roland McGrath44210112008-01-30 13:31:50 +0100305
306 /*
307 * mxcsr reserved bits must be masked to zero for security reasons.
308 */
Avi Kivity86603282010-05-06 11:45:46 +0300309 target->thread.fpu.state->fxsave.mxcsr &= mxcsr_feature_mask;
Roland McGrath44210112008-01-30 13:31:50 +0100310
Suresh Siddha42deec62008-07-29 10:29:26 -0700311 /*
312 * update the header bits in the xsave header, indicating the
313 * presence of FP and SSE state.
314 */
315 if (cpu_has_xsave)
Avi Kivity86603282010-05-06 11:45:46 +0300316 target->thread.fpu.state->xsave.xsave_hdr.xstate_bv |= XSTATE_FPSSE;
Suresh Siddha42deec62008-07-29 10:29:26 -0700317
Roland McGrath44210112008-01-30 13:31:50 +0100318 return ret;
319}
320
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800321int xstateregs_get(struct task_struct *target, const struct user_regset *regset,
322 unsigned int pos, unsigned int count,
323 void *kbuf, void __user *ubuf)
324{
325 int ret;
326
327 if (!cpu_has_xsave)
328 return -ENODEV;
329
330 ret = init_fpu(target);
331 if (ret)
332 return ret;
333
334 /*
Suresh Siddhaff7fbc72010-02-22 14:51:33 -0800335 * Copy the 48bytes defined by the software first into the xstate
336 * memory layout in the thread struct, so that we can copy the entire
337 * xstateregs to the user using one user_regset_copyout().
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800338 */
Avi Kivity86603282010-05-06 11:45:46 +0300339 memcpy(&target->thread.fpu.state->fxsave.sw_reserved,
Suresh Siddhaff7fbc72010-02-22 14:51:33 -0800340 xstate_fx_sw_bytes, sizeof(xstate_fx_sw_bytes));
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800341
342 /*
Suresh Siddhaff7fbc72010-02-22 14:51:33 -0800343 * Copy the xstate memory layout.
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800344 */
345 ret = user_regset_copyout(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300346 &target->thread.fpu.state->xsave, 0, -1);
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800347 return ret;
348}
349
350int xstateregs_set(struct task_struct *target, const struct user_regset *regset,
351 unsigned int pos, unsigned int count,
352 const void *kbuf, const void __user *ubuf)
353{
354 int ret;
355 struct xsave_hdr_struct *xsave_hdr;
356
357 if (!cpu_has_xsave)
358 return -ENODEV;
359
360 ret = init_fpu(target);
361 if (ret)
362 return ret;
363
364 ret = user_regset_copyin(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300365 &target->thread.fpu.state->xsave, 0, -1);
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800366
367 /*
368 * mxcsr reserved bits must be masked to zero for security reasons.
369 */
Avi Kivity86603282010-05-06 11:45:46 +0300370 target->thread.fpu.state->fxsave.mxcsr &= mxcsr_feature_mask;
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800371
Avi Kivity86603282010-05-06 11:45:46 +0300372 xsave_hdr = &target->thread.fpu.state->xsave.xsave_hdr;
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800373
374 xsave_hdr->xstate_bv &= pcntxt_mask;
375 /*
376 * These bits must be zero.
377 */
378 xsave_hdr->reserved1[0] = xsave_hdr->reserved1[1] = 0;
379
380 return ret;
381}
382
Roland McGrath44210112008-01-30 13:31:50 +0100383#if defined CONFIG_X86_32 || defined CONFIG_IA32_EMULATION
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384
Linus Torvalds1da177e2005-04-16 15:20:36 -0700385/*
386 * FPU tag word conversions.
387 */
388
/*
 * Convert a 16-bit i387 tag word (two bits per register) into the
 * 8-bit FXSR form (one bit per register).
 *
 * A register's result bit is 1 (valid) unless both of its tag bits are
 * set, in which case it is 0 (empty). Register i of the input (bits
 * 2i+1:2i) maps to bit i of the result.
 */
static inline unsigned short twd_i387_to_fxsr(unsigned short twd)
{
	/* 32-bit working copy, to avoid 16 bit prefixes in the code */
	unsigned int bits = ~twd;

	/* Collapse every bit pair to 01 (valid) or 00 (empty) */
	bits |= bits >> 1;
	bits &= 0x5555;		/* 0V0V0V0V0V0V0V0V */

	/* Pack the eight valid bits down into the low byte */
	bits |= bits >> 1;
	bits &= 0x3333;		/* 00VV00VV00VV00VV */
	bits |= bits >> 2;
	bits &= 0x0f0f;		/* 0000VVVV0000VVVV */
	bits |= bits >> 4;
	bits &= 0x00ff;		/* 00000000VVVVVVVV */

	return bits;
}
403
Phil Carmody497888c2011-07-14 15:07:13 +0300404#define FPREG_ADDR(f, n) ((void *)&(f)->st_space + (n) * 16)
Roland McGrath44210112008-01-30 13:31:50 +0100405#define FP_EXP_TAG_VALID 0
406#define FP_EXP_TAG_ZERO 1
407#define FP_EXP_TAG_SPECIAL 2
408#define FP_EXP_TAG_EMPTY 3
409
410static inline u32 twd_fxsr_to_i387(struct i387_fxsave_struct *fxsave)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411{
Roland McGrath44210112008-01-30 13:31:50 +0100412 struct _fpxreg *st;
413 u32 tos = (fxsave->swd >> 11) & 7;
414 u32 twd = (unsigned long) fxsave->twd;
415 u32 tag;
416 u32 ret = 0xffff0000u;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 int i;
418
Roland McGrath44210112008-01-30 13:31:50 +0100419 for (i = 0; i < 8; i++, twd >>= 1) {
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100420 if (twd & 0x1) {
421 st = FPREG_ADDR(fxsave, (i - tos) & 7);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100423 switch (st->exponent & 0x7fff) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424 case 0x7fff:
Roland McGrath44210112008-01-30 13:31:50 +0100425 tag = FP_EXP_TAG_SPECIAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 break;
427 case 0x0000:
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100428 if (!st->significand[0] &&
429 !st->significand[1] &&
430 !st->significand[2] &&
Roland McGrath44210112008-01-30 13:31:50 +0100431 !st->significand[3])
432 tag = FP_EXP_TAG_ZERO;
433 else
434 tag = FP_EXP_TAG_SPECIAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 break;
436 default:
Roland McGrath44210112008-01-30 13:31:50 +0100437 if (st->significand[3] & 0x8000)
438 tag = FP_EXP_TAG_VALID;
439 else
440 tag = FP_EXP_TAG_SPECIAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700441 break;
442 }
443 } else {
Roland McGrath44210112008-01-30 13:31:50 +0100444 tag = FP_EXP_TAG_EMPTY;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445 }
Roland McGrath44210112008-01-30 13:31:50 +0100446 ret |= tag << (2 * i);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700447 }
448 return ret;
449}
450
451/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452 * FXSR floating point environment conversions.
453 */
454
Ingo Molnarf6689642008-03-05 15:37:32 +0100455static void
456convert_from_fxsr(struct user_i387_ia32_struct *env, struct task_struct *tsk)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457{
Avi Kivity86603282010-05-06 11:45:46 +0300458 struct i387_fxsave_struct *fxsave = &tsk->thread.fpu.state->fxsave;
Roland McGrath44210112008-01-30 13:31:50 +0100459 struct _fpreg *to = (struct _fpreg *) &env->st_space[0];
460 struct _fpxreg *from = (struct _fpxreg *) &fxsave->st_space[0];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700461 int i;
462
Roland McGrath44210112008-01-30 13:31:50 +0100463 env->cwd = fxsave->cwd | 0xffff0000u;
464 env->swd = fxsave->swd | 0xffff0000u;
465 env->twd = twd_fxsr_to_i387(fxsave);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700466
Roland McGrath44210112008-01-30 13:31:50 +0100467#ifdef CONFIG_X86_64
468 env->fip = fxsave->rip;
469 env->foo = fxsave->rdp;
Brian Gerst10c11f32010-09-03 21:17:13 -0400470 /*
471 * should be actually ds/cs at fpu exception time, but
472 * that information is not available in 64bit mode.
473 */
474 env->fcs = task_pt_regs(tsk)->cs;
Roland McGrath44210112008-01-30 13:31:50 +0100475 if (tsk == current) {
Brian Gerst10c11f32010-09-03 21:17:13 -0400476 savesegment(ds, env->fos);
Roland McGrath44210112008-01-30 13:31:50 +0100477 } else {
Brian Gerst10c11f32010-09-03 21:17:13 -0400478 env->fos = tsk->thread.ds;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700479 }
Brian Gerst10c11f32010-09-03 21:17:13 -0400480 env->fos |= 0xffff0000;
Roland McGrath44210112008-01-30 13:31:50 +0100481#else
482 env->fip = fxsave->fip;
Jan Beulich609b5292008-03-05 08:35:14 +0000483 env->fcs = (u16) fxsave->fcs | ((u32) fxsave->fop << 16);
Roland McGrath44210112008-01-30 13:31:50 +0100484 env->foo = fxsave->foo;
485 env->fos = fxsave->fos;
486#endif
487
488 for (i = 0; i < 8; ++i)
489 memcpy(&to[i], &from[i], sizeof(to[0]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490}
491
Roland McGrath44210112008-01-30 13:31:50 +0100492static void convert_to_fxsr(struct task_struct *tsk,
493 const struct user_i387_ia32_struct *env)
494
Linus Torvalds1da177e2005-04-16 15:20:36 -0700495{
Avi Kivity86603282010-05-06 11:45:46 +0300496 struct i387_fxsave_struct *fxsave = &tsk->thread.fpu.state->fxsave;
Roland McGrath44210112008-01-30 13:31:50 +0100497 struct _fpreg *from = (struct _fpreg *) &env->st_space[0];
498 struct _fpxreg *to = (struct _fpxreg *) &fxsave->st_space[0];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499 int i;
500
Roland McGrath44210112008-01-30 13:31:50 +0100501 fxsave->cwd = env->cwd;
502 fxsave->swd = env->swd;
503 fxsave->twd = twd_i387_to_fxsr(env->twd);
504 fxsave->fop = (u16) ((u32) env->fcs >> 16);
505#ifdef CONFIG_X86_64
506 fxsave->rip = env->fip;
507 fxsave->rdp = env->foo;
508 /* cs and ds ignored */
509#else
510 fxsave->fip = env->fip;
511 fxsave->fcs = (env->fcs & 0xffff);
512 fxsave->foo = env->foo;
513 fxsave->fos = env->fos;
514#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515
Roland McGrath44210112008-01-30 13:31:50 +0100516 for (i = 0; i < 8; ++i)
517 memcpy(&to[i], &from[i], sizeof(from[0]));
518}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700519
Roland McGrath44210112008-01-30 13:31:50 +0100520int fpregs_get(struct task_struct *target, const struct user_regset *regset,
521 unsigned int pos, unsigned int count,
522 void *kbuf, void __user *ubuf)
523{
524 struct user_i387_ia32_struct env;
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700525 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700526
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700527 ret = init_fpu(target);
528 if (ret)
529 return ret;
Roland McGrath44210112008-01-30 13:31:50 +0100530
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700531 if (!HAVE_HWFP)
532 return fpregs_soft_get(target, regset, pos, count, kbuf, ubuf);
533
Ingo Molnarf6689642008-03-05 15:37:32 +0100534 if (!cpu_has_fxsr) {
Roland McGrath44210112008-01-30 13:31:50 +0100535 return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300536 &target->thread.fpu.state->fsave, 0,
Suresh Siddha61c46282008-03-10 15:28:04 -0700537 -1);
Ingo Molnarf6689642008-03-05 15:37:32 +0100538 }
Roland McGrath44210112008-01-30 13:31:50 +0100539
Suresh Siddha29104e12010-07-19 16:05:49 -0700540 sanitize_i387_state(target);
541
Roland McGrath44210112008-01-30 13:31:50 +0100542 if (kbuf && pos == 0 && count == sizeof(env)) {
543 convert_from_fxsr(kbuf, target);
544 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700545 }
Roland McGrath44210112008-01-30 13:31:50 +0100546
547 convert_from_fxsr(&env, target);
Ingo Molnarf6689642008-03-05 15:37:32 +0100548
Roland McGrath44210112008-01-30 13:31:50 +0100549 return user_regset_copyout(&pos, &count, &kbuf, &ubuf, &env, 0, -1);
550}
551
552int fpregs_set(struct task_struct *target, const struct user_regset *regset,
553 unsigned int pos, unsigned int count,
554 const void *kbuf, const void __user *ubuf)
555{
556 struct user_i387_ia32_struct env;
557 int ret;
558
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700559 ret = init_fpu(target);
560 if (ret)
561 return ret;
562
Suresh Siddha29104e12010-07-19 16:05:49 -0700563 sanitize_i387_state(target);
564
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700565 if (!HAVE_HWFP)
566 return fpregs_soft_set(target, regset, pos, count, kbuf, ubuf);
567
Ingo Molnarf6689642008-03-05 15:37:32 +0100568 if (!cpu_has_fxsr) {
Roland McGrath44210112008-01-30 13:31:50 +0100569 return user_regset_copyin(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300570 &target->thread.fpu.state->fsave, 0, -1);
Ingo Molnarf6689642008-03-05 15:37:32 +0100571 }
Roland McGrath44210112008-01-30 13:31:50 +0100572
573 if (pos > 0 || count < sizeof(env))
574 convert_from_fxsr(&env, target);
575
576 ret = user_regset_copyin(&pos, &count, &kbuf, &ubuf, &env, 0, -1);
577 if (!ret)
578 convert_to_fxsr(target, &env);
579
Suresh Siddha42deec62008-07-29 10:29:26 -0700580 /*
581 * update the header bit in the xsave header, indicating the
582 * presence of FP.
583 */
584 if (cpu_has_xsave)
Avi Kivity86603282010-05-06 11:45:46 +0300585 target->thread.fpu.state->xsave.xsave_hdr.xstate_bv |= XSTATE_FP;
Roland McGrath44210112008-01-30 13:31:50 +0100586 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700587}
588
589/*
590 * Signal frame handlers.
591 */
592
Roland McGrath44210112008-01-30 13:31:50 +0100593static inline int save_i387_fsave(struct _fpstate_ia32 __user *buf)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594{
595 struct task_struct *tsk = current;
Avi Kivity86603282010-05-06 11:45:46 +0300596 struct i387_fsave_struct *fp = &tsk->thread.fpu.state->fsave;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597
Suresh Siddha61c46282008-03-10 15:28:04 -0700598 fp->status = fp->swd;
599 if (__copy_to_user(buf, fp, sizeof(struct i387_fsave_struct)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700600 return -1;
601 return 1;
602}
603
Roland McGrath44210112008-01-30 13:31:50 +0100604static int save_i387_fxsave(struct _fpstate_ia32 __user *buf)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700605{
606 struct task_struct *tsk = current;
Avi Kivity86603282010-05-06 11:45:46 +0300607 struct i387_fxsave_struct *fx = &tsk->thread.fpu.state->fxsave;
Roland McGrath44210112008-01-30 13:31:50 +0100608 struct user_i387_ia32_struct env;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700609 int err = 0;
610
Roland McGrath44210112008-01-30 13:31:50 +0100611 convert_from_fxsr(&env, tsk);
612 if (__copy_to_user(buf, &env, sizeof(env)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 return -1;
614
Suresh Siddha61c46282008-03-10 15:28:04 -0700615 err |= __put_user(fx->swd, &buf->status);
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100616 err |= __put_user(X86_FXSR_MAGIC, &buf->magic);
617 if (err)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618 return -1;
619
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700620 if (__copy_to_user(&buf->_fxsr_env[0], fx, xstate_size))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621 return -1;
622 return 1;
623}
624
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700625static int save_i387_xsave(void __user *buf)
626{
Suresh Siddha04944b72008-10-07 14:04:28 -0700627 struct task_struct *tsk = current;
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700628 struct _fpstate_ia32 __user *fx = buf;
629 int err = 0;
630
Suresh Siddha29104e12010-07-19 16:05:49 -0700631
632 sanitize_i387_state(tsk);
633
Suresh Siddha04944b72008-10-07 14:04:28 -0700634 /*
635 * For legacy compatible, we always set FP/SSE bits in the bit
636 * vector while saving the state to the user context.
637 * This will enable us capturing any changes(during sigreturn) to
638 * the FP/SSE bits by the legacy applications which don't touch
639 * xstate_bv in the xsave header.
640 *
641 * xsave aware applications can change the xstate_bv in the xsave
642 * header as well as change any contents in the memory layout.
643 * xrestore as part of sigreturn will capture all the changes.
644 */
Avi Kivity86603282010-05-06 11:45:46 +0300645 tsk->thread.fpu.state->xsave.xsave_hdr.xstate_bv |= XSTATE_FPSSE;
Suresh Siddha04944b72008-10-07 14:04:28 -0700646
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700647 if (save_i387_fxsave(fx) < 0)
648 return -1;
649
650 err = __copy_to_user(&fx->sw_reserved, &fx_sw_reserved_ia32,
651 sizeof(struct _fpx_sw_bytes));
652 err |= __put_user(FP_XSTATE_MAGIC2,
653 (__u32 __user *) (buf + sig_xstate_ia32_size
654 - FP_XSTATE_MAGIC2_SIZE));
655 if (err)
656 return -1;
657
658 return 1;
659}
660
Suresh Siddhaab513702008-07-29 10:29:22 -0700661int save_i387_xstate_ia32(void __user *buf)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700662{
Suresh Siddhaab513702008-07-29 10:29:22 -0700663 struct _fpstate_ia32 __user *fp = (struct _fpstate_ia32 __user *) buf;
664 struct task_struct *tsk = current;
665
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100666 if (!used_math())
Linus Torvalds1da177e2005-04-16 15:20:36 -0700667 return 0;
Suresh Siddhaab513702008-07-29 10:29:22 -0700668
669 if (!access_ok(VERIFY_WRITE, buf, sig_xstate_ia32_size))
670 return -EACCES;
Ingo Molnarf6689642008-03-05 15:37:32 +0100671 /*
672 * This will cause a "finit" to be triggered by the next
Linus Torvalds1da177e2005-04-16 15:20:36 -0700673 * attempted FPU operation by the 'current' process.
674 */
675 clear_used_math();
676
Ingo Molnarf6689642008-03-05 15:37:32 +0100677 if (!HAVE_HWFP) {
Roland McGrath44210112008-01-30 13:31:50 +0100678 return fpregs_soft_get(current, NULL,
679 0, sizeof(struct user_i387_ia32_struct),
Suresh Siddhaab513702008-07-29 10:29:22 -0700680 NULL, fp) ? -1 : 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700681 }
Ingo Molnarf6689642008-03-05 15:37:32 +0100682
Suresh Siddhaab513702008-07-29 10:29:22 -0700683 unlazy_fpu(tsk);
684
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700685 if (cpu_has_xsave)
686 return save_i387_xsave(fp);
Ingo Molnarf6689642008-03-05 15:37:32 +0100687 if (cpu_has_fxsr)
Suresh Siddhaab513702008-07-29 10:29:22 -0700688 return save_i387_fxsave(fp);
Ingo Molnarf6689642008-03-05 15:37:32 +0100689 else
Suresh Siddhaab513702008-07-29 10:29:22 -0700690 return save_i387_fsave(fp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691}
692
Roland McGrath44210112008-01-30 13:31:50 +0100693static inline int restore_i387_fsave(struct _fpstate_ia32 __user *buf)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694{
695 struct task_struct *tsk = current;
Ingo Molnarf6689642008-03-05 15:37:32 +0100696
Avi Kivity86603282010-05-06 11:45:46 +0300697 return __copy_from_user(&tsk->thread.fpu.state->fsave, buf,
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100698 sizeof(struct i387_fsave_struct));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700699}
700
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700701static int restore_i387_fxsave(struct _fpstate_ia32 __user *buf,
702 unsigned int size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700703{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700704 struct task_struct *tsk = current;
Roland McGrath44210112008-01-30 13:31:50 +0100705 struct user_i387_ia32_struct env;
Ingo Molnarf6689642008-03-05 15:37:32 +0100706 int err;
707
Avi Kivity86603282010-05-06 11:45:46 +0300708 err = __copy_from_user(&tsk->thread.fpu.state->fxsave, &buf->_fxsr_env[0],
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700709 size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 /* mxcsr reserved bits must be masked to zero for security reasons */
Avi Kivity86603282010-05-06 11:45:46 +0300711 tsk->thread.fpu.state->fxsave.mxcsr &= mxcsr_feature_mask;
Roland McGrath44210112008-01-30 13:31:50 +0100712 if (err || __copy_from_user(&env, buf, sizeof(env)))
713 return 1;
714 convert_to_fxsr(tsk, &env);
Ingo Molnarf6689642008-03-05 15:37:32 +0100715
Roland McGrath44210112008-01-30 13:31:50 +0100716 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717}
718
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700719static int restore_i387_xsave(void __user *buf)
720{
721 struct _fpx_sw_bytes fx_sw_user;
722 struct _fpstate_ia32 __user *fx_user =
723 ((struct _fpstate_ia32 __user *) buf);
724 struct i387_fxsave_struct __user *fx =
725 (struct i387_fxsave_struct __user *) &fx_user->_fxsr_env[0];
726 struct xsave_hdr_struct *xsave_hdr =
Avi Kivity86603282010-05-06 11:45:46 +0300727 &current->thread.fpu.state->xsave.xsave_hdr;
H. Peter Anvin6152e4b2008-07-29 17:23:16 -0700728 u64 mask;
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700729 int err;
730
731 if (check_for_xstate(fx, buf, &fx_sw_user))
732 goto fx_only;
733
H. Peter Anvin6152e4b2008-07-29 17:23:16 -0700734 mask = fx_sw_user.xstate_bv;
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700735
736 err = restore_i387_fxsave(buf, fx_sw_user.xstate_size);
737
H. Peter Anvin6152e4b2008-07-29 17:23:16 -0700738 xsave_hdr->xstate_bv &= pcntxt_mask;
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700739 /*
740 * These bits must be zero.
741 */
742 xsave_hdr->reserved1[0] = xsave_hdr->reserved1[1] = 0;
743
744 /*
745 * Init the state that is not present in the memory layout
746 * and enabled by the OS.
747 */
H. Peter Anvin6152e4b2008-07-29 17:23:16 -0700748 mask = ~(pcntxt_mask & ~mask);
749 xsave_hdr->xstate_bv &= mask;
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700750
751 return err;
752fx_only:
753 /*
754 * Couldn't find the extended state information in the memory
755 * layout. Restore the FP/SSE and init the other extended state
756 * enabled by the OS.
757 */
758 xsave_hdr->xstate_bv = XSTATE_FPSSE;
759 return restore_i387_fxsave(buf, sizeof(struct i387_fxsave_struct));
760}
761
Suresh Siddhaab513702008-07-29 10:29:22 -0700762int restore_i387_xstate_ia32(void __user *buf)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700763{
764 int err;
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700765 struct task_struct *tsk = current;
Suresh Siddhaab513702008-07-29 10:29:22 -0700766 struct _fpstate_ia32 __user *fp = (struct _fpstate_ia32 __user *) buf;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700768 if (HAVE_HWFP)
Suresh Siddhafd3c3ed2008-05-07 12:09:52 -0700769 clear_fpu(tsk);
770
Suresh Siddhaab513702008-07-29 10:29:22 -0700771 if (!buf) {
772 if (used_math()) {
773 clear_fpu(tsk);
774 clear_used_math();
775 }
776
777 return 0;
778 } else
779 if (!access_ok(VERIFY_READ, buf, sig_xstate_ia32_size))
780 return -EACCES;
781
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700782 if (!used_math()) {
783 err = init_fpu(tsk);
784 if (err)
785 return err;
786 }
Suresh Siddhafd3c3ed2008-05-07 12:09:52 -0700787
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700788 if (HAVE_HWFP) {
Suresh Siddhac37b5ef2008-07-29 10:29:25 -0700789 if (cpu_has_xsave)
790 err = restore_i387_xsave(buf);
791 else if (cpu_has_fxsr)
792 err = restore_i387_fxsave(fp, sizeof(struct
793 i387_fxsave_struct));
Ingo Molnarf6689642008-03-05 15:37:32 +0100794 else
Suresh Siddhaab513702008-07-29 10:29:22 -0700795 err = restore_i387_fsave(fp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796 } else {
Roland McGrath44210112008-01-30 13:31:50 +0100797 err = fpregs_soft_set(current, NULL,
798 0, sizeof(struct user_i387_ia32_struct),
Suresh Siddhaab513702008-07-29 10:29:22 -0700799 NULL, fp) != 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700800 }
801 set_used_math();
Ingo Molnarf6689642008-03-05 15:37:32 +0100802
Linus Torvalds1da177e2005-04-16 15:20:36 -0700803 return err;
804}
805
Linus Torvalds1da177e2005-04-16 15:20:36 -0700806/*
807 * FPU state for core dumps.
Roland McGrath60b3b9a2008-01-30 13:31:55 +0100808 * This is only used for a.out dumps now.
809 * It is declared generically using elf_fpregset_t (which is
810 * struct user_i387_struct) but is in fact only used for 32-bit
811 * dumps, so on 64-bit it is really struct user_i387_ia32_struct.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700812 */
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100813int dump_fpu(struct pt_regs *regs, struct user_i387_struct *fpu)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700814{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700815 struct task_struct *tsk = current;
Ingo Molnarf6689642008-03-05 15:37:32 +0100816 int fpvalid;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817
818 fpvalid = !!used_math();
Roland McGrath60b3b9a2008-01-30 13:31:55 +0100819 if (fpvalid)
820 fpvalid = !fpregs_get(tsk, NULL,
821 0, sizeof(struct user_i387_ia32_struct),
822 fpu, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700823
824 return fpvalid;
825}
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700826EXPORT_SYMBOL(dump_fpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700827
Roland McGrath60b3b9a2008-01-30 13:31:55 +0100828#endif /* CONFIG_X86_32 || CONFIG_IA32_EMULATION */