blob: d5dd808144190ffd1d443229b4dbbd56740fface [file] [log] [blame]
/*
 *  Copyright (C) 1994 Linus Torvalds
 *
 *  Pentium III FXSR, SSE support
 *  General FPU state handling cleanups
 *	Gareth Hughes <gareth@valinux.com>, May 2000
 */
Alexey Dobriyan129f6942005-06-23 00:08:33 -07008#include <linux/module.h>
Roland McGrath44210112008-01-30 13:31:50 +01009#include <linux/regset.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010010#include <linux/sched.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090011#include <linux/slab.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010012
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <asm/sigcontext.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010014#include <asm/processor.h>
15#include <asm/math_emu.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <asm/uaccess.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010017#include <asm/ptrace.h>
18#include <asm/i387.h>
Linus Torvalds1361b832012-02-21 13:19:22 -080019#include <asm/fpu-internal.h>
Ingo Molnarf6689642008-03-05 15:37:32 +010020#include <asm/user.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021
Linus Torvalds8546c002012-02-21 10:25:45 -080022/*
23 * Were we in an interrupt that interrupted kernel mode?
24 *
Suresh Siddha304bced2012-08-24 14:13:02 -070025 * On others, we can do a kernel_fpu_begin/end() pair *ONLY* if that
Linus Torvalds8546c002012-02-21 10:25:45 -080026 * pair does nothing at all: the thread must not have fpu (so
27 * that we don't try to save the FPU state), and TS must
28 * be set (so that the clts/stts pair does nothing that is
29 * visible in the interrupted kernel thread).
Pekka Riikonen5187b282013-05-13 14:32:07 +020030 *
31 * Except for the eagerfpu case when we return 1 unless we've already
32 * been eager and saved the state in kernel_fpu_begin().
Linus Torvalds8546c002012-02-21 10:25:45 -080033 */
34static inline bool interrupted_kernel_fpu_idle(void)
35{
Suresh Siddha5d2bd702012-09-06 14:58:52 -070036 if (use_eager_fpu())
Pekka Riikonen5187b282013-05-13 14:32:07 +020037 return __thread_has_fpu(current);
Suresh Siddha304bced2012-08-24 14:13:02 -070038
Linus Torvalds8546c002012-02-21 10:25:45 -080039 return !__thread_has_fpu(current) &&
40 (read_cr0() & X86_CR0_TS);
41}
42
43/*
44 * Were we in user mode (or vm86 mode) when we were
45 * interrupted?
46 *
47 * Doing kernel_fpu_begin/end() is ok if we are running
48 * in an interrupt context from user mode - we'll just
49 * save the FPU state as required.
50 */
51static inline bool interrupted_user_mode(void)
52{
53 struct pt_regs *regs = get_irq_regs();
54 return regs && user_mode_vm(regs);
55}
56
57/*
58 * Can we use the FPU in kernel mode with the
59 * whole "kernel_fpu_begin/end()" sequence?
60 *
61 * It's always ok in process context (ie "not interrupt")
62 * but it is sometimes ok even from an irq.
63 */
64bool irq_fpu_usable(void)
65{
66 return !in_interrupt() ||
67 interrupted_user_mode() ||
68 interrupted_kernel_fpu_idle();
69}
70EXPORT_SYMBOL(irq_fpu_usable);
71
Suresh Siddhab1a74bf2012-09-20 11:01:49 -070072void __kernel_fpu_begin(void)
Linus Torvalds8546c002012-02-21 10:25:45 -080073{
74 struct task_struct *me = current;
75
Linus Torvalds8546c002012-02-21 10:25:45 -080076 if (__thread_has_fpu(me)) {
Linus Torvalds8546c002012-02-21 10:25:45 -080077 __thread_clear_has_fpu(me);
Pekka Riikonen5187b282013-05-13 14:32:07 +020078 __save_init_fpu(me);
Suresh Siddhab1a74bf2012-09-20 11:01:49 -070079 /* We do 'stts()' in __kernel_fpu_end() */
Suresh Siddha5d2bd702012-09-06 14:58:52 -070080 } else if (!use_eager_fpu()) {
Alex Shic6ae41e2012-05-11 15:35:27 +080081 this_cpu_write(fpu_owner_task, NULL);
Linus Torvalds8546c002012-02-21 10:25:45 -080082 clts();
83 }
84}
Suresh Siddhab1a74bf2012-09-20 11:01:49 -070085EXPORT_SYMBOL(__kernel_fpu_begin);
Linus Torvalds8546c002012-02-21 10:25:45 -080086
Suresh Siddhab1a74bf2012-09-20 11:01:49 -070087void __kernel_fpu_end(void)
Linus Torvalds8546c002012-02-21 10:25:45 -080088{
Suresh Siddha731bd6a92014-02-02 22:56:23 -080089 if (use_eager_fpu()) {
90 /*
91 * For eager fpu, most the time, tsk_used_math() is true.
92 * Restore the user math as we are done with the kernel usage.
93 * At few instances during thread exit, signal handling etc,
94 * tsk_used_math() is false. Those few places will take proper
95 * actions, so we don't need to restore the math here.
96 */
97 if (likely(tsk_used_math(current)))
98 math_state_restore();
99 } else {
Suresh Siddha304bced2012-08-24 14:13:02 -0700100 stts();
Suresh Siddha731bd6a92014-02-02 22:56:23 -0800101 }
Linus Torvalds8546c002012-02-21 10:25:45 -0800102}
Suresh Siddhab1a74bf2012-09-20 11:01:49 -0700103EXPORT_SYMBOL(__kernel_fpu_end);
Linus Torvalds8546c002012-02-21 10:25:45 -0800104
105void unlazy_fpu(struct task_struct *tsk)
106{
107 preempt_disable();
108 if (__thread_has_fpu(tsk)) {
109 __save_init_fpu(tsk);
110 __thread_fpu_end(tsk);
111 } else
Vineet Guptac375f152013-11-12 15:08:46 -0800112 tsk->thread.fpu_counter = 0;
Linus Torvalds8546c002012-02-21 10:25:45 -0800113 preempt_enable();
114}
115EXPORT_SYMBOL(unlazy_fpu);
116
Suresh Siddha72a671c2012-07-24 16:05:29 -0700117unsigned int mxcsr_feature_mask __read_mostly = 0xffffffffu;
Suresh Siddha61c46282008-03-10 15:28:04 -0700118unsigned int xstate_size;
Xiaotian Fengf45755b2010-08-13 15:19:11 +0800119EXPORT_SYMBOL_GPL(xstate_size);
Paul Gortmaker148f9bb2013-06-18 18:23:59 -0400120static struct i387_fxsave_struct fx_scratch;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121
Paul Gortmaker148f9bb2013-06-18 18:23:59 -0400122static void mxcsr_feature_mask_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123{
124 unsigned long mask = 0;
Ingo Molnarf6689642008-03-05 15:37:32 +0100125
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126 if (cpu_has_fxsr) {
Suresh Siddha61c46282008-03-10 15:28:04 -0700127 memset(&fx_scratch, 0, sizeof(struct i387_fxsave_struct));
H.J. Lueaa5a992013-07-26 09:11:56 -0700128 asm volatile("fxsave %0" : "+m" (fx_scratch));
Suresh Siddha61c46282008-03-10 15:28:04 -0700129 mask = fx_scratch.mxcsr_mask;
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100130 if (mask == 0)
131 mask = 0x0000ffbf;
132 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133 mxcsr_feature_mask &= mask;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134}
135
Paul Gortmaker148f9bb2013-06-18 18:23:59 -0400136static void init_thread_xstate(void)
Suresh Siddha61c46282008-03-10 15:28:04 -0700137{
Robert Richter0e49bf62010-07-21 19:03:52 +0200138 /*
139 * Note that xstate_size might be overwriten later during
140 * xsave_init().
141 */
142
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200143 if (!cpu_has_fpu) {
Robert Richter1f999ab2010-07-21 19:03:57 +0200144 /*
145 * Disable xsave as we do not support it if i387
146 * emulation is enabled.
147 */
148 setup_clear_cpu_cap(X86_FEATURE_XSAVE);
149 setup_clear_cpu_cap(X86_FEATURE_XSAVEOPT);
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700150 xstate_size = sizeof(struct i387_soft_struct);
151 return;
152 }
153
Suresh Siddha61c46282008-03-10 15:28:04 -0700154 if (cpu_has_fxsr)
155 xstate_size = sizeof(struct i387_fxsave_struct);
Suresh Siddha61c46282008-03-10 15:28:04 -0700156 else
157 xstate_size = sizeof(struct i387_fsave_struct);
Suresh Siddha61c46282008-03-10 15:28:04 -0700158}
159
Roland McGrath44210112008-01-30 13:31:50 +0100160/*
161 * Called at bootup to set up the initial FPU state that is later cloned
162 * into all processes.
163 */
Robert Richter0e49bf62010-07-21 19:03:52 +0200164
Paul Gortmaker148f9bb2013-06-18 18:23:59 -0400165void fpu_init(void)
Roland McGrath44210112008-01-30 13:31:50 +0100166{
Brian Gerst6ac8bac2010-09-03 21:17:09 -0400167 unsigned long cr0;
168 unsigned long cr4_mask = 0;
Ingo Molnarf6689642008-03-05 15:37:32 +0100169
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200170#ifndef CONFIG_MATH_EMULATION
171 if (!cpu_has_fpu) {
172 pr_emerg("No FPU found and no math emulation present\n");
173 pr_emerg("Giving up\n");
174 for (;;)
175 asm volatile("hlt");
176 }
177#endif
Brian Gerst6ac8bac2010-09-03 21:17:09 -0400178 if (cpu_has_fxsr)
179 cr4_mask |= X86_CR4_OSFXSR;
180 if (cpu_has_xmm)
181 cr4_mask |= X86_CR4_OSXMMEXCPT;
182 if (cr4_mask)
183 set_in_cr4(cr4_mask);
Roland McGrath44210112008-01-30 13:31:50 +0100184
Brian Gerst6ac8bac2010-09-03 21:17:09 -0400185 cr0 = read_cr0();
186 cr0 &= ~(X86_CR0_TS|X86_CR0_EM); /* clear TS and EM */
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200187 if (!cpu_has_fpu)
Brian Gerst6ac8bac2010-09-03 21:17:09 -0400188 cr0 |= X86_CR0_EM;
189 write_cr0(cr0);
Roland McGrath44210112008-01-30 13:31:50 +0100190
Fenghua Yu6f5298c2012-11-13 11:32:50 -0800191 /*
192 * init_thread_xstate is only called once to avoid overriding
193 * xstate_size during boot time or during CPU hotplug.
194 */
195 if (xstate_size == 0)
Suresh Siddhadc1e35c2008-07-29 10:29:19 -0700196 init_thread_xstate();
Suresh Siddhadc1e35c2008-07-29 10:29:19 -0700197
Roland McGrath44210112008-01-30 13:31:50 +0100198 mxcsr_feature_mask_init();
Suresh Siddha5d2bd702012-09-06 14:58:52 -0700199 xsave_init();
200 eager_fpu_init();
Roland McGrath44210112008-01-30 13:31:50 +0100201}
Robert Richter0e49bf62010-07-21 19:03:52 +0200202
Sheng Yang5ee481d2010-05-17 17:22:23 +0800203void fpu_finit(struct fpu *fpu)
Avi Kivity86603282010-05-06 11:45:46 +0300204{
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200205 if (!cpu_has_fpu) {
Avi Kivity86603282010-05-06 11:45:46 +0300206 finit_soft_fpu(&fpu->state->soft);
207 return;
208 }
Avi Kivity86603282010-05-06 11:45:46 +0300209
210 if (cpu_has_fxsr) {
Suresh Siddha5d2bd702012-09-06 14:58:52 -0700211 fx_finit(&fpu->state->fxsave);
Avi Kivity86603282010-05-06 11:45:46 +0300212 } else {
213 struct i387_fsave_struct *fp = &fpu->state->fsave;
214 memset(fp, 0, xstate_size);
215 fp->cwd = 0xffff037fu;
216 fp->swd = 0xffff0000u;
217 fp->twd = 0xffffffffu;
218 fp->fos = 0xffff0000u;
219 }
220}
Sheng Yang5ee481d2010-05-17 17:22:23 +0800221EXPORT_SYMBOL_GPL(fpu_finit);
Avi Kivity86603282010-05-06 11:45:46 +0300222
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223/*
224 * The _current_ task is using the FPU for the first time
225 * so initialize it and set the mxcsr to its default
226 * value at reset if we support XMM instructions and then
Lucas De Marchi0d2eb442011-03-17 16:24:16 -0300227 * remember the current task has used the FPU.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 */
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700229int init_fpu(struct task_struct *tsk)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230{
Avi Kivity86603282010-05-06 11:45:46 +0300231 int ret;
232
Roland McGrath44210112008-01-30 13:31:50 +0100233 if (tsk_used_math(tsk)) {
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200234 if (cpu_has_fpu && tsk == current)
Roland McGrath44210112008-01-30 13:31:50 +0100235 unlazy_fpu(tsk);
Oleg Nesterov089f9fb2012-04-16 22:48:15 +0200236 tsk->thread.fpu.last_cpu = ~0;
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700237 return 0;
238 }
239
240 /*
241 * Memory allocation at the first usage of the FPU and other state.
242 */
Avi Kivity86603282010-05-06 11:45:46 +0300243 ret = fpu_alloc(&tsk->thread.fpu);
244 if (ret)
245 return ret;
Roland McGrath44210112008-01-30 13:31:50 +0100246
Avi Kivity86603282010-05-06 11:45:46 +0300247 fpu_finit(&tsk->thread.fpu);
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700248
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 set_stopped_child_used_math(tsk);
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700250 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251}
Avi Kivitye5c30142011-01-11 12:15:54 +0200252EXPORT_SYMBOL_GPL(init_fpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800254/*
255 * The xstateregs_active() routine is the same as the fpregs_active() routine,
256 * as the "regset->n" for the xstate regset will be updated based on the feature
257 * capabilites supported by the xsave.
258 */
Roland McGrath44210112008-01-30 13:31:50 +0100259int fpregs_active(struct task_struct *target, const struct user_regset *regset)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260{
Roland McGrath44210112008-01-30 13:31:50 +0100261 return tsk_used_math(target) ? regset->n : 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262}
Roland McGrath44210112008-01-30 13:31:50 +0100263
264int xfpregs_active(struct task_struct *target, const struct user_regset *regset)
265{
266 return (cpu_has_fxsr && tsk_used_math(target)) ? regset->n : 0;
267}
268
269int xfpregs_get(struct task_struct *target, const struct user_regset *regset,
270 unsigned int pos, unsigned int count,
271 void *kbuf, void __user *ubuf)
272{
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700273 int ret;
274
Roland McGrath44210112008-01-30 13:31:50 +0100275 if (!cpu_has_fxsr)
276 return -ENODEV;
277
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700278 ret = init_fpu(target);
279 if (ret)
280 return ret;
Roland McGrath44210112008-01-30 13:31:50 +0100281
Suresh Siddha29104e12010-07-19 16:05:49 -0700282 sanitize_i387_state(target);
283
Roland McGrath44210112008-01-30 13:31:50 +0100284 return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300285 &target->thread.fpu.state->fxsave, 0, -1);
Roland McGrath44210112008-01-30 13:31:50 +0100286}
287
288int xfpregs_set(struct task_struct *target, const struct user_regset *regset,
289 unsigned int pos, unsigned int count,
290 const void *kbuf, const void __user *ubuf)
291{
292 int ret;
293
294 if (!cpu_has_fxsr)
295 return -ENODEV;
296
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700297 ret = init_fpu(target);
298 if (ret)
299 return ret;
300
Suresh Siddha29104e12010-07-19 16:05:49 -0700301 sanitize_i387_state(target);
302
Roland McGrath44210112008-01-30 13:31:50 +0100303 ret = user_regset_copyin(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300304 &target->thread.fpu.state->fxsave, 0, -1);
Roland McGrath44210112008-01-30 13:31:50 +0100305
306 /*
307 * mxcsr reserved bits must be masked to zero for security reasons.
308 */
Avi Kivity86603282010-05-06 11:45:46 +0300309 target->thread.fpu.state->fxsave.mxcsr &= mxcsr_feature_mask;
Roland McGrath44210112008-01-30 13:31:50 +0100310
Suresh Siddha42deec62008-07-29 10:29:26 -0700311 /*
312 * update the header bits in the xsave header, indicating the
313 * presence of FP and SSE state.
314 */
315 if (cpu_has_xsave)
Avi Kivity86603282010-05-06 11:45:46 +0300316 target->thread.fpu.state->xsave.xsave_hdr.xstate_bv |= XSTATE_FPSSE;
Suresh Siddha42deec62008-07-29 10:29:26 -0700317
Roland McGrath44210112008-01-30 13:31:50 +0100318 return ret;
319}
320
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800321int xstateregs_get(struct task_struct *target, const struct user_regset *regset,
322 unsigned int pos, unsigned int count,
323 void *kbuf, void __user *ubuf)
324{
325 int ret;
326
327 if (!cpu_has_xsave)
328 return -ENODEV;
329
330 ret = init_fpu(target);
331 if (ret)
332 return ret;
333
334 /*
Suresh Siddhaff7fbc72010-02-22 14:51:33 -0800335 * Copy the 48bytes defined by the software first into the xstate
336 * memory layout in the thread struct, so that we can copy the entire
337 * xstateregs to the user using one user_regset_copyout().
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800338 */
Avi Kivity86603282010-05-06 11:45:46 +0300339 memcpy(&target->thread.fpu.state->fxsave.sw_reserved,
Suresh Siddhaff7fbc72010-02-22 14:51:33 -0800340 xstate_fx_sw_bytes, sizeof(xstate_fx_sw_bytes));
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800341
342 /*
Suresh Siddhaff7fbc72010-02-22 14:51:33 -0800343 * Copy the xstate memory layout.
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800344 */
345 ret = user_regset_copyout(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300346 &target->thread.fpu.state->xsave, 0, -1);
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800347 return ret;
348}
349
350int xstateregs_set(struct task_struct *target, const struct user_regset *regset,
351 unsigned int pos, unsigned int count,
352 const void *kbuf, const void __user *ubuf)
353{
354 int ret;
355 struct xsave_hdr_struct *xsave_hdr;
356
357 if (!cpu_has_xsave)
358 return -ENODEV;
359
360 ret = init_fpu(target);
361 if (ret)
362 return ret;
363
364 ret = user_regset_copyin(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300365 &target->thread.fpu.state->xsave, 0, -1);
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800366
367 /*
368 * mxcsr reserved bits must be masked to zero for security reasons.
369 */
Avi Kivity86603282010-05-06 11:45:46 +0300370 target->thread.fpu.state->fxsave.mxcsr &= mxcsr_feature_mask;
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800371
Avi Kivity86603282010-05-06 11:45:46 +0300372 xsave_hdr = &target->thread.fpu.state->xsave.xsave_hdr;
Suresh Siddha5b3efd52010-02-11 11:50:59 -0800373
374 xsave_hdr->xstate_bv &= pcntxt_mask;
375 /*
376 * These bits must be zero.
377 */
378 xsave_hdr->reserved1[0] = xsave_hdr->reserved1[1] = 0;
379
380 return ret;
381}
382
Roland McGrath44210112008-01-30 13:31:50 +0100383#if defined CONFIG_X86_32 || defined CONFIG_IA32_EMULATION
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384
/*
 * FPU tag word conversions.
 */

/*
 * Compress a 16-bit i387 tag word (two bits per register) into the
 * 8-bit FXSR form (one bit per register).
 *
 * Bit N of the result is 1 when register N's two-bit tag is anything
 * other than 11 (empty), and 0 when it is 11.
 */
static inline unsigned short twd_i387_to_fxsr(unsigned short twd)
{
	unsigned int packed = 0; /* to avoid 16 bit prefixes in the code */
	unsigned int reg;

	for (reg = 0; reg < 8; reg++) {
		unsigned int tag = (twd >> (2 * reg)) & 0x3;

		/* Transform each pair of bits into 1 (valid) or 0 (empty) */
		if (tag != 0x3)
			packed |= 1u << reg;
	}

	return packed;
}
403
Phil Carmody497888c2011-07-14 15:07:13 +0300404#define FPREG_ADDR(f, n) ((void *)&(f)->st_space + (n) * 16)
Roland McGrath44210112008-01-30 13:31:50 +0100405#define FP_EXP_TAG_VALID 0
406#define FP_EXP_TAG_ZERO 1
407#define FP_EXP_TAG_SPECIAL 2
408#define FP_EXP_TAG_EMPTY 3
409
410static inline u32 twd_fxsr_to_i387(struct i387_fxsave_struct *fxsave)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411{
Roland McGrath44210112008-01-30 13:31:50 +0100412 struct _fpxreg *st;
413 u32 tos = (fxsave->swd >> 11) & 7;
414 u32 twd = (unsigned long) fxsave->twd;
415 u32 tag;
416 u32 ret = 0xffff0000u;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 int i;
418
Roland McGrath44210112008-01-30 13:31:50 +0100419 for (i = 0; i < 8; i++, twd >>= 1) {
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100420 if (twd & 0x1) {
421 st = FPREG_ADDR(fxsave, (i - tos) & 7);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100423 switch (st->exponent & 0x7fff) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424 case 0x7fff:
Roland McGrath44210112008-01-30 13:31:50 +0100425 tag = FP_EXP_TAG_SPECIAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 break;
427 case 0x0000:
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100428 if (!st->significand[0] &&
429 !st->significand[1] &&
430 !st->significand[2] &&
Roland McGrath44210112008-01-30 13:31:50 +0100431 !st->significand[3])
432 tag = FP_EXP_TAG_ZERO;
433 else
434 tag = FP_EXP_TAG_SPECIAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435 break;
436 default:
Roland McGrath44210112008-01-30 13:31:50 +0100437 if (st->significand[3] & 0x8000)
438 tag = FP_EXP_TAG_VALID;
439 else
440 tag = FP_EXP_TAG_SPECIAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700441 break;
442 }
443 } else {
Roland McGrath44210112008-01-30 13:31:50 +0100444 tag = FP_EXP_TAG_EMPTY;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445 }
Roland McGrath44210112008-01-30 13:31:50 +0100446 ret |= tag << (2 * i);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700447 }
448 return ret;
449}
450
451/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452 * FXSR floating point environment conversions.
453 */
454
Suresh Siddha72a671c2012-07-24 16:05:29 -0700455void
Ingo Molnarf6689642008-03-05 15:37:32 +0100456convert_from_fxsr(struct user_i387_ia32_struct *env, struct task_struct *tsk)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457{
Avi Kivity86603282010-05-06 11:45:46 +0300458 struct i387_fxsave_struct *fxsave = &tsk->thread.fpu.state->fxsave;
Roland McGrath44210112008-01-30 13:31:50 +0100459 struct _fpreg *to = (struct _fpreg *) &env->st_space[0];
460 struct _fpxreg *from = (struct _fpxreg *) &fxsave->st_space[0];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700461 int i;
462
Roland McGrath44210112008-01-30 13:31:50 +0100463 env->cwd = fxsave->cwd | 0xffff0000u;
464 env->swd = fxsave->swd | 0xffff0000u;
465 env->twd = twd_fxsr_to_i387(fxsave);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700466
Roland McGrath44210112008-01-30 13:31:50 +0100467#ifdef CONFIG_X86_64
468 env->fip = fxsave->rip;
469 env->foo = fxsave->rdp;
Brian Gerst10c11f32010-09-03 21:17:13 -0400470 /*
471 * should be actually ds/cs at fpu exception time, but
472 * that information is not available in 64bit mode.
473 */
474 env->fcs = task_pt_regs(tsk)->cs;
Roland McGrath44210112008-01-30 13:31:50 +0100475 if (tsk == current) {
Brian Gerst10c11f32010-09-03 21:17:13 -0400476 savesegment(ds, env->fos);
Roland McGrath44210112008-01-30 13:31:50 +0100477 } else {
Brian Gerst10c11f32010-09-03 21:17:13 -0400478 env->fos = tsk->thread.ds;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700479 }
Brian Gerst10c11f32010-09-03 21:17:13 -0400480 env->fos |= 0xffff0000;
Roland McGrath44210112008-01-30 13:31:50 +0100481#else
482 env->fip = fxsave->fip;
Jan Beulich609b5292008-03-05 08:35:14 +0000483 env->fcs = (u16) fxsave->fcs | ((u32) fxsave->fop << 16);
Roland McGrath44210112008-01-30 13:31:50 +0100484 env->foo = fxsave->foo;
485 env->fos = fxsave->fos;
486#endif
487
488 for (i = 0; i < 8; ++i)
489 memcpy(&to[i], &from[i], sizeof(to[0]));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490}
491
Suresh Siddha72a671c2012-07-24 16:05:29 -0700492void convert_to_fxsr(struct task_struct *tsk,
493 const struct user_i387_ia32_struct *env)
Roland McGrath44210112008-01-30 13:31:50 +0100494
Linus Torvalds1da177e2005-04-16 15:20:36 -0700495{
Avi Kivity86603282010-05-06 11:45:46 +0300496 struct i387_fxsave_struct *fxsave = &tsk->thread.fpu.state->fxsave;
Roland McGrath44210112008-01-30 13:31:50 +0100497 struct _fpreg *from = (struct _fpreg *) &env->st_space[0];
498 struct _fpxreg *to = (struct _fpxreg *) &fxsave->st_space[0];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499 int i;
500
Roland McGrath44210112008-01-30 13:31:50 +0100501 fxsave->cwd = env->cwd;
502 fxsave->swd = env->swd;
503 fxsave->twd = twd_i387_to_fxsr(env->twd);
504 fxsave->fop = (u16) ((u32) env->fcs >> 16);
505#ifdef CONFIG_X86_64
506 fxsave->rip = env->fip;
507 fxsave->rdp = env->foo;
508 /* cs and ds ignored */
509#else
510 fxsave->fip = env->fip;
511 fxsave->fcs = (env->fcs & 0xffff);
512 fxsave->foo = env->foo;
513 fxsave->fos = env->fos;
514#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515
Roland McGrath44210112008-01-30 13:31:50 +0100516 for (i = 0; i < 8; ++i)
517 memcpy(&to[i], &from[i], sizeof(from[0]));
518}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700519
Roland McGrath44210112008-01-30 13:31:50 +0100520int fpregs_get(struct task_struct *target, const struct user_regset *regset,
521 unsigned int pos, unsigned int count,
522 void *kbuf, void __user *ubuf)
523{
524 struct user_i387_ia32_struct env;
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700525 int ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700526
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700527 ret = init_fpu(target);
528 if (ret)
529 return ret;
Roland McGrath44210112008-01-30 13:31:50 +0100530
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200531 if (!static_cpu_has(X86_FEATURE_FPU))
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700532 return fpregs_soft_get(target, regset, pos, count, kbuf, ubuf);
533
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200534 if (!cpu_has_fxsr)
Roland McGrath44210112008-01-30 13:31:50 +0100535 return user_regset_copyout(&pos, &count, &kbuf, &ubuf,
Avi Kivity86603282010-05-06 11:45:46 +0300536 &target->thread.fpu.state->fsave, 0,
Suresh Siddha61c46282008-03-10 15:28:04 -0700537 -1);
Roland McGrath44210112008-01-30 13:31:50 +0100538
Suresh Siddha29104e12010-07-19 16:05:49 -0700539 sanitize_i387_state(target);
540
Roland McGrath44210112008-01-30 13:31:50 +0100541 if (kbuf && pos == 0 && count == sizeof(env)) {
542 convert_from_fxsr(kbuf, target);
543 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544 }
Roland McGrath44210112008-01-30 13:31:50 +0100545
546 convert_from_fxsr(&env, target);
Ingo Molnarf6689642008-03-05 15:37:32 +0100547
Roland McGrath44210112008-01-30 13:31:50 +0100548 return user_regset_copyout(&pos, &count, &kbuf, &ubuf, &env, 0, -1);
549}
550
551int fpregs_set(struct task_struct *target, const struct user_regset *regset,
552 unsigned int pos, unsigned int count,
553 const void *kbuf, const void __user *ubuf)
554{
555 struct user_i387_ia32_struct env;
556 int ret;
557
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700558 ret = init_fpu(target);
559 if (ret)
560 return ret;
561
Suresh Siddha29104e12010-07-19 16:05:49 -0700562 sanitize_i387_state(target);
563
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200564 if (!static_cpu_has(X86_FEATURE_FPU))
Suresh Siddhae8a496a2008-05-23 16:26:37 -0700565 return fpregs_soft_set(target, regset, pos, count, kbuf, ubuf);
566
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200567 if (!cpu_has_fxsr)
Roland McGrath44210112008-01-30 13:31:50 +0100568 return user_regset_copyin(&pos, &count, &kbuf, &ubuf,
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200569 &target->thread.fpu.state->fsave, 0,
570 -1);
Roland McGrath44210112008-01-30 13:31:50 +0100571
572 if (pos > 0 || count < sizeof(env))
573 convert_from_fxsr(&env, target);
574
575 ret = user_regset_copyin(&pos, &count, &kbuf, &ubuf, &env, 0, -1);
576 if (!ret)
577 convert_to_fxsr(target, &env);
578
Suresh Siddha42deec62008-07-29 10:29:26 -0700579 /*
580 * update the header bit in the xsave header, indicating the
581 * presence of FP.
582 */
583 if (cpu_has_xsave)
Avi Kivity86603282010-05-06 11:45:46 +0300584 target->thread.fpu.state->xsave.xsave_hdr.xstate_bv |= XSTATE_FP;
Roland McGrath44210112008-01-30 13:31:50 +0100585 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586}
587
588/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589 * FPU state for core dumps.
Roland McGrath60b3b9a2008-01-30 13:31:55 +0100590 * This is only used for a.out dumps now.
591 * It is declared generically using elf_fpregset_t (which is
592 * struct user_i387_struct) but is in fact only used for 32-bit
593 * dumps, so on 64-bit it is really struct user_i387_ia32_struct.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594 */
Cyrill Gorcunov3b095a02008-01-30 13:31:26 +0100595int dump_fpu(struct pt_regs *regs, struct user_i387_struct *fpu)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597 struct task_struct *tsk = current;
Ingo Molnarf6689642008-03-05 15:37:32 +0100598 int fpvalid;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700599
600 fpvalid = !!used_math();
Roland McGrath60b3b9a2008-01-30 13:31:55 +0100601 if (fpvalid)
602 fpvalid = !fpregs_get(tsk, NULL,
603 0, sizeof(struct user_i387_ia32_struct),
604 fpu, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700605
606 return fpvalid;
607}
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700608EXPORT_SYMBOL(dump_fpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700609
Roland McGrath60b3b9a2008-01-30 13:31:55 +0100610#endif /* CONFIG_X86_32 || CONFIG_IA32_EMULATION */
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200611
612static int __init no_387(char *s)
613{
614 setup_clear_cpu_cap(X86_FEATURE_FPU);
615 return 1;
616}
617
618__setup("no387", no_387);
619
Paul Gortmaker148f9bb2013-06-18 18:23:59 -0400620void fpu_detect(struct cpuinfo_x86 *c)
H. Peter Anvin60e019e2013-04-29 16:04:20 +0200621{
622 unsigned long cr0;
623 u16 fsw, fcw;
624
625 fsw = fcw = 0xffff;
626
627 cr0 = read_cr0();
628 cr0 &= ~(X86_CR0_TS | X86_CR0_EM);
629 write_cr0(cr0);
630
631 asm volatile("fninit ; fnstsw %0 ; fnstcw %1"
632 : "+m" (fsw), "+m" (fcw));
633
634 if (fsw == 0 && (fcw & 0x103f) == 0x003f)
635 set_cpu_cap(c, X86_FEATURE_FPU);
636 else
637 clear_cpu_cap(c, X86_FEATURE_FPU);
638
639 /* The final cr0 value is set in fpu_init() */
640}