commit 1361b83a13d4d92e53fbb6c877528713e118b821
tree   2656beeee7061c7ae08f6078f2f1565ac702be48 /arch
parent 8546c008924d5fd1724fa698eaa92b414bafd50d
author    Linus Torvalds <torvalds@linux-foundation.org>  2012-02-21 16:19:22 -0500
committer H. Peter Anvin <hpa@linux.intel.com>            2012-02-21 17:12:54 -0500
i387: Split up <asm/i387.h> into exported and internal interfaces

While various modules include <asm/i387.h> to get access to things we
actually *intend* for them to use, most of that header file was really
pretty low-level internal stuff that we really don't want to expose to
others.

So split the header file into two: the small exported interfaces remain
in <asm/i387.h>, while the internal definitions that are only used by
core architecture code are now in <asm/fpu-internal.h>.

The guiding principle for this was to expose functions that we export to
modules, and leave them in <asm/i387.h>, while stuff that is used by
task switching or was marked GPL-only is in <asm/fpu-internal.h>.

The fpu-internal.h file could be further split up too, especially since
arch/x86/kvm/ uses some of the remaining stuff for its module. But that
kvm usage should probably be abstracted out a bit, and at least now the
internal FPU accessor functions are much more contained. Even if it
isn't perhaps as contained as it _could_ be.

Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Link: http://lkml.kernel.org/r/alpine.LFD.2.02.1202211340330.5354@i5.linux-foundation.org
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
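As a rough illustration of the boundary this split draws (a sketch, not part of the patch; the module function below is hypothetical), a module sticks to the exported interfaces that stay in <asm/i387.h>:

/* Modules use only the exported API kept in <asm/i387.h>: */
#include <asm/i387.h>

static void hypothetical_module_work(void)
{
	/* Cannot always use the FPU from interrupt context. */
	if (!irq_fpu_usable())
		return;
	kernel_fpu_begin();
	/* ... use FPU/SSE registers here ... */
	kernel_fpu_end();
}

Core architecture code (task switching, signal frames, xsave), by contrast, additionally includes <asm/fpu-internal.h> for internal helpers such as switch_fpu_prepare()/switch_fpu_finish(), as the diff below shows.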
Diffstat (limited to 'arch')
 arch/x86/ia32/ia32_signal.c         |   1
 arch/x86/include/asm/fpu-internal.h | 520
 arch/x86/include/asm/i387.h         | 512
 arch/x86/kernel/cpu/common.c        |   1
 arch/x86/kernel/i387.c              |   3
 arch/x86/kernel/process.c           |   1
 arch/x86/kernel/process_32.c        |   1
 arch/x86/kernel/process_64.c        |   1
 arch/x86/kernel/ptrace.c            |   1
 arch/x86/kernel/signal.c            |   1
 arch/x86/kernel/traps.c             |   1
 arch/x86/kernel/xsave.c             |   1
 arch/x86/kvm/vmx.c                  |   2
 arch/x86/kvm/x86.c                  |   1
 arch/x86/power/cpu.c                |   1
 15 files changed, 540 insertions(+), 508 deletions(-)
diff --git a/arch/x86/ia32/ia32_signal.c b/arch/x86/ia32/ia32_signal.c
index 65577698cab2..5563ba1cf513 100644
--- a/arch/x86/ia32/ia32_signal.c
+++ b/arch/x86/ia32/ia32_signal.c
@@ -24,6 +24,7 @@
 #include <asm/ucontext.h>
 #include <asm/uaccess.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/ptrace.h>
 #include <asm/ia32_unistd.h>
 #include <asm/user32.h>
diff --git a/arch/x86/include/asm/fpu-internal.h b/arch/x86/include/asm/fpu-internal.h
new file mode 100644
index 000000000000..4fa88154e4de
--- /dev/null
+++ b/arch/x86/include/asm/fpu-internal.h
@@ -0,0 +1,520 @@
+/*
+ * Copyright (C) 1994 Linus Torvalds
+ *
+ * Pentium III FXSR, SSE support
+ * General FPU state handling cleanups
+ *	Gareth Hughes <gareth@valinux.com>, May 2000
+ * x86-64 work by Andi Kleen 2002
+ */
+
+#ifndef _FPU_INTERNAL_H
+#define _FPU_INTERNAL_H
+
+#include <linux/kernel_stat.h>
+#include <linux/regset.h>
+#include <linux/slab.h>
+#include <asm/asm.h>
+#include <asm/cpufeature.h>
+#include <asm/processor.h>
+#include <asm/sigcontext.h>
+#include <asm/user.h>
+#include <asm/uaccess.h>
+#include <asm/xsave.h>
+
+extern unsigned int sig_xstate_size;
+extern void fpu_init(void);
+
+DECLARE_PER_CPU(struct task_struct *, fpu_owner_task);
+
+extern user_regset_active_fn fpregs_active, xfpregs_active;
+extern user_regset_get_fn fpregs_get, xfpregs_get, fpregs_soft_get,
+				xstateregs_get;
+extern user_regset_set_fn fpregs_set, xfpregs_set, fpregs_soft_set,
+				 xstateregs_set;
+
+
+/*
+ * xstateregs_active == fpregs_active. Please refer to the comment
+ * at the definition of fpregs_active.
+ */
+#define xstateregs_active	fpregs_active
+
+extern struct _fpx_sw_bytes fx_sw_reserved;
+#ifdef CONFIG_IA32_EMULATION
+extern unsigned int sig_xstate_ia32_size;
+extern struct _fpx_sw_bytes fx_sw_reserved_ia32;
+struct _fpstate_ia32;
+struct _xstate_ia32;
+extern int save_i387_xstate_ia32(void __user *buf);
+extern int restore_i387_xstate_ia32(void __user *buf);
+#endif
+
+#ifdef CONFIG_MATH_EMULATION
+extern void finit_soft_fpu(struct i387_soft_struct *soft);
+#else
+static inline void finit_soft_fpu(struct i387_soft_struct *soft) {}
+#endif
+
+#define X87_FSW_ES (1 << 7)	/* Exception Summary */
+
+static __always_inline __pure bool use_xsaveopt(void)
+{
+	return static_cpu_has(X86_FEATURE_XSAVEOPT);
+}
+
+static __always_inline __pure bool use_xsave(void)
+{
+	return static_cpu_has(X86_FEATURE_XSAVE);
+}
+
+static __always_inline __pure bool use_fxsr(void)
+{
+	return static_cpu_has(X86_FEATURE_FXSR);
+}
+
+extern void __sanitize_i387_state(struct task_struct *);
+
+static inline void sanitize_i387_state(struct task_struct *tsk)
+{
+	if (!use_xsaveopt())
+		return;
+	__sanitize_i387_state(tsk);
+}
+
+#ifdef CONFIG_X86_64
+static inline int fxrstor_checking(struct i387_fxsave_struct *fx)
+{
+	int err;
+
+	/* See comment in fxsave() below. */
+#ifdef CONFIG_AS_FXSAVEQ
+	asm volatile("1: fxrstorq %[fx]\n\t"
+		     "2:\n"
+		     ".section .fixup,\"ax\"\n"
+		     "3: movl $-1,%[err]\n"
+		     "   jmp 2b\n"
+		     ".previous\n"
+		     _ASM_EXTABLE(1b, 3b)
+		     : [err] "=r" (err)
+		     : [fx] "m" (*fx), "0" (0));
+#else
+	asm volatile("1: rex64/fxrstor (%[fx])\n\t"
+		     "2:\n"
+		     ".section .fixup,\"ax\"\n"
+		     "3: movl $-1,%[err]\n"
+		     "   jmp 2b\n"
+		     ".previous\n"
+		     _ASM_EXTABLE(1b, 3b)
+		     : [err] "=r" (err)
+		     : [fx] "R" (fx), "m" (*fx), "0" (0));
+#endif
+	return err;
+}
+
+static inline int fxsave_user(struct i387_fxsave_struct __user *fx)
+{
+	int err;
+
+	/*
+	 * Clear the bytes not touched by the fxsave and reserved
+	 * for the SW usage.
+	 */
+	err = __clear_user(&fx->sw_reserved,
+			   sizeof(struct _fpx_sw_bytes));
+	if (unlikely(err))
+		return -EFAULT;
+
+	/* See comment in fxsave() below. */
+#ifdef CONFIG_AS_FXSAVEQ
+	asm volatile("1: fxsaveq %[fx]\n\t"
+		     "2:\n"
+		     ".section .fixup,\"ax\"\n"
+		     "3: movl $-1,%[err]\n"
+		     "   jmp 2b\n"
+		     ".previous\n"
+		     _ASM_EXTABLE(1b, 3b)
+		     : [err] "=r" (err), [fx] "=m" (*fx)
+		     : "0" (0));
+#else
+	asm volatile("1: rex64/fxsave (%[fx])\n\t"
+		     "2:\n"
+		     ".section .fixup,\"ax\"\n"
+		     "3: movl $-1,%[err]\n"
+		     "   jmp 2b\n"
+		     ".previous\n"
+		     _ASM_EXTABLE(1b, 3b)
+		     : [err] "=r" (err), "=m" (*fx)
+		     : [fx] "R" (fx), "0" (0));
+#endif
+	if (unlikely(err) &&
+	    __clear_user(fx, sizeof(struct i387_fxsave_struct)))
+		err = -EFAULT;
+	/* No need to clear here because the caller clears USED_MATH */
+	return err;
+}
+
+static inline void fpu_fxsave(struct fpu *fpu)
+{
+	/* Using "rex64; fxsave %0" is broken because, if the memory operand
+	   uses any extended registers for addressing, a second REX prefix
+	   will be generated (to the assembler, rex64 followed by semicolon
+	   is a separate instruction), and hence the 64-bitness is lost. */
+
+#ifdef CONFIG_AS_FXSAVEQ
+	/* Using "fxsaveq %0" would be the ideal choice, but is only supported
+	   starting with gas 2.16. */
+	__asm__ __volatile__("fxsaveq %0"
+			     : "=m" (fpu->state->fxsave));
+#else
+	/* Using, as a workaround, the properly prefixed form below isn't
+	   accepted by any binutils version so far released, complaining that
+	   the same type of prefix is used twice if an extended register is
+	   needed for addressing (fix submitted to mainline 2005-11-21).
+	asm volatile("rex64/fxsave %0"
+		     : "=m" (fpu->state->fxsave));
+	   This, however, we can work around by forcing the compiler to select
+	   an addressing mode that doesn't require extended registers. */
+	asm volatile("rex64/fxsave (%[fx])"
+		     : "=m" (fpu->state->fxsave)
+		     : [fx] "R" (&fpu->state->fxsave));
+#endif
+}
+
+#else  /* CONFIG_X86_32 */
+
+/* perform fxrstor iff the processor has extended states, otherwise frstor */
+static inline int fxrstor_checking(struct i387_fxsave_struct *fx)
+{
+	/*
+	 * The "nop" is needed to make the instructions the same
+	 * length.
+	 */
+	alternative_input(
+		"nop ; frstor %1",
+		"fxrstor %1",
+		X86_FEATURE_FXSR,
+		"m" (*fx));
+
+	return 0;
+}
+
+static inline void fpu_fxsave(struct fpu *fpu)
+{
+	asm volatile("fxsave %[fx]"
+		     : [fx] "=m" (fpu->state->fxsave));
+}
+
+#endif	/* CONFIG_X86_64 */
+
+/*
+ * These must be called with preempt disabled. Returns
+ * 'true' if the FPU state is still intact.
+ */
+static inline int fpu_save_init(struct fpu *fpu)
+{
+	if (use_xsave()) {
+		fpu_xsave(fpu);
+
+		/*
+		 * xsave header may indicate the init state of the FP.
+		 */
+		if (!(fpu->state->xsave.xsave_hdr.xstate_bv & XSTATE_FP))
+			return 1;
+	} else if (use_fxsr()) {
+		fpu_fxsave(fpu);
+	} else {
+		asm volatile("fnsave %[fx]; fwait"
+			     : [fx] "=m" (fpu->state->fsave));
+		return 0;
+	}
+
+	/*
+	 * If exceptions are pending, we need to clear them so
+	 * that we don't randomly get exceptions later.
+	 *
+	 * FIXME! Is this perhaps only true for the old-style
+	 * irq13 case? Maybe we could leave the x87 state
+	 * intact otherwise?
+	 */
+	if (unlikely(fpu->state->fxsave.swd & X87_FSW_ES)) {
+		asm volatile("fnclex");
+		return 0;
+	}
+	return 1;
+}
+
+static inline int __save_init_fpu(struct task_struct *tsk)
+{
+	return fpu_save_init(&tsk->thread.fpu);
+}
+
+static inline int fpu_fxrstor_checking(struct fpu *fpu)
+{
+	return fxrstor_checking(&fpu->state->fxsave);
+}
+
+static inline int fpu_restore_checking(struct fpu *fpu)
+{
+	if (use_xsave())
+		return fpu_xrstor_checking(fpu);
+	else
+		return fpu_fxrstor_checking(fpu);
+}
+
+static inline int restore_fpu_checking(struct task_struct *tsk)
+{
+	/* AMD K7/K8 CPUs don't save/restore FDP/FIP/FOP unless an exception
+	   is pending. Clear the x87 state here by setting it to fixed
+	   values. "m" is a random variable that should be in L1 */
+	alternative_input(
+		ASM_NOP8 ASM_NOP2,
+		"emms\n\t"	  /* clear stack tags */
+		"fildl %P[addr]", /* set F?P to defined value */
+		X86_FEATURE_FXSAVE_LEAK,
+		[addr] "m" (tsk->thread.fpu.has_fpu));
+
+	return fpu_restore_checking(&tsk->thread.fpu);
+}
+
+/*
+ * Software FPU state helpers. Careful: these need to
+ * be preemption protection *and* they need to be
+ * properly paired with the CR0.TS changes!
+ */
+static inline int __thread_has_fpu(struct task_struct *tsk)
+{
+	return tsk->thread.fpu.has_fpu;
+}
+
+/* Must be paired with an 'stts' after! */
+static inline void __thread_clear_has_fpu(struct task_struct *tsk)
+{
+	tsk->thread.fpu.has_fpu = 0;
+	percpu_write(fpu_owner_task, NULL);
+}
+
+/* Must be paired with a 'clts' before! */
+static inline void __thread_set_has_fpu(struct task_struct *tsk)
+{
+	tsk->thread.fpu.has_fpu = 1;
+	percpu_write(fpu_owner_task, tsk);
+}
+
+/*
+ * Encapsulate the CR0.TS handling together with the
+ * software flag.
+ *
+ * These generally need preemption protection to work,
+ * do try to avoid using these on their own.
+ */
+static inline void __thread_fpu_end(struct task_struct *tsk)
+{
+	__thread_clear_has_fpu(tsk);
+	stts();
+}
+
+static inline void __thread_fpu_begin(struct task_struct *tsk)
+{
+	clts();
+	__thread_set_has_fpu(tsk);
+}
+
+/*
+ * FPU state switching for scheduling.
+ *
+ * This is a two-stage process:
+ *
+ *  - switch_fpu_prepare() saves the old state and
+ *    sets the new state of the CR0.TS bit. This is
+ *    done within the context of the old process.
+ *
+ *  - switch_fpu_finish() restores the new state as
+ *    necessary.
+ */
+typedef struct { int preload; } fpu_switch_t;
+
+/*
+ * FIXME! We could do a totally lazy restore, but we need to
+ * add a per-cpu "this was the task that last touched the FPU
+ * on this CPU" variable, and the task needs to have a "I last
+ * touched the FPU on this CPU" and check them.
+ *
+ * We don't do that yet, so "fpu_lazy_restore()" always returns
+ * false, but some day..
+ */
+static inline int fpu_lazy_restore(struct task_struct *new, unsigned int cpu)
+{
+	return new == percpu_read_stable(fpu_owner_task) &&
+		cpu == new->thread.fpu.last_cpu;
+}
+
+static inline fpu_switch_t switch_fpu_prepare(struct task_struct *old, struct task_struct *new, int cpu)
+{
+	fpu_switch_t fpu;
+
+	fpu.preload = tsk_used_math(new) && new->fpu_counter > 5;
+	if (__thread_has_fpu(old)) {
+		if (!__save_init_fpu(old))
+			cpu = ~0;
+		old->thread.fpu.last_cpu = cpu;
+		old->thread.fpu.has_fpu = 0;	/* But leave fpu_owner_task! */
+
+		/* Don't change CR0.TS if we just switch! */
+		if (fpu.preload) {
+			new->fpu_counter++;
+			__thread_set_has_fpu(new);
+			prefetch(new->thread.fpu.state);
+		} else
+			stts();
+	} else {
+		old->fpu_counter = 0;
+		old->thread.fpu.last_cpu = ~0;
+		if (fpu.preload) {
+			new->fpu_counter++;
+			if (fpu_lazy_restore(new, cpu))
+				fpu.preload = 0;
+			else
+				prefetch(new->thread.fpu.state);
+			__thread_fpu_begin(new);
+		}
+	}
+	return fpu;
+}
+
+/*
+ * By the time this gets called, we've already cleared CR0.TS and
+ * given the process the FPU if we are going to preload the FPU
+ * state - all we need to do is to conditionally restore the register
+ * state itself.
+ */
+static inline void switch_fpu_finish(struct task_struct *new, fpu_switch_t fpu)
+{
+	if (fpu.preload) {
+		if (unlikely(restore_fpu_checking(new)))
+			__thread_fpu_end(new);
+	}
+}
+
+/*
+ * Signal frame handlers...
+ */
+extern int save_i387_xstate(void __user *buf);
+extern int restore_i387_xstate(void __user *buf);
+
+static inline void __clear_fpu(struct task_struct *tsk)
+{
+	if (__thread_has_fpu(tsk)) {
+		/* Ignore delayed exceptions from user space */
+		asm volatile("1: fwait\n"
+			     "2:\n"
+			     _ASM_EXTABLE(1b, 2b));
+		__thread_fpu_end(tsk);
+	}
+}
+
+/*
+ * The actual user_fpu_begin/end() functions
+ * need to be preemption-safe.
+ *
+ * NOTE! user_fpu_end() must be used only after you
+ * have saved the FP state, and user_fpu_begin() must
+ * be used only immediately before restoring it.
+ * These functions do not do any save/restore on
+ * their own.
+ */
+static inline void user_fpu_end(void)
+{
+	preempt_disable();
+	__thread_fpu_end(current);
+	preempt_enable();
+}
+
+static inline void user_fpu_begin(void)
+{
+	preempt_disable();
+	if (!user_has_fpu())
+		__thread_fpu_begin(current);
+	preempt_enable();
+}
+
+/*
+ * These disable preemption on their own and are safe
+ */
+static inline void save_init_fpu(struct task_struct *tsk)
+{
+	WARN_ON_ONCE(!__thread_has_fpu(tsk));
+	preempt_disable();
+	__save_init_fpu(tsk);
+	__thread_fpu_end(tsk);
+	preempt_enable();
+}
+
+static inline void clear_fpu(struct task_struct *tsk)
+{
+	preempt_disable();
+	__clear_fpu(tsk);
+	preempt_enable();
+}
+
+/*
+ * i387 state interaction
+ */
+static inline unsigned short get_fpu_cwd(struct task_struct *tsk)
+{
+	if (cpu_has_fxsr) {
+		return tsk->thread.fpu.state->fxsave.cwd;
+	} else {
+		return (unsigned short)tsk->thread.fpu.state->fsave.cwd;
+	}
+}
+
+static inline unsigned short get_fpu_swd(struct task_struct *tsk)
+{
+	if (cpu_has_fxsr) {
+		return tsk->thread.fpu.state->fxsave.swd;
+	} else {
+		return (unsigned short)tsk->thread.fpu.state->fsave.swd;
+	}
+}
+
+static inline unsigned short get_fpu_mxcsr(struct task_struct *tsk)
+{
+	if (cpu_has_xmm) {
+		return tsk->thread.fpu.state->fxsave.mxcsr;
+	} else {
+		return MXCSR_DEFAULT;
+	}
+}
+
+static bool fpu_allocated(struct fpu *fpu)
+{
+	return fpu->state != NULL;
+}
+
+static inline int fpu_alloc(struct fpu *fpu)
+{
+	if (fpu_allocated(fpu))
+		return 0;
+	fpu->state = kmem_cache_alloc(task_xstate_cachep, GFP_KERNEL);
+	if (!fpu->state)
+		return -ENOMEM;
+	WARN_ON((unsigned long)fpu->state & 15);
+	return 0;
+}
+
+static inline void fpu_free(struct fpu *fpu)
+{
+	if (fpu->state) {
+		kmem_cache_free(task_xstate_cachep, fpu->state);
+		fpu->state = NULL;
+	}
+}
+
+static inline void fpu_copy(struct fpu *dst, struct fpu *src)
+{
+	memcpy(dst->state, src->state, xstate_size);
+}
+
+extern void fpu_finit(struct fpu *fpu);
+
+#endif
diff --git a/arch/x86/include/asm/i387.h b/arch/x86/include/asm/i387.h
index 0c1031d354f2..7ce0798b1b26 100644
--- a/arch/x86/include/asm/i387.h
+++ b/arch/x86/include/asm/i387.h
@@ -13,411 +13,15 @@
 #ifndef __ASSEMBLY__
 
 #include <linux/sched.h>
-#include <linux/kernel_stat.h>
-#include <linux/regset.h>
 #include <linux/hardirq.h>
-#include <linux/slab.h>
-#include <asm/asm.h>
-#include <asm/cpufeature.h>
-#include <asm/processor.h>
-#include <asm/sigcontext.h>
-#include <asm/user.h>
-#include <asm/uaccess.h>
-#include <asm/xsave.h>
+#include <asm/system.h>
+
+struct pt_regs;
+struct user_i387_struct;
 
-extern unsigned int sig_xstate_size;
-extern void fpu_init(void);
-extern void mxcsr_feature_mask_init(void);
 extern int init_fpu(struct task_struct *child);
-extern void math_state_restore(void);
 extern int dump_fpu(struct pt_regs *, struct user_i387_struct *);
-
-DECLARE_PER_CPU(struct task_struct *, fpu_owner_task);
-
-extern user_regset_active_fn fpregs_active, xfpregs_active;
-extern user_regset_get_fn fpregs_get, xfpregs_get, fpregs_soft_get,
-				xstateregs_get;
-extern user_regset_set_fn fpregs_set, xfpregs_set, fpregs_soft_set,
-				 xstateregs_set;
-
-/*
- * xstateregs_active == fpregs_active. Please refer to the comment
- * at the definition of fpregs_active.
- */
-#define xstateregs_active	fpregs_active
-
-extern struct _fpx_sw_bytes fx_sw_reserved;
-#ifdef CONFIG_IA32_EMULATION
-extern unsigned int sig_xstate_ia32_size;
-extern struct _fpx_sw_bytes fx_sw_reserved_ia32;
-struct _fpstate_ia32;
-struct _xstate_ia32;
-extern int save_i387_xstate_ia32(void __user *buf);
-extern int restore_i387_xstate_ia32(void __user *buf);
-#endif
-
-#ifdef CONFIG_MATH_EMULATION
-extern void finit_soft_fpu(struct i387_soft_struct *soft);
-#else
-static inline void finit_soft_fpu(struct i387_soft_struct *soft) {}
-#endif
-
-#define X87_FSW_ES (1 << 7)	/* Exception Summary */
-
-static __always_inline __pure bool use_xsaveopt(void)
-{
-	return static_cpu_has(X86_FEATURE_XSAVEOPT);
-}
-
-static __always_inline __pure bool use_xsave(void)
-{
-	return static_cpu_has(X86_FEATURE_XSAVE);
-}
-
-static __always_inline __pure bool use_fxsr(void)
-{
-	return static_cpu_has(X86_FEATURE_FXSR);
-}
-
-extern void __sanitize_i387_state(struct task_struct *);
-
-static inline void sanitize_i387_state(struct task_struct *tsk)
-{
-	if (!use_xsaveopt())
-		return;
-	__sanitize_i387_state(tsk);
-}
-
-#ifdef CONFIG_X86_64
-static inline int fxrstor_checking(struct i387_fxsave_struct *fx)
-{
-	int err;
-
-	/* See comment in fxsave() below. */
-#ifdef CONFIG_AS_FXSAVEQ
-	asm volatile("1: fxrstorq %[fx]\n\t"
-		     "2:\n"
-		     ".section .fixup,\"ax\"\n"
-		     "3: movl $-1,%[err]\n"
-		     "   jmp 2b\n"
-		     ".previous\n"
-		     _ASM_EXTABLE(1b, 3b)
-		     : [err] "=r" (err)
-		     : [fx] "m" (*fx), "0" (0));
-#else
-	asm volatile("1: rex64/fxrstor (%[fx])\n\t"
-		     "2:\n"
-		     ".section .fixup,\"ax\"\n"
-		     "3: movl $-1,%[err]\n"
-		     "   jmp 2b\n"
-		     ".previous\n"
-		     _ASM_EXTABLE(1b, 3b)
-		     : [err] "=r" (err)
-		     : [fx] "R" (fx), "m" (*fx), "0" (0));
-#endif
-	return err;
-}
-
-static inline int fxsave_user(struct i387_fxsave_struct __user *fx)
-{
-	int err;
-
-	/*
-	 * Clear the bytes not touched by the fxsave and reserved
-	 * for the SW usage.
-	 */
-	err = __clear_user(&fx->sw_reserved,
-			   sizeof(struct _fpx_sw_bytes));
-	if (unlikely(err))
-		return -EFAULT;
-
-	/* See comment in fxsave() below. */
-#ifdef CONFIG_AS_FXSAVEQ
-	asm volatile("1: fxsaveq %[fx]\n\t"
-		     "2:\n"
-		     ".section .fixup,\"ax\"\n"
-		     "3: movl $-1,%[err]\n"
-		     "   jmp 2b\n"
-		     ".previous\n"
-		     _ASM_EXTABLE(1b, 3b)
-		     : [err] "=r" (err), [fx] "=m" (*fx)
-		     : "0" (0));
-#else
-	asm volatile("1: rex64/fxsave (%[fx])\n\t"
-		     "2:\n"
-		     ".section .fixup,\"ax\"\n"
-		     "3: movl $-1,%[err]\n"
-		     "   jmp 2b\n"
-		     ".previous\n"
-		     _ASM_EXTABLE(1b, 3b)
-		     : [err] "=r" (err), "=m" (*fx)
-		     : [fx] "R" (fx), "0" (0));
-#endif
-	if (unlikely(err) &&
-	    __clear_user(fx, sizeof(struct i387_fxsave_struct)))
-		err = -EFAULT;
-	/* No need to clear here because the caller clears USED_MATH */
-	return err;
-}
-
-static inline void fpu_fxsave(struct fpu *fpu)
-{
-	/* Using "rex64; fxsave %0" is broken because, if the memory operand
-	   uses any extended registers for addressing, a second REX prefix
-	   will be generated (to the assembler, rex64 followed by semicolon
-	   is a separate instruction), and hence the 64-bitness is lost. */
-
-#ifdef CONFIG_AS_FXSAVEQ
-	/* Using "fxsaveq %0" would be the ideal choice, but is only supported
-	   starting with gas 2.16. */
-	__asm__ __volatile__("fxsaveq %0"
-			     : "=m" (fpu->state->fxsave));
-#else
-	/* Using, as a workaround, the properly prefixed form below isn't
-	   accepted by any binutils version so far released, complaining that
-	   the same type of prefix is used twice if an extended register is
-	   needed for addressing (fix submitted to mainline 2005-11-21).
-	asm volatile("rex64/fxsave %0"
-		     : "=m" (fpu->state->fxsave));
-	   This, however, we can work around by forcing the compiler to select
-	   an addressing mode that doesn't require extended registers. */
-	asm volatile("rex64/fxsave (%[fx])"
-		     : "=m" (fpu->state->fxsave)
-		     : [fx] "R" (&fpu->state->fxsave));
-#endif
-}
-
-#else  /* CONFIG_X86_32 */
-
-/* perform fxrstor iff the processor has extended states, otherwise frstor */
-static inline int fxrstor_checking(struct i387_fxsave_struct *fx)
-{
-	/*
-	 * The "nop" is needed to make the instructions the same
-	 * length.
-	 */
-	alternative_input(
-		"nop ; frstor %1",
-		"fxrstor %1",
-		X86_FEATURE_FXSR,
-		"m" (*fx));
-
-	return 0;
-}
-
-static inline void fpu_fxsave(struct fpu *fpu)
-{
-	asm volatile("fxsave %[fx]"
-		     : [fx] "=m" (fpu->state->fxsave));
-}
-
-#endif	/* CONFIG_X86_64 */
-
-/*
- * These must be called with preempt disabled. Returns
- * 'true' if the FPU state is still intact.
- */
-static inline int fpu_save_init(struct fpu *fpu)
-{
-	if (use_xsave()) {
-		fpu_xsave(fpu);
-
-		/*
-		 * xsave header may indicate the init state of the FP.
-		 */
-		if (!(fpu->state->xsave.xsave_hdr.xstate_bv & XSTATE_FP))
-			return 1;
-	} else if (use_fxsr()) {
-		fpu_fxsave(fpu);
-	} else {
-		asm volatile("fnsave %[fx]; fwait"
-			     : [fx] "=m" (fpu->state->fsave));
-		return 0;
-	}
-
-	/*
-	 * If exceptions are pending, we need to clear them so
-	 * that we don't randomly get exceptions later.
-	 *
-	 * FIXME! Is this perhaps only true for the old-style
-	 * irq13 case? Maybe we could leave the x87 state
-	 * intact otherwise?
-	 */
-	if (unlikely(fpu->state->fxsave.swd & X87_FSW_ES)) {
-		asm volatile("fnclex");
-		return 0;
-	}
-	return 1;
-}
-
-static inline int __save_init_fpu(struct task_struct *tsk)
-{
-	return fpu_save_init(&tsk->thread.fpu);
-}
-
-static inline int fpu_fxrstor_checking(struct fpu *fpu)
-{
-	return fxrstor_checking(&fpu->state->fxsave);
-}
-
-static inline int fpu_restore_checking(struct fpu *fpu)
-{
-	if (use_xsave())
-		return fpu_xrstor_checking(fpu);
-	else
-		return fpu_fxrstor_checking(fpu);
-}
-
-static inline int restore_fpu_checking(struct task_struct *tsk)
-{
-	/* AMD K7/K8 CPUs don't save/restore FDP/FIP/FOP unless an exception
-	   is pending. Clear the x87 state here by setting it to fixed
-	   values. "m" is a random variable that should be in L1 */
-	alternative_input(
-		ASM_NOP8 ASM_NOP2,
-		"emms\n\t"	  /* clear stack tags */
-		"fildl %P[addr]", /* set F?P to defined value */
-		X86_FEATURE_FXSAVE_LEAK,
-		[addr] "m" (tsk->thread.fpu.has_fpu));
-
-	return fpu_restore_checking(&tsk->thread.fpu);
-}
-
-/*
- * Software FPU state helpers. Careful: these need to
- * be preemption protection *and* they need to be
- * properly paired with the CR0.TS changes!
- */
-static inline int __thread_has_fpu(struct task_struct *tsk)
-{
-	return tsk->thread.fpu.has_fpu;
-}
-
-/* Must be paired with an 'stts' after! */
-static inline void __thread_clear_has_fpu(struct task_struct *tsk)
-{
-	tsk->thread.fpu.has_fpu = 0;
-	percpu_write(fpu_owner_task, NULL);
-}
-
-/* Must be paired with a 'clts' before! */
-static inline void __thread_set_has_fpu(struct task_struct *tsk)
-{
-	tsk->thread.fpu.has_fpu = 1;
-	percpu_write(fpu_owner_task, tsk);
-}
-
-/*
- * Encapsulate the CR0.TS handling together with the
- * software flag.
- *
- * These generally need preemption protection to work,
- * do try to avoid using these on their own.
- */
-static inline void __thread_fpu_end(struct task_struct *tsk)
-{
-	__thread_clear_has_fpu(tsk);
-	stts();
-}
-
-static inline void __thread_fpu_begin(struct task_struct *tsk)
-{
-	clts();
-	__thread_set_has_fpu(tsk);
-}
-
-/*
- * FPU state switching for scheduling.
- *
- * This is a two-stage process:
- *
- *  - switch_fpu_prepare() saves the old state and
- *    sets the new state of the CR0.TS bit. This is
- *    done within the context of the old process.
- *
- *  - switch_fpu_finish() restores the new state as
- *    necessary.
- */
-typedef struct { int preload; } fpu_switch_t;
-
-/*
- * FIXME! We could do a totally lazy restore, but we need to
- * add a per-cpu "this was the task that last touched the FPU
- * on this CPU" variable, and the task needs to have a "I last
- * touched the FPU on this CPU" and check them.
- *
- * We don't do that yet, so "fpu_lazy_restore()" always returns
- * false, but some day..
- */
-static inline int fpu_lazy_restore(struct task_struct *new, unsigned int cpu)
-{
-	return new == percpu_read_stable(fpu_owner_task) &&
-		cpu == new->thread.fpu.last_cpu;
-}
-
-static inline fpu_switch_t switch_fpu_prepare(struct task_struct *old, struct task_struct *new, int cpu)
-{
-	fpu_switch_t fpu;
-
-	fpu.preload = tsk_used_math(new) && new->fpu_counter > 5;
-	if (__thread_has_fpu(old)) {
-		if (!__save_init_fpu(old))
-			cpu = ~0;
-		old->thread.fpu.last_cpu = cpu;
-		old->thread.fpu.has_fpu = 0;	/* But leave fpu_owner_task! */
-
-		/* Don't change CR0.TS if we just switch! */
-		if (fpu.preload) {
-			new->fpu_counter++;
-			__thread_set_has_fpu(new);
-			prefetch(new->thread.fpu.state);
-		} else
-			stts();
-	} else {
-		old->fpu_counter = 0;
-		old->thread.fpu.last_cpu = ~0;
-		if (fpu.preload) {
-			new->fpu_counter++;
-			if (fpu_lazy_restore(new, cpu))
-				fpu.preload = 0;
-			else
-				prefetch(new->thread.fpu.state);
-			__thread_fpu_begin(new);
-		}
-	}
-	return fpu;
-}
-
-/*
- * By the time this gets called, we've already cleared CR0.TS and
- * given the process the FPU if we are going to preload the FPU
- * state - all we need to do is to conditionally restore the register
- * state itself.
- */
-static inline void switch_fpu_finish(struct task_struct *new, fpu_switch_t fpu)
-{
-	if (fpu.preload) {
-		if (unlikely(restore_fpu_checking(new)))
-			__thread_fpu_end(new);
-	}
-}
-
-/*
- * Signal frame handlers...
- */
-extern int save_i387_xstate(void __user *buf);
-extern int restore_i387_xstate(void __user *buf);
-
-static inline void __clear_fpu(struct task_struct *tsk)
-{
-	if (__thread_has_fpu(tsk)) {
-		/* Ignore delayed exceptions from user space */
-		asm volatile("1: fwait\n"
-			     "2:\n"
-			     _ASM_EXTABLE(1b, 2b));
-		__thread_fpu_end(tsk);
-	}
-}
+extern void math_state_restore(void);
 
 extern bool irq_fpu_usable(void);
 extern void kernel_fpu_begin(void);
@@ -463,118 +67,14 @@ static inline void irq_ts_restore(int TS_state)
  * we can just assume we have FPU access - typically
  * to save the FP state - we'll just take a #NM
  * fault and get the FPU access back.
- *
- * The actual user_fpu_begin/end() functions
- * need to be preemption-safe, though.
- *
- * NOTE! user_fpu_end() must be used only after you
- * have saved the FP state, and user_fpu_begin() must
- * be used only immediately before restoring it.
- * These functions do not do any save/restore on
- * their own.
  */
 static inline int user_has_fpu(void)
 {
-	return __thread_has_fpu(current);
-}
-
-static inline void user_fpu_end(void)
-{
-	preempt_disable();
-	__thread_fpu_end(current);
-	preempt_enable();
-}
-
-static inline void user_fpu_begin(void)
-{
-	preempt_disable();
-	if (!user_has_fpu())
-		__thread_fpu_begin(current);
-	preempt_enable();
-}
-
-/*
- * These disable preemption on their own and are safe
- */
-static inline void save_init_fpu(struct task_struct *tsk)
-{
-	WARN_ON_ONCE(!__thread_has_fpu(tsk));
-	preempt_disable();
-	__save_init_fpu(tsk);
-	__thread_fpu_end(tsk);
-	preempt_enable();
+	return current->thread.fpu.has_fpu;
 }
 
 extern void unlazy_fpu(struct task_struct *tsk);
 
-static inline void clear_fpu(struct task_struct *tsk)
-{
-	preempt_disable();
-	__clear_fpu(tsk);
-	preempt_enable();
-}
-
-/*
- * i387 state interaction
- */
-static inline unsigned short get_fpu_cwd(struct task_struct *tsk)
-{
-	if (cpu_has_fxsr) {
-		return tsk->thread.fpu.state->fxsave.cwd;
-	} else {
-		return (unsigned short)tsk->thread.fpu.state->fsave.cwd;
-	}
-}
-
-static inline unsigned short get_fpu_swd(struct task_struct *tsk)
-{
-	if (cpu_has_fxsr) {
-		return tsk->thread.fpu.state->fxsave.swd;
-	} else {
-		return (unsigned short)tsk->thread.fpu.state->fsave.swd;
-	}
-}
-
-static inline unsigned short get_fpu_mxcsr(struct task_struct *tsk)
-{
-	if (cpu_has_xmm) {
-		return tsk->thread.fpu.state->fxsave.mxcsr;
-	} else {
-		return MXCSR_DEFAULT;
-	}
-}
-
-static bool fpu_allocated(struct fpu *fpu)
-{
-	return fpu->state != NULL;
-}
-
-static inline int fpu_alloc(struct fpu *fpu)
-{
-	if (fpu_allocated(fpu))
-		return 0;
-	fpu->state = kmem_cache_alloc(task_xstate_cachep, GFP_KERNEL);
-	if (!fpu->state)
-		return -ENOMEM;
-	WARN_ON((unsigned long)fpu->state & 15);
-	return 0;
-}
-
-static inline void fpu_free(struct fpu *fpu)
-{
-	if (fpu->state) {
-		kmem_cache_free(task_xstate_cachep, fpu->state);
-		fpu->state = NULL;
-	}
-}
-
-static inline void fpu_copy(struct fpu *dst, struct fpu *src)
-{
-	memcpy(dst->state, src->state, xstate_size);
-}
-
-extern void fpu_finit(struct fpu *fpu);
-
 #endif /* __ASSEMBLY__ */
 
 #endif /* _ASM_X86_I387_H */
diff --git a/arch/x86/kernel/cpu/common.c b/arch/x86/kernel/cpu/common.c
index cb71b01ab66e..89620b1725d4 100644
--- a/arch/x86/kernel/cpu/common.c
+++ b/arch/x86/kernel/cpu/common.c
@@ -28,6 +28,7 @@
 #include <asm/apic.h>
 #include <asm/desc.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/mtrr.h>
 #include <linux/numa.h>
 #include <asm/asm.h>
diff --git a/arch/x86/kernel/i387.c b/arch/x86/kernel/i387.c
index 17b7549c4134..7734bcbb5a3a 100644
--- a/arch/x86/kernel/i387.c
+++ b/arch/x86/kernel/i387.c
@@ -16,6 +16,7 @@
 #include <asm/uaccess.h>
 #include <asm/ptrace.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/user.h>
 
 #ifdef CONFIG_X86_64
@@ -124,7 +125,7 @@ EXPORT_SYMBOL_GPL(xstate_size);
 unsigned int sig_xstate_ia32_size = sizeof(struct _fpstate_ia32);
 static struct i387_fxsave_struct fx_scratch __cpuinitdata;
 
-void __cpuinit mxcsr_feature_mask_init(void)
+static void __cpuinit mxcsr_feature_mask_init(void)
 {
 	unsigned long mask = 0;
 
diff --git a/arch/x86/kernel/process.c b/arch/x86/kernel/process.c
index 15763af7bfe3..c38d84e01022 100644
--- a/arch/x86/kernel/process.c
+++ b/arch/x86/kernel/process.c
@@ -21,6 +21,7 @@
 #include <asm/idle.h>
 #include <asm/uaccess.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/debugreg.h>
 
 struct kmem_cache *task_xstate_cachep;
diff --git a/arch/x86/kernel/process_32.c b/arch/x86/kernel/process_32.c
index c08d1ff12b7c..ee32dee7a0a3 100644
--- a/arch/x86/kernel/process_32.c
+++ b/arch/x86/kernel/process_32.c
@@ -45,6 +45,7 @@
 #include <asm/ldt.h>
 #include <asm/processor.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/desc.h>
 #ifdef CONFIG_MATH_EMULATION
 #include <asm/math_emu.h>
diff --git a/arch/x86/kernel/process_64.c b/arch/x86/kernel/process_64.c
index cfa5c90c01db..5bad3c71e48f 100644
--- a/arch/x86/kernel/process_64.c
+++ b/arch/x86/kernel/process_64.c
@@ -43,6 +43,7 @@
 #include <asm/system.h>
 #include <asm/processor.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/mmu_context.h>
 #include <asm/prctl.h>
 #include <asm/desc.h>
diff --git a/arch/x86/kernel/ptrace.c b/arch/x86/kernel/ptrace.c
index 50267386b766..78f05e438be5 100644
--- a/arch/x86/kernel/ptrace.c
+++ b/arch/x86/kernel/ptrace.c
@@ -27,6 +27,7 @@
 #include <asm/system.h>
 #include <asm/processor.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/debugreg.h>
 #include <asm/ldt.h>
 #include <asm/desc.h>
diff --git a/arch/x86/kernel/signal.c b/arch/x86/kernel/signal.c
index 46a01bdc27e2..25edcfc9ba5b 100644
--- a/arch/x86/kernel/signal.c
+++ b/arch/x86/kernel/signal.c
@@ -24,6 +24,7 @@
 #include <asm/processor.h>
 #include <asm/ucontext.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/vdso.h>
 #include <asm/mce.h>
 
diff --git a/arch/x86/kernel/traps.c b/arch/x86/kernel/traps.c
index 4bbe04d96744..ec61d4c1b93b 100644
--- a/arch/x86/kernel/traps.c
+++ b/arch/x86/kernel/traps.c
@@ -54,6 +54,7 @@
 #include <asm/traps.h>
 #include <asm/desc.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #include <asm/mce.h>
 
 #include <asm/mach_traps.h>
diff --git a/arch/x86/kernel/xsave.c b/arch/x86/kernel/xsave.c
index 711091114119..e62728e30b01 100644
--- a/arch/x86/kernel/xsave.c
+++ b/arch/x86/kernel/xsave.c
@@ -6,6 +6,7 @@
 #include <linux/bootmem.h>
 #include <linux/compat.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h>
 #ifdef CONFIG_IA32_EMULATION
 #include <asm/sigcontext32.h>
 #endif
diff --git a/arch/x86/kvm/vmx.c b/arch/x86/kvm/vmx.c
index 3b4c8d8ad906..246490f643b6 100644
--- a/arch/x86/kvm/vmx.c
+++ b/arch/x86/kvm/vmx.c
@@ -1457,7 +1457,7 @@ static void __vmx_load_host_state(struct vcpu_vmx *vmx)
 #ifdef CONFIG_X86_64
 	wrmsrl(MSR_KERNEL_GS_BASE, vmx->msr_host_kernel_gs_base);
 #endif
-	if (__thread_has_fpu(current))
+	if (user_has_fpu())
 		clts();
 	load_gdt(&__get_cpu_var(host_gdt));
 }
diff --git a/arch/x86/kvm/x86.c b/arch/x86/kvm/x86.c
index 9cbfc0698118..b937b6179d80 100644
--- a/arch/x86/kvm/x86.c
+++ b/arch/x86/kvm/x86.c
@@ -57,6 +57,7 @@
 #include <asm/mtrr.h>
 #include <asm/mce.h>
 #include <asm/i387.h>
+#include <asm/fpu-internal.h> /* Ugh! */
 #include <asm/xcr.h>
 #include <asm/pvclock.h>
 #include <asm/div64.h>
diff --git a/arch/x86/power/cpu.c b/arch/x86/power/cpu.c
index f10c0afa1cb4..4889655ba784 100644
--- a/arch/x86/power/cpu.c
+++ b/arch/x86/power/cpu.c
@@ -20,6 +20,7 @@
 #include <asm/xcr.h>
 #include <asm/suspend.h>
 #include <asm/debugreg.h>
+#include <asm/fpu-internal.h> /* pcntxt_mask */
 
 #ifdef CONFIG_X86_32
 static struct saved_context saved_context;
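For reference, the two-stage switch_fpu_prepare()/switch_fpu_finish() API that now lives in <asm/fpu-internal.h> is used by the __switch_to() implementations roughly as follows (a simplified sketch of the calling pattern, not a verbatim excerpt from process_32.c/process_64.c; the function name is hypothetical):

#include <linux/sched.h>
#include <asm/fpu-internal.h>

static struct task_struct *hypothetical_switch_to(struct task_struct *prev_p,
						  struct task_struct *next_p)
{
	int cpu = smp_processor_id();
	fpu_switch_t fpu;

	/* Stage 1, in the old task's context: save prev's FPU state
	 * and decide (via fpu.preload) whether next's state will be
	 * restored; CR0.TS is set or left clear accordingly. */
	fpu = switch_fpu_prepare(prev_p, next_p, cpu);

	/* ... switch stacks, segments, TLS, debug registers ... */

	/* Stage 2: conditionally restore next's register state. */
	switch_fpu_finish(next_p, fpu);
	return prev_p;
}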