2 * linux/arch/i386/kernel/i387.c
4 * Copyright (C) 1994 Linus Torvalds
6 * Pentium III FXSR, SSE support
7 * General FPU state handling cleanups
8 * Gareth Hughes <gareth@valinux.com>, May 2000
11 #include <linux/config.h>
12 #include <linux/sched.h>
13 #include <asm/processor.h>
15 #include <asm/math_emu.h>
16 #include <asm/sigcontext.h>
18 #include <asm/ptrace.h>
19 #include <asm/uaccess.h>
/*
 * With CONFIG_MATH_EMULATION configured, HAVE_HWFP reads the hard_math
 * field of boot_cpu_data.
 * NOTE(review): the matching #else/#endif is not visible in this listing.
 */
21 #ifdef CONFIG_MATH_EMULATION
22 #define HAVE_HWFP (boot_cpu_data.hard_math)
/*
 * Mask ANDed into user-supplied MXCSR values (see restore_i387_fxsave()
 * and set_fpxregs()).  Starts with every bit set and is narrowed by
 * mxcsr_feature_mask_init().
 */
27 unsigned long mxcsr_feature_mask = 0xffffffff;
/*
 * Narrow mxcsr_feature_mask to the MXCSR bits the CPU reports.
 *
 * The current task's fxsave area is zeroed, an fxsave is executed into it,
 * and the mxcsr_mask field it produced is read back.  A value of zero is
 * replaced by the fallback 0x0000ffbf.  The result is ANDed into the
 * global mxcsr_feature_mask.
 *
 * NOTE(review): braces and any guarding statements around the fxsave
 * sequence are not visible in this listing.
 */
29 void mxcsr_feature_mask_init(void)
31 unsigned long mask = 0;
/* "&current" had been mis-encoded as a currency sign followed by "t". */
34 memset(&current->thread.i387.fxsave, 0, sizeof(struct i387_fxsave_struct));
35 asm volatile("fxsave %0" : : "m" (current->thread.i387.fxsave));
36 mask = current->thread.i387.fxsave.mxcsr_mask;
/* fxsave left the field at zero: fall back to a fixed mask */
37 if (mask == 0) mask = 0x0000ffbf;
39 mxcsr_feature_mask &= mask;
44 * The _current_ task is using the FPU for the first time
45 * so initialize it and set the mxcsr to its default
46 * value at reset if we support XMM instructions and then
47 * remember the current task has used the FPU.
/*
 * Reset the saved FPU image of tsk to default values.
 *
 * Two layouts are written in the visible code:
 *  - fxsave: the whole structure is zeroed, then cwd = 0x37f and
 *    mxcsr = 0x1f80;
 *  - fsave: the whole structure is zeroed, then cwd, swd, twd and fos are
 *    set with their upper 16 bits all ones.
 *
 * NOTE(review): the conditionals that choose between the two layouts (and
 * guard the mxcsr store) are not visible in this listing.
 */
49 void init_fpu(struct task_struct *tsk)
52 memset(&tsk->thread.i387.fxsave, 0, sizeof(struct i387_fxsave_struct));
53 tsk->thread.i387.fxsave.cwd = 0x37f;
55 tsk->thread.i387.fxsave.mxcsr = 0x1f80;
57 memset(&tsk->thread.i387.fsave, 0, sizeof(struct i387_fsave_struct));
58 tsk->thread.i387.fsave.cwd = 0xffff037fu;
59 tsk->thread.i387.fsave.swd = 0xffff0000u;
60 tsk->thread.i387.fsave.twd = 0xffffffffu;
61 tsk->thread.i387.fsave.fos = 0xffff0000u;
67 * FPU lazy state save handling.
/*
 * If the current thread_info has TS_USEDFPU set in its status word, pass
 * its task to __save_init_fpu().
 * NOTE(review): the remaining statements of this function are not visible
 * in this listing.
 */
70 void kernel_fpu_begin(void)
72 struct thread_info *thread = current_thread_info();
75 if (thread->status & TS_USEDFPU) {
76 __save_init_fpu(thread->task);
/*
 * Reload the FPU from the image saved in tsk: "fxrstor" from the fxsave
 * area, or "frstor" from the fsave area.
 * NOTE(review): the condition selecting between the two instructions is
 * not visible in this listing.
 */
82 void restore_fpu( struct task_struct *tsk )
85 asm volatile( "fxrstor %0"
86 : : "m" (tsk->thread.i387.fxsave) );
88 asm volatile( "frstor %0"
89 : : "m" (tsk->thread.i387.fsave) );
94 * FPU tag word conversions.
/*
 * Compress an i387 tag word (two bits per register) into the FXSR form
 * (one bit per register, held in the low byte).
 *
 * Each two-bit pair is first collapsed to a single "valid" bit, then the
 * eight bits are packed together by successive shift-and-mask steps.
 *
 * NOTE(review): the initial assignment to tmp and the return statement
 * are not visible in this listing.
 */
97 static inline unsigned short twd_i387_to_fxsr( unsigned short twd )
99 unsigned int tmp; /* to avoid 16 bit prefixes in the code */
101 /* Transform each pair of bits into 01 (valid) or 00 (empty) */
103 tmp = (tmp | (tmp>>1)) & 0x5555; /* 0V0V0V0V0V0V0V0V */
104 /* and move the valid bits to the lower byte. */
105 tmp = (tmp | (tmp >> 1)) & 0x3333; /* 00VV00VV00VV00VV */
106 tmp = (tmp | (tmp >> 2)) & 0x0f0f; /* 0000VVVV0000VVVV */
107 tmp = (tmp | (tmp >> 4)) & 0x00ff; /* 00000000VVVVVVVV */
/*
 * Expand the FXSR tag information of fxsave into an i387-style tag word.
 *
 * The result starts as 0xffff0000 and, for each of the eight registers,
 * a two-bit tag is ORed in at bit position 2*i.  Registers are located in
 * st_space at 16-byte intervals and classified from their exponent
 * (masked with 0x7fff) and significand words.
 *
 * NOTE(review): the case labels, the remaining tag assignments, the
 * declarations of i and tag, and the return statement are not visible in
 * this listing.
 */
111 static inline unsigned long twd_fxsr_to_i387( struct i387_fxsave_struct *fxsave )
113 struct _fpxreg *st = NULL;
114 unsigned long twd = (unsigned long) fxsave->twd;
116 unsigned long ret = 0xffff0000u;
/*
 * Address of register n inside f->st_space (16 bytes per register).
 * The definition carries no trailing semicolon so the macro can be used
 * as an ordinary expression.
 */
119 #define FPREG_ADDR(f, n) ((char *)&(f)->st_space + (n) * 16)
121 for ( i = 0 ; i < 8 ; i++ ) {
123 st = (struct _fpxreg *) FPREG_ADDR( fxsave, i );
125 switch ( st->exponent & 0x7fff ) {
127 tag = 2; /* Special */
/* all four significand words are zero */
130 if ( !st->significand[0] &&
131 !st->significand[1] &&
132 !st->significand[2] &&
133 !st->significand[3] ) {
136 tag = 2; /* Special */
/* top bit of the most significant significand word */
140 if ( st->significand[3] & 0x8000 ) {
143 tag = 2; /* Special */
/* place this register's two-bit tag in the result */
150 ret |= (tag << (2 * i));
157 * FPU state interaction.
/*
 * Return the control word saved for tsk: taken from the fxsave image when
 * cpu_has_fxsr, otherwise the fsave cwd truncated to 16 bits.
 */
160 unsigned short get_fpu_cwd( struct task_struct *tsk )
162 if ( cpu_has_fxsr ) {
163 return tsk->thread.i387.fxsave.cwd;
165 return (unsigned short)tsk->thread.i387.fsave.cwd;
/*
 * Return the status word saved for tsk: taken from the fxsave image when
 * cpu_has_fxsr, otherwise the fsave swd truncated to 16 bits.
 */
169 unsigned short get_fpu_swd( struct task_struct *tsk )
171 if ( cpu_has_fxsr ) {
172 return tsk->thread.i387.fxsave.swd;
174 return (unsigned short)tsk->thread.i387.fsave.swd;
/*
 * Return the tag word saved for tsk: taken from the fxsave image when
 * cpu_has_fxsr, otherwise the fsave twd truncated to 16 bits.  The fxsave
 * value is returned as stored, without conversion to the i387 form.
 */
178 unsigned short get_fpu_twd( struct task_struct *tsk )
180 if ( cpu_has_fxsr ) {
181 return tsk->thread.i387.fxsave.twd;
183 return (unsigned short)tsk->thread.i387.fsave.twd;
/*
 * Return the mxcsr field of tsk's fxsave image, truncated to the
 * unsigned short return type.
 * NOTE(review): any guard or alternative return around this statement is
 * not visible in this listing.
 */
187 unsigned short get_fpu_mxcsr( struct task_struct *tsk )
190 return tsk->thread.i387.fxsave.mxcsr;
/*
 * Store cwd as the control word saved for tsk.  With cpu_has_fxsr it is
 * written to the fxsave image as is; the fsave store sets the upper 16
 * bits to ones.
 * NOTE(review): the fsave store is presumably the else branch; the
 * "else" line is not visible in this listing.
 */
196 void set_fpu_cwd( struct task_struct *tsk, unsigned short cwd )
198 if ( cpu_has_fxsr ) {
199 tsk->thread.i387.fxsave.cwd = cwd;
201 tsk->thread.i387.fsave.cwd = ((long)cwd | 0xffff0000u);
/*
 * Store swd as the status word saved for tsk.  With cpu_has_fxsr it is
 * written to the fxsave image as is; the fsave store sets the upper 16
 * bits to ones.
 * NOTE(review): the fsave store is presumably the else branch; the
 * "else" line is not visible in this listing.
 */
205 void set_fpu_swd( struct task_struct *tsk, unsigned short swd )
207 if ( cpu_has_fxsr ) {
208 tsk->thread.i387.fxsave.swd = swd;
210 tsk->thread.i387.fsave.swd = ((long)swd | 0xffff0000u);
/*
 * Store twd (given in i387 form) as the tag word saved for tsk.  With
 * cpu_has_fxsr it is converted through twd_i387_to_fxsr() before being
 * written to the fxsave image; the fsave store keeps the value and sets
 * the upper 16 bits to ones.
 * NOTE(review): the fsave store is presumably the else branch; the
 * "else" line is not visible in this listing.
 */
214 void set_fpu_twd( struct task_struct *tsk, unsigned short twd )
216 if ( cpu_has_fxsr ) {
217 tsk->thread.i387.fxsave.twd = twd_i387_to_fxsr(twd);
219 tsk->thread.i387.fsave.twd = ((long)twd | 0xffff0000u);
224 * FXSR floating point environment conversions.
/*
 * Write an fxsave image to the user buffer buf in the i387 layout.
 *
 *  - A seven-word environment (cwd, swd, twd, fip, fcs combined with fop,
 *    foo, fos) is assembled in env[] and copied to the start of buf.
 *  - The eight registers stored in fxsave->st_space are walked, and the
 *    tmp scratch array is finally copied to buf->_st.
 *
 * NOTE(review): the return statements, the declaration of i, the
 * initialisation of "to" and part of the loop body are not visible in
 * this listing.
 */
227 static int convert_fxsr_to_user( struct _fpstate __user *buf,
228 struct i387_fxsave_struct *fxsave )
230 struct _fpreg tmp[8]; /* 80 bytes scratch area */
231 unsigned long env[7];
232 struct _fpreg __user *to;
233 struct _fpxreg *from;
/* control and status words get their upper 16 bits forced to ones */
236 env[0] = (unsigned long)fxsave->cwd | 0xffff0000ul;
237 env[1] = (unsigned long)fxsave->swd | 0xffff0000ul;
/* tag word expanded by twd_fxsr_to_i387() */
238 env[2] = twd_fxsr_to_i387(fxsave);
239 env[3] = fxsave->fip;
/* fcs in the low half, fop shifted into the upper 16 bits */
240 env[4] = fxsave->fcs | ((unsigned long)fxsave->fop << 16);
241 env[5] = fxsave->foo;
242 env[6] = fxsave->fos;
244 if ( __copy_to_user( buf, env, 7 * sizeof(unsigned long) ) )
248 from = (struct _fpxreg *) &fxsave->st_space[0];
249 for ( i = 0 ; i < 8 ; i++, to++, from++ ) {
250 unsigned long __user *t = (unsigned long __user *)to;
251 unsigned long *f = (unsigned long *)from;
255 to->exponent = from->exponent;
257 if (copy_to_user(buf->_st, tmp, sizeof(struct _fpreg [8])))
/*
 * Fill an fxsave image from an i387-layout user buffer.
 *
 *  - Seven words of environment are read from the start of buf into
 *    env[], and the register area buf->_st is read into the tmp scratch
 *    array.
 *  - The environment words are unpacked into the fxsave fields; the tag
 *    word is converted with twd_i387_to_fxsr().
 *  - The eight registers are then walked into fxsave->st_space.
 *
 * NOTE(review): the return statements, the declarations of "to" and i,
 * the initialisation of "from" and part of the loop body are not visible
 * in this listing.
 */
262 static int convert_fxsr_from_user( struct i387_fxsave_struct *fxsave,
263 struct _fpstate __user *buf )
265 struct _fpreg tmp[8]; /* 80 bytes scratch area */
266 unsigned long env[7];
268 struct _fpreg __user *from;
271 if ( __copy_from_user( env, buf, 7 * sizeof(long) ) )
273 if (copy_from_user(tmp, buf->_st, sizeof(struct _fpreg [8])))
/* only the low 16 bits of each environment word are kept */
276 fxsave->cwd = (unsigned short)(env[0] & 0xffff);
277 fxsave->swd = (unsigned short)(env[1] & 0xffff);
278 fxsave->twd = twd_i387_to_fxsr((unsigned short)(env[2] & 0xffff));
279 fxsave->fip = env[3];
/* env[4] carries fop in its upper half and fcs in its lower half */
280 fxsave->fop = (unsigned short)((env[4] & 0xffff0000ul) >> 16);
281 fxsave->fcs = (env[4] & 0xffff);
282 fxsave->foo = env[5];
283 fxsave->fos = env[6];
285 to = (struct _fpxreg *) &fxsave->st_space[0];
287 for ( i = 0 ; i < 8 ; i++, to++, from++ ) {
288 unsigned long *t = (unsigned long *)to;
289 unsigned long __user *f = (unsigned long __user *)from;
293 to->exponent = from->exponent;
299 * Signal frame handlers.
/*
 * Copy the current task's fsave image to the user buffer buf.  Before the
 * copy, the image's status field is set to its swd field.
 * NOTE(review): the return statements are not visible in this listing.
 */
302 static inline int save_i387_fsave( struct _fpstate __user *buf )
304 struct task_struct *tsk = current;
307 tsk->thread.i387.fsave.status = tsk->thread.i387.fsave.swd;
308 if ( __copy_to_user( buf, &tsk->thread.i387.fsave,
309 sizeof(struct i387_fsave_struct) ) )
/*
 * Write the current task's fxsave state to the user buffer buf:
 *  1. the i387-layout view, via convert_fxsr_to_user();
 *  2. the status word into buf->status and X86_FXSR_MAGIC into buf->magic;
 *  3. the complete fxsave image into buf->_fxsr_env.
 * NOTE(review): the declaration of err and the return statements are not
 * visible in this listing.
 */
314 static int save_i387_fxsave( struct _fpstate __user *buf )
316 struct task_struct *tsk = current;
321 if ( convert_fxsr_to_user( buf, &tsk->thread.i387.fxsave ) )
324 err |= __put_user( tsk->thread.i387.fxsave.swd, &buf->status );
325 err |= __put_user( X86_FXSR_MAGIC, &buf->magic );
329 if ( __copy_to_user( &buf->_fxsr_env[0], &tsk->thread.i387.fxsave,
330 sizeof(struct i387_fxsave_struct) ) )
/*
 * Save the current task's FPU state into the user buffer buf.
 *
 * current->used_math is tested first and then cleared.  The save itself
 * is delegated to save_i387_fxsave() when cpu_has_fxsr, to
 * save_i387_fsave() otherwise, or to save_i387_soft() for the soft image.
 *
 * NOTE(review): the statement executed when used_math is clear and the
 * condition selecting the soft path are not visible in this listing.
 */
335 int save_i387( struct _fpstate __user *buf )
337 if ( !current->used_math )
340 /* This will cause a "finit" to be triggered by the next
341 * attempted FPU operation by the 'current' process. */
343 current->used_math = 0;
346 if ( cpu_has_fxsr ) {
347 return save_i387_fxsave( buf );
349 return save_i387_fsave( buf );
/* "&current" had been mis-encoded as a currency sign followed by "t". */
352 return save_i387_soft( &current->thread.i387.soft, buf );
/*
 * Overwrite the current task's fsave image with
 * sizeof(struct i387_fsave_struct) bytes read from the user buffer buf.
 * Returns whatever __copy_from_user() returns.
 */
356 static inline int restore_i387_fsave( struct _fpstate __user *buf )
358 struct task_struct *tsk = current;
360 return __copy_from_user( &tsk->thread.i387.fsave, buf,
361 sizeof(struct i387_fsave_struct) );
/*
 * Reload the current task's fxsave image from buf->_fxsr_env, mask the
 * loaded mxcsr with mxcsr_feature_mask, and then apply the i387-layout
 * part of buf through convert_fxsr_from_user().
 *
 * Returns 1 if the initial copy reported an error, otherwise the result
 * of convert_fxsr_from_user().  The mxcsr masking happens whether or not
 * the copy succeeded.
 * NOTE(review): the declaration of err is not visible in this listing.
 */
364 static int restore_i387_fxsave( struct _fpstate __user *buf )
367 struct task_struct *tsk = current;
369 err = __copy_from_user( &tsk->thread.i387.fxsave, &buf->_fxsr_env[0],
370 sizeof(struct i387_fxsave_struct) );
371 /* mxcsr reserved bits must be masked to zero for security reasons */
372 tsk->thread.i387.fxsave.mxcsr &= mxcsr_feature_mask;
373 return err ? 1 : convert_fxsr_from_user( &tsk->thread.i387.fxsave, buf );
/*
 * Restore the current task's FPU state from the user buffer buf.
 *
 * The work is delegated to restore_i387_fxsave() when cpu_has_fxsr, to
 * restore_i387_fsave() otherwise, or to restore_i387_soft() for the soft
 * image.  Afterwards current->used_math is set to 1.
 *
 * NOTE(review): the declaration of err, the condition selecting the soft
 * path and the return statement are not visible in this listing.
 */
376 int restore_i387( struct _fpstate __user *buf )
381 if ( cpu_has_fxsr ) {
382 err = restore_i387_fxsave( buf );
384 err = restore_i387_fsave( buf );
/* "&current" had been mis-encoded as a currency sign followed by "t". */
387 err = restore_i387_soft( &current->thread.i387.soft, buf );
389 current->used_math = 1;
394 * ptrace request handlers.
/*
 * Copy the first sizeof(struct user_i387_struct) bytes of tsk's fsave
 * image to the user buffer buf.  Returns whatever __copy_to_user()
 * returns.
 */
397 static inline int get_fpregs_fsave( struct user_i387_struct __user *buf,
398 struct task_struct *tsk )
400 return __copy_to_user( buf, &tsk->thread.i387.fsave,
401 sizeof(struct user_i387_struct) );
/*
 * Write tsk's fxsave image to the user buffer buf in i387 layout by
 * passing buf, cast to a struct _fpstate pointer, to
 * convert_fxsr_to_user().  Returns that function's result.
 */
404 static inline int get_fpregs_fxsave( struct user_i387_struct __user *buf,
405 struct task_struct *tsk )
407 return convert_fxsr_to_user( (struct _fpstate __user *)buf,
408 &tsk->thread.i387.fxsave );
/*
 * Copy the FPU registers of tsk to the user buffer buf, delegating to
 * get_fpregs_fxsave() when cpu_has_fxsr, to get_fpregs_fsave() otherwise,
 * or to save_i387_soft() for the soft image.
 * NOTE(review): the condition selecting the soft path is not visible in
 * this listing.
 */
411 int get_fpregs( struct user_i387_struct __user *buf, struct task_struct *tsk )
414 if ( cpu_has_fxsr ) {
415 return get_fpregs_fxsave( buf, tsk );
417 return get_fpregs_fsave( buf, tsk );
420 return save_i387_soft( &tsk->thread.i387.soft,
421 (struct _fpstate __user *)buf );
/*
 * Overwrite the first sizeof(struct user_i387_struct) bytes of tsk's
 * fsave image with data read from the user buffer buf.  Returns whatever
 * __copy_from_user() returns.
 */
425 static inline int set_fpregs_fsave( struct task_struct *tsk,
426 struct user_i387_struct __user *buf )
428 return __copy_from_user( &tsk->thread.i387.fsave, buf,
429 sizeof(struct user_i387_struct) );
/*
 * Load tsk's fxsave image from the i387-layout user buffer buf by passing
 * buf, cast to a struct _fpstate pointer, to convert_fxsr_from_user().
 * Returns that function's result.
 */
432 static inline int set_fpregs_fxsave( struct task_struct *tsk,
433 struct user_i387_struct __user *buf )
435 return convert_fxsr_from_user( &tsk->thread.i387.fxsave,
436 (struct _fpstate __user *)buf );
/*
 * Load the FPU registers of tsk from the user buffer buf, delegating to
 * set_fpregs_fxsave() when cpu_has_fxsr, to set_fpregs_fsave() otherwise,
 * or to restore_i387_soft() for the soft image.
 * NOTE(review): the condition selecting the soft path is not visible in
 * this listing.
 */
439 int set_fpregs( struct task_struct *tsk, struct user_i387_struct __user *buf )
442 if ( cpu_has_fxsr ) {
443 return set_fpregs_fxsave( tsk, buf );
445 return set_fpregs_fsave( tsk, buf );
448 return restore_i387_soft( &tsk->thread.i387.soft,
449 (struct _fpstate __user *)buf );
/*
 * When cpu_has_fxsr, copy sizeof(struct user_fxsr_struct) bytes of tsk's
 * fxsave image to the user buffer buf.
 * NOTE(review): the return values, including the one used without FXSR,
 * are not visible in this listing.
 */
453 int get_fpxregs( struct user_fxsr_struct __user *buf, struct task_struct *tsk )
455 if ( cpu_has_fxsr ) {
456 if (__copy_to_user( buf, &tsk->thread.i387.fxsave,
457 sizeof(struct user_fxsr_struct) ))
/*
 * When cpu_has_fxsr, overwrite tsk's fxsave image with
 * sizeof(struct user_fxsr_struct) bytes read from the user buffer buf,
 * then mask the loaded mxcsr with mxcsr_feature_mask.
 * NOTE(review): the return values, including the one used without FXSR,
 * are not visible in this listing.
 */
465 int set_fpxregs( struct task_struct *tsk, struct user_fxsr_struct __user *buf )
469 if ( cpu_has_fxsr ) {
470 if (__copy_from_user( &tsk->thread.i387.fxsave, buf,
471 sizeof(struct user_fxsr_struct) ))
473 /* mxcsr reserved bits must be masked to zero for security reasons */
474 tsk->thread.i387.fxsave.mxcsr &= mxcsr_feature_mask;
482 * FPU state for core dumps.
/*
 * Copy the first sizeof(struct user_i387_struct) bytes of tsk's fsave
 * image into the kernel buffer fpu.
 */
485 static inline void copy_fpu_fsave( struct task_struct *tsk,
486 struct user_i387_struct *fpu )
488 memcpy( fpu, &tsk->thread.i387.fsave,
489 sizeof(struct user_i387_struct) );
/*
 * Fill the kernel buffer fpu from tsk's fxsave image.
 *
 * The first seven longs are copied verbatim.  The eight registers are
 * then repacked: each iteration copies five unsigned shorts, with the
 * source advancing eight shorts per register and the destination five.
 *
 * NOTE(review): the declarations of "to" and i are not visible in this
 * listing.
 */
492 static inline void copy_fpu_fxsave( struct task_struct *tsk,
493 struct user_i387_struct *fpu )
496 unsigned short *from;
499 memcpy( fpu, &tsk->thread.i387.fxsave, 7 * sizeof(long) );
501 to = (unsigned short *)&fpu->st_space[0];
502 from = (unsigned short *)&tsk->thread.i387.fxsave.st_space[0];
503 for ( i = 0 ; i < 8 ; i++, to += 5, from += 8 ) {
504 memcpy( to, from, 5 * sizeof(unsigned short) );
/*
 * Copy the current task's FPU state into fpu, using copy_fpu_fxsave()
 * when cpu_has_fxsr and copy_fpu_fsave() otherwise.  fpvalid is taken
 * from the task's used_math flag.
 * NOTE(review): the declaration of fpvalid, any test of it before
 * copying, and the return statement are not visible in this listing; regs
 * is not referenced by the visible lines.
 */
508 int dump_fpu( struct pt_regs *regs, struct user_i387_struct *fpu )
511 struct task_struct *tsk = current;
513 fpvalid = tsk->used_math;
516 if ( cpu_has_fxsr ) {
517 copy_fpu_fxsave( tsk, fpu );
519 copy_fpu_fsave( tsk, fpu );
/*
 * Copy sizeof(struct user_fxsr_struct) bytes of the current task's fxsave
 * image into fpu.  fpvalid is non-zero only when the task has used_math
 * set and cpu_has_fxsr holds.
 * NOTE(review): the declaration of fpvalid, any test of it before
 * copying, and the return statement are not visible in this listing; regs
 * is not referenced by the visible lines.
 */
526 int dump_extended_fpu( struct pt_regs *regs, struct user_fxsr_struct *fpu )
529 struct task_struct *tsk = current;
531 fpvalid = tsk->used_math && cpu_has_fxsr;
534 memcpy( fpu, &tsk->thread.i387.fxsave,
535 sizeof(struct user_fxsr_struct) );
/*
 * Copy the FPU state of the given task tsk into fpu, through
 * copy_fpu_fxsave() or copy_fpu_fsave().  fpvalid is taken from the
 * task's used_math flag.
 * NOTE(review): the conditions guarding the two copies and the return
 * statement are not visible in this listing.
 */
541 int dump_task_fpu(struct task_struct *tsk, struct user_i387_struct *fpu)
543 int fpvalid = tsk->used_math;
549 copy_fpu_fxsave(tsk, fpu);
551 copy_fpu_fsave(tsk, fpu);
/*
 * Copy sizeof(*fpu) bytes of tsk's fxsave image into fpu.  fpvalid is
 * non-zero only when the task has used_math set and cpu_has_fxsr holds.
 * NOTE(review): any test of fpvalid before copying and the return
 * statement are not visible in this listing.
 */
556 int dump_task_extended_fpu(struct task_struct *tsk, struct user_fxsr_struct *fpu)
558 int fpvalid = tsk->used_math && cpu_has_fxsr;
563 memcpy(fpu, &tsk->thread.i387.fxsave, sizeof(*fpu));