i387.c 12.4 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9
/*
 *  Copyright (C) 1994 Linus Torvalds
 *
 *  Pentium III FXSR, SSE support
 *  General FPU state handling cleanups
 *	Gareth Hughes <gareth@valinux.com>, May 2000
 */

#include <linux/sched.h>
10
#include <linux/module.h>
L
Linus Torvalds 已提交
11 12 13 14 15 16 17 18 19 20 21 22 23 24
#include <asm/processor.h>
#include <asm/i387.h>
#include <asm/math_emu.h>
#include <asm/sigcontext.h>
#include <asm/user.h>
#include <asm/ptrace.h>
#include <asm/uaccess.h>

/*
 * HAVE_HWFP selects between the hardware FPU paths and the soft-float
 * (math emulation) paths below.  When math emulation is configured it
 * reads the boot CPU's hard_math field; otherwise it is the constant 1.
 */
#ifdef CONFIG_MATH_EMULATION
#define HAVE_HWFP (boot_cpu_data.hard_math)
#else
#define HAVE_HWFP 1
#endif

25
/*
 * Bits that may be set in a task's saved MXCSR image.  Starts with all
 * bits set and is narrowed by mxcsr_feature_mask_init(); MXCSR values
 * copied in from user space are ANDed with it.
 */
static unsigned long mxcsr_feature_mask __read_mostly = 0xffffffff;
L
Linus Torvalds 已提交
26 27 28 29 30 31

void mxcsr_feature_mask_init(void)
{
	unsigned long mask = 0;
	clts();
	if (cpu_has_fxsr) {
32 33 34
		memset(&current->thread.i387.fxsave, 0,
		       sizeof(struct i387_fxsave_struct));
		asm volatile("fxsave %0" : : "m" (current->thread.i387.fxsave));
L
Linus Torvalds 已提交
35
		mask = current->thread.i387.fxsave.mxcsr_mask;
36 37 38
		if (mask == 0)
			mask = 0x0000ffbf;
	}
L
Linus Torvalds 已提交
39 40 41 42 43 44 45 46 47 48 49 50 51
	mxcsr_feature_mask &= mask;
	stts();
}

/*
 * The _current_ task is using the FPU for the first time
 * so initialize it and set the mxcsr to its default
 * value at reset if we support XMM instructions and then
 * remember the current task has used the FPU.
 */
void init_fpu(struct task_struct *tsk)
{
	if (cpu_has_fxsr) {
52 53
		memset(&tsk->thread.i387.fxsave, 0,
		       sizeof(struct i387_fxsave_struct));
L
Linus Torvalds 已提交
54 55 56 57
		tsk->thread.i387.fxsave.cwd = 0x37f;
		if (cpu_has_xmm)
			tsk->thread.i387.fxsave.mxcsr = 0x1f80;
	} else {
58 59
		memset(&tsk->thread.i387.fsave, 0,
		       sizeof(struct i387_fsave_struct));
L
Linus Torvalds 已提交
60 61 62 63 64
		tsk->thread.i387.fsave.cwd = 0xffff037fu;
		tsk->thread.i387.fsave.swd = 0xffff0000u;
		tsk->thread.i387.fsave.twd = 0xffffffffu;
		tsk->thread.i387.fsave.fos = 0xffff0000u;
	}
65 66
	/* only the device not available exception
	 * or ptrace can call init_fpu */
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84
	set_stopped_child_used_math(tsk);
}

/*
 * FPU lazy state save handling.
 */

/*
 * Disable preemption and prepare the FPU for use by the caller.
 *
 * If the current thread has TS_USEDFPU set, its state is handed to
 * __save_init_fpu(); otherwise only clts() is issued.  Preemption is
 * left disabled on return.
 */
void kernel_fpu_begin(void)
{
	struct thread_info *ti = current_thread_info();

	preempt_disable();
	if (!(ti->status & TS_USEDFPU)) {
		clts();
		return;
	}
	__save_init_fpu(ti->task);
}
EXPORT_SYMBOL_GPL(kernel_fpu_begin);
L
Linus Torvalds 已提交
86 87 88 89 90

/*
 * FPU tag word conversions.
 */

91
/*
 * Convert a full i387 tag word (two bits per register, 11 = empty) into
 * the abridged FXSR form (one bit per register, 1 = not empty).
 *
 * @twd: 16-bit i387 tag word.
 *
 * Returns the 8-bit abridged tag in the low byte; bit n is set when
 * register n's two-bit tag is anything other than 11.
 */
static inline unsigned short twd_i387_to_fxsr(unsigned short twd)
{
	unsigned int tmp; /* to avoid 16 bit prefixes in the code */

	/* Transform each pair of bits into 01 (valid) or 00 (empty) */
	tmp = ~twd;
	tmp = (tmp | (tmp >> 1)) & 0x5555; /* 0V0V0V0V0V0V0V0V */
	/* and move the valid bits to the lower byte. */
	tmp = (tmp | (tmp >> 1)) & 0x3333; /* 00VV00VV00VV00VV */
	tmp = (tmp | (tmp >> 2)) & 0x0f0f; /* 0000VVVV0000VVVV */
	tmp = (tmp | (tmp >> 4)) & 0x00ff; /* 00000000VVVVVVVV */

	return tmp;
}

106
static inline unsigned long twd_fxsr_to_i387(struct i387_fxsave_struct *fxsave)
L
Linus Torvalds 已提交
107 108 109 110 111 112 113 114 115 116
{
	struct _fpxreg *st = NULL;
	unsigned long tos = (fxsave->swd >> 11) & 7;
	unsigned long twd = (unsigned long) fxsave->twd;
	unsigned long tag;
	unsigned long ret = 0xffff0000u;
	int i;

#define FPREG_ADDR(f, n)	((void *)&(f)->st_space + (n) * 16);

117 118 119
	for (i = 0; i < 8; i++) {
		if (twd & 0x1) {
			st = FPREG_ADDR(fxsave, (i - tos) & 7);
L
Linus Torvalds 已提交
120

121
			switch (st->exponent & 0x7fff) {
L
Linus Torvalds 已提交
122 123 124 125
			case 0x7fff:
				tag = 2;		/* Special */
				break;
			case 0x0000:
126 127 128 129
				if (!st->significand[0] &&
				    !st->significand[1] &&
				    !st->significand[2] &&
				    !st->significand[3]) {
L
Linus Torvalds 已提交
130 131 132 133 134 135
					tag = 1;	/* Zero */
				} else {
					tag = 2;	/* Special */
				}
				break;
			default:
136
				if (st->significand[3] & 0x8000) {
L
Linus Torvalds 已提交
137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155
					tag = 0;	/* Valid */
				} else {
					tag = 2;	/* Special */
				}
				break;
			}
		} else {
			tag = 3;			/* Empty */
		}
		ret |= (tag << (2 * i));
		twd = twd >> 1;
	}
	return ret;
}

/*
 * FPU state interaction.
 */

156
unsigned short get_fpu_cwd(struct task_struct *tsk)
L
Linus Torvalds 已提交
157
{
158
	if (cpu_has_fxsr) {
L
Linus Torvalds 已提交
159 160 161 162 163 164
		return tsk->thread.i387.fxsave.cwd;
	} else {
		return (unsigned short)tsk->thread.i387.fsave.cwd;
	}
}

165
unsigned short get_fpu_swd(struct task_struct *tsk)
L
Linus Torvalds 已提交
166
{
167
	if (cpu_has_fxsr) {
L
Linus Torvalds 已提交
168 169 170 171 172 173 174
		return tsk->thread.i387.fxsave.swd;
	} else {
		return (unsigned short)tsk->thread.i387.fsave.swd;
	}
}

#if 0
175
unsigned short get_fpu_twd(struct task_struct *tsk)
L
Linus Torvalds 已提交
176
{
177
	if (cpu_has_fxsr) {
L
Linus Torvalds 已提交
178 179 180 181 182 183 184
		return tsk->thread.i387.fxsave.twd;
	} else {
		return (unsigned short)tsk->thread.i387.fsave.twd;
	}
}
#endif  /*  0  */

185
unsigned short get_fpu_mxcsr(struct task_struct *tsk)
L
Linus Torvalds 已提交
186
{
187
	if (cpu_has_xmm) {
L
Linus Torvalds 已提交
188 189 190 191 192 193 194 195
		return tsk->thread.i387.fxsave.mxcsr;
	} else {
		return 0x1f80;
	}
}

#if 0

196
void set_fpu_cwd(struct task_struct *tsk, unsigned short cwd)
L
Linus Torvalds 已提交
197
{
198
	if (cpu_has_fxsr) {
L
Linus Torvalds 已提交
199 200 201 202 203 204
		tsk->thread.i387.fxsave.cwd = cwd;
	} else {
		tsk->thread.i387.fsave.cwd = ((long)cwd | 0xffff0000u);
	}
}

205
void set_fpu_swd(struct task_struct *tsk, unsigned short swd)
L
Linus Torvalds 已提交
206
{
207
	if (cpu_has_fxsr) {
L
Linus Torvalds 已提交
208 209 210 211 212 213
		tsk->thread.i387.fxsave.swd = swd;
	} else {
		tsk->thread.i387.fsave.swd = ((long)swd | 0xffff0000u);
	}
}

214
void set_fpu_twd(struct task_struct *tsk, unsigned short twd)
L
Linus Torvalds 已提交
215
{
216
	if (cpu_has_fxsr) {
L
Linus Torvalds 已提交
217 218 219 220 221 222 223 224 225 226 227 228
		tsk->thread.i387.fxsave.twd = twd_i387_to_fxsr(twd);
	} else {
		tsk->thread.i387.fsave.twd = ((long)twd | 0xffff0000u);
	}
}

#endif  /*  0  */

/*
 * FXSR floating point environment conversions.
 */

229 230
/*
 * Write an FXSR save area to user space in i387 (_fpstate) layout.
 *
 * A seven-word environment is assembled from the fxsave header (cwd and
 * swd padded with 0xffff in the upper half, twd expanded through
 * twd_fxsr_to_i387(), fop packed above fcs) and copied to the start of
 * buf.  Each of the eight registers is then written to buf->_st[] as two
 * longs plus the exponent.
 *
 * Returns 0 on success, 1 if any user-space access fails.
 */
static int convert_fxsr_to_user(struct _fpstate __user *buf,
				struct i387_fxsave_struct *fxsave)
{
	unsigned long env[7];
	struct _fpxreg *src = (struct _fpxreg *) &fxsave->st_space[0];
	struct _fpreg __user *dst;
	int reg;

	env[0] = (unsigned long)fxsave->cwd | 0xffff0000ul;
	env[1] = (unsigned long)fxsave->swd | 0xffff0000ul;
	env[2] = twd_fxsr_to_i387(fxsave);
	env[3] = fxsave->fip;
	env[4] = fxsave->fcs | ((unsigned long)fxsave->fop << 16);
	env[5] = fxsave->foo;
	env[6] = fxsave->fos;

	if (__copy_to_user(buf, env, sizeof(env)))
		return 1;

	dst = &buf->_st[0];
	for (reg = 0; reg < 8; reg++) {
		unsigned long *in = (unsigned long *)&src[reg];
		unsigned long __user *out = (unsigned long __user *)&dst[reg];

		/* Two longs of significand first, then the exponent. */
		if (__put_user(in[0], out))
			return 1;
		if (__put_user(in[1], out + 1))
			return 1;
		if (__put_user(src[reg].exponent, &dst[reg].exponent))
			return 1;
	}
	return 0;
}

262 263
/*
 * Load an FXSR save area from an i387-layout (_fpstate) user buffer.
 *
 * The seven-word environment at the start of buf is read and unpacked
 * into the fxsave header (twd compressed through twd_i387_to_fxsr(),
 * fop taken from the upper half of word 4).  Each of the eight registers
 * in buf->_st[] is then read as two longs plus the exponent.
 *
 * Returns 0 on success, 1 if any user-space access fails.
 */
static int convert_fxsr_from_user(struct i387_fxsave_struct *fxsave,
				  struct _fpstate __user *buf)
{
	unsigned long env[7];
	struct _fpxreg *dst;
	struct _fpreg __user *src;
	int reg;

	if (__copy_from_user(env, buf, sizeof(env)))
		return 1;

	fxsave->cwd = (unsigned short)(env[0] & 0xffff);
	fxsave->swd = (unsigned short)(env[1] & 0xffff);
	fxsave->twd = twd_i387_to_fxsr((unsigned short)(env[2] & 0xffff));
	fxsave->fip = env[3];
	fxsave->fop = (unsigned short)((env[4] & 0xffff0000ul) >> 16);
	fxsave->fcs = (env[4] & 0xffff);
	fxsave->foo = env[5];
	fxsave->fos = env[6];

	dst = (struct _fpxreg *) &fxsave->st_space[0];
	src = &buf->_st[0];
	for (reg = 0; reg < 8; reg++) {
		unsigned long *out = (unsigned long *)&dst[reg];
		unsigned long __user *in = (unsigned long __user *)&src[reg];

		/* Two longs of significand first, then the exponent. */
		if (__get_user(out[0], in))
			return 1;
		if (__get_user(out[1], in + 1))
			return 1;
		if (__get_user(dst[reg].exponent, &src[reg].exponent))
			return 1;
	}
	return 0;
}

/*
 * Signal frame handlers.
 */

300
/*
 * Signal-frame save for the FSAVE layout.
 *
 * After unlazy_fpu(), the status field is set to a copy of swd and the
 * whole fsave area is copied to buf.
 *
 * Returns 1 on success, -1 if the copy to user space fails.
 */
static inline int save_i387_fsave(struct _fpstate __user *buf)
{
	struct task_struct *tsk = current;

	unlazy_fpu(tsk);
	tsk->thread.i387.fsave.status = tsk->thread.i387.fsave.swd;

	return __copy_to_user(buf, &tsk->thread.i387.fsave,
			      sizeof(struct i387_fsave_struct)) ? -1 : 1;
}

312
/*
 * Signal-frame save for the FXSAVE layout.
 *
 * After unlazy_fpu(), the state is written to buf in i387 form through
 * convert_fxsr_to_user(), followed by the status word, the
 * X86_FXSR_MAGIC marker and finally the raw fxsave area in
 * buf->_fxsr_env.
 *
 * Returns 1 on success, -1 if any step fails.
 */
static int save_i387_fxsave(struct _fpstate __user *buf)
{
	struct task_struct *tsk = current;
	int err;

	unlazy_fpu(tsk);

	if (convert_fxsr_to_user(buf, &tsk->thread.i387.fxsave))
		return -1;

	/* Both stores are attempted before the combined result is checked. */
	err = __put_user(tsk->thread.i387.fxsave.swd, &buf->status);
	err |= __put_user(X86_FXSR_MAGIC, &buf->magic);
	if (err)
		return -1;

	return __copy_to_user(&buf->_fxsr_env[0], &tsk->thread.i387.fxsave,
			      sizeof(struct i387_fxsave_struct)) ? -1 : 1;
}

333
/*
 * Save the current task's FPU state into a signal frame.
 *
 * Returns 0 without touching buf when the task has not used math.
 * Otherwise the used-math flag is cleared and the result of the
 * layout-specific helper is returned: the soft-float saver without
 * hardware FP, else the FXSAVE or FSAVE saver.
 */
int save_i387(struct _fpstate __user *buf)
{
	if (!used_math())
		return 0;

	/*
	 * Clearing the flag makes the next FPU operation attempted by
	 * 'current' trigger a "finit".
	 */
	clear_used_math();

	if (!HAVE_HWFP)
		return save_i387_soft(&current->thread.i387.soft, buf);

	if (cpu_has_fxsr)
		return save_i387_fxsave(buf);

	return save_i387_fsave(buf);
}

354
/*
 * Signal-frame restore for the FSAVE layout: clear_fpu() on the current
 * task, then copy the fsave area in from buf.
 *
 * Returns the result of __copy_from_user() (non-zero on failure).
 */
static inline int restore_i387_fsave(struct _fpstate __user *buf)
{
	struct task_struct *tsk = current;
	int err;

	clear_fpu(tsk);
	err = __copy_from_user(&tsk->thread.i387.fsave, buf,
			       sizeof(struct i387_fsave_struct));
	return err;
}

362
/*
 * Signal-frame restore for the FXSAVE layout.
 *
 * After clear_fpu(), the raw fxsave area is copied in from
 * buf->_fxsr_env and its mxcsr is masked with mxcsr_feature_mask.  If
 * that copy succeeded, the i387-form fields of buf are then applied on
 * top through convert_fxsr_from_user().
 *
 * Returns 0 on success, 1 on failure.
 */
static int restore_i387_fxsave(struct _fpstate __user *buf)
{
	struct task_struct *tsk = current;
	int err;

	clear_fpu(tsk);
	err = __copy_from_user(&tsk->thread.i387.fxsave, &buf->_fxsr_env[0],
			       sizeof(struct i387_fxsave_struct));

	/*
	 * mxcsr reserved bits must be masked to zero for security
	 * reasons; this is done whether or not the copy succeeded.
	 */
	tsk->thread.i387.fxsave.mxcsr &= mxcsr_feature_mask;

	if (err)
		return 1;

	return convert_fxsr_from_user(&tsk->thread.i387.fxsave, buf);
}

374
/*
 * Restore the current task's FPU state from a signal frame.
 *
 * Dispatches to the soft-float restorer without hardware FP, else to
 * the FXSAVE or FSAVE restorer.  The used-math flag is set afterwards
 * regardless of the outcome.
 *
 * Returns the helper's result.
 */
int restore_i387(struct _fpstate __user *buf)
{
	int err;

	if (!HAVE_HWFP)
		err = restore_i387_soft(&current->thread.i387.soft, buf);
	else if (cpu_has_fxsr)
		err = restore_i387_fxsave(buf);
	else
		err = restore_i387_fsave(buf);

	set_used_math();
	return err;
}

/*
 * ptrace request handlers.
 */

395 396
/*
 * ptrace read, FSAVE layout: copy the leading
 * sizeof(struct user_i387_struct) bytes of tsk's fsave area to buf.
 *
 * Returns the result of __copy_to_user() (non-zero on failure).
 */
static inline int get_fpregs_fsave(struct user_i387_struct __user *buf,
				   struct task_struct *tsk)
{
	return __copy_to_user(buf, &tsk->thread.i387.fsave, sizeof(*buf));
}

402 403
/*
 * ptrace read, FXSAVE layout: convert tsk's fxsave area to i387 form
 * and write it to buf, which is treated as a struct _fpstate.
 *
 * Returns the result of convert_fxsr_to_user() (0 ok, 1 on fault).
 */
static inline int get_fpregs_fxsave(struct user_i387_struct __user *buf,
				    struct task_struct *tsk)
{
	struct _fpstate __user *fpstate = (struct _fpstate __user *)buf;

	return convert_fxsr_to_user(fpstate, &tsk->thread.i387.fxsave);
}

409
/*
 * ptrace: write tsk's FPU registers to buf in i387 layout.
 *
 * Uses the soft-float saver without hardware FP, else the FXSAVE or
 * FSAVE helper, and returns that helper's result.
 */
int get_fpregs(struct user_i387_struct __user *buf, struct task_struct *tsk)
{
	if (!HAVE_HWFP)
		return save_i387_soft(&tsk->thread.i387.soft,
				      (struct _fpstate __user *)buf);

	if (cpu_has_fxsr)
		return get_fpregs_fxsave(buf, tsk);

	return get_fpregs_fsave(buf, tsk);
}

423 424
/*
 * ptrace write, FSAVE layout: copy sizeof(struct user_i387_struct)
 * bytes from buf over the start of tsk's fsave area.
 *
 * Returns the result of __copy_from_user() (non-zero on failure).
 */
static inline int set_fpregs_fsave(struct task_struct *tsk,
				   struct user_i387_struct __user *buf)
{
	return __copy_from_user(&tsk->thread.i387.fsave, buf, sizeof(*buf));
}

430 431
/*
 * ptrace write, FXSAVE layout: read i387-form state from buf (treated
 * as a struct _fpstate) and convert it into tsk's fxsave area.
 *
 * Returns the result of convert_fxsr_from_user() (0 ok, 1 on fault).
 */
static inline int set_fpregs_fxsave(struct task_struct *tsk,
				    struct user_i387_struct __user *buf)
{
	struct _fpstate __user *fpstate = (struct _fpstate __user *)buf;

	return convert_fxsr_from_user(&tsk->thread.i387.fxsave, fpstate);
}

437
/*
 * ptrace: load tsk's FPU registers from buf, given in i387 layout.
 *
 * Uses the soft-float restorer without hardware FP, else the FXSAVE or
 * FSAVE helper, and returns that helper's result.
 */
int set_fpregs(struct task_struct *tsk, struct user_i387_struct __user *buf)
{
	if (!HAVE_HWFP)
		return restore_i387_soft(&tsk->thread.i387.soft,
					 (struct _fpstate __user *)buf);

	if (cpu_has_fxsr)
		return set_fpregs_fxsave(tsk, buf);

	return set_fpregs_fsave(tsk, buf);
}

451
/*
 * ptrace: copy tsk's raw fxsave area to buf.
 *
 * Returns 0 on success, -EFAULT if the copy to user space fails, or
 * -EIO when FXSR is not available.
 */
int get_fpxregs(struct user_fxsr_struct __user *buf, struct task_struct *tsk)
{
	if (!cpu_has_fxsr)
		return -EIO;

	if (__copy_to_user(buf, &tsk->thread.i387.fxsave, sizeof(*buf)))
		return -EFAULT;

	return 0;
}

463
/*
 * ptrace: overwrite tsk's raw fxsave area from buf.
 *
 * Returns 0 on success, -EFAULT if the copy from user space fails, or
 * -EIO when FXSR is not available.  The mxcsr mask is applied even when
 * the copy reports a fault.
 */
int set_fpxregs(struct task_struct *tsk, struct user_fxsr_struct __user *buf)
{
	int ret = 0;

	if (!cpu_has_fxsr)
		return -EIO;

	if (__copy_from_user(&tsk->thread.i387.fxsave, buf, sizeof(*buf)))
		ret = -EFAULT;

	/* mxcsr reserved bits must be masked to zero for security reasons */
	tsk->thread.i387.fxsave.mxcsr &= mxcsr_feature_mask;

	return ret;
}

/*
 * FPU state for core dumps.
 */

484 485
static inline void copy_fpu_fsave(struct task_struct *tsk,
				  struct user_i387_struct *fpu)
L
Linus Torvalds 已提交
486
{
487 488
	memcpy(fpu, &tsk->thread.i387.fsave,
	       sizeof(struct user_i387_struct));
L
Linus Torvalds 已提交
489 490
}

491 492
static inline void copy_fpu_fxsave(struct task_struct *tsk,
				   struct user_i387_struct *fpu)
L
Linus Torvalds 已提交
493 494 495 496 497
{
	unsigned short *to;
	unsigned short *from;
	int i;

498
	memcpy(fpu, &tsk->thread.i387.fxsave, 7 * sizeof(long));
L
Linus Torvalds 已提交
499 500 501

	to = (unsigned short *)&fpu->st_space[0];
	from = (unsigned short *)&tsk->thread.i387.fxsave.st_space[0];
502 503
	for (i = 0; i < 8; i++, to += 5, from += 8)
		memcpy(to, from, 5 * sizeof(unsigned short));
L
Linus Torvalds 已提交
504 505
}

506
int dump_fpu(struct pt_regs *regs, struct user_i387_struct *fpu)
L
Linus Torvalds 已提交
507 508 509 510 511
{
	int fpvalid;
	struct task_struct *tsk = current;

	fpvalid = !!used_math();
512 513 514 515
	if (fpvalid) {
		unlazy_fpu(tsk);
		if (cpu_has_fxsr) {
			copy_fpu_fxsave(tsk, fpu);
L
Linus Torvalds 已提交
516
		} else {
517
			copy_fpu_fsave(tsk, fpu);
L
Linus Torvalds 已提交
518 519 520 521 522
		}
	}

	return fpvalid;
}
523
EXPORT_SYMBOL(dump_fpu);
L
Linus Torvalds 已提交
524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539

/*
 * Core dump: fill *fpu with tsk's FPU state in i387 layout.
 *
 * unlazy_fpu() is called only when tsk is the current task; the saved
 * image is then copied out by the FXSAVE or FSAVE helper.
 *
 * Returns 1 if *fpu was filled, 0 if tsk has not used math.
 */
int dump_task_fpu(struct task_struct *tsk, struct user_i387_struct *fpu)
{
	int fpvalid = !!tsk_used_math(tsk);

	if (!fpvalid)
		return fpvalid;

	if (tsk == current)
		unlazy_fpu(tsk);

	if (cpu_has_fxsr)
		copy_fpu_fxsave(tsk, fpu);
	else
		copy_fpu_fsave(tsk, fpu);

	return fpvalid;
}

540 541
int dump_task_extended_fpu(struct task_struct *tsk,
			   struct user_fxsr_struct *fpu)
L
Linus Torvalds 已提交
542 543 544 545 546 547 548 549 550 551
{
	int fpvalid = tsk_used_math(tsk) && cpu_has_fxsr;

	if (fpvalid) {
		if (tsk == current)
		       unlazy_fpu(tsk);
		memcpy(fpu, &tsk->thread.i387.fxsave, sizeof(*fpu));
	}
	return fpvalid;
}