ieee754dp.c 5.3 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/* IEEE754 floating point arithmetic
 * double precision: common utilities
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 *
 * ########################################################################
 *
 *  This program is free software; you can distribute it and/or modify it
 *  under the terms of the GNU General Public License (Version 2) as
 *  published by the Free Software Foundation.
 *
 *  This program is distributed in the hope it will be useful, but WITHOUT
 *  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 *  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 *  for more details.
 *
 *  You should have received a copy of the GNU General Public License along
 *  with this program; if not, write to the Free Software Foundation, Inc.,
 *  59 Temple Place - Suite 330, Boston MA 02111-1307, USA.
 *
 * ########################################################################
 */

26
#include <stdarg.h>
27
#include <linux/compiler.h>
L
Linus Torvalds 已提交
28 29 30

#include "ieee754dp.h"

31
int ieee754dp_class(union ieee754dp x)
L
Linus Torvalds 已提交
32 33 34 35 36 37
{
	COMPXDP;
	EXPLODEXDP;
	return xc;
}

38
int ieee754dp_isnan(union ieee754dp x)
L
Linus Torvalds 已提交
39 40 41 42
{
	return ieee754dp_class(x) >= IEEE754_CLASS_SNAN;
}

43
static inline int ieee754dp_issnan(union ieee754dp x)
L
Linus Torvalds 已提交
44 45
{
	assert(ieee754dp_isnan(x));
46
	return ((DPMANT(x) & DP_MBIT(DP_FBITS-1)) == DP_MBIT(DP_FBITS-1));
L
Linus Torvalds 已提交
47 48 49
}


50
/*
 * Hand a double-precision result to the generic exception hook.
 *
 *  r   - the result computed so far
 *  op  - name of the operation, followed by its variadic operands
 *
 * When ieee754_tstx() reports nothing to do, r is returned untouched.
 * Otherwise an exception context is filled in (operation name, result
 * type IEEE754_RT_DP, result value and the variadic argument list) and
 * passed to ieee754_xcpt(); whatever the hook leaves in the context's
 * result slot is returned.
 */
union ieee754dp __cold ieee754dp_xcpt(union ieee754dp r, const char *op, ...)
{
	struct ieee754xctx ctx;

	if (ieee754_tstx()) {
		ctx.op = op;
		ctx.rt = IEEE754_RT_DP;
		ctx.rv.dp = r;

		va_start(ctx.ap, op);
		ieee754_xcpt(&ctx);
		va_end(ctx.ap);

		/* the hook may have replaced the result */
		r = ctx.rv.dp;
	}

	return r;
}

65
/*
 * Process a NaN result, raising Invalid Operation for signalling NaNs.
 *
 *  r   - the NaN result (asserted to be a NaN)
 *  op  - name of the operation, followed by its variadic operands
 *
 * A quiet NaN is returned unchanged.  For a signalling NaN the Invalid
 * Operation cause is recorded through ieee754_setandtestcx(); when that
 * returns zero (exception not enabled) the NaN is quietened in place and
 * returned, otherwise the generic exception hook ieee754_xcpt() is called
 * and the value it leaves in the context is returned.
 */
union ieee754dp __cold ieee754dp_nanxcpt(union ieee754dp r, const char *op, ...)
{
	struct ieee754xctx ax;

	assert(ieee754dp_isnan(r));

	if (!ieee754dp_issnan(r))	/* QNAN does not cause invalid op !! */
		return r;

	if (!ieee754_setandtestcx(IEEE754_INVALID_OPERATION)) {
		/* not enabled: convert to a quiet NaN by clearing the
		 * signalling bit
		 */
		DPMANT(r) &= (~DP_MBIT(DP_FBITS-1));

		/*
		 * Clearing that bit may leave a value that no longer
		 * classifies as a NaN; substitute the default NaN then.
		 */
		if (ieee754dp_isnan(r))
			return r;
		else
			return ieee754dp_indef();
	}

	ax.op = op;
	/*
	 * The payload is stored in rv.dp, so tag it as double precision,
	 * exactly as ieee754dp_xcpt() does (this used to be a bare 0).
	 */
	ax.rt = IEEE754_RT_DP;
	ax.rv.dp = r;
	va_start(ax.ap, op);
	ieee754_xcpt(&ax);
	va_end(ax.ap);
	return ax.rv.dp;
}

/*
 * Apply the rounding increment for the current rounding mode.
 *
 *  sn - sign of the value; non-zero means negative
 *  xm - significand with 3 extra low-order (guard/round/sticky) bits
 *
 * Returns xm with the increment selected by ieee754_csr.rm added in.
 * The 3 low bits are NOT cleared here; the caller shifts them out.
 * A value whose low 3 bits are all zero is exact and comes back unchanged.
 */
static u64 get_rounding(int sn, u64 xm)
{
	/* exact: nothing to round */
	if ((xm & (DP_MBIT(3) - 1)) == 0)
		return xm;

	switch (ieee754_csr.rm) {
	case IEEE754_RN:
		/*
		 * Round to nearest, ties to even: add 0x4 when the result's
		 * least-significant bit (bit 3) is set, 0x3 otherwise.
		 */
		xm += ((xm >> 3) & 1) ? 0x4 : 0x3;
		break;
	case IEEE754_RU:	/* toward +Infinity: bump positives only */
		xm += sn ? 0 : 0x8;
		break;
	case IEEE754_RD:	/* toward -Infinity: bump negatives only */
		xm += sn ? 0x8 : 0;
		break;
	case IEEE754_RZ:	/* toward zero: truncate */
		break;
	}

	return xm;
}


/* generate a normal/denormal number with over,under handling
 * sn is sign
 * xe is an unbiased exponent
 * xm is 3bit extended precision value.
 */
123
union ieee754dp ieee754dp_format(int sn, int xe, u64 xm)
L
Linus Torvalds 已提交
124 125 126
{
	assert(xm);		/* we don't gen exact zeros (probably should) */

127
	assert((xm >> (DP_FBITS + 1 + 3)) == 0);	/* no execess */
L
Linus Torvalds 已提交
128 129 130 131 132 133 134
	assert(xm & (DP_HIDDEN_BIT << 3));

	if (xe < DP_EMIN) {
		/* strip lower bits */
		int es = DP_EMIN - xe;

		if (ieee754_csr.nod) {
135 136
			ieee754_setcx(IEEE754_UNDERFLOW);
			ieee754_setcx(IEEE754_INEXACT);
L
Linus Torvalds 已提交
137 138 139 140 141 142

			switch(ieee754_csr.rm) {
			case IEEE754_RN:
			case IEEE754_RZ:
				return ieee754dp_zero(sn);
			case IEEE754_RU:    /* toward +Infinity */
143
				if (sn == 0)
L
Linus Torvalds 已提交
144 145 146 147
					return ieee754dp_min(0);
				else
					return ieee754dp_zero(1);
			case IEEE754_RD:    /* toward -Infinity */
148
				if (sn == 0)
L
Linus Torvalds 已提交
149 150 151 152 153 154 155
					return ieee754dp_zero(0);
				else
					return ieee754dp_min(1);
			}
		}

		if (xe == DP_EMIN - 1
156
				&& get_rounding(sn, xm) >> (DP_FBITS + 1 + 3))
L
Linus Torvalds 已提交
157 158
		{
			/* Not tiny after rounding */
159
			ieee754_setcx(IEEE754_INEXACT);
L
Linus Torvalds 已提交
160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175
			xm = get_rounding(sn, xm);
			xm >>= 1;
			/* Clear grs bits */
			xm &= ~(DP_MBIT(3) - 1);
			xe++;
		}
		else {
			/* sticky right shift es bits
			 */
			xm = XDPSRS(xm, es);
			xe += es;
			assert((xm & (DP_HIDDEN_BIT << 3)) == 0);
			assert(xe == DP_EMIN);
		}
	}
	if (xm & (DP_MBIT(3) - 1)) {
176
		ieee754_setcx(IEEE754_INEXACT);
L
Linus Torvalds 已提交
177
		if ((xm & (DP_HIDDEN_BIT << 3)) == 0) {
178
			ieee754_setcx(IEEE754_UNDERFLOW);
L
Linus Torvalds 已提交
179 180 181 182 183 184 185
		}

		/* inexact must round of 3 bits
		 */
		xm = get_rounding(sn, xm);
		/* adjust exponent for rounding add overflowing
		 */
186
		if (xm >> (DP_FBITS + 3 + 1)) {
L
Linus Torvalds 已提交
187 188 189 190 191 192 193 194
			/* add causes mantissa overflow */
			xm >>= 1;
			xe++;
		}
	}
	/* strip grs bits */
	xm >>= 3;

195
	assert((xm >> (DP_FBITS + 1)) == 0);	/* no execess */
L
Linus Torvalds 已提交
196 197 198
	assert(xe >= DP_EMIN);

	if (xe > DP_EMAX) {
199 200
		ieee754_setcx(IEEE754_OVERFLOW);
		ieee754_setcx(IEEE754_INEXACT);
L
Linus Torvalds 已提交
201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224
		/* -O can be table indexed by (rm,sn) */
		switch (ieee754_csr.rm) {
		case IEEE754_RN:
			return ieee754dp_inf(sn);
		case IEEE754_RZ:
			return ieee754dp_max(sn);
		case IEEE754_RU:	/* toward +Infinity */
			if (sn == 0)
				return ieee754dp_inf(0);
			else
				return ieee754dp_max(1);
		case IEEE754_RD:	/* toward -Infinity */
			if (sn == 0)
				return ieee754dp_max(0);
			else
				return ieee754dp_inf(1);
		}
	}
	/* gen norm/denorm/zero */

	if ((xm & DP_HIDDEN_BIT) == 0) {
		/* we underflow (tiny/zero) */
		assert(xe == DP_EMIN);
		if (ieee754_csr.mx & IEEE754_UNDERFLOW)
225
			ieee754_setcx(IEEE754_UNDERFLOW);
L
Linus Torvalds 已提交
226 227
		return builddp(sn, DP_EMIN - 1 + DP_EBIAS, xm);
	} else {
228
		assert((xm >> (DP_FBITS + 1)) == 0);	/* no execess */
L
Linus Torvalds 已提交
229 230 231 232 233
		assert(xm & DP_HIDDEN_BIT);

		return builddp(sn, xe + DP_EBIAS, xm & ~DP_HIDDEN_BIT);
	}
}