floatscan.c 9.1 KB
Newer Older
1 2 3 4 5
#include <stdint.h>
#include <stdio.h>
#include <math.h>
#include <float.h>
#include <limits.h>
#include <errno.h>
#include <ctype.h>

#include "shgetc.h"
#include "floatscan.h"

/*
 * Sizing of the decimal digit buffer used by decfloat(), selected by the
 * long double format.  The buffer holds the number in base 1000000000
 * ("B1B"), i.e. nine decimal digits per uint32_t element.
 *
 * LD_B1B_DIG  number of B1B digits compared against the threshold table
 *             and assembled into the result mantissa.
 * LD_B1B_MAX  initializer list for that threshold table, most significant
 *             B1B digit first: 9007199254740991 is 2^53-1 and
 *             18446744073709551615 is 2^64-1.
 * KMAX        number of elements in the digit buffer.
 */
#if LDBL_MANT_DIG == 53 && LDBL_MAX_EXP == 1024

#define LD_B1B_DIG 2
#define LD_B1B_MAX 9007199, 254740991
#define KMAX 128

#else /* LDBL_MANT_DIG == 64 && LDBL_MAX_EXP == 16384 */

#define LD_B1B_DIG 3
#define LD_B1B_MAX 18, 446744073, 709551615
#define KMAX 2048

#endif

/* Index mask for treating the digit buffer as circular (KMAX is a power of two) */
#define MASK (KMAX-1)

27 28
/*
 * Token pasting with macro expansion: CONCAT(x,y) expands its arguments
 * before handing them to CONCAT2, which does the actual ## paste.
 * Used in this file to build a hex float literal from 0x1p and
 * LDBL_MANT_DIG.
 */
#define CONCAT2(x,y) x ## y
#define CONCAT(x,y) CONCAT2(x,y)
29

30
/*
 * Read an optionally signed decimal exponent from f.
 *
 * Returns the exponent value, or LLONG_MIN if no digit follows the
 * (optional) sign.  In the failure case the offending character is
 * pushed back; if a sign had been consumed and pok is nonzero, one
 * additional character is pushed back as well.
 *
 * Very long digit strings do not overflow: accumulation stops once the
 * value is close to the limit of long long and the remaining digits are
 * consumed and ignored.
 */
static long long scanexp(FILE *f, int pok)
{
	int c;
	int x;
	long long y;
	int neg = 0;

	c = shgetc(f);
	if (c=='+' || c=='-') {
		neg = (c=='-');
		c = shgetc(f);
		if (c-'0'>=10U && pok) shunget(f);
	}
	if (c-'0'>=10U) {
		shunget(f);
		return LLONG_MIN;
	}
	/* Accumulate in int while it is cheap to do so.  The digit value is
	 * parenthesized so that the intermediate sum never exceeds INT_MAX:
	 * 10*x + c (with c as a character code) could overflow before the
	 * subtraction of '0' brought it back into range. */
	for (x=0; c-'0'<10U && x<INT_MAX/10; c = shgetc(f))
		x = 10*x + (c-'0');
	/* Continue in long long for larger exponents */
	for (y=x; c-'0'<10U && y<LLONG_MAX/100; c = shgetc(f))
		y = 10*y + (c-'0');
	/* Swallow any remaining digits; the value is already out of range */
	for (; c-'0'<10U; c = shgetc(f));
	shunget(f);
	return neg ? -y : y;
}


57
static long double decfloat(FILE *f, int c, int bits, int emin, int sign, int pok)
58 59 60 61
{
	uint32_t x[KMAX];
	static const uint32_t th[] = { LD_B1B_MAX };
	int i, j, k, a, z;
62
	long long lrp=0, dc=0;
63
	long long e10=0;
64
	int lnz = 0;
65
	int gotdig = 0, gotrad = 0;
66 67
	int rp;
	int e2;
68 69
	int emax = -emin-bits+3;
	int denormal = 0;
70 71 72
	long double y;
	long double frac=0;
	long double bias=0;
73 74
	static const int p10s[] = { 10, 100, 1000, 10000,
		100000, 1000000, 10000000, 100000000 };
75 76 77 78 79

	j=0;
	k=0;

	/* Don't let leading zeros consume buffer space */
80
	for (; c=='0'; c = shgetc(f)) gotdig=1;
81 82 83 84
	if (c=='.') {
		gotrad = 1;
		for (c = shgetc(f); c=='0'; c = shgetc(f)) gotdig=1, lrp--;
	}
85 86

	x[0] = 0;
87
	for (; c-'0'<10U || c=='.'; c = shgetc(f)) {
88
		if (c == '.') {
89 90
			if (gotrad) break;
			gotrad = 1;
91
			lrp = dc;
92
		} else if (k < KMAX-3) {
93
			dc++;
94
			if (c!='0') lnz = dc;
95 96 97 98 99 100 101 102 103
			if (j) x[k] = x[k]*10 + c-'0';
			else x[k] = c-'0';
			if (++j==9) {
				k++;
				j=0;
			}
			gotdig=1;
		} else {
			dc++;
104
			if (c!='0') x[KMAX-4] |= 1;
105 106
		}
	}
107
	if (!gotrad) lrp=dc;
108 109

	if (gotdig && (c|32)=='e') {
110
		e10 = scanexp(f, pok);
111
		if (e10 == LLONG_MIN) {
112 113 114 115
			if (pok) {
				shunget(f);
			} else {
				shlim(f, 0);
116 117 118 119 120 121
				return 0;
			}
			e10 = 0;
		}
		lrp += e10;
	} else if (c>=0) {
122
		shunget(f);
123 124
	}
	if (!gotdig) {
125
		errno = EINVAL;
126
		shlim(f, 0);
127 128 129
		return 0;
	}

130 131 132 133 134
	/* Handle zero specially to avoid nasty special cases later */
	if (!x[0]) return sign * 0.0;

	/* Optimize small integers (w/no exponent) and over/under-flow */
	if (lrp==dc && dc<10 && (bits>30 || x[0]>>bits==0))
135
		return sign * (long double)x[0];
136 137
	if (lrp > -emin/2) {
		errno = ERANGE;
138
		return sign * LDBL_MAX * LDBL_MAX;
139 140 141
	}
	if (lrp < emin-2*LDBL_MANT_DIG) {
		errno = ERANGE;
142
		return sign * LDBL_MIN * LDBL_MIN;
143
	}
144

145
	/* Align incomplete final B1B digit */
146
	if (j) {
147 148 149 150 151 152 153 154 155 156
		for (; j<9; j++) x[k]*=10;
		k++;
		j=0;
	}

	a = 0;
	z = k;
	e2 = 0;
	rp = lrp;

157 158 159 160 161 162 163 164 165 166
	/* Optimize small to mid-size integers (even in exp. notation) */
	if (lnz<9 && lnz<=rp && rp < 18) {
		if (rp == 9) return sign * (long double)x[0];
		if (rp < 9) return sign * (long double)x[0] / p10s[8-rp];
		int bitlim = bits-3*(int)(rp-9);
		if (bitlim>30 || x[0]>>bitlim==0)
			return sign * (long double)x[0] * p10s[rp-10];
	}

	/* Align radix point to B1B digit boundary */
167
	if (rp % 9) {
168
		int rpm9 = rp>=0 ? rp%9 : rp%9+9;
169
		int p10 = p10s[8-rpm9];
170
		uint32_t carry = 0;
171
		for (k=a; k!=z; k++) {
172 173 174 175 176 177 178 179
			uint32_t tmp = x[k] % p10;
			x[k] = x[k]/p10 + carry;
			carry = 1000000000/p10 * tmp;
			if (k==a && !x[k]) {
				a = (a+1 & MASK);
				rp -= 9;
			}
		}
180
		if (carry) x[z++] = carry;
181 182 183
		rp += 9-rpm9;
	}

184
	/* Upscale until desired number of bits are left of radix point */
185
	while (rp < 9*LD_B1B_DIG || (rp == 9*LD_B1B_DIG && x[a]<th[0])) {
186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201
		uint32_t carry = 0;
		e2 -= 29;
		for (k=(z-1 & MASK); ; k=(k-1 & MASK)) {
			uint64_t tmp = ((uint64_t)x[k] << 29) + carry;
			if (tmp > 1000000000) {
				carry = tmp / 1000000000;
				x[k] = tmp % 1000000000;
			} else {
				carry = 0;
				x[k] = tmp;
			}
			if (k==(z-1 & MASK) && k!=a && !x[k]) z = k;
			if (k==a) break;
		}
		if (carry) {
			rp += 9;
202
			a = (a-1 & MASK);
203 204 205 206 207 208 209 210
			if (a == z) {
				z = (z-1 & MASK);
				x[z-1 & MASK] |= x[z];
			}
			x[a] = carry;
		}
	}

211
	/* Downscale until exactly number of bits are left of radix point */
212 213 214 215 216 217 218 219 220 221 222 223 224 225 226
	for (;;) {
		uint32_t carry = 0;
		int sh = 1;
		for (i=0; i<LD_B1B_DIG; i++) {
			k = (a+i & MASK);
			if (k == z || x[k] < th[i]) {
				i=LD_B1B_DIG;
				break;
			}
			if (x[a+i & MASK] > th[i]) break;
		}
		if (i==LD_B1B_DIG && rp==9*LD_B1B_DIG) break;
		/* FIXME: find a way to compute optimal sh */
		if (rp > 9+9*LD_B1B_DIG) sh = 9;
		e2 += sh;
227
		for (k=a; k!=z; k=(k+1 & MASK)) {
228 229 230 231 232
			uint32_t tmp = x[k] & (1<<sh)-1;
			x[k] = (x[k]>>sh) + carry;
			carry = (1000000000>>sh) * tmp;
			if (k==a && !x[k]) {
				a = (a+1 & MASK);
233
				i--;
234 235 236
				rp -= 9;
			}
		}
237
		if (carry) {
238 239 240 241 242 243 244
			if ((z+1 & MASK) != a) {
				x[z] = carry;
				z = (z+1 & MASK);
			} else x[z-1 & MASK] |= 1;
		}
	}

245
	/* Assemble desired bits into floating point variable */
246
	for (y=i=0; i<LD_B1B_DIG; i++) {
247
		if ((a+i & MASK)==z) x[(z=(z+1 & MASK))-1] = 0;
248
		y = 1000000000.0L * y + x[a+i & MASK];
249
	}
250 251 252

	y *= sign;

253
	/* Limit precision for denormal results */
254 255 256
	if (bits > LDBL_MANT_DIG+e2-emin) {
		bits = LDBL_MANT_DIG+e2-emin;
		if (bits<0) bits=0;
257
		denormal = 1;
258 259
	}

260
	/* Calculate bias term to force rounding, move out lower bits */
261 262 263 264 265 266 267
	if (bits < LDBL_MANT_DIG) {
		bias = copysignl(scalbn(1, 2*LDBL_MANT_DIG-bits-1), y);
		frac = fmodl(y, scalbn(1, LDBL_MANT_DIG-bits));
		y -= frac;
		y += bias;
	}

268
	/* Process tail of decimal input so it can affect rounding */
269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287
	if ((a+i & MASK) != z) {
		uint32_t t = x[a+i & MASK];
		if (t < 500000000 && (t || (a+i+1 & MASK) != z))
			frac += 0.25*sign;
		else if (t > 500000000)
			frac += 0.75*sign;
		else if (t == 500000000) {
			if ((a+i+1 & MASK) == z)
				frac += 0.5*sign;
			else
				frac += 0.75*sign;
		}
		if (LDBL_MANT_DIG-bits >= 2 && !fmodl(frac, 1))
			frac++;
	}

	y += frac;
	y -= bias;

288 289 290 291 292 293 294 295 296 297
	if ((e2+LDBL_MANT_DIG & INT_MAX) > emax-5) {
		if (fabs(y) >= CONCAT(0x1p, LDBL_MANT_DIG)) {
			if (denormal && bits==LDBL_MANT_DIG+e2-emin)
				denormal = 0;
			y *= 0.5;
			e2++;
		}
		if (e2+LDBL_MANT_DIG>emax || (denormal && frac))
			errno = ERANGE;
	}
298

299
	return scalbnl(y, e2);
300 301
}

302
/*
 * Convert a hexadecimal floating-point string to long double.  The
 * caller has already consumed the "0x" prefix.
 *
 * f     input stream, read through shgetc()/shunget()
 * bits  number of mantissa bits of the target type
 * emin  minimum exponent of the target type minus bits, as computed
 *       by __floatscan()
 * sign  +1 or -1, multiplied into the result
 * pok   nonzero if extra characters may be pushed back when the
 *       mantissa or the exponent turns out to be missing
 *
 * The first eight significant hex digits go into a 32-bit integer, later
 * digits into a long double fraction, and any nonzero digit beyond the
 * long double precision contributes a single sticky half-unit.
 * errno is set to ERANGE on overflow, underflow, or a zero result from a
 * nonzero mantissa.
 */
static long double hexfloat(FILE *f, int bits, int emin, int sign, int pok)
{
	uint32_t head = 0;
	long double tail = 0;
	long double weight = 1;
	long double bias = 0;
	long double result;
	int sticky_seen = 0, seen_point = 0, seen_digit = 0;
	long long point_pos = 0;
	long long ndigits = 0;
	long long exp2 = 0;
	long long avail;
	int digit;
	int ch;

	ch = shgetc(f);

	/* Skip leading zeros */
	while (ch=='0') {
		seen_digit = 1;
		ch = shgetc(f);
	}

	if (ch=='.') {
		seen_point = 1;
		ch = shgetc(f);
		/* Count zeros after the radix point before significand */
		point_pos = 0;
		while (ch=='0') {
			seen_digit = 1;
			ch = shgetc(f);
			point_pos--;
		}
	}

	/* Significant digits, with at most one radix point among them */
	for (;;) {
		int is_dec = ch-'0'<10U;
		int is_hex = (ch|32)-'a'<6U;

		if (!is_dec && !is_hex && ch!='.') break;

		if (ch=='.') {
			if (seen_point) break;
			point_pos = ndigits;
			seen_point = 1;
		} else {
			seen_digit = 1;
			digit = (ch > '9') ? (ch|32)+10-'a' : ch-'0';
			if (ndigits<8) {
				head = head*16 + digit;
			} else if (ndigits < LDBL_MANT_DIG/4+1) {
				weight /= 16;
				tail += digit*weight;
			} else if (digit && !sticky_seen) {
				tail += 0.5*weight;
				sticky_seen = 1;
			}
			ndigits++;
		}
		ch = shgetc(f);
	}

	if (!seen_digit) {
		/* No mantissa at all: give back what was read */
		shunget(f);
		if (!pok) {
			shlim(f, 0);
		} else {
			shunget(f);
			if (seen_point) shunget(f);
		}
		return sign * 0.0;
	}

	if (!seen_point) point_pos = ndigits;

	/* Left-justify short mantissas to a full eight hex digits */
	for (; ndigits<8; ndigits++) head *= 16;

	if ((ch|32)!='p') {
		shunget(f);
	} else {
		exp2 = scanexp(f, pok);
		if (exp2 == LLONG_MIN) {
			if (!pok) {
				shlim(f, 0);
				return 0;
			}
			shunget(f);
			exp2 = 0;
		}
	}
	/* Four bits per hex digit before the point, minus the 32 bits in head */
	exp2 += 4*point_pos - 32;

	if (!head) return sign * 0.0;
	if (exp2 > -emin) {
		errno = ERANGE;
		return sign * LDBL_MAX * LDBL_MAX;
	}
	if (exp2 < emin-2*LDBL_MANT_DIG) {
		errno = ERANGE;
		return sign * LDBL_MIN * LDBL_MIN;
	}

	/* Normalize so the top bit of head is set, shifting bits in from tail */
	for (; head < 0x80000000; exp2--) {
		if (tail>=0.5) {
			head += head + 1;
			tail += tail - 1;
		} else {
			head += head;
			tail += tail;
		}
	}

	/* Reduce precision for results below the normal range */
	avail = 32+exp2-emin;
	if (bits > avail) {
		bits = avail;
		if (bits<0) bits=0;
	}

	if (bits < LDBL_MANT_DIG)
		bias = copysignl(scalbn(1, 32+LDBL_MANT_DIG-bits-1), sign);

	/* When rounding inside head, collapse a nonzero tail into its low bit */
	if (bits<32 && tail && !(head&1)) {
		head++;
		tail = 0;
	}

	/* Adding and then removing bias rounds to the requested precision */
	result = bias + sign*(long double)head + sign*tail;
	result -= bias;

	if (!result) errno = ERANGE;

	return scalbnl(result, exp2);
}

414
/*
 * Scan a floating-point number from f and return it as long double.
 *
 * prec  selects the target format whose precision and exponent range
 *       govern rounding: 0 = float, 1 = double, 2 = long double.
 *       Any other value returns 0 without reading.
 * pok   nonzero if more than one character may be pushed back when a
 *       longer candidate (e.g. "infin", "nan(", "1e+") fails to
 *       complete; in that case the longest valid prefix is accepted.
 *
 * Leading whitespace and an optional sign are skipped.  Accepted forms
 * are "inf"/"infinity", "nan" optionally followed by a parenthesized
 * sequence of letters, digits and underscores, hexadecimal floats
 * introduced by "0x", and decimal floats; matching of letters is
 * case-insensitive.
 *
 * On a malformed "inf"/"nan" prefix errno is set to EINVAL, shlim(f, 0)
 * is called and 0 is returned.
 */
long double __floatscan(FILE *f, int prec, int pok)
{
	int sign = 1;
	size_t i;
	int bits;
	int emin;
	int c;

	switch (prec) {
	case 0:
		bits = FLT_MANT_DIG;
		emin = FLT_MIN_EXP-bits;
		break;
	case 1:
		bits = DBL_MANT_DIG;
		emin = DBL_MIN_EXP-bits;
		break;
	case 2:
		bits = LDBL_MANT_DIG;
		emin = LDBL_MIN_EXP-bits;
		break;
	default:
		return 0;
	}

	while (isspace((c=shgetc(f))));

	if (c=='+' || c=='-') {
		sign -= 2*(c=='-');
		c = shgetc(f);
	}

	/* Match as much of "infinity" as possible; i is the match length */
	for (i=0; i<8 && (c|32)=="infinity"[i]; i++)
		if (i<7) c = shgetc(f);
	if (i==3 || i==8 || (i>3 && pok)) {
		if (i!=8) {
			/* Only "inf" counts: return the mismatching character
			 * and, when allowed, the partial "inity" match too */
			shunget(f);
			if (pok) for (; i>3; i--) shunget(f);
		}
		return sign * INFINITY;
	}
	if (!i) for (i=0; i<3 && (c|32)=="nan"[i]; i++)
		if (i<2) c = shgetc(f);
	if (i==3) {
		/* Optional "(n-char-sequence)" after "nan" */
		if (shgetc(f) != '(') {
			shunget(f);
			return NAN;
		}
		/* i counts the characters consumed after "nan", '(' included */
		for (i=1; ; i++) {
			c = shgetc(f);
			if (c-'0'<10U || c-'A'<26U || c-'a'<26U || c=='_')
				continue;
			if (c==')') return NAN;
			/* Invalid sequence: give back the offending character */
			shunget(f);
			if (!pok) {
				errno = EINVAL;
				shlim(f, 0);
				return 0;
			}
			/* Fall back to plain "nan" by returning the rest */
			while (i--) shunget(f);
			return NAN;
		}
	}

	if (i) {
		/* Partial "in"/"n"/"na" match is not a number */
		shunget(f);
		errno = EINVAL;
		shlim(f, 0);
		return 0;
	}

	if (c=='0') {
		c = shgetc(f);
		if ((c|32) == 'x')
			return hexfloat(f, bits, emin, sign, pok);
		shunget(f);
		c = '0';
	}

	return decfloat(f, c, bits, emin, sign, pok);
}