/* crypto/bn/bn_exp.c */
/* Copyright (C) 1995-1998 Eric Young (eay@cryptsoft.com)
 * All rights reserved.
 *
 * This package is an SSL implementation written
 * by Eric Young (eay@cryptsoft.com).
 * The implementation was written so as to conform with Netscapes SSL.
 * 
 * This library is free for commercial and non-commercial use as long as
 * the following conditions are aheared to.  The following conditions
 * apply to all code found in this distribution, be it the RC4, RSA,
 * lhash, DES, etc., code; not just the SSL code.  The SSL documentation
 * included with this distribution is covered by the same copyright terms
 * except that the holder is Tim Hudson (tjh@cryptsoft.com).
 * 
 * Copyright remains Eric Young's, and as such any Copyright notices in
 * the code are not to be removed.
 * If this package is used in a product, Eric Young should be given attribution
 * as the author of the parts of the library used.
 * This can be in the form of a textual message at program startup or
 * in documentation (online or textual) provided with the package.
 * 
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. All advertising materials mentioning features or use of this software
 *    must display the following acknowledgement:
 *    "This product includes cryptographic software written by
 *     Eric Young (eay@cryptsoft.com)"
 *    The word 'cryptographic' can be left out if the rouines from the library
 *    being used are not cryptographic related :-).
 * 4. If you include any Windows specific code (or a derivative thereof) from 
 *    the apps directory (application code) you must include an acknowledgement:
 *    "This product includes software written by Tim Hudson (tjh@cryptsoft.com)"
 * 
 * THIS SOFTWARE IS PROVIDED BY ERIC YOUNG ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 * 
 * The licence and distribution terms for any publically available version or
 * derivative of this code cannot be changed.  i.e. this code cannot simply be
 * copied and put under another distribution licence
 * [including the GNU Public Licence.]
 */
/* ====================================================================
 * Copyright (c) 1998-2000 The OpenSSL Project.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer. 
 *
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in
 *    the documentation and/or other materials provided with the
 *    distribution.
 *
 * 3. All advertising materials mentioning features or use of this
 *    software must display the following acknowledgment:
 *    "This product includes software developed by the OpenSSL Project
 *    for use in the OpenSSL Toolkit. (http://www.openssl.org/)"
 *
 * 4. The names "OpenSSL Toolkit" and "OpenSSL Project" must not be used to
 *    endorse or promote products derived from this software without
 *    prior written permission. For written permission, please contact
 *    openssl-core@openssl.org.
 *
 * 5. Products derived from this software may not be called "OpenSSL"
 *    nor may "OpenSSL" appear in their names without prior written
 *    permission of the OpenSSL Project.
 *
 * 6. Redistributions of any form whatsoever must retain the following
 *    acknowledgment:
 *    "This product includes software developed by the OpenSSL Project
 *    for use in the OpenSSL Toolkit (http://www.openssl.org/)"
 *
 * THIS SOFTWARE IS PROVIDED BY THE OpenSSL PROJECT ``AS IS'' AND ANY
 * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE OpenSSL PROJECT OR
 * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
 * OF THE POSSIBILITY OF SUCH DAMAGE.
 * ====================================================================
 *
 * This product includes cryptographic software written by Eric Young
 * (eay@cryptsoft.com).  This product includes software written by Tim
 * Hudson (tjh@cryptsoft.com).
 *
 */

112 113 114

#include "cryptlib.h"
#include "bn_lcl.h"
B
Bodo Möller 已提交
115

116
#define TABLE_SIZE	32
117

118
/* this one works - simple but works */
119
/* BN_exp - compute r = a^p without any modular reduction.
 *
 * Right-to-left binary method: v is squared once per exponent bit and
 * multiplied into the accumulator whenever that bit of p is set.
 *
 * r may be the same object as a or p; in that case the result is built
 * in a temporary taken from ctx and copied into r only after the whole
 * computation has succeeded, so r is left untouched on failure.
 *
 * Returns 1 on success, 0 on error.
 */
int BN_exp(BIGNUM *r, const BIGNUM *a, const BIGNUM *p, BN_CTX *ctx)
	{
	int i,bits,ret=0;
	BIGNUM *v,*rr;

	BN_CTX_start(ctx);
	if ((r == a) || (r == p))
		rr = BN_CTX_get(ctx);
	else
		rr = r;
	v = BN_CTX_get(ctx);
	/* Check both temporaries before use: the cleanup path must never
	 * see a NULL accumulator. */
	if (rr == NULL || v == NULL) goto err;

	if (BN_copy(v,a) == NULL) goto err;
	bits=BN_num_bits(p);

	/* Bit 0 of the exponent decides the initial accumulator value. */
	if (BN_is_odd(p))
		{ if (BN_copy(rr,a) == NULL) goto err; }
	else	{ if (!BN_one(rr)) goto err; }

	for (i=1; i<bits; i++)
		{
		if (!BN_sqr(v,v,ctx)) goto err;
		if (BN_is_bit_set(p,i))
			{
			if (!BN_mul(rr,rr,v,ctx)) goto err;
			}
		}

	/* Publish the result only on success, and fail if the copy fails. */
	if (r != rr && BN_copy(r,rr) == NULL) goto err;
	ret=1;
err:
	BN_CTX_end(ctx);
	return(ret);
	}

B
Bodo Möller 已提交
153

154
int BN_mod_exp(BIGNUM *r, const BIGNUM *a, const BIGNUM *p, const BIGNUM *m,
155
	       BN_CTX *ctx)
156 157 158
	{
	int ret;

159 160 161 162
	bn_check_top(a);
	bn_check_top(p);
	bn_check_top(m);

B
Bodo Möller 已提交
163 164 165 166 167 168 169 170 171
	/* For even modulus  m = 2^k*m_odd,  it might make sense to compute
	 * a^p mod m_odd  and  a^p mod 2^k  separately (with Montgomery
	 * exponentiation for the odd part), using appropriate exponent
	 * reductions, and combine the results using the CRT.
	 *
	 * For now, we use Montgomery only if the modulus is odd; otherwise,
	 * exponentiation using the reciprocal-based quick remaindering
	 * algorithm is used.
	 *
B
Bodo Möller 已提交
172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190
	 * (Timing obtained with expspeed.c [computations  a^p mod m
	 * where  a, p, m  are of the same length: 256, 512, 1024, 2048,
	 * 4096, 8192 bits], compared to the running time of the
	 * standard algorithm:
	 *
	 *   BN_mod_exp_mont   33 .. 40 %  [AMD K6-2, Linux, debug configuration]
         *                     55 .. 77 %  [UltraSparc processor, but
	 *                                  debug-solaris-sparcv8-gcc conf.]
	 * 
	 *   BN_mod_exp_recp   50 .. 70 %  [AMD K6-2, Linux, debug configuration]
	 *                     62 .. 118 % [UltraSparc, debug-solaris-sparcv8-gcc]
	 *
	 * On the Sparc, BN_mod_exp_recp was faster than BN_mod_exp_mont
	 * at 2048 and more bits, but at 512 and 1024 bits, it was
	 * slower even than the standard algorithm!
	 *
	 * "Real" timings [linux-elf, solaris-sparcv9-gcc configurations]
	 * should be obtained when the new Montgomery reduction code
	 * has been integrated into OpenSSL.)
B
Bodo Möller 已提交
191 192 193
	 */

#define MONT_MUL_MOD
194
#define MONT_EXP_WORD
B
Bodo Möller 已提交
195 196
#define RECP_MUL_MOD

197 198 199 200 201 202 203 204
#ifdef MONT_MUL_MOD
	/* I have finally been able to take out this pre-condition of
	 * the top bit being set.  It was caused by an error in BN_div
	 * with negatives.  There was also another problem when for a^b%m
	 * a >= m.  eay 07-May-97 */
/*	if ((m->d[m->top-1]&BN_TBIT) && BN_is_odd(m)) */

	if (BN_is_odd(m))
B
Bodo Möller 已提交
205
		{
206
#  ifdef MONT_EXP_WORD
B
Bodo Möller 已提交
207
		if (a->top == 1 && !a->neg)
B
Bodo Möller 已提交
208 209 210 211 212
			{
			BN_ULONG A = a->d[0];
			ret=BN_mod_exp_mont_word(r,A,p,m,ctx,NULL);
			}
		else
213
#  endif
B
Bodo Möller 已提交
214 215
			ret=BN_mod_exp_mont(r,a,p,m,ctx,NULL);
		}
216 217 218 219 220 221 222 223 224 225 226
	else
#endif
#ifdef RECP_MUL_MOD
		{ ret=BN_mod_exp_recp(r,a,p,m,ctx); }
#else
		{ ret=BN_mod_exp_simple(r,a,p,m,ctx); }
#endif

	return(ret);
	}

B
Bodo Möller 已提交
227

228 229
/* BN_mod_exp_recp - compute r = a^p mod m with sliding windows, using
 * BN_mod_mul_reciprocal for every modular multiplication.
 *
 * val[k] holds a^(2k+1) mod m; the exponent is scanned from its top bit
 * downwards, squaring once per bit and multiplying by the odd power
 * that matches each window.
 *
 * Returns 1 on success, 0 on error.
 */
int BN_mod_exp_recp(BIGNUM *r, const BIGNUM *a, const BIGNUM *p,
		    const BIGNUM *m, BN_CTX *ctx)
	{
	int i,j,bits,ret=0,wstart,wend,window,wvalue;
	int start=1,ts=0;
	BIGNUM *aa;
	BIGNUM val[TABLE_SIZE];
	BN_RECP_CTX recp;

	bits=BN_num_bits(p);

	if (bits == 0)
		{
		/* a^0 is 1, but the only residue modulo 1 is 0. */
		if (BN_is_one(m))
			ret = BN_zero(r);
		else
			ret = BN_one(r);
		return ret;
		}

	/* Must be initialised before the first 'goto err': the cleanup
	 * code unconditionally calls BN_RECP_CTX_free(&recp). */
	BN_RECP_CTX_init(&recp);

	BN_CTX_start(ctx);
	if ((aa = BN_CTX_get(ctx)) == NULL) goto err;

	if (BN_RECP_CTX_set(&recp,m,ctx) <= 0) goto err;

	BN_init(&(val[0]));
	ts=1;

	if (!BN_nnmod(&(val[0]),a,m,ctx)) goto err;		/* 1 */
	if (BN_is_zero(&(val[0])))
		{
		ret = BN_zero(r);
		goto err;
		}

	window = BN_window_bits_for_exponent_size(bits);
	if (window > 1)
		{
		if (!BN_mod_mul_reciprocal(aa,&(val[0]),&(val[0]),&recp,ctx))
			goto err;				/* 2 */
		j=1<<(window-1);
		for (i=1; i<j; i++)
			{
			BN_init(&val[i]);
			/* Count the entry as soon as it is initialised so
			 * it is released even if the multiplication
			 * below fails. */
			ts=i+1;
			if (!BN_mod_mul_reciprocal(&(val[i]),&(val[i-1]),aa,&recp,ctx))
				goto err;
			}
		}

	start=1;	/* This is used to avoid multiplication etc
			 * when there is only the value '1' in the
			 * buffer. */
	wvalue=0;	/* The 'value' of the window */
	wstart=bits-1;	/* The top bit of the window */
	wend=0;		/* The bottom bit of the window */

	if (!BN_one(r)) goto err;

	for (;;)
		{
		if (BN_is_bit_set(p,wstart) == 0)
			{
			/* A clear bit costs one squaring. */
			if (!start)
				{
				if (!BN_mod_mul_reciprocal(r,r,r,&recp,ctx))
					goto err;
				}
			if (wstart == 0) break;
			wstart--;
			continue;
			}
		/* We now have wstart on a 'set' bit, we now need to work out
		 * how big a window to do.  To do this we need to scan
		 * forward until the last set bit before the end of the
		 * window */
		wvalue=1;
		wend=0;
		for (i=1; i<window; i++)
			{
			if (wstart-i < 0) break;
			if (BN_is_bit_set(p,wstart-i))
				{
				wvalue<<=(i-wend);
				wvalue|=1;
				wend=i;
				}
			}

		/* wend+1 is the number of exponent bits in this window */
		j=wend+1;
		/* square once for every bit covered by the window */
		if (!start)
			for (i=0; i<j; i++)
				{
				if (!BN_mod_mul_reciprocal(r,r,r,&recp,ctx))
					goto err;
				}

		/* wvalue will be an odd number < 2^window */
		if (!BN_mod_mul_reciprocal(r,r,&(val[wvalue>>1]),&recp,ctx))
			goto err;

		/* move the 'window' down further */
		wstart-=wend+1;
		wvalue=0;
		start=0;
		if (wstart < 0) break;
		}
	ret=1;
err:
	BN_CTX_end(ctx);
	for (i=0; i<ts; i++)
		BN_clear_free(&(val[i]));
	BN_RECP_CTX_free(&recp);
	return(ret);
	}

B
Bodo Möller 已提交
343

344
/* BN_mod_exp_mont - compute rr = a^p mod m for odd m with sliding
 * windows, doing all multiplications in Montgomery form.
 *
 * in_mont may supply a Montgomery context for m; when it is NULL a
 * context is created here and released before returning.
 * val[k] holds a^(2k+1) in Montgomery form.
 *
 * Returns 1 on success, 0 on error (including an even or zero modulus).
 */
int BN_mod_exp_mont(BIGNUM *rr, const BIGNUM *a, const BIGNUM *p,
		    const BIGNUM *m, BN_CTX *ctx, BN_MONT_CTX *in_mont)
	{
	int i,j,bits,ret=0,wstart,wend,window,wvalue;
	int start=1,ts=0;
	BIGNUM *d,*r;
	const BIGNUM *aa;
	BIGNUM val[TABLE_SIZE];
	BN_MONT_CTX *mont=NULL;

	bn_check_top(a);
	bn_check_top(p);
	bn_check_top(m);

	/* BN_is_odd also rejects m == 0, so m->d is never read for an
	 * empty number. */
	if (!BN_is_odd(m))
		{
		BNerr(BN_F_BN_MOD_EXP_MONT,BN_R_CALLED_WITH_EVEN_MODULUS);
		return(0);
		}
	bits=BN_num_bits(p);
	if (bits == 0)
		{
		/* a^0 is 1, but the only residue modulo 1 is 0. */
		if (BN_is_one(m))
			ret = BN_zero(rr);
		else
			ret = BN_one(rr);
		return ret;
		}

	BN_CTX_start(ctx);
	d = BN_CTX_get(ctx);
	r = BN_CTX_get(ctx);
	if (d == NULL || r == NULL) goto err;

	if (in_mont != NULL)
		mont=in_mont;
	else
		{
		if ((mont=BN_MONT_CTX_new()) == NULL) goto err;
		if (!BN_MONT_CTX_set(mont,m,ctx)) goto err;
		}

	BN_init(&val[0]);
	ts=1;
	/* Reduce the base only when it is not already in [0, m). */
	if (a->neg || BN_ucmp(a,m) >= 0)
		{
		if (!BN_nnmod(&(val[0]),a,m,ctx))
			goto err;
		aa= &(val[0]);
		}
	else
		aa=a;
	if (BN_is_zero(aa))
		{
		ret = BN_zero(rr);
		goto err;
		}
	if (!BN_to_montgomery(&(val[0]),aa,mont,ctx)) goto err; /* 1 */

	window = BN_window_bits_for_exponent_size(bits);
	if (window > 1)
		{
		if (!BN_mod_mul_montgomery(d,&(val[0]),&(val[0]),mont,ctx)) goto err; /* 2 */
		j=1<<(window-1);
		for (i=1; i<j; i++)
			{
			BN_init(&(val[i]));
			/* Count the entry as soon as it is initialised so
			 * it is released even if the multiplication
			 * below fails. */
			ts=i+1;
			if (!BN_mod_mul_montgomery(&(val[i]),&(val[i-1]),d,mont,ctx))
				goto err;
			}
		}

	start=1;	/* This is used to avoid multiplication etc
			 * when there is only the value '1' in the
			 * buffer. */
	wvalue=0;	/* The 'value' of the window */
	wstart=bits-1;	/* The top bit of the window */
	wend=0;		/* The bottom bit of the window */

	if (!BN_to_montgomery(r,BN_value_one(),mont,ctx)) goto err;
	for (;;)
		{
		if (BN_is_bit_set(p,wstart) == 0)
			{
			/* A clear bit costs one squaring. */
			if (!start)
				{
				if (!BN_mod_mul_montgomery(r,r,r,mont,ctx))
					goto err;
				}
			if (wstart == 0) break;
			wstart--;
			continue;
			}
		/* We now have wstart on a 'set' bit, we now need to work out
		 * how big a window to do.  To do this we need to scan
		 * forward until the last set bit before the end of the
		 * window */
		wvalue=1;
		wend=0;
		for (i=1; i<window; i++)
			{
			if (wstart-i < 0) break;
			if (BN_is_bit_set(p,wstart-i))
				{
				wvalue<<=(i-wend);
				wvalue|=1;
				wend=i;
				}
			}

		/* wend+1 is the number of exponent bits in this window */
		j=wend+1;
		/* square once for every bit covered by the window */
		if (!start)
			for (i=0; i<j; i++)
				{
				if (!BN_mod_mul_montgomery(r,r,r,mont,ctx))
					goto err;
				}

		/* wvalue will be an odd number < 2^window */
		if (!BN_mod_mul_montgomery(r,r,&(val[wvalue>>1]),mont,ctx))
			goto err;

		/* move the 'window' down further */
		wstart-=wend+1;
		wvalue=0;
		start=0;
		if (wstart < 0) break;
		}
	if (!BN_from_montgomery(rr,r,mont,ctx)) goto err;
	ret=1;
err:
	/* Only free a context that was created in this call. */
	if ((in_mont == NULL) && (mont != NULL)) BN_MONT_CTX_free(mont);
	BN_CTX_end(ctx);
	for (i=0; i<ts; i++)
		BN_clear_free(&(val[i]));
	return(ret);
	}
B
Bodo Möller 已提交
485 486 487 488

/* BN_mod_exp_mont_word - compute rr = a^p mod m for a single-word base
 * a and an odd modulus m.
 *
 * The running result is kept as the product r*w: w is a plain machine
 * word that absorbs squarings and multiplications by a for as long as
 * they do not overflow, and r is a BIGNUM that takes over whenever w
 * would overflow.  While r_is_one is set, r has not been written yet.
 *
 * in_mont may supply a Montgomery context for m; when it is NULL a
 * context is created here and released before returning.
 *
 * Returns 1 on success, 0 on error (including an even or zero modulus).
 */
int BN_mod_exp_mont_word(BIGNUM *rr, BN_ULONG a, const BIGNUM *p,
                         const BIGNUM *m, BN_CTX *ctx, BN_MONT_CTX *in_mont)
	{
	BN_MONT_CTX *mont = NULL;
	int b, bits, ret=0;
	int r_is_one;
	BN_ULONG w, next_w;
	BIGNUM *r, *t;
	BIGNUM *swap_tmp;
#define BN_MOD_MUL_WORD(r, w, m) \
		(BN_mul_word(r, (w)) && \
		(/* BN_ucmp(r, (m)) < 0 ? 1 :*/  \
			(BN_mod(t, r, m, ctx) && (swap_tmp = r, r = t, t = swap_tmp, 1))))
		/* BN_MOD_MUL_WORD is only used with 'w' large,
		  * so the BN_ucmp test is probably more overhead
		  * than always using BN_mod (which uses BN_copy if
		  * a similar test returns true). */
#define BN_TO_MONTGOMERY_WORD(r, w, mont) \
		(BN_set_word(r, (w)) && BN_to_montgomery(r, r, (mont), ctx))

	bn_check_top(p);
	bn_check_top(m);

	if (m->top == 0 || !(m->d[0] & 1))
		{
		BNerr(BN_F_BN_MOD_EXP_MONT_WORD,BN_R_CALLED_WITH_EVEN_MODULUS);
		return(0);
		}
	if (m->top == 1)
		a %= m->d[0]; /* make sure that 'a' is reduced */

	bits = BN_num_bits(p);
	if (bits == 0)
		{
		/* a^0 is 1, but the only residue modulo 1 is 0. */
		if (BN_is_one(m))
			ret = BN_zero(rr);
		else
			ret = BN_one(rr);
		return ret;
		}
	if (a == 0)
		{
		ret = BN_zero(rr);
		return ret;
		}

	BN_CTX_start(ctx);
	r = BN_CTX_get(ctx);
	t = BN_CTX_get(ctx);
	if (r == NULL || t == NULL) goto err;

	if (in_mont != NULL)
		mont=in_mont;
	else
		{
		if ((mont = BN_MONT_CTX_new()) == NULL) goto err;
		if (!BN_MONT_CTX_set(mont, m, ctx)) goto err;
		}

	r_is_one = 1; /* except for Montgomery factor */

	/* bits-1 >= 0 */

	/* The result is accumulated in the product r*w. */
	w = a; /* bit 'bits-1' of 'p' is always set */
	for (b = bits-2; b >= 0; b--)
		{
		/* First, square r*w. */
		next_w = w*w;
		if ((next_w/w) != w) /* overflow */
			{
			/* Fold w into r before it is lost, then restart
			 * the word accumulator at 1. */
			if (r_is_one)
				{
				if (!BN_TO_MONTGOMERY_WORD(r, w, mont)) goto err;
				r_is_one = 0;
				}
			else
				{
				if (!BN_MOD_MUL_WORD(r, w, m)) goto err;
				}
			next_w = 1;
			}
		w = next_w;
		if (!r_is_one)
			{
			if (!BN_mod_mul_montgomery(r, r, r, mont, ctx)) goto err;
			}

		/* Second, multiply r*w by 'a' if exponent bit is set. */
		if (BN_is_bit_set(p, b))
			{
			next_w = w*a;
			if ((next_w/a) != w) /* overflow */
				{
				if (r_is_one)
					{
					if (!BN_TO_MONTGOMERY_WORD(r, w, mont)) goto err;
					r_is_one = 0;
					}
				else
					{
					if (!BN_MOD_MUL_WORD(r, w, m)) goto err;
					}
				next_w = a;
				}
			w = next_w;
			}
		}

	/* Finally, set r:=r*w. */
	if (w != 1)
		{
		if (r_is_one)
			{
			if (!BN_TO_MONTGOMERY_WORD(r, w, mont)) goto err;
			r_is_one = 0;
			}
		else
			{
			if (!BN_MOD_MUL_WORD(r, w, m)) goto err;
			}
		}

	if (r_is_one) /* can happen only if a == 1*/
		{
		if (!BN_one(rr)) goto err;
		}
	else
		{
		if (!BN_from_montgomery(rr, r, mont, ctx)) goto err;
		}
	ret = 1;
err:
	/* Only free a context that was created in this call. */
	if ((in_mont == NULL) && (mont != NULL)) BN_MONT_CTX_free(mont);
	BN_CTX_end(ctx);
	return(ret);
	}

622 623

/* The old fallback, simple version :-) */
624 625 626
/* BN_mod_exp_simple - compute r = a^p mod m with sliding windows, using
 * plain BN_mod_mul for every modular multiplication.
 *
 * val[k] holds a^(2k+1) mod m; the exponent is scanned from its top bit
 * downwards, squaring once per bit and multiplying by the odd power
 * that matches each window.
 *
 * Returns 1 on success, 0 on error.
 */
int BN_mod_exp_simple(BIGNUM *r,
	const BIGNUM *a, const BIGNUM *p, const BIGNUM *m,
	BN_CTX *ctx)
	{
	int i,j,bits,ret=0,wstart,wend,window,wvalue,ts=0;
	int start=1;
	BIGNUM *d;
	BIGNUM val[TABLE_SIZE];

	bits=BN_num_bits(p);

	if (bits == 0)
		{
		/* a^0 is 1, but the only residue modulo 1 is 0. */
		if (BN_is_one(m))
			ret = BN_zero(r);
		else
			ret = BN_one(r);
		return ret;
		}

	BN_CTX_start(ctx);
	if ((d = BN_CTX_get(ctx)) == NULL) goto err;

	BN_init(&(val[0]));
	ts=1;
	if (!BN_nnmod(&(val[0]),a,m,ctx)) goto err;		/* 1 */
	if (BN_is_zero(&(val[0])))
		{
		ret = BN_zero(r);
		goto err;
		}

	window = BN_window_bits_for_exponent_size(bits);
	if (window > 1)
		{
		if (!BN_mod_mul(d,&(val[0]),&(val[0]),m,ctx))
			goto err;				/* 2 */
		j=1<<(window-1);
		for (i=1; i<j; i++)
			{
			BN_init(&(val[i]));
			/* Count the entry as soon as it is initialised so
			 * it is released even if the multiplication
			 * below fails. */
			ts=i+1;
			if (!BN_mod_mul(&(val[i]),&(val[i-1]),d,m,ctx))
				goto err;
			}
		}

	start=1;	/* This is used to avoid multiplication etc
			 * when there is only the value '1' in the
			 * buffer. */
	wvalue=0;	/* The 'value' of the window */
	wstart=bits-1;	/* The top bit of the window */
	wend=0;		/* The bottom bit of the window */

	if (!BN_one(r)) goto err;

	for (;;)
		{
		if (BN_is_bit_set(p,wstart) == 0)
			{
			/* A clear bit costs one squaring. */
			if (!start)
				{
				if (!BN_mod_mul(r,r,r,m,ctx))
					goto err;
				}
			if (wstart == 0) break;
			wstart--;
			continue;
			}
		/* We now have wstart on a 'set' bit, we now need to work out
		 * how big a window to do.  To do this we need to scan
		 * forward until the last set bit before the end of the
		 * window */
		wvalue=1;
		wend=0;
		for (i=1; i<window; i++)
			{
			if (wstart-i < 0) break;
			if (BN_is_bit_set(p,wstart-i))
				{
				wvalue<<=(i-wend);
				wvalue|=1;
				wend=i;
				}
			}

		/* wend+1 is the number of exponent bits in this window */
		j=wend+1;
		/* square once for every bit covered by the window */
		if (!start)
			for (i=0; i<j; i++)
				{
				if (!BN_mod_mul(r,r,r,m,ctx))
					goto err;
				}

		/* wvalue will be an odd number < 2^window */
		if (!BN_mod_mul(r,r,&(val[wvalue>>1]),m,ctx))
			goto err;

		/* move the 'window' down further */
		wstart-=wend+1;
		wvalue=0;
		start=0;
		if (wstart < 0) break;
		}
	ret=1;
err:
	BN_CTX_end(ctx);
	for (i=0; i<ts; i++)
		BN_clear_free(&(val[i]));
	return(ret);
	}