dropbear: bn_fast_s_mp_sqr.c annotate

annotate bn_fast_s_mp_sqr.c @ 190:d8254fc979e9 libtommath-orig LTM_0.35

Initial import of libtommath 0.35

author	Matt Johnston <matt@ucc.asn.au>
date	Fri, 06 May 2005 08:59:30 +0000
parents	d29b64170cf0
children

rev	line source
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	1 #include <tommath.h>
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	2 #ifdef BN_FAST_S_MP_SQR_C
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	3 /* LibTomMath, multiple-precision integer library -- Tom St Denis
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	4 *
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	5 * LibTomMath is a library that provides multiple-precision
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	6 * integer arithmetic as well as number theoretic functionality.
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	7 *
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	8 * The library was designed directly after the MPI library by
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	9 * Michael Fromberger but has been written from scratch with
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	10 * additional optimizations in place.
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	11 *
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	12 * The library is free for all purposes without any express
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	13 * guarantee it works.
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	14 *
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	15 * Tom St Denis, [email protected], http://math.libtomcrypt.org
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	16 */
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	17
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	18 /* the gist of squaring...
190 d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	19 * you do like mult except the offset of the tmpx [one that
d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	20 * starts closer to zero] can't equal the offset of tmpy.
d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	21 * So basically you set up iy like before then you min it with
d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	22 * (ty-tx) so that it never happens. You double all those
d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	23 * you add in the inner loop
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	24
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	25 After that loop you do the squares and add them in.
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	26 */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	27
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	28 int fast_s_mp_sqr (mp_int * a, mp_int * b)
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	29 {
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	30 int olduse, res, pa, ix, iz;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	31 mp_digit W[MP_WARRAY], *tmpx;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	32 mp_word W1;
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	33
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	34 /* grow the destination as required */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	35 pa = a->used + a->used;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	36 if (b->alloc < pa) {
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	37 if ((res = mp_grow (b, pa)) != MP_OKAY) {
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	38 return res;
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	39 }
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	40 }
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	41
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	42 /* number of output digits to produce */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	43 W1 = 0;
190 d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	44 for (ix = 0; ix < pa; ix++) {
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	45 int tx, ty, iy;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	46 mp_word _W;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	47 mp_digit *tmpy;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	48
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	49 /* clear counter */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	50 _W = 0;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	51
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	52 /* get offsets into the two bignums */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	53 ty = MIN(a->used-1, ix);
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	54 tx = ix - ty;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	55
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	56 /* setup temp aliases */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	57 tmpx = a->dp + tx;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	58 tmpy = a->dp + ty;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	59
190 d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	60 /* this is the number of times the loop will iterrate, essentially
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	61 while (tx++ < a->used && ty-- >= 0) { ... }
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	62 */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	63 iy = MIN(a->used-tx, ty+1);
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	64
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	65 /* now for squaring tx can never equal ty
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	66 * we halve the distance since they approach at a rate of 2x
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	67 * and we have to round because odd cases need to be executed
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	68 */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	69 iy = MIN(iy, (ty-tx+1)>>1);
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	70
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	71 /* execute loop */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	72 for (iz = 0; iz < iy; iz++) {
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	73 _W += ((mp_word)tmpx++)((mp_word)*tmpy--);
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	74 }
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	75
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	76 /* double the inner product and add carry */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	77 _W = _W + _W + W1;
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	78
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	79 /* even columns have the square term in them */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	80 if ((ix&1) == 0) {
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	81 _W += ((mp_word)a->dp[ix>>1])*((mp_word)a->dp[ix>>1]);
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	82 }
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	83
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	84 /* store it */
190 d8254fc979e9 Initial import of libtommath 0.35 Matt Johnston <matt@ucc.asn.au> parents: 142 diff changeset	85 W[ix] = (mp_digit)(_W & MP_MASK);
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	86
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	87 /* make next carry */
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	88 W1 = _W >> ((mp_word)DIGIT_BIT);
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	89 }
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	90
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	91 /* setup dest */
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	92 olduse = b->used;
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	93 b->used = a->used+a->used;
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	94
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	95 {
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	96 mp_digit *tmpb;
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	97 tmpb = b->dp;
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	98 for (ix = 0; ix < pa; ix++) {
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	99 *tmpb++ = W[ix] & MP_MASK;
d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	100 }
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	101
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	102 /* clear unused digits [that existed in the old copy of c] */
2 86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	103 for (; ix < olduse; ix++) {
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	104 *tmpb++ = 0;
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	105 }
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	106 }
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	107 mp_clamp (b);
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	108 return MP_OKAY;
86e0b50a9b58 ltm 0.30 orig import Matt Johnston <matt@ucc.asn.au> parents: diff changeset	109 }
142 d29b64170cf0 import of libtommath 0.32 Matt Johnston <matt@ucc.asn.au> parents: 2 diff changeset	110 #endif

Mercurial > dropbear

annotate bn_fast_s_mp_sqr.c @ 190:d8254fc979e9 libtommath-orig LTM_0.35