1 /* crypto/bn/bn_nist.c */
2 /*
3 * Written by Nils Larsch for the OpenSSL project
4 */
5 /* ====================================================================
6 * Copyright (c) 1998-2005 The OpenSSL Project. All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 *
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 *
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in
17 * the documentation and/or other materials provided with the
18 * distribution.
19 *
20 * 3. All advertising materials mentioning features or use of this
21 * software must display the following acknowledgment:
22 * "This product includes software developed by the OpenSSL Project
23 * for use in the OpenSSL Toolkit. (http://www.openssl.org/)"
24 *
25 * 4. The names "OpenSSL Toolkit" and "OpenSSL Project" must not be used to
26 * endorse or promote products derived from this software without
27 * prior written permission. For written permission, please contact
28 * openssl-core@openssl.org.
29 *
30 * 5. Products derived from this software may not be called "OpenSSL"
31 * nor may "OpenSSL" appear in their names without prior written
32 * permission of the OpenSSL Project.
33 *
34 * 6. Redistributions of any form whatsoever must retain the following
35 * acknowledgment:
36 * "This product includes software developed by the OpenSSL Project
37 * for use in the OpenSSL Toolkit (http://www.openssl.org/)"
38 *
39 * THIS SOFTWARE IS PROVIDED BY THE OpenSSL PROJECT ``AS IS'' AND ANY
40 * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
41 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
42 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE OpenSSL PROJECT OR
43 * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
44 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
45 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
46 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
47 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
48 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
49 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
50 * OF THE POSSIBILITY OF SUCH DAMAGE.
51 * ====================================================================
52 *
53 * This product includes cryptographic software written by Eric Young
54 * (eay@cryptsoft.com). This product includes software written by Tim
55 * Hudson (tjh@cryptsoft.com).
56 *
57 */
58
59 #include "bn_lcl.h"
60 #include "cryptlib.h"
61
62
/*
 * Number of BN_ULONG words needed to hold a value of the given bit
 * length, i.e. the bit count divided by BN_BITS2 and rounded up.
 * Every expansion is wrapped in parentheses so that the macro keeps
 * its value when it appears as an operand of a larger expression
 * (for instance on the right-hand side of '/' or '%').
 */
#define BN_NIST_192_TOP	((192+BN_BITS2-1)/BN_BITS2)
#define BN_NIST_224_TOP	((224+BN_BITS2-1)/BN_BITS2)
#define BN_NIST_256_TOP	((256+BN_BITS2-1)/BN_BITS2)
#define BN_NIST_384_TOP	((384+BN_BITS2-1)/BN_BITS2)
#define BN_NIST_521_TOP	((521+BN_BITS2-1)/BN_BITS2)
68
/*
 * pre-computed tables are "carry-less" values of modulus*(i+1)
 *
 * Layout notes:
 *  - every array stores its value least significant word first;
 *  - row i of a two-dimensional _nist_p_NNN table is (i+1)*modulus cut
 *    down to BN_NIST_NNN_TOP words; the reduction routines index these
 *    tables with [carry-1] or [-carry-1], and row 0 doubles as the
 *    modulus itself;
 *  - each _nist_p_NNN_sqr array is the square of the modulus; the
 *    reduction routines compare their input against it and fall back
 *    to BN_nnmod() when the input is not smaller;
 *  - the two preprocessor branches hold the same numbers, split into
 *    64-bit and 32-bit words respectively.
 */
#if BN_BITS2 == 64
/* P-192 modulus: rows are 1*p, 2*p, 3*p */
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
	{0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFEULL,0xFFFFFFFFFFFFFFFFULL},
	{0xFFFFFFFFFFFFFFFEULL,0xFFFFFFFFFFFFFFFDULL,0xFFFFFFFFFFFFFFFFULL},
	{0xFFFFFFFFFFFFFFFDULL,0xFFFFFFFFFFFFFFFCULL,0xFFFFFFFFFFFFFFFFULL}
	};
/* square of the P-192 modulus */
static const BN_ULONG _nist_p_192_sqr[] = {
	0x0000000000000001ULL,0x0000000000000002ULL,0x0000000000000001ULL,
	0xFFFFFFFFFFFFFFFEULL,0xFFFFFFFFFFFFFFFDULL,0xFFFFFFFFFFFFFFFFULL
	};
/*
 * P-224 modulus: rows are 1*p, 2*p.  With 64-bit words the 224-bit
 * value only fills the lower half of the top word.
 */
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
	{0x0000000000000001ULL,0xFFFFFFFF00000000ULL,
	 0xFFFFFFFFFFFFFFFFULL,0x00000000FFFFFFFFULL},
	{0x0000000000000002ULL,0xFFFFFFFE00000000ULL,
	 0xFFFFFFFFFFFFFFFFULL,0x00000001FFFFFFFFULL} /* this one is "carry-full" */
	};
/* square of the P-224 modulus */
static const BN_ULONG _nist_p_224_sqr[] = {
	0x0000000000000001ULL,0xFFFFFFFE00000000ULL,
	0xFFFFFFFFFFFFFFFFULL,0x0000000200000000ULL,
	0x0000000000000000ULL,0xFFFFFFFFFFFFFFFEULL,
	0xFFFFFFFFFFFFFFFFULL
	};
/* P-256 modulus: rows are 1*p .. 5*p */
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
	{0xFFFFFFFFFFFFFFFFULL,0x00000000FFFFFFFFULL,
	 0x0000000000000000ULL,0xFFFFFFFF00000001ULL},
	{0xFFFFFFFFFFFFFFFEULL,0x00000001FFFFFFFFULL,
	 0x0000000000000000ULL,0xFFFFFFFE00000002ULL},
	{0xFFFFFFFFFFFFFFFDULL,0x00000002FFFFFFFFULL,
	 0x0000000000000000ULL,0xFFFFFFFD00000003ULL},
	{0xFFFFFFFFFFFFFFFCULL,0x00000003FFFFFFFFULL,
	 0x0000000000000000ULL,0xFFFFFFFC00000004ULL},
	{0xFFFFFFFFFFFFFFFBULL,0x00000004FFFFFFFFULL,
	 0x0000000000000000ULL,0xFFFFFFFB00000005ULL},
	};
/* square of the P-256 modulus */
static const BN_ULONG _nist_p_256_sqr[] = {
	0x0000000000000001ULL,0xFFFFFFFE00000000ULL,
	0xFFFFFFFFFFFFFFFFULL,0x00000001FFFFFFFEULL,
	0x00000001FFFFFFFEULL,0x00000001FFFFFFFEULL,
	0xFFFFFFFE00000001ULL,0xFFFFFFFE00000002ULL
	};
/* P-384 modulus: rows are 1*p .. 5*p */
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
	{0x00000000FFFFFFFFULL,0xFFFFFFFF00000000ULL,0xFFFFFFFFFFFFFFFEULL,
	 0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL},
	{0x00000001FFFFFFFEULL,0xFFFFFFFE00000000ULL,0xFFFFFFFFFFFFFFFDULL,
	 0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL},
	{0x00000002FFFFFFFDULL,0xFFFFFFFD00000000ULL,0xFFFFFFFFFFFFFFFCULL,
	 0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL},
	{0x00000003FFFFFFFCULL,0xFFFFFFFC00000000ULL,0xFFFFFFFFFFFFFFFBULL,
	 0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL},
	{0x00000004FFFFFFFBULL,0xFFFFFFFB00000000ULL,0xFFFFFFFFFFFFFFFAULL,
	 0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL},
	};
/* square of the P-384 modulus */
static const BN_ULONG _nist_p_384_sqr[] = {
	0xFFFFFFFE00000001ULL,0x0000000200000000ULL,0xFFFFFFFE00000000ULL,
	0x0000000200000000ULL,0x0000000000000001ULL,0x0000000000000000ULL,
	0x00000001FFFFFFFEULL,0xFFFFFFFE00000000ULL,0xFFFFFFFFFFFFFFFDULL,
	0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL
	};
/* P-521 modulus: a single value, no table of multiples */
static const BN_ULONG _nist_p_521[] =
	{0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,
	0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,
	0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,
	0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,
	0x00000000000001FFULL};
/* square of the P-521 modulus */
static const BN_ULONG _nist_p_521_sqr[] = {
	0x0000000000000001ULL,0x0000000000000000ULL,0x0000000000000000ULL,
	0x0000000000000000ULL,0x0000000000000000ULL,0x0000000000000000ULL,
	0x0000000000000000ULL,0x0000000000000000ULL,0xFFFFFFFFFFFFFC00ULL,
	0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,
	0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,0xFFFFFFFFFFFFFFFFULL,
	0xFFFFFFFFFFFFFFFFULL,0x000000000003FFFFULL
	};
#elif BN_BITS2 == 32
/* P-192 modulus: rows are 1*p, 2*p, 3*p */
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
	{0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFE,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	{0xFFFFFFFE,0xFFFFFFFF,0xFFFFFFFD,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	{0xFFFFFFFD,0xFFFFFFFF,0xFFFFFFFC,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF}
	};
/* square of the P-192 modulus */
static const BN_ULONG _nist_p_192_sqr[] = {
	0x00000001,0x00000000,0x00000002,0x00000000,0x00000001,0x00000000,
	0xFFFFFFFE,0xFFFFFFFF,0xFFFFFFFD,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF
	};
/* P-224 modulus: rows are 1*p, 2*p */
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
	{0x00000001,0x00000000,0x00000000,0xFFFFFFFF,
	 0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	{0x00000002,0x00000000,0x00000000,0xFFFFFFFE,
	 0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF}
	};
/* square of the P-224 modulus */
static const BN_ULONG _nist_p_224_sqr[] = {
	0x00000001,0x00000000,0x00000000,0xFFFFFFFE,
	0xFFFFFFFF,0xFFFFFFFF,0x00000000,0x00000002,
	0x00000000,0x00000000,0xFFFFFFFE,0xFFFFFFFF,
	0xFFFFFFFF,0xFFFFFFFF
	};
/* P-256 modulus: rows are 1*p .. 5*p */
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
	{0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0x00000000,
	 0x00000000,0x00000000,0x00000001,0xFFFFFFFF},
	{0xFFFFFFFE,0xFFFFFFFF,0xFFFFFFFF,0x00000001,
	 0x00000000,0x00000000,0x00000002,0xFFFFFFFE},
	{0xFFFFFFFD,0xFFFFFFFF,0xFFFFFFFF,0x00000002,
	 0x00000000,0x00000000,0x00000003,0xFFFFFFFD},
	{0xFFFFFFFC,0xFFFFFFFF,0xFFFFFFFF,0x00000003,
	 0x00000000,0x00000000,0x00000004,0xFFFFFFFC},
	{0xFFFFFFFB,0xFFFFFFFF,0xFFFFFFFF,0x00000004,
	 0x00000000,0x00000000,0x00000005,0xFFFFFFFB},
	};
/* square of the P-256 modulus */
static const BN_ULONG _nist_p_256_sqr[] = {
	0x00000001,0x00000000,0x00000000,0xFFFFFFFE,
	0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFE,0x00000001,
	0xFFFFFFFE,0x00000001,0xFFFFFFFE,0x00000001,
	0x00000001,0xFFFFFFFE,0x00000002,0xFFFFFFFE
	};
/* P-384 modulus: rows are 1*p .. 5*p */
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
	{0xFFFFFFFF,0x00000000,0x00000000,0xFFFFFFFF,0xFFFFFFFE,0xFFFFFFFF,
	 0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	{0xFFFFFFFE,0x00000001,0x00000000,0xFFFFFFFE,0xFFFFFFFD,0xFFFFFFFF,
	 0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	{0xFFFFFFFD,0x00000002,0x00000000,0xFFFFFFFD,0xFFFFFFFC,0xFFFFFFFF,
	 0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	{0xFFFFFFFC,0x00000003,0x00000000,0xFFFFFFFC,0xFFFFFFFB,0xFFFFFFFF,
	 0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	{0xFFFFFFFB,0x00000004,0x00000000,0xFFFFFFFB,0xFFFFFFFA,0xFFFFFFFF,
	 0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF},
	};
/* square of the P-384 modulus */
static const BN_ULONG _nist_p_384_sqr[] = {
	0x00000001,0xFFFFFFFE,0x00000000,0x00000002,0x00000000,0xFFFFFFFE,
	0x00000000,0x00000002,0x00000001,0x00000000,0x00000000,0x00000000,
	0xFFFFFFFE,0x00000001,0x00000000,0xFFFFFFFE,0xFFFFFFFD,0xFFFFFFFF,
	0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF
	};
/* P-521 modulus: a single value, no table of multiples */
static const BN_ULONG _nist_p_521[] = {0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,
	0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,
	0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,
	0xFFFFFFFF,0x000001FF};
/* square of the P-521 modulus */
static const BN_ULONG _nist_p_521_sqr[] = {
	0x00000001,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
	0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,
	0x00000000,0x00000000,0x00000000,0x00000000,0xFFFFFC00,0xFFFFFFFF,
	0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,
	0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,0xFFFFFFFF,
	0xFFFFFFFF,0xFFFFFFFF,0x0003FFFF
	};
#else
/* only 64-bit and 32-bit BN_ULONG words have tables */
#error "unsupported BN_BITS2"
#endif
215
216
/*
 * Static BIGNUM wrappers around the modulus tables above.  Each one
 * points at row 0 of its table (the modulus itself; _nist_p_521 is a
 * flat array), so the const qualifier of the table is cast away in the
 * first initializer.
 *
 * NOTE(review): the initializers are positional.  They presumably fill
 * the word pointer, the used word count, the allocated word count, the
 * sign and the flags, in that order -- confirm against the BIGNUM
 * declaration in the bn headers.
 */
static const BIGNUM _bignum_nist_p_192 =
	{
	(BN_ULONG *)_nist_p_192[0],
	BN_NIST_192_TOP,
	BN_NIST_192_TOP,
	0,
	BN_FLG_STATIC_DATA
	};

static const BIGNUM _bignum_nist_p_224 =
	{
	(BN_ULONG *)_nist_p_224[0],
	BN_NIST_224_TOP,
	BN_NIST_224_TOP,
	0,
	BN_FLG_STATIC_DATA
	};

static const BIGNUM _bignum_nist_p_256 =
	{
	(BN_ULONG *)_nist_p_256[0],
	BN_NIST_256_TOP,
	BN_NIST_256_TOP,
	0,
	BN_FLG_STATIC_DATA
	};

static const BIGNUM _bignum_nist_p_384 =
	{
	(BN_ULONG *)_nist_p_384[0],
	BN_NIST_384_TOP,
	BN_NIST_384_TOP,
	0,
	BN_FLG_STATIC_DATA
	};

static const BIGNUM _bignum_nist_p_521 =
	{
	(BN_ULONG *)_nist_p_521,
	BN_NIST_521_TOP,
	BN_NIST_521_TOP,
	0,
	BN_FLG_STATIC_DATA
	};
261
262
BN_get0_nist_prime_192(void)263 const BIGNUM *BN_get0_nist_prime_192(void)
264 {
265 return &_bignum_nist_p_192;
266 }
267
BN_get0_nist_prime_224(void)268 const BIGNUM *BN_get0_nist_prime_224(void)
269 {
270 return &_bignum_nist_p_224;
271 }
272
BN_get0_nist_prime_256(void)273 const BIGNUM *BN_get0_nist_prime_256(void)
274 {
275 return &_bignum_nist_p_256;
276 }
277
BN_get0_nist_prime_384(void)278 const BIGNUM *BN_get0_nist_prime_384(void)
279 {
280 return &_bignum_nist_p_384;
281 }
282
BN_get0_nist_prime_521(void)283 const BIGNUM *BN_get0_nist_prime_521(void)
284 {
285 return &_bignum_nist_p_521;
286 }
287
288
/*
 * Copy the first 'top' words of src into dst, then zero dst up to (but
 * not including) word 'max'.  Callers are expected to pass top <= max;
 * this is only checked in BN_DEBUG builds.
 */
static void nist_cp_bn_0(BN_ULONG *dst, const BN_ULONG *src, int top, int max)
{
    int idx = 0;

#ifdef BN_DEBUG
    OPENSSL_assert(top <= max);
#endif
    /* copied part */
    while (idx < top) {
        dst[idx] = src[idx];
        idx++;
    }
    /* zero padding */
    while (idx < max) {
        dst[idx] = 0;
        idx++;
    }
}
301
/*
 * Copy 'top' words from src to dst, lowest index first.  Nothing is
 * written when top is zero or negative.
 */
static void nist_cp_bn(BN_ULONG *dst, const BN_ULONG *src, int top)
{
    int remaining = top;

    while (remaining > 0) {
        *dst++ = *src++;
        remaining--;
    }
}
309
/*
 * Word-copy helpers used by the nist_set_* macros below, plus the
 * selection of NIST_INT64 (a 64-bit signed accumulator type that
 * enables the column-wise code paths of the reduction routines).
 *
 *   bn_cp_64(to, n, from, m)  - to[n] = from[m] in 64-bit units, or 0
 *                               when m is negative.
 *   bn_64_set_0(to, n)        - zero 64-bit unit n of to.
 *   bn_cp_32(to, n, from, m)  - same as bn_cp_64 but in 32-bit units.
 *   bn_32_set_0(to, n)        - zero 32-bit unit n of to.
 *
 * These macros are statements, not expressions: each expansion ends
 * in its own ';' (or is a brace-enclosed block) because the nist_set_*
 * macros invoke them back to back without separators.  Do not strip
 * the trailing semicolons.
 *
 * Every macro argument is parenthesized where it is used, so index and
 * array arguments may be arbitrary expressions.
 */
#if BN_BITS2 == 64
#define bn_cp_64(to, n, from, m)	(to)[n] = ((m)>=0)?((from)[m]):0;
#define bn_64_set_0(to, n)		(to)[n] = (BN_ULONG)0;
/*
 * two following macros are implemented under assumption that they
 * are called in a sequence with *ascending* n, i.e. as they are...
 *
 * With 64-bit words two 32-bit units share one word.  For an even n
 * the whole word (to)[n/2] is assigned, which also clears its upper
 * half; for an odd n the value is OR-ed (or, for bn_32_set_0, AND-ed)
 * into the word written by the preceding even n.  The source half is
 * picked the same way from (from)[m/2]: odd m is the upper half, even
 * m the lower half.
 */
#define bn_cp_32_naked(to, n, from, m)	(((n)&1)?((to)[(n)/2]|=((m)&1)?((from)[(m)/2]&BN_MASK2h):((from)[(m)/2]<<32))\
						:((to)[(n)/2] =((m)&1)?((from)[(m)/2]>>32):((from)[(m)/2]&BN_MASK2l)))
#define bn_32_set_0(to, n)		(((n)&1)?((to)[(n)/2]&=BN_MASK2l):((to)[(n)/2]=0));
#define bn_cp_32(to,n,from,m)		((m)>=0)?bn_cp_32_naked(to,n,from,m):bn_32_set_0(to,n)
/* the accumulator code paths are only enabled for little-endian here */
# if defined(L_ENDIAN)
#  if defined(__arch64__)
#   define NIST_INT64 long
#  else
#   define NIST_INT64 long long
#  endif
# endif
#else
/* 32-bit words: a 64-bit unit is simply two consecutive 32-bit units */
#define bn_cp_64(to, n, from, m) \
	{ \
	bn_cp_32(to, (n)*2, from, (m)*2); \
	bn_cp_32(to, (n)*2+1, from, (m)*2+1); \
	}
#define bn_64_set_0(to, n) \
	{ \
	bn_32_set_0(to, (n)*2); \
	bn_32_set_0(to, (n)*2+1); \
	}
#define bn_cp_32(to, n, from, m)	(to)[n] = ((m)>=0)?((from)[m]):0;
#define bn_32_set_0(to, n)		(to)[n] = (BN_ULONG)0;
# if defined(_WIN32) && !defined(__GNUC__)
#  define NIST_INT64 __int64
# elif defined(BN_LLONG)
#  define NIST_INT64 long long
# endif
#endif /* BN_BITS2 != 64 */
347
/*
 * nist_set_192(to, from, a1, a2, a3): fill the three 64-bit units of
 * 'to' from 'from'.  The selectors are listed most significant first:
 * a3 feeds unit 0, a2 unit 1 and a1 unit 2.  Each selector is biased
 * by 3 before it is handed to bn_cp_64, so selector 3 picks from[0]
 * and selector 0 yields a negative index, which makes bn_cp_64 store
 * zero instead.
 *
 * The expansion is a brace-enclosed block and the bn_cp_64 invocations
 * inside it are deliberately not followed by ';' -- bn_cp_64 supplies
 * its own statement terminator.
 */
#define nist_set_192(to, from, a1, a2, a3) \
	{ \
	bn_cp_64(to, 0, from, (a3) - 3) \
	bn_cp_64(to, 1, from, (a2) - 3) \
	bn_cp_64(to, 2, from, (a1) - 3) \
	}
354
/*
 * BN_nist_mod_192 - compute r = a mod p, where p is the 192-bit prime
 * stored in _bignum_nist_p_192.
 *
 *   r     - receives the result; may be the same object as a, in which
 *           case a's word array is reduced in place.
 *   a     - value to reduce.
 *   field - ignored: it is overwritten with the built-in modulus.
 *   ctx   - only passed on to BN_nnmod() on the fallback path.
 *
 * Returns 1 on success and 0 when r cannot be expanded or copied into;
 * on the fallback path the return value of BN_nnmod() is passed
 * through unchanged.
 *
 * The fast path is taken when a is non-negative and smaller than
 * _nist_p_192_sqr; any other input is handed to BN_nnmod().
 */
int BN_nist_mod_192(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
	BN_CTX *ctx)
	{
	int top = a->top, i;
	int carry;
	register BN_ULONG *r_d, *a_d = a->d;
	/* upper words of a, viewable as BN_ULONGs or as unsigned ints */
	union {
		BN_ULONG bn[BN_NIST_192_TOP];
		unsigned int ui[BN_NIST_192_TOP*sizeof(BN_ULONG)/sizeof(unsigned int)];
		} buf;
	BN_ULONG c_d[BN_NIST_192_TOP],
		*res;
	PTR_SIZE_INT mask;
	static const BIGNUM _bignum_nist_p_192_sqr = {
		(BN_ULONG *)_nist_p_192_sqr,
		sizeof(_nist_p_192_sqr)/sizeof(_nist_p_192_sqr[0]),
		sizeof(_nist_p_192_sqr)/sizeof(_nist_p_192_sqr[0]),
		0,BN_FLG_STATIC_DATA };

	field = &_bignum_nist_p_192; /* just to make sure */

	/* out of range for the fast reduction: use the generic routine */
	if (BN_is_negative(a) || BN_ucmp(a,&_bignum_nist_p_192_sqr)>=0)
		return BN_nnmod(r, a, field, ctx);

	i = BN_ucmp(field, a);
	if (i == 0)
		{
		/* a equals the modulus */
		BN_zero(r);
		return 1;
		}
	else if (i > 0)
		/* a is already reduced */
		return (r == a) ? 1 : (BN_copy(r ,a) != NULL);

	/* the low BN_NIST_192_TOP words of a become the running result */
	if (r != a)
		{
		if (!bn_wexpand(r, BN_NIST_192_TOP))
			return 0;
		r_d = r->d;
		nist_cp_bn(r_d, a_d, BN_NIST_192_TOP);
		}
	else
		r_d = a_d;

	/* the remaining upper words go to buf, zero padded */
	nist_cp_bn_0(buf.bn, a_d + BN_NIST_192_TOP, top - BN_NIST_192_TOP, BN_NIST_192_TOP);

#if defined(NIST_INT64)
	{
	/*
	 * Column-wise addition on 32-bit units (this path assumes that
	 * unsigned int is 32 bits wide): after each column the low 32
	 * bits of acc are stored and the rest is carried into the next
	 * column.  bp[k*2-6] and bp[k*2-5] are 32-bit units 2k and 2k+1
	 * of a, for k = 3..5.
	 */
	NIST_INT64 acc; /* accumulator */
	unsigned int *rp=(unsigned int *)r_d;
	const unsigned int *bp=(const unsigned int *)buf.ui;

	acc = rp[0]; acc += bp[3*2-6];
	acc += bp[5*2-6]; rp[0] = (unsigned int)acc; acc >>= 32;

	acc += rp[1]; acc += bp[3*2-5];
	acc += bp[5*2-5]; rp[1] = (unsigned int)acc; acc >>= 32;

	acc += rp[2]; acc += bp[3*2-6];
	acc += bp[4*2-6];
	acc += bp[5*2-6]; rp[2] = (unsigned int)acc; acc >>= 32;

	acc += rp[3]; acc += bp[3*2-5];
	acc += bp[4*2-5];
	acc += bp[5*2-5]; rp[3] = (unsigned int)acc; acc >>= 32;

	acc += rp[4]; acc += bp[4*2-6];
	acc += bp[5*2-6]; rp[4] = (unsigned int)acc; acc >>= 32;

	acc += rp[5]; acc += bp[4*2-5];
	acc += bp[5*2-5]; rp[5] = (unsigned int)acc;

	carry = (int)(acc>>32);
	}
#else
	{
	/*
	 * Same sums, built one addend at a time with nist_set_192 and
	 * added with bn_add_words; carry counts the overflows.
	 */
	BN_ULONG t_d[BN_NIST_192_TOP];

	nist_set_192(t_d, buf.bn, 0, 3, 3);
	carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
	nist_set_192(t_d, buf.bn, 4, 4, 0);
	carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
	nist_set_192(t_d, buf.bn, 5, 5, 5);
	carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
	}
#endif
	/*
	 * Remove the accumulated overflow by subtracting carry*modulus
	 * (table row carry-1); carry then holds the borrow of that
	 * subtraction.  Without overflow carry is forced to 1.
	 */
	if (carry > 0)
		carry = (int)bn_sub_words(r_d,r_d,_nist_p_192[carry-1],BN_NIST_192_TOP);
	else
		carry = 1;

	/*
	 * we need 'if (carry==0 || result>=modulus) result-=modulus;'
	 * as comparison implies subtraction, we can write
	 * 'tmp=result-modulus; if (!carry || !borrow) result=tmp;'
	 * this is what happens below, but without explicit if:-) a.
	 */
	/* mask is all ones only if the subtraction borrowed and carry != 0 */
	mask = 0-(PTR_SIZE_INT)bn_sub_words(c_d,r_d,_nist_p_192[0],BN_NIST_192_TOP);
	mask &= 0-(PTR_SIZE_INT)carry;
	/* select r_d (mask set) or c_d (mask clear) by pointer arithmetic */
	res = c_d;
	res = (BN_ULONG *)
		(((PTR_SIZE_INT)res&~mask) | ((PTR_SIZE_INT)r_d&mask));
	nist_cp_bn(r_d, res, BN_NIST_192_TOP);
	r->top = BN_NIST_192_TOP;
	bn_correct_top(r);

	return 1;
	}
462
/*
 * Common signature of bn_add_words and bn_sub_words.  The reduction
 * routines below store one of the two in a variable of this type so
 * that the final correction step can be chosen without a branch.
 */
typedef BN_ULONG (*bn_addsub_f)(BN_ULONG *,const BN_ULONG *,const BN_ULONG *,int);
464
/*
 * nist_set_224(to, from, a1, ..., a7): fill the seven 32-bit units of
 * 'to' from 'from'.  The selectors are listed most significant first:
 * a7 feeds unit 0 and a1 feeds unit 6.  Each selector is biased by 7
 * before it is handed to bn_cp_32, so selector 7 picks 32-bit unit 0
 * of 'from' and selector 0 yields a negative index, which makes
 * bn_cp_32 store zero instead.
 *
 * The bn_cp_32 invocations are deliberately not followed by ';' --
 * bn_cp_32 supplies its own statement terminator.  Units are written
 * in ascending order, as the 64-bit variant of bn_cp_32 requires.
 */
#define nist_set_224(to, from, a1, a2, a3, a4, a5, a6, a7) \
	{ \
	bn_cp_32(to, 0, from, (a7) - 7) \
	bn_cp_32(to, 1, from, (a6) - 7) \
	bn_cp_32(to, 2, from, (a5) - 7) \
	bn_cp_32(to, 3, from, (a4) - 7) \
	bn_cp_32(to, 4, from, (a3) - 7) \
	bn_cp_32(to, 5, from, (a2) - 7) \
	bn_cp_32(to, 6, from, (a1) - 7) \
	}
475
/*
 * BN_nist_mod_224 - compute r = a mod p, where p is the 224-bit prime
 * stored in _bignum_nist_p_224.
 *
 *   r     - receives the result; may be the same object as a, in which
 *           case a's word array is reduced in place.
 *   a     - value to reduce.
 *   field - ignored: it is overwritten with the built-in modulus.
 *   ctx   - only passed on to BN_nnmod() on the fallback path.
 *
 * Returns 1 on success and 0 when r cannot be expanded or copied into;
 * on the fallback path the return value of BN_nnmod() is passed
 * through unchanged.
 *
 * The fast path is taken when a is non-negative and smaller than
 * _nist_p_224_sqr; any other input is handed to BN_nnmod().
 */
int BN_nist_mod_224(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
	BN_CTX *ctx)
	{
	int top = a->top, i;
	int carry;
	BN_ULONG *r_d, *a_d = a->d;
	/* upper part of a, viewable as BN_ULONGs or as unsigned ints */
	union {
		BN_ULONG bn[BN_NIST_224_TOP];
		unsigned int ui[BN_NIST_224_TOP*sizeof(BN_ULONG)/sizeof(unsigned int)];
		} buf;
	BN_ULONG c_d[BN_NIST_224_TOP],
		*res;
	PTR_SIZE_INT mask;
	/* lets the final step pick bn_sub_words or bn_add_words by masking */
	union { bn_addsub_f f; PTR_SIZE_INT p; } u;
	static const BIGNUM _bignum_nist_p_224_sqr = {
		(BN_ULONG *)_nist_p_224_sqr,
		sizeof(_nist_p_224_sqr)/sizeof(_nist_p_224_sqr[0]),
		sizeof(_nist_p_224_sqr)/sizeof(_nist_p_224_sqr[0]),
		0,BN_FLG_STATIC_DATA };


	field = &_bignum_nist_p_224; /* just to make sure */

	/* out of range for the fast reduction: use the generic routine */
	if (BN_is_negative(a) || BN_ucmp(a,&_bignum_nist_p_224_sqr)>=0)
		return BN_nnmod(r, a, field, ctx);

	i = BN_ucmp(field, a);
	if (i == 0)
		{
		/* a equals the modulus */
		BN_zero(r);
		return 1;
		}
	else if (i > 0)
		/* a is already reduced */
		return (r == a)? 1 : (BN_copy(r ,a) != NULL);

	/* the low BN_NIST_224_TOP words of a become the running result */
	if (r != a)
		{
		if (!bn_wexpand(r, BN_NIST_224_TOP))
			return 0;
		r_d = r->d;
		nist_cp_bn(r_d, a_d, BN_NIST_224_TOP);
		}
	else
		r_d = a_d;

#if BN_BITS2==64
	/* copy upper 256 bits of 448 bit number ... */
	nist_cp_bn_0(c_d, a_d + (BN_NIST_224_TOP-1), top - (BN_NIST_224_TOP-1), BN_NIST_224_TOP);
	/* ... and right shift by 32 to obtain upper 224 bits */
	nist_set_224(buf.bn, c_d, 14, 13, 12, 11, 10, 9, 8);
	/* truncate lower part to 224 bits too */
	r_d[BN_NIST_224_TOP-1] &= BN_MASK2l;
#else
	/* with 32-bit words the upper part starts on a word boundary */
	nist_cp_bn_0(buf.bn, a_d + BN_NIST_224_TOP, top - BN_NIST_224_TOP, BN_NIST_224_TOP);
#endif

#if defined(NIST_INT64) && BN_BITS2!=64
	{
	/*
	 * Column-wise signed accumulation on 32-bit units: after each
	 * column the low 32 bits of acc are stored and the rest (which
	 * may be negative) is carried into the next column.  bp[k-7] is
	 * 32-bit unit k of a, for k = 7..13.
	 */
	NIST_INT64 acc; /* accumulator */
	unsigned int *rp=(unsigned int *)r_d;
	const unsigned int *bp=(const unsigned int *)buf.ui;

	acc = rp[0]; acc -= bp[7-7];
	acc -= bp[11-7]; rp[0] = (unsigned int)acc; acc >>= 32;

	acc += rp[1]; acc -= bp[8-7];
	acc -= bp[12-7]; rp[1] = (unsigned int)acc; acc >>= 32;

	acc += rp[2]; acc -= bp[9-7];
	acc -= bp[13-7]; rp[2] = (unsigned int)acc; acc >>= 32;

	acc += rp[3]; acc += bp[7-7];
	acc += bp[11-7];
	acc -= bp[10-7]; rp[3] = (unsigned int)acc; acc>>= 32;

	acc += rp[4]; acc += bp[8-7];
	acc += bp[12-7];
	acc -= bp[11-7]; rp[4] = (unsigned int)acc; acc >>= 32;

	acc += rp[5]; acc += bp[9-7];
	acc += bp[13-7];
	acc -= bp[12-7]; rp[5] = (unsigned int)acc; acc >>= 32;

	acc += rp[6]; acc += bp[10-7];
	acc -= bp[13-7]; rp[6] = (unsigned int)acc;

	carry = (int)(acc>>32);
	/*
	 * NOTE(review): the enclosing condition requires BN_BITS2!=64,
	 * so the directive below can never be true as the code stands.
	 */
# if BN_BITS2==64
	rp[7] = carry;
# endif
	}
#else
	{
	/*
	 * Word-wise variant: two addends are added and two subtrahends
	 * subtracted; carry is the signed balance of overflows and
	 * borrows.
	 */
	BN_ULONG t_d[BN_NIST_224_TOP];

	nist_set_224(t_d, buf.bn, 10, 9, 8, 7, 0, 0, 0);
	carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
	nist_set_224(t_d, buf.bn, 0, 13, 12, 11, 0, 0, 0);
	carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
	nist_set_224(t_d, buf.bn, 13, 12, 11, 10, 9, 8, 7);
	carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);
	nist_set_224(t_d, buf.bn, 0, 0, 0, 0, 13, 12, 11);
	carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);

#if BN_BITS2==64
	/*
	 * with 64-bit words the value ends in the middle of the top
	 * word, so the carry is re-read from that word's upper 32 bits
	 */
	carry = (int)(r_d[BN_NIST_224_TOP-1]>>32);
#endif
	}
#endif
	u.f = bn_sub_words;
	if (carry > 0)
		{
		/* remove the overflow by subtracting carry*modulus */
		carry = (int)bn_sub_words(r_d,r_d,_nist_p_224[carry-1],BN_NIST_224_TOP);
#if BN_BITS2==64
		/* carry = 1 when bit 32 of the top word is clear afterwards */
		carry=(int)(~(r_d[BN_NIST_224_TOP-1]>>32))&1;
#endif
		}
	else if (carry < 0)
		{
		/* it's a bit more complicated logic in this case.
		 * if bn_add_words yields no carry, then result
		 * has to be adjusted by unconditionally *adding*
		 * the modulus. but if it does, then result has
		 * to be compared to the modulus and conditionally
		 * adjusted by *subtracting* the latter. */
		carry = (int)bn_add_words(r_d,r_d,_nist_p_224[-carry-1],BN_NIST_224_TOP);
		mask = 0-(PTR_SIZE_INT)carry;
		/* u.f: bn_sub_words if that addition carried, else bn_add_words */
		u.p = ((PTR_SIZE_INT)bn_sub_words&mask) |
			((PTR_SIZE_INT)bn_add_words&~mask);
		}
	else
		carry = 1;

	/* otherwise it's effectively same as in BN_nist_mod_192... */
	/* mask is all ones only if *u.f returned non-zero and carry != 0 */
	mask = 0-(PTR_SIZE_INT)(*u.f)(c_d,r_d,_nist_p_224[0],BN_NIST_224_TOP);
	mask &= 0-(PTR_SIZE_INT)carry;
	/* select r_d (mask set) or c_d (mask clear) by pointer arithmetic */
	res = c_d;
	res = (BN_ULONG *)(((PTR_SIZE_INT)res&~mask) |
		((PTR_SIZE_INT)r_d&mask));
	nist_cp_bn(r_d, res, BN_NIST_224_TOP);
	r->top = BN_NIST_224_TOP;
	bn_correct_top(r);

	return 1;
	}
621
/*
 * nist_set_256(to, from, a1, ..., a8): fill the eight 32-bit units of
 * 'to' from 'from'.  The selectors are listed most significant first:
 * a8 feeds unit 0 and a1 feeds unit 7.  Each selector is biased by 8
 * before it is handed to bn_cp_32, so selector 8 picks 32-bit unit 0
 * of 'from' and selector 0 yields a negative index, which makes
 * bn_cp_32 store zero instead.
 *
 * The bn_cp_32 invocations are deliberately not followed by ';' --
 * bn_cp_32 supplies its own statement terminator.  Units are written
 * in ascending order, as the 64-bit variant of bn_cp_32 requires.
 */
#define nist_set_256(to, from, a1, a2, a3, a4, a5, a6, a7, a8) \
	{ \
	bn_cp_32(to, 0, from, (a8) - 8) \
	bn_cp_32(to, 1, from, (a7) - 8) \
	bn_cp_32(to, 2, from, (a6) - 8) \
	bn_cp_32(to, 3, from, (a5) - 8) \
	bn_cp_32(to, 4, from, (a4) - 8) \
	bn_cp_32(to, 5, from, (a3) - 8) \
	bn_cp_32(to, 6, from, (a2) - 8) \
	bn_cp_32(to, 7, from, (a1) - 8) \
	}
633
/*
 * BN_nist_mod_256 - compute r = a mod p, where p is the 256-bit prime
 * stored in _bignum_nist_p_256.
 *
 *   r     - receives the result; may be the same object as a, in which
 *           case a's word array is reduced in place.
 *   a     - value to reduce.
 *   field - ignored: it is overwritten with the built-in modulus.
 *   ctx   - only passed on to BN_nnmod() on the fallback path.
 *
 * Returns 1 on success and 0 when r cannot be expanded or copied into;
 * on the fallback path the return value of BN_nnmod() is passed
 * through unchanged.
 *
 * The fast path is taken when a is non-negative and smaller than
 * _nist_p_256_sqr; any other input is handed to BN_nnmod().
 */
int BN_nist_mod_256(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
	BN_CTX *ctx)
	{
	int i, top = a->top;
	int carry = 0;
	register BN_ULONG *a_d = a->d, *r_d;
	/* upper words of a, viewable as BN_ULONGs or as unsigned ints */
	union {
		BN_ULONG bn[BN_NIST_256_TOP];
		unsigned int ui[BN_NIST_256_TOP*sizeof(BN_ULONG)/sizeof(unsigned int)];
		} buf;
	BN_ULONG c_d[BN_NIST_256_TOP],
		*res;
	PTR_SIZE_INT mask;
	/* lets the final step pick bn_sub_words or bn_add_words by masking */
	union { bn_addsub_f f; PTR_SIZE_INT p; } u;
	static const BIGNUM _bignum_nist_p_256_sqr = {
		(BN_ULONG *)_nist_p_256_sqr,
		sizeof(_nist_p_256_sqr)/sizeof(_nist_p_256_sqr[0]),
		sizeof(_nist_p_256_sqr)/sizeof(_nist_p_256_sqr[0]),
		0,BN_FLG_STATIC_DATA };

	field = &_bignum_nist_p_256; /* just to make sure */

	/* out of range for the fast reduction: use the generic routine */
	if (BN_is_negative(a) || BN_ucmp(a,&_bignum_nist_p_256_sqr)>=0)
		return BN_nnmod(r, a, field, ctx);

	i = BN_ucmp(field, a);
	if (i == 0)
		{
		/* a equals the modulus */
		BN_zero(r);
		return 1;
		}
	else if (i > 0)
		/* a is already reduced */
		return (r == a)? 1 : (BN_copy(r ,a) != NULL);

	/* the low BN_NIST_256_TOP words of a become the running result */
	if (r != a)
		{
		if (!bn_wexpand(r, BN_NIST_256_TOP))
			return 0;
		r_d = r->d;
		nist_cp_bn(r_d, a_d, BN_NIST_256_TOP);
		}
	else
		r_d = a_d;

	/* the remaining upper words go to buf, zero padded */
	nist_cp_bn_0(buf.bn, a_d + BN_NIST_256_TOP, top - BN_NIST_256_TOP, BN_NIST_256_TOP);

#if defined(NIST_INT64)
	{
	/*
	 * Column-wise signed accumulation on 32-bit units (this path
	 * assumes that unsigned int is 32 bits wide): after each column
	 * the low 32 bits of acc are stored and the rest (which may be
	 * negative) is carried into the next column.  bp[k-8] is 32-bit
	 * unit k of a, for k = 8..15.
	 */
	NIST_INT64 acc; /* accumulator */
	unsigned int *rp=(unsigned int *)r_d;
	const unsigned int *bp=(const unsigned int *)buf.ui;

	acc = rp[0]; acc += bp[8-8];
	acc += bp[9-8];
	acc -= bp[11-8];
	acc -= bp[12-8];
	acc -= bp[13-8];
	acc -= bp[14-8]; rp[0] = (unsigned int)acc; acc >>= 32;

	acc += rp[1]; acc += bp[9-8];
	acc += bp[10-8];
	acc -= bp[12-8];
	acc -= bp[13-8];
	acc -= bp[14-8];
	acc -= bp[15-8]; rp[1] = (unsigned int)acc; acc >>= 32;

	acc += rp[2]; acc += bp[10-8];
	acc += bp[11-8];
	acc -= bp[13-8];
	acc -= bp[14-8];
	acc -= bp[15-8]; rp[2] = (unsigned int)acc; acc >>= 32;

	acc += rp[3]; acc += bp[11-8];
	acc += bp[11-8];
	acc += bp[12-8];
	acc += bp[12-8];
	acc += bp[13-8];
	acc -= bp[15-8];
	acc -= bp[8-8];
	acc -= bp[9-8]; rp[3] = (unsigned int)acc; acc >>= 32;

	acc += rp[4]; acc += bp[12-8];
	acc += bp[12-8];
	acc += bp[13-8];
	acc += bp[13-8];
	acc += bp[14-8];
	acc -= bp[9-8];
	acc -= bp[10-8]; rp[4] = (unsigned int)acc; acc >>= 32;

	acc += rp[5]; acc += bp[13-8];
	acc += bp[13-8];
	acc += bp[14-8];
	acc += bp[14-8];
	acc += bp[15-8];
	acc -= bp[10-8];
	acc -= bp[11-8]; rp[5] = (unsigned int)acc; acc >>= 32;

	acc += rp[6]; acc += bp[14-8];
	acc += bp[14-8];
	acc += bp[15-8];
	acc += bp[15-8];
	acc += bp[14-8];
	acc += bp[13-8];
	acc -= bp[8-8];
	acc -= bp[9-8]; rp[6] = (unsigned int)acc; acc >>= 32;

	acc += rp[7]; acc += bp[15-8];
	acc += bp[15-8];
	acc += bp[15-8];
	acc += bp[8 -8];
	acc -= bp[10-8];
	acc -= bp[11-8];
	acc -= bp[12-8];
	acc -= bp[13-8]; rp[7] = (unsigned int)acc;

	carry = (int)(acc>>32);
	}
#else
	{
	/*
	 * Word-wise variant: addends S1..S4 are added and subtrahends
	 * D1..D4 subtracted; carry is the signed balance of overflows
	 * and borrows.  S1 and S2 are summed first and doubled by the
	 * left shift below before being added to the result.
	 */
	BN_ULONG t_d[BN_NIST_256_TOP];

	/*S1*/
	nist_set_256(t_d, buf.bn, 15, 14, 13, 12, 11, 0, 0, 0);
	/*S2*/
	nist_set_256(c_d, buf.bn, 0, 15, 14, 13, 12, 0, 0, 0);
	carry = (int)bn_add_words(t_d, t_d, c_d, BN_NIST_256_TOP);
	/* left shift */
		{
		register BN_ULONG *ap,t,c;
		ap = t_d;
		c=0;
		for (i = BN_NIST_256_TOP; i != 0; --i)
			{
			t= *ap;
			*(ap++)=((t<<1)|c)&BN_MASK2;
			/* the bit shifted out moves into the next word */
			c=(t & BN_TBIT)?1:0;
			}
		/* double the carry as well and take in the last bit shifted out */
		carry <<= 1;
		carry |= c;
		}
	carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
	/*S3*/
	nist_set_256(t_d, buf.bn, 15, 14, 0, 0, 0, 10, 9, 8);
	carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
	/*S4*/
	nist_set_256(t_d, buf.bn, 8, 13, 15, 14, 13, 11, 10, 9);
	carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
	/*D1*/
	nist_set_256(t_d, buf.bn, 10, 8, 0, 0, 0, 13, 12, 11);
	carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
	/*D2*/
	nist_set_256(t_d, buf.bn, 11, 9, 0, 0, 15, 14, 13, 12);
	carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
	/*D3*/
	nist_set_256(t_d, buf.bn, 12, 0, 10, 9, 8, 15, 14, 13);
	carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
	/*D4*/
	nist_set_256(t_d, buf.bn, 13, 0, 11, 10, 9, 0, 15, 14);
	carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);

	}
#endif
	/* see BN_nist_mod_224 for explanation */
	u.f = bn_sub_words;
	if (carry > 0)
		/* remove the overflow by subtracting carry*modulus */
		carry = (int)bn_sub_words(r_d,r_d,_nist_p_256[carry-1],BN_NIST_256_TOP);
	else if (carry < 0)
		{
		/* make up for the deficit by adding (-carry)*modulus */
		carry = (int)bn_add_words(r_d,r_d,_nist_p_256[-carry-1],BN_NIST_256_TOP);
		mask = 0-(PTR_SIZE_INT)carry;
		/* u.f: bn_sub_words if that addition carried, else bn_add_words */
		u.p = ((PTR_SIZE_INT)bn_sub_words&mask) |
			((PTR_SIZE_INT)bn_add_words&~mask);
		}
	else
		carry = 1;

	/* mask is all ones only if *u.f returned non-zero and carry != 0 */
	mask = 0-(PTR_SIZE_INT)(*u.f)(c_d,r_d,_nist_p_256[0],BN_NIST_256_TOP);
	mask &= 0-(PTR_SIZE_INT)carry;
	/* select r_d (mask set) or c_d (mask clear) by pointer arithmetic */
	res = c_d;
	res = (BN_ULONG *)(((PTR_SIZE_INT)res&~mask) |
		((PTR_SIZE_INT)r_d&mask));
	nist_cp_bn(r_d, res, BN_NIST_256_TOP);
	r->top = BN_NIST_256_TOP;
	bn_correct_top(r);

	return 1;
	}
821
/*
 * nist_set_384(to, from, a1, ..., a12): fill the twelve 32-bit units
 * of 'to' from 'from'.  The selectors are listed most significant
 * first: a12 feeds unit 0 and a1 feeds unit 11.  Each selector is
 * biased by 12 before it is handed to bn_cp_32, so selector 12 picks
 * 32-bit unit 0 of 'from' and selector 0 yields a negative index,
 * which makes bn_cp_32 store zero instead.
 *
 * The bn_cp_32 invocations are deliberately not followed by ';' --
 * bn_cp_32 supplies its own statement terminator.  Units are written
 * in ascending order, as the 64-bit variant of bn_cp_32 requires.
 */
#define nist_set_384(to,from,a1,a2,a3,a4,a5,a6,a7,a8,a9,a10,a11,a12) \
	{ \
	bn_cp_32(to, 0, from, (a12) - 12) \
	bn_cp_32(to, 1, from, (a11) - 12) \
	bn_cp_32(to, 2, from, (a10) - 12) \
	bn_cp_32(to, 3, from, (a9) - 12) \
	bn_cp_32(to, 4, from, (a8) - 12) \
	bn_cp_32(to, 5, from, (a7) - 12) \
	bn_cp_32(to, 6, from, (a6) - 12) \
	bn_cp_32(to, 7, from, (a5) - 12) \
	bn_cp_32(to, 8, from, (a4) - 12) \
	bn_cp_32(to, 9, from, (a3) - 12) \
	bn_cp_32(to, 10, from, (a2) - 12) \
	bn_cp_32(to, 11, from, (a1) - 12) \
	}
837
BN_nist_mod_384(BIGNUM * r,const BIGNUM * a,const BIGNUM * field,BN_CTX * ctx)838 int BN_nist_mod_384(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
839 BN_CTX *ctx)
840 {
841 int i, top = a->top;
842 int carry = 0;
843 register BN_ULONG *r_d, *a_d = a->d;
844 union {
845 BN_ULONG bn[BN_NIST_384_TOP];
846 unsigned int ui[BN_NIST_384_TOP*sizeof(BN_ULONG)/sizeof(unsigned int)];
847 } buf;
848 BN_ULONG c_d[BN_NIST_384_TOP],
849 *res;
850 PTR_SIZE_INT mask;
851 union { bn_addsub_f f; PTR_SIZE_INT p; } u;
852 static const BIGNUM _bignum_nist_p_384_sqr = {
853 (BN_ULONG *)_nist_p_384_sqr,
854 sizeof(_nist_p_384_sqr)/sizeof(_nist_p_384_sqr[0]),
855 sizeof(_nist_p_384_sqr)/sizeof(_nist_p_384_sqr[0]),
856 0,BN_FLG_STATIC_DATA };
857
858
859 field = &_bignum_nist_p_384; /* just to make sure */
860
861 if (BN_is_negative(a) || BN_ucmp(a,&_bignum_nist_p_384_sqr)>=0)
862 return BN_nnmod(r, a, field, ctx);
863
864 i = BN_ucmp(field, a);
865 if (i == 0)
866 {
867 BN_zero(r);
868 return 1;
869 }
870 else if (i > 0)
871 return (r == a)? 1 : (BN_copy(r ,a) != NULL);
872
873 if (r != a)
874 {
875 if (!bn_wexpand(r, BN_NIST_384_TOP))
876 return 0;
877 r_d = r->d;
878 nist_cp_bn(r_d, a_d, BN_NIST_384_TOP);
879 }
880 else
881 r_d = a_d;
882
883 nist_cp_bn_0(buf.bn, a_d + BN_NIST_384_TOP, top - BN_NIST_384_TOP, BN_NIST_384_TOP);
884
885 #if defined(NIST_INT64)
886 {
887 NIST_INT64 acc; /* accumulator */
888 unsigned int *rp=(unsigned int *)r_d;
889 const unsigned int *bp=(const unsigned int *)buf.ui;
890
891 acc = rp[0]; acc += bp[12-12];
892 acc += bp[21-12];
893 acc += bp[20-12];
894 acc -= bp[23-12]; rp[0] = (unsigned int)acc; acc >>= 32;
895
896 acc += rp[1]; acc += bp[13-12];
897 acc += bp[22-12];
898 acc += bp[23-12];
899 acc -= bp[12-12];
900 acc -= bp[20-12]; rp[1] = (unsigned int)acc; acc >>= 32;
901
902 acc += rp[2]; acc += bp[14-12];
903 acc += bp[23-12];
904 acc -= bp[13-12];
905 acc -= bp[21-12]; rp[2] = (unsigned int)acc; acc >>= 32;
906
907 acc += rp[3]; acc += bp[15-12];
908 acc += bp[12-12];
909 acc += bp[20-12];
910 acc += bp[21-12];
911 acc -= bp[14-12];
912 acc -= bp[22-12];
913 acc -= bp[23-12]; rp[3] = (unsigned int)acc; acc >>= 32;
914
915 acc += rp[4]; acc += bp[21-12];
916 acc += bp[21-12];
917 acc += bp[16-12];
918 acc += bp[13-12];
919 acc += bp[12-12];
920 acc += bp[20-12];
921 acc += bp[22-12];
922 acc -= bp[15-12];
923 acc -= bp[23-12];
924 acc -= bp[23-12]; rp[4] = (unsigned int)acc; acc >>= 32;
925
926 acc += rp[5]; acc += bp[22-12];
927 acc += bp[22-12];
928 acc += bp[17-12];
929 acc += bp[14-12];
930 acc += bp[13-12];
931 acc += bp[21-12];
932 acc += bp[23-12];
933 acc -= bp[16-12]; rp[5] = (unsigned int)acc; acc >>= 32;
934
935 acc += rp[6]; acc += bp[23-12];
936 acc += bp[23-12];
937 acc += bp[18-12];
938 acc += bp[15-12];
939 acc += bp[14-12];
940 acc += bp[22-12];
941 acc -= bp[17-12]; rp[6] = (unsigned int)acc; acc >>= 32;
942
943 acc += rp[7]; acc += bp[19-12];
944 acc += bp[16-12];
945 acc += bp[15-12];
946 acc += bp[23-12];
947 acc -= bp[18-12]; rp[7] = (unsigned int)acc; acc >>= 32;
948
949 acc += rp[8]; acc += bp[20-12];
950 acc += bp[17-12];
951 acc += bp[16-12];
952 acc -= bp[19-12]; rp[8] = (unsigned int)acc; acc >>= 32;
953
954 acc += rp[9]; acc += bp[21-12];
955 acc += bp[18-12];
956 acc += bp[17-12];
957 acc -= bp[20-12]; rp[9] = (unsigned int)acc; acc >>= 32;
958
959 acc += rp[10]; acc += bp[22-12];
960 acc += bp[19-12];
961 acc += bp[18-12];
962 acc -= bp[21-12]; rp[10] = (unsigned int)acc; acc >>= 32;
963
964 acc += rp[11]; acc += bp[23-12];
965 acc += bp[20-12];
966 acc += bp[19-12];
967 acc -= bp[22-12]; rp[11] = (unsigned int)acc;
968
969 carry = (int)(acc>>32);
970 }
971 #else
972 {
973 BN_ULONG t_d[BN_NIST_384_TOP];
974
975 /*S1*/
976 nist_set_256(t_d, buf.bn, 0, 0, 0, 0, 0, 23-4, 22-4, 21-4);
977 /* left shift */
978 {
979 register BN_ULONG *ap,t,c;
980 ap = t_d;
981 c=0;
982 for (i = 3; i != 0; --i)
983 {
984 t= *ap;
985 *(ap++)=((t<<1)|c)&BN_MASK2;
986 c=(t & BN_TBIT)?1:0;
987 }
988 *ap=c;
989 }
990 carry = (int)bn_add_words(r_d+(128/BN_BITS2), r_d+(128/BN_BITS2),
991 t_d, BN_NIST_256_TOP);
992 /*S2 */
993 carry += (int)bn_add_words(r_d, r_d, buf.bn, BN_NIST_384_TOP);
994 /*S3*/
995 nist_set_384(t_d,buf.bn,20,19,18,17,16,15,14,13,12,23,22,21);
996 carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
997 /*S4*/
998 nist_set_384(t_d,buf.bn,19,18,17,16,15,14,13,12,20,0,23,0);
999 carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1000 /*S5*/
1001 nist_set_384(t_d, buf.bn,0,0,0,0,23,22,21,20,0,0,0,0);
1002 carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1003 /*S6*/
1004 nist_set_384(t_d,buf.bn,0,0,0,0,0,0,23,22,21,0,0,20);
1005 carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1006 /*D1*/
1007 nist_set_384(t_d,buf.bn,22,21,20,19,18,17,16,15,14,13,12,23);
1008 carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1009 /*D2*/
1010 nist_set_384(t_d,buf.bn,0,0,0,0,0,0,0,23,22,21,20,0);
1011 carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1012 /*D3*/
1013 nist_set_384(t_d,buf.bn,0,0,0,0,0,0,0,23,23,0,0,0);
1014 carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1015
1016 }
1017 #endif
1018 /* see BN_nist_mod_224 for explanation */
1019 u.f = bn_sub_words;
1020 if (carry > 0)
1021 carry = (int)bn_sub_words(r_d,r_d,_nist_p_384[carry-1],BN_NIST_384_TOP);
1022 else if (carry < 0)
1023 {
1024 carry = (int)bn_add_words(r_d,r_d,_nist_p_384[-carry-1],BN_NIST_384_TOP);
1025 mask = 0-(PTR_SIZE_INT)carry;
1026 u.p = ((PTR_SIZE_INT)bn_sub_words&mask) |
1027 ((PTR_SIZE_INT)bn_add_words&~mask);
1028 }
1029 else
1030 carry = 1;
1031
1032 mask = 0-(PTR_SIZE_INT)(*u.f)(c_d,r_d,_nist_p_384[0],BN_NIST_384_TOP);
1033 mask &= 0-(PTR_SIZE_INT)carry;
1034 res = c_d;
1035 res = (BN_ULONG *)(((PTR_SIZE_INT)res&~mask) |
1036 ((PTR_SIZE_INT)r_d&mask));
1037 nist_cp_bn(r_d, res, BN_NIST_384_TOP);
1038 r->top = BN_NIST_384_TOP;
1039 bn_correct_top(r);
1040
1041 return 1;
1042 }
1043
/*
 * Bit-position helpers for splitting a value at bit 521.
 *
 * BN_NIST_521_RSHIFT   - 521 modulo the word size, i.e. how many bits of a
 *                        521-bit quantity spill into its last word.
 * BN_NIST_521_LSHIFT   - the complementary count, so that the two shifts
 *                        together span exactly one word.
 * BN_NIST_521_TOP_MASK - BN_MASK2 shifted right by BN_NIST_521_LSHIFT; used
 *                        to clear everything above bit 521 in the last word.
 */
#define BN_NIST_521_RSHIFT	(521 % BN_BITS2)
#define BN_NIST_521_LSHIFT	(BN_BITS2 - BN_NIST_521_RSHIFT)
#define BN_NIST_521_TOP_MASK	((BN_ULONG)BN_MASK2 >> BN_NIST_521_LSHIFT)
1047
/*
 * Fast reduction of a modulo the NIST P-521 prime.
 *
 * r     - receives the reduced value; may be the same object as a.
 * a     - value to reduce.
 * field - ignored on input: it is overwritten with the built-in P-521
 *         modulus before any use.
 * ctx   - only used when falling back to BN_nnmod().
 *
 * Inputs that are negative or not smaller than the square of the modulus
 * are handed to the generic BN_nnmod().  Otherwise the value is split at
 * bit 521, the upper part is added to the lower part, and the modulus is
 * subtracted once if the sum is not already smaller than it.
 *
 * Returns 1 on success and 0 if r could not be expanded or copied into;
 * in the fallback case the result of BN_nnmod() is returned.
 */
int BN_nist_mod_521(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
	BN_CTX *ctx)
	{
	static const BIGNUM _bignum_nist_p_521_sqr = {
		(BN_ULONG *)_nist_p_521_sqr,
		sizeof(_nist_p_521_sqr)/sizeof(_nist_p_521_sqr[0]),
		sizeof(_nist_p_521_sqr)/sizeof(_nist_p_521_sqr[0]),
		0,BN_FLG_STATIC_DATA };
	const int last = BN_NIST_521_TOP-1;	/* index of the partial word */
	int a_top = a->top;
	int cmp, i;
	BN_ULONG *a_d = a->d;
	BN_ULONG *r_d;
	BN_ULONG *chosen;
	BN_ULONG hi[BN_NIST_521_TOP];
	BN_ULONG cur, next;
	PTR_SIZE_INT borrow_mask;

	/* always reduce by the built-in modulus, whatever the caller passed */
	field = &_bignum_nist_p_521;

	/* out of range for the fast path: use the generic reduction */
	if (BN_is_negative(a) || BN_ucmp(a,&_bignum_nist_p_521_sqr) >= 0)
		return BN_nnmod(r, a, field, ctx);

	cmp = BN_ucmp(field, a);
	if (cmp == 0)
		{
		/* a equals the modulus */
		BN_zero(r);
		return 1;
		}
	if (cmp > 0)
		{
		/* a is already smaller than the modulus */
		if (r == a)
			return 1;
		return (BN_copy(r, a) != NULL);
		}

	/* obtain the output words, seeded with the low words of a */
	if (r == a)
		r_d = a_d;
	else
		{
		if (!bn_wexpand(r, BN_NIST_521_TOP))
			return 0;
		r_d = r->d;
		nist_cp_bn(r_d, a_d, BN_NIST_521_TOP);
		}

	/* take the words from the partial word upwards, zero padded ... */
	nist_cp_bn_0(hi, a_d + last, a_top - last, BN_NIST_521_TOP);

	/* ... and shift them down so that bit 521 of a becomes bit 0 */
	cur = hi[0];
	for (i = 0; i < last; i++)
		{
		next = hi[i+1];
		hi[i] = ((cur >> BN_NIST_521_RSHIFT) |
			 (next << BN_NIST_521_LSHIFT)) & BN_MASK2;
		cur = next;
		}
	hi[last] = cur >> BN_NIST_521_RSHIFT;

	/* keep only the low 521 bits in the output words */
	r_d[last] &= BN_NIST_521_TOP_MASK;

	/* low part + high part */
	bn_add_words(r_d, r_d, hi, BN_NIST_521_TOP);

	/*
	 * Compute (sum - modulus) into hi.  A borrow means the sum was already
	 * reduced, so the mask becomes all ones and selects r_d; otherwise it
	 * is zero and selects the difference.  The choice is made by masking
	 * the two addresses rather than by branching.
	 */
	borrow_mask = 0-(PTR_SIZE_INT)bn_sub_words(hi, r_d, _nist_p_521,
		BN_NIST_521_TOP);
	chosen = (BN_ULONG *)(((PTR_SIZE_INT)hi & ~borrow_mask) |
			      ((PTR_SIZE_INT)r_d & borrow_mask));
	nist_cp_bn(r_d, chosen, BN_NIST_521_TOP);

	r->top = BN_NIST_521_TOP;
	bn_correct_top(r);

	return 1;
	}
1110