Coverage Report

Created: 2026-04-09 06:50

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/openssl30/crypto/bn/bn_nist.c
Line
Count
Source
1
/*
2
 * Copyright 2002-2026 The OpenSSL Project Authors. All Rights Reserved.
3
 *
4
 * Licensed under the Apache License 2.0 (the "License").  You may not use
5
 * this file except in compliance with the License.  You can obtain a copy
6
 * in the file LICENSE in the source distribution or at
7
 * https://www.openssl.org/source/license.html
8
 */
9
10
#include "bn_local.h"
11
#include "internal/cryptlib.h"
12
13
0
#define BN_NIST_192_TOP (192 + BN_BITS2 - 1) / BN_BITS2
14
3.86M
#define BN_NIST_224_TOP (224 + BN_BITS2 - 1) / BN_BITS2
15
0
#define BN_NIST_256_TOP (256 + BN_BITS2 - 1) / BN_BITS2
16
481k
#define BN_NIST_384_TOP (384 + BN_BITS2 - 1) / BN_BITS2
17
2.23M
#define BN_NIST_521_TOP (521 + BN_BITS2 - 1) / BN_BITS2
18
19
/* pre-computed tables are "carry-less" values of modulus*(i+1) */
20
#if BN_BITS2 == 64
21
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
22
    { 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFFULL },
23
    { 0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFFULL },
24
    { 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFCULL, 0xFFFFFFFFFFFFFFFFULL }
25
};
26
27
static const BN_ULONG _nist_p_192_sqr[] = {
28
    0x0000000000000001ULL, 0x0000000000000002ULL, 0x0000000000000001ULL,
29
    0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFFULL
30
};
31
32
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
33
    { 0x0000000000000001ULL, 0xFFFFFFFF00000000ULL,
34
        0xFFFFFFFFFFFFFFFFULL, 0x00000000FFFFFFFFULL },
35
    { 0x0000000000000002ULL, 0xFFFFFFFE00000000ULL,
36
        0xFFFFFFFFFFFFFFFFULL, 0x00000001FFFFFFFFULL } /* this one is
37
                                                        * "carry-full" */
38
};
39
40
static const BN_ULONG _nist_p_224_sqr[] = {
41
    0x0000000000000001ULL, 0xFFFFFFFE00000000ULL,
42
    0xFFFFFFFFFFFFFFFFULL, 0x0000000200000000ULL,
43
    0x0000000000000000ULL, 0xFFFFFFFFFFFFFFFEULL,
44
    0xFFFFFFFFFFFFFFFFULL
45
};
46
47
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
48
    { 0xFFFFFFFFFFFFFFFFULL, 0x00000000FFFFFFFFULL,
49
        0x0000000000000000ULL, 0xFFFFFFFF00000001ULL },
50
    { 0xFFFFFFFFFFFFFFFEULL, 0x00000001FFFFFFFFULL,
51
        0x0000000000000000ULL, 0xFFFFFFFE00000002ULL },
52
    { 0xFFFFFFFFFFFFFFFDULL, 0x00000002FFFFFFFFULL,
53
        0x0000000000000000ULL, 0xFFFFFFFD00000003ULL },
54
    { 0xFFFFFFFFFFFFFFFCULL, 0x00000003FFFFFFFFULL,
55
        0x0000000000000000ULL, 0xFFFFFFFC00000004ULL },
56
    { 0xFFFFFFFFFFFFFFFBULL, 0x00000004FFFFFFFFULL,
57
        0x0000000000000000ULL, 0xFFFFFFFB00000005ULL },
58
};
59
60
static const BN_ULONG _nist_p_256_sqr[] = {
61
    0x0000000000000001ULL, 0xFFFFFFFE00000000ULL,
62
    0xFFFFFFFFFFFFFFFFULL, 0x00000001FFFFFFFEULL,
63
    0x00000001FFFFFFFEULL, 0x00000001FFFFFFFEULL,
64
    0xFFFFFFFE00000001ULL, 0xFFFFFFFE00000002ULL
65
};
66
67
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
68
    { 0x00000000FFFFFFFFULL, 0xFFFFFFFF00000000ULL, 0xFFFFFFFFFFFFFFFEULL,
69
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
70
    { 0x00000001FFFFFFFEULL, 0xFFFFFFFE00000000ULL, 0xFFFFFFFFFFFFFFFDULL,
71
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
72
    { 0x00000002FFFFFFFDULL, 0xFFFFFFFD00000000ULL, 0xFFFFFFFFFFFFFFFCULL,
73
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
74
    { 0x00000003FFFFFFFCULL, 0xFFFFFFFC00000000ULL, 0xFFFFFFFFFFFFFFFBULL,
75
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
76
    { 0x00000004FFFFFFFBULL, 0xFFFFFFFB00000000ULL, 0xFFFFFFFFFFFFFFFAULL,
77
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
78
};
79
80
static const BN_ULONG _nist_p_384_sqr[] = {
81
    0xFFFFFFFE00000001ULL, 0x0000000200000000ULL, 0xFFFFFFFE00000000ULL,
82
    0x0000000200000000ULL, 0x0000000000000001ULL, 0x0000000000000000ULL,
83
    0x00000001FFFFFFFEULL, 0xFFFFFFFE00000000ULL, 0xFFFFFFFFFFFFFFFDULL,
84
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL
85
};
86
87
static const BN_ULONG _nist_p_521[] = { 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
88
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
89
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
90
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
91
    0x00000000000001FFULL };
92
93
static const BN_ULONG _nist_p_521_sqr[] = {
94
    0x0000000000000001ULL, 0x0000000000000000ULL, 0x0000000000000000ULL,
95
    0x0000000000000000ULL, 0x0000000000000000ULL, 0x0000000000000000ULL,
96
    0x0000000000000000ULL, 0x0000000000000000ULL, 0xFFFFFFFFFFFFFC00ULL,
97
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
98
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
99
    0xFFFFFFFFFFFFFFFFULL, 0x000000000003FFFFULL
100
};
101
#elif BN_BITS2 == 32
102
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
103
    { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
104
    { 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
105
    { 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFC, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF }
106
};
107
108
static const BN_ULONG _nist_p_192_sqr[] = {
109
    0x00000001, 0x00000000, 0x00000002, 0x00000000, 0x00000001, 0x00000000,
110
    0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF
111
};
112
113
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
114
    { 0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFF,
115
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
116
    { 0x00000002, 0x00000000, 0x00000000, 0xFFFFFFFE,
117
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF }
118
};
119
120
static const BN_ULONG _nist_p_224_sqr[] = {
121
    0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFE,
122
    0xFFFFFFFF, 0xFFFFFFFF, 0x00000000, 0x00000002,
123
    0x00000000, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFF,
124
    0xFFFFFFFF, 0xFFFFFFFF
125
};
126
127
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
128
    { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000000,
129
        0x00000000, 0x00000000, 0x00000001, 0xFFFFFFFF },
130
    { 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000001,
131
        0x00000000, 0x00000000, 0x00000002, 0xFFFFFFFE },
132
    { 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000002,
133
        0x00000000, 0x00000000, 0x00000003, 0xFFFFFFFD },
134
    { 0xFFFFFFFC, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000003,
135
        0x00000000, 0x00000000, 0x00000004, 0xFFFFFFFC },
136
    { 0xFFFFFFFB, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000004,
137
        0x00000000, 0x00000000, 0x00000005, 0xFFFFFFFB },
138
};
139
140
static const BN_ULONG _nist_p_256_sqr[] = {
141
    0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFE,
142
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFE, 0x00000001,
143
    0xFFFFFFFE, 0x00000001, 0xFFFFFFFE, 0x00000001,
144
    0x00000001, 0xFFFFFFFE, 0x00000002, 0xFFFFFFFE
145
};
146
147
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
148
    { 0xFFFFFFFF, 0x00000000, 0x00000000, 0xFFFFFFFF, 0xFFFFFFFE, 0xFFFFFFFF,
149
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
150
    { 0xFFFFFFFE, 0x00000001, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFD, 0xFFFFFFFF,
151
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
152
    { 0xFFFFFFFD, 0x00000002, 0x00000000, 0xFFFFFFFD, 0xFFFFFFFC, 0xFFFFFFFF,
153
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
154
    { 0xFFFFFFFC, 0x00000003, 0x00000000, 0xFFFFFFFC, 0xFFFFFFFB, 0xFFFFFFFF,
155
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
156
    { 0xFFFFFFFB, 0x00000004, 0x00000000, 0xFFFFFFFB, 0xFFFFFFFA, 0xFFFFFFFF,
157
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
158
};
159
160
static const BN_ULONG _nist_p_384_sqr[] = {
161
    0x00000001, 0xFFFFFFFE, 0x00000000, 0x00000002, 0x00000000, 0xFFFFFFFE,
162
    0x00000000, 0x00000002, 0x00000001, 0x00000000, 0x00000000, 0x00000000,
163
    0xFFFFFFFE, 0x00000001, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFD, 0xFFFFFFFF,
164
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF
165
};
166
167
static const BN_ULONG _nist_p_521[] = { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
168
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
169
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
170
    0xFFFFFFFF, 0x000001FF };
171
172
static const BN_ULONG _nist_p_521_sqr[] = {
173
    0x00000001, 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
174
    0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
175
    0x00000000, 0x00000000, 0x00000000, 0x00000000, 0xFFFFFC00, 0xFFFFFFFF,
176
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
177
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
178
    0xFFFFFFFF, 0xFFFFFFFF, 0x0003FFFF
179
};
180
#else
181
#error "unsupported BN_BITS2"
182
#endif
183
184
static const BIGNUM ossl_bignum_nist_p_192 = {
185
    (BN_ULONG *)_nist_p_192[0],
186
    BN_NIST_192_TOP,
187
    BN_NIST_192_TOP,
188
    0,
189
    BN_FLG_STATIC_DATA
190
};
191
192
static const BIGNUM ossl_bignum_nist_p_224 = {
193
    (BN_ULONG *)_nist_p_224[0],
194
    BN_NIST_224_TOP,
195
    BN_NIST_224_TOP,
196
    0,
197
    BN_FLG_STATIC_DATA
198
};
199
200
static const BIGNUM ossl_bignum_nist_p_256 = {
201
    (BN_ULONG *)_nist_p_256[0],
202
    BN_NIST_256_TOP,
203
    BN_NIST_256_TOP,
204
    0,
205
    BN_FLG_STATIC_DATA
206
};
207
208
static const BIGNUM ossl_bignum_nist_p_384 = {
209
    (BN_ULONG *)_nist_p_384[0],
210
    BN_NIST_384_TOP,
211
    BN_NIST_384_TOP,
212
    0,
213
    BN_FLG_STATIC_DATA
214
};
215
216
static const BIGNUM ossl_bignum_nist_p_521 = {
217
    (BN_ULONG *)_nist_p_521,
218
    BN_NIST_521_TOP,
219
    BN_NIST_521_TOP,
220
    0,
221
    BN_FLG_STATIC_DATA
222
};
223
224
const BIGNUM *BN_get0_nist_prime_192(void)
225
0
{
226
0
    return &ossl_bignum_nist_p_192;
227
0
}
228
229
const BIGNUM *BN_get0_nist_prime_224(void)
230
0
{
231
0
    return &ossl_bignum_nist_p_224;
232
0
}
233
234
const BIGNUM *BN_get0_nist_prime_256(void)
235
0
{
236
0
    return &ossl_bignum_nist_p_256;
237
0
}
238
239
const BIGNUM *BN_get0_nist_prime_384(void)
240
0
{
241
0
    return &ossl_bignum_nist_p_384;
242
0
}
243
244
const BIGNUM *BN_get0_nist_prime_521(void)
245
0
{
246
0
    return &ossl_bignum_nist_p_521;
247
0
}
248
249
/*
250
 * To avoid more recent compilers (specifically clang-14) from treating this
251
 * code as a violation of the strict aliasing conditions and omitting it, this
252
 * cannot be declared as a function.  Moreover, the dst parameter cannot be
253
 * cached in a local since this no longer references the union and again falls
254
 * foul of the strict aliasing criteria.  Refer to #18225 for the initial
255
 * diagnostics and llvm/llvm-project#55255 for the later discussions with the
256
 * LLVM developers.  The problem boils down to if an array in the union is
257
 * converted to a pointer or if it is used directly.
258
 *
259
 * This function was inlined regardless, so there is no space cost to be
260
 * paid for making it a macro.
261
 */
262
#define nist_cp_bn_0(dst, src_in, top, max) \
263
696k
    {                                       \
264
696k
        int ii;                             \
265
696k
        const BN_ULONG *src = src_in;       \
266
696k
                                            \
267
4.46M
        for (ii = 0; ii < top; ii++)        \
268
3.76M
            (dst)[ii] = src[ii];            \
269
848k
        for (; ii < max; ii++)              \
270
696k
            (dst)[ii] = 0;                  \
271
696k
    }
272
273
static void nist_cp_bn(BN_ULONG *dst, const BN_ULONG *src, int top)
274
696k
{
275
696k
    int i;
276
277
4.61M
    for (i = 0; i < top; i++)
278
3.91M
        dst[i] = src[i];
279
696k
}
280
281
#if BN_BITS2 == 64
282
#define bn_cp_64(to, n, from, m) (to)[n] = (m >= 0) ? ((from)[m]) : 0;
283
#define bn_64_set_0(to, n) (to)[n] = (BN_ULONG)0;
284
/*
285
 * two following macros are implemented under assumption that they
286
 * are called in a sequence with *ascending* n, i.e. as they are...
287
 */
288
9.37M
#define bn_cp_32_naked(to, n, from, m) (((n) & 1) ? (to[(n) / 2] |= ((m) & 1) ? (from[(m) / 2] & BN_MASK2h) : (from[(m) / 2] << 32)) \
289
9.37M
                                                  : (to[(n) / 2] = ((m) & 1) ? (from[(m) / 2] >> 32) : (from[(m) / 2] & BN_MASK2l)))
290
4.29M
#define bn_32_set_0(to, n) (((n) & 1) ? (to[(n) / 2] &= BN_MASK2l) : (to[(n) / 2] = 0));
291
13.6M
#define bn_cp_32(to, n, from, m) ((m) >= 0) ? bn_cp_32_naked(to, n, from, m) : bn_32_set_0(to, n)
292
#if defined(L_ENDIAN)
293
#if defined(__arch64__)
294
#define NIST_INT64 long
295
#else
296
133k
#define NIST_INT64 long long
297
#endif
298
#endif
299
#else
300
#define bn_cp_64(to, n, from, m)                      \
301
    {                                                 \
302
        bn_cp_32(to, (n) * 2, from, (m) * 2);         \
303
        bn_cp_32(to, (n) * 2 + 1, from, (m) * 2 + 1); \
304
    }
305
#define bn_64_set_0(to, n)            \
306
    {                                 \
307
        bn_32_set_0(to, (n) * 2);     \
308
        bn_32_set_0(to, (n) * 2 + 1); \
309
    }
310
#define bn_cp_32(to, n, from, m) (to)[n] = (m >= 0) ? ((from)[m]) : 0;
311
#define bn_32_set_0(to, n) (to)[n] = (BN_ULONG)0;
312
#if defined(_WIN32) && !defined(__GNUC__)
313
#define NIST_INT64 __int64
314
#elif defined(BN_LLONG)
315
#define NIST_INT64 long long
316
#endif
317
#endif /* BN_BITS2 != 64 */
318
319
#ifdef NIST_INT64
320
/* Helpers to load/store a 32-bit word (uint32_t) from/into a memory
321
 * location and avoid potential aliasing issue.  */
322
static ossl_inline uint32_t load_u32(const void *ptr)
323
1.60M
{
324
1.60M
    uint32_t tmp;
325
326
1.60M
    memcpy(&tmp, ptr, sizeof(tmp));
327
1.60M
    return tmp;
328
1.60M
}
329
330
static ossl_inline void store_lo32(void *ptr, NIST_INT64 val)
331
1.60M
{
332
    /* A cast is needed for big-endian system: on a 32-bit BE system
333
     * NIST_INT64 may be defined as well if the compiler supports 64-bit
334
     * long long.  */
335
1.60M
    uint32_t tmp = (uint32_t)val;
336
337
1.60M
    memcpy(ptr, &tmp, sizeof(tmp));
338
1.60M
}
339
#endif /* NIST_INT64 */
340
341
#define nist_set_192(to, from, a1, a2, a3)      \
342
    {                                           \
343
        bn_cp_64(to, 0, from, (a3) - 3)         \
344
            bn_cp_64(to, 1, from, (a2) - 3)     \
345
                bn_cp_64(to, 2, from, (a1) - 3) \
346
    }
347
348
int BN_nist_mod_192(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
349
    BN_CTX *ctx)
350
0
{
351
0
    int top = a->top, i;
352
0
    int carry;
353
0
    register BN_ULONG *r_d, *a_d = a->d;
354
0
    union {
355
0
        BN_ULONG bn[BN_NIST_192_TOP];
356
0
        unsigned int ui[BN_NIST_192_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
357
0
    } buf;
358
0
    BN_ULONG c_d[BN_NIST_192_TOP], *res;
359
0
    static const BIGNUM ossl_bignum_nist_p_192_sqr = {
360
0
        (BN_ULONG *)_nist_p_192_sqr,
361
0
        OSSL_NELEM(_nist_p_192_sqr),
362
0
        OSSL_NELEM(_nist_p_192_sqr),
363
0
        0, BN_FLG_STATIC_DATA
364
0
    };
365
366
0
    field = &ossl_bignum_nist_p_192; /* just to make sure */
367
368
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_192_sqr) >= 0)
369
0
        return BN_nnmod(r, a, field, ctx);
370
371
0
    i = BN_ucmp(field, a);
372
0
    if (i == 0) {
373
0
        BN_zero(r);
374
0
        return 1;
375
0
    } else if (i > 0)
376
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
377
378
0
    if (r != a) {
379
0
        if (!bn_wexpand(r, BN_NIST_192_TOP))
380
0
            return 0;
381
0
        r_d = r->d;
382
0
        nist_cp_bn(r_d, a_d, BN_NIST_192_TOP);
383
0
    } else
384
0
        r_d = a_d;
385
386
0
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_192_TOP, top - BN_NIST_192_TOP,
387
0
        BN_NIST_192_TOP);
388
389
0
#if defined(NIST_INT64)
390
0
    {
391
0
        NIST_INT64 acc; /* accumulator */
392
0
        unsigned int *rp = (unsigned int *)r_d;
393
0
        const unsigned int *bp = (const unsigned int *)buf.ui;
394
395
0
        acc = load_u32(&rp[0]);
396
0
        acc += bp[3 * 2 - 6];
397
0
        acc += bp[5 * 2 - 6];
398
0
        store_lo32(&rp[0], acc);
399
0
        acc >>= 32;
400
401
0
        acc += load_u32(&rp[1]);
402
0
        acc += bp[3 * 2 - 5];
403
0
        acc += bp[5 * 2 - 5];
404
0
        store_lo32(&rp[1], acc);
405
0
        acc >>= 32;
406
407
0
        acc += load_u32(&rp[2]);
408
0
        acc += bp[3 * 2 - 6];
409
0
        acc += bp[4 * 2 - 6];
410
0
        acc += bp[5 * 2 - 6];
411
0
        store_lo32(&rp[2], acc);
412
0
        acc >>= 32;
413
414
0
        acc += load_u32(&rp[3]);
415
0
        acc += bp[3 * 2 - 5];
416
0
        acc += bp[4 * 2 - 5];
417
0
        acc += bp[5 * 2 - 5];
418
0
        store_lo32(&rp[3], acc);
419
0
        acc >>= 32;
420
421
0
        acc += load_u32(&rp[4]);
422
0
        acc += bp[4 * 2 - 6];
423
0
        acc += bp[5 * 2 - 6];
424
0
        store_lo32(&rp[4], acc);
425
0
        acc >>= 32;
426
427
0
        acc += load_u32(&rp[5]);
428
0
        acc += bp[4 * 2 - 5];
429
0
        acc += bp[5 * 2 - 5];
430
0
        store_lo32(&rp[5], acc);
431
432
0
        carry = (int)(acc >> 32);
433
0
    }
434
#else
435
    {
436
        BN_ULONG t_d[BN_NIST_192_TOP];
437
438
        nist_set_192(t_d, buf.bn, 0, 3, 3);
439
        carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
440
        nist_set_192(t_d, buf.bn, 4, 4, 0);
441
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
442
        nist_set_192(t_d, buf.bn, 5, 5, 5)
443
            carry
444
            += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
445
    }
446
#endif
447
0
    if (carry > 0)
448
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_192[carry - 1],
449
0
            BN_NIST_192_TOP);
450
0
    else
451
0
        carry = 1;
452
453
    /*
454
     * we need 'if (carry==0 || result>=modulus) result-=modulus;'
455
     * as comparison implies subtraction, we can write
456
     * 'tmp=result-modulus; if (!carry || !borrow) result=tmp;'
457
     * this is what happens below, but without explicit if:-) a.
458
     */
459
0
    res = (bn_sub_words(c_d, r_d, _nist_p_192[0], BN_NIST_192_TOP) && carry)
460
0
        ? r_d
461
0
        : c_d;
462
0
    nist_cp_bn(r_d, res, BN_NIST_192_TOP);
463
0
    r->top = BN_NIST_192_TOP;
464
0
    bn_correct_top(r);
465
466
0
    return 1;
467
0
}
468
469
typedef BN_ULONG (*bn_addsub_f)(BN_ULONG *, const BN_ULONG *,
470
    const BN_ULONG *, int);
471
472
#define nist_set_224(to, from, a1, a2, a3, a4, a5, a6, a7)      \
473
1.95M
    {                                                           \
474
1.95M
        bn_cp_32(to, 0, from, (a7) - 7)                         \
475
1.95M
            bn_cp_32(to, 1, from, (a6) - 7)                     \
476
1.95M
                bn_cp_32(to, 2, from, (a5) - 7)                 \
477
1.95M
                    bn_cp_32(to, 3, from, (a4) - 7)             \
478
1.95M
                        bn_cp_32(to, 4, from, (a3) - 7)         \
479
1.95M
                            bn_cp_32(to, 5, from, (a2) - 7)     \
480
1.95M
                                bn_cp_32(to, 6, from, (a1) - 7) \
481
1.95M
    }
482
483
int BN_nist_mod_224(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
484
    BN_CTX *ctx)
485
396k
{
486
396k
    int top = a->top, i;
487
396k
    int carry;
488
396k
    BN_ULONG *r_d, *a_d = a->d;
489
396k
    union {
490
396k
        BN_ULONG bn[BN_NIST_224_TOP];
491
396k
        unsigned int ui[BN_NIST_224_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
492
396k
    } buf;
493
396k
    BN_ULONG c_d[BN_NIST_224_TOP], *res;
494
396k
    bn_addsub_f adjust;
495
396k
    static const BIGNUM ossl_bignum_nist_p_224_sqr = {
496
396k
        (BN_ULONG *)_nist_p_224_sqr,
497
396k
        OSSL_NELEM(_nist_p_224_sqr),
498
396k
        OSSL_NELEM(_nist_p_224_sqr),
499
396k
        0, BN_FLG_STATIC_DATA
500
396k
    };
501
502
396k
    field = &ossl_bignum_nist_p_224; /* just to make sure */
503
504
396k
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_224_sqr) >= 0)
505
0
        return BN_nnmod(r, a, field, ctx);
506
507
396k
    i = BN_ucmp(field, a);
508
396k
    if (i == 0) {
509
0
        BN_zero(r);
510
0
        return 1;
511
396k
    } else if (i > 0)
512
5.39k
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
513
514
390k
    if (r != a) {
515
0
        if (!bn_wexpand(r, BN_NIST_224_TOP))
516
0
            return 0;
517
0
        r_d = r->d;
518
0
        nist_cp_bn(r_d, a_d, BN_NIST_224_TOP);
519
0
    } else
520
390k
        r_d = a_d;
521
522
390k
#if BN_BITS2 == 64
523
    /* copy upper 256 bits of 448 bit number ... */
524
390k
    nist_cp_bn_0(c_d, a_d + (BN_NIST_224_TOP - 1),
525
390k
        top - (BN_NIST_224_TOP - 1), BN_NIST_224_TOP);
526
    /* ... and right shift by 32 to obtain upper 224 bits */
527
390k
    nist_set_224(buf.bn, c_d, 14, 13, 12, 11, 10, 9, 8);
528
    /* truncate lower part to 224 bits too */
529
390k
    r_d[BN_NIST_224_TOP - 1] &= BN_MASK2l;
530
#else
531
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_224_TOP, top - BN_NIST_224_TOP,
532
        BN_NIST_224_TOP);
533
#endif
534
535
#if defined(NIST_INT64) && BN_BITS2 != 64
536
    {
537
        NIST_INT64 acc; /* accumulator */
538
        unsigned int *rp = (unsigned int *)r_d;
539
        const unsigned int *bp = (const unsigned int *)buf.ui;
540
541
        acc = rp[0];
542
        acc -= bp[7 - 7];
543
        acc -= bp[11 - 7];
544
        rp[0] = (unsigned int)acc;
545
        acc >>= 32;
546
547
        acc += rp[1];
548
        acc -= bp[8 - 7];
549
        acc -= bp[12 - 7];
550
        rp[1] = (unsigned int)acc;
551
        acc >>= 32;
552
553
        acc += rp[2];
554
        acc -= bp[9 - 7];
555
        acc -= bp[13 - 7];
556
        rp[2] = (unsigned int)acc;
557
        acc >>= 32;
558
559
        acc += rp[3];
560
        acc += bp[7 - 7];
561
        acc += bp[11 - 7];
562
        acc -= bp[10 - 7];
563
        rp[3] = (unsigned int)acc;
564
        acc >>= 32;
565
566
        acc += rp[4];
567
        acc += bp[8 - 7];
568
        acc += bp[12 - 7];
569
        acc -= bp[11 - 7];
570
        rp[4] = (unsigned int)acc;
571
        acc >>= 32;
572
573
        acc += rp[5];
574
        acc += bp[9 - 7];
575
        acc += bp[13 - 7];
576
        acc -= bp[12 - 7];
577
        rp[5] = (unsigned int)acc;
578
        acc >>= 32;
579
580
        acc += rp[6];
581
        acc += bp[10 - 7];
582
        acc -= bp[13 - 7];
583
        rp[6] = (unsigned int)acc;
584
585
        carry = (int)(acc >> 32);
586
#if BN_BITS2 == 64
587
        rp[7] = carry;
588
#endif
589
    }
590
#else
591
390k
    {
592
390k
        BN_ULONG t_d[BN_NIST_224_TOP];
593
594
390k
        nist_set_224(t_d, buf.bn, 10, 9, 8, 7, 0, 0, 0);
595
390k
        carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
596
390k
        nist_set_224(t_d, buf.bn, 0, 13, 12, 11, 0, 0, 0);
597
390k
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
598
390k
        nist_set_224(t_d, buf.bn, 13, 12, 11, 10, 9, 8, 7);
599
390k
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);
600
390k
        nist_set_224(t_d, buf.bn, 0, 0, 0, 0, 13, 12, 11);
601
390k
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);
602
603
390k
#if BN_BITS2 == 64
604
390k
        carry = (int)(r_d[BN_NIST_224_TOP - 1] >> 32);
605
390k
#endif
606
390k
    }
607
390k
#endif
608
390k
    adjust = bn_sub_words;
609
390k
    if (carry > 0) {
610
166k
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_224[carry - 1],
611
166k
            BN_NIST_224_TOP);
612
166k
#if BN_BITS2 == 64
613
166k
        carry = (int)(~(r_d[BN_NIST_224_TOP - 1] >> 32)) & 1;
614
166k
#endif
615
224k
    } else if (carry < 0) {
616
        /*
617
         * it's a bit more complicated logic in this case. if bn_add_words
618
         * yields no carry, then result has to be adjusted by unconditionally
619
         * *adding* the modulus. but if it does, then result has to be
620
         * compared to the modulus and conditionally adjusted by
621
         * *subtracting* the latter.
622
         */
623
19.8k
        carry = (int)bn_add_words(r_d, r_d, _nist_p_224[-carry - 1],
624
19.8k
            BN_NIST_224_TOP);
625
19.8k
        adjust = carry ? bn_sub_words : bn_add_words;
626
19.8k
    } else
627
204k
        carry = 1;
628
629
    /* otherwise it's effectively same as in BN_nist_mod_192... */
630
390k
    res = ((*adjust)(c_d, r_d, _nist_p_224[0], BN_NIST_224_TOP) && carry)
631
390k
        ? r_d
632
390k
        : c_d;
633
390k
    nist_cp_bn(r_d, res, BN_NIST_224_TOP);
634
390k
    r->top = BN_NIST_224_TOP;
635
390k
    bn_correct_top(r);
636
637
390k
    return 1;
638
390k
}
639
640
#define nist_set_256(to, from, a1, a2, a3, a4, a5, a6, a7, a8)      \
641
    {                                                               \
642
        bn_cp_32(to, 0, from, (a8) - 8)                             \
643
            bn_cp_32(to, 1, from, (a7) - 8)                         \
644
                bn_cp_32(to, 2, from, (a6) - 8)                     \
645
                    bn_cp_32(to, 3, from, (a5) - 8)                 \
646
                        bn_cp_32(to, 4, from, (a4) - 8)             \
647
                            bn_cp_32(to, 5, from, (a3) - 8)         \
648
                                bn_cp_32(to, 6, from, (a2) - 8)     \
649
                                    bn_cp_32(to, 7, from, (a1) - 8) \
650
    }
651
652
int BN_nist_mod_256(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
653
    BN_CTX *ctx)
654
0
{
655
0
    int i, top = a->top;
656
0
    int carry = 0;
657
0
    register BN_ULONG *a_d = a->d, *r_d;
658
0
    union {
659
0
        BN_ULONG bn[BN_NIST_256_TOP];
660
0
        unsigned int ui[BN_NIST_256_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
661
0
    } buf;
662
0
    BN_ULONG c_d[BN_NIST_256_TOP], *res;
663
0
    bn_addsub_f adjust;
664
0
    static const BIGNUM ossl_bignum_nist_p_256_sqr = {
665
0
        (BN_ULONG *)_nist_p_256_sqr,
666
0
        OSSL_NELEM(_nist_p_256_sqr),
667
0
        OSSL_NELEM(_nist_p_256_sqr),
668
0
        0, BN_FLG_STATIC_DATA
669
0
    };
670
671
0
    field = &ossl_bignum_nist_p_256; /* just to make sure */
672
673
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_256_sqr) >= 0)
674
0
        return BN_nnmod(r, a, field, ctx);
675
676
0
    i = BN_ucmp(field, a);
677
0
    if (i == 0) {
678
0
        BN_zero(r);
679
0
        return 1;
680
0
    } else if (i > 0)
681
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
682
683
0
    if (r != a) {
684
0
        if (!bn_wexpand(r, BN_NIST_256_TOP))
685
0
            return 0;
686
0
        r_d = r->d;
687
0
        nist_cp_bn(r_d, a_d, BN_NIST_256_TOP);
688
0
    } else
689
0
        r_d = a_d;
690
691
0
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_256_TOP, top - BN_NIST_256_TOP,
692
0
        BN_NIST_256_TOP);
693
694
0
#if defined(NIST_INT64)
695
0
    {
696
0
        NIST_INT64 acc; /* accumulator */
697
0
        unsigned int *rp = (unsigned int *)r_d;
698
0
        const unsigned int *bp = (const unsigned int *)buf.ui;
699
700
0
        acc = load_u32(&rp[0]);
701
0
        acc += bp[8 - 8];
702
0
        acc += bp[9 - 8];
703
0
        acc -= bp[11 - 8];
704
0
        acc -= bp[12 - 8];
705
0
        acc -= bp[13 - 8];
706
0
        acc -= bp[14 - 8];
707
0
        store_lo32(&rp[0], acc);
708
0
        acc >>= 32;
709
710
0
        acc += load_u32(&rp[1]);
711
0
        acc += bp[9 - 8];
712
0
        acc += bp[10 - 8];
713
0
        acc -= bp[12 - 8];
714
0
        acc -= bp[13 - 8];
715
0
        acc -= bp[14 - 8];
716
0
        acc -= bp[15 - 8];
717
0
        store_lo32(&rp[1], acc);
718
0
        acc >>= 32;
719
720
0
        acc += load_u32(&rp[2]);
721
0
        acc += bp[10 - 8];
722
0
        acc += bp[11 - 8];
723
0
        acc -= bp[13 - 8];
724
0
        acc -= bp[14 - 8];
725
0
        acc -= bp[15 - 8];
726
0
        store_lo32(&rp[2], acc);
727
0
        acc >>= 32;
728
729
0
        acc += load_u32(&rp[3]);
730
0
        acc += bp[11 - 8];
731
0
        acc += bp[11 - 8];
732
0
        acc += bp[12 - 8];
733
0
        acc += bp[12 - 8];
734
0
        acc += bp[13 - 8];
735
0
        acc -= bp[15 - 8];
736
0
        acc -= bp[8 - 8];
737
0
        acc -= bp[9 - 8];
738
0
        store_lo32(&rp[3], acc);
739
0
        acc >>= 32;
740
741
0
        acc += load_u32(&rp[4]);
742
0
        acc += bp[12 - 8];
743
0
        acc += bp[12 - 8];
744
0
        acc += bp[13 - 8];
745
0
        acc += bp[13 - 8];
746
0
        acc += bp[14 - 8];
747
0
        acc -= bp[9 - 8];
748
0
        acc -= bp[10 - 8];
749
0
        store_lo32(&rp[4], acc);
750
0
        acc >>= 32;
751
752
0
        acc += load_u32(&rp[5]);
753
0
        acc += bp[13 - 8];
754
0
        acc += bp[13 - 8];
755
0
        acc += bp[14 - 8];
756
0
        acc += bp[14 - 8];
757
0
        acc += bp[15 - 8];
758
0
        acc -= bp[10 - 8];
759
0
        acc -= bp[11 - 8];
760
0
        store_lo32(&rp[5], acc);
761
0
        acc >>= 32;
762
763
0
        acc += load_u32(&rp[6]);
764
0
        acc += bp[14 - 8];
765
0
        acc += bp[14 - 8];
766
0
        acc += bp[15 - 8];
767
0
        acc += bp[15 - 8];
768
0
        acc += bp[14 - 8];
769
0
        acc += bp[13 - 8];
770
0
        acc -= bp[8 - 8];
771
0
        acc -= bp[9 - 8];
772
0
        store_lo32(&rp[6], acc);
773
0
        acc >>= 32;
774
775
0
        acc += load_u32(&rp[7]);
776
0
        acc += bp[15 - 8];
777
0
        acc += bp[15 - 8];
778
0
        acc += bp[15 - 8];
779
0
        acc += bp[8 - 8];
780
0
        acc -= bp[10 - 8];
781
0
        acc -= bp[11 - 8];
782
0
        acc -= bp[12 - 8];
783
0
        acc -= bp[13 - 8];
784
0
        store_lo32(&rp[7], acc);
785
786
0
        carry = (int)(acc >> 32);
787
0
    }
788
#else
789
    {
790
        BN_ULONG t_d[BN_NIST_256_TOP];
791
792
        /*
793
         * S1
794
         */
795
        nist_set_256(t_d, buf.bn, 15, 14, 13, 12, 11, 0, 0, 0);
796
        /*
797
         * S2
798
         */
799
        nist_set_256(c_d, buf.bn, 0, 15, 14, 13, 12, 0, 0, 0);
800
        carry = (int)bn_add_words(t_d, t_d, c_d, BN_NIST_256_TOP);
801
        /* left shift */
802
        {
803
            register BN_ULONG *ap, t, c;
804
            ap = t_d;
805
            c = 0;
806
            for (i = BN_NIST_256_TOP; i != 0; --i) {
807
                t = *ap;
808
                *(ap++) = ((t << 1) | c) & BN_MASK2;
809
                c = (t & BN_TBIT) ? 1 : 0;
810
            }
811
            carry <<= 1;
812
            carry |= c;
813
        }
814
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
815
        /*
816
         * S3
817
         */
818
        nist_set_256(t_d, buf.bn, 15, 14, 0, 0, 0, 10, 9, 8);
819
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
820
        /*
821
         * S4
822
         */
823
        nist_set_256(t_d, buf.bn, 8, 13, 15, 14, 13, 11, 10, 9);
824
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
825
        /*
826
         * D1
827
         */
828
        nist_set_256(t_d, buf.bn, 10, 8, 0, 0, 0, 13, 12, 11);
829
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
830
        /*
831
         * D2
832
         */
833
        nist_set_256(t_d, buf.bn, 11, 9, 0, 0, 15, 14, 13, 12);
834
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
835
        /*
836
         * D3
837
         */
838
        nist_set_256(t_d, buf.bn, 12, 0, 10, 9, 8, 15, 14, 13);
839
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
840
        /*
841
         * D4
842
         */
843
        nist_set_256(t_d, buf.bn, 13, 0, 11, 10, 9, 0, 15, 14);
844
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
845
    }
846
#endif
847
    /* see BN_nist_mod_224 for explanation */
848
0
    adjust = bn_sub_words;
849
0
    if (carry > 0)
850
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_256[carry - 1],
851
0
            BN_NIST_256_TOP);
852
0
    else if (carry < 0) {
853
0
        carry = (int)bn_add_words(r_d, r_d, _nist_p_256[-carry - 1],
854
0
            BN_NIST_256_TOP);
855
0
        adjust = carry ? bn_sub_words : bn_add_words;
856
0
    } else
857
0
        carry = 1;
858
859
0
    res = ((*adjust)(c_d, r_d, _nist_p_256[0], BN_NIST_256_TOP) && carry)
860
0
        ? r_d
861
0
        : c_d;
862
0
    nist_cp_bn(r_d, res, BN_NIST_256_TOP);
863
0
    r->top = BN_NIST_256_TOP;
864
0
    bn_correct_top(r);
865
866
0
    return 1;
867
0
}
868
869
#define nist_set_384(to, from, a1, a2, a3, a4, a5, a6, a7, a8, a9, a10, a11, a12)     \
870
    {                                                                                 \
871
        bn_cp_32(to, 0, from, (a12) - 12)                                             \
872
            bn_cp_32(to, 1, from, (a11) - 12)                                         \
873
                bn_cp_32(to, 2, from, (a10) - 12)                                     \
874
                    bn_cp_32(to, 3, from, (a9) - 12)                                  \
875
                        bn_cp_32(to, 4, from, (a8) - 12)                              \
876
                            bn_cp_32(to, 5, from, (a7) - 12)                          \
877
                                bn_cp_32(to, 6, from, (a6) - 12)                      \
878
                                    bn_cp_32(to, 7, from, (a5) - 12)                  \
879
                                        bn_cp_32(to, 8, from, (a4) - 12)              \
880
                                            bn_cp_32(to, 9, from, (a3) - 12)          \
881
                                                bn_cp_32(to, 10, from, (a2) - 12)     \
882
                                                    bn_cp_32(to, 11, from, (a1) - 12) \
883
    }
884
885
int BN_nist_mod_384(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
886
    BN_CTX *ctx)
887
135k
{
888
135k
    int i, top = a->top;
889
135k
    int carry = 0;
890
135k
    register BN_ULONG *r_d, *a_d = a->d;
891
135k
    union {
892
135k
        BN_ULONG bn[BN_NIST_384_TOP];
893
135k
        unsigned int ui[BN_NIST_384_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
894
135k
    } buf;
895
135k
    BN_ULONG c_d[BN_NIST_384_TOP], *res;
896
135k
    bn_addsub_f adjust;
897
135k
    static const BIGNUM ossl_bignum_nist_p_384_sqr = {
898
135k
        (BN_ULONG *)_nist_p_384_sqr,
899
135k
        OSSL_NELEM(_nist_p_384_sqr),
900
135k
        OSSL_NELEM(_nist_p_384_sqr),
901
135k
        0, BN_FLG_STATIC_DATA
902
135k
    };
903
904
135k
    field = &ossl_bignum_nist_p_384; /* just to make sure */
905
906
135k
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_384_sqr) >= 0)
907
0
        return BN_nnmod(r, a, field, ctx);
908
909
135k
    i = BN_ucmp(field, a);
910
135k
    if (i == 0) {
911
0
        BN_zero(r);
912
0
        return 1;
913
135k
    } else if (i > 0)
914
2.03k
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
915
916
133k
    if (r != a) {
917
0
        if (!bn_wexpand(r, BN_NIST_384_TOP))
918
0
            return 0;
919
0
        r_d = r->d;
920
0
        nist_cp_bn(r_d, a_d, BN_NIST_384_TOP);
921
0
    } else
922
133k
        r_d = a_d;
923
924
133k
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_384_TOP, top - BN_NIST_384_TOP,
925
133k
        BN_NIST_384_TOP);
926
927
133k
#if defined(NIST_INT64)
928
133k
    {
929
133k
        NIST_INT64 acc; /* accumulator */
930
133k
        unsigned int *rp = (unsigned int *)r_d;
931
133k
        const unsigned int *bp = (const unsigned int *)buf.ui;
932
933
133k
        acc = load_u32(&rp[0]);
934
133k
        acc += bp[12 - 12];
935
133k
        acc += bp[21 - 12];
936
133k
        acc += bp[20 - 12];
937
133k
        acc -= bp[23 - 12];
938
133k
        store_lo32(&rp[0], acc);
939
133k
        acc >>= 32;
940
941
133k
        acc += load_u32(&rp[1]);
942
133k
        acc += bp[13 - 12];
943
133k
        acc += bp[22 - 12];
944
133k
        acc += bp[23 - 12];
945
133k
        acc -= bp[12 - 12];
946
133k
        acc -= bp[20 - 12];
947
133k
        store_lo32(&rp[1], acc);
948
133k
        acc >>= 32;
949
950
133k
        acc += load_u32(&rp[2]);
951
133k
        acc += bp[14 - 12];
952
133k
        acc += bp[23 - 12];
953
133k
        acc -= bp[13 - 12];
954
133k
        acc -= bp[21 - 12];
955
133k
        store_lo32(&rp[2], acc);
956
133k
        acc >>= 32;
957
958
133k
        acc += load_u32(&rp[3]);
959
133k
        acc += bp[15 - 12];
960
133k
        acc += bp[12 - 12];
961
133k
        acc += bp[20 - 12];
962
133k
        acc += bp[21 - 12];
963
133k
        acc -= bp[14 - 12];
964
133k
        acc -= bp[22 - 12];
965
133k
        acc -= bp[23 - 12];
966
133k
        store_lo32(&rp[3], acc);
967
133k
        acc >>= 32;
968
969
133k
        acc += load_u32(&rp[4]);
970
133k
        acc += bp[21 - 12];
971
133k
        acc += bp[21 - 12];
972
133k
        acc += bp[16 - 12];
973
133k
        acc += bp[13 - 12];
974
133k
        acc += bp[12 - 12];
975
133k
        acc += bp[20 - 12];
976
133k
        acc += bp[22 - 12];
977
133k
        acc -= bp[15 - 12];
978
133k
        acc -= bp[23 - 12];
979
133k
        acc -= bp[23 - 12];
980
133k
        store_lo32(&rp[4], acc);
981
133k
        acc >>= 32;
982
983
133k
        acc += load_u32(&rp[5]);
984
133k
        acc += bp[22 - 12];
985
133k
        acc += bp[22 - 12];
986
133k
        acc += bp[17 - 12];
987
133k
        acc += bp[14 - 12];
988
133k
        acc += bp[13 - 12];
989
133k
        acc += bp[21 - 12];
990
133k
        acc += bp[23 - 12];
991
133k
        acc -= bp[16 - 12];
992
133k
        store_lo32(&rp[5], acc);
993
133k
        acc >>= 32;
994
995
133k
        acc += load_u32(&rp[6]);
996
133k
        acc += bp[23 - 12];
997
133k
        acc += bp[23 - 12];
998
133k
        acc += bp[18 - 12];
999
133k
        acc += bp[15 - 12];
1000
133k
        acc += bp[14 - 12];
1001
133k
        acc += bp[22 - 12];
1002
133k
        acc -= bp[17 - 12];
1003
133k
        store_lo32(&rp[6], acc);
1004
133k
        acc >>= 32;
1005
1006
133k
        acc += load_u32(&rp[7]);
1007
133k
        acc += bp[19 - 12];
1008
133k
        acc += bp[16 - 12];
1009
133k
        acc += bp[15 - 12];
1010
133k
        acc += bp[23 - 12];
1011
133k
        acc -= bp[18 - 12];
1012
133k
        store_lo32(&rp[7], acc);
1013
133k
        acc >>= 32;
1014
1015
133k
        acc += load_u32(&rp[8]);
1016
133k
        acc += bp[20 - 12];
1017
133k
        acc += bp[17 - 12];
1018
133k
        acc += bp[16 - 12];
1019
133k
        acc -= bp[19 - 12];
1020
133k
        store_lo32(&rp[8], acc);
1021
133k
        acc >>= 32;
1022
1023
133k
        acc += load_u32(&rp[9]);
1024
133k
        acc += bp[21 - 12];
1025
133k
        acc += bp[18 - 12];
1026
133k
        acc += bp[17 - 12];
1027
133k
        acc -= bp[20 - 12];
1028
133k
        store_lo32(&rp[9], acc);
1029
133k
        acc >>= 32;
1030
1031
133k
        acc += load_u32(&rp[10]);
1032
133k
        acc += bp[22 - 12];
1033
133k
        acc += bp[19 - 12];
1034
133k
        acc += bp[18 - 12];
1035
133k
        acc -= bp[21 - 12];
1036
133k
        store_lo32(&rp[10], acc);
1037
133k
        acc >>= 32;
1038
1039
133k
        acc += load_u32(&rp[11]);
1040
133k
        acc += bp[23 - 12];
1041
133k
        acc += bp[20 - 12];
1042
133k
        acc += bp[19 - 12];
1043
133k
        acc -= bp[22 - 12];
1044
133k
        store_lo32(&rp[11], acc);
1045
1046
133k
        carry = (int)(acc >> 32);
1047
133k
    }
1048
#else
1049
    {
1050
        BN_ULONG t_d[BN_NIST_384_TOP];
1051
1052
        /*
1053
         * S1
1054
         */
1055
        nist_set_256(t_d, buf.bn, 0, 0, 0, 0, 0, 23 - 4, 22 - 4, 21 - 4);
1056
        /* left shift */
1057
        {
1058
            register BN_ULONG *ap, t, c;
1059
            ap = t_d;
1060
            c = 0;
1061
            for (i = 3; i != 0; --i) {
1062
                t = *ap;
1063
                *(ap++) = ((t << 1) | c) & BN_MASK2;
1064
                c = (t & BN_TBIT) ? 1 : 0;
1065
            }
1066
            *ap = c;
1067
        }
1068
        carry = (int)bn_add_words(r_d + (128 / BN_BITS2), r_d + (128 / BN_BITS2),
1069
            t_d, BN_NIST_256_TOP);
1070
        /*
1071
         * S2
1072
         */
1073
        carry += (int)bn_add_words(r_d, r_d, buf.bn, BN_NIST_384_TOP);
1074
        /*
1075
         * S3
1076
         */
1077
        nist_set_384(t_d, buf.bn, 20, 19, 18, 17, 16, 15, 14, 13, 12, 23, 22,
1078
            21);
1079
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1080
        /*
1081
         * S4
1082
         */
1083
        nist_set_384(t_d, buf.bn, 19, 18, 17, 16, 15, 14, 13, 12, 20, 0, 23,
1084
            0);
1085
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1086
        /*
1087
         * S5
1088
         */
1089
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 23, 22, 21, 20, 0, 0, 0, 0);
1090
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1091
        /*
1092
         * S6
1093
         */
1094
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 23, 22, 21, 0, 0, 20);
1095
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1096
        /*
1097
         * D1
1098
         */
1099
        nist_set_384(t_d, buf.bn, 22, 21, 20, 19, 18, 17, 16, 15, 14, 13, 12,
1100
            23);
1101
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1102
        /*
1103
         * D2
1104
         */
1105
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 0, 23, 22, 21, 20, 0);
1106
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1107
        /*
1108
         * D3
1109
         */
1110
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 0, 23, 23, 0, 0, 0);
1111
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1112
    }
1113
#endif
1114
    /* see BN_nist_mod_224 for explanation */
1115
133k
    adjust = bn_sub_words;
1116
133k
    if (carry > 0)
1117
76.4k
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_384[carry - 1],
1118
76.4k
            BN_NIST_384_TOP);
1119
57.3k
    else if (carry < 0) {
1120
3.76k
        carry = (int)bn_add_words(r_d, r_d, _nist_p_384[-carry - 1],
1121
3.76k
            BN_NIST_384_TOP);
1122
3.76k
        adjust = carry ? bn_sub_words : bn_add_words;
1123
3.76k
    } else
1124
53.6k
        carry = 1;
1125
1126
133k
    res = ((*adjust)(c_d, r_d, _nist_p_384[0], BN_NIST_384_TOP) && carry)
1127
133k
        ? r_d
1128
133k
        : c_d;
1129
133k
    nist_cp_bn(r_d, res, BN_NIST_384_TOP);
1130
133k
    r->top = BN_NIST_384_TOP;
1131
133k
    bn_correct_top(r);
1132
1133
133k
    return 1;
1134
133k
}
1135
1136
3.10M
#define BN_NIST_521_RSHIFT (521 % BN_BITS2)
1137
1.55M
#define BN_NIST_521_LSHIFT (BN_BITS2 - BN_NIST_521_RSHIFT)
1138
172k
#define BN_NIST_521_TOP_MASK ((BN_ULONG)BN_MASK2 >> BN_NIST_521_LSHIFT)
1139
1140
int BN_nist_mod_521(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
1141
    BN_CTX *ctx)
1142
177k
{
1143
177k
    int top = a->top, i;
1144
177k
    BN_ULONG *r_d, *a_d = a->d, t_d[BN_NIST_521_TOP], val, tmp, *res;
1145
177k
    static const BIGNUM ossl_bignum_nist_p_521_sqr = {
1146
177k
        (BN_ULONG *)_nist_p_521_sqr,
1147
177k
        OSSL_NELEM(_nist_p_521_sqr),
1148
177k
        OSSL_NELEM(_nist_p_521_sqr),
1149
177k
        0, BN_FLG_STATIC_DATA
1150
177k
    };
1151
1152
177k
    field = &ossl_bignum_nist_p_521; /* just to make sure */
1153
1154
177k
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_521_sqr) >= 0)
1155
0
        return BN_nnmod(r, a, field, ctx);
1156
1157
177k
    i = BN_ucmp(field, a);
1158
177k
    if (i == 0) {
1159
0
        BN_zero(r);
1160
0
        return 1;
1161
177k
    } else if (i > 0)
1162
4.76k
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
1163
1164
172k
    if (r != a) {
1165
0
        if (!bn_wexpand(r, BN_NIST_521_TOP))
1166
0
            return 0;
1167
0
        r_d = r->d;
1168
0
        nist_cp_bn(r_d, a_d, BN_NIST_521_TOP);
1169
0
    } else
1170
172k
        r_d = a_d;
1171
1172
    /* upper 521 bits, copy ... */
1173
172k
    nist_cp_bn_0(t_d, a_d + (BN_NIST_521_TOP - 1),
1174
172k
        top - (BN_NIST_521_TOP - 1), BN_NIST_521_TOP);
1175
    /* ... and right shift */
1176
1.55M
    for (val = t_d[0], i = 0; i < BN_NIST_521_TOP - 1; i++) {
1177
#if 0
1178
        /*
1179
         * MSC ARM compiler [version 2013, presumably even earlier,
1180
         * much earlier] miscompiles this code, but not one in
1181
         * #else section. See RT#3541.
1182
         */
1183
        tmp = val >> BN_NIST_521_RSHIFT;
1184
        val = t_d[i + 1];
1185
        t_d[i] = (tmp | val << BN_NIST_521_LSHIFT) & BN_MASK2;
1186
#else
1187
1.37M
        t_d[i] = (val >> BN_NIST_521_RSHIFT | (tmp = t_d[i + 1]) << BN_NIST_521_LSHIFT) & BN_MASK2;
1188
1.37M
        val = tmp;
1189
1.37M
#endif
1190
1.37M
    }
1191
172k
    t_d[i] = val >> BN_NIST_521_RSHIFT;
1192
    /* lower 521 bits */
1193
172k
    r_d[i] &= BN_NIST_521_TOP_MASK;
1194
1195
172k
    bn_add_words(r_d, r_d, t_d, BN_NIST_521_TOP);
1196
172k
    res = bn_sub_words(t_d, r_d, _nist_p_521,
1197
172k
              BN_NIST_521_TOP)
1198
172k
        ? r_d
1199
172k
        : t_d;
1200
172k
    nist_cp_bn(r_d, res, BN_NIST_521_TOP);
1201
172k
    r->top = BN_NIST_521_TOP;
1202
172k
    bn_correct_top(r);
1203
1204
172k
    return 1;
1205
172k
}
1206
1207
int (*BN_nist_mod_func(const BIGNUM *p))(BIGNUM *r, const BIGNUM *a,
1208
    const BIGNUM *field, BN_CTX *ctx)
1209
0
{
1210
0
    if (BN_ucmp(&ossl_bignum_nist_p_192, p) == 0)
1211
0
        return BN_nist_mod_192;
1212
0
    if (BN_ucmp(&ossl_bignum_nist_p_224, p) == 0)
1213
0
        return BN_nist_mod_224;
1214
0
    if (BN_ucmp(&ossl_bignum_nist_p_256, p) == 0)
1215
0
        return BN_nist_mod_256;
1216
0
    if (BN_ucmp(&ossl_bignum_nist_p_384, p) == 0)
1217
0
        return BN_nist_mod_384;
1218
0
    if (BN_ucmp(&ossl_bignum_nist_p_521, p) == 0)
1219
0
        return BN_nist_mod_521;
1220
0
    return 0;
1221
0
}