Coverage Report

Created: 2025-12-31 06:58

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/openssl34/crypto/bn/bn_nist.c
Line
Count
Source
1
/*
2
 * Copyright 2002-2024 The OpenSSL Project Authors. All Rights Reserved.
3
 *
4
 * Licensed under the Apache License 2.0 (the "License").  You may not use
5
 * this file except in compliance with the License.  You can obtain a copy
6
 * in the file LICENSE in the source distribution or at
7
 * https://www.openssl.org/source/license.html
8
 */
9
10
#include "bn_local.h"
11
#include "internal/cryptlib.h"
12
13
0
#define BN_NIST_192_TOP (192 + BN_BITS2 - 1) / BN_BITS2
14
3.44M
#define BN_NIST_224_TOP (224 + BN_BITS2 - 1) / BN_BITS2
15
0
#define BN_NIST_256_TOP (256 + BN_BITS2 - 1) / BN_BITS2
16
385k
#define BN_NIST_384_TOP (384 + BN_BITS2 - 1) / BN_BITS2
17
2.58M
#define BN_NIST_521_TOP (521 + BN_BITS2 - 1) / BN_BITS2
18
19
/* pre-computed tables are "carry-less" values of modulus*(i+1) */
20
#if BN_BITS2 == 64
21
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
22
    { 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFFULL },
23
    { 0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFFULL },
24
    { 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFCULL, 0xFFFFFFFFFFFFFFFFULL }
25
};
26
27
static const BN_ULONG _nist_p_192_sqr[] = {
28
    0x0000000000000001ULL, 0x0000000000000002ULL, 0x0000000000000001ULL,
29
    0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFFULL
30
};
31
32
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
33
    { 0x0000000000000001ULL, 0xFFFFFFFF00000000ULL,
34
        0xFFFFFFFFFFFFFFFFULL, 0x00000000FFFFFFFFULL },
35
    { 0x0000000000000002ULL, 0xFFFFFFFE00000000ULL,
36
        0xFFFFFFFFFFFFFFFFULL, 0x00000001FFFFFFFFULL } /* this one is
37
                                                        * "carry-full" */
38
};
39
40
static const BN_ULONG _nist_p_224_sqr[] = {
41
    0x0000000000000001ULL, 0xFFFFFFFE00000000ULL,
42
    0xFFFFFFFFFFFFFFFFULL, 0x0000000200000000ULL,
43
    0x0000000000000000ULL, 0xFFFFFFFFFFFFFFFEULL,
44
    0xFFFFFFFFFFFFFFFFULL
45
};
46
47
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
48
    { 0xFFFFFFFFFFFFFFFFULL, 0x00000000FFFFFFFFULL,
49
        0x0000000000000000ULL, 0xFFFFFFFF00000001ULL },
50
    { 0xFFFFFFFFFFFFFFFEULL, 0x00000001FFFFFFFFULL,
51
        0x0000000000000000ULL, 0xFFFFFFFE00000002ULL },
52
    { 0xFFFFFFFFFFFFFFFDULL, 0x00000002FFFFFFFFULL,
53
        0x0000000000000000ULL, 0xFFFFFFFD00000003ULL },
54
    { 0xFFFFFFFFFFFFFFFCULL, 0x00000003FFFFFFFFULL,
55
        0x0000000000000000ULL, 0xFFFFFFFC00000004ULL },
56
    { 0xFFFFFFFFFFFFFFFBULL, 0x00000004FFFFFFFFULL,
57
        0x0000000000000000ULL, 0xFFFFFFFB00000005ULL },
58
};
59
60
static const BN_ULONG _nist_p_256_sqr[] = {
61
    0x0000000000000001ULL, 0xFFFFFFFE00000000ULL,
62
    0xFFFFFFFFFFFFFFFFULL, 0x00000001FFFFFFFEULL,
63
    0x00000001FFFFFFFEULL, 0x00000001FFFFFFFEULL,
64
    0xFFFFFFFE00000001ULL, 0xFFFFFFFE00000002ULL
65
};
66
67
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
68
    { 0x00000000FFFFFFFFULL, 0xFFFFFFFF00000000ULL, 0xFFFFFFFFFFFFFFFEULL,
69
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
70
    { 0x00000001FFFFFFFEULL, 0xFFFFFFFE00000000ULL, 0xFFFFFFFFFFFFFFFDULL,
71
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
72
    { 0x00000002FFFFFFFDULL, 0xFFFFFFFD00000000ULL, 0xFFFFFFFFFFFFFFFCULL,
73
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
74
    { 0x00000003FFFFFFFCULL, 0xFFFFFFFC00000000ULL, 0xFFFFFFFFFFFFFFFBULL,
75
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
76
    { 0x00000004FFFFFFFBULL, 0xFFFFFFFB00000000ULL, 0xFFFFFFFFFFFFFFFAULL,
77
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
78
};
79
80
static const BN_ULONG _nist_p_384_sqr[] = {
81
    0xFFFFFFFE00000001ULL, 0x0000000200000000ULL, 0xFFFFFFFE00000000ULL,
82
    0x0000000200000000ULL, 0x0000000000000001ULL, 0x0000000000000000ULL,
83
    0x00000001FFFFFFFEULL, 0xFFFFFFFE00000000ULL, 0xFFFFFFFFFFFFFFFDULL,
84
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL
85
};
86
87
static const BN_ULONG _nist_p_521[] = {
88
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
89
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
90
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
91
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
92
    0x00000000000001FFULL
93
};
94
95
static const BN_ULONG _nist_p_521_sqr[] = {
96
    0x0000000000000001ULL, 0x0000000000000000ULL, 0x0000000000000000ULL,
97
    0x0000000000000000ULL, 0x0000000000000000ULL, 0x0000000000000000ULL,
98
    0x0000000000000000ULL, 0x0000000000000000ULL, 0xFFFFFFFFFFFFFC00ULL,
99
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
100
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
101
    0xFFFFFFFFFFFFFFFFULL, 0x000000000003FFFFULL
102
};
103
#elif BN_BITS2 == 32
104
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
105
    { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
106
    { 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
107
    { 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFC, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF }
108
};
109
110
static const BN_ULONG _nist_p_192_sqr[] = {
111
    0x00000001, 0x00000000, 0x00000002, 0x00000000, 0x00000001, 0x00000000,
112
    0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF
113
};
114
115
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
116
    { 0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFF,
117
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
118
    { 0x00000002, 0x00000000, 0x00000000, 0xFFFFFFFE,
119
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF }
120
};
121
122
static const BN_ULONG _nist_p_224_sqr[] = {
123
    0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFE,
124
    0xFFFFFFFF, 0xFFFFFFFF, 0x00000000, 0x00000002,
125
    0x00000000, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFF,
126
    0xFFFFFFFF, 0xFFFFFFFF
127
};
128
129
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
130
    { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000000,
131
        0x00000000, 0x00000000, 0x00000001, 0xFFFFFFFF },
132
    { 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000001,
133
        0x00000000, 0x00000000, 0x00000002, 0xFFFFFFFE },
134
    { 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000002,
135
        0x00000000, 0x00000000, 0x00000003, 0xFFFFFFFD },
136
    { 0xFFFFFFFC, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000003,
137
        0x00000000, 0x00000000, 0x00000004, 0xFFFFFFFC },
138
    { 0xFFFFFFFB, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000004,
139
        0x00000000, 0x00000000, 0x00000005, 0xFFFFFFFB },
140
};
141
142
static const BN_ULONG _nist_p_256_sqr[] = {
143
    0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFE,
144
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFE, 0x00000001,
145
    0xFFFFFFFE, 0x00000001, 0xFFFFFFFE, 0x00000001,
146
    0x00000001, 0xFFFFFFFE, 0x00000002, 0xFFFFFFFE
147
};
148
149
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
150
    { 0xFFFFFFFF, 0x00000000, 0x00000000, 0xFFFFFFFF, 0xFFFFFFFE, 0xFFFFFFFF,
151
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
152
    { 0xFFFFFFFE, 0x00000001, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFD, 0xFFFFFFFF,
153
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
154
    { 0xFFFFFFFD, 0x00000002, 0x00000000, 0xFFFFFFFD, 0xFFFFFFFC, 0xFFFFFFFF,
155
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
156
    { 0xFFFFFFFC, 0x00000003, 0x00000000, 0xFFFFFFFC, 0xFFFFFFFB, 0xFFFFFFFF,
157
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
158
    { 0xFFFFFFFB, 0x00000004, 0x00000000, 0xFFFFFFFB, 0xFFFFFFFA, 0xFFFFFFFF,
159
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
160
};
161
162
static const BN_ULONG _nist_p_384_sqr[] = {
163
    0x00000001, 0xFFFFFFFE, 0x00000000, 0x00000002, 0x00000000, 0xFFFFFFFE,
164
    0x00000000, 0x00000002, 0x00000001, 0x00000000, 0x00000000, 0x00000000,
165
    0xFFFFFFFE, 0x00000001, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFD, 0xFFFFFFFF,
166
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF
167
};
168
169
static const BN_ULONG _nist_p_521[] = { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
170
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
171
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
172
    0xFFFFFFFF, 0x000001FF };
173
174
static const BN_ULONG _nist_p_521_sqr[] = {
175
    0x00000001, 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
176
    0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
177
    0x00000000, 0x00000000, 0x00000000, 0x00000000, 0xFFFFFC00, 0xFFFFFFFF,
178
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
179
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
180
    0xFFFFFFFF, 0xFFFFFFFF, 0x0003FFFF
181
};
182
#else
183
#error "unsupported BN_BITS2"
184
#endif
185
186
static const BIGNUM ossl_bignum_nist_p_192 = {
187
    (BN_ULONG *)_nist_p_192[0],
188
    BN_NIST_192_TOP,
189
    BN_NIST_192_TOP,
190
    0,
191
    BN_FLG_STATIC_DATA
192
};
193
194
static const BIGNUM ossl_bignum_nist_p_224 = {
195
    (BN_ULONG *)_nist_p_224[0],
196
    BN_NIST_224_TOP,
197
    BN_NIST_224_TOP,
198
    0,
199
    BN_FLG_STATIC_DATA
200
};
201
202
static const BIGNUM ossl_bignum_nist_p_256 = {
203
    (BN_ULONG *)_nist_p_256[0],
204
    BN_NIST_256_TOP,
205
    BN_NIST_256_TOP,
206
    0,
207
    BN_FLG_STATIC_DATA
208
};
209
210
static const BIGNUM ossl_bignum_nist_p_384 = {
211
    (BN_ULONG *)_nist_p_384[0],
212
    BN_NIST_384_TOP,
213
    BN_NIST_384_TOP,
214
    0,
215
    BN_FLG_STATIC_DATA
216
};
217
218
static const BIGNUM ossl_bignum_nist_p_521 = {
219
    (BN_ULONG *)_nist_p_521,
220
    BN_NIST_521_TOP,
221
    BN_NIST_521_TOP,
222
    0,
223
    BN_FLG_STATIC_DATA
224
};
225
226
const BIGNUM *BN_get0_nist_prime_192(void)
227
0
{
228
0
    return &ossl_bignum_nist_p_192;
229
0
}
230
231
const BIGNUM *BN_get0_nist_prime_224(void)
232
0
{
233
0
    return &ossl_bignum_nist_p_224;
234
0
}
235
236
const BIGNUM *BN_get0_nist_prime_256(void)
237
0
{
238
0
    return &ossl_bignum_nist_p_256;
239
0
}
240
241
const BIGNUM *BN_get0_nist_prime_384(void)
242
0
{
243
0
    return &ossl_bignum_nist_p_384;
244
0
}
245
246
const BIGNUM *BN_get0_nist_prime_521(void)
247
0
{
248
0
    return &ossl_bignum_nist_p_521;
249
0
}
250
251
/*
252
 * To avoid more recent compilers (specifically clang-14) from treating this
253
 * code as a violation of the strict aliasing conditions and omitting it, this
254
 * cannot be declared as a function.  Moreover, the dst parameter cannot be
255
 * cached in a local since this no longer references the union and again falls
256
 * foul of the strict aliasing criteria.  Refer to #18225 for the initial
257
 * diagnostics and llvm/llvm-project#55255 for the later discussions with the
258
 * LLVM developers.  The problem boils down to if an array in the union is
259
 * converted to a pointer or if it is used directly.
260
 *
261
 * This function was inlined regardless, so there is no space cost to be
262
 * paid for making it a macro.
263
 */
264
#define nist_cp_bn_0(dst, src_in, top, max) \
265
653k
    {                                       \
266
653k
        int ii;                             \
267
653k
        const BN_ULONG *src = src_in;       \
268
653k
                                            \
269
4.30M
        for (ii = 0; ii < top; ii++)        \
270
3.64M
            (dst)[ii] = src[ii];            \
271
829k
        for (; ii < max; ii++)              \
272
653k
            (dst)[ii] = 0;                  \
273
653k
    }
274
275
static void nist_cp_bn(BN_ULONG *dst, const BN_ULONG *src, int top)
276
653k
{
277
653k
    int i;
278
279
4.47M
    for (i = 0; i < top; i++)
280
3.82M
        dst[i] = src[i];
281
653k
}
282
283
#if BN_BITS2 == 64
284
#define bn_cp_64(to, n, from, m) (to)[n] = (m >= 0) ? ((from)[m]) : 0;
285
#define bn_64_set_0(to, n) (to)[n] = (BN_ULONG)0;
286
/*
287
 * two following macros are implemented under assumption that they
288
 * are called in a sequence with *ascending* n, i.e. as they are...
289
 */
290
8.34M
#define bn_cp_32_naked(to, n, from, m) (((n) & 1) ? (to[(n) / 2] |= ((m) & 1) ? (from[(m) / 2] & BN_MASK2h) : (from[(m) / 2] << 32)) \
291
8.34M
                                                  : (to[(n) / 2] = ((m) & 1) ? (from[(m) / 2] >> 32) : (from[(m) / 2] & BN_MASK2l)))
292
3.82M
#define bn_32_set_0(to, n) (((n) & 1) ? (to[(n) / 2] &= BN_MASK2l) : (to[(n) / 2] = 0));
293
12.1M
#define bn_cp_32(to, n, from, m) ((m) >= 0) ? bn_cp_32_naked(to, n, from, m) : bn_32_set_0(to, n)
294
#if defined(L_ENDIAN)
295
#if defined(__arch64__)
296
#define NIST_INT64 long
297
#else
298
106k
#define NIST_INT64 long long
299
#endif
300
#endif
301
#else
302
#define bn_cp_64(to, n, from, m)                      \
303
    {                                                 \
304
        bn_cp_32(to, (n) * 2, from, (m) * 2);         \
305
        bn_cp_32(to, (n) * 2 + 1, from, (m) * 2 + 1); \
306
    }
307
#define bn_64_set_0(to, n)            \
308
    {                                 \
309
        bn_32_set_0(to, (n) * 2);     \
310
        bn_32_set_0(to, (n) * 2 + 1); \
311
    }
312
#define bn_cp_32(to, n, from, m) (to)[n] = (m >= 0) ? ((from)[m]) : 0;
313
#define bn_32_set_0(to, n) (to)[n] = (BN_ULONG)0;
314
#if defined(_WIN32) && !defined(__GNUC__)
315
#define NIST_INT64 __int64
316
#elif defined(BN_LLONG)
317
#define NIST_INT64 long long
318
#endif
319
#endif /* BN_BITS2 != 64 */
320
321
#ifdef NIST_INT64
322
/* Helpers to load/store a 32-bit word (uint32_t) from/into a memory
323
 * location and avoid potential aliasing issue.  */
324
static ossl_inline uint32_t load_u32(const void *ptr)
325
1.28M
{
326
1.28M
    uint32_t tmp;
327
328
1.28M
    memcpy(&tmp, ptr, sizeof(tmp));
329
1.28M
    return tmp;
330
1.28M
}
331
332
static ossl_inline void store_lo32(void *ptr, NIST_INT64 val)
333
1.28M
{
334
    /* A cast is needed for big-endian system: on a 32-bit BE system
335
     * NIST_INT64 may be defined as well if the compiler supports 64-bit
336
     * long long.  */
337
1.28M
    uint32_t tmp = (uint32_t)val;
338
339
1.28M
    memcpy(ptr, &tmp, sizeof(tmp));
340
1.28M
}
341
#endif /* NIST_INT64 */
342
343
#define nist_set_192(to, from, a1, a2, a3)      \
344
    {                                           \
345
        bn_cp_64(to, 0, from, (a3) - 3)         \
346
            bn_cp_64(to, 1, from, (a2) - 3)     \
347
                bn_cp_64(to, 2, from, (a1) - 3) \
348
    }
349
350
int BN_nist_mod_192(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
351
    BN_CTX *ctx)
352
0
{
353
0
    int top = a->top, i;
354
0
    int carry;
355
0
    register BN_ULONG *r_d, *a_d = a->d;
356
0
    union {
357
0
        BN_ULONG bn[BN_NIST_192_TOP];
358
0
        unsigned int ui[BN_NIST_192_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
359
0
    } buf;
360
0
    BN_ULONG c_d[BN_NIST_192_TOP], *res;
361
0
    static const BIGNUM ossl_bignum_nist_p_192_sqr = {
362
0
        (BN_ULONG *)_nist_p_192_sqr,
363
0
        OSSL_NELEM(_nist_p_192_sqr),
364
0
        OSSL_NELEM(_nist_p_192_sqr),
365
0
        0, BN_FLG_STATIC_DATA
366
0
    };
367
368
0
    field = &ossl_bignum_nist_p_192; /* just to make sure */
369
370
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_192_sqr) >= 0)
371
0
        return BN_nnmod(r, a, field, ctx);
372
373
0
    i = BN_ucmp(field, a);
374
0
    if (i == 0) {
375
0
        BN_zero(r);
376
0
        return 1;
377
0
    } else if (i > 0)
378
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
379
380
0
    if (r != a) {
381
0
        if (!bn_wexpand(r, BN_NIST_192_TOP))
382
0
            return 0;
383
0
        r_d = r->d;
384
0
        nist_cp_bn(r_d, a_d, BN_NIST_192_TOP);
385
0
    } else
386
0
        r_d = a_d;
387
388
0
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_192_TOP, top - BN_NIST_192_TOP,
389
0
        BN_NIST_192_TOP);
390
391
0
#if defined(NIST_INT64)
392
0
    {
393
0
        NIST_INT64 acc; /* accumulator */
394
0
        unsigned int *rp = (unsigned int *)r_d;
395
0
        const unsigned int *bp = (const unsigned int *)buf.ui;
396
397
0
        acc = load_u32(&rp[0]);
398
0
        acc += bp[3 * 2 - 6];
399
0
        acc += bp[5 * 2 - 6];
400
0
        store_lo32(&rp[0], acc);
401
0
        acc >>= 32;
402
403
0
        acc += load_u32(&rp[1]);
404
0
        acc += bp[3 * 2 - 5];
405
0
        acc += bp[5 * 2 - 5];
406
0
        store_lo32(&rp[1], acc);
407
0
        acc >>= 32;
408
409
0
        acc += load_u32(&rp[2]);
410
0
        acc += bp[3 * 2 - 6];
411
0
        acc += bp[4 * 2 - 6];
412
0
        acc += bp[5 * 2 - 6];
413
0
        store_lo32(&rp[2], acc);
414
0
        acc >>= 32;
415
416
0
        acc += load_u32(&rp[3]);
417
0
        acc += bp[3 * 2 - 5];
418
0
        acc += bp[4 * 2 - 5];
419
0
        acc += bp[5 * 2 - 5];
420
0
        store_lo32(&rp[3], acc);
421
0
        acc >>= 32;
422
423
0
        acc += load_u32(&rp[4]);
424
0
        acc += bp[4 * 2 - 6];
425
0
        acc += bp[5 * 2 - 6];
426
0
        store_lo32(&rp[4], acc);
427
0
        acc >>= 32;
428
429
0
        acc += load_u32(&rp[5]);
430
0
        acc += bp[4 * 2 - 5];
431
0
        acc += bp[5 * 2 - 5];
432
0
        store_lo32(&rp[5], acc);
433
434
0
        carry = (int)(acc >> 32);
435
0
    }
436
#else
437
    {
438
        BN_ULONG t_d[BN_NIST_192_TOP];
439
440
        nist_set_192(t_d, buf.bn, 0, 3, 3);
441
        carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
442
        nist_set_192(t_d, buf.bn, 4, 4, 0);
443
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
444
        nist_set_192(t_d, buf.bn, 5, 5, 5)
445
            carry
446
            += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
447
    }
448
#endif
449
0
    if (carry > 0)
450
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_192[carry - 1],
451
0
            BN_NIST_192_TOP);
452
0
    else
453
0
        carry = 1;
454
455
    /*
456
     * we need 'if (carry==0 || result>=modulus) result-=modulus;'
457
     * as comparison implies subtraction, we can write
458
     * 'tmp=result-modulus; if (!carry || !borrow) result=tmp;'
459
     * this is what happens below, but without explicit if:-) a.
460
     */
461
0
    res = (bn_sub_words(c_d, r_d, _nist_p_192[0], BN_NIST_192_TOP) && carry)
462
0
        ? r_d
463
0
        : c_d;
464
0
    nist_cp_bn(r_d, res, BN_NIST_192_TOP);
465
0
    r->top = BN_NIST_192_TOP;
466
0
    bn_correct_top(r);
467
468
0
    return 1;
469
0
}
470
471
typedef BN_ULONG (*bn_addsub_f)(BN_ULONG *, const BN_ULONG *,
472
    const BN_ULONG *, int);
473
474
#define nist_set_224(to, from, a1, a2, a3, a4, a5, a6, a7)      \
475
1.73M
    {                                                           \
476
1.73M
        bn_cp_32(to, 0, from, (a7) - 7)                         \
477
1.73M
            bn_cp_32(to, 1, from, (a6) - 7)                     \
478
1.73M
                bn_cp_32(to, 2, from, (a5) - 7)                 \
479
1.73M
                    bn_cp_32(to, 3, from, (a4) - 7)             \
480
1.73M
                        bn_cp_32(to, 4, from, (a3) - 7)         \
481
1.73M
                            bn_cp_32(to, 5, from, (a2) - 7)     \
482
1.73M
                                bn_cp_32(to, 6, from, (a1) - 7) \
483
1.73M
    }
484
485
int BN_nist_mod_224(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
486
    BN_CTX *ctx)
487
352k
{
488
352k
    int top = a->top, i;
489
352k
    int carry;
490
352k
    BN_ULONG *r_d, *a_d = a->d;
491
352k
    union {
492
352k
        BN_ULONG bn[BN_NIST_224_TOP];
493
352k
        unsigned int ui[BN_NIST_224_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
494
352k
    } buf;
495
352k
    BN_ULONG c_d[BN_NIST_224_TOP], *res;
496
352k
    bn_addsub_f adjust;
497
352k
    static const BIGNUM ossl_bignum_nist_p_224_sqr = {
498
352k
        (BN_ULONG *)_nist_p_224_sqr,
499
352k
        OSSL_NELEM(_nist_p_224_sqr),
500
352k
        OSSL_NELEM(_nist_p_224_sqr),
501
352k
        0, BN_FLG_STATIC_DATA
502
352k
    };
503
504
352k
    field = &ossl_bignum_nist_p_224; /* just to make sure */
505
506
352k
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_224_sqr) >= 0)
507
0
        return BN_nnmod(r, a, field, ctx);
508
509
352k
    i = BN_ucmp(field, a);
510
352k
    if (i == 0) {
511
0
        BN_zero(r);
512
0
        return 1;
513
352k
    } else if (i > 0)
514
4.62k
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
515
516
347k
    if (r != a) {
517
0
        if (!bn_wexpand(r, BN_NIST_224_TOP))
518
0
            return 0;
519
0
        r_d = r->d;
520
0
        nist_cp_bn(r_d, a_d, BN_NIST_224_TOP);
521
0
    } else
522
347k
        r_d = a_d;
523
524
347k
#if BN_BITS2 == 64
525
    /* copy upper 256 bits of 448 bit number ... */
526
347k
    nist_cp_bn_0(c_d, a_d + (BN_NIST_224_TOP - 1),
527
347k
        top - (BN_NIST_224_TOP - 1), BN_NIST_224_TOP);
528
    /* ... and right shift by 32 to obtain upper 224 bits */
529
347k
    nist_set_224(buf.bn, c_d, 14, 13, 12, 11, 10, 9, 8);
530
    /* truncate lower part to 224 bits too */
531
347k
    r_d[BN_NIST_224_TOP - 1] &= BN_MASK2l;
532
#else
533
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_224_TOP, top - BN_NIST_224_TOP,
534
        BN_NIST_224_TOP);
535
#endif
536
537
#if defined(NIST_INT64) && BN_BITS2 != 64
538
    {
539
        NIST_INT64 acc; /* accumulator */
540
        unsigned int *rp = (unsigned int *)r_d;
541
        const unsigned int *bp = (const unsigned int *)buf.ui;
542
543
        acc = rp[0];
544
        acc -= bp[7 - 7];
545
        acc -= bp[11 - 7];
546
        rp[0] = (unsigned int)acc;
547
        acc >>= 32;
548
549
        acc += rp[1];
550
        acc -= bp[8 - 7];
551
        acc -= bp[12 - 7];
552
        rp[1] = (unsigned int)acc;
553
        acc >>= 32;
554
555
        acc += rp[2];
556
        acc -= bp[9 - 7];
557
        acc -= bp[13 - 7];
558
        rp[2] = (unsigned int)acc;
559
        acc >>= 32;
560
561
        acc += rp[3];
562
        acc += bp[7 - 7];
563
        acc += bp[11 - 7];
564
        acc -= bp[10 - 7];
565
        rp[3] = (unsigned int)acc;
566
        acc >>= 32;
567
568
        acc += rp[4];
569
        acc += bp[8 - 7];
570
        acc += bp[12 - 7];
571
        acc -= bp[11 - 7];
572
        rp[4] = (unsigned int)acc;
573
        acc >>= 32;
574
575
        acc += rp[5];
576
        acc += bp[9 - 7];
577
        acc += bp[13 - 7];
578
        acc -= bp[12 - 7];
579
        rp[5] = (unsigned int)acc;
580
        acc >>= 32;
581
582
        acc += rp[6];
583
        acc += bp[10 - 7];
584
        acc -= bp[13 - 7];
585
        rp[6] = (unsigned int)acc;
586
587
        carry = (int)(acc >> 32);
588
#if BN_BITS2 == 64
589
        rp[7] = carry;
590
#endif
591
    }
592
#else
593
347k
    {
594
347k
        BN_ULONG t_d[BN_NIST_224_TOP];
595
596
347k
        nist_set_224(t_d, buf.bn, 10, 9, 8, 7, 0, 0, 0);
597
347k
        carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
598
347k
        nist_set_224(t_d, buf.bn, 0, 13, 12, 11, 0, 0, 0);
599
347k
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
600
347k
        nist_set_224(t_d, buf.bn, 13, 12, 11, 10, 9, 8, 7);
601
347k
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);
602
347k
        nist_set_224(t_d, buf.bn, 0, 0, 0, 0, 13, 12, 11);
603
347k
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);
604
605
347k
#if BN_BITS2 == 64
606
347k
        carry = (int)(r_d[BN_NIST_224_TOP - 1] >> 32);
607
347k
#endif
608
347k
    }
609
347k
#endif
610
347k
    adjust = bn_sub_words;
611
347k
    if (carry > 0) {
612
146k
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_224[carry - 1],
613
146k
            BN_NIST_224_TOP);
614
146k
#if BN_BITS2 == 64
615
146k
        carry = (int)(~(r_d[BN_NIST_224_TOP - 1] >> 32)) & 1;
616
146k
#endif
617
201k
    } else if (carry < 0) {
618
        /*
619
         * it's a bit more complicated logic in this case. if bn_add_words
620
         * yields no carry, then result has to be adjusted by unconditionally
621
         * *adding* the modulus. but if it does, then result has to be
622
         * compared to the modulus and conditionally adjusted by
623
         * *subtracting* the latter.
624
         */
625
20.6k
        carry = (int)bn_add_words(r_d, r_d, _nist_p_224[-carry - 1],
626
20.6k
            BN_NIST_224_TOP);
627
20.6k
        adjust = carry ? bn_sub_words : bn_add_words;
628
20.6k
    } else
629
180k
        carry = 1;
630
631
    /* otherwise it's effectively same as in BN_nist_mod_192... */
632
347k
    res = ((*adjust)(c_d, r_d, _nist_p_224[0], BN_NIST_224_TOP) && carry)
633
347k
        ? r_d
634
347k
        : c_d;
635
347k
    nist_cp_bn(r_d, res, BN_NIST_224_TOP);
636
347k
    r->top = BN_NIST_224_TOP;
637
347k
    bn_correct_top(r);
638
639
347k
    return 1;
640
347k
}
641
642
#define nist_set_256(to, from, a1, a2, a3, a4, a5, a6, a7, a8)      \
643
    {                                                               \
644
        bn_cp_32(to, 0, from, (a8) - 8)                             \
645
            bn_cp_32(to, 1, from, (a7) - 8)                         \
646
                bn_cp_32(to, 2, from, (a6) - 8)                     \
647
                    bn_cp_32(to, 3, from, (a5) - 8)                 \
648
                        bn_cp_32(to, 4, from, (a4) - 8)             \
649
                            bn_cp_32(to, 5, from, (a3) - 8)         \
650
                                bn_cp_32(to, 6, from, (a2) - 8)     \
651
                                    bn_cp_32(to, 7, from, (a1) - 8) \
652
    }
653
654
int BN_nist_mod_256(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
655
    BN_CTX *ctx)
656
0
{
657
0
    int i, top = a->top;
658
0
    int carry = 0;
659
0
    register BN_ULONG *a_d = a->d, *r_d;
660
0
    union {
661
0
        BN_ULONG bn[BN_NIST_256_TOP];
662
0
        unsigned int ui[BN_NIST_256_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
663
0
    } buf;
664
0
    BN_ULONG c_d[BN_NIST_256_TOP], *res;
665
0
    bn_addsub_f adjust;
666
0
    static const BIGNUM ossl_bignum_nist_p_256_sqr = {
667
0
        (BN_ULONG *)_nist_p_256_sqr,
668
0
        OSSL_NELEM(_nist_p_256_sqr),
669
0
        OSSL_NELEM(_nist_p_256_sqr),
670
0
        0, BN_FLG_STATIC_DATA
671
0
    };
672
673
0
    field = &ossl_bignum_nist_p_256; /* just to make sure */
674
675
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_256_sqr) >= 0)
676
0
        return BN_nnmod(r, a, field, ctx);
677
678
0
    i = BN_ucmp(field, a);
679
0
    if (i == 0) {
680
0
        BN_zero(r);
681
0
        return 1;
682
0
    } else if (i > 0)
683
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
684
685
0
    if (r != a) {
686
0
        if (!bn_wexpand(r, BN_NIST_256_TOP))
687
0
            return 0;
688
0
        r_d = r->d;
689
0
        nist_cp_bn(r_d, a_d, BN_NIST_256_TOP);
690
0
    } else
691
0
        r_d = a_d;
692
693
0
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_256_TOP, top - BN_NIST_256_TOP,
694
0
        BN_NIST_256_TOP);
695
696
0
#if defined(NIST_INT64)
697
0
    {
698
0
        NIST_INT64 acc; /* accumulator */
699
0
        unsigned int *rp = (unsigned int *)r_d;
700
0
        const unsigned int *bp = (const unsigned int *)buf.ui;
701
702
0
        acc = load_u32(&rp[0]);
703
0
        acc += bp[8 - 8];
704
0
        acc += bp[9 - 8];
705
0
        acc -= bp[11 - 8];
706
0
        acc -= bp[12 - 8];
707
0
        acc -= bp[13 - 8];
708
0
        acc -= bp[14 - 8];
709
0
        store_lo32(&rp[0], acc);
710
0
        acc >>= 32;
711
712
0
        acc += load_u32(&rp[1]);
713
0
        acc += bp[9 - 8];
714
0
        acc += bp[10 - 8];
715
0
        acc -= bp[12 - 8];
716
0
        acc -= bp[13 - 8];
717
0
        acc -= bp[14 - 8];
718
0
        acc -= bp[15 - 8];
719
0
        store_lo32(&rp[1], acc);
720
0
        acc >>= 32;
721
722
0
        acc += load_u32(&rp[2]);
723
0
        acc += bp[10 - 8];
724
0
        acc += bp[11 - 8];
725
0
        acc -= bp[13 - 8];
726
0
        acc -= bp[14 - 8];
727
0
        acc -= bp[15 - 8];
728
0
        store_lo32(&rp[2], acc);
729
0
        acc >>= 32;
730
731
0
        acc += load_u32(&rp[3]);
732
0
        acc += bp[11 - 8];
733
0
        acc += bp[11 - 8];
734
0
        acc += bp[12 - 8];
735
0
        acc += bp[12 - 8];
736
0
        acc += bp[13 - 8];
737
0
        acc -= bp[15 - 8];
738
0
        acc -= bp[8 - 8];
739
0
        acc -= bp[9 - 8];
740
0
        store_lo32(&rp[3], acc);
741
0
        acc >>= 32;
742
743
0
        acc += load_u32(&rp[4]);
744
0
        acc += bp[12 - 8];
745
0
        acc += bp[12 - 8];
746
0
        acc += bp[13 - 8];
747
0
        acc += bp[13 - 8];
748
0
        acc += bp[14 - 8];
749
0
        acc -= bp[9 - 8];
750
0
        acc -= bp[10 - 8];
751
0
        store_lo32(&rp[4], acc);
752
0
        acc >>= 32;
753
754
0
        acc += load_u32(&rp[5]);
755
0
        acc += bp[13 - 8];
756
0
        acc += bp[13 - 8];
757
0
        acc += bp[14 - 8];
758
0
        acc += bp[14 - 8];
759
0
        acc += bp[15 - 8];
760
0
        acc -= bp[10 - 8];
761
0
        acc -= bp[11 - 8];
762
0
        store_lo32(&rp[5], acc);
763
0
        acc >>= 32;
764
765
0
        acc += load_u32(&rp[6]);
766
0
        acc += bp[14 - 8];
767
0
        acc += bp[14 - 8];
768
0
        acc += bp[15 - 8];
769
0
        acc += bp[15 - 8];
770
0
        acc += bp[14 - 8];
771
0
        acc += bp[13 - 8];
772
0
        acc -= bp[8 - 8];
773
0
        acc -= bp[9 - 8];
774
0
        store_lo32(&rp[6], acc);
775
0
        acc >>= 32;
776
777
0
        acc += load_u32(&rp[7]);
778
0
        acc += bp[15 - 8];
779
0
        acc += bp[15 - 8];
780
0
        acc += bp[15 - 8];
781
0
        acc += bp[8 - 8];
782
0
        acc -= bp[10 - 8];
783
0
        acc -= bp[11 - 8];
784
0
        acc -= bp[12 - 8];
785
0
        acc -= bp[13 - 8];
786
0
        store_lo32(&rp[7], acc);
787
788
0
        carry = (int)(acc >> 32);
789
0
    }
790
#else
791
    {
792
        BN_ULONG t_d[BN_NIST_256_TOP];
793
794
        /*
795
         * S1
796
         */
797
        nist_set_256(t_d, buf.bn, 15, 14, 13, 12, 11, 0, 0, 0);
798
        /*
799
         * S2
800
         */
801
        nist_set_256(c_d, buf.bn, 0, 15, 14, 13, 12, 0, 0, 0);
802
        carry = (int)bn_add_words(t_d, t_d, c_d, BN_NIST_256_TOP);
803
        /* left shift */
804
        {
805
            register BN_ULONG *ap, t, c;
806
            ap = t_d;
807
            c = 0;
808
            for (i = BN_NIST_256_TOP; i != 0; --i) {
809
                t = *ap;
810
                *(ap++) = ((t << 1) | c) & BN_MASK2;
811
                c = (t & BN_TBIT) ? 1 : 0;
812
            }
813
            carry <<= 1;
814
            carry |= c;
815
        }
816
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
817
        /*
818
         * S3
819
         */
820
        nist_set_256(t_d, buf.bn, 15, 14, 0, 0, 0, 10, 9, 8);
821
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
822
        /*
823
         * S4
824
         */
825
        nist_set_256(t_d, buf.bn, 8, 13, 15, 14, 13, 11, 10, 9);
826
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
827
        /*
828
         * D1
829
         */
830
        nist_set_256(t_d, buf.bn, 10, 8, 0, 0, 0, 13, 12, 11);
831
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
832
        /*
833
         * D2
834
         */
835
        nist_set_256(t_d, buf.bn, 11, 9, 0, 0, 15, 14, 13, 12);
836
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
837
        /*
838
         * D3
839
         */
840
        nist_set_256(t_d, buf.bn, 12, 0, 10, 9, 8, 15, 14, 13);
841
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
842
        /*
843
         * D4
844
         */
845
        nist_set_256(t_d, buf.bn, 13, 0, 11, 10, 9, 0, 15, 14);
846
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
847
    }
848
#endif
849
    /* see BN_nist_mod_224 for explanation */
850
0
    adjust = bn_sub_words;
851
0
    if (carry > 0)
852
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_256[carry - 1],
853
0
            BN_NIST_256_TOP);
854
0
    else if (carry < 0) {
855
0
        carry = (int)bn_add_words(r_d, r_d, _nist_p_256[-carry - 1],
856
0
            BN_NIST_256_TOP);
857
0
        adjust = carry ? bn_sub_words : bn_add_words;
858
0
    } else
859
0
        carry = 1;
860
861
0
    res = ((*adjust)(c_d, r_d, _nist_p_256[0], BN_NIST_256_TOP) && carry)
862
0
        ? r_d
863
0
        : c_d;
864
0
    nist_cp_bn(r_d, res, BN_NIST_256_TOP);
865
0
    r->top = BN_NIST_256_TOP;
866
0
    bn_correct_top(r);
867
868
0
    return 1;
869
0
}
870
871
#define nist_set_384(to, from, a1, a2, a3, a4, a5, a6, a7, a8, a9, a10, a11, a12)     \
872
    {                                                                                 \
873
        bn_cp_32(to, 0, from, (a12) - 12)                                             \
874
            bn_cp_32(to, 1, from, (a11) - 12)                                         \
875
                bn_cp_32(to, 2, from, (a10) - 12)                                     \
876
                    bn_cp_32(to, 3, from, (a9) - 12)                                  \
877
                        bn_cp_32(to, 4, from, (a8) - 12)                              \
878
                            bn_cp_32(to, 5, from, (a7) - 12)                          \
879
                                bn_cp_32(to, 6, from, (a6) - 12)                      \
880
                                    bn_cp_32(to, 7, from, (a5) - 12)                  \
881
                                        bn_cp_32(to, 8, from, (a4) - 12)              \
882
                                            bn_cp_32(to, 9, from, (a3) - 12)          \
883
                                                bn_cp_32(to, 10, from, (a2) - 12)     \
884
                                                    bn_cp_32(to, 11, from, (a1) - 12) \
885
    }
886
887
int BN_nist_mod_384(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
888
    BN_CTX *ctx)
889
108k
{
890
108k
    int i, top = a->top;
891
108k
    int carry = 0;
892
108k
    register BN_ULONG *r_d, *a_d = a->d;
893
108k
    union {
894
108k
        BN_ULONG bn[BN_NIST_384_TOP];
895
108k
        unsigned int ui[BN_NIST_384_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
896
108k
    } buf;
897
108k
    BN_ULONG c_d[BN_NIST_384_TOP], *res;
898
108k
    bn_addsub_f adjust;
899
108k
    static const BIGNUM ossl_bignum_nist_p_384_sqr = {
900
108k
        (BN_ULONG *)_nist_p_384_sqr,
901
108k
        OSSL_NELEM(_nist_p_384_sqr),
902
108k
        OSSL_NELEM(_nist_p_384_sqr),
903
108k
        0, BN_FLG_STATIC_DATA
904
108k
    };
905
906
108k
    field = &ossl_bignum_nist_p_384; /* just to make sure */
907
908
108k
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_384_sqr) >= 0)
909
0
        return BN_nnmod(r, a, field, ctx);
910
911
108k
    i = BN_ucmp(field, a);
912
108k
    if (i == 0) {
913
0
        BN_zero(r);
914
0
        return 1;
915
108k
    } else if (i > 0)
916
1.65k
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
917
918
106k
    if (r != a) {
919
0
        if (!bn_wexpand(r, BN_NIST_384_TOP))
920
0
            return 0;
921
0
        r_d = r->d;
922
0
        nist_cp_bn(r_d, a_d, BN_NIST_384_TOP);
923
0
    } else
924
106k
        r_d = a_d;
925
926
106k
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_384_TOP, top - BN_NIST_384_TOP,
927
106k
        BN_NIST_384_TOP);
928
929
106k
#if defined(NIST_INT64)
930
106k
    {
931
106k
        NIST_INT64 acc; /* accumulator */
932
106k
        unsigned int *rp = (unsigned int *)r_d;
933
106k
        const unsigned int *bp = (const unsigned int *)buf.ui;
934
935
106k
        acc = load_u32(&rp[0]);
936
106k
        acc += bp[12 - 12];
937
106k
        acc += bp[21 - 12];
938
106k
        acc += bp[20 - 12];
939
106k
        acc -= bp[23 - 12];
940
106k
        store_lo32(&rp[0], acc);
941
106k
        acc >>= 32;
942
943
106k
        acc += load_u32(&rp[1]);
944
106k
        acc += bp[13 - 12];
945
106k
        acc += bp[22 - 12];
946
106k
        acc += bp[23 - 12];
947
106k
        acc -= bp[12 - 12];
948
106k
        acc -= bp[20 - 12];
949
106k
        store_lo32(&rp[1], acc);
950
106k
        acc >>= 32;
951
952
106k
        acc += load_u32(&rp[2]);
953
106k
        acc += bp[14 - 12];
954
106k
        acc += bp[23 - 12];
955
106k
        acc -= bp[13 - 12];
956
106k
        acc -= bp[21 - 12];
957
106k
        store_lo32(&rp[2], acc);
958
106k
        acc >>= 32;
959
960
106k
        acc += load_u32(&rp[3]);
961
106k
        acc += bp[15 - 12];
962
106k
        acc += bp[12 - 12];
963
106k
        acc += bp[20 - 12];
964
106k
        acc += bp[21 - 12];
965
106k
        acc -= bp[14 - 12];
966
106k
        acc -= bp[22 - 12];
967
106k
        acc -= bp[23 - 12];
968
106k
        store_lo32(&rp[3], acc);
969
106k
        acc >>= 32;
970
971
106k
        acc += load_u32(&rp[4]);
972
106k
        acc += bp[21 - 12];
973
106k
        acc += bp[21 - 12];
974
106k
        acc += bp[16 - 12];
975
106k
        acc += bp[13 - 12];
976
106k
        acc += bp[12 - 12];
977
106k
        acc += bp[20 - 12];
978
106k
        acc += bp[22 - 12];
979
106k
        acc -= bp[15 - 12];
980
106k
        acc -= bp[23 - 12];
981
106k
        acc -= bp[23 - 12];
982
106k
        store_lo32(&rp[4], acc);
983
106k
        acc >>= 32;
984
985
106k
        acc += load_u32(&rp[5]);
986
106k
        acc += bp[22 - 12];
987
106k
        acc += bp[22 - 12];
988
106k
        acc += bp[17 - 12];
989
106k
        acc += bp[14 - 12];
990
106k
        acc += bp[13 - 12];
991
106k
        acc += bp[21 - 12];
992
106k
        acc += bp[23 - 12];
993
106k
        acc -= bp[16 - 12];
994
106k
        store_lo32(&rp[5], acc);
995
106k
        acc >>= 32;
996
997
106k
        acc += load_u32(&rp[6]);
998
106k
        acc += bp[23 - 12];
999
106k
        acc += bp[23 - 12];
1000
106k
        acc += bp[18 - 12];
1001
106k
        acc += bp[15 - 12];
1002
106k
        acc += bp[14 - 12];
1003
106k
        acc += bp[22 - 12];
1004
106k
        acc -= bp[17 - 12];
1005
106k
        store_lo32(&rp[6], acc);
1006
106k
        acc >>= 32;
1007
1008
106k
        acc += load_u32(&rp[7]);
1009
106k
        acc += bp[19 - 12];
1010
106k
        acc += bp[16 - 12];
1011
106k
        acc += bp[15 - 12];
1012
106k
        acc += bp[23 - 12];
1013
106k
        acc -= bp[18 - 12];
1014
106k
        store_lo32(&rp[7], acc);
1015
106k
        acc >>= 32;
1016
1017
106k
        acc += load_u32(&rp[8]);
1018
106k
        acc += bp[20 - 12];
1019
106k
        acc += bp[17 - 12];
1020
106k
        acc += bp[16 - 12];
1021
106k
        acc -= bp[19 - 12];
1022
106k
        store_lo32(&rp[8], acc);
1023
106k
        acc >>= 32;
1024
1025
106k
        acc += load_u32(&rp[9]);
1026
106k
        acc += bp[21 - 12];
1027
106k
        acc += bp[18 - 12];
1028
106k
        acc += bp[17 - 12];
1029
106k
        acc -= bp[20 - 12];
1030
106k
        store_lo32(&rp[9], acc);
1031
106k
        acc >>= 32;
1032
1033
106k
        acc += load_u32(&rp[10]);
1034
106k
        acc += bp[22 - 12];
1035
106k
        acc += bp[19 - 12];
1036
106k
        acc += bp[18 - 12];
1037
106k
        acc -= bp[21 - 12];
1038
106k
        store_lo32(&rp[10], acc);
1039
106k
        acc >>= 32;
1040
1041
106k
        acc += load_u32(&rp[11]);
1042
106k
        acc += bp[23 - 12];
1043
106k
        acc += bp[20 - 12];
1044
106k
        acc += bp[19 - 12];
1045
106k
        acc -= bp[22 - 12];
1046
106k
        store_lo32(&rp[11], acc);
1047
1048
106k
        carry = (int)(acc >> 32);
1049
106k
    }
1050
#else
1051
    {
1052
        BN_ULONG t_d[BN_NIST_384_TOP];
1053
1054
        /*
1055
         * S1
1056
         */
1057
        nist_set_256(t_d, buf.bn, 0, 0, 0, 0, 0, 23 - 4, 22 - 4, 21 - 4);
1058
        /* left shift */
1059
        {
1060
            register BN_ULONG *ap, t, c;
1061
            ap = t_d;
1062
            c = 0;
1063
            for (i = 3; i != 0; --i) {
1064
                t = *ap;
1065
                *(ap++) = ((t << 1) | c) & BN_MASK2;
1066
                c = (t & BN_TBIT) ? 1 : 0;
1067
            }
1068
            *ap = c;
1069
        }
1070
        carry = (int)bn_add_words(r_d + (128 / BN_BITS2), r_d + (128 / BN_BITS2),
1071
            t_d, BN_NIST_256_TOP);
1072
        /*
1073
         * S2
1074
         */
1075
        carry += (int)bn_add_words(r_d, r_d, buf.bn, BN_NIST_384_TOP);
1076
        /*
1077
         * S3
1078
         */
1079
        nist_set_384(t_d, buf.bn, 20, 19, 18, 17, 16, 15, 14, 13, 12, 23, 22,
1080
            21);
1081
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1082
        /*
1083
         * S4
1084
         */
1085
        nist_set_384(t_d, buf.bn, 19, 18, 17, 16, 15, 14, 13, 12, 20, 0, 23,
1086
            0);
1087
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1088
        /*
1089
         * S5
1090
         */
1091
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 23, 22, 21, 20, 0, 0, 0, 0);
1092
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1093
        /*
1094
         * S6
1095
         */
1096
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 23, 22, 21, 0, 0, 20);
1097
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1098
        /*
1099
         * D1
1100
         */
1101
        nist_set_384(t_d, buf.bn, 22, 21, 20, 19, 18, 17, 16, 15, 14, 13, 12,
1102
            23);
1103
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1104
        /*
1105
         * D2
1106
         */
1107
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 0, 23, 22, 21, 20, 0);
1108
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1109
        /*
1110
         * D3
1111
         */
1112
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 0, 23, 23, 0, 0, 0);
1113
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1114
    }
1115
#endif
1116
    /* see BN_nist_mod_224 for explanation */
1117
106k
    adjust = bn_sub_words;
1118
106k
    if (carry > 0)
1119
61.3k
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_384[carry - 1],
1120
61.3k
            BN_NIST_384_TOP);
1121
45.5k
    else if (carry < 0) {
1122
3.46k
        carry = (int)bn_add_words(r_d, r_d, _nist_p_384[-carry - 1],
1123
3.46k
            BN_NIST_384_TOP);
1124
3.46k
        adjust = carry ? bn_sub_words : bn_add_words;
1125
3.46k
    } else
1126
42.0k
        carry = 1;
1127
1128
106k
    res = ((*adjust)(c_d, r_d, _nist_p_384[0], BN_NIST_384_TOP) && carry)
1129
106k
        ? r_d
1130
106k
        : c_d;
1131
106k
    nist_cp_bn(r_d, res, BN_NIST_384_TOP);
1132
106k
    r->top = BN_NIST_384_TOP;
1133
106k
    bn_correct_top(r);
1134
1135
106k
    return 1;
1136
106k
}
1137
1138
3.58M
#define BN_NIST_521_RSHIFT (521 % BN_BITS2)
1139
1.79M
#define BN_NIST_521_LSHIFT (BN_BITS2 - BN_NIST_521_RSHIFT)
1140
199k
#define BN_NIST_521_TOP_MASK ((BN_ULONG)BN_MASK2 >> BN_NIST_521_LSHIFT)
1141
1142
int BN_nist_mod_521(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
1143
    BN_CTX *ctx)
1144
204k
{
1145
204k
    int top = a->top, i;
1146
204k
    BN_ULONG *r_d, *a_d = a->d, t_d[BN_NIST_521_TOP], val, tmp, *res;
1147
204k
    static const BIGNUM ossl_bignum_nist_p_521_sqr = {
1148
204k
        (BN_ULONG *)_nist_p_521_sqr,
1149
204k
        OSSL_NELEM(_nist_p_521_sqr),
1150
204k
        OSSL_NELEM(_nist_p_521_sqr),
1151
204k
        0, BN_FLG_STATIC_DATA
1152
204k
    };
1153
1154
204k
    field = &ossl_bignum_nist_p_521; /* just to make sure */
1155
1156
204k
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_521_sqr) >= 0)
1157
0
        return BN_nnmod(r, a, field, ctx);
1158
1159
204k
    i = BN_ucmp(field, a);
1160
204k
    if (i == 0) {
1161
0
        BN_zero(r);
1162
0
        return 1;
1163
204k
    } else if (i > 0)
1164
5.53k
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
1165
1166
199k
    if (r != a) {
1167
0
        if (!bn_wexpand(r, BN_NIST_521_TOP))
1168
0
            return 0;
1169
0
        r_d = r->d;
1170
0
        nist_cp_bn(r_d, a_d, BN_NIST_521_TOP);
1171
0
    } else
1172
199k
        r_d = a_d;
1173
1174
    /* upper 521 bits, copy ... */
1175
199k
    nist_cp_bn_0(t_d, a_d + (BN_NIST_521_TOP - 1),
1176
199k
        top - (BN_NIST_521_TOP - 1), BN_NIST_521_TOP);
1177
    /* ... and right shift */
1178
1.79M
    for (val = t_d[0], i = 0; i < BN_NIST_521_TOP - 1; i++) {
1179
#if 0
1180
        /*
1181
         * MSC ARM compiler [version 2013, presumably even earlier,
1182
         * much earlier] miscompiles this code, but not one in
1183
         * #else section. See RT#3541.
1184
         */
1185
        tmp = val >> BN_NIST_521_RSHIFT;
1186
        val = t_d[i + 1];
1187
        t_d[i] = (tmp | val << BN_NIST_521_LSHIFT) & BN_MASK2;
1188
#else
1189
1.59M
        t_d[i] = (val >> BN_NIST_521_RSHIFT | (tmp = t_d[i + 1]) << BN_NIST_521_LSHIFT) & BN_MASK2;
1190
1.59M
        val = tmp;
1191
1.59M
#endif
1192
1.59M
    }
1193
199k
    t_d[i] = val >> BN_NIST_521_RSHIFT;
1194
    /* lower 521 bits */
1195
199k
    r_d[i] &= BN_NIST_521_TOP_MASK;
1196
1197
199k
    bn_add_words(r_d, r_d, t_d, BN_NIST_521_TOP);
1198
199k
    res = bn_sub_words(t_d, r_d, _nist_p_521,
1199
199k
              BN_NIST_521_TOP)
1200
199k
        ? r_d
1201
199k
        : t_d;
1202
199k
    nist_cp_bn(r_d, res, BN_NIST_521_TOP);
1203
199k
    r->top = BN_NIST_521_TOP;
1204
199k
    bn_correct_top(r);
1205
1206
199k
    return 1;
1207
199k
}
1208
1209
int (*BN_nist_mod_func(const BIGNUM *p))(BIGNUM *r, const BIGNUM *a,
1210
    const BIGNUM *field, BN_CTX *ctx)
1211
0
{
1212
0
    if (BN_ucmp(&ossl_bignum_nist_p_192, p) == 0)
1213
0
        return BN_nist_mod_192;
1214
0
    if (BN_ucmp(&ossl_bignum_nist_p_224, p) == 0)
1215
0
        return BN_nist_mod_224;
1216
0
    if (BN_ucmp(&ossl_bignum_nist_p_256, p) == 0)
1217
0
        return BN_nist_mod_256;
1218
0
    if (BN_ucmp(&ossl_bignum_nist_p_384, p) == 0)
1219
0
        return BN_nist_mod_384;
1220
0
    if (BN_ucmp(&ossl_bignum_nist_p_521, p) == 0)
1221
0
        return BN_nist_mod_521;
1222
0
    return 0;
1223
0
}