Coverage Report

Created: 2025-12-10 06:24

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/openssl/crypto/bn/bn_nist.c
Line
Count
Source
1
/*
2
 * Copyright 2002-2024 The OpenSSL Project Authors. All Rights Reserved.
3
 *
4
 * Licensed under the Apache License 2.0 (the "License").  You may not use
5
 * this file except in compliance with the License.  You can obtain a copy
6
 * in the file LICENSE in the source distribution or at
7
 * https://www.openssl.org/source/license.html
8
 */
9
10
#include "bn_local.h"
11
#include "internal/cryptlib.h"
12
13
0
#define BN_NIST_192_TOP (192 + BN_BITS2 - 1) / BN_BITS2
14
0
#define BN_NIST_224_TOP (224 + BN_BITS2 - 1) / BN_BITS2
15
0
#define BN_NIST_256_TOP (256 + BN_BITS2 - 1) / BN_BITS2
16
0
#define BN_NIST_384_TOP (384 + BN_BITS2 - 1) / BN_BITS2
17
0
#define BN_NIST_521_TOP (521 + BN_BITS2 - 1) / BN_BITS2
18
19
/* pre-computed tables are "carry-less" values of modulus*(i+1) */
20
#if BN_BITS2 == 64
21
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
22
    { 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFFULL },
23
    { 0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFFULL },
24
    { 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFCULL, 0xFFFFFFFFFFFFFFFFULL }
25
};
26
27
static const BN_ULONG _nist_p_192_sqr[] = {
28
    0x0000000000000001ULL, 0x0000000000000002ULL, 0x0000000000000001ULL,
29
    0xFFFFFFFFFFFFFFFEULL, 0xFFFFFFFFFFFFFFFDULL, 0xFFFFFFFFFFFFFFFFULL
30
};
31
32
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
33
    { 0x0000000000000001ULL, 0xFFFFFFFF00000000ULL,
34
        0xFFFFFFFFFFFFFFFFULL, 0x00000000FFFFFFFFULL },
35
    { 0x0000000000000002ULL, 0xFFFFFFFE00000000ULL,
36
        0xFFFFFFFFFFFFFFFFULL, 0x00000001FFFFFFFFULL } /* this one is
37
                                                        * "carry-full" */
38
};
39
40
static const BN_ULONG _nist_p_224_sqr[] = {
41
    0x0000000000000001ULL, 0xFFFFFFFE00000000ULL,
42
    0xFFFFFFFFFFFFFFFFULL, 0x0000000200000000ULL,
43
    0x0000000000000000ULL, 0xFFFFFFFFFFFFFFFEULL,
44
    0xFFFFFFFFFFFFFFFFULL
45
};
46
47
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
48
    { 0xFFFFFFFFFFFFFFFFULL, 0x00000000FFFFFFFFULL,
49
        0x0000000000000000ULL, 0xFFFFFFFF00000001ULL },
50
    { 0xFFFFFFFFFFFFFFFEULL, 0x00000001FFFFFFFFULL,
51
        0x0000000000000000ULL, 0xFFFFFFFE00000002ULL },
52
    { 0xFFFFFFFFFFFFFFFDULL, 0x00000002FFFFFFFFULL,
53
        0x0000000000000000ULL, 0xFFFFFFFD00000003ULL },
54
    { 0xFFFFFFFFFFFFFFFCULL, 0x00000003FFFFFFFFULL,
55
        0x0000000000000000ULL, 0xFFFFFFFC00000004ULL },
56
    { 0xFFFFFFFFFFFFFFFBULL, 0x00000004FFFFFFFFULL,
57
        0x0000000000000000ULL, 0xFFFFFFFB00000005ULL },
58
};
59
60
static const BN_ULONG _nist_p_256_sqr[] = {
61
    0x0000000000000001ULL, 0xFFFFFFFE00000000ULL,
62
    0xFFFFFFFFFFFFFFFFULL, 0x00000001FFFFFFFEULL,
63
    0x00000001FFFFFFFEULL, 0x00000001FFFFFFFEULL,
64
    0xFFFFFFFE00000001ULL, 0xFFFFFFFE00000002ULL
65
};
66
67
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
68
    { 0x00000000FFFFFFFFULL, 0xFFFFFFFF00000000ULL, 0xFFFFFFFFFFFFFFFEULL,
69
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
70
    { 0x00000001FFFFFFFEULL, 0xFFFFFFFE00000000ULL, 0xFFFFFFFFFFFFFFFDULL,
71
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
72
    { 0x00000002FFFFFFFDULL, 0xFFFFFFFD00000000ULL, 0xFFFFFFFFFFFFFFFCULL,
73
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
74
    { 0x00000003FFFFFFFCULL, 0xFFFFFFFC00000000ULL, 0xFFFFFFFFFFFFFFFBULL,
75
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
76
    { 0x00000004FFFFFFFBULL, 0xFFFFFFFB00000000ULL, 0xFFFFFFFFFFFFFFFAULL,
77
        0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL },
78
};
79
80
static const BN_ULONG _nist_p_384_sqr[] = {
81
    0xFFFFFFFE00000001ULL, 0x0000000200000000ULL, 0xFFFFFFFE00000000ULL,
82
    0x0000000200000000ULL, 0x0000000000000001ULL, 0x0000000000000000ULL,
83
    0x00000001FFFFFFFEULL, 0xFFFFFFFE00000000ULL, 0xFFFFFFFFFFFFFFFDULL,
84
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL
85
};
86
87
static const BN_ULONG _nist_p_521[] = {
88
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
89
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
90
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
91
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
92
    0x00000000000001FFULL
93
};
94
95
static const BN_ULONG _nist_p_521_sqr[] = {
96
    0x0000000000000001ULL, 0x0000000000000000ULL, 0x0000000000000000ULL,
97
    0x0000000000000000ULL, 0x0000000000000000ULL, 0x0000000000000000ULL,
98
    0x0000000000000000ULL, 0x0000000000000000ULL, 0xFFFFFFFFFFFFFC00ULL,
99
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
100
    0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL, 0xFFFFFFFFFFFFFFFFULL,
101
    0xFFFFFFFFFFFFFFFFULL, 0x000000000003FFFFULL
102
};
103
#elif BN_BITS2 == 32
104
static const BN_ULONG _nist_p_192[][BN_NIST_192_TOP] = {
105
    { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
106
    { 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
107
    { 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFC, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF }
108
};
109
110
static const BN_ULONG _nist_p_192_sqr[] = {
111
    0x00000001, 0x00000000, 0x00000002, 0x00000000, 0x00000001, 0x00000000,
112
    0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF
113
};
114
115
static const BN_ULONG _nist_p_224[][BN_NIST_224_TOP] = {
116
    { 0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFF,
117
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
118
    { 0x00000002, 0x00000000, 0x00000000, 0xFFFFFFFE,
119
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF }
120
};
121
122
static const BN_ULONG _nist_p_224_sqr[] = {
123
    0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFE,
124
    0xFFFFFFFF, 0xFFFFFFFF, 0x00000000, 0x00000002,
125
    0x00000000, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFF,
126
    0xFFFFFFFF, 0xFFFFFFFF
127
};
128
129
static const BN_ULONG _nist_p_256[][BN_NIST_256_TOP] = {
130
    { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000000,
131
        0x00000000, 0x00000000, 0x00000001, 0xFFFFFFFF },
132
    { 0xFFFFFFFE, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000001,
133
        0x00000000, 0x00000000, 0x00000002, 0xFFFFFFFE },
134
    { 0xFFFFFFFD, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000002,
135
        0x00000000, 0x00000000, 0x00000003, 0xFFFFFFFD },
136
    { 0xFFFFFFFC, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000003,
137
        0x00000000, 0x00000000, 0x00000004, 0xFFFFFFFC },
138
    { 0xFFFFFFFB, 0xFFFFFFFF, 0xFFFFFFFF, 0x00000004,
139
        0x00000000, 0x00000000, 0x00000005, 0xFFFFFFFB },
140
};
141
142
static const BN_ULONG _nist_p_256_sqr[] = {
143
    0x00000001, 0x00000000, 0x00000000, 0xFFFFFFFE,
144
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFE, 0x00000001,
145
    0xFFFFFFFE, 0x00000001, 0xFFFFFFFE, 0x00000001,
146
    0x00000001, 0xFFFFFFFE, 0x00000002, 0xFFFFFFFE
147
};
148
149
static const BN_ULONG _nist_p_384[][BN_NIST_384_TOP] = {
150
    { 0xFFFFFFFF, 0x00000000, 0x00000000, 0xFFFFFFFF, 0xFFFFFFFE, 0xFFFFFFFF,
151
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
152
    { 0xFFFFFFFE, 0x00000001, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFD, 0xFFFFFFFF,
153
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
154
    { 0xFFFFFFFD, 0x00000002, 0x00000000, 0xFFFFFFFD, 0xFFFFFFFC, 0xFFFFFFFF,
155
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
156
    { 0xFFFFFFFC, 0x00000003, 0x00000000, 0xFFFFFFFC, 0xFFFFFFFB, 0xFFFFFFFF,
157
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
158
    { 0xFFFFFFFB, 0x00000004, 0x00000000, 0xFFFFFFFB, 0xFFFFFFFA, 0xFFFFFFFF,
159
        0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF },
160
};
161
162
static const BN_ULONG _nist_p_384_sqr[] = {
163
    0x00000001, 0xFFFFFFFE, 0x00000000, 0x00000002, 0x00000000, 0xFFFFFFFE,
164
    0x00000000, 0x00000002, 0x00000001, 0x00000000, 0x00000000, 0x00000000,
165
    0xFFFFFFFE, 0x00000001, 0x00000000, 0xFFFFFFFE, 0xFFFFFFFD, 0xFFFFFFFF,
166
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF
167
};
168
169
static const BN_ULONG _nist_p_521[] = { 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
170
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
171
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
172
    0xFFFFFFFF, 0x000001FF };
173
174
static const BN_ULONG _nist_p_521_sqr[] = {
175
    0x00000001, 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
176
    0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000, 0x00000000,
177
    0x00000000, 0x00000000, 0x00000000, 0x00000000, 0xFFFFFC00, 0xFFFFFFFF,
178
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
179
    0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
180
    0xFFFFFFFF, 0xFFFFFFFF, 0x0003FFFF
181
};
182
#else
183
#error "unsupported BN_BITS2"
184
#endif
185
186
static const BIGNUM ossl_bignum_nist_p_192 = {
187
    (BN_ULONG *)_nist_p_192[0],
188
    BN_NIST_192_TOP,
189
    BN_NIST_192_TOP,
190
    0,
191
    BN_FLG_STATIC_DATA
192
};
193
194
static const BIGNUM ossl_bignum_nist_p_224 = {
195
    (BN_ULONG *)_nist_p_224[0],
196
    BN_NIST_224_TOP,
197
    BN_NIST_224_TOP,
198
    0,
199
    BN_FLG_STATIC_DATA
200
};
201
202
static const BIGNUM ossl_bignum_nist_p_256 = {
203
    (BN_ULONG *)_nist_p_256[0],
204
    BN_NIST_256_TOP,
205
    BN_NIST_256_TOP,
206
    0,
207
    BN_FLG_STATIC_DATA
208
};
209
210
static const BIGNUM ossl_bignum_nist_p_384 = {
211
    (BN_ULONG *)_nist_p_384[0],
212
    BN_NIST_384_TOP,
213
    BN_NIST_384_TOP,
214
    0,
215
    BN_FLG_STATIC_DATA
216
};
217
218
static const BIGNUM ossl_bignum_nist_p_521 = {
219
    (BN_ULONG *)_nist_p_521,
220
    BN_NIST_521_TOP,
221
    BN_NIST_521_TOP,
222
    0,
223
    BN_FLG_STATIC_DATA
224
};
225
226
const BIGNUM *BN_get0_nist_prime_192(void)
227
0
{
228
0
    return &ossl_bignum_nist_p_192;
229
0
}
230
231
const BIGNUM *BN_get0_nist_prime_224(void)
232
0
{
233
0
    return &ossl_bignum_nist_p_224;
234
0
}
235
236
const BIGNUM *BN_get0_nist_prime_256(void)
237
0
{
238
0
    return &ossl_bignum_nist_p_256;
239
0
}
240
241
const BIGNUM *BN_get0_nist_prime_384(void)
242
0
{
243
0
    return &ossl_bignum_nist_p_384;
244
0
}
245
246
const BIGNUM *BN_get0_nist_prime_521(void)
247
0
{
248
0
    return &ossl_bignum_nist_p_521;
249
0
}
250
251
/*
252
 * To avoid more recent compilers (specifically clang-14) from treating this
253
 * code as a violation of the strict aliasing conditions and omitting it, this
254
 * cannot be declared as a function.  Moreover, the dst parameter cannot be
255
 * cached in a local since this no longer references the union and again falls
256
 * foul of the strict aliasing criteria.  Refer to #18225 for the initial
257
 * diagnostics and llvm/llvm-project#55255 for the later discussions with the
258
 * LLVM developers.  The problem boils down to if an array in the union is
259
 * converted to a pointer or if it is used directly.
260
 *
261
 * This function was inlined regardless, so there is no space cost to be
262
 * paid for making it a macro.
263
 */
264
#define nist_cp_bn_0(dst, src_in, top, max) \
265
0
    {                                       \
266
0
        int ii;                             \
267
0
        const BN_ULONG *src = src_in;       \
268
0
                                            \
269
0
        for (ii = 0; ii < top; ii++)        \
270
0
            (dst)[ii] = src[ii];            \
271
0
        for (; ii < max; ii++)              \
272
0
            (dst)[ii] = 0;                  \
273
0
    }
274
275
static void nist_cp_bn(BN_ULONG *dst, const BN_ULONG *src, int top)
276
0
{
277
0
    int i;
278
279
0
    for (i = 0; i < top; i++)
280
0
        dst[i] = src[i];
281
0
}
282
283
#if BN_BITS2 == 64
284
#define bn_cp_64(to, n, from, m) (to)[n] = (m >= 0) ? ((from)[m]) : 0;
285
#define bn_64_set_0(to, n) (to)[n] = (BN_ULONG)0;
286
/*
287
 * two following macros are implemented under assumption that they
288
 * are called in a sequence with *ascending* n, i.e. as they are...
289
 */
290
0
#define bn_cp_32_naked(to, n, from, m) (((n) & 1) ? (to[(n) / 2] |= ((m) & 1) ? (from[(m) / 2] & BN_MASK2h) : (from[(m) / 2] << 32)) \
291
0
                                                  : (to[(n) / 2] = ((m) & 1) ? (from[(m) / 2] >> 32) : (from[(m) / 2] & BN_MASK2l)))
292
0
#define bn_32_set_0(to, n) (((n) & 1) ? (to[(n) / 2] &= BN_MASK2l) : (to[(n) / 2] = 0));
293
0
#define bn_cp_32(to, n, from, m) ((m) >= 0) ? bn_cp_32_naked(to, n, from, m) : bn_32_set_0(to, n)
294
#if defined(L_ENDIAN)
295
#if defined(__arch64__)
296
#define NIST_INT64 long
297
#else
298
0
#define NIST_INT64 long long
299
#endif
300
#endif
301
#else
302
#define bn_cp_64(to, n, from, m)                      \
303
    {                                                 \
304
        bn_cp_32(to, (n) * 2, from, (m) * 2);         \
305
        bn_cp_32(to, (n) * 2 + 1, from, (m) * 2 + 1); \
306
    }
307
#define bn_64_set_0(to, n)            \
308
    {                                 \
309
        bn_32_set_0(to, (n) * 2);     \
310
        bn_32_set_0(to, (n) * 2 + 1); \
311
    }
312
#define bn_cp_32(to, n, from, m) (to)[n] = (m >= 0) ? ((from)[m]) : 0;
313
#define bn_32_set_0(to, n) (to)[n] = (BN_ULONG)0;
314
#if defined(_WIN32) && !defined(__GNUC__)
315
#define NIST_INT64 __int64
316
#elif defined(BN_LLONG)
317
#define NIST_INT64 long long
318
#endif
319
#endif /* BN_BITS2 != 64 */
320
321
#ifdef NIST_INT64
322
/* Helpers to load/store a 32-bit word (uint32_t) from/into a memory
323
 * location and avoid potential aliasing issue.  */
324
static ossl_inline uint32_t load_u32(const void *ptr)
325
0
{
326
0
    uint32_t tmp;
327
328
0
    memcpy(&tmp, ptr, sizeof(tmp));
329
0
    return tmp;
330
0
}
331
332
static ossl_inline void store_lo32(void *ptr, NIST_INT64 val)
333
0
{
334
    /* A cast is needed for big-endian system: on a 32-bit BE system
335
     * NIST_INT64 may be defined as well if the compiler supports 64-bit
336
     * long long.  */
337
0
    uint32_t tmp = (uint32_t)val;
338
339
0
    memcpy(ptr, &tmp, sizeof(tmp));
340
0
}
341
#endif /* NIST_INT64 */
342
343
#define nist_set_192(to, from, a1, a2, a3)      \
344
    {                                           \
345
        bn_cp_64(to, 0, from, (a3) - 3)         \
346
            bn_cp_64(to, 1, from, (a2) - 3)     \
347
                bn_cp_64(to, 2, from, (a1) - 3) \
348
    }
349
350
int BN_nist_mod_192(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
351
    BN_CTX *ctx)
352
0
{
353
0
    int top = a->top, i;
354
0
    int carry;
355
0
    register BN_ULONG *r_d, *a_d = a->d;
356
0
    union {
357
0
        BN_ULONG bn[BN_NIST_192_TOP];
358
0
        unsigned int ui[BN_NIST_192_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
359
0
    } buf;
360
0
    BN_ULONG c_d[BN_NIST_192_TOP], *res;
361
0
    static const BIGNUM ossl_bignum_nist_p_192_sqr = {
362
0
        (BN_ULONG *)_nist_p_192_sqr,
363
0
        OSSL_NELEM(_nist_p_192_sqr),
364
0
        OSSL_NELEM(_nist_p_192_sqr),
365
0
        0, BN_FLG_STATIC_DATA
366
0
    };
367
368
0
    field = &ossl_bignum_nist_p_192; /* just to make sure */
369
370
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_192_sqr) >= 0)
371
0
        return BN_nnmod(r, a, field, ctx);
372
373
0
    i = BN_ucmp(field, a);
374
0
    if (i == 0) {
375
0
        BN_zero(r);
376
0
        return 1;
377
0
    } else if (i > 0)
378
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
379
380
0
    if (r != a) {
381
0
        if (!bn_wexpand(r, BN_NIST_192_TOP))
382
0
            return 0;
383
0
        r_d = r->d;
384
0
        nist_cp_bn(r_d, a_d, BN_NIST_192_TOP);
385
0
    } else
386
0
        r_d = a_d;
387
388
0
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_192_TOP, top - BN_NIST_192_TOP,
389
0
        BN_NIST_192_TOP);
390
391
0
#if defined(NIST_INT64)
392
0
    {
393
0
        NIST_INT64 acc; /* accumulator */
394
0
        unsigned int *rp = (unsigned int *)r_d;
395
0
        const unsigned int *bp = (const unsigned int *)buf.ui;
396
397
0
        acc = load_u32(&rp[0]);
398
0
        acc += bp[3 * 2 - 6];
399
0
        acc += bp[5 * 2 - 6];
400
0
        store_lo32(&rp[0], acc);
401
0
        acc >>= 32;
402
403
0
        acc += load_u32(&rp[1]);
404
0
        acc += bp[3 * 2 - 5];
405
0
        acc += bp[5 * 2 - 5];
406
0
        store_lo32(&rp[1], acc);
407
0
        acc >>= 32;
408
409
0
        acc += load_u32(&rp[2]);
410
0
        acc += bp[3 * 2 - 6];
411
0
        acc += bp[4 * 2 - 6];
412
0
        acc += bp[5 * 2 - 6];
413
0
        store_lo32(&rp[2], acc);
414
0
        acc >>= 32;
415
416
0
        acc += load_u32(&rp[3]);
417
0
        acc += bp[3 * 2 - 5];
418
0
        acc += bp[4 * 2 - 5];
419
0
        acc += bp[5 * 2 - 5];
420
0
        store_lo32(&rp[3], acc);
421
0
        acc >>= 32;
422
423
0
        acc += load_u32(&rp[4]);
424
0
        acc += bp[4 * 2 - 6];
425
0
        acc += bp[5 * 2 - 6];
426
0
        store_lo32(&rp[4], acc);
427
0
        acc >>= 32;
428
429
0
        acc += load_u32(&rp[5]);
430
0
        acc += bp[4 * 2 - 5];
431
0
        acc += bp[5 * 2 - 5];
432
0
        store_lo32(&rp[5], acc);
433
434
0
        carry = (int)(acc >> 32);
435
0
    }
436
#else
437
    {
438
        BN_ULONG t_d[BN_NIST_192_TOP];
439
440
        nist_set_192(t_d, buf.bn, 0, 3, 3);
441
        carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
442
        nist_set_192(t_d, buf.bn, 4, 4, 0);
443
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
444
        nist_set_192(t_d, buf.bn, 5, 5, 5)
445
            carry
446
            += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_192_TOP);
447
    }
448
#endif
449
0
    if (carry > 0)
450
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_192[carry - 1],
451
0
            BN_NIST_192_TOP);
452
0
    else
453
0
        carry = 1;
454
455
    /*
456
     * we need 'if (carry==0 || result>=modulus) result-=modulus;'
457
     * as comparison implies subtraction, we can write
458
     * 'tmp=result-modulus; if (!carry || !borrow) result=tmp;'
459
     * this is what happens below, but without explicit if:-) a.
460
     */
461
0
    res = (bn_sub_words(c_d, r_d, _nist_p_192[0], BN_NIST_192_TOP) && carry)
462
0
        ? r_d
463
0
        : c_d;
464
0
    nist_cp_bn(r_d, res, BN_NIST_192_TOP);
465
0
    r->top = BN_NIST_192_TOP;
466
0
    bn_correct_top(r);
467
468
0
    return 1;
469
0
}
470
471
typedef BN_ULONG (*bn_addsub_f)(BN_ULONG *, const BN_ULONG *,
472
    const BN_ULONG *, int);
473
474
#define nist_set_224(to, from, a1, a2, a3, a4, a5, a6, a7)      \
475
0
    {                                                           \
476
0
        bn_cp_32(to, 0, from, (a7) - 7)                         \
477
0
            bn_cp_32(to, 1, from, (a6) - 7)                     \
478
0
                bn_cp_32(to, 2, from, (a5) - 7)                 \
479
0
                    bn_cp_32(to, 3, from, (a4) - 7)             \
480
0
                        bn_cp_32(to, 4, from, (a3) - 7)         \
481
0
                            bn_cp_32(to, 5, from, (a2) - 7)     \
482
0
                                bn_cp_32(to, 6, from, (a1) - 7) \
483
0
    }
484
485
int BN_nist_mod_224(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
486
    BN_CTX *ctx)
487
0
{
488
0
    int top = a->top, i;
489
0
    int carry;
490
0
    BN_ULONG *r_d, *a_d = a->d;
491
0
    union {
492
0
        BN_ULONG bn[BN_NIST_224_TOP];
493
0
        unsigned int ui[BN_NIST_224_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
494
0
    } buf;
495
0
    BN_ULONG c_d[BN_NIST_224_TOP], *res;
496
0
    bn_addsub_f adjust;
497
0
    static const BIGNUM ossl_bignum_nist_p_224_sqr = {
498
0
        (BN_ULONG *)_nist_p_224_sqr,
499
0
        OSSL_NELEM(_nist_p_224_sqr),
500
0
        OSSL_NELEM(_nist_p_224_sqr),
501
0
        0, BN_FLG_STATIC_DATA
502
0
    };
503
504
0
    field = &ossl_bignum_nist_p_224; /* just to make sure */
505
506
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_224_sqr) >= 0)
507
0
        return BN_nnmod(r, a, field, ctx);
508
509
0
    i = BN_ucmp(field, a);
510
0
    if (i == 0) {
511
0
        BN_zero(r);
512
0
        return 1;
513
0
    } else if (i > 0)
514
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
515
516
0
    if (r != a) {
517
0
        if (!bn_wexpand(r, BN_NIST_224_TOP))
518
0
            return 0;
519
0
        r_d = r->d;
520
0
        nist_cp_bn(r_d, a_d, BN_NIST_224_TOP);
521
0
    } else
522
0
        r_d = a_d;
523
524
0
#if BN_BITS2 == 64
525
    /* copy upper 256 bits of 448 bit number ... */
526
0
    nist_cp_bn_0(c_d, a_d + (BN_NIST_224_TOP - 1),
527
0
        top - (BN_NIST_224_TOP - 1), BN_NIST_224_TOP);
528
    /* ... and right shift by 32 to obtain upper 224 bits */
529
0
    nist_set_224(buf.bn, c_d, 14, 13, 12, 11, 10, 9, 8);
530
    /* truncate lower part to 224 bits too */
531
0
    r_d[BN_NIST_224_TOP - 1] &= BN_MASK2l;
532
#else
533
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_224_TOP, top - BN_NIST_224_TOP,
534
        BN_NIST_224_TOP);
535
#endif
536
537
#if defined(NIST_INT64) && BN_BITS2 != 64
538
    {
539
        NIST_INT64 acc; /* accumulator */
540
        unsigned int *rp = (unsigned int *)r_d;
541
        const unsigned int *bp = (const unsigned int *)buf.ui;
542
543
        acc = rp[0];
544
        acc -= bp[7 - 7];
545
        acc -= bp[11 - 7];
546
        rp[0] = (unsigned int)acc;
547
        acc >>= 32;
548
549
        acc += rp[1];
550
        acc -= bp[8 - 7];
551
        acc -= bp[12 - 7];
552
        rp[1] = (unsigned int)acc;
553
        acc >>= 32;
554
555
        acc += rp[2];
556
        acc -= bp[9 - 7];
557
        acc -= bp[13 - 7];
558
        rp[2] = (unsigned int)acc;
559
        acc >>= 32;
560
561
        acc += rp[3];
562
        acc += bp[7 - 7];
563
        acc += bp[11 - 7];
564
        acc -= bp[10 - 7];
565
        rp[3] = (unsigned int)acc;
566
        acc >>= 32;
567
568
        acc += rp[4];
569
        acc += bp[8 - 7];
570
        acc += bp[12 - 7];
571
        acc -= bp[11 - 7];
572
        rp[4] = (unsigned int)acc;
573
        acc >>= 32;
574
575
        acc += rp[5];
576
        acc += bp[9 - 7];
577
        acc += bp[13 - 7];
578
        acc -= bp[12 - 7];
579
        rp[5] = (unsigned int)acc;
580
        acc >>= 32;
581
582
        acc += rp[6];
583
        acc += bp[10 - 7];
584
        acc -= bp[13 - 7];
585
        rp[6] = (unsigned int)acc;
586
587
        carry = (int)(acc >> 32);
588
#if BN_BITS2 == 64
589
        rp[7] = carry;
590
#endif
591
    }
592
#else
593
0
    {
594
0
        BN_ULONG t_d[BN_NIST_224_TOP];
595
596
0
        nist_set_224(t_d, buf.bn, 10, 9, 8, 7, 0, 0, 0);
597
0
        carry = (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
598
0
        nist_set_224(t_d, buf.bn, 0, 13, 12, 11, 0, 0, 0);
599
0
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_224_TOP);
600
0
        nist_set_224(t_d, buf.bn, 13, 12, 11, 10, 9, 8, 7);
601
0
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);
602
0
        nist_set_224(t_d, buf.bn, 0, 0, 0, 0, 13, 12, 11);
603
0
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_224_TOP);
604
605
0
#if BN_BITS2 == 64
606
0
        carry = (int)(r_d[BN_NIST_224_TOP - 1] >> 32);
607
0
#endif
608
0
    }
609
0
#endif
610
0
    adjust = bn_sub_words;
611
0
    if (carry > 0) {
612
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_224[carry - 1],
613
0
            BN_NIST_224_TOP);
614
0
#if BN_BITS2 == 64
615
0
        carry = (int)(~(r_d[BN_NIST_224_TOP - 1] >> 32)) & 1;
616
0
#endif
617
0
    } else if (carry < 0) {
618
        /*
619
         * it's a bit more complicated logic in this case. if bn_add_words
620
         * yields no carry, then result has to be adjusted by unconditionally
621
         * *adding* the modulus. but if it does, then result has to be
622
         * compared to the modulus and conditionally adjusted by
623
         * *subtracting* the latter.
624
         */
625
0
        carry = (int)bn_add_words(r_d, r_d, _nist_p_224[-carry - 1],
626
0
            BN_NIST_224_TOP);
627
0
        adjust = carry ? bn_sub_words : bn_add_words;
628
0
    } else
629
0
        carry = 1;
630
631
    /* otherwise it's effectively same as in BN_nist_mod_192... */
632
0
    res = ((*adjust)(c_d, r_d, _nist_p_224[0], BN_NIST_224_TOP) && carry)
633
0
        ? r_d
634
0
        : c_d;
635
0
    nist_cp_bn(r_d, res, BN_NIST_224_TOP);
636
0
    r->top = BN_NIST_224_TOP;
637
0
    bn_correct_top(r);
638
639
0
    return 1;
640
0
}
641
642
#define nist_set_256(to, from, a1, a2, a3, a4, a5, a6, a7, a8)      \
643
    {                                                               \
644
        bn_cp_32(to, 0, from, (a8) - 8)                             \
645
            bn_cp_32(to, 1, from, (a7) - 8)                         \
646
                bn_cp_32(to, 2, from, (a6) - 8)                     \
647
                    bn_cp_32(to, 3, from, (a5) - 8)                 \
648
                        bn_cp_32(to, 4, from, (a4) - 8)             \
649
                            bn_cp_32(to, 5, from, (a3) - 8)         \
650
                                bn_cp_32(to, 6, from, (a2) - 8)     \
651
                                    bn_cp_32(to, 7, from, (a1) - 8) \
652
    }
653
654
int BN_nist_mod_256(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
655
    BN_CTX *ctx)
656
0
{
657
0
    int i, top = a->top;
658
0
    int carry = 0;
659
0
    register BN_ULONG *a_d = a->d, *r_d;
660
0
    union {
661
0
        BN_ULONG bn[BN_NIST_256_TOP];
662
0
        unsigned int ui[BN_NIST_256_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
663
0
    } buf;
664
0
    BN_ULONG c_d[BN_NIST_256_TOP], *res;
665
0
    bn_addsub_f adjust;
666
0
    static const BIGNUM ossl_bignum_nist_p_256_sqr = {
667
0
        (BN_ULONG *)_nist_p_256_sqr,
668
0
        OSSL_NELEM(_nist_p_256_sqr),
669
0
        OSSL_NELEM(_nist_p_256_sqr),
670
0
        0, BN_FLG_STATIC_DATA
671
0
    };
672
673
0
    field = &ossl_bignum_nist_p_256; /* just to make sure */
674
675
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_256_sqr) >= 0)
676
0
        return BN_nnmod(r, a, field, ctx);
677
678
0
    i = BN_ucmp(field, a);
679
0
    if (i == 0) {
680
0
        BN_zero(r);
681
0
        return 1;
682
0
    } else if (i > 0)
683
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
684
685
0
    if (r != a) {
686
0
        if (!bn_wexpand(r, BN_NIST_256_TOP))
687
0
            return 0;
688
0
        r_d = r->d;
689
0
        nist_cp_bn(r_d, a_d, BN_NIST_256_TOP);
690
0
    } else
691
0
        r_d = a_d;
692
693
0
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_256_TOP, top - BN_NIST_256_TOP,
694
0
        BN_NIST_256_TOP);
695
696
0
#if defined(NIST_INT64)
697
0
    {
698
0
        NIST_INT64 acc; /* accumulator */
699
0
        unsigned int *rp = (unsigned int *)r_d;
700
0
        const unsigned int *bp = (const unsigned int *)buf.ui;
701
702
0
        acc = load_u32(&rp[0]);
703
0
        acc += bp[8 - 8];
704
0
        acc += bp[9 - 8];
705
0
        acc -= bp[11 - 8];
706
0
        acc -= bp[12 - 8];
707
0
        acc -= bp[13 - 8];
708
0
        acc -= bp[14 - 8];
709
0
        store_lo32(&rp[0], acc);
710
0
        acc >>= 32;
711
712
0
        acc += load_u32(&rp[1]);
713
0
        acc += bp[9 - 8];
714
0
        acc += bp[10 - 8];
715
0
        acc -= bp[12 - 8];
716
0
        acc -= bp[13 - 8];
717
0
        acc -= bp[14 - 8];
718
0
        acc -= bp[15 - 8];
719
0
        store_lo32(&rp[1], acc);
720
0
        acc >>= 32;
721
722
0
        acc += load_u32(&rp[2]);
723
0
        acc += bp[10 - 8];
724
0
        acc += bp[11 - 8];
725
0
        acc -= bp[13 - 8];
726
0
        acc -= bp[14 - 8];
727
0
        acc -= bp[15 - 8];
728
0
        store_lo32(&rp[2], acc);
729
0
        acc >>= 32;
730
731
0
        acc += load_u32(&rp[3]);
732
0
        acc += bp[11 - 8];
733
0
        acc += bp[11 - 8];
734
0
        acc += bp[12 - 8];
735
0
        acc += bp[12 - 8];
736
0
        acc += bp[13 - 8];
737
0
        acc -= bp[15 - 8];
738
0
        acc -= bp[8 - 8];
739
0
        acc -= bp[9 - 8];
740
0
        store_lo32(&rp[3], acc);
741
0
        acc >>= 32;
742
743
0
        acc += load_u32(&rp[4]);
744
0
        acc += bp[12 - 8];
745
0
        acc += bp[12 - 8];
746
0
        acc += bp[13 - 8];
747
0
        acc += bp[13 - 8];
748
0
        acc += bp[14 - 8];
749
0
        acc -= bp[9 - 8];
750
0
        acc -= bp[10 - 8];
751
0
        store_lo32(&rp[4], acc);
752
0
        acc >>= 32;
753
754
0
        acc += load_u32(&rp[5]);
755
0
        acc += bp[13 - 8];
756
0
        acc += bp[13 - 8];
757
0
        acc += bp[14 - 8];
758
0
        acc += bp[14 - 8];
759
0
        acc += bp[15 - 8];
760
0
        acc -= bp[10 - 8];
761
0
        acc -= bp[11 - 8];
762
0
        store_lo32(&rp[5], acc);
763
0
        acc >>= 32;
764
765
0
        acc += load_u32(&rp[6]);
766
0
        acc += bp[14 - 8];
767
0
        acc += bp[14 - 8];
768
0
        acc += bp[15 - 8];
769
0
        acc += bp[15 - 8];
770
0
        acc += bp[14 - 8];
771
0
        acc += bp[13 - 8];
772
0
        acc -= bp[8 - 8];
773
0
        acc -= bp[9 - 8];
774
0
        store_lo32(&rp[6], acc);
775
0
        acc >>= 32;
776
777
0
        acc += load_u32(&rp[7]);
778
0
        acc += bp[15 - 8];
779
0
        acc += bp[15 - 8];
780
0
        acc += bp[15 - 8];
781
0
        acc += bp[8 - 8];
782
0
        acc -= bp[10 - 8];
783
0
        acc -= bp[11 - 8];
784
0
        acc -= bp[12 - 8];
785
0
        acc -= bp[13 - 8];
786
0
        store_lo32(&rp[7], acc);
787
788
0
        carry = (int)(acc >> 32);
789
0
    }
790
#else
791
    {
792
        BN_ULONG t_d[BN_NIST_256_TOP];
793
794
        /*
795
         * S1
796
         */
797
        nist_set_256(t_d, buf.bn, 15, 14, 13, 12, 11, 0, 0, 0);
798
        /*
799
         * S2
800
         */
801
        nist_set_256(c_d, buf.bn, 0, 15, 14, 13, 12, 0, 0, 0);
802
        carry = (int)bn_add_words(t_d, t_d, c_d, BN_NIST_256_TOP);
803
        /* left shift */
804
        {
805
            register BN_ULONG *ap, t, c;
806
            ap = t_d;
807
            c = 0;
808
            for (i = BN_NIST_256_TOP; i != 0; --i) {
809
                t = *ap;
810
                *(ap++) = ((t << 1) | c) & BN_MASK2;
811
                c = (t & BN_TBIT) ? 1 : 0;
812
            }
813
            carry <<= 1;
814
            carry |= c;
815
        }
816
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
817
        /*
818
         * S3
819
         */
820
        nist_set_256(t_d, buf.bn, 15, 14, 0, 0, 0, 10, 9, 8);
821
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
822
        /*
823
         * S4
824
         */
825
        nist_set_256(t_d, buf.bn, 8, 13, 15, 14, 13, 11, 10, 9);
826
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_256_TOP);
827
        /*
828
         * D1
829
         */
830
        nist_set_256(t_d, buf.bn, 10, 8, 0, 0, 0, 13, 12, 11);
831
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
832
        /*
833
         * D2
834
         */
835
        nist_set_256(t_d, buf.bn, 11, 9, 0, 0, 15, 14, 13, 12);
836
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
837
        /*
838
         * D3
839
         */
840
        nist_set_256(t_d, buf.bn, 12, 0, 10, 9, 8, 15, 14, 13);
841
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
842
        /*
843
         * D4
844
         */
845
        nist_set_256(t_d, buf.bn, 13, 0, 11, 10, 9, 0, 15, 14);
846
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_256_TOP);
847
    }
848
#endif
849
    /* see BN_nist_mod_224 for explanation */
850
0
    adjust = bn_sub_words;
851
0
    if (carry > 0)
852
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_256[carry - 1],
853
0
            BN_NIST_256_TOP);
854
0
    else if (carry < 0) {
855
0
        carry = (int)bn_add_words(r_d, r_d, _nist_p_256[-carry - 1],
856
0
            BN_NIST_256_TOP);
857
0
        adjust = carry ? bn_sub_words : bn_add_words;
858
0
    } else
859
0
        carry = 1;
860
861
0
    res = ((*adjust)(c_d, r_d, _nist_p_256[0], BN_NIST_256_TOP) && carry)
862
0
        ? r_d
863
0
        : c_d;
864
0
    nist_cp_bn(r_d, res, BN_NIST_256_TOP);
865
0
    r->top = BN_NIST_256_TOP;
866
0
    bn_correct_top(r);
867
868
0
    return 1;
869
0
}
870
871
#define nist_set_384(to, from, a1, a2, a3, a4, a5, a6, a7, a8, a9, a10, a11, a12)     \
872
    {                                                                                 \
873
        bn_cp_32(to, 0, from, (a12) - 12)                                             \
874
            bn_cp_32(to, 1, from, (a11) - 12)                                         \
875
                bn_cp_32(to, 2, from, (a10) - 12)                                     \
876
                    bn_cp_32(to, 3, from, (a9) - 12)                                  \
877
                        bn_cp_32(to, 4, from, (a8) - 12)                              \
878
                            bn_cp_32(to, 5, from, (a7) - 12)                          \
879
                                bn_cp_32(to, 6, from, (a6) - 12)                      \
880
                                    bn_cp_32(to, 7, from, (a5) - 12)                  \
881
                                        bn_cp_32(to, 8, from, (a4) - 12)              \
882
                                            bn_cp_32(to, 9, from, (a3) - 12)          \
883
                                                bn_cp_32(to, 10, from, (a2) - 12)     \
884
                                                    bn_cp_32(to, 11, from, (a1) - 12) \
885
    }
886
887
int BN_nist_mod_384(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
888
    BN_CTX *ctx)
889
0
{
890
0
    int i, top = a->top;
891
0
    int carry = 0;
892
0
    register BN_ULONG *r_d, *a_d = a->d;
893
0
    union {
894
0
        BN_ULONG bn[BN_NIST_384_TOP];
895
0
        unsigned int ui[BN_NIST_384_TOP * sizeof(BN_ULONG) / sizeof(unsigned int)];
896
0
    } buf;
897
0
    BN_ULONG c_d[BN_NIST_384_TOP], *res;
898
0
    bn_addsub_f adjust;
899
0
    static const BIGNUM ossl_bignum_nist_p_384_sqr = {
900
0
        (BN_ULONG *)_nist_p_384_sqr,
901
0
        OSSL_NELEM(_nist_p_384_sqr),
902
0
        OSSL_NELEM(_nist_p_384_sqr),
903
0
        0, BN_FLG_STATIC_DATA
904
0
    };
905
906
0
    field = &ossl_bignum_nist_p_384; /* just to make sure */
907
908
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_384_sqr) >= 0)
909
0
        return BN_nnmod(r, a, field, ctx);
910
911
0
    i = BN_ucmp(field, a);
912
0
    if (i == 0) {
913
0
        BN_zero(r);
914
0
        return 1;
915
0
    } else if (i > 0)
916
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
917
918
0
    if (r != a) {
919
0
        if (!bn_wexpand(r, BN_NIST_384_TOP))
920
0
            return 0;
921
0
        r_d = r->d;
922
0
        nist_cp_bn(r_d, a_d, BN_NIST_384_TOP);
923
0
    } else
924
0
        r_d = a_d;
925
926
0
    nist_cp_bn_0(buf.bn, a_d + BN_NIST_384_TOP, top - BN_NIST_384_TOP,
927
0
        BN_NIST_384_TOP);
928
929
0
#if defined(NIST_INT64)
930
0
    {
931
0
        NIST_INT64 acc; /* accumulator */
932
0
        unsigned int *rp = (unsigned int *)r_d;
933
0
        const unsigned int *bp = (const unsigned int *)buf.ui;
934
935
0
        acc = load_u32(&rp[0]);
936
0
        acc += bp[12 - 12];
937
0
        acc += bp[21 - 12];
938
0
        acc += bp[20 - 12];
939
0
        acc -= bp[23 - 12];
940
0
        store_lo32(&rp[0], acc);
941
0
        acc >>= 32;
942
943
0
        acc += load_u32(&rp[1]);
944
0
        acc += bp[13 - 12];
945
0
        acc += bp[22 - 12];
946
0
        acc += bp[23 - 12];
947
0
        acc -= bp[12 - 12];
948
0
        acc -= bp[20 - 12];
949
0
        store_lo32(&rp[1], acc);
950
0
        acc >>= 32;
951
952
0
        acc += load_u32(&rp[2]);
953
0
        acc += bp[14 - 12];
954
0
        acc += bp[23 - 12];
955
0
        acc -= bp[13 - 12];
956
0
        acc -= bp[21 - 12];
957
0
        store_lo32(&rp[2], acc);
958
0
        acc >>= 32;
959
960
0
        acc += load_u32(&rp[3]);
961
0
        acc += bp[15 - 12];
962
0
        acc += bp[12 - 12];
963
0
        acc += bp[20 - 12];
964
0
        acc += bp[21 - 12];
965
0
        acc -= bp[14 - 12];
966
0
        acc -= bp[22 - 12];
967
0
        acc -= bp[23 - 12];
968
0
        store_lo32(&rp[3], acc);
969
0
        acc >>= 32;
970
971
0
        acc += load_u32(&rp[4]);
972
0
        acc += bp[21 - 12];
973
0
        acc += bp[21 - 12];
974
0
        acc += bp[16 - 12];
975
0
        acc += bp[13 - 12];
976
0
        acc += bp[12 - 12];
977
0
        acc += bp[20 - 12];
978
0
        acc += bp[22 - 12];
979
0
        acc -= bp[15 - 12];
980
0
        acc -= bp[23 - 12];
981
0
        acc -= bp[23 - 12];
982
0
        store_lo32(&rp[4], acc);
983
0
        acc >>= 32;
984
985
0
        acc += load_u32(&rp[5]);
986
0
        acc += bp[22 - 12];
987
0
        acc += bp[22 - 12];
988
0
        acc += bp[17 - 12];
989
0
        acc += bp[14 - 12];
990
0
        acc += bp[13 - 12];
991
0
        acc += bp[21 - 12];
992
0
        acc += bp[23 - 12];
993
0
        acc -= bp[16 - 12];
994
0
        store_lo32(&rp[5], acc);
995
0
        acc >>= 32;
996
997
0
        acc += load_u32(&rp[6]);
998
0
        acc += bp[23 - 12];
999
0
        acc += bp[23 - 12];
1000
0
        acc += bp[18 - 12];
1001
0
        acc += bp[15 - 12];
1002
0
        acc += bp[14 - 12];
1003
0
        acc += bp[22 - 12];
1004
0
        acc -= bp[17 - 12];
1005
0
        store_lo32(&rp[6], acc);
1006
0
        acc >>= 32;
1007
1008
0
        acc += load_u32(&rp[7]);
1009
0
        acc += bp[19 - 12];
1010
0
        acc += bp[16 - 12];
1011
0
        acc += bp[15 - 12];
1012
0
        acc += bp[23 - 12];
1013
0
        acc -= bp[18 - 12];
1014
0
        store_lo32(&rp[7], acc);
1015
0
        acc >>= 32;
1016
1017
0
        acc += load_u32(&rp[8]);
1018
0
        acc += bp[20 - 12];
1019
0
        acc += bp[17 - 12];
1020
0
        acc += bp[16 - 12];
1021
0
        acc -= bp[19 - 12];
1022
0
        store_lo32(&rp[8], acc);
1023
0
        acc >>= 32;
1024
1025
0
        acc += load_u32(&rp[9]);
1026
0
        acc += bp[21 - 12];
1027
0
        acc += bp[18 - 12];
1028
0
        acc += bp[17 - 12];
1029
0
        acc -= bp[20 - 12];
1030
0
        store_lo32(&rp[9], acc);
1031
0
        acc >>= 32;
1032
1033
0
        acc += load_u32(&rp[10]);
1034
0
        acc += bp[22 - 12];
1035
0
        acc += bp[19 - 12];
1036
0
        acc += bp[18 - 12];
1037
0
        acc -= bp[21 - 12];
1038
0
        store_lo32(&rp[10], acc);
1039
0
        acc >>= 32;
1040
1041
0
        acc += load_u32(&rp[11]);
1042
0
        acc += bp[23 - 12];
1043
0
        acc += bp[20 - 12];
1044
0
        acc += bp[19 - 12];
1045
0
        acc -= bp[22 - 12];
1046
0
        store_lo32(&rp[11], acc);
1047
1048
0
        carry = (int)(acc >> 32);
1049
0
    }
1050
#else
1051
    {
1052
        BN_ULONG t_d[BN_NIST_384_TOP];
1053
1054
        /*
1055
         * S1
1056
         */
1057
        nist_set_256(t_d, buf.bn, 0, 0, 0, 0, 0, 23 - 4, 22 - 4, 21 - 4);
1058
        /* left shift */
1059
        {
1060
            register BN_ULONG *ap, t, c;
1061
            ap = t_d;
1062
            c = 0;
1063
            for (i = 3; i != 0; --i) {
1064
                t = *ap;
1065
                *(ap++) = ((t << 1) | c) & BN_MASK2;
1066
                c = (t & BN_TBIT) ? 1 : 0;
1067
            }
1068
            *ap = c;
1069
        }
1070
        carry = (int)bn_add_words(r_d + (128 / BN_BITS2), r_d + (128 / BN_BITS2),
1071
            t_d, BN_NIST_256_TOP);
1072
        /*
1073
         * S2
1074
         */
1075
        carry += (int)bn_add_words(r_d, r_d, buf.bn, BN_NIST_384_TOP);
1076
        /*
1077
         * S3
1078
         */
1079
        nist_set_384(t_d, buf.bn, 20, 19, 18, 17, 16, 15, 14, 13, 12, 23, 22,
1080
            21);
1081
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1082
        /*
1083
         * S4
1084
         */
1085
        nist_set_384(t_d, buf.bn, 19, 18, 17, 16, 15, 14, 13, 12, 20, 0, 23,
1086
            0);
1087
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1088
        /*
1089
         * S5
1090
         */
1091
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 23, 22, 21, 20, 0, 0, 0, 0);
1092
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1093
        /*
1094
         * S6
1095
         */
1096
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 23, 22, 21, 0, 0, 20);
1097
        carry += (int)bn_add_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1098
        /*
1099
         * D1
1100
         */
1101
        nist_set_384(t_d, buf.bn, 22, 21, 20, 19, 18, 17, 16, 15, 14, 13, 12,
1102
            23);
1103
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1104
        /*
1105
         * D2
1106
         */
1107
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 0, 23, 22, 21, 20, 0);
1108
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1109
        /*
1110
         * D3
1111
         */
1112
        nist_set_384(t_d, buf.bn, 0, 0, 0, 0, 0, 0, 0, 23, 23, 0, 0, 0);
1113
        carry -= (int)bn_sub_words(r_d, r_d, t_d, BN_NIST_384_TOP);
1114
    }
1115
#endif
1116
    /* see BN_nist_mod_224 for explanation */
1117
0
    adjust = bn_sub_words;
1118
0
    if (carry > 0)
1119
0
        carry = (int)bn_sub_words(r_d, r_d, _nist_p_384[carry - 1],
1120
0
            BN_NIST_384_TOP);
1121
0
    else if (carry < 0) {
1122
0
        carry = (int)bn_add_words(r_d, r_d, _nist_p_384[-carry - 1],
1123
0
            BN_NIST_384_TOP);
1124
0
        adjust = carry ? bn_sub_words : bn_add_words;
1125
0
    } else
1126
0
        carry = 1;
1127
1128
0
    res = ((*adjust)(c_d, r_d, _nist_p_384[0], BN_NIST_384_TOP) && carry)
1129
0
        ? r_d
1130
0
        : c_d;
1131
0
    nist_cp_bn(r_d, res, BN_NIST_384_TOP);
1132
0
    r->top = BN_NIST_384_TOP;
1133
0
    bn_correct_top(r);
1134
1135
0
    return 1;
1136
0
}
1137
1138
0
#define BN_NIST_521_RSHIFT (521 % BN_BITS2)
1139
0
#define BN_NIST_521_LSHIFT (BN_BITS2 - BN_NIST_521_RSHIFT)
1140
0
#define BN_NIST_521_TOP_MASK ((BN_ULONG)BN_MASK2 >> BN_NIST_521_LSHIFT)
1141
1142
int BN_nist_mod_521(BIGNUM *r, const BIGNUM *a, const BIGNUM *field,
1143
    BN_CTX *ctx)
1144
0
{
1145
0
    int top = a->top, i;
1146
0
    BN_ULONG *r_d, *a_d = a->d, t_d[BN_NIST_521_TOP], val, tmp, *res;
1147
0
    static const BIGNUM ossl_bignum_nist_p_521_sqr = {
1148
0
        (BN_ULONG *)_nist_p_521_sqr,
1149
0
        OSSL_NELEM(_nist_p_521_sqr),
1150
0
        OSSL_NELEM(_nist_p_521_sqr),
1151
0
        0, BN_FLG_STATIC_DATA
1152
0
    };
1153
1154
0
    field = &ossl_bignum_nist_p_521; /* just to make sure */
1155
1156
0
    if (BN_is_negative(a) || BN_ucmp(a, &ossl_bignum_nist_p_521_sqr) >= 0)
1157
0
        return BN_nnmod(r, a, field, ctx);
1158
1159
0
    i = BN_ucmp(field, a);
1160
0
    if (i == 0) {
1161
0
        BN_zero(r);
1162
0
        return 1;
1163
0
    } else if (i > 0)
1164
0
        return (r == a) ? 1 : (BN_copy(r, a) != NULL);
1165
1166
0
    if (r != a) {
1167
0
        if (!bn_wexpand(r, BN_NIST_521_TOP))
1168
0
            return 0;
1169
0
        r_d = r->d;
1170
0
        nist_cp_bn(r_d, a_d, BN_NIST_521_TOP);
1171
0
    } else
1172
0
        r_d = a_d;
1173
1174
    /* upper 521 bits, copy ... */
1175
0
    nist_cp_bn_0(t_d, a_d + (BN_NIST_521_TOP - 1),
1176
0
        top - (BN_NIST_521_TOP - 1), BN_NIST_521_TOP);
1177
    /* ... and right shift */
1178
0
    for (val = t_d[0], i = 0; i < BN_NIST_521_TOP - 1; i++) {
1179
#if 0
1180
        /*
1181
         * MSC ARM compiler [version 2013, presumably even earlier,
1182
         * much earlier] miscompiles this code, but not one in
1183
         * #else section. See RT#3541.
1184
         */
1185
        tmp = val >> BN_NIST_521_RSHIFT;
1186
        val = t_d[i + 1];
1187
        t_d[i] = (tmp | val << BN_NIST_521_LSHIFT) & BN_MASK2;
1188
#else
1189
0
        t_d[i] = (val >> BN_NIST_521_RSHIFT | (tmp = t_d[i + 1]) << BN_NIST_521_LSHIFT) & BN_MASK2;
1190
0
        val = tmp;
1191
0
#endif
1192
0
    }
1193
0
    t_d[i] = val >> BN_NIST_521_RSHIFT;
1194
    /* lower 521 bits */
1195
0
    r_d[i] &= BN_NIST_521_TOP_MASK;
1196
1197
0
    bn_add_words(r_d, r_d, t_d, BN_NIST_521_TOP);
1198
0
    res = bn_sub_words(t_d, r_d, _nist_p_521,
1199
0
              BN_NIST_521_TOP)
1200
0
        ? r_d
1201
0
        : t_d;
1202
0
    nist_cp_bn(r_d, res, BN_NIST_521_TOP);
1203
0
    r->top = BN_NIST_521_TOP;
1204
0
    bn_correct_top(r);
1205
1206
0
    return 1;
1207
0
}
1208
1209
int (*BN_nist_mod_func(const BIGNUM *p))(BIGNUM *r, const BIGNUM *a,
1210
    const BIGNUM *field, BN_CTX *ctx)
1211
0
{
1212
0
    if (BN_ucmp(&ossl_bignum_nist_p_192, p) == 0)
1213
0
        return BN_nist_mod_192;
1214
0
    if (BN_ucmp(&ossl_bignum_nist_p_224, p) == 0)
1215
0
        return BN_nist_mod_224;
1216
0
    if (BN_ucmp(&ossl_bignum_nist_p_256, p) == 0)
1217
0
        return BN_nist_mod_256;
1218
0
    if (BN_ucmp(&ossl_bignum_nist_p_384, p) == 0)
1219
0
        return BN_nist_mod_384;
1220
0
    if (BN_ucmp(&ossl_bignum_nist_p_521, p) == 0)
1221
0
        return BN_nist_mod_521;
1222
0
    return 0;
1223
0
}