Coverage Report

Created: 2026-05-30 06:56

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/openssl/crypto/ec/ecp_nistp224.c
Line
Count
Source
1
/*
2
 * Copyright 2010-2025 The OpenSSL Project Authors. All Rights Reserved.
3
 *
4
 * Licensed under the Apache License 2.0 (the "License").  You may not use
5
 * this file except in compliance with the License.  You can obtain a copy
6
 * in the file LICENSE in the source distribution or at
7
 * https://www.openssl.org/source/license.html
8
 */
9
10
/* Copyright 2011 Google Inc.
11
 *
12
 * Licensed under the Apache License, Version 2.0 (the "License");
13
 *
14
 * you may not use this file except in compliance with the License.
15
 * You may obtain a copy of the License at
16
 *
17
 *     http://www.apache.org/licenses/LICENSE-2.0
18
 *
19
 *  Unless required by applicable law or agreed to in writing, software
20
 *  distributed under the License is distributed on an "AS IS" BASIS,
21
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
22
 *  See the License for the specific language governing permissions and
23
 *  limitations under the License.
24
 */
25
26
/*
27
 * ECDSA low level APIs are deprecated for public use, but still ok for
28
 * internal use.
29
 */
30
#include "internal/deprecated.h"
31
32
/*
33
 * A 64-bit implementation of the NIST P-224 elliptic curve point multiplication
34
 *
35
 * Inspired by Daniel J. Bernstein's public domain nistp224 implementation
36
 * and Adam Langley's public domain 64-bit C implementation of curve25519
37
 */
38
39
#include <openssl/opensslconf.h>
40
41
#include <stdint.h>
42
#include <string.h>
43
#include <openssl/err.h>
44
#include "ec_local.h"
45
46
#include "internal/numbers.h"
47
48
#ifndef INT128_MAX
49
#error "Your compiler doesn't appear to support 128-bit integer types"
50
#endif
51
52
/******************************************************************************/
53
/*-
54
 * INTERNAL REPRESENTATION OF FIELD ELEMENTS
55
 *
56
 * Field elements are represented as a_0 + 2^56*a_1 + 2^112*a_2 + 2^168*a_3
57
 * using 64-bit coefficients called 'limbs',
58
 * and sometimes (for multiplication results) as
59
 * b_0 + 2^56*b_1 + 2^112*b_2 + 2^168*b_3 + 2^224*b_4 + 2^280*b_5 + 2^336*b_6
60
 * using 128-bit coefficients called 'widelimbs'.
61
 * A 4-limb representation is an 'felem';
62
 * a 7-widelimb representation is a 'widefelem'.
63
 * Even within felems, bits of adjacent limbs overlap, and we don't always
64
 * reduce the representations: we ensure that inputs to each felem
65
 * multiplication satisfy a_i < 2^60, so outputs satisfy b_i < 4*2^60*2^60,
66
 * and fit into a 128-bit word without overflow. The coefficients are then
67
 * again partially reduced to obtain an felem satisfying a_i < 2^57.
68
 * We only reduce to the unique minimal representation at the end of the
69
 * computation.
70
 */
71
72
typedef uint64_t limb;
73
typedef uint64_t limb_aX __attribute((__aligned__(1)));
74
typedef uint128_t widelimb;
75
76
typedef limb felem[4];
77
typedef widelimb widefelem[7];
78
79
/*
80
 * Field element represented as a byte array. 28*8 = 224 bits is also the
81
 * group order size for the elliptic curve, and we also use this type for
82
 * scalars for point multiplication.
83
 */
84
typedef uint8_t felem_bytearray[28];
85
86
static const felem_bytearray nistp224_curve_params[5] = {
87
    { 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* p */
88
        0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0x00, 0x00, 0x00, 0x00,
89
        0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x01 },
90
    { 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, /* a */
91
        0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFE, 0xFF, 0xFF, 0xFF, 0xFF,
92
        0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFE },
93
    { 0xB4, 0x05, 0x0A, 0x85, 0x0C, 0x04, 0xB3, 0xAB, 0xF5, 0x41, /* b */
94
        0x32, 0x56, 0x50, 0x44, 0xB0, 0xB7, 0xD7, 0xBF, 0xD8, 0xBA,
95
        0x27, 0x0B, 0x39, 0x43, 0x23, 0x55, 0xFF, 0xB4 },
96
    { 0xB7, 0x0E, 0x0C, 0xBD, 0x6B, 0xB4, 0xBF, 0x7F, 0x32, 0x13, /* x */
97
        0x90, 0xB9, 0x4A, 0x03, 0xC1, 0xD3, 0x56, 0xC2, 0x11, 0x22,
98
        0x34, 0x32, 0x80, 0xD6, 0x11, 0x5C, 0x1D, 0x21 },
99
    { 0xbd, 0x37, 0x63, 0x88, 0xb5, 0xf7, 0x23, 0xfb, 0x4c, 0x22, /* y */
100
        0xdf, 0xe6, 0xcd, 0x43, 0x75, 0xa0, 0x5a, 0x07, 0x47, 0x64,
101
        0x44, 0xd5, 0x81, 0x99, 0x85, 0x00, 0x7e, 0x34 }
102
};
103
104
/*-
105
 * Precomputed multiples of the standard generator
106
 * Points are given in coordinates (X, Y, Z) where Z normally is 1
107
 * (0 for the point at infinity).
108
 * For each field element, slice a_0 is word 0, etc.
109
 *
110
 * The table has 2 * 16 elements, starting with the following:
111
 * index | bits    | point
112
 * ------+---------+------------------------------
113
 *     0 | 0 0 0 0 | 0G
114
 *     1 | 0 0 0 1 | 1G
115
 *     2 | 0 0 1 0 | 2^56G
116
 *     3 | 0 0 1 1 | (2^56 + 1)G
117
 *     4 | 0 1 0 0 | 2^112G
118
 *     5 | 0 1 0 1 | (2^112 + 1)G
119
 *     6 | 0 1 1 0 | (2^112 + 2^56)G
120
 *     7 | 0 1 1 1 | (2^112 + 2^56 + 1)G
121
 *     8 | 1 0 0 0 | 2^168G
122
 *     9 | 1 0 0 1 | (2^168 + 1)G
123
 *    10 | 1 0 1 0 | (2^168 + 2^56)G
124
 *    11 | 1 0 1 1 | (2^168 + 2^56 + 1)G
125
 *    12 | 1 1 0 0 | (2^168 + 2^112)G
126
 *    13 | 1 1 0 1 | (2^168 + 2^112 + 1)G
127
 *    14 | 1 1 1 0 | (2^168 + 2^112 + 2^56)G
128
 *    15 | 1 1 1 1 | (2^168 + 2^112 + 2^56 + 1)G
129
 * followed by a copy of this with each element multiplied by 2^28.
130
 *
131
 * The reason for this is so that we can clock bits into four different
132
 * locations when doing simple scalar multiplies against the base point,
133
 * and then another four locations using the second 16 elements.
134
 */
135
static const felem gmul[2][16][3] = {
136
    { { { 0, 0, 0, 0 },
137
          { 0, 0, 0, 0 },
138
          { 0, 0, 0, 0 } },
139
        { { 0x3280d6115c1d21, 0xc1d356c2112234, 0x7f321390b94a03, 0xb70e0cbd6bb4bf },
140
            { 0xd5819985007e34, 0x75a05a07476444, 0xfb4c22dfe6cd43, 0xbd376388b5f723 },
141
            { 1, 0, 0, 0 } },
142
        { { 0xfd9675666ebbe9, 0xbca7664d40ce5e, 0x2242df8d8a2a43, 0x1f49bbb0f99bc5 },
143
            { 0x29e0b892dc9c43, 0xece8608436e662, 0xdc858f185310d0, 0x9812dd4eb8d321 },
144
            { 1, 0, 0, 0 } },
145
        { { 0x6d3e678d5d8eb8, 0x559eed1cb362f1, 0x16e9a3bbce8a3f, 0xeedcccd8c2a748 },
146
            { 0xf19f90ed50266d, 0xabf2b4bf65f9df, 0x313865468fafec, 0x5cb379ba910a17 },
147
            { 1, 0, 0, 0 } },
148
        { { 0x0641966cab26e3, 0x91fb2991fab0a0, 0xefec27a4e13a0b, 0x0499aa8a5f8ebe },
149
            { 0x7510407766af5d, 0x84d929610d5450, 0x81d77aae82f706, 0x6916f6d4338c5b },
150
            { 1, 0, 0, 0 } },
151
        { { 0xea95ac3b1f15c6, 0x086000905e82d4, 0xdd323ae4d1c8b1, 0x932b56be7685a3 },
152
            { 0x9ef93dea25dbbf, 0x41665960f390f0, 0xfdec76dbe2a8a7, 0x523e80f019062a },
153
            { 1, 0, 0, 0 } },
154
        { { 0x822fdd26732c73, 0xa01c83531b5d0f, 0x363f37347c1ba4, 0xc391b45c84725c },
155
            { 0xbbd5e1b2d6ad24, 0xddfbcde19dfaec, 0xc393da7e222a7f, 0x1efb7890ede244 },
156
            { 1, 0, 0, 0 } },
157
        { { 0x4c9e90ca217da1, 0xd11beca79159bb, 0xff8d33c2c98b7c, 0x2610b39409f849 },
158
            { 0x44d1352ac64da0, 0xcdbb7b2c46b4fb, 0x966c079b753c89, 0xfe67e4e820b112 },
159
            { 1, 0, 0, 0 } },
160
        { { 0xe28cae2df5312d, 0xc71b61d16f5c6e, 0x79b7619a3e7c4c, 0x05c73240899b47 },
161
            { 0x9f7f6382c73e3a, 0x18615165c56bda, 0x641fab2116fd56, 0x72855882b08394 },
162
            { 1, 0, 0, 0 } },
163
        { { 0x0469182f161c09, 0x74a98ca8d00fb5, 0xb89da93489a3e0, 0x41c98768fb0c1d },
164
            { 0xe5ea05fb32da81, 0x3dce9ffbca6855, 0x1cfe2d3fbf59e6, 0x0e5e03408738a7 },
165
            { 1, 0, 0, 0 } },
166
        { { 0xdab22b2333e87f, 0x4430137a5dd2f6, 0xe03ab9f738beb8, 0xcb0c5d0dc34f24 },
167
            { 0x764a7df0c8fda5, 0x185ba5c3fa2044, 0x9281d688bcbe50, 0xc40331df893881 },
168
            { 1, 0, 0, 0 } },
169
        { { 0xb89530796f0f60, 0xade92bd26909a3, 0x1a0c83fb4884da, 0x1765bf22a5a984 },
170
            { 0x772a9ee75db09e, 0x23bc6c67cec16f, 0x4c1edba8b14e2f, 0xe2a215d9611369 },
171
            { 1, 0, 0, 0 } },
172
        { { 0x571e509fb5efb3, 0xade88696410552, 0xc8ae85fada74fe, 0x6c7e4be83bbde3 },
173
            { 0xff9f51160f4652, 0xb47ce2495a6539, 0xa2946c53b582f4, 0x286d2db3ee9a60 },
174
            { 1, 0, 0, 0 } },
175
        { { 0x40bbd5081a44af, 0x0995183b13926c, 0xbcefba6f47f6d0, 0x215619e9cc0057 },
176
            { 0x8bc94d3b0df45e, 0xf11c54a3694f6f, 0x8631b93cdfe8b5, 0xe7e3f4b0982db9 },
177
            { 1, 0, 0, 0 } },
178
        { { 0xb17048ab3e1c7b, 0xac38f36ff8a1d8, 0x1c29819435d2c6, 0xc813132f4c07e9 },
179
            { 0x2891425503b11f, 0x08781030579fea, 0xf5426ba5cc9674, 0x1e28ebf18562bc },
180
            { 1, 0, 0, 0 } },
181
        { { 0x9f31997cc864eb, 0x06cd91d28b5e4c, 0xff17036691a973, 0xf1aef351497c58 },
182
            { 0xdd1f2d600564ff, 0xdead073b1402db, 0x74a684435bd693, 0xeea7471f962558 },
183
            { 1, 0, 0, 0 } } },
184
    { { { 0, 0, 0, 0 },
185
          { 0, 0, 0, 0 },
186
          { 0, 0, 0, 0 } },
187
        { { 0x9665266dddf554, 0x9613d78b60ef2d, 0xce27a34cdba417, 0xd35ab74d6afc31 },
188
            { 0x85ccdd22deb15e, 0x2137e5783a6aab, 0xa141cffd8c93c6, 0x355a1830e90f2d },
189
            { 1, 0, 0, 0 } },
190
        { { 0x1a494eadaade65, 0xd6da4da77fe53c, 0xe7992996abec86, 0x65c3553c6090e3 },
191
            { 0xfa610b1fb09346, 0xf1c6540b8a4aaf, 0xc51a13ccd3cbab, 0x02995b1b18c28a },
192
            { 1, 0, 0, 0 } },
193
        { { 0x7874568e7295ef, 0x86b419fbe38d04, 0xdc0690a7550d9a, 0xd3966a44beac33 },
194
            { 0x2b7280ec29132f, 0xbeaa3b6a032df3, 0xdc7dd88ae41200, 0xd25e2513e3a100 },
195
            { 1, 0, 0, 0 } },
196
        { { 0x924857eb2efafd, 0xac2bce41223190, 0x8edaa1445553fc, 0x825800fd3562d5 },
197
            { 0x8d79148ea96621, 0x23a01c3dd9ed8d, 0xaf8b219f9416b5, 0xd8db0cc277daea },
198
            { 1, 0, 0, 0 } },
199
        { { 0x76a9c3b1a700f0, 0xe9acd29bc7e691, 0x69212d1a6b0327, 0x6322e97fe154be },
200
            { 0x469fc5465d62aa, 0x8d41ed18883b05, 0x1f8eae66c52b88, 0xe4fcbe9325be51 },
201
            { 1, 0, 0, 0 } },
202
        { { 0x825fdf583cac16, 0x020b857c7b023a, 0x683c17744b0165, 0x14ffd0a2daf2f1 },
203
            { 0x323b36184218f9, 0x4944ec4e3b47d4, 0xc15b3080841acf, 0x0bced4b01a28bb },
204
            { 1, 0, 0, 0 } },
205
        { { 0x92ac22230df5c4, 0x52f33b4063eda8, 0xcb3f19870c0c93, 0x40064f2ba65233 },
206
            { 0xfe16f0924f8992, 0x012da25af5b517, 0x1a57bb24f723a6, 0x06f8bc76760def },
207
            { 1, 0, 0, 0 } },
208
        { { 0x4a7084f7817cb9, 0xbcab0738ee9a78, 0x3ec11e11d9c326, 0xdc0fe90e0f1aae },
209
            { 0xcf639ea5f98390, 0x5c350aa22ffb74, 0x9afae98a4047b7, 0x956ec2d617fc45 },
210
            { 1, 0, 0, 0 } },
211
        { { 0x4306d648c1be6a, 0x9247cd8bc9a462, 0xf5595e377d2f2e, 0xbd1c3caff1a52e },
212
            { 0x045e14472409d0, 0x29f3e17078f773, 0x745a602b2d4f7d, 0x191837685cdfbb },
213
            { 1, 0, 0, 0 } },
214
        { { 0x5b6ee254a8cb79, 0x4953433f5e7026, 0xe21faeb1d1def4, 0xc4c225785c09de },
215
            { 0x307ce7bba1e518, 0x31b125b1036db8, 0x47e91868839e8f, 0xc765866e33b9f3 },
216
            { 1, 0, 0, 0 } },
217
        { { 0x3bfece24f96906, 0x4794da641e5093, 0xde5df64f95db26, 0x297ecd89714b05 },
218
            { 0x701bd3ebb2c3aa, 0x7073b4f53cb1d5, 0x13c5665658af16, 0x9895089d66fe58 },
219
            { 1, 0, 0, 0 } },
220
        { { 0x0fef05f78c4790, 0x2d773633b05d2e, 0x94229c3a951c94, 0xbbbd70df4911bb },
221
            { 0xb2c6963d2c1168, 0x105f47a72b0d73, 0x9fdf6111614080, 0x7b7e94b39e67b0 },
222
            { 1, 0, 0, 0 } },
223
        { { 0xad1a7d6efbe2b3, 0xf012482c0da69d, 0x6b3bdf12438345, 0x40d7558d7aa4d9 },
224
            { 0x8a09fffb5c6d3d, 0x9a356e5d9ffd38, 0x5973f15f4f9b1c, 0xdcd5f59f63c3ea },
225
            { 1, 0, 0, 0 } },
226
        { { 0xacf39f4c5ca7ab, 0x4c8071cc5fd737, 0xc64e3602cd1184, 0x0acd4644c9abba },
227
            { 0x6c011a36d8bf6e, 0xfecd87ba24e32a, 0x19f6f56574fad8, 0x050b204ced9405 },
228
            { 1, 0, 0, 0 } },
229
        { { 0xed4f1cae7d9a96, 0x5ceef7ad94c40a, 0x778e4a3bf3ef9b, 0x7405783dc3b55e },
230
            { 0x32477c61b6e8c6, 0xb46a97570f018b, 0x91176d0a7e95d1, 0x3df90fbc4c7d0e },
231
            { 1, 0, 0, 0 } } }
232
};
233
234
/* Precomputation for the group generator. */
235
struct nistp224_pre_comp_st {
236
    felem g_pre_comp[2][16][3];
237
    CRYPTO_REF_COUNT references;
238
};
239
240
const EC_METHOD *EC_GFp_nistp224_method(void)
241
0
{
242
0
    static const EC_METHOD ret = {
243
0
        EC_FLAGS_DEFAULT_OCT,
244
0
        NID_X9_62_prime_field,
245
0
        ossl_ec_GFp_nistp224_group_init,
246
0
        ossl_ec_GFp_simple_group_finish,
247
0
        ossl_ec_GFp_simple_group_clear_finish,
248
0
        ossl_ec_GFp_nist_group_copy,
249
0
        ossl_ec_GFp_nistp224_group_set_curve,
250
0
        ossl_ec_GFp_simple_group_get_curve,
251
0
        ossl_ec_GFp_simple_group_get_degree,
252
0
        ossl_ec_group_simple_order_bits,
253
0
        ossl_ec_GFp_simple_group_check_discriminant,
254
0
        ossl_ec_GFp_simple_point_init,
255
0
        ossl_ec_GFp_simple_point_finish,
256
0
        ossl_ec_GFp_simple_point_clear_finish,
257
0
        ossl_ec_GFp_simple_point_copy,
258
0
        ossl_ec_GFp_simple_point_set_to_infinity,
259
0
        ossl_ec_GFp_simple_point_set_affine_coordinates,
260
0
        ossl_ec_GFp_nistp224_point_get_affine_coordinates,
261
0
        0 /* point_set_compressed_coordinates */,
262
0
        0 /* point2oct */,
263
0
        0 /* oct2point */,
264
0
        ossl_ec_GFp_simple_add,
265
0
        ossl_ec_GFp_simple_dbl,
266
0
        ossl_ec_GFp_simple_invert,
267
0
        ossl_ec_GFp_simple_is_at_infinity,
268
0
        ossl_ec_GFp_simple_is_on_curve,
269
0
        ossl_ec_GFp_simple_cmp,
270
0
        ossl_ec_GFp_simple_make_affine,
271
0
        ossl_ec_GFp_simple_points_make_affine,
272
0
        ossl_ec_GFp_nistp224_points_mul,
273
0
        ossl_ec_GFp_nistp224_precompute_mult,
274
0
        ossl_ec_GFp_nistp224_have_precompute_mult,
275
0
        ossl_ec_GFp_nist_field_mul,
276
0
        ossl_ec_GFp_nist_field_sqr,
277
0
        0 /* field_div */,
278
0
        ossl_ec_GFp_simple_field_inv,
279
0
        0 /* field_encode */,
280
0
        0 /* field_decode */,
281
0
        0, /* field_set_to_one */
282
0
        ossl_ec_key_simple_priv2oct,
283
0
        ossl_ec_key_simple_oct2priv,
284
0
        0, /* set private */
285
0
        ossl_ec_key_simple_generate_key,
286
0
        ossl_ec_key_simple_check_key,
287
0
        ossl_ec_key_simple_generate_public_key,
288
0
        0, /* keycopy */
289
0
        0, /* keyfinish */
290
0
        ossl_ecdh_simple_compute_key,
291
0
        ossl_ecdsa_simple_sign_setup,
292
0
        ossl_ecdsa_simple_sign_sig,
293
0
        ossl_ecdsa_simple_verify_sig,
294
0
        0, /* field_inverse_mod_ord */
295
0
        0, /* blind_coordinates */
296
0
        0, /* ladder_pre */
297
0
        0, /* ladder_step */
298
0
        0 /* ladder_post */
299
0
    };
300
301
0
    return &ret;
302
0
}
303
304
/*
305
 * Helper functions to convert field elements to/from internal representation
306
 */
307
static void bin28_to_felem(felem out, const uint8_t in[28])
308
0
{
309
0
    out[0] = *((const limb *)(in)) & 0x00ffffffffffffff;
310
0
    out[1] = (*((const limb_aX *)(in + 7))) & 0x00ffffffffffffff;
311
0
    out[2] = (*((const limb_aX *)(in + 14))) & 0x00ffffffffffffff;
312
0
    out[3] = (*((const limb_aX *)(in + 20))) >> 8;
313
0
}
314
315
static void felem_to_bin28(uint8_t out[28], const felem in)
316
0
{
317
0
    unsigned i;
318
0
    for (i = 0; i < 7; ++i) {
319
0
        out[i] = in[0] >> (8 * i);
320
0
        out[i + 7] = in[1] >> (8 * i);
321
0
        out[i + 14] = in[2] >> (8 * i);
322
0
        out[i + 21] = in[3] >> (8 * i);
323
0
    }
324
0
}
325
326
/* From OpenSSL BIGNUM to internal representation */
327
static int BN_to_felem(felem out, const BIGNUM *bn)
328
0
{
329
0
    felem_bytearray b_out;
330
0
    int num_bytes;
331
332
0
    if (BN_is_negative(bn)) {
333
0
        ERR_raise(ERR_LIB_EC, EC_R_BIGNUM_OUT_OF_RANGE);
334
0
        return 0;
335
0
    }
336
0
    num_bytes = BN_bn2lebinpad(bn, b_out, sizeof(b_out));
337
0
    if (num_bytes < 0) {
338
0
        ERR_raise(ERR_LIB_EC, EC_R_BIGNUM_OUT_OF_RANGE);
339
0
        return 0;
340
0
    }
341
0
    bin28_to_felem(out, b_out);
342
0
    return 1;
343
0
}
344
345
/* From internal representation to OpenSSL BIGNUM */
346
static BIGNUM *felem_to_BN(BIGNUM *out, const felem in)
347
0
{
348
0
    felem_bytearray b_out;
349
0
    felem_to_bin28(b_out, in);
350
0
    return BN_lebin2bn(b_out, sizeof(b_out), out);
351
0
}
352
353
/******************************************************************************/
354
/*-
355
 *                              FIELD OPERATIONS
356
 *
357
 * Field operations, using the internal representation of field elements.
358
 * NB! These operations are specific to our point multiplication and cannot be
359
 * expected to be correct in general - e.g., multiplication with a large scalar
360
 * will cause an overflow.
361
 *
362
 */
363
364
static void felem_one(felem out)
365
0
{
366
0
    out[0] = 1;
367
0
    out[1] = 0;
368
0
    out[2] = 0;
369
0
    out[3] = 0;
370
0
}
371
372
static void felem_assign(felem out, const felem in)
373
0
{
374
0
    out[0] = in[0];
375
0
    out[1] = in[1];
376
0
    out[2] = in[2];
377
0
    out[3] = in[3];
378
0
}
379
380
/* Sum two field elements: out += in */
381
static void felem_sum(felem out, const felem in)
382
0
{
383
0
    out[0] += in[0];
384
0
    out[1] += in[1];
385
0
    out[2] += in[2];
386
0
    out[3] += in[3];
387
0
}
388
389
/* Subtract field elements: out -= in */
390
/* Assumes in[i] < 2^57 */
391
static void felem_diff(felem out, const felem in)
392
0
{
393
0
    static const limb two58p2 = (((limb)1) << 58) + (((limb)1) << 2);
394
0
    static const limb two58m2 = (((limb)1) << 58) - (((limb)1) << 2);
395
0
    static const limb two58m42m2 = (((limb)1) << 58) - (((limb)1) << 42) - (((limb)1) << 2);
396
397
    /* Add 0 mod 2^224-2^96+1 to ensure out > in */
398
0
    out[0] += two58p2;
399
0
    out[1] += two58m42m2;
400
0
    out[2] += two58m2;
401
0
    out[3] += two58m2;
402
403
0
    out[0] -= in[0];
404
0
    out[1] -= in[1];
405
0
    out[2] -= in[2];
406
0
    out[3] -= in[3];
407
0
}
408
409
/* Subtract in unreduced 128-bit mode: out -= in */
410
/* Assumes in[i] < 2^119 */
411
static void widefelem_diff(widefelem out, const widefelem in)
412
0
{
413
0
    static const widelimb two120 = ((widelimb)1) << 120;
414
0
    static const widelimb two120m64 = (((widelimb)1) << 120) - (((widelimb)1) << 64);
415
0
    static const widelimb two120m104m64 = (((widelimb)1) << 120) - (((widelimb)1) << 104) - (((widelimb)1) << 64);
416
417
    /* Add 0 mod 2^224-2^96+1 to ensure out > in */
418
0
    out[0] += two120;
419
0
    out[1] += two120m64;
420
0
    out[2] += two120m64;
421
0
    out[3] += two120;
422
0
    out[4] += two120m104m64;
423
0
    out[5] += two120m64;
424
0
    out[6] += two120m64;
425
426
0
    out[0] -= in[0];
427
0
    out[1] -= in[1];
428
0
    out[2] -= in[2];
429
0
    out[3] -= in[3];
430
0
    out[4] -= in[4];
431
0
    out[5] -= in[5];
432
0
    out[6] -= in[6];
433
0
}
434
435
/* Subtract in mixed mode: out128 -= in64 */
436
/* in[i] < 2^63 */
437
static void felem_diff_128_64(widefelem out, const felem in)
438
0
{
439
0
    static const widelimb two64p8 = (((widelimb)1) << 64) + (((widelimb)1) << 8);
440
0
    static const widelimb two64m8 = (((widelimb)1) << 64) - (((widelimb)1) << 8);
441
0
    static const widelimb two64m48m8 = (((widelimb)1) << 64) - (((widelimb)1) << 48) - (((widelimb)1) << 8);
442
443
    /* Add 0 mod 2^224-2^96+1 to ensure out > in */
444
0
    out[0] += two64p8;
445
0
    out[1] += two64m48m8;
446
0
    out[2] += two64m8;
447
0
    out[3] += two64m8;
448
449
0
    out[0] -= in[0];
450
0
    out[1] -= in[1];
451
0
    out[2] -= in[2];
452
0
    out[3] -= in[3];
453
0
}
454
455
/*
456
 * Multiply a field element by a scalar: out = out * scalar The scalars we
457
 * actually use are small, so results fit without overflow
458
 */
459
static void felem_scalar(felem out, const limb scalar)
460
0
{
461
0
    out[0] *= scalar;
462
0
    out[1] *= scalar;
463
0
    out[2] *= scalar;
464
0
    out[3] *= scalar;
465
0
}
466
467
/*
468
 * Multiply an unreduced field element by a scalar: out = out * scalar The
469
 * scalars we actually use are small, so results fit without overflow
470
 */
471
static void widefelem_scalar(widefelem out, const widelimb scalar)
472
0
{
473
0
    out[0] *= scalar;
474
0
    out[1] *= scalar;
475
0
    out[2] *= scalar;
476
0
    out[3] *= scalar;
477
0
    out[4] *= scalar;
478
0
    out[5] *= scalar;
479
0
    out[6] *= scalar;
480
0
}
481
482
/* Square a field element: out = in^2 */
483
static void felem_square(widefelem out, const felem in)
484
0
{
485
0
    limb tmp0, tmp1, tmp2;
486
0
    tmp0 = 2 * in[0];
487
0
    tmp1 = 2 * in[1];
488
0
    tmp2 = 2 * in[2];
489
0
    out[0] = ((widelimb)in[0]) * in[0];
490
0
    out[1] = ((widelimb)in[0]) * tmp1;
491
0
    out[2] = ((widelimb)in[0]) * tmp2 + ((widelimb)in[1]) * in[1];
492
0
    out[3] = ((widelimb)in[3]) * tmp0 + ((widelimb)in[1]) * tmp2;
493
0
    out[4] = ((widelimb)in[3]) * tmp1 + ((widelimb)in[2]) * in[2];
494
0
    out[5] = ((widelimb)in[3]) * tmp2;
495
0
    out[6] = ((widelimb)in[3]) * in[3];
496
0
}
497
498
/* Multiply two field elements: out = in1 * in2 */
499
static void felem_mul(widefelem out, const felem in1, const felem in2)
500
0
{
501
0
    out[0] = ((widelimb)in1[0]) * in2[0];
502
0
    out[1] = ((widelimb)in1[0]) * in2[1] + ((widelimb)in1[1]) * in2[0];
503
0
    out[2] = ((widelimb)in1[0]) * in2[2] + ((widelimb)in1[1]) * in2[1] + ((widelimb)in1[2]) * in2[0];
504
0
    out[3] = ((widelimb)in1[0]) * in2[3] + ((widelimb)in1[1]) * in2[2] + ((widelimb)in1[2]) * in2[1] + ((widelimb)in1[3]) * in2[0];
505
0
    out[4] = ((widelimb)in1[1]) * in2[3] + ((widelimb)in1[2]) * in2[2] + ((widelimb)in1[3]) * in2[1];
506
0
    out[5] = ((widelimb)in1[2]) * in2[3] + ((widelimb)in1[3]) * in2[2];
507
0
    out[6] = ((widelimb)in1[3]) * in2[3];
508
0
}
509
510
/*-
511
 * Reduce seven 128-bit coefficients to four 64-bit coefficients.
512
 * Requires in[i] < 2^126,
513
 * ensures out[0] < 2^56, out[1] < 2^56, out[2] < 2^56, out[3] <= 2^56 + 2^16 */
514
static void felem_reduce(felem out, const widefelem in)
515
0
{
516
0
    static const widelimb two127p15 = (((widelimb)1) << 127) + (((widelimb)1) << 15);
517
0
    static const widelimb two127m71 = (((widelimb)1) << 127) - (((widelimb)1) << 71);
518
0
    static const widelimb two127m71m55 = (((widelimb)1) << 127) - (((widelimb)1) << 71) - (((widelimb)1) << 55);
519
0
    widelimb output[5];
520
521
    /* Add 0 mod 2^224-2^96+1 to ensure all differences are positive */
522
0
    output[0] = in[0] + two127p15;
523
0
    output[1] = in[1] + two127m71m55;
524
0
    output[2] = in[2] + two127m71;
525
0
    output[3] = in[3];
526
0
    output[4] = in[4];
527
528
    /* Eliminate in[4], in[5], in[6] */
529
0
    output[4] += in[6] >> 16;
530
0
    output[3] += (in[6] & 0xffff) << 40;
531
0
    output[2] -= in[6];
532
533
0
    output[3] += in[5] >> 16;
534
0
    output[2] += (in[5] & 0xffff) << 40;
535
0
    output[1] -= in[5];
536
537
0
    output[2] += output[4] >> 16;
538
0
    output[1] += (output[4] & 0xffff) << 40;
539
0
    output[0] -= output[4];
540
541
    /* Carry 2 -> 3 -> 4 */
542
0
    output[3] += output[2] >> 56;
543
0
    output[2] &= 0x00ffffffffffffff;
544
545
0
    output[4] = output[3] >> 56;
546
0
    output[3] &= 0x00ffffffffffffff;
547
548
    /* Now output[2] < 2^56, output[3] < 2^56, output[4] < 2^72 */
549
550
    /* Eliminate output[4] */
551
0
    output[2] += output[4] >> 16;
552
    /* output[2] < 2^56 + 2^56 = 2^57 */
553
0
    output[1] += (output[4] & 0xffff) << 40;
554
0
    output[0] -= output[4];
555
556
    /* Carry 0 -> 1 -> 2 -> 3 */
557
0
    output[1] += output[0] >> 56;
558
0
    out[0] = output[0] & 0x00ffffffffffffff;
559
560
0
    output[2] += output[1] >> 56;
561
    /* output[2] < 2^57 + 2^72 */
562
0
    out[1] = output[1] & 0x00ffffffffffffff;
563
0
    output[3] += output[2] >> 56;
564
    /* output[3] <= 2^56 + 2^16 */
565
0
    out[2] = output[2] & 0x00ffffffffffffff;
566
567
    /*-
568
     * out[0] < 2^56, out[1] < 2^56, out[2] < 2^56,
569
     * out[3] <= 2^56 + 2^16 (due to final carry),
570
     * so out < 2*p
571
     */
572
0
    out[3] = output[3];
573
0
}
574
575
static void felem_square_reduce(felem out, const felem in)
576
0
{
577
0
    widefelem tmp;
578
0
    felem_square(tmp, in);
579
0
    felem_reduce(out, tmp);
580
0
}
581
582
static void felem_mul_reduce(felem out, const felem in1, const felem in2)
583
0
{
584
0
    widefelem tmp;
585
0
    felem_mul(tmp, in1, in2);
586
0
    felem_reduce(out, tmp);
587
0
}
588
589
/*
590
 * Reduce to unique minimal representation. Requires 0 <= in < 2*p (always
591
 * call felem_reduce first)
592
 */
593
static void felem_contract(felem out, const felem in)
594
0
{
595
0
    static const int64_t two56 = ((limb)1) << 56;
596
    /* 0 <= in < 2*p, p = 2^224 - 2^96 + 1 */
597
    /* if in > p , reduce in = in - 2^224 + 2^96 - 1 */
598
0
    int64_t tmp[4], a;
599
0
    tmp[0] = in[0];
600
0
    tmp[1] = in[1];
601
0
    tmp[2] = in[2];
602
0
    tmp[3] = in[3];
603
    /* Case 1: a = 1 iff in >= 2^224 */
604
0
    a = (in[3] >> 56);
605
0
    tmp[0] -= a;
606
0
    tmp[1] += a << 40;
607
0
    tmp[3] &= 0x00ffffffffffffff;
608
    /*
609
     * Case 2: a = 0 iff p <= in < 2^224, i.e., the high 128 bits are all 1
610
     * and the lower part is non-zero
611
     */
612
0
    a = ((in[3] & in[2] & (in[1] | 0x000000ffffffffff)) + 1) | (((int64_t)(in[0] + (in[1] & 0x000000ffffffffff)) - 1) >> 63);
613
0
    a &= 0x00ffffffffffffff;
614
    /* turn a into an all-one mask (if a = 0) or an all-zero mask */
615
0
    a = (a - 1) >> 63;
616
    /* subtract 2^224 - 2^96 + 1 if a is all-one */
617
0
    tmp[3] &= a ^ 0xffffffffffffffff;
618
0
    tmp[2] &= a ^ 0xffffffffffffffff;
619
0
    tmp[1] &= (a ^ 0xffffffffffffffff) | 0x000000ffffffffff;
620
0
    tmp[0] -= 1 & a;
621
622
    /*
623
     * eliminate negative coefficients: if tmp[0] is negative, tmp[1] must be
624
     * non-zero, so we only need one step
625
     */
626
0
    a = tmp[0] >> 63;
627
0
    tmp[0] += two56 & a;
628
0
    tmp[1] -= 1 & a;
629
630
    /* carry 1 -> 2 -> 3 */
631
0
    tmp[2] += tmp[1] >> 56;
632
0
    tmp[1] &= 0x00ffffffffffffff;
633
634
0
    tmp[3] += tmp[2] >> 56;
635
0
    tmp[2] &= 0x00ffffffffffffff;
636
637
    /* Now 0 <= out < p */
638
0
    out[0] = tmp[0];
639
0
    out[1] = tmp[1];
640
0
    out[2] = tmp[2];
641
0
    out[3] = tmp[3];
642
0
}
643
644
/*
645
 * Get negative value: out = -in
646
 * Requires in[i] < 2^63,
647
 * ensures out[0] < 2^56, out[1] < 2^56, out[2] < 2^56, out[3] <= 2^56 + 2^16
648
 */
649
static void felem_neg(felem out, const felem in)
650
0
{
651
0
    widefelem tmp;
652
653
0
    memset(tmp, 0, sizeof(tmp));
654
0
    felem_diff_128_64(tmp, in);
655
0
    felem_reduce(out, tmp);
656
0
}
657
658
/*
659
 * Zero-check: returns 1 if input is 0, and 0 otherwise. We know that field
660
 * elements are reduced to in < 2^225, so we only need to check three cases:
661
 * 0, 2^224 - 2^96 + 1, and 2^225 - 2^97 + 2
662
 */
663
static limb felem_is_zero(const felem in)
664
0
{
665
0
    limb zero, two224m96p1, two225m97p2;
666
667
0
    zero = in[0] | in[1] | in[2] | in[3];
668
0
    zero = (((int64_t)(zero)-1) >> 63) & 1;
669
0
    two224m96p1 = (in[0] ^ 1) | (in[1] ^ 0x00ffff0000000000)
670
0
        | (in[2] ^ 0x00ffffffffffffff) | (in[3] ^ 0x00ffffffffffffff);
671
0
    two224m96p1 = (((int64_t)(two224m96p1)-1) >> 63) & 1;
672
0
    two225m97p2 = (in[0] ^ 2) | (in[1] ^ 0x00fffe0000000000)
673
0
        | (in[2] ^ 0x00ffffffffffffff) | (in[3] ^ 0x01ffffffffffffff);
674
0
    two225m97p2 = (((int64_t)(two225m97p2)-1) >> 63) & 1;
675
0
    return (zero | two224m96p1 | two225m97p2);
676
0
}
677
678
static int felem_is_zero_int(const void *in)
679
0
{
680
0
    return (int)(felem_is_zero(in) & ((limb)1));
681
0
}
682
683
/* Invert a field element */
684
/* Computation chain copied from djb's code */
685
static void felem_inv(felem out, const felem in)
686
0
{
687
0
    felem ftmp, ftmp2, ftmp3, ftmp4;
688
0
    widefelem tmp;
689
0
    unsigned i;
690
691
0
    felem_square(tmp, in);
692
0
    felem_reduce(ftmp, tmp); /* 2 */
693
0
    felem_mul(tmp, in, ftmp);
694
0
    felem_reduce(ftmp, tmp); /* 2^2 - 1 */
695
0
    felem_square(tmp, ftmp);
696
0
    felem_reduce(ftmp, tmp); /* 2^3 - 2 */
697
0
    felem_mul(tmp, in, ftmp);
698
0
    felem_reduce(ftmp, tmp); /* 2^3 - 1 */
699
0
    felem_square(tmp, ftmp);
700
0
    felem_reduce(ftmp2, tmp); /* 2^4 - 2 */
701
0
    felem_square(tmp, ftmp2);
702
0
    felem_reduce(ftmp2, tmp); /* 2^5 - 4 */
703
0
    felem_square(tmp, ftmp2);
704
0
    felem_reduce(ftmp2, tmp); /* 2^6 - 8 */
705
0
    felem_mul(tmp, ftmp2, ftmp);
706
0
    felem_reduce(ftmp, tmp); /* 2^6 - 1 */
707
0
    felem_square(tmp, ftmp);
708
0
    felem_reduce(ftmp2, tmp); /* 2^7 - 2 */
709
0
    for (i = 0; i < 5; ++i) { /* 2^12 - 2^6 */
710
0
        felem_square(tmp, ftmp2);
711
0
        felem_reduce(ftmp2, tmp);
712
0
    }
713
0
    felem_mul(tmp, ftmp2, ftmp);
714
0
    felem_reduce(ftmp2, tmp); /* 2^12 - 1 */
715
0
    felem_square(tmp, ftmp2);
716
0
    felem_reduce(ftmp3, tmp); /* 2^13 - 2 */
717
0
    for (i = 0; i < 11; ++i) { /* 2^24 - 2^12 */
718
0
        felem_square(tmp, ftmp3);
719
0
        felem_reduce(ftmp3, tmp);
720
0
    }
721
0
    felem_mul(tmp, ftmp3, ftmp2);
722
0
    felem_reduce(ftmp2, tmp); /* 2^24 - 1 */
723
0
    felem_square(tmp, ftmp2);
724
0
    felem_reduce(ftmp3, tmp); /* 2^25 - 2 */
725
0
    for (i = 0; i < 23; ++i) { /* 2^48 - 2^24 */
726
0
        felem_square(tmp, ftmp3);
727
0
        felem_reduce(ftmp3, tmp);
728
0
    }
729
0
    felem_mul(tmp, ftmp3, ftmp2);
730
0
    felem_reduce(ftmp3, tmp); /* 2^48 - 1 */
731
0
    felem_square(tmp, ftmp3);
732
0
    felem_reduce(ftmp4, tmp); /* 2^49 - 2 */
733
0
    for (i = 0; i < 47; ++i) { /* 2^96 - 2^48 */
734
0
        felem_square(tmp, ftmp4);
735
0
        felem_reduce(ftmp4, tmp);
736
0
    }
737
0
    felem_mul(tmp, ftmp3, ftmp4);
738
0
    felem_reduce(ftmp3, tmp); /* 2^96 - 1 */
739
0
    felem_square(tmp, ftmp3);
740
0
    felem_reduce(ftmp4, tmp); /* 2^97 - 2 */
741
0
    for (i = 0; i < 23; ++i) { /* 2^120 - 2^24 */
742
0
        felem_square(tmp, ftmp4);
743
0
        felem_reduce(ftmp4, tmp);
744
0
    }
745
0
    felem_mul(tmp, ftmp2, ftmp4);
746
0
    felem_reduce(ftmp2, tmp); /* 2^120 - 1 */
747
0
    for (i = 0; i < 6; ++i) { /* 2^126 - 2^6 */
748
0
        felem_square(tmp, ftmp2);
749
0
        felem_reduce(ftmp2, tmp);
750
0
    }
751
0
    felem_mul(tmp, ftmp2, ftmp);
752
0
    felem_reduce(ftmp, tmp); /* 2^126 - 1 */
753
0
    felem_square(tmp, ftmp);
754
0
    felem_reduce(ftmp, tmp); /* 2^127 - 2 */
755
0
    felem_mul(tmp, ftmp, in);
756
0
    felem_reduce(ftmp, tmp); /* 2^127 - 1 */
757
0
    for (i = 0; i < 97; ++i) { /* 2^224 - 2^97 */
758
0
        felem_square(tmp, ftmp);
759
0
        felem_reduce(ftmp, tmp);
760
0
    }
761
0
    felem_mul(tmp, ftmp, ftmp3);
762
0
    felem_reduce(out, tmp); /* 2^224 - 2^96 - 1 */
763
0
}
764
765
/*
766
 * Copy in constant time: if icopy == 1, copy in to out, if icopy == 0, copy
767
 * out to itself.
768
 */
769
static void copy_conditional(felem out, const felem in, limb icopy)
770
0
{
771
0
    unsigned i;
772
    /*
773
     * icopy is a (64-bit) 0 or 1, so copy is either all-zero or all-one
774
     */
775
0
    const limb copy = -icopy;
776
0
    for (i = 0; i < 4; ++i) {
777
0
        const limb tmp = copy & (in[i] ^ out[i]);
778
0
        out[i] ^= tmp;
779
0
    }
780
0
}
781
782
/******************************************************************************/
783
/*-
784
 *                       ELLIPTIC CURVE POINT OPERATIONS
785
 *
786
 * Points are represented in Jacobian projective coordinates:
787
 * (X, Y, Z) corresponds to the affine point (X/Z^2, Y/Z^3),
788
 * or to the point at infinity if Z == 0.
789
 *
790
 */
791
792
/*-
793
 * Double an elliptic curve point:
794
 * (X', Y', Z') = 2 * (X, Y, Z), where
795
 * X' = (3 * (X - Z^2) * (X + Z^2))^2 - 8 * X * Y^2
796
 * Y' = 3 * (X - Z^2) * (X + Z^2) * (4 * X * Y^2 - X') - 8 * Y^4
797
 * Z' = (Y + Z)^2 - Y^2 - Z^2 = 2 * Y * Z
798
 * Outputs can equal corresponding inputs, i.e., x_out == x_in is allowed,
799
 * while x_out == y_in is not (maybe this works, but it's not tested).
800
 */
801
static void
802
point_double(felem x_out, felem y_out, felem z_out,
803
    const felem x_in, const felem y_in, const felem z_in)
804
0
{
805
0
    widefelem tmp, tmp2;
806
0
    felem delta, gamma, beta, alpha, ftmp, ftmp2;
807
808
0
    felem_assign(ftmp, x_in);
809
0
    felem_assign(ftmp2, x_in);
810
811
    /* delta = z^2 */
812
0
    felem_square(tmp, z_in);
813
0
    felem_reduce(delta, tmp);
814
815
    /* gamma = y^2 */
816
0
    felem_square(tmp, y_in);
817
0
    felem_reduce(gamma, tmp);
818
819
    /* beta = x*gamma */
820
0
    felem_mul(tmp, x_in, gamma);
821
0
    felem_reduce(beta, tmp);
822
823
    /* alpha = 3*(x-delta)*(x+delta) */
824
0
    felem_diff(ftmp, delta);
825
    /* ftmp[i] < 2^57 + 2^58 + 2 < 2^59 */
826
0
    felem_sum(ftmp2, delta);
827
    /* ftmp2[i] < 2^57 + 2^57 = 2^58 */
828
0
    felem_scalar(ftmp2, 3);
829
    /* ftmp2[i] < 3 * 2^58 < 2^60 */
830
0
    felem_mul(tmp, ftmp, ftmp2);
831
    /* tmp[i] < 2^60 * 2^59 * 4 = 2^121 */
832
0
    felem_reduce(alpha, tmp);
833
834
    /* x' = alpha^2 - 8*beta */
835
0
    felem_square(tmp, alpha);
836
    /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
837
0
    felem_assign(ftmp, beta);
838
0
    felem_scalar(ftmp, 8);
839
    /* ftmp[i] < 8 * 2^57 = 2^60 */
840
0
    felem_diff_128_64(tmp, ftmp);
841
    /* tmp[i] < 2^116 + 2^64 + 8 < 2^117 */
842
0
    felem_reduce(x_out, tmp);
843
844
    /* z' = (y + z)^2 - gamma - delta */
845
0
    felem_sum(delta, gamma);
846
    /* delta[i] < 2^57 + 2^57 = 2^58 */
847
0
    felem_assign(ftmp, y_in);
848
0
    felem_sum(ftmp, z_in);
849
    /* ftmp[i] < 2^57 + 2^57 = 2^58 */
850
0
    felem_square(tmp, ftmp);
851
    /* tmp[i] < 4 * 2^58 * 2^58 = 2^118 */
852
0
    felem_diff_128_64(tmp, delta);
853
    /* tmp[i] < 2^118 + 2^64 + 8 < 2^119 */
854
0
    felem_reduce(z_out, tmp);
855
856
    /* y' = alpha*(4*beta - x') - 8*gamma^2 */
857
0
    felem_scalar(beta, 4);
858
    /* beta[i] < 4 * 2^57 = 2^59 */
859
0
    felem_diff(beta, x_out);
860
    /* beta[i] < 2^59 + 2^58 + 2 < 2^60 */
861
0
    felem_mul(tmp, alpha, beta);
862
    /* tmp[i] < 4 * 2^57 * 2^60 = 2^119 */
863
0
    felem_square(tmp2, gamma);
864
    /* tmp2[i] < 4 * 2^57 * 2^57 = 2^116 */
865
0
    widefelem_scalar(tmp2, 8);
866
    /* tmp2[i] < 8 * 2^116 = 2^119 */
867
0
    widefelem_diff(tmp, tmp2);
868
    /* tmp[i] < 2^119 + 2^120 < 2^121 */
869
0
    felem_reduce(y_out, tmp);
870
0
}
871
872
/*-
873
 * Add two elliptic curve points:
874
 * (X_1, Y_1, Z_1) + (X_2, Y_2, Z_2) = (X_3, Y_3, Z_3), where
875
 * X_3 = (Z_1^3 * Y_2 - Z_2^3 * Y_1)^2 - (Z_1^2 * X_2 - Z_2^2 * X_1)^3 -
876
 * 2 * Z_2^2 * X_1 * (Z_1^2 * X_2 - Z_2^2 * X_1)^2
877
 * Y_3 = (Z_1^3 * Y_2 - Z_2^3 * Y_1) * (Z_2^2 * X_1 * (Z_1^2 * X_2 - Z_2^2 * X_1)^2 - X_3) -
878
 *        Z_2^3 * Y_1 * (Z_1^2 * X_2 - Z_2^2 * X_1)^3
879
 * Z_3 = (Z_1^2 * X_2 - Z_2^2 * X_1) * (Z_1 * Z_2)
880
 *
881
 * This runs faster if 'mixed' is set, which requires Z_2 = 1 or Z_2 = 0.
882
 */
883
884
/*
885
 * This function is not entirely constant-time: it includes a branch for
886
 * checking whether the two input points are equal, (while not equal to the
887
 * point at infinity). This case never happens during single point
888
 * multiplication, so there is no timing leak for ECDH or ECDSA signing.
889
 */
890
static void point_add(felem x3, felem y3, felem z3,
891
    const felem x1, const felem y1, const felem z1,
892
    const int mixed, const felem x2, const felem y2,
893
    const felem z2)
894
0
{
895
0
    felem ftmp, ftmp2, ftmp3, ftmp4, ftmp5, x_out, y_out, z_out;
896
0
    widefelem tmp, tmp2;
897
0
    limb z1_is_zero, z2_is_zero, x_equal, y_equal;
898
0
    limb points_equal;
899
900
0
    if (!mixed) {
901
        /* ftmp2 = z2^2 */
902
0
        felem_square(tmp, z2);
903
0
        felem_reduce(ftmp2, tmp);
904
905
        /* ftmp4 = z2^3 */
906
0
        felem_mul(tmp, ftmp2, z2);
907
0
        felem_reduce(ftmp4, tmp);
908
909
        /* ftmp4 = z2^3*y1 */
910
0
        felem_mul(tmp2, ftmp4, y1);
911
0
        felem_reduce(ftmp4, tmp2);
912
913
        /* ftmp2 = z2^2*x1 */
914
0
        felem_mul(tmp2, ftmp2, x1);
915
0
        felem_reduce(ftmp2, tmp2);
916
0
    } else {
917
        /*
918
         * We'll assume z2 = 1 (special case z2 = 0 is handled later)
919
         */
920
921
        /* ftmp4 = z2^3*y1 */
922
0
        felem_assign(ftmp4, y1);
923
924
        /* ftmp2 = z2^2*x1 */
925
0
        felem_assign(ftmp2, x1);
926
0
    }
927
928
    /* ftmp = z1^2 */
929
0
    felem_square(tmp, z1);
930
0
    felem_reduce(ftmp, tmp);
931
932
    /* ftmp3 = z1^3 */
933
0
    felem_mul(tmp, ftmp, z1);
934
0
    felem_reduce(ftmp3, tmp);
935
936
    /* tmp = z1^3*y2 */
937
0
    felem_mul(tmp, ftmp3, y2);
938
    /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
939
940
    /* ftmp3 = z1^3*y2 - z2^3*y1 */
941
0
    felem_diff_128_64(tmp, ftmp4);
942
    /* tmp[i] < 2^116 + 2^64 + 8 < 2^117 */
943
0
    felem_reduce(ftmp3, tmp);
944
945
    /* tmp = z1^2*x2 */
946
0
    felem_mul(tmp, ftmp, x2);
947
    /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
948
949
    /* ftmp = z1^2*x2 - z2^2*x1 */
950
0
    felem_diff_128_64(tmp, ftmp2);
951
    /* tmp[i] < 2^116 + 2^64 + 8 < 2^117 */
952
0
    felem_reduce(ftmp, tmp);
953
954
    /*
955
     * The formulae are incorrect if the points are equal, in affine coordinates
956
     * (X_1, Y_1) == (X_2, Y_2), so we check for this and do doubling if this
957
     * happens.
958
     *
959
     * We use bitwise operations to avoid potential side-channels introduced by
960
     * the short-circuiting behaviour of boolean operators.
961
     */
962
0
    x_equal = felem_is_zero(ftmp);
963
0
    y_equal = felem_is_zero(ftmp3);
964
    /*
965
     * The special case of either point being the point at infinity (z1 and/or
966
     * z2 are zero), is handled separately later on in this function, so we
967
     * avoid jumping to point_double here in those special cases.
968
     */
969
0
    z1_is_zero = felem_is_zero(z1);
970
0
    z2_is_zero = felem_is_zero(z2);
971
972
    /*
973
     * Compared to `ecp_nistp256.c` and `ecp_nistp521.c`, in this
974
     * specific implementation `felem_is_zero()` returns truth as `0x1`
975
     * (rather than `0xff..ff`).
976
     *
977
     * This implies that `~true` in this implementation becomes
978
     * `0xff..fe` (rather than `0x0`): for this reason, to be used in
979
     * the if expression, we mask out only the last bit in the next
980
     * line.
981
     */
982
0
    points_equal = (x_equal & y_equal & (~z1_is_zero) & (~z2_is_zero)) & 1;
983
984
0
    if (points_equal) {
985
        /*
986
         * This is obviously not constant-time but, as mentioned before, this
987
         * case never happens during single point multiplication, so there is no
988
         * timing leak for ECDH or ECDSA signing.
989
         */
990
0
        point_double(x3, y3, z3, x1, y1, z1);
991
0
        return;
992
0
    }
993
994
    /* ftmp5 = z1*z2 */
995
0
    if (!mixed) {
996
0
        felem_mul(tmp, z1, z2);
997
0
        felem_reduce(ftmp5, tmp);
998
0
    } else {
999
        /* special case z2 = 0 is handled later */
1000
0
        felem_assign(ftmp5, z1);
1001
0
    }
1002
1003
    /* z_out = (z1^2*x2 - z2^2*x1)*(z1*z2) */
1004
0
    felem_mul(tmp, ftmp, ftmp5);
1005
0
    felem_reduce(z_out, tmp);
1006
1007
    /* ftmp = (z1^2*x2 - z2^2*x1)^2 */
1008
0
    felem_assign(ftmp5, ftmp);
1009
0
    felem_square(tmp, ftmp);
1010
0
    felem_reduce(ftmp, tmp);
1011
1012
    /* ftmp5 = (z1^2*x2 - z2^2*x1)^3 */
1013
0
    felem_mul(tmp, ftmp, ftmp5);
1014
0
    felem_reduce(ftmp5, tmp);
1015
1016
    /* ftmp2 = z2^2*x1*(z1^2*x2 - z2^2*x1)^2 */
1017
0
    felem_mul(tmp, ftmp2, ftmp);
1018
0
    felem_reduce(ftmp2, tmp);
1019
1020
    /* tmp = z2^3*y1*(z1^2*x2 - z2^2*x1)^3 */
1021
0
    felem_mul(tmp, ftmp4, ftmp5);
1022
    /* tmp[i] < 4 * 2^57 * 2^57 = 2^116 */
1023
1024
    /* tmp2 = (z1^3*y2 - z2^3*y1)^2 */
1025
0
    felem_square(tmp2, ftmp3);
1026
    /* tmp2[i] < 4 * 2^57 * 2^57 < 2^116 */
1027
1028
    /* tmp2 = (z1^3*y2 - z2^3*y1)^2 - (z1^2*x2 - z2^2*x1)^3 */
1029
0
    felem_diff_128_64(tmp2, ftmp5);
1030
    /* tmp2[i] < 2^116 + 2^64 + 8 < 2^117 */
1031
1032
    /* ftmp5 = 2*z2^2*x1*(z1^2*x2 - z2^2*x1)^2 */
1033
0
    felem_assign(ftmp5, ftmp2);
1034
0
    felem_scalar(ftmp5, 2);
1035
    /* ftmp5[i] < 2 * 2^57 = 2^58 */
1036
1037
    /*-
1038
     * x_out = (z1^3*y2 - z2^3*y1)^2 - (z1^2*x2 - z2^2*x1)^3 -
1039
     *  2*z2^2*x1*(z1^2*x2 - z2^2*x1)^2
1040
     */
1041
0
    felem_diff_128_64(tmp2, ftmp5);
1042
    /* tmp2[i] < 2^117 + 2^64 + 8 < 2^118 */
1043
0
    felem_reduce(x_out, tmp2);
1044
1045
    /* ftmp2 = z2^2*x1*(z1^2*x2 - z2^2*x1)^2 - x_out */
1046
0
    felem_diff(ftmp2, x_out);
1047
    /* ftmp2[i] < 2^57 + 2^58 + 2 < 2^59 */
1048
1049
    /*
1050
     * tmp2 = (z1^3*y2 - z2^3*y1)*(z2^2*x1*(z1^2*x2 - z2^2*x1)^2 - x_out)
1051
     */
1052
0
    felem_mul(tmp2, ftmp3, ftmp2);
1053
    /* tmp2[i] < 4 * 2^57 * 2^59 = 2^118 */
1054
1055
    /*-
1056
     * y_out = (z1^3*y2 - z2^3*y1)*(z2^2*x1*(z1^2*x2 - z2^2*x1)^2 - x_out) -
1057
     *  z2^3*y1*(z1^2*x2 - z2^2*x1)^3
1058
     */
1059
0
    widefelem_diff(tmp2, tmp);
1060
    /* tmp2[i] < 2^118 + 2^120 < 2^121 */
1061
0
    felem_reduce(y_out, tmp2);
1062
1063
    /*
1064
     * the result (x_out, y_out, z_out) is incorrect if one of the inputs is
1065
     * the point at infinity, so we need to check for this separately
1066
     */
1067
1068
    /*
1069
     * if point 1 is at infinity, copy point 2 to output, and vice versa
1070
     */
1071
0
    copy_conditional(x_out, x2, z1_is_zero);
1072
0
    copy_conditional(x_out, x1, z2_is_zero);
1073
0
    copy_conditional(y_out, y2, z1_is_zero);
1074
0
    copy_conditional(y_out, y1, z2_is_zero);
1075
0
    copy_conditional(z_out, z2, z1_is_zero);
1076
0
    copy_conditional(z_out, z1, z2_is_zero);
1077
0
    felem_assign(x3, x_out);
1078
0
    felem_assign(y3, y_out);
1079
0
    felem_assign(z3, z_out);
1080
0
}
1081
1082
/*
1083
 * select_point selects the |idx|th point from a precomputation table and
1084
 * copies it to out.
1085
 * The pre_comp array argument should be size of |size| argument
1086
 */
1087
static void select_point(const uint64_t idx, unsigned int size,
1088
    const felem pre_comp[][3], felem out[3])
1089
0
{
1090
0
    unsigned i, j;
1091
0
    limb *outlimbs = &out[0][0];
1092
1093
0
    memset(out, 0, sizeof(*out) * 3);
1094
0
    for (i = 0; i < size; i++) {
1095
0
        const limb *inlimbs = &pre_comp[i][0][0];
1096
0
        uint64_t mask = i ^ idx;
1097
0
        mask |= mask >> 4;
1098
0
        mask |= mask >> 2;
1099
0
        mask |= mask >> 1;
1100
0
        mask &= 1;
1101
0
        mask--;
1102
0
        for (j = 0; j < 4 * 3; j++)
1103
0
            outlimbs[j] |= inlimbs[j] & mask;
1104
0
    }
1105
0
}
1106
1107
/* get_bit returns the |i|th bit in |in| */
1108
static char get_bit(const felem_bytearray in, unsigned i)
1109
0
{
1110
0
    if (i >= 224)
1111
0
        return 0;
1112
0
    return (in[i >> 3] >> (i & 7)) & 1;
1113
0
}
1114
1115
/*
1116
 * Interleaved point multiplication using precomputed point multiples: The
1117
 * small point multiples 0*P, 1*P, ..., 16*P are in pre_comp[], the scalars
1118
 * in scalars[]. If g_scalar is non-NULL, we also add this multiple of the
1119
 * generator, using certain (large) precomputed multiples in g_pre_comp.
1120
 * Output point (X, Y, Z) is stored in x_out, y_out, z_out
1121
 */
1122
static void batch_mul(felem x_out, felem y_out, felem z_out,
1123
    const felem_bytearray scalars[],
1124
    const unsigned num_points, const uint8_t *g_scalar,
1125
    const int mixed, const felem pre_comp[][17][3],
1126
    const felem g_pre_comp[2][16][3])
1127
0
{
1128
0
    int i, skip;
1129
0
    unsigned num;
1130
0
    unsigned gen_mul = (g_scalar != NULL);
1131
0
    felem nq[3], tmp[4];
1132
0
    uint64_t bits;
1133
0
    uint8_t sign, digit;
1134
1135
    /* set nq to the point at infinity */
1136
0
    memset(nq, 0, sizeof(nq));
1137
1138
    /*
1139
     * Loop over all scalars msb-to-lsb, interleaving additions of multiples
1140
     * of the generator (two in each of the last 28 rounds) and additions of
1141
     * other points multiples (every 5th round).
1142
     */
1143
0
    skip = 1; /* save two point operations in the first
1144
               * round */
1145
0
    for (i = (num_points ? 220 : 27); i >= 0; --i) {
1146
        /* double */
1147
0
        if (!skip)
1148
0
            point_double(nq[0], nq[1], nq[2], nq[0], nq[1], nq[2]);
1149
1150
        /* add multiples of the generator */
1151
0
        if (gen_mul && (i <= 27)) {
1152
            /* first, look 28 bits upwards */
1153
0
            bits = get_bit(g_scalar, i + 196) << 3;
1154
0
            bits |= get_bit(g_scalar, i + 140) << 2;
1155
0
            bits |= get_bit(g_scalar, i + 84) << 1;
1156
0
            bits |= get_bit(g_scalar, i + 28);
1157
            /* select the point to add, in constant time */
1158
0
            select_point(bits, 16, g_pre_comp[1], tmp);
1159
1160
0
            if (!skip) {
1161
                /* value 1 below is argument for "mixed" */
1162
0
                point_add(nq[0], nq[1], nq[2],
1163
0
                    nq[0], nq[1], nq[2], 1, tmp[0], tmp[1], tmp[2]);
1164
0
            } else {
1165
0
                memcpy(nq, tmp, 3 * sizeof(felem));
1166
0
                skip = 0;
1167
0
            }
1168
1169
            /* second, look at the current position */
1170
0
            bits = get_bit(g_scalar, i + 168) << 3;
1171
0
            bits |= get_bit(g_scalar, i + 112) << 2;
1172
0
            bits |= get_bit(g_scalar, i + 56) << 1;
1173
0
            bits |= get_bit(g_scalar, i);
1174
            /* select the point to add, in constant time */
1175
0
            select_point(bits, 16, g_pre_comp[0], tmp);
1176
0
            point_add(nq[0], nq[1], nq[2],
1177
0
                nq[0], nq[1], nq[2],
1178
0
                1 /* mixed */, tmp[0], tmp[1], tmp[2]);
1179
0
        }
1180
1181
        /* do other additions every 5 doublings */
1182
0
        if (num_points && (i % 5 == 0)) {
1183
            /* loop over all scalars */
1184
0
            for (num = 0; num < num_points; ++num) {
1185
0
                bits = get_bit(scalars[num], i + 4) << 5;
1186
0
                bits |= get_bit(scalars[num], i + 3) << 4;
1187
0
                bits |= get_bit(scalars[num], i + 2) << 3;
1188
0
                bits |= get_bit(scalars[num], i + 1) << 2;
1189
0
                bits |= get_bit(scalars[num], i) << 1;
1190
0
                bits |= get_bit(scalars[num], i - 1);
1191
0
                ossl_ec_GFp_nistp_recode_scalar_bits(&sign, &digit, bits);
1192
1193
                /* select the point to add or subtract */
1194
0
                select_point(digit, 17, pre_comp[num], tmp);
1195
0
                felem_neg(tmp[3], tmp[1]); /* (X, -Y, Z) is the negative
1196
                                            * point */
1197
0
                copy_conditional(tmp[1], tmp[3], sign);
1198
1199
0
                if (!skip) {
1200
0
                    point_add(nq[0], nq[1], nq[2],
1201
0
                        nq[0], nq[1], nq[2],
1202
0
                        mixed, tmp[0], tmp[1], tmp[2]);
1203
0
                } else {
1204
0
                    memcpy(nq, tmp, 3 * sizeof(felem));
1205
0
                    skip = 0;
1206
0
                }
1207
0
            }
1208
0
        }
1209
0
    }
1210
0
    felem_assign(x_out, nq[0]);
1211
0
    felem_assign(y_out, nq[1]);
1212
0
    felem_assign(z_out, nq[2]);
1213
0
}
1214
1215
/******************************************************************************/
1216
/*
1217
 * FUNCTIONS TO MANAGE PRECOMPUTATION
1218
 */
1219
1220
static NISTP224_PRE_COMP *nistp224_pre_comp_new(void)
1221
0
{
1222
0
    NISTP224_PRE_COMP *ret = OPENSSL_zalloc(sizeof(*ret));
1223
1224
0
    if (ret == NULL)
1225
0
        return ret;
1226
1227
0
    if (!CRYPTO_NEW_REF(&ret->references, 1)) {
1228
0
        OPENSSL_free(ret);
1229
0
        return NULL;
1230
0
    }
1231
0
    return ret;
1232
0
}
1233
1234
NISTP224_PRE_COMP *EC_nistp224_pre_comp_dup(NISTP224_PRE_COMP *p)
1235
0
{
1236
0
    int i;
1237
0
    if (p != NULL)
1238
0
        CRYPTO_UP_REF(&p->references, &i);
1239
0
    return p;
1240
0
}
1241
1242
void EC_nistp224_pre_comp_free(NISTP224_PRE_COMP *p)
1243
0
{
1244
0
    int i;
1245
1246
0
    if (p == NULL)
1247
0
        return;
1248
1249
0
    CRYPTO_DOWN_REF(&p->references, &i);
1250
0
    REF_PRINT_COUNT("EC_nistp224", i, p);
1251
0
    if (i > 0)
1252
0
        return;
1253
0
    REF_ASSERT_ISNT(i < 0);
1254
1255
0
    CRYPTO_FREE_REF(&p->references);
1256
0
    OPENSSL_free(p);
1257
0
}
1258
1259
/******************************************************************************/
1260
/*
1261
 * OPENSSL EC_METHOD FUNCTIONS
1262
 */
1263
1264
int ossl_ec_GFp_nistp224_group_init(EC_GROUP *group)
1265
0
{
1266
0
    int ret;
1267
0
    ret = ossl_ec_GFp_simple_group_init(group);
1268
0
    group->a_is_minus3 = 1;
1269
0
    return ret;
1270
0
}
1271
1272
int ossl_ec_GFp_nistp224_group_set_curve(EC_GROUP *group, const BIGNUM *p,
1273
    const BIGNUM *a, const BIGNUM *b,
1274
    BN_CTX *ctx)
1275
0
{
1276
0
    int ret = 0;
1277
0
    BIGNUM *curve_p, *curve_a, *curve_b;
1278
0
#ifndef FIPS_MODULE
1279
0
    BN_CTX *new_ctx = NULL;
1280
1281
0
    if (ctx == NULL)
1282
0
        ctx = new_ctx = BN_CTX_new();
1283
0
#endif
1284
0
    if (ctx == NULL)
1285
0
        return 0;
1286
1287
0
    BN_CTX_start(ctx);
1288
0
    curve_p = BN_CTX_get(ctx);
1289
0
    curve_a = BN_CTX_get(ctx);
1290
0
    curve_b = BN_CTX_get(ctx);
1291
0
    if (curve_b == NULL)
1292
0
        goto err;
1293
0
    BN_bin2bn(nistp224_curve_params[0], sizeof(felem_bytearray), curve_p);
1294
0
    BN_bin2bn(nistp224_curve_params[1], sizeof(felem_bytearray), curve_a);
1295
0
    BN_bin2bn(nistp224_curve_params[2], sizeof(felem_bytearray), curve_b);
1296
0
    if ((BN_cmp(curve_p, p)) || (BN_cmp(curve_a, a)) || (BN_cmp(curve_b, b))) {
1297
0
        ERR_raise(ERR_LIB_EC, EC_R_WRONG_CURVE_PARAMETERS);
1298
0
        goto err;
1299
0
    }
1300
0
    group->field_mod_func = BN_nist_mod_224;
1301
0
    ret = ossl_ec_GFp_simple_group_set_curve(group, p, a, b, ctx);
1302
0
err:
1303
0
    BN_CTX_end(ctx);
1304
0
#ifndef FIPS_MODULE
1305
0
    BN_CTX_free(new_ctx);
1306
0
#endif
1307
0
    return ret;
1308
0
}
1309
1310
/*
1311
 * Takes the Jacobian coordinates (X, Y, Z) of a point and returns (X', Y') =
1312
 * (X/Z^2, Y/Z^3)
1313
 */
1314
int ossl_ec_GFp_nistp224_point_get_affine_coordinates(const EC_GROUP *group,
1315
    const EC_POINT *point,
1316
    BIGNUM *x, BIGNUM *y,
1317
    BN_CTX *ctx)
1318
0
{
1319
0
    felem z1, z2, x_in, y_in, x_out, y_out;
1320
0
    widefelem tmp;
1321
1322
0
    if (EC_POINT_is_at_infinity(group, point)) {
1323
0
        ERR_raise(ERR_LIB_EC, EC_R_POINT_AT_INFINITY);
1324
0
        return 0;
1325
0
    }
1326
0
    if ((!BN_to_felem(x_in, point->X)) || (!BN_to_felem(y_in, point->Y)) || (!BN_to_felem(z1, point->Z)))
1327
0
        return 0;
1328
0
    felem_inv(z2, z1);
1329
0
    felem_square(tmp, z2);
1330
0
    felem_reduce(z1, tmp);
1331
0
    felem_mul(tmp, x_in, z1);
1332
0
    felem_reduce(x_in, tmp);
1333
0
    felem_contract(x_out, x_in);
1334
0
    if (x != NULL) {
1335
0
        if (!felem_to_BN(x, x_out)) {
1336
0
            ERR_raise(ERR_LIB_EC, ERR_R_BN_LIB);
1337
0
            return 0;
1338
0
        }
1339
0
    }
1340
0
    felem_mul(tmp, z1, z2);
1341
0
    felem_reduce(z1, tmp);
1342
0
    felem_mul(tmp, y_in, z1);
1343
0
    felem_reduce(y_in, tmp);
1344
0
    felem_contract(y_out, y_in);
1345
0
    if (y != NULL) {
1346
0
        if (!felem_to_BN(y, y_out)) {
1347
0
            ERR_raise(ERR_LIB_EC, ERR_R_BN_LIB);
1348
0
            return 0;
1349
0
        }
1350
0
    }
1351
0
    return 1;
1352
0
}
1353
1354
static void make_points_affine(size_t num, felem points[/* num */][3],
1355
    felem tmp_felems[/* num+1 */])
1356
0
{
1357
    /*
1358
     * Runs in constant time, unless an input is the point at infinity (which
1359
     * normally shouldn't happen).
1360
     */
1361
0
    ossl_ec_GFp_nistp_points_make_affine_internal(num,
1362
0
        points,
1363
0
        sizeof(felem),
1364
0
        tmp_felems,
1365
0
        (void (*)(void *))felem_one,
1366
0
        felem_is_zero_int,
1367
0
        (void (*)(void *, const void *))
1368
0
            felem_assign,
1369
0
        (void (*)(void *, const void *))
1370
0
            felem_square_reduce,
1371
0
        (void (*)(void *,
1372
0
            const void
1373
0
                *,
1374
0
            const void
1375
0
                *))
1376
0
            felem_mul_reduce,
1377
0
        (void (*)(void *, const void *))
1378
0
            felem_inv,
1379
0
        (void (*)(void *, const void *))
1380
0
            felem_contract);
1381
0
}
1382
1383
/*
1384
 * Computes scalar*generator + \sum scalars[i]*points[i], ignoring NULL
1385
 * values Result is stored in r (r can equal one of the inputs).
1386
 */
1387
int ossl_ec_GFp_nistp224_points_mul(const EC_GROUP *group, EC_POINT *r,
1388
    const BIGNUM *scalar, size_t num,
1389
    const EC_POINT *points[],
1390
    const BIGNUM *scalars[], BN_CTX *ctx)
1391
0
{
1392
0
    int ret = 0;
1393
0
    int j;
1394
0
    unsigned i;
1395
0
    int mixed = 0;
1396
0
    BIGNUM *x, *y, *z, *tmp_scalar;
1397
0
    felem_bytearray g_secret;
1398
0
    felem_bytearray *secrets = NULL;
1399
0
    felem(*pre_comp)[17][3] = NULL;
1400
0
    felem *tmp_felems = NULL;
1401
0
    int num_bytes;
1402
0
    int have_pre_comp = 0;
1403
0
    size_t num_points = num;
1404
0
    felem x_in, y_in, z_in, x_out, y_out, z_out;
1405
0
    NISTP224_PRE_COMP *pre = NULL;
1406
0
    const felem(*g_pre_comp)[16][3] = NULL;
1407
0
    EC_POINT *generator = NULL;
1408
0
    const EC_POINT *p = NULL;
1409
0
    const BIGNUM *p_scalar = NULL;
1410
1411
0
    BN_CTX_start(ctx);
1412
0
    x = BN_CTX_get(ctx);
1413
0
    y = BN_CTX_get(ctx);
1414
0
    z = BN_CTX_get(ctx);
1415
0
    tmp_scalar = BN_CTX_get(ctx);
1416
0
    if (tmp_scalar == NULL)
1417
0
        goto err;
1418
1419
0
    if (scalar != NULL) {
1420
0
        pre = group->pre_comp.nistp224;
1421
0
        if (pre)
1422
            /* we have precomputation, try to use it */
1423
0
            g_pre_comp = (const felem(*)[16][3])pre->g_pre_comp;
1424
0
        else
1425
            /* try to use the standard precomputation */
1426
0
            g_pre_comp = &gmul[0];
1427
0
        generator = EC_POINT_new(group);
1428
0
        if (generator == NULL)
1429
0
            goto err;
1430
        /* get the generator from precomputation */
1431
0
        if (!felem_to_BN(x, g_pre_comp[0][1][0]) || !felem_to_BN(y, g_pre_comp[0][1][1]) || !felem_to_BN(z, g_pre_comp[0][1][2])) {
1432
0
            ERR_raise(ERR_LIB_EC, ERR_R_BN_LIB);
1433
0
            goto err;
1434
0
        }
1435
0
        if (!ossl_ec_GFp_simple_set_Jprojective_coordinates_GFp(group,
1436
0
                generator,
1437
0
                x, y, z, ctx))
1438
0
            goto err;
1439
0
        if (0 == EC_POINT_cmp(group, generator, group->generator, ctx))
1440
            /* precomputation matches generator */
1441
0
            have_pre_comp = 1;
1442
0
        else
1443
            /*
1444
             * we don't have valid precomputation: treat the generator as a
1445
             * random point
1446
             */
1447
0
            num_points = num_points + 1;
1448
0
    }
1449
1450
0
    if (num_points > 0) {
1451
0
        if (num_points >= 3) {
1452
            /*
1453
             * unless we precompute multiples for just one or two points,
1454
             * converting those into affine form is time well spent
1455
             */
1456
0
            mixed = 1;
1457
0
        }
1458
0
        secrets = OPENSSL_calloc(num_points, sizeof(*secrets));
1459
0
        pre_comp = OPENSSL_calloc(num_points, sizeof(*pre_comp));
1460
0
        if (mixed)
1461
0
            tmp_felems = OPENSSL_malloc_array(num_points * 17 + 1, sizeof(felem));
1462
0
        if ((secrets == NULL) || (pre_comp == NULL)
1463
0
            || (mixed && (tmp_felems == NULL)))
1464
0
            goto err;
1465
1466
        /*
1467
         * we treat NULL scalars as 0, and NULL points as points at infinity,
1468
         * i.e., they contribute nothing to the linear combination
1469
         */
1470
0
        for (i = 0; i < num_points; ++i) {
1471
0
            if (i == num) {
1472
                /* the generator */
1473
0
                p = EC_GROUP_get0_generator(group);
1474
0
                p_scalar = scalar;
1475
0
            } else {
1476
                /* the i^th point */
1477
0
                p = points[i];
1478
0
                p_scalar = scalars[i];
1479
0
            }
1480
0
            if ((p_scalar != NULL) && (p != NULL)) {
1481
                /* reduce scalar to 0 <= scalar < 2^224 */
1482
0
                if ((BN_num_bits(p_scalar) > 224)
1483
0
                    || (BN_is_negative(p_scalar))) {
1484
                    /*
1485
                     * this is an unusual input, and we don't guarantee
1486
                     * constant-timeness
1487
                     */
1488
0
                    if (!BN_nnmod(tmp_scalar, p_scalar, group->order, ctx)) {
1489
0
                        ERR_raise(ERR_LIB_EC, ERR_R_BN_LIB);
1490
0
                        goto err;
1491
0
                    }
1492
0
                    num_bytes = BN_bn2lebinpad(tmp_scalar,
1493
0
                        secrets[i], sizeof(secrets[i]));
1494
0
                } else {
1495
0
                    num_bytes = BN_bn2lebinpad(p_scalar,
1496
0
                        secrets[i], sizeof(secrets[i]));
1497
0
                }
1498
0
                if (num_bytes < 0) {
1499
0
                    ERR_raise(ERR_LIB_EC, ERR_R_BN_LIB);
1500
0
                    goto err;
1501
0
                }
1502
                /* precompute multiples */
1503
0
                if ((!BN_to_felem(x_out, p->X)) || (!BN_to_felem(y_out, p->Y)) || (!BN_to_felem(z_out, p->Z)))
1504
0
                    goto err;
1505
0
                felem_assign(pre_comp[i][1][0], x_out);
1506
0
                felem_assign(pre_comp[i][1][1], y_out);
1507
0
                felem_assign(pre_comp[i][1][2], z_out);
1508
0
                for (j = 2; j <= 16; ++j) {
1509
0
                    if (j & 1) {
1510
0
                        point_add(pre_comp[i][j][0], pre_comp[i][j][1],
1511
0
                            pre_comp[i][j][2], pre_comp[i][1][0],
1512
0
                            pre_comp[i][1][1], pre_comp[i][1][2], 0,
1513
0
                            pre_comp[i][j - 1][0],
1514
0
                            pre_comp[i][j - 1][1],
1515
0
                            pre_comp[i][j - 1][2]);
1516
0
                    } else {
1517
0
                        point_double(pre_comp[i][j][0], pre_comp[i][j][1],
1518
0
                            pre_comp[i][j][2], pre_comp[i][j / 2][0],
1519
0
                            pre_comp[i][j / 2][1],
1520
0
                            pre_comp[i][j / 2][2]);
1521
0
                    }
1522
0
                }
1523
0
            }
1524
0
        }
1525
0
        if (mixed)
1526
0
            make_points_affine(num_points * 17, pre_comp[0], tmp_felems);
1527
0
    }
1528
1529
    /* the scalar for the generator */
1530
0
    if ((scalar != NULL) && (have_pre_comp)) {
1531
0
        memset(g_secret, 0, sizeof(g_secret));
1532
        /* reduce scalar to 0 <= scalar < 2^224 */
1533
0
        if ((BN_num_bits(scalar) > 224) || (BN_is_negative(scalar))) {
1534
            /*
1535
             * this is an unusual input, and we don't guarantee
1536
             * constant-timeness
1537
             */
1538
0
            if (!BN_nnmod(tmp_scalar, scalar, group->order, ctx)) {
1539
0
                ERR_raise(ERR_LIB_EC, ERR_R_BN_LIB);
1540
0
                goto err;
1541
0
            }
1542
0
            num_bytes = BN_bn2lebinpad(tmp_scalar, g_secret, sizeof(g_secret));
1543
0
        } else {
1544
0
            num_bytes = BN_bn2lebinpad(scalar, g_secret, sizeof(g_secret));
1545
0
        }
1546
        /* do the multiplication with generator precomputation */
1547
0
        batch_mul(x_out, y_out, z_out,
1548
0
            (const felem_bytearray(*))secrets, num_points,
1549
0
            g_secret,
1550
0
            mixed, (const felem(*)[17][3])pre_comp, g_pre_comp);
1551
0
    } else {
1552
        /* do the multiplication without generator precomputation */
1553
0
        batch_mul(x_out, y_out, z_out,
1554
0
            (const felem_bytearray(*))secrets, num_points,
1555
0
            NULL, mixed, (const felem(*)[17][3])pre_comp, NULL);
1556
0
    }
1557
    /* reduce the output to its unique minimal representation */
1558
0
    felem_contract(x_in, x_out);
1559
0
    felem_contract(y_in, y_out);
1560
0
    felem_contract(z_in, z_out);
1561
0
    if ((!felem_to_BN(x, x_in)) || (!felem_to_BN(y, y_in)) || (!felem_to_BN(z, z_in))) {
1562
0
        ERR_raise(ERR_LIB_EC, ERR_R_BN_LIB);
1563
0
        goto err;
1564
0
    }
1565
0
    ret = ossl_ec_GFp_simple_set_Jprojective_coordinates_GFp(group, r, x, y, z,
1566
0
        ctx);
1567
1568
0
err:
1569
0
    BN_CTX_end(ctx);
1570
0
    EC_POINT_free(generator);
1571
0
    OPENSSL_free(secrets);
1572
0
    OPENSSL_free(pre_comp);
1573
0
    OPENSSL_free(tmp_felems);
1574
0
    return ret;
1575
0
}
1576
1577
int ossl_ec_GFp_nistp224_precompute_mult(EC_GROUP *group, BN_CTX *ctx)
1578
0
{
1579
0
    int ret = 0;
1580
0
    NISTP224_PRE_COMP *pre = NULL;
1581
0
    int i, j;
1582
0
    BIGNUM *x, *y;
1583
0
    EC_POINT *generator = NULL;
1584
0
    felem tmp_felems[32];
1585
0
#ifndef FIPS_MODULE
1586
0
    BN_CTX *new_ctx = NULL;
1587
0
#endif
1588
1589
    /* throw away old precomputation */
1590
0
    EC_pre_comp_free(group);
1591
1592
0
#ifndef FIPS_MODULE
1593
0
    if (ctx == NULL)
1594
0
        ctx = new_ctx = BN_CTX_new();
1595
0
#endif
1596
0
    if (ctx == NULL)
1597
0
        return 0;
1598
1599
0
    BN_CTX_start(ctx);
1600
0
    x = BN_CTX_get(ctx);
1601
0
    y = BN_CTX_get(ctx);
1602
0
    if (y == NULL)
1603
0
        goto err;
1604
    /* get the generator */
1605
0
    if (group->generator == NULL)
1606
0
        goto err;
1607
0
    generator = EC_POINT_new(group);
1608
0
    if (generator == NULL)
1609
0
        goto err;
1610
0
    BN_bin2bn(nistp224_curve_params[3], sizeof(felem_bytearray), x);
1611
0
    BN_bin2bn(nistp224_curve_params[4], sizeof(felem_bytearray), y);
1612
0
    if (!EC_POINT_set_affine_coordinates(group, generator, x, y, ctx))
1613
0
        goto err;
1614
0
    if ((pre = nistp224_pre_comp_new()) == NULL)
1615
0
        goto err;
1616
    /*
1617
     * if the generator is the standard one, use built-in precomputation
1618
     */
1619
0
    if (0 == EC_POINT_cmp(group, generator, group->generator, ctx)) {
1620
0
        memcpy(pre->g_pre_comp, gmul, sizeof(pre->g_pre_comp));
1621
0
        goto done;
1622
0
    }
1623
0
    if ((!BN_to_felem(pre->g_pre_comp[0][1][0], group->generator->X)) || (!BN_to_felem(pre->g_pre_comp[0][1][1], group->generator->Y)) || (!BN_to_felem(pre->g_pre_comp[0][1][2], group->generator->Z)))
1624
0
        goto err;
1625
    /*
1626
     * compute 2^56*G, 2^112*G, 2^168*G for the first table, 2^28*G, 2^84*G,
1627
     * 2^140*G, 2^196*G for the second one
1628
     */
1629
0
    for (i = 1; i <= 8; i <<= 1) {
1630
0
        point_double(pre->g_pre_comp[1][i][0], pre->g_pre_comp[1][i][1],
1631
0
            pre->g_pre_comp[1][i][2], pre->g_pre_comp[0][i][0],
1632
0
            pre->g_pre_comp[0][i][1], pre->g_pre_comp[0][i][2]);
1633
0
        for (j = 0; j < 27; ++j) {
1634
0
            point_double(pre->g_pre_comp[1][i][0], pre->g_pre_comp[1][i][1],
1635
0
                pre->g_pre_comp[1][i][2], pre->g_pre_comp[1][i][0],
1636
0
                pre->g_pre_comp[1][i][1], pre->g_pre_comp[1][i][2]);
1637
0
        }
1638
0
        if (i == 8)
1639
0
            break;
1640
0
        point_double(pre->g_pre_comp[0][2 * i][0],
1641
0
            pre->g_pre_comp[0][2 * i][1],
1642
0
            pre->g_pre_comp[0][2 * i][2], pre->g_pre_comp[1][i][0],
1643
0
            pre->g_pre_comp[1][i][1], pre->g_pre_comp[1][i][2]);
1644
0
        for (j = 0; j < 27; ++j) {
1645
0
            point_double(pre->g_pre_comp[0][2 * i][0],
1646
0
                pre->g_pre_comp[0][2 * i][1],
1647
0
                pre->g_pre_comp[0][2 * i][2],
1648
0
                pre->g_pre_comp[0][2 * i][0],
1649
0
                pre->g_pre_comp[0][2 * i][1],
1650
0
                pre->g_pre_comp[0][2 * i][2]);
1651
0
        }
1652
0
    }
1653
0
    for (i = 0; i < 2; i++) {
1654
        /* g_pre_comp[i][0] is the point at infinity */
1655
0
        memset(pre->g_pre_comp[i][0], 0, sizeof(pre->g_pre_comp[i][0]));
1656
        /* the remaining multiples */
1657
        /* 2^56*G + 2^112*G resp. 2^84*G + 2^140*G */
1658
0
        point_add(pre->g_pre_comp[i][6][0], pre->g_pre_comp[i][6][1],
1659
0
            pre->g_pre_comp[i][6][2], pre->g_pre_comp[i][4][0],
1660
0
            pre->g_pre_comp[i][4][1], pre->g_pre_comp[i][4][2],
1661
0
            0, pre->g_pre_comp[i][2][0], pre->g_pre_comp[i][2][1],
1662
0
            pre->g_pre_comp[i][2][2]);
1663
        /* 2^56*G + 2^168*G resp. 2^84*G + 2^196*G */
1664
0
        point_add(pre->g_pre_comp[i][10][0], pre->g_pre_comp[i][10][1],
1665
0
            pre->g_pre_comp[i][10][2], pre->g_pre_comp[i][8][0],
1666
0
            pre->g_pre_comp[i][8][1], pre->g_pre_comp[i][8][2],
1667
0
            0, pre->g_pre_comp[i][2][0], pre->g_pre_comp[i][2][1],
1668
0
            pre->g_pre_comp[i][2][2]);
1669
        /* 2^112*G + 2^168*G resp. 2^140*G + 2^196*G */
1670
0
        point_add(pre->g_pre_comp[i][12][0], pre->g_pre_comp[i][12][1],
1671
0
            pre->g_pre_comp[i][12][2], pre->g_pre_comp[i][8][0],
1672
0
            pre->g_pre_comp[i][8][1], pre->g_pre_comp[i][8][2],
1673
0
            0, pre->g_pre_comp[i][4][0], pre->g_pre_comp[i][4][1],
1674
0
            pre->g_pre_comp[i][4][2]);
1675
        /*
1676
         * 2^56*G + 2^112*G + 2^168*G resp. 2^84*G + 2^140*G + 2^196*G
1677
         */
1678
0
        point_add(pre->g_pre_comp[i][14][0], pre->g_pre_comp[i][14][1],
1679
0
            pre->g_pre_comp[i][14][2], pre->g_pre_comp[i][12][0],
1680
0
            pre->g_pre_comp[i][12][1], pre->g_pre_comp[i][12][2],
1681
0
            0, pre->g_pre_comp[i][2][0], pre->g_pre_comp[i][2][1],
1682
0
            pre->g_pre_comp[i][2][2]);
1683
0
        for (j = 1; j < 8; ++j) {
1684
            /* odd multiples: add G resp. 2^28*G */
1685
0
            point_add(pre->g_pre_comp[i][2 * j + 1][0],
1686
0
                pre->g_pre_comp[i][2 * j + 1][1],
1687
0
                pre->g_pre_comp[i][2 * j + 1][2],
1688
0
                pre->g_pre_comp[i][2 * j][0],
1689
0
                pre->g_pre_comp[i][2 * j][1],
1690
0
                pre->g_pre_comp[i][2 * j][2], 0,
1691
0
                pre->g_pre_comp[i][1][0], pre->g_pre_comp[i][1][1],
1692
0
                pre->g_pre_comp[i][1][2]);
1693
0
        }
1694
0
    }
1695
0
    make_points_affine(31, &(pre->g_pre_comp[0][1]), tmp_felems);
1696
1697
0
done:
1698
0
    SETPRECOMP(group, nistp224, pre);
1699
0
    pre = NULL;
1700
0
    ret = 1;
1701
0
err:
1702
0
    BN_CTX_end(ctx);
1703
0
    EC_POINT_free(generator);
1704
0
#ifndef FIPS_MODULE
1705
0
    BN_CTX_free(new_ctx);
1706
0
#endif
1707
0
    EC_nistp224_pre_comp_free(pre);
1708
0
    return ret;
1709
0
}
1710
1711
int ossl_ec_GFp_nistp224_have_precompute_mult(const EC_GROUP *group)
1712
0
{
1713
    return HAVEPRECOMP(group, nistp224);
1714
0
}