Coverage Report

Created: 2025-06-13 06:58

/src/openssl30/crypto/bn/bn_mul.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright 1995-2018 The OpenSSL Project Authors. All Rights Reserved.
3
 *
4
 * Licensed under the Apache License 2.0 (the "License").  You may not use
5
 * this file except in compliance with the License.  You can obtain a copy
6
 * in the file LICENSE in the source distribution or at
7
 * https://www.openssl.org/source/license.html
8
 */
9
10
#include <assert.h>
11
#include "internal/cryptlib.h"
12
#include "bn_local.h"
13
14
#if defined(OPENSSL_NO_ASM) || !defined(OPENSSL_BN_ASM_PART_WORDS)
15
/*
16
 * Here follows specialised variants of bn_add_words() and bn_sub_words().
17
 * They have the property performing operations on arrays of different sizes.
18
 * The sizes of those arrays is expressed through cl, which is the common
19
 * length ( basically, min(len(a),len(b)) ), and dl, which is the delta
20
 * between the two lengths, calculated as len(a)-len(b). All lengths are the
21
 * number of BN_ULONGs...  For the operations that require a result array as
22
 * parameter, it must have the length cl+abs(dl). These functions should
23
 * probably end up in bn_asm.c as soon as there are assembler counterparts
24
 * for the systems that use assembler files.
25
 */
26
27
BN_ULONG bn_sub_part_words(BN_ULONG *r,
28
                           const BN_ULONG *a, const BN_ULONG *b,
29
                           int cl, int dl)
30
48.9M
{
31
48.9M
    BN_ULONG c, t;
32
33
48.9M
    assert(cl >= 0);
34
48.9M
    c = bn_sub_words(r, a, b, cl);
35
36
48.9M
    if (dl == 0)
37
48.1M
        return c;
38
39
824k
    r += cl;
40
824k
    a += cl;
41
824k
    b += cl;
42
43
824k
    if (dl < 0) {
44
260k
        for (;;) {
45
260k
            t = b[0];
46
260k
            r[0] = (0 - t - c) & BN_MASK2;
47
260k
            if (t != 0)
48
0
                c = 1;
49
260k
            if (++dl >= 0)
50
24.1k
                break;
51
52
236k
            t = b[1];
53
236k
            r[1] = (0 - t - c) & BN_MASK2;
54
236k
            if (t != 0)
55
0
                c = 1;
56
236k
            if (++dl >= 0)
57
16.3k
                break;
58
59
220k
            t = b[2];
60
220k
            r[2] = (0 - t - c) & BN_MASK2;
61
220k
            if (t != 0)
62
0
                c = 1;
63
220k
            if (++dl >= 0)
64
33.5k
                break;
65
66
186k
            t = b[3];
67
186k
            r[3] = (0 - t - c) & BN_MASK2;
68
186k
            if (t != 0)
69
0
                c = 1;
70
186k
            if (++dl >= 0)
71
7.96k
                break;
72
73
178k
            b += 4;
74
178k
            r += 4;
75
178k
        }
76
742k
    } else {
77
742k
        int save_dl = dl;
78
940k
        while (c) {
79
252k
            t = a[0];
80
252k
            r[0] = (t - c) & BN_MASK2;
81
252k
            if (t != 0)
82
84.3k
                c = 0;
83
252k
            if (--dl <= 0)
84
17.0k
                break;
85
86
235k
            t = a[1];
87
235k
            r[1] = (t - c) & BN_MASK2;
88
235k
            if (t != 0)
89
75.0k
                c = 0;
90
235k
            if (--dl <= 0)
91
8.02k
                break;
92
93
227k
            t = a[2];
94
227k
            r[2] = (t - c) & BN_MASK2;
95
227k
            if (t != 0)
96
84.3k
                c = 0;
97
227k
            if (--dl <= 0)
98
14.8k
                break;
99
100
212k
            t = a[3];
101
212k
            r[3] = (t - c) & BN_MASK2;
102
212k
            if (t != 0)
103
74.0k
                c = 0;
104
212k
            if (--dl <= 0)
105
14.5k
                break;
106
107
197k
            save_dl = dl;
108
197k
            a += 4;
109
197k
            r += 4;
110
197k
        }
111
742k
        if (dl > 0) {
112
688k
            if (save_dl > dl) {
113
0
                switch (save_dl - dl) {
114
0
                case 1:
115
0
                    r[1] = a[1];
116
0
                    if (--dl <= 0)
117
0
                        break;
118
                    /* fall thru */
119
0
                case 2:
120
0
                    r[2] = a[2];
121
0
                    if (--dl <= 0)
122
0
                        break;
123
                    /* fall thru */
124
0
                case 3:
125
0
                    r[3] = a[3];
126
0
                    if (--dl <= 0)
127
0
                        break;
128
0
                }
129
0
                a += 4;
130
0
                r += 4;
131
0
            }
132
688k
        }
133
742k
        if (dl > 0) {
134
5.69M
            for (;;) {
135
5.69M
                r[0] = a[0];
136
5.69M
                if (--dl <= 0)
137
140k
                    break;
138
5.55M
                r[1] = a[1];
139
5.55M
                if (--dl <= 0)
140
64.9k
                    break;
141
5.49M
                r[2] = a[2];
142
5.49M
                if (--dl <= 0)
143
273k
                    break;
144
5.22M
                r[3] = a[3];
145
5.22M
                if (--dl <= 0)
146
210k
                    break;
147
148
5.01M
                a += 4;
149
5.01M
                r += 4;
150
5.01M
            }
151
688k
        }
152
742k
    }
153
824k
    return c;
154
824k
}
155
#endif
156
157
#ifdef BN_RECURSION
158
/*
159
 * Karatsuba recursive multiplication algorithm (cf. Knuth, The Art of
160
 * Computer Programming, Vol. 2)
161
 */
162
163
/*-
164
 * r is 2*n2 words in size,
165
 * a and b are both n2 words in size.
166
 * n2 must be a power of 2.
167
 * We multiply and return the result.
168
 * t must be 2*n2 words in size
169
 * We calculate
170
 * a[0]*b[0]
171
 * a[0]*b[0]+a[1]*b[1]+(a[0]-a[1])*(b[1]-b[0])
172
 * a[1]*b[1]
173
 */
174
/* dnX may not be positive, but n2/2+dnX has to be */
175
void bn_mul_recursive(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n2,
176
                      int dna, int dnb, BN_ULONG *t)
177
25.8M
{
178
25.8M
    int n = n2 / 2, c1, c2;
179
25.8M
    int tna = n + dna, tnb = n + dnb;
180
25.8M
    unsigned int neg, zero;
181
25.8M
    BN_ULONG ln, lo, *p;
182
183
25.8M
# ifdef BN_MUL_COMBA
184
#  if 0
185
    if (n2 == 4) {
186
        bn_mul_comba4(r, a, b);
187
        return;
188
    }
189
#  endif
190
    /*
191
     * Only call bn_mul_comba 8 if n2 == 8 and the two arrays are complete
192
     * [steve]
193
     */
194
25.8M
    if (n2 == 8 && dna == 0 && dnb == 0) {
195
31.0k
        bn_mul_comba8(r, a, b);
196
31.0k
        return;
197
31.0k
    }
198
25.7M
# endif                         /* BN_MUL_COMBA */
199
    /* Else do normal multiply */
200
25.7M
    if (n2 < BN_MUL_RECURSIVE_SIZE_NORMAL) {
201
20.0k
        bn_mul_normal(r, a, n2 + dna, b, n2 + dnb);
202
20.0k
        if ((dna + dnb) < 0)
203
20.0k
            memset(&r[2 * n2 + dna + dnb], 0,
204
20.0k
                   sizeof(BN_ULONG) * -(dna + dnb));
205
20.0k
        return;
206
20.0k
    }
207
    /* r=(a[0]-a[1])*(b[1]-b[0]) */
208
25.7M
    c1 = bn_cmp_part_words(a, &(a[n]), tna, n - tna);
209
25.7M
    c2 = bn_cmp_part_words(&(b[n]), b, tnb, tnb - n);
210
25.7M
    zero = neg = 0;
211
25.7M
    switch (c1 * 3 + c2) {
212
4.86M
    case -4:
213
4.86M
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
214
4.86M
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
215
4.86M
        break;
216
444k
    case -3:
217
444k
        zero = 1;
218
444k
        break;
219
5.34M
    case -2:
220
5.34M
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
221
5.34M
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n); /* + */
222
5.34M
        neg = 1;
223
5.34M
        break;
224
69.6k
    case -1:
225
687k
    case 0:
226
753k
    case 1:
227
753k
        zero = 1;
228
753k
        break;
229
8.73M
    case 2:
230
8.73M
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna); /* + */
231
8.73M
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
232
8.73M
        neg = 1;
233
8.73M
        break;
234
481k
    case 3:
235
481k
        zero = 1;
236
481k
        break;
237
5.13M
    case 4:
238
5.13M
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna);
239
5.13M
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n);
240
5.13M
        break;
241
25.7M
    }
242
243
25.7M
# ifdef BN_MUL_COMBA
244
25.7M
    if (n == 4 && dna == 0 && dnb == 0) { /* XXX: bn_mul_comba4 could take
245
                                           * extra args to do this well */
246
0
        if (!zero)
247
0
            bn_mul_comba4(&(t[n2]), t, &(t[n]));
248
0
        else
249
0
            memset(&t[n2], 0, sizeof(*t) * 8);
250
251
0
        bn_mul_comba4(r, a, b);
252
0
        bn_mul_comba4(&(r[n2]), &(a[n]), &(b[n]));
253
25.7M
    } else if (n == 8 && dna == 0 && dnb == 0) { /* XXX: bn_mul_comba8 could
254
                                                  * take extra args to do
255
                                                  * this well */
256
17.2M
        if (!zero)
257
16.0M
            bn_mul_comba8(&(t[n2]), t, &(t[n]));
258
1.20M
        else
259
1.20M
            memset(&t[n2], 0, sizeof(*t) * 16);
260
261
17.2M
        bn_mul_comba8(r, a, b);
262
17.2M
        bn_mul_comba8(&(r[n2]), &(a[n]), &(b[n]));
263
17.2M
    } else
264
8.49M
# endif                         /* BN_MUL_COMBA */
265
8.49M
    {
266
8.49M
        p = &(t[n2 * 2]);
267
8.49M
        if (!zero)
268
8.02M
            bn_mul_recursive(&(t[n2]), t, &(t[n]), n, 0, 0, p);
269
469k
        else
270
469k
            memset(&t[n2], 0, sizeof(*t) * n2);
271
8.49M
        bn_mul_recursive(r, a, b, n, 0, 0, p);
272
8.49M
        bn_mul_recursive(&(r[n2]), &(a[n]), &(b[n]), n, dna, dnb, p);
273
8.49M
    }
274
275
    /*-
276
     * t[32] holds (a[0]-a[1])*(b[1]-b[0]), c1 is the sign
277
     * r[10] holds (a[0]*b[0])
278
     * r[32] holds (b[1]*b[1])
279
     */
280
281
25.7M
    c1 = (int)(bn_add_words(t, r, &(r[n2]), n2));
282
283
25.7M
    if (neg) {                  /* if t[32] is negative */
284
14.0M
        c1 -= (int)(bn_sub_words(&(t[n2]), t, &(t[n2]), n2));
285
14.0M
    } else {
286
        /* Might have a carry */
287
11.6M
        c1 += (int)(bn_add_words(&(t[n2]), &(t[n2]), t, n2));
288
11.6M
    }
289
290
    /*-
291
     * t[32] holds (a[0]-a[1])*(b[1]-b[0])+(a[0]*b[0])+(a[1]*b[1])
292
     * r[10] holds (a[0]*b[0])
293
     * r[32] holds (b[1]*b[1])
294
     * c1 holds the carry bits
295
     */
296
25.7M
    c1 += (int)(bn_add_words(&(r[n]), &(r[n]), &(t[n2]), n2));
297
25.7M
    if (c1) {
298
9.95M
        p = &(r[n + n2]);
299
9.95M
        lo = *p;
300
9.95M
        ln = (lo + c1) & BN_MASK2;
301
9.95M
        *p = ln;
302
303
        /*
304
         * The overflow will stop before we over write words we should not
305
         * overwrite
306
         */
307
9.95M
        if (ln < (BN_ULONG)c1) {
308
325k
            do {
309
325k
                p++;
310
325k
                lo = *p;
311
325k
                ln = (lo + 1) & BN_MASK2;
312
325k
                *p = ln;
313
325k
            } while (ln == 0);
314
62.6k
        }
315
9.95M
    }
316
25.7M
}
317
318
/*
319
 * n+tn is the word length t needs to be n*4 is size, as does r
320
 */
321
/* tnX may not be negative but less than n */
322
void bn_mul_part_recursive(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n,
323
                           int tna, int tnb, BN_ULONG *t)
324
399k
{
325
399k
    int i, j, n2 = n * 2;
326
399k
    int c1, c2, neg;
327
399k
    BN_ULONG ln, lo, *p;
328
329
399k
    if (n < 8) {
330
0
        bn_mul_normal(r, a, n + tna, b, n + tnb);
331
0
        return;
332
0
    }
333
334
    /* r=(a[0]-a[1])*(b[1]-b[0]) */
335
399k
    c1 = bn_cmp_part_words(a, &(a[n]), tna, n - tna);
336
399k
    c2 = bn_cmp_part_words(&(b[n]), b, tnb, tnb - n);
337
399k
    neg = 0;
338
399k
    switch (c1 * 3 + c2) {
339
41.2k
    case -4:
340
41.2k
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
341
41.2k
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
342
41.2k
        break;
343
2.25k
    case -3:
344
11.3k
    case -2:
345
11.3k
        bn_sub_part_words(t, &(a[n]), a, tna, tna - n); /* - */
346
11.3k
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n); /* + */
347
11.3k
        neg = 1;
348
11.3k
        break;
349
5.48k
    case -1:
350
7.05k
    case 0:
351
8.74k
    case 1:
352
331k
    case 2:
353
331k
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna); /* + */
354
331k
        bn_sub_part_words(&(t[n]), b, &(b[n]), tnb, n - tnb); /* - */
355
331k
        neg = 1;
356
331k
        break;
357
4.37k
    case 3:
358
15.6k
    case 4:
359
15.6k
        bn_sub_part_words(t, a, &(a[n]), tna, n - tna);
360
15.6k
        bn_sub_part_words(&(t[n]), &(b[n]), b, tnb, tnb - n);
361
15.6k
        break;
362
399k
    }
363
    /*
364
     * The zero case isn't yet implemented here. The speedup would probably
365
     * be negligible.
366
     */
367
# if 0
368
    if (n == 4) {
369
        bn_mul_comba4(&(t[n2]), t, &(t[n]));
370
        bn_mul_comba4(r, a, b);
371
        bn_mul_normal(&(r[n2]), &(a[n]), tn, &(b[n]), tn);
372
        memset(&r[n2 + tn * 2], 0, sizeof(*r) * (n2 - tn * 2));
373
    } else
374
# endif
375
399k
    if (n == 8) {
376
63.1k
        bn_mul_comba8(&(t[n2]), t, &(t[n]));
377
63.1k
        bn_mul_comba8(r, a, b);
378
63.1k
        bn_mul_normal(&(r[n2]), &(a[n]), tna, &(b[n]), tnb);
379
63.1k
        memset(&r[n2 + tna + tnb], 0, sizeof(*r) * (n2 - tna - tnb));
380
336k
    } else {
381
336k
        p = &(t[n2 * 2]);
382
336k
        bn_mul_recursive(&(t[n2]), t, &(t[n]), n, 0, 0, p);
383
336k
        bn_mul_recursive(r, a, b, n, 0, 0, p);
384
336k
        i = n / 2;
385
        /*
386
         * If there is only a bottom half to the number, just do it
387
         */
388
336k
        if (tna > tnb)
389
39.5k
            j = tna - i;
390
296k
        else
391
296k
            j = tnb - i;
392
336k
        if (j == 0) {
393
11.0k
            bn_mul_recursive(&(r[n2]), &(a[n]), &(b[n]),
394
11.0k
                             i, tna - i, tnb - i, p);
395
11.0k
            memset(&r[n2 + i * 2], 0, sizeof(*r) * (n2 - i * 2));
396
325k
        } else if (j > 0) {     /* eg, n == 16, i == 8 and tn == 11 */
397
83.8k
            bn_mul_part_recursive(&(r[n2]), &(a[n]), &(b[n]),
398
83.8k
                                  i, tna - i, tnb - i, p);
399
83.8k
            memset(&(r[n2 + tna + tnb]), 0,
400
83.8k
                   sizeof(BN_ULONG) * (n2 - tna - tnb));
401
241k
        } else {                /* (j < 0) eg, n == 16, i == 8 and tn == 5 */
402
403
241k
            memset(&r[n2], 0, sizeof(*r) * n2);
404
241k
            if (tna < BN_MUL_RECURSIVE_SIZE_NORMAL
405
241k
                && tnb < BN_MUL_RECURSIVE_SIZE_NORMAL) {
406
186k
                bn_mul_normal(&(r[n2]), &(a[n]), tna, &(b[n]), tnb);
407
186k
            } else {
408
70.7k
                for (;;) {
409
70.7k
                    i /= 2;
410
                    /*
411
                     * these simplified conditions work exclusively because
412
                     * difference between tna and tnb is 1 or 0
413
                     */
414
70.7k
                    if (i < tna || i < tnb) {
415
43.4k
                        bn_mul_part_recursive(&(r[n2]),
416
43.4k
                                              &(a[n]), &(b[n]),
417
43.4k
                                              i, tna - i, tnb - i, p);
418
43.4k
                        break;
419
43.4k
                    } else if (i == tna || i == tnb) {
420
11.2k
                        bn_mul_recursive(&(r[n2]),
421
11.2k
                                         &(a[n]), &(b[n]),
422
11.2k
                                         i, tna - i, tnb - i, p);
423
11.2k
                        break;
424
11.2k
                    }
425
70.7k
                }
426
54.6k
            }
427
241k
        }
428
336k
    }
429
430
    /*-
431
     * t[32] holds (a[0]-a[1])*(b[1]-b[0]), c1 is the sign
432
     * r[10] holds (a[0]*b[0])
433
     * r[32] holds (b[1]*b[1])
434
     */
435
436
399k
    c1 = (int)(bn_add_words(t, r, &(r[n2]), n2));
437
438
399k
    if (neg) {                  /* if t[32] is negative */
439
342k
        c1 -= (int)(bn_sub_words(&(t[n2]), t, &(t[n2]), n2));
440
342k
    } else {
441
        /* Might have a carry */
442
56.8k
        c1 += (int)(bn_add_words(&(t[n2]), &(t[n2]), t, n2));
443
56.8k
    }
444
445
    /*-
446
     * t[32] holds (a[0]-a[1])*(b[1]-b[0])+(a[0]*b[0])+(a[1]*b[1])
447
     * r[10] holds (a[0]*b[0])
448
     * r[32] holds (b[1]*b[1])
449
     * c1 holds the carry bits
450
     */
451
399k
    c1 += (int)(bn_add_words(&(r[n]), &(r[n]), &(t[n2]), n2));
452
399k
    if (c1) {
453
9.29k
        p = &(r[n + n2]);
454
9.29k
        lo = *p;
455
9.29k
        ln = (lo + c1) & BN_MASK2;
456
9.29k
        *p = ln;
457
458
        /*
459
         * The overflow will stop before we over write words we should not
460
         * overwrite
461
         */
462
9.29k
        if (ln < (BN_ULONG)c1) {
463
21.5k
            do {
464
21.5k
                p++;
465
21.5k
                lo = *p;
466
21.5k
                ln = (lo + 1) & BN_MASK2;
467
21.5k
                *p = ln;
468
21.5k
            } while (ln == 0);
469
3.88k
        }
470
9.29k
    }
471
399k
}
472
473
/*-
474
 * a and b must be the same size, which is n2.
475
 * r needs to be n2 words and t needs to be n2*2
476
 */
477
void bn_mul_low_recursive(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n2,
478
                          BN_ULONG *t)
479
0
{
480
0
    int n = n2 / 2;
481
482
0
    bn_mul_recursive(r, a, b, n, 0, 0, &(t[0]));
483
0
    if (n >= BN_MUL_LOW_RECURSIVE_SIZE_NORMAL) {
484
0
        bn_mul_low_recursive(&(t[0]), &(a[0]), &(b[n]), n, &(t[n2]));
485
0
        bn_add_words(&(r[n]), &(r[n]), &(t[0]), n);
486
0
        bn_mul_low_recursive(&(t[0]), &(a[n]), &(b[0]), n, &(t[n2]));
487
0
        bn_add_words(&(r[n]), &(r[n]), &(t[0]), n);
488
0
    } else {
489
0
        bn_mul_low_normal(&(t[0]), &(a[0]), &(b[n]), n);
490
0
        bn_mul_low_normal(&(t[n]), &(a[n]), &(b[0]), n);
491
0
        bn_add_words(&(r[n]), &(r[n]), &(t[0]), n);
492
0
        bn_add_words(&(r[n]), &(r[n]), &(t[n]), n);
493
0
    }
494
0
}
495
#endif                          /* BN_RECURSION */
496
497
int BN_mul(BIGNUM *r, const BIGNUM *a, const BIGNUM *b, BN_CTX *ctx)
498
14.7M
{
499
14.7M
    int ret = bn_mul_fixed_top(r, a, b, ctx);
500
501
14.7M
    bn_correct_top(r);
502
14.7M
    bn_check_top(r);
503
504
14.7M
    return ret;
505
14.7M
}
506
507
int bn_mul_fixed_top(BIGNUM *r, const BIGNUM *a, const BIGNUM *b, BN_CTX *ctx)
508
17.3M
{
509
17.3M
    int ret = 0;
510
17.3M
    int top, al, bl;
511
17.3M
    BIGNUM *rr;
512
17.3M
#if defined(BN_MUL_COMBA) || defined(BN_RECURSION)
513
17.3M
    int i;
514
17.3M
#endif
515
17.3M
#ifdef BN_RECURSION
516
17.3M
    BIGNUM *t = NULL;
517
17.3M
    int j = 0, k;
518
17.3M
#endif
519
520
17.3M
    bn_check_top(a);
521
17.3M
    bn_check_top(b);
522
17.3M
    bn_check_top(r);
523
524
17.3M
    al = a->top;
525
17.3M
    bl = b->top;
526
527
17.3M
    if ((al == 0) || (bl == 0)) {
528
748k
        BN_zero(r);
529
748k
        return 1;
530
748k
    }
531
16.5M
    top = al + bl;
532
533
16.5M
    BN_CTX_start(ctx);
534
16.5M
    if ((r == a) || (r == b)) {
535
94.9k
        if ((rr = BN_CTX_get(ctx)) == NULL)
536
0
            goto err;
537
94.9k
    } else
538
16.4M
        rr = r;
539
540
16.5M
#if defined(BN_MUL_COMBA) || defined(BN_RECURSION)
541
16.5M
    i = al - bl;
542
16.5M
#endif
543
16.5M
#ifdef BN_MUL_COMBA
544
16.5M
    if (i == 0) {
545
# if 0
546
        if (al == 4) {
547
            if (bn_wexpand(rr, 8) == NULL)
548
                goto err;
549
            rr->top = 8;
550
            bn_mul_comba4(rr->d, a->d, b->d);
551
            goto end;
552
        }
553
# endif
554
4.96M
        if (al == 8) {
555
7.52k
            if (bn_wexpand(rr, 16) == NULL)
556
0
                goto err;
557
7.52k
            rr->top = 16;
558
7.52k
            bn_mul_comba8(rr->d, a->d, b->d);
559
7.52k
            goto end;
560
7.52k
        }
561
4.96M
    }
562
16.5M
#endif                          /* BN_MUL_COMBA */
563
16.5M
#ifdef BN_RECURSION
564
16.5M
    if ((al >= BN_MULL_SIZE_NORMAL) && (bl >= BN_MULL_SIZE_NORMAL)) {
565
420k
        if (i >= -1 && i <= 1) {
566
            /*
567
             * Find out the power of two lower or equal to the longest of the
568
             * two numbers
569
             */
570
379k
            if (i >= 0) {
571
313k
                j = BN_num_bits_word((BN_ULONG)al);
572
313k
            }
573
379k
            if (i == -1) {
574
66.2k
                j = BN_num_bits_word((BN_ULONG)bl);
575
66.2k
            }
576
379k
            j = 1 << (j - 1);
577
379k
            assert(j <= al || j <= bl);
578
379k
            k = j + j;
579
379k
            t = BN_CTX_get(ctx);
580
379k
            if (t == NULL)
581
0
                goto err;
582
379k
            if (al > j || bl > j) {
583
272k
                if (bn_wexpand(t, k * 4) == NULL)
584
0
                    goto err;
585
272k
                if (bn_wexpand(rr, k * 4) == NULL)
586
0
                    goto err;
587
272k
                bn_mul_part_recursive(rr->d, a->d, b->d,
588
272k
                                      j, al - j, bl - j, t->d);
589
272k
            } else {            /* al <= j || bl <= j */
590
591
107k
                if (bn_wexpand(t, k * 2) == NULL)
592
0
                    goto err;
593
107k
                if (bn_wexpand(rr, k * 2) == NULL)
594
0
                    goto err;
595
107k
                bn_mul_recursive(rr->d, a->d, b->d, j, al - j, bl - j, t->d);
596
107k
            }
597
379k
            rr->top = top;
598
379k
            goto end;
599
379k
        }
600
420k
    }
601
16.1M
#endif                          /* BN_RECURSION */
602
16.1M
    if (bn_wexpand(rr, top) == NULL)
603
0
        goto err;
604
16.1M
    rr->top = top;
605
16.1M
    bn_mul_normal(rr->d, a->d, al, b->d, bl);
606
607
16.1M
#if defined(BN_MUL_COMBA) || defined(BN_RECURSION)
608
16.5M
 end:
609
16.5M
#endif
610
16.5M
    rr->neg = a->neg ^ b->neg;
611
16.5M
    rr->flags |= BN_FLG_FIXED_TOP;
612
16.5M
    if (r != rr && BN_copy(r, rr) == NULL)
613
0
        goto err;
614
615
16.5M
    ret = 1;
616
16.5M
 err:
617
16.5M
    bn_check_top(r);
618
16.5M
    BN_CTX_end(ctx);
619
16.5M
    return ret;
620
16.5M
}
621
622
void bn_mul_normal(BN_ULONG *r, BN_ULONG *a, int na, BN_ULONG *b, int nb)
623
16.4M
{
624
16.4M
    BN_ULONG *rr;
625
626
16.4M
    if (na < nb) {
627
11.0M
        int itmp;
628
11.0M
        BN_ULONG *ltmp;
629
630
11.0M
        itmp = na;
631
11.0M
        na = nb;
632
11.0M
        nb = itmp;
633
11.0M
        ltmp = a;
634
11.0M
        a = b;
635
11.0M
        b = ltmp;
636
637
11.0M
    }
638
16.4M
    rr = &(r[na]);
639
16.4M
    if (nb <= 0) {
640
64.0k
        (void)bn_mul_words(r, a, na, 0);
641
64.0k
        return;
642
64.0k
    } else
643
16.4M
        rr[0] = bn_mul_words(r, a, na, b[0]);
644
645
17.2M
    for (;;) {
646
17.2M
        if (--nb <= 0)
647
13.1M
            return;
648
4.05M
        rr[1] = bn_mul_add_words(&(r[1]), a, na, b[1]);
649
4.05M
        if (--nb <= 0)
650
313k
            return;
651
3.73M
        rr[2] = bn_mul_add_words(&(r[2]), a, na, b[2]);
652
3.73M
        if (--nb <= 0)
653
147k
            return;
654
3.59M
        rr[3] = bn_mul_add_words(&(r[3]), a, na, b[3]);
655
3.59M
        if (--nb <= 0)
656
2.75M
            return;
657
830k
        rr[4] = bn_mul_add_words(&(r[4]), a, na, b[4]);
658
830k
        rr += 4;
659
830k
        r += 4;
660
830k
        b += 4;
661
830k
    }
662
16.4M
}
663
664
void bn_mul_low_normal(BN_ULONG *r, BN_ULONG *a, BN_ULONG *b, int n)
665
0
{
666
0
    bn_mul_words(r, a, n, b[0]);
667
668
0
    for (;;) {
669
0
        if (--n <= 0)
670
0
            return;
671
0
        bn_mul_add_words(&(r[1]), a, n, b[1]);
672
0
        if (--n <= 0)
673
0
            return;
674
0
        bn_mul_add_words(&(r[2]), a, n, b[2]);
675
0
        if (--n <= 0)
676
0
            return;
677
0
        bn_mul_add_words(&(r[3]), a, n, b[3]);
678
0
        if (--n <= 0)
679
0
            return;
680
0
        bn_mul_add_words(&(r[4]), a, n, b[4]);
681
0
        r += 4;
682
0
        b += 4;
683
0
    }
684
0
}