Coverage Report

Created: 2024-11-25 06:29

/src/nettle/ecc-mul-a.c
Line
Count
Source (jump to first uncovered line)
1
/* ecc-mul-a.c
2
3
   Copyright (C) 2013 Niels Möller
4
5
   This file is part of GNU Nettle.
6
7
   GNU Nettle is free software: you can redistribute it and/or
8
   modify it under the terms of either:
9
10
     * the GNU Lesser General Public License as published by the Free
11
       Software Foundation; either version 3 of the License, or (at your
12
       option) any later version.
13
14
   or
15
16
     * the GNU General Public License as published by the Free
17
       Software Foundation; either version 2 of the License, or (at your
18
       option) any later version.
19
20
   or both in parallel, as here.
21
22
   GNU Nettle is distributed in the hope that it will be useful,
23
   but WITHOUT ANY WARRANTY; without even the implied warranty of
24
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
25
   General Public License for more details.
26
27
   You should have received copies of the GNU General Public License and
28
   the GNU Lesser General Public License along with this program.  If
29
   not, see http://www.gnu.org/licenses/.
30
*/
31
32
/* Development of Nettle's ECC support was funded by the .SE Internet Fund. */
33
34
#if HAVE_CONFIG_H
35
# include "config.h"
36
#endif
37
38
#include <assert.h>
39
40
#include "ecc.h"
41
#include "ecc-internal.h"
42
#include "nettle-internal.h"
43
44
/* Binary algorithm needs 6*ecc->p.size + scratch for ecc_add_jja.
45
   Current total is 12 ecc->p.size, at most 864 bytes.
46
47
   Window algorithm needs (3<<w) * ecc->p.size for the table,
48
   3*ecc->p.size for a temporary point, and scratch for
49
   ecc_add_jjj. */
50
51
#if ECC_MUL_A_WBITS == 0
52
/* Scalar multiplication, bit-at-a-time variant (the one compiled when
   ECC_MUL_A_WBITS == 0).

   Reads the ecc->p.size limbs of the scalar at np and the point at
   p, and leaves a 3*ecc->p.size limb result in r.  Going by the
   helper names (ecc_a_to_j, ecc_add_jja), p is presumably affine and
   r Jacobian -- TODO confirm against ecc-internal.h.

   Scratch layout, in limbs (size = ecc->p.size):
     scratch + 0       tp, candidate value for r after the current bit
     scratch + 3*size  pj, output of ecc_a_to_j for p
     scratch + 6*size  scratch_out, handed on to the point helpers

   Every inner iteration runs one ecc_dup_jj and one ecc_add_jja
   whatever the scalar bit is; the bit only steers the cnd_copy
   calls.

   NOTE(review): tp, pj and scratch_out are not #undef'd at the end
   of this function. */
void
53
ecc_mul_a (const struct ecc_curve *ecc,
54
     mp_limb_t *r,
55
     const mp_limb_t *np, const mp_limb_t *p,
56
     mp_limb_t *scratch)
57
{
58
#define tp scratch
59
#define pj (scratch + 3*ecc->p.size)
60
#define scratch_out (scratch + 6*ecc->p.size)
61
62
  /* Set to 1 by the loop initializer below and cleared by the first
     one-bit of the scalar. */
  int is_zero;
63
64
  unsigned i;
65
66
  /* pj receives the ecc_a_to_j form of p; r starts out as all zero
     limbs. */
  ecc_a_to_j (ecc, pj, p);
67
  mpn_zero (r, 3*ecc->p.size);
68
  
69
  /* Walk the scalar limbs from index ecc->p.size - 1 down to 0. */
  for (i = ecc->p.size, is_zero = 1; i-- > 0; )
70
    {
71
      /* Left-align the limb, so that the next bit to process is
         always the most significant bit of w. */
      mp_limb_t w = np[i] << (GMP_LIMB_BITS - GMP_NUMB_BITS);
72
      unsigned j;
73
74
      /* One iteration per bit, most significant bit first. */
      for (j = 0; j < GMP_NUMB_BITS; j++, w <<= 1)
75
  {
76
    int bit;
77
78
    /* Unconditionally double r, then form tp = r + pj. */
    ecc_dup_jj (ecc, r, r, scratch_out);
79
    ecc_add_jja (ecc, tp, r, pj, scratch_out);
80
81
    /* Current scalar bit: the top bit of w. */
    bit = w >> (GMP_LIMB_BITS - 1);
82
    /* If is_zero is set, r is the zero point,
83
       and ecc_add_jja produced garbage. */
84
    cnd_copy (is_zero, tp, pj, 3*ecc->p.size);
85
    /* Stays 1 only while every bit seen so far was zero. */
    is_zero &= 1 - bit;
86
    /* If we had a one-bit, use the sum. */
87
    cnd_copy (bit, r, tp, 3*ecc->p.size);
88
  }
89
    }
90
}
91
#else /* ECC_MUL_A_WBITS > 1 */
92
93
542k
/* Number of entries in the window table: one per possible value of
   an ECC_MUL_A_WBITS-bit block. */
#define TABLE_SIZE (1U << ECC_MUL_A_WBITS)
94
269k
/* Mask that keeps the low ECC_MUL_A_WBITS bits of a value. */
#define TABLE_MASK (TABLE_SIZE - 1)
95
96
157k
/* Address of table entry j; each entry occupies 3*ecc->p.size limbs.
   Relies on the names `table' and `ecc' being in scope at the point
   of use. */
#define TABLE(j) (table + (j) * 3*ecc->p.size)
97
98
/* Fill `table' with 1 << bits entries of 3*ecc->p.size limbs each,
   derived from the point p.

   Entry 0 is all zero limbs and entry 1 is the ecc_a_to_j form of p.
   Each further even entry j is ecc_dup_jj applied to entry j/2, and
   the following odd entry j+1 is ecc_add_jja of entry j and entry 1.
   Going by the helper names (doubling and addition), entry j then
   represents j times p -- TODO confirm.

   `scratch' is passed through to ecc_dup_jj and ecc_add_jja.

   The loop writes entries in pairs and entries 0 and 1 are always
   written, so bits must be at least 1. */
static void
99
table_init (const struct ecc_curve *ecc,
100
      mp_limb_t *table, unsigned bits,
101
      const mp_limb_t *p,
102
      mp_limb_t *scratch)
103
4.26k
{
104
4.26k
  /* Total number of table entries. */
  unsigned size = 1 << bits;
105
4.26k
  unsigned j;
106
107
4.26k
  /* The two base entries: the all-zero entry and p itself. */
  mpn_zero (TABLE(0), 3*ecc->p.size);
108
4.26k
  ecc_a_to_j (ecc, TABLE(1), p);
109
110
34.1k
  /* Each pass fills one even entry and the odd entry after it.  The
     source entry j/2 always has a smaller index, so it has already
     been written. */
  for (j = 2; j < size; j += 2)
111
29.8k
    {
112
29.8k
      ecc_dup_jj (ecc, TABLE(j), TABLE(j/2), scratch);
113
29.8k
      ecc_add_jja (ecc, TABLE(j+1), TABLE(j), TABLE(1), scratch);
114
29.8k
    }  
115
4.26k
}
116
117
/* Scalar multiplication, windowed variant (the one compiled when
   ECC_MUL_A_WBITS is non-zero).

   The scalar at np is consumed in blocks of ECC_MUL_A_WBITS bits,
   most significant block first.  Each block selects one entry from a
   table of TABLE_SIZE entries that table_init builds from p.  The
   3*ecc->p.size limb result is left in r.

   Scratch layout, in limbs (size = ecc->p.size):
     scratch + 0       tp, the table entry selected for the current
                       block and then the candidate sum
     scratch + 3*size  table, (3*size << ECC_MUL_A_WBITS) limbs
     after the table   scratch_out, handed on to the point helpers

   Table entries are always fetched with mpn_sec_tabselect and
   updates of r go through cnd_copy, so the only branches on scalar
   data are the two assert checks. */
void
118
ecc_mul_a (const struct ecc_curve *ecc,
119
     mp_limb_t *r,
120
     const mp_limb_t *np, const mp_limb_t *p,
121
     mp_limb_t *scratch)
122
4.26k
{
123
1.34M
#define tp scratch
124
282k
#define table (scratch + 3*ecc->p.size)
125
4.26k
  mp_limb_t *scratch_out = table + (3*ecc->p.size << ECC_MUL_A_WBITS);
126
4.26k
  /* This initial value is overwritten once the first block has been
     read, before is_zero is used. */
  int is_zero = 0;
127
128
  /* Avoid the mp_bitcnt_t type for compatibility with older GMP
129
     versions. */
130
4.26k
  /* Number of blocks: ecc->p.bit_size / ECC_MUL_A_WBITS, rounded
     up. */
  unsigned blocks = (ecc->p.bit_size + ECC_MUL_A_WBITS - 1) / ECC_MUL_A_WBITS;
131
4.26k
  /* Bit position at which the most significant block starts. */
  unsigned bit_index = (blocks-1) * ECC_MUL_A_WBITS;
132
133
4.26k
  /* The same position, split into a limb index and a bit offset
     inside that limb. */
  mp_size_t limb_index = bit_index / GMP_NUMB_BITS;
134
4.26k
  unsigned shift = bit_index % GMP_NUMB_BITS;
135
4.26k
  /* w is the scalar limb currently being consumed, bits the value of
     the current block. */
  mp_limb_t w, bits;
136
137
4.26k
  table_init (ecc, table, ECC_MUL_A_WBITS, p, scratch_out);
138
139
4.26k
  /* First block: everything in limb limb_index from bit offset shift
     upwards. */
  w = np[limb_index];
140
4.26k
  bits = w >> shift;
141
4.26k
  /* If that is not the top limb, the block continues into the next
     limb up.  NOTE(review): the shift count below is only in range
     when shift > 0; the hit count recorded for that line in this
     report is 0. */
  if (limb_index < ecc->p.size - 1)
142
0
    bits |= np[limb_index + 1] << (GMP_NUMB_BITS - shift);
143
144
4.26k
  /* The first block is not masked with TABLE_MASK, so check that it
     is a valid table index. */
  assert (bits < TABLE_SIZE);
145
146
4.26k
  /* r = table entry number `bits'. */
  mpn_sec_tabselect (r, table, 3*ecc->p.size, TABLE_SIZE, bits);
147
4.26k
  /* Records whether the first block was zero, in which case r is the
     all-zero table entry (assuming IS_ZERO_SMALL, defined elsewhere,
     yields 1 for a zero argument -- TODO confirm). */
  is_zero = IS_ZERO_SMALL (bits);
148
149
4.26k
  /* One iteration per remaining block; left via the break below. */
  for (;;)
150
273k
    {
151
273k
      int bits_is_zero;
152
273k
      unsigned j;
153
273k
      /* Fetch the next block into bits.  It may carry extra high
         bits, which are masked off after the doublings. */
      if (shift >= ECC_MUL_A_WBITS)
154
256k
  {
155
256k
    /* The whole block lies inside the current limb. */
    shift -= ECC_MUL_A_WBITS;
156
256k
    bits = w >> shift;
157
256k
  }
158
17.0k
      else
159
17.0k
  {
160
17.0k
    /* Fewer than ECC_MUL_A_WBITS bits are left in this limb. */
    if (limb_index == 0)
161
4.26k
      {
162
4.26k
        /* There is no lower limb, so every block has been
           processed. */
        assert (shift == 0);
163
4.26k
        break;
164
4.26k
      }
165
12.8k
    /* The `shift' low bits still unused in w form the high part of
       the block; the low part comes from the top of the next lower
       limb. */
    bits = w << (ECC_MUL_A_WBITS - shift);
166
12.8k
    w = np[--limb_index];
167
12.8k
    shift = shift + GMP_NUMB_BITS - ECC_MUL_A_WBITS;
168
12.8k
    bits |= w >> shift;
169
12.8k
  }
170
1.34M
      /* Apply ecc_dup_jj to r once for every bit of the block. */
      for (j = 0; j < ECC_MUL_A_WBITS; j++)
171
1.07M
  ecc_dup_jj (ecc, r, r, scratch_out);
172
173
269k
      /* Keep only the ECC_MUL_A_WBITS bits that belong to this
         block. */
      bits &= TABLE_MASK;
174
269k
      /* tp = table entry selected by this block. */
      mpn_sec_tabselect (tp, table, 3*ecc->p.size, TABLE_SIZE, bits);
175
269k
      /* While is_zero is still set, the selected entry itself becomes
         the new r. */
      cnd_copy (is_zero, r, tp, 3*ecc->p.size);
176
269k
      /* tp = tp + r, computed unconditionally. */
      ecc_add_jjj (ecc, tp, tp, r, scratch_out);
177
269k
      bits_is_zero = IS_ZERO_SMALL (bits);
178
179
      /* Use the sum when valid. ecc_add_jjj produced garbage if
180
   is_zero or bits_is_zero. */
181
269k
      cnd_copy (1 - (bits_is_zero | is_zero), r, tp, 3*ecc->p.size);
182
269k
      /* Stays set only while every block so far has been zero. */
      is_zero &= bits_is_zero;
183
269k
    }
184
4.26k
#undef table
185
4.26k
#undef tp
186
4.26k
}
187
188
#endif /* ECC_MUL_A_WBITS > 1 */