/src/libssh2/src/chacha.c
Line | Count | Source |
1 | | /* |
2 | | * chacha-merged.c version 20080118 |
3 | | * D. J. Bernstein |
4 | | * Public domain. |
5 | | * Copyright not intended 2024. |
6 | | * |
7 | | * SPDX-License-Identifier: SAX-PD-2.0 |
8 | | */ |
9 | | |
10 | | #include "libssh2_priv.h" |
11 | | |
12 | | #include "chacha.h" |
13 | | |
14 | | /* $OpenBSD: chacha.c,v 1.1 2013/11/21 00:45:44 djm Exp $ */ |
15 | | |
/* Short names for the byte and word types used by the cipher code below.
 * u32 is plain unsigned int; U32V() masks to 32 bits wherever a result has
 * to be truncated. */
16 | | typedef unsigned char u8; |
17 | | typedef unsigned int u32; |
18 | | |
/* Short name for struct chacha_ctx. The struct is not defined in this file
 * (NOTE(review): presumably declared in chacha.h -- confirm). */
19 | | typedef struct chacha_ctx chacha_ctx; |
20 | | |
/* Turn an integer literal into an unsigned one by pasting a U suffix. */
21 | 0 | #define U8C(v) (v##U) |
22 | 0 | #define U32C(v) (v##U) |
23 | | |
/* Convert to u8 / u32 and keep only the low 8 / 32 bits. */
24 | 0 | #define U8V(v) ((u8)(v) & U8C(0xFF)) |
25 | 0 | #define U32V(v) ((u32)(v) & U32C(0xFFFFFFFF)) |
26 | | |
/* Rotate v left by n bits within 32 bits. The right shift is by 32 - n, so
 * n is expected to be in 1..31. Only the left-shifted half is masked, so v
 * should already be a value that fits in 32 bits. */
27 | | #define ROTL32(v, n) \ |
28 | 0 | (U32V((v) << (n)) | ((v) >> (32 - (n)))) |
29 | | |
/* Read the four bytes p[0..3] as one 32-bit word, p[0] being the least
 * significant byte. */
30 | | #define U8TO32_LITTLE(p) \ |
31 | 0 | (((u32)((p)[0]) ) | \ |
32 | 0 | ((u32)((p)[1]) << 8) | \ |
33 | 0 | ((u32)((p)[2]) << 16) | \ |
34 | 0 | ((u32)((p)[3]) << 24)) |
35 | | |
/* Store the low 32 bits of v into p[0..3], least significant byte first.
 * Wrapped in do/while(0) so that it behaves as a single statement. */
36 | | #define U32TO8_LITTLE(p, v) \ |
37 | 0 | do { \ |
38 | 0 | (p)[0] = U8V((v) ); \ |
39 | 0 | (p)[1] = U8V((v) >> 8); \ |
40 | 0 | (p)[2] = U8V((v) >> 16); \ |
41 | 0 | (p)[3] = U8V((v) >> 24); \ |
42 | 0 | } while (0) |
43 | | |
/* Word operations used by QUARTERROUND: rotate left, xor, addition
 * truncated to 32 bits, and increment by one. */
44 | 0 | #define ROTATE(v,c) (ROTL32(v,c)) |
45 | 0 | #define XOR(v,w) ((v) ^ (w)) |
46 | 0 | #define PLUS(v,w) (U32V((v) + (w))) |
47 | 0 | #define PLUSONE(v) (PLUS((v),1)) |
48 | | |
/* One quarter-round: four add / xor / rotate-left steps (rotations of 16,
 * 12, 8 and 7 bits) that update a, b, c and d in place. The arguments must
 * be lvalues and each is evaluated several times. The expansion is a bare
 * statement list that already ends in ';', so it is invoked without a
 * trailing semicolon and must not be used as the unbraced body of an
 * if/for/while. */
49 | | #define QUARTERROUND(a,b,c,d) \ |
50 | 0 | a = PLUS(a,b); d = ROTATE(XOR(d,a),16); \ |
51 | 0 | c = PLUS(c,d); b = ROTATE(XOR(b,c),12); \ |
52 | 0 | a = PLUS(a,b); d = ROTATE(XOR(d,a), 8); \ |
53 | 0 | c = PLUS(c,d); b = ROTATE(XOR(b,c), 7); |
54 | | |
/* 16-character constants; the 17th array byte holds the string terminator.
 * chacha_keysetup() loads sigma for 256-bit keys and tau otherwise. */
55 | | static const char sigma[17] = "expand 32-byte k"; |
56 | | static const char tau[17] = "expand 16-byte k"; |
57 | | |
58 | | void |
59 | | chacha_keysetup(chacha_ctx *x, const u8 *k, u32 kbits) |
60 | 0 | { |
61 | 0 | const char *constants; |
62 | |
|
63 | 0 | x->input[4] = U8TO32_LITTLE(k + 0); |
64 | 0 | x->input[5] = U8TO32_LITTLE(k + 4); |
65 | 0 | x->input[6] = U8TO32_LITTLE(k + 8); |
66 | 0 | x->input[7] = U8TO32_LITTLE(k + 12); |
67 | 0 | if(kbits == 256) { /* recommended */ |
68 | 0 | k += 16; |
69 | 0 | constants = sigma; |
70 | 0 | } |
71 | 0 | else { /* kbits == 128 */ |
72 | 0 | constants = tau; |
73 | 0 | } |
74 | 0 | x->input[8] = U8TO32_LITTLE(k + 0); |
75 | 0 | x->input[9] = U8TO32_LITTLE(k + 4); |
76 | 0 | x->input[10] = U8TO32_LITTLE(k + 8); |
77 | 0 | x->input[11] = U8TO32_LITTLE(k + 12); |
78 | 0 | x->input[0] = U8TO32_LITTLE(constants + 0); |
79 | 0 | x->input[1] = U8TO32_LITTLE(constants + 4); |
80 | 0 | x->input[2] = U8TO32_LITTLE(constants + 8); |
81 | 0 | x->input[3] = U8TO32_LITTLE(constants + 12); |
82 | 0 | } |
83 | | |
84 | | void |
85 | | chacha_ivsetup(chacha_ctx *x, const u8 *iv, const u8 *counter) |
86 | 0 | { |
87 | 0 | x->input[12] = counter == NULL ? 0 : U8TO32_LITTLE(counter + 0); |
88 | 0 | x->input[13] = counter == NULL ? 0 : U8TO32_LITTLE(counter + 4); |
89 | 0 | x->input[14] = U8TO32_LITTLE(iv + 0); |
90 | 0 | x->input[15] = U8TO32_LITTLE(iv + 4); |
91 | 0 | } |
92 | | |
93 | | void |
94 | | chacha_encrypt_bytes(chacha_ctx *x, const u8 *m, u8 *c, u32 bytes) |
95 | 0 | { |
96 | 0 | u32 x0, x1, x2, x3, x4, x5, x6, x7, x8, x9, x10, x11, x12, x13, x14, x15; |
97 | 0 | u32 j0, j1, j2, j3, j4, j5, j6, j7, j8, j9, j10, j11, j12, j13, j14, j15; |
98 | 0 | u8 *ctarget = NULL; |
99 | 0 | u8 tmp[64]; |
100 | 0 | u_int i; |
101 | |
|
102 | 0 | if(!bytes) |
103 | 0 | return; |
104 | | |
105 | 0 | j0 = x->input[0]; |
106 | 0 | j1 = x->input[1]; |
107 | 0 | j2 = x->input[2]; |
108 | 0 | j3 = x->input[3]; |
109 | 0 | j4 = x->input[4]; |
110 | 0 | j5 = x->input[5]; |
111 | 0 | j6 = x->input[6]; |
112 | 0 | j7 = x->input[7]; |
113 | 0 | j8 = x->input[8]; |
114 | 0 | j9 = x->input[9]; |
115 | 0 | j10 = x->input[10]; |
116 | 0 | j11 = x->input[11]; |
117 | 0 | j12 = x->input[12]; |
118 | 0 | j13 = x->input[13]; |
119 | 0 | j14 = x->input[14]; |
120 | 0 | j15 = x->input[15]; |
121 | |
|
122 | 0 | for(;;) { |
123 | 0 | if(bytes < 64) { |
124 | 0 | for(i = 0; i < bytes;++i) tmp[i] = m[i]; |
125 | 0 | m = tmp; |
126 | 0 | ctarget = c; |
127 | 0 | c = tmp; |
128 | 0 | } |
129 | 0 | x0 = j0; |
130 | 0 | x1 = j1; |
131 | 0 | x2 = j2; |
132 | 0 | x3 = j3; |
133 | 0 | x4 = j4; |
134 | 0 | x5 = j5; |
135 | 0 | x6 = j6; |
136 | 0 | x7 = j7; |
137 | 0 | x8 = j8; |
138 | 0 | x9 = j9; |
139 | 0 | x10 = j10; |
140 | 0 | x11 = j11; |
141 | 0 | x12 = j12; |
142 | 0 | x13 = j13; |
143 | 0 | x14 = j14; |
144 | 0 | x15 = j15; |
145 | 0 | for(i = 20; i > 0; i -= 2) { |
146 | 0 | QUARTERROUND(x0, x4, x8, x12) |
147 | 0 | QUARTERROUND(x1, x5, x9, x13) |
148 | 0 | QUARTERROUND(x2, x6, x10, x14) |
149 | 0 | QUARTERROUND(x3, x7, x11, x15) |
150 | 0 | QUARTERROUND(x0, x5, x10, x15) |
151 | 0 | QUARTERROUND(x1, x6, x11, x12) |
152 | 0 | QUARTERROUND(x2, x7, x8, x13) |
153 | 0 | QUARTERROUND(x3, x4, x9, x14) |
154 | 0 | } |
155 | 0 | x0 = PLUS(x0, j0); |
156 | 0 | x1 = PLUS(x1, j1); |
157 | 0 | x2 = PLUS(x2, j2); |
158 | 0 | x3 = PLUS(x3, j3); |
159 | 0 | x4 = PLUS(x4, j4); |
160 | 0 | x5 = PLUS(x5, j5); |
161 | 0 | x6 = PLUS(x6, j6); |
162 | 0 | x7 = PLUS(x7, j7); |
163 | 0 | x8 = PLUS(x8, j8); |
164 | 0 | x9 = PLUS(x9, j9); |
165 | 0 | x10 = PLUS(x10, j10); |
166 | 0 | x11 = PLUS(x11, j11); |
167 | 0 | x12 = PLUS(x12, j12); |
168 | 0 | x13 = PLUS(x13, j13); |
169 | 0 | x14 = PLUS(x14, j14); |
170 | 0 | x15 = PLUS(x15, j15); |
171 | |
|
172 | 0 | x0 = XOR(x0, U8TO32_LITTLE(m + 0)); |
173 | 0 | x1 = XOR(x1, U8TO32_LITTLE(m + 4)); |
174 | 0 | x2 = XOR(x2, U8TO32_LITTLE(m + 8)); |
175 | 0 | x3 = XOR(x3, U8TO32_LITTLE(m + 12)); |
176 | 0 | x4 = XOR(x4, U8TO32_LITTLE(m + 16)); |
177 | 0 | x5 = XOR(x5, U8TO32_LITTLE(m + 20)); |
178 | 0 | x6 = XOR(x6, U8TO32_LITTLE(m + 24)); |
179 | 0 | x7 = XOR(x7, U8TO32_LITTLE(m + 28)); |
180 | 0 | x8 = XOR(x8, U8TO32_LITTLE(m + 32)); |
181 | 0 | x9 = XOR(x9, U8TO32_LITTLE(m + 36)); |
182 | 0 | x10 = XOR(x10, U8TO32_LITTLE(m + 40)); |
183 | 0 | x11 = XOR(x11, U8TO32_LITTLE(m + 44)); |
184 | 0 | x12 = XOR(x12, U8TO32_LITTLE(m + 48)); |
185 | 0 | x13 = XOR(x13, U8TO32_LITTLE(m + 52)); |
186 | 0 | x14 = XOR(x14, U8TO32_LITTLE(m + 56)); |
187 | 0 | x15 = XOR(x15, U8TO32_LITTLE(m + 60)); |
188 | |
|
189 | 0 | j12 = PLUSONE(j12); |
190 | 0 | if(!j12) { |
191 | 0 | j13 = PLUSONE(j13); |
192 | | /* stopping at 2^70 bytes per nonce is user's responsibility */ |
193 | 0 | } |
194 | |
|
195 | 0 | U32TO8_LITTLE(c + 0, x0); |
196 | 0 | U32TO8_LITTLE(c + 4, x1); |
197 | 0 | U32TO8_LITTLE(c + 8, x2); |
198 | 0 | U32TO8_LITTLE(c + 12, x3); |
199 | 0 | U32TO8_LITTLE(c + 16, x4); |
200 | 0 | U32TO8_LITTLE(c + 20, x5); |
201 | 0 | U32TO8_LITTLE(c + 24, x6); |
202 | 0 | U32TO8_LITTLE(c + 28, x7); |
203 | 0 | U32TO8_LITTLE(c + 32, x8); |
204 | 0 | U32TO8_LITTLE(c + 36, x9); |
205 | 0 | U32TO8_LITTLE(c + 40, x10); |
206 | 0 | U32TO8_LITTLE(c + 44, x11); |
207 | 0 | U32TO8_LITTLE(c + 48, x12); |
208 | 0 | U32TO8_LITTLE(c + 52, x13); |
209 | 0 | U32TO8_LITTLE(c + 56, x14); |
210 | 0 | U32TO8_LITTLE(c + 60, x15); |
211 | |
|
212 | 0 | if(bytes <= 64) { |
213 | 0 | if(bytes < 64) { |
214 | 0 | for(i = 0; i < bytes;++i) ctarget[i] = c[i]; |
215 | 0 | } |
216 | 0 | x->input[12] = j12; |
217 | 0 | x->input[13] = j13; |
218 | 0 | return; |
219 | 0 | } |
220 | 0 | bytes -= 64; |
221 | 0 | c += 64; |
222 | 0 | m += 64; |
223 | 0 | } |
224 | 0 | } |