/src/botan/src/lib/hash/sha2_64/sha2_64_bmi2/sha2_64_bmi2.cpp
Line | Count | Source |
1 | | /* |
2 | | * (C) 2019 Jack Lloyd |
3 | | * |
4 | | * Botan is released under the Simplified BSD License (see license.txt) |
5 | | */ |
6 | | |
7 | | #include <botan/sha2_64.h> |
8 | | #include <botan/loadstor.h> |
9 | | #include <botan/rotate.h> |
10 | | |
11 | | namespace Botan { |
12 | | |
/*
* One SHA-512 compression round fused with one message-schedule update.
*
* A..H  - the eight working variables, passed as lvalues. Only D and H
*         are written: on exit D holds the new 'e' value and H the new
*         'a' value. Callers rotate the argument order by one position
*         per round instead of shuffling the variables themselves.
* M1    - the message word consumed by this round; afterwards it is
*         overwritten in place with the schedule word sixteen rounds
*         ahead: M1 += sigma1(M2) + M3 + sigma0(M4).
* M2,M3,M4 - the message words 14, 9 and 1 positions after M1 (mod 16).
* magic - the round constant added into H.
*
* All inputs are read before M1 is modified, so the macro arguments for
* M2/M3/M4 must not alias M1.
*
* Use a macro as many compilers won't inline a function this big,
* even though it is much faster if inlined.
*
* The definition deliberately does NOT end in a semicolon: the caller
* supplies it, so that an invocation is exactly one statement and stays
* safe inside an unbraced if/else.
*/
#define SHA2_64_F(A, B, C, D, E, F, G, H, M1, M2, M3, M4, magic)            \
   do {                                                                      \
      const uint64_t E_rho = rotr<14>(E) ^ rotr<18>(E) ^ rotr<41>(E);        \
      const uint64_t A_rho = rotr<28>(A) ^ rotr<34>(A) ^ rotr<39>(A);        \
      const uint64_t M2_sigma = rotr<19>(M2) ^ rotr<61>(M2) ^ (M2 >> 6);     \
      const uint64_t M4_sigma = rotr<1>(M4) ^ rotr<8>(M4) ^ (M4 >> 7);       \
      H += magic + E_rho + ((E & F) ^ (~E & G)) + M1;                        \
      D += H;                                                                \
      H += A_rho + ((A & B) | ((A | B) & C));                                \
      M1 += M2_sigma + M3 + M4_sigma;                                        \
   } while(0)
30 | | |
31 | | void SHA_512::compress_digest_bmi2(secure_vector<uint64_t>& digest, |
32 | | const uint8_t input[], size_t blocks) |
33 | 207k | { |
34 | 207k | uint64_t A = digest[0], B = digest[1], C = digest[2], |
35 | 207k | D = digest[3], E = digest[4], F = digest[5], |
36 | 207k | G = digest[6], H = digest[7]; |
37 | 207k | |
38 | 421k | for(size_t i = 0; i != blocks; ++i) |
39 | 213k | { |
40 | 213k | uint64_t W00 = load_be<uint64_t>(input, 0); |
41 | 213k | uint64_t W01 = load_be<uint64_t>(input, 1); |
42 | 213k | uint64_t W02 = load_be<uint64_t>(input, 2); |
43 | 213k | uint64_t W03 = load_be<uint64_t>(input, 3); |
44 | 213k | uint64_t W04 = load_be<uint64_t>(input, 4); |
45 | 213k | uint64_t W05 = load_be<uint64_t>(input, 5); |
46 | 213k | uint64_t W06 = load_be<uint64_t>(input, 6); |
47 | 213k | uint64_t W07 = load_be<uint64_t>(input, 7); |
48 | 213k | uint64_t W08 = load_be<uint64_t>(input, 8); |
49 | 213k | uint64_t W09 = load_be<uint64_t>(input, 9); |
50 | 213k | uint64_t W10 = load_be<uint64_t>(input, 10); |
51 | 213k | uint64_t W11 = load_be<uint64_t>(input, 11); |
52 | 213k | uint64_t W12 = load_be<uint64_t>(input, 12); |
53 | 213k | uint64_t W13 = load_be<uint64_t>(input, 13); |
54 | 213k | uint64_t W14 = load_be<uint64_t>(input, 14); |
55 | 213k | uint64_t W15 = load_be<uint64_t>(input, 15); |
56 | 213k | |
57 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W00, W14, W09, W01, 0x428A2F98D728AE22); |
58 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W01, W15, W10, W02, 0x7137449123EF65CD); |
59 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W02, W00, W11, W03, 0xB5C0FBCFEC4D3B2F); |
60 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W03, W01, W12, W04, 0xE9B5DBA58189DBBC); |
61 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W04, W02, W13, W05, 0x3956C25BF348B538); |
62 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W05, W03, W14, W06, 0x59F111F1B605D019); |
63 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W06, W04, W15, W07, 0x923F82A4AF194F9B); |
64 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W07, W05, W00, W08, 0xAB1C5ED5DA6D8118); |
65 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W08, W06, W01, W09, 0xD807AA98A3030242); |
66 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W09, W07, W02, W10, 0x12835B0145706FBE); |
67 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W10, W08, W03, W11, 0x243185BE4EE4B28C); |
68 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W11, W09, W04, W12, 0x550C7DC3D5FFB4E2); |
69 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W12, W10, W05, W13, 0x72BE5D74F27B896F); |
70 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W13, W11, W06, W14, 0x80DEB1FE3B1696B1); |
71 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W14, W12, W07, W15, 0x9BDC06A725C71235); |
72 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W15, W13, W08, W00, 0xC19BF174CF692694); |
73 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W00, W14, W09, W01, 0xE49B69C19EF14AD2); |
74 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W01, W15, W10, W02, 0xEFBE4786384F25E3); |
75 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W02, W00, W11, W03, 0x0FC19DC68B8CD5B5); |
76 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W03, W01, W12, W04, 0x240CA1CC77AC9C65); |
77 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W04, W02, W13, W05, 0x2DE92C6F592B0275); |
78 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W05, W03, W14, W06, 0x4A7484AA6EA6E483); |
79 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W06, W04, W15, W07, 0x5CB0A9DCBD41FBD4); |
80 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W07, W05, W00, W08, 0x76F988DA831153B5); |
81 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W08, W06, W01, W09, 0x983E5152EE66DFAB); |
82 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W09, W07, W02, W10, 0xA831C66D2DB43210); |
83 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W10, W08, W03, W11, 0xB00327C898FB213F); |
84 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W11, W09, W04, W12, 0xBF597FC7BEEF0EE4); |
85 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W12, W10, W05, W13, 0xC6E00BF33DA88FC2); |
86 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W13, W11, W06, W14, 0xD5A79147930AA725); |
87 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W14, W12, W07, W15, 0x06CA6351E003826F); |
88 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W15, W13, W08, W00, 0x142929670A0E6E70); |
89 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W00, W14, W09, W01, 0x27B70A8546D22FFC); |
90 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W01, W15, W10, W02, 0x2E1B21385C26C926); |
91 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W02, W00, W11, W03, 0x4D2C6DFC5AC42AED); |
92 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W03, W01, W12, W04, 0x53380D139D95B3DF); |
93 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W04, W02, W13, W05, 0x650A73548BAF63DE); |
94 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W05, W03, W14, W06, 0x766A0ABB3C77B2A8); |
95 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W06, W04, W15, W07, 0x81C2C92E47EDAEE6); |
96 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W07, W05, W00, W08, 0x92722C851482353B); |
97 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W08, W06, W01, W09, 0xA2BFE8A14CF10364); |
98 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W09, W07, W02, W10, 0xA81A664BBC423001); |
99 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W10, W08, W03, W11, 0xC24B8B70D0F89791); |
100 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W11, W09, W04, W12, 0xC76C51A30654BE30); |
101 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W12, W10, W05, W13, 0xD192E819D6EF5218); |
102 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W13, W11, W06, W14, 0xD69906245565A910); |
103 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W14, W12, W07, W15, 0xF40E35855771202A); |
104 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W15, W13, W08, W00, 0x106AA07032BBD1B8); |
105 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W00, W14, W09, W01, 0x19A4C116B8D2D0C8); |
106 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W01, W15, W10, W02, 0x1E376C085141AB53); |
107 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W02, W00, W11, W03, 0x2748774CDF8EEB99); |
108 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W03, W01, W12, W04, 0x34B0BCB5E19B48A8); |
109 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W04, W02, W13, W05, 0x391C0CB3C5C95A63); |
110 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W05, W03, W14, W06, 0x4ED8AA4AE3418ACB); |
111 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W06, W04, W15, W07, 0x5B9CCA4F7763E373); |
112 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W07, W05, W00, W08, 0x682E6FF3D6B2B8A3); |
113 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W08, W06, W01, W09, 0x748F82EE5DEFB2FC); |
114 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W09, W07, W02, W10, 0x78A5636F43172F60); |
115 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W10, W08, W03, W11, 0x84C87814A1F0AB72); |
116 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W11, W09, W04, W12, 0x8CC702081A6439EC); |
117 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W12, W10, W05, W13, 0x90BEFFFA23631E28); |
118 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W13, W11, W06, W14, 0xA4506CEBDE82BDE9); |
119 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W14, W12, W07, W15, 0xBEF9A3F7B2C67915); |
120 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W15, W13, W08, W00, 0xC67178F2E372532B); |
121 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W00, W14, W09, W01, 0xCA273ECEEA26619C); |
122 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W01, W15, W10, W02, 0xD186B8C721C0C207); |
123 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W02, W00, W11, W03, 0xEADA7DD6CDE0EB1E); |
124 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W03, W01, W12, W04, 0xF57D4F7FEE6ED178); |
125 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W04, W02, W13, W05, 0x06F067AA72176FBA); |
126 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W05, W03, W14, W06, 0x0A637DC5A2C898A6); |
127 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W06, W04, W15, W07, 0x113F9804BEF90DAE); |
128 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W07, W05, W00, W08, 0x1B710B35131C471B); |
129 | 213k | SHA2_64_F(A, B, C, D, E, F, G, H, W08, W06, W01, W09, 0x28DB77F523047D84); |
130 | 213k | SHA2_64_F(H, A, B, C, D, E, F, G, W09, W07, W02, W10, 0x32CAAB7B40C72493); |
131 | 213k | SHA2_64_F(G, H, A, B, C, D, E, F, W10, W08, W03, W11, 0x3C9EBE0A15C9BEBC); |
132 | 213k | SHA2_64_F(F, G, H, A, B, C, D, E, W11, W09, W04, W12, 0x431D67C49C100D4C); |
133 | 213k | SHA2_64_F(E, F, G, H, A, B, C, D, W12, W10, W05, W13, 0x4CC5D4BECB3E42B6); |
134 | 213k | SHA2_64_F(D, E, F, G, H, A, B, C, W13, W11, W06, W14, 0x597F299CFC657E2A); |
135 | 213k | SHA2_64_F(C, D, E, F, G, H, A, B, W14, W12, W07, W15, 0x5FCB6FAB3AD6FAEC); |
136 | 213k | SHA2_64_F(B, C, D, E, F, G, H, A, W15, W13, W08, W00, 0x6C44198C4A475817); |
137 | 213k | |
138 | 213k | A = (digest[0] += A); |
139 | 213k | B = (digest[1] += B); |
140 | 213k | C = (digest[2] += C); |
141 | 213k | D = (digest[3] += D); |
142 | 213k | E = (digest[4] += E); |
143 | 213k | F = (digest[5] += F); |
144 | 213k | G = (digest[6] += G); |
145 | 213k | H = (digest[7] += H); |
146 | 213k | |
147 | 213k | input += 128; |
148 | 213k | } |
149 | 207k | } |
150 | | |
151 | | #undef SHA2_64_F |
152 | | |
153 | | } |