|
31 | 31 |
|
32 | 32 | typedef __m128i xmmi;
|
33 | 33 |
|
34 |
| -static const alignas(16) uint32_t poly1305_x64_sse2_message_mask[4] = { |
| 34 | +alignas(16) static const uint32_t poly1305_x64_sse2_message_mask[4] = { |
35 | 35 | (1 << 26) - 1, 0, (1 << 26) - 1, 0};
|
36 |
| -static const alignas(16) uint32_t poly1305_x64_sse2_5[4] = {5, 0, 5, 0}; |
37 |
| -static const alignas(16) uint32_t poly1305_x64_sse2_1shl128[4] = { |
38 |
| - (1 << 24), 0, (1 << 24), 0}; |
| 36 | +alignas(16) static const uint32_t poly1305_x64_sse2_5[4] = {5, 0, 5, 0}; |
| 37 | +alignas(16) static const uint32_t poly1305_x64_sse2_1shl128[4] = {(1 << 24), 0, |
| 38 | + (1 << 24), 0}; |
39 | 39 |
|
40 | 40 | static inline uint128_t add128(uint128_t a, uint128_t b) { return a + b; }
|
41 | 41 |
|
@@ -136,7 +136,8 @@ void CRYPTO_poly1305_init(poly1305_state *state, const uint8_t key[32]) {
|
136 | 136 |
|
137 | 137 | static void poly1305_first_block(poly1305_state_internal *st,
|
138 | 138 | const uint8_t *m) {
|
139 |
| - const xmmi MMASK = _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask); |
| 139 | + const xmmi MMASK = |
| 140 | + _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask); |
140 | 141 | const xmmi FIVE = _mm_load_si128((const xmmi *)poly1305_x64_sse2_5);
|
141 | 142 | const xmmi HIBIT = _mm_load_si128((const xmmi *)poly1305_x64_sse2_1shl128);
|
142 | 143 | xmmi T5, T6;
|
@@ -181,7 +182,7 @@ static void poly1305_first_block(poly1305_state_internal *st,
|
181 | 182 | r20 = r20 & 0xfffffffffff;
|
182 | 183 | r21 += c;
|
183 | 184 |
|
184 |
| - p->R20.v = _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)(r20)&0x3ffffff), |
| 185 | + p->R20.v = _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)(r20) & 0x3ffffff), |
185 | 186 | _MM_SHUFFLE(1, 0, 1, 0));
|
186 | 187 | p->R21.v = _mm_shuffle_epi32(
|
187 | 188 | _mm_cvtsi32_si128((uint32_t)((r20 >> 26) | (r21 << 18)) & 0x3ffffff),
|
@@ -229,7 +230,8 @@ static void poly1305_first_block(poly1305_state_internal *st,
|
229 | 230 |
|
230 | 231 | static void poly1305_blocks(poly1305_state_internal *st, const uint8_t *m,
|
231 | 232 | size_t bytes) {
|
232 |
| - const xmmi MMASK = _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask); |
| 233 | + const xmmi MMASK = |
| 234 | + _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask); |
233 | 235 | const xmmi FIVE = _mm_load_si128((const xmmi *)poly1305_x64_sse2_5);
|
234 | 236 | const xmmi HIBIT = _mm_load_si128((const xmmi *)poly1305_x64_sse2_1shl128);
|
235 | 237 |
|
@@ -419,7 +421,8 @@ static void poly1305_blocks(poly1305_state_internal *st, const uint8_t *m,
|
419 | 421 |
|
420 | 422 | static size_t poly1305_combine(poly1305_state_internal *st, const uint8_t *m,
|
421 | 423 | size_t bytes) {
|
422 |
| - const xmmi MMASK = _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask); |
| 424 | + const xmmi MMASK = |
| 425 | + _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask); |
423 | 426 | const xmmi HIBIT = _mm_load_si128((const xmmi *)poly1305_x64_sse2_1shl128);
|
424 | 427 | const xmmi FIVE = _mm_load_si128((const xmmi *)poly1305_x64_sse2_5);
|
425 | 428 |
|
@@ -547,7 +550,7 @@ static size_t poly1305_combine(poly1305_state_internal *st, const uint8_t *m,
|
547 | 550 | r1 = ((uint64_t)p->R21.d[3] << 32) | (uint64_t)p->R21.d[1];
|
548 | 551 | r2 = ((uint64_t)p->R22.d[3] << 32) | (uint64_t)p->R22.d[1];
|
549 | 552 |
|
550 |
| - p->R20.d[2] = (uint32_t)(r0)&0x3ffffff; |
| 553 | + p->R20.d[2] = (uint32_t)(r0) & 0x3ffffff; |
551 | 554 | p->R21.d[2] = (uint32_t)((r0 >> 26) | (r1 << 18)) & 0x3ffffff;
|
552 | 555 | p->R22.d[2] = (uint32_t)((r1 >> 8)) & 0x3ffffff;
|
553 | 556 | p->R23.d[2] = (uint32_t)((r1 >> 34) | (r2 << 10)) & 0x3ffffff;
|
@@ -838,7 +841,7 @@ void CRYPTO_poly1305_finish(poly1305_state *state, uint8_t mac[16]) {
|
838 | 841 | c = (h1 >> 44);
|
839 | 842 | h1 &= 0xfffffffffff;
|
840 | 843 | t1 = (t1 >> 24);
|
841 |
| - h2 += (t1)+c; |
| 844 | + h2 += (t1) + c; |
842 | 845 |
|
843 | 846 | CRYPTO_store_u64_le(mac + 0, ((h0) | (h1 << 44)));
|
844 | 847 | CRYPTO_store_u64_le(mac + 8, ((h1 >> 20) | (h2 << 24)));
|
|
0 commit comments