1 
2 #include <stdint.h>
3 #include <string.h>
4 
5 #include "blake2.h"
6 #include "private/common.h"
7 
/*
 * Eight 64-bit initialization constants for BLAKE2b.
 *
 * blake2b_compress_ref() copies words 0..3 unchanged into the upper half of
 * its working vector and XORs words 4..7 with the S->t[] and S->f[] state
 * words before doing the same. The table is declared with CRYPTO_ALIGN(64).
 */
CRYPTO_ALIGN(64)
static const uint64_t blake2b_IV[8] = {
    0x6a09e667f3bcc908ULL, 0xbb67ae8584caa73bULL, 0x3c6ef372fe94f82bULL,
    0xa54ff53a5f1d36f1ULL, 0x510e527fade682d1ULL, 0x9b05688c2b3e6c1fULL,
    0x1f83d9abfb41bd6bULL, 0x5be0cd19137e2179ULL
};
14 
/*
 * Message word schedule: one row per round, sixteen indices per row.
 *
 * In round r, the i-th mixing step (i = 0..7) of blake2b_compress_ref()
 * reads message words m[blake2b_sigma[r][2 * i]] and
 * m[blake2b_sigma[r][2 * i + 1]]. Every row is a permutation of 0..15.
 * Rows 10 and 11 are identical to rows 0 and 1.
 */
static const uint8_t blake2b_sigma[12][16] = {
    { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 },
    { 14, 10, 4, 8, 9, 15, 13, 6, 1, 12, 0, 2, 11, 7, 5, 3 },
    { 11, 8, 12, 0, 5, 2, 15, 13, 10, 14, 3, 6, 7, 1, 9, 4 },
    { 7, 9, 3, 1, 13, 12, 11, 14, 2, 6, 5, 10, 4, 0, 15, 8 },
    { 9, 0, 5, 7, 2, 4, 10, 15, 14, 1, 11, 12, 6, 8, 3, 13 },
    { 2, 12, 6, 10, 0, 11, 8, 3, 4, 13, 7, 5, 15, 14, 1, 9 },
    { 12, 5, 1, 15, 14, 13, 4, 10, 0, 7, 6, 3, 9, 2, 8, 11 },
    { 13, 11, 7, 14, 12, 1, 3, 9, 5, 0, 15, 4, 8, 6, 2, 10 },
    { 6, 15, 14, 9, 11, 3, 0, 8, 12, 2, 13, 7, 1, 4, 10, 5 },
    { 10, 2, 8, 4, 7, 6, 1, 5, 15, 11, 9, 14, 3, 12, 13, 0 },
    { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 }, /* same as row 0 */
    { 14, 10, 4, 8, 9, 15, 13, 6, 1, 12, 0, 2, 11, 7, 5, 3 }  /* same as row 1 */
};
29 
30 int
blake2b_compress_ref(blake2b_state * S,const uint8_t block[BLAKE2B_BLOCKBYTES])31 blake2b_compress_ref(blake2b_state *S, const uint8_t block[BLAKE2B_BLOCKBYTES])
32 {
33     uint64_t m[16];
34     uint64_t v[16];
35     int      i;
36 
37     for (i = 0; i < 16; ++i) {
38         m[i] = LOAD64_LE(block + i * sizeof(m[i]));
39     }
40     for (i = 0; i < 8; ++i) {
41         v[i] = S->h[i];
42     }
43     v[8]  = blake2b_IV[0];
44     v[9]  = blake2b_IV[1];
45     v[10] = blake2b_IV[2];
46     v[11] = blake2b_IV[3];
47     v[12] = S->t[0] ^ blake2b_IV[4];
48     v[13] = S->t[1] ^ blake2b_IV[5];
49     v[14] = S->f[0] ^ blake2b_IV[6];
50     v[15] = S->f[1] ^ blake2b_IV[7];
51 #define G(r, i, a, b, c, d)                         \
52     do {                                            \
53         a = a + b + m[blake2b_sigma[r][2 * i + 0]]; \
54         d = ROTR64(d ^ a, 32);                      \
55         c = c + d;                                  \
56         b = ROTR64(b ^ c, 24);                      \
57         a = a + b + m[blake2b_sigma[r][2 * i + 1]]; \
58         d = ROTR64(d ^ a, 16);                      \
59         c = c + d;                                  \
60         b = ROTR64(b ^ c, 63);                      \
61     } while (0)
62 #define ROUND(r)                           \
63     do {                                   \
64         G(r, 0, v[0], v[4], v[8], v[12]);  \
65         G(r, 1, v[1], v[5], v[9], v[13]);  \
66         G(r, 2, v[2], v[6], v[10], v[14]); \
67         G(r, 3, v[3], v[7], v[11], v[15]); \
68         G(r, 4, v[0], v[5], v[10], v[15]); \
69         G(r, 5, v[1], v[6], v[11], v[12]); \
70         G(r, 6, v[2], v[7], v[8], v[13]);  \
71         G(r, 7, v[3], v[4], v[9], v[14]);  \
72     } while (0)
73     ROUND(0);
74     ROUND(1);
75     ROUND(2);
76     ROUND(3);
77     ROUND(4);
78     ROUND(5);
79     ROUND(6);
80     ROUND(7);
81     ROUND(8);
82     ROUND(9);
83     ROUND(10);
84     ROUND(11);
85 
86     for (i = 0; i < 8; ++i) {
87         S->h[i] = S->h[i] ^ v[i] ^ v[i + 8];
88     }
89 
90 #undef G
91 #undef ROUND
92     return 0;
93 }
94