1
2#include <stdint.h>
3#include <string.h>
4
5#include "blake2.h"
6#include "private/common.h"
7
8CRYPTO_ALIGN(64)
9static const uint64_t blake2b_IV[8] = {
10    0x6a09e667f3bcc908ULL, 0xbb67ae8584caa73bULL, 0x3c6ef372fe94f82bULL,
11    0xa54ff53a5f1d36f1ULL, 0x510e527fade682d1ULL, 0x9b05688c2b3e6c1fULL,
12    0x1f83d9abfb41bd6bULL, 0x5be0cd19137e2179ULL
13};
14
/*
 * Message word schedule: one row per round, sixteen entries per row.
 *
 * In round r, the i-th mixing step (i = 0..7) of the compression function
 * reads message words blake2b_sigma[r][2 * i] and blake2b_sigma[r][2 * i + 1].
 * Rows 10 and 11 repeat rows 0 and 1.
 */
static const uint8_t blake2b_sigma[12][16] = {
    /* round  0 */ {  0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15 },
    /* round  1 */ { 14, 10,  4,  8,  9, 15, 13,  6,  1, 12,  0,  2, 11,  7,  5,  3 },
    /* round  2 */ { 11,  8, 12,  0,  5,  2, 15, 13, 10, 14,  3,  6,  7,  1,  9,  4 },
    /* round  3 */ {  7,  9,  3,  1, 13, 12, 11, 14,  2,  6,  5, 10,  4,  0, 15,  8 },
    /* round  4 */ {  9,  0,  5,  7,  2,  4, 10, 15, 14,  1, 11, 12,  6,  8,  3, 13 },
    /* round  5 */ {  2, 12,  6, 10,  0, 11,  8,  3,  4, 13,  7,  5, 15, 14,  1,  9 },
    /* round  6 */ { 12,  5,  1, 15, 14, 13,  4, 10,  0,  7,  6,  3,  9,  2,  8, 11 },
    /* round  7 */ { 13, 11,  7, 14, 12,  1,  3,  9,  5,  0, 15,  4,  8,  6,  2, 10 },
    /* round  8 */ {  6, 15, 14,  9, 11,  3,  0,  8, 12,  2, 13,  7,  1,  4, 10,  5 },
    /* round  9 */ { 10,  2,  8,  4,  7,  6,  1,  5, 15, 11,  9, 14,  3, 12, 13,  0 },
    /* round 10 */ {  0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15 },
    /* round 11 */ { 14, 10,  4,  8,  9, 15, 13,  6,  1, 12,  0,  2, 11,  7,  5,  3 }
};
29
30int
31blake2b_compress_ref(blake2b_state *S, const uint8_t block[BLAKE2B_BLOCKBYTES])
32{
33    uint64_t m[16];
34    uint64_t v[16];
35    int      i;
36
37    for (i = 0; i < 16; ++i) {
38        m[i] = LOAD64_LE(block + i * sizeof(m[i]));
39    }
40    for (i = 0; i < 8; ++i) {
41        v[i] = S->h[i];
42    }
43    v[8]  = blake2b_IV[0];
44    v[9]  = blake2b_IV[1];
45    v[10] = blake2b_IV[2];
46    v[11] = blake2b_IV[3];
47    v[12] = S->t[0] ^ blake2b_IV[4];
48    v[13] = S->t[1] ^ blake2b_IV[5];
49    v[14] = S->f[0] ^ blake2b_IV[6];
50    v[15] = S->f[1] ^ blake2b_IV[7];
51#define G(r, i, a, b, c, d)                         \
52    do {                                            \
53        a = a + b + m[blake2b_sigma[r][2 * i + 0]]; \
54        d = ROTR64(d ^ a, 32);                      \
55        c = c + d;                                  \
56        b = ROTR64(b ^ c, 24);                      \
57        a = a + b + m[blake2b_sigma[r][2 * i + 1]]; \
58        d = ROTR64(d ^ a, 16);                      \
59        c = c + d;                                  \
60        b = ROTR64(b ^ c, 63);                      \
61    } while (0)
62#define ROUND(r)                           \
63    do {                                   \
64        G(r, 0, v[0], v[4], v[8], v[12]);  \
65        G(r, 1, v[1], v[5], v[9], v[13]);  \
66        G(r, 2, v[2], v[6], v[10], v[14]); \
67        G(r, 3, v[3], v[7], v[11], v[15]); \
68        G(r, 4, v[0], v[5], v[10], v[15]); \
69        G(r, 5, v[1], v[6], v[11], v[12]); \
70        G(r, 6, v[2], v[7], v[8], v[13]);  \
71        G(r, 7, v[3], v[4], v[9], v[14]);  \
72    } while (0)
73    ROUND(0);
74    ROUND(1);
75    ROUND(2);
76    ROUND(3);
77    ROUND(4);
78    ROUND(5);
79    ROUND(6);
80    ROUND(7);
81    ROUND(8);
82    ROUND(9);
83    ROUND(10);
84    ROUND(11);
85
86    for (i = 0; i < 8; ++i) {
87        S->h[i] = S->h[i] ^ v[i] ^ v[i + 8];
88    }
89
90#undef G
91#undef ROUND
92    return 0;
93}
94