// SPDX-License-Identifier: GPL-2.0 OR MIT
/*
 * Copyright (C) 2015-2019 Jason A. Donenfeld <Jason@zx2c4.com>. All Rights Reserved.
 *
 * This is an implementation of the BLAKE2s hash and PRF functions.
 *
 * Information: https://blake2.net/
 */
9*8d3b6649SEric Biggers
10*8d3b6649SEric Biggers #include "blake2s.h"
11*8d3b6649SEric Biggers #include <linux/kernel.h>
12*8d3b6649SEric Biggers
/*
 * Rotate the 32-bit value v right by n bit positions.
 *
 * Both shift counts are reduced modulo 32 so that n == 0 (or any multiple
 * of 32) never produces a shift by the full width of the type, which would
 * be undefined behaviour.  For 0 < n < 32 the result is unchanged.
 */
static inline u32 ror32(u32 v, int n)
{
	const unsigned int shift = (unsigned int)n & 31;

	/* -shift is evaluated in unsigned arithmetic, so it wraps safely. */
	return (v >> shift) | (v << (-shift & 31));
}
17*8d3b6649SEric Biggers
/*
 * Convert the n words of a, in place, from little-endian to CPU byte order
 * by applying le32_to_cpu() to each element.
 */
static inline void le32_to_cpu_array(u32 a[], size_t n)
{
	size_t idx = 0;

	while (idx < n) {
		a[idx] = le32_to_cpu((__force __le32)a[idx]);
		idx++;
	}
}
23*8d3b6649SEric Biggers
/*
 * Convert the n words of a, in place, from CPU byte order to little-endian
 * by applying cpu_to_le32() to each element.
 */
static inline void cpu_to_le32_array(u32 a[], size_t n)
{
	size_t idx = 0;

	while (idx < n) {
		a[idx] = (__force u32)cpu_to_le32(a[idx]);
		idx++;
	}
}
29*8d3b6649SEric Biggers
30*8d3b6649SEric Biggers static const u8 blake2s_sigma[10][16] = {
31*8d3b6649SEric Biggers { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 },
32*8d3b6649SEric Biggers { 14, 10, 4, 8, 9, 15, 13, 6, 1, 12, 0, 2, 11, 7, 5, 3 },
33*8d3b6649SEric Biggers { 11, 8, 12, 0, 5, 2, 15, 13, 10, 14, 3, 6, 7, 1, 9, 4 },
34*8d3b6649SEric Biggers { 7, 9, 3, 1, 13, 12, 11, 14, 2, 6, 5, 10, 4, 0, 15, 8 },
35*8d3b6649SEric Biggers { 9, 0, 5, 7, 2, 4, 10, 15, 14, 1, 11, 12, 6, 8, 3, 13 },
36*8d3b6649SEric Biggers { 2, 12, 6, 10, 0, 11, 8, 3, 4, 13, 7, 5, 15, 14, 1, 9 },
37*8d3b6649SEric Biggers { 12, 5, 1, 15, 14, 13, 4, 10, 0, 7, 6, 3, 9, 2, 8, 11 },
38*8d3b6649SEric Biggers { 13, 11, 7, 14, 12, 1, 3, 9, 5, 0, 15, 4, 8, 6, 2, 10 },
39*8d3b6649SEric Biggers { 6, 15, 14, 9, 11, 3, 0, 8, 12, 2, 13, 7, 1, 4, 10, 5 },
40*8d3b6649SEric Biggers { 10, 2, 8, 4, 7, 6, 1, 5, 15, 11, 9, 14, 3, 12, 13, 0 },
41*8d3b6649SEric Biggers };
42*8d3b6649SEric Biggers
/*
 * Add inc to the two-word counter ctx->t.  t[0] is the low word; when the
 * addition wraps it, the carry is propagated into t[1].
 */
static inline void blake2s_increment_counter(struct blake2s_ctx *ctx, u32 inc)
{
	ctx->t[0] += inc;

	/* After a wrapping add the sum is smaller than the addend. */
	if (ctx->t[0] < inc)
		ctx->t[1] += 1;
}
48*8d3b6649SEric Biggers
/*
 * Mix nblocks consecutive blocks of BLAKE2S_BLOCK_SIZE bytes, starting at
 * data, into the chaining value ctx->h.  Before each block is processed the
 * counter ctx->t is advanced by inc.
 */
static void blake2s_compress(struct blake2s_ctx *ctx,
			     const u8 *data, size_t nblocks, u32 inc)
{
	u32 m[16];	/* message words of the current block, CPU byte order */
	u32 v[16];	/* working state for the current block */
	int w;

/*
 * Mixing step k of round r on the four state words a, b, c, d.  The two
 * message words consumed are chosen through blake2s_sigma[r].
 */
#define G(r, k, a, b, c, d) do {			\
	a += b + m[blake2s_sigma[r][2 * k + 0]];	\
	d = ror32(d ^ a, 16);				\
	c += d;						\
	b = ror32(b ^ c, 12);				\
	a += b + m[blake2s_sigma[r][2 * k + 1]];	\
	d = ror32(d ^ a, 8);				\
	c += d;						\
	b = ror32(b ^ c, 7);				\
} while (0)

/* One full round: eight mixing steps over the working state v. */
#define ROUND(r) do {				\
	G(r, 0, v[0], v[4], v[8], v[12]);	\
	G(r, 1, v[1], v[5], v[9], v[13]);	\
	G(r, 2, v[2], v[6], v[10], v[14]);	\
	G(r, 3, v[3], v[7], v[11], v[15]);	\
	G(r, 4, v[0], v[5], v[10], v[15]);	\
	G(r, 5, v[1], v[6], v[11], v[12]);	\
	G(r, 6, v[2], v[7], v[8], v[13]);	\
	G(r, 7, v[3], v[4], v[9], v[14]);	\
} while (0)

	for (; nblocks > 0; --nblocks, data += BLAKE2S_BLOCK_SIZE) {
		blake2s_increment_counter(ctx, inc);

		/* Load the block and convert its words to CPU byte order. */
		memcpy(m, data, BLAKE2S_BLOCK_SIZE);
		le32_to_cpu_array(m, ARRAY_SIZE(m));

		/*
		 * Lower half of the working state is the chaining value;
		 * upper half is the IV, with the counter and the flag words
		 * XORed into the last four entries.
		 */
		memcpy(v, ctx->h, 8 * sizeof(v[0]));
		v[8] = BLAKE2S_IV0;
		v[9] = BLAKE2S_IV1;
		v[10] = BLAKE2S_IV2;
		v[11] = BLAKE2S_IV3;
		v[12] = BLAKE2S_IV4 ^ ctx->t[0];
		v[13] = BLAKE2S_IV5 ^ ctx->t[1];
		v[14] = BLAKE2S_IV6 ^ ctx->f[0];
		v[15] = BLAKE2S_IV7 ^ ctx->f[1];

		ROUND(0);
		ROUND(1);
		ROUND(2);
		ROUND(3);
		ROUND(4);
		ROUND(5);
		ROUND(6);
		ROUND(7);
		ROUND(8);
		ROUND(9);

		/* Fold both halves of the working state back into h. */
		for (w = 0; w < 8; ++w)
			ctx->h[w] ^= v[w] ^ v[w + 8];
	}

#undef G
#undef ROUND
}
112*8d3b6649SEric Biggers
blake2s_set_lastblock(struct blake2s_ctx * ctx)113*8d3b6649SEric Biggers static inline void blake2s_set_lastblock(struct blake2s_ctx *ctx)
114*8d3b6649SEric Biggers {
115*8d3b6649SEric Biggers ctx->f[0] = -1;
116*8d3b6649SEric Biggers }
117*8d3b6649SEric Biggers
blake2s_update(struct blake2s_ctx * ctx,const u8 * in,size_t inlen)118*8d3b6649SEric Biggers void blake2s_update(struct blake2s_ctx *ctx, const u8 *in, size_t inlen)
119*8d3b6649SEric Biggers {
120*8d3b6649SEric Biggers const size_t fill = BLAKE2S_BLOCK_SIZE - ctx->buflen;
121*8d3b6649SEric Biggers
122*8d3b6649SEric Biggers if (unlikely(!inlen))
123*8d3b6649SEric Biggers return;
124*8d3b6649SEric Biggers if (inlen > fill) {
125*8d3b6649SEric Biggers memcpy(ctx->buf + ctx->buflen, in, fill);
126*8d3b6649SEric Biggers blake2s_compress(ctx, ctx->buf, 1, BLAKE2S_BLOCK_SIZE);
127*8d3b6649SEric Biggers ctx->buflen = 0;
128*8d3b6649SEric Biggers in += fill;
129*8d3b6649SEric Biggers inlen -= fill;
130*8d3b6649SEric Biggers }
131*8d3b6649SEric Biggers if (inlen > BLAKE2S_BLOCK_SIZE) {
132*8d3b6649SEric Biggers const size_t nblocks = DIV_ROUND_UP(inlen, BLAKE2S_BLOCK_SIZE);
133*8d3b6649SEric Biggers
134*8d3b6649SEric Biggers blake2s_compress(ctx, in, nblocks - 1, BLAKE2S_BLOCK_SIZE);
135*8d3b6649SEric Biggers in += BLAKE2S_BLOCK_SIZE * (nblocks - 1);
136*8d3b6649SEric Biggers inlen -= BLAKE2S_BLOCK_SIZE * (nblocks - 1);
137*8d3b6649SEric Biggers }
138*8d3b6649SEric Biggers memcpy(ctx->buf + ctx->buflen, in, inlen);
139*8d3b6649SEric Biggers ctx->buflen += inlen;
140*8d3b6649SEric Biggers }
141*8d3b6649SEric Biggers
/*
 * Finish the hash: zero-pad and compress the buffered tail as the last
 * block, write ctx->outlen bytes of the little-endian digest to out, and
 * clear the whole context.
 */
void blake2s_final(struct blake2s_ctx *ctx, u8 *out)
{
	/* Zero-fill the unused tail of the staging buffer. */
	memset(&ctx->buf[ctx->buflen], 0, BLAKE2S_BLOCK_SIZE - ctx->buflen);

	/* The counter advances only by the bytes actually buffered. */
	blake2s_set_lastblock(ctx);
	blake2s_compress(ctx, ctx->buf, 1, ctx->buflen);

	/* Serialise the chaining value in place, then copy the digest out. */
	cpu_to_le32_array(ctx->h, ARRAY_SIZE(ctx->h));
	memcpy(out, ctx->h, ctx->outlen);

	/*
	 * NOTE(review): a plain memset() is not guaranteed to survive
	 * optimisation; confirm this is acceptable if ctx can hold key
	 * material.
	 */
	memset(ctx, 0, sizeof(*ctx));
}
152