/* SPDX-License-Identifier: MIT
 *
 * Copyright (C) 2015-2021 Jason A. Donenfeld <Jason@zx2c4.com>. All Rights Reserved.
 * Copyright (c) 2022 The FreeBSD Foundation
 */
6744bfb21SJohn Baldwin
7744bfb21SJohn Baldwin #include <sys/types.h>
8744bfb21SJohn Baldwin #include <sys/systm.h>
9744bfb21SJohn Baldwin #include <sys/endian.h>
10744bfb21SJohn Baldwin #include <sys/mbuf.h>
11744bfb21SJohn Baldwin #include <opencrypto/cryptodev.h>
12744bfb21SJohn Baldwin
13744bfb21SJohn Baldwin #include "crypto.h"
14744bfb21SJohn Baldwin
15744bfb21SJohn Baldwin static crypto_session_t chacha20_poly1305_sid;
16744bfb21SJohn Baldwin
17*854d0662SJohn Baldwin #ifdef COMPAT_NEED_BLAKE2S
/*
 * Small compatibility macros used by the BLAKE2s code below.  The first two
 * are only defined when nothing else has provided them already.
 */
#ifndef ARRAY_SIZE
#define ARRAY_SIZE(x)		(sizeof(x) / sizeof((x)[0]))	/* element count of an array */
#endif
#ifndef DIV_ROUND_UP
#define DIV_ROUND_UP(n, d)	(((n) + (d) - 1) / (d))		/* integer division, rounded up */
#endif

/* Linux-style endian helper names mapped onto the <sys/endian.h> ones. */
#define le32_to_cpup(a)		le32toh(*(a))
#define cpu_to_le32(a)		htole32(a)
/*
 * Convert 'words' 32-bit values in 'buf' from host byte order to
 * little-endian, in place.
 */
static inline void cpu_to_le32_array(uint32_t *buf, unsigned int words)
{
	unsigned int idx;

	for (idx = 0; idx < words; idx++)
		buf[idx] = cpu_to_le32(buf[idx]);
}
/*
 * Convert 'words' 32-bit values in 'buf' from little-endian to host byte
 * order, in place.
 */
static inline void le32_to_cpu_array(uint32_t *buf, unsigned int words)
{
	unsigned int idx;

	for (idx = 0; idx < words; idx++)
		buf[idx] = le32_to_cpup(&buf[idx]);
}
/*
 * Rotate 'word' right by 'shift' bits.  Only the low five bits of 'shift'
 * are used, and both shift amounts are masked to 0..31 so a rotation by 0
 * (or any multiple of 32) never shifts by the full width of the type.
 */
static inline uint32_t ror32(uint32_t word, unsigned int shift)
{
	const unsigned int right = shift & 31;
	const unsigned int left = (32 - right) & 31;

	return (word >> right) | (word << left);
}
46744bfb21SJohn Baldwin
/*
 * Initial chaining words for BLAKE2s.  blake2s_init_param() seeds h[] from
 * these, and blake2s_compress() loads them into the upper half of its
 * working vector for every block.
 */
static const uint32_t blake2s_iv[8] = {
	0x6A09E667UL,
	0xBB67AE85UL,
	0x3C6EF372UL,
	0xA54FF53AUL,
	0x510E527FUL,
	0x9B05688CUL,
	0x1F83D9ABUL,
	0x5BE0CD19UL
};
51744bfb21SJohn Baldwin
/*
 * Message-word schedule: row r lists, in order, the indices into the
 * 16-word message block that round r of blake2s_compress() feeds to its
 * eight G steps (two words per step).
 */
static const uint8_t blake2s_sigma[10][16] = {
	{  0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15 },
	{ 14, 10,  4,  8,  9, 15, 13,  6,  1, 12,  0,  2, 11,  7,  5,  3 },
	{ 11,  8, 12,  0,  5,  2, 15, 13, 10, 14,  3,  6,  7,  1,  9,  4 },
	{  7,  9,  3,  1, 13, 12, 11, 14,  2,  6,  5, 10,  4,  0, 15,  8 },
	{  9,  0,  5,  7,  2,  4, 10, 15, 14,  1, 11, 12,  6,  8,  3, 13 },
	{  2, 12,  6, 10,  0, 11,  8,  3,  4, 13,  7,  5, 15, 14,  1,  9 },
	{ 12,  5,  1, 15, 14, 13,  4, 10,  0,  7,  6,  3,  9,  2,  8, 11 },
	{ 13, 11,  7, 14, 12,  1,  3,  9,  5,  0, 15,  4,  8,  6,  2, 10 },
	{  6, 15, 14,  9, 11,  3,  0,  8, 12,  2, 13,  7,  1,  4, 10,  5 },
	{ 10,  2,  8,  4,  7,  6,  1,  5, 15, 11,  9, 14,  3, 12, 13,  0 },
};
64744bfb21SJohn Baldwin
blake2s_set_lastblock(struct blake2s_state * state)65744bfb21SJohn Baldwin static inline void blake2s_set_lastblock(struct blake2s_state *state)
66744bfb21SJohn Baldwin {
67744bfb21SJohn Baldwin state->f[0] = -1;
68744bfb21SJohn Baldwin }
69744bfb21SJohn Baldwin
blake2s_increment_counter(struct blake2s_state * state,const uint32_t inc)70744bfb21SJohn Baldwin static inline void blake2s_increment_counter(struct blake2s_state *state,
71744bfb21SJohn Baldwin const uint32_t inc)
72744bfb21SJohn Baldwin {
73744bfb21SJohn Baldwin state->t[0] += inc;
74744bfb21SJohn Baldwin state->t[1] += (state->t[0] < inc);
75744bfb21SJohn Baldwin }
76744bfb21SJohn Baldwin
blake2s_init_param(struct blake2s_state * state,const uint32_t param)77744bfb21SJohn Baldwin static inline void blake2s_init_param(struct blake2s_state *state,
78744bfb21SJohn Baldwin const uint32_t param)
79744bfb21SJohn Baldwin {
80744bfb21SJohn Baldwin int i;
81744bfb21SJohn Baldwin
82744bfb21SJohn Baldwin memset(state, 0, sizeof(*state));
83744bfb21SJohn Baldwin for (i = 0; i < 8; ++i)
84744bfb21SJohn Baldwin state->h[i] = blake2s_iv[i];
85744bfb21SJohn Baldwin state->h[0] ^= param;
86744bfb21SJohn Baldwin }
87744bfb21SJohn Baldwin
blake2s_init(struct blake2s_state * state,const size_t outlen)88744bfb21SJohn Baldwin void blake2s_init(struct blake2s_state *state, const size_t outlen)
89744bfb21SJohn Baldwin {
90744bfb21SJohn Baldwin blake2s_init_param(state, 0x01010000 | outlen);
91744bfb21SJohn Baldwin state->outlen = outlen;
92744bfb21SJohn Baldwin }
93744bfb21SJohn Baldwin
blake2s_init_key(struct blake2s_state * state,const size_t outlen,const uint8_t * key,const size_t keylen)94744bfb21SJohn Baldwin void blake2s_init_key(struct blake2s_state *state, const size_t outlen,
95744bfb21SJohn Baldwin const uint8_t *key, const size_t keylen)
96744bfb21SJohn Baldwin {
97744bfb21SJohn Baldwin uint8_t block[BLAKE2S_BLOCK_SIZE] = { 0 };
98744bfb21SJohn Baldwin
99744bfb21SJohn Baldwin blake2s_init_param(state, 0x01010000 | keylen << 8 | outlen);
100744bfb21SJohn Baldwin state->outlen = outlen;
101744bfb21SJohn Baldwin memcpy(block, key, keylen);
102744bfb21SJohn Baldwin blake2s_update(state, block, BLAKE2S_BLOCK_SIZE);
103744bfb21SJohn Baldwin explicit_bzero(block, BLAKE2S_BLOCK_SIZE);
104744bfb21SJohn Baldwin }
105744bfb21SJohn Baldwin
blake2s_compress(struct blake2s_state * state,const uint8_t * block,size_t nblocks,const uint32_t inc)106744bfb21SJohn Baldwin static inline void blake2s_compress(struct blake2s_state *state,
107744bfb21SJohn Baldwin const uint8_t *block, size_t nblocks,
108744bfb21SJohn Baldwin const uint32_t inc)
109744bfb21SJohn Baldwin {
110744bfb21SJohn Baldwin uint32_t m[16];
111744bfb21SJohn Baldwin uint32_t v[16];
112744bfb21SJohn Baldwin int i;
113744bfb21SJohn Baldwin
114744bfb21SJohn Baldwin while (nblocks > 0) {
115744bfb21SJohn Baldwin blake2s_increment_counter(state, inc);
116744bfb21SJohn Baldwin memcpy(m, block, BLAKE2S_BLOCK_SIZE);
117744bfb21SJohn Baldwin le32_to_cpu_array(m, ARRAY_SIZE(m));
118744bfb21SJohn Baldwin memcpy(v, state->h, 32);
119744bfb21SJohn Baldwin v[ 8] = blake2s_iv[0];
120744bfb21SJohn Baldwin v[ 9] = blake2s_iv[1];
121744bfb21SJohn Baldwin v[10] = blake2s_iv[2];
122744bfb21SJohn Baldwin v[11] = blake2s_iv[3];
123744bfb21SJohn Baldwin v[12] = blake2s_iv[4] ^ state->t[0];
124744bfb21SJohn Baldwin v[13] = blake2s_iv[5] ^ state->t[1];
125744bfb21SJohn Baldwin v[14] = blake2s_iv[6] ^ state->f[0];
126744bfb21SJohn Baldwin v[15] = blake2s_iv[7] ^ state->f[1];
127744bfb21SJohn Baldwin
128744bfb21SJohn Baldwin #define G(r, i, a, b, c, d) do { \
129744bfb21SJohn Baldwin a += b + m[blake2s_sigma[r][2 * i + 0]]; \
130744bfb21SJohn Baldwin d = ror32(d ^ a, 16); \
131744bfb21SJohn Baldwin c += d; \
132744bfb21SJohn Baldwin b = ror32(b ^ c, 12); \
133744bfb21SJohn Baldwin a += b + m[blake2s_sigma[r][2 * i + 1]]; \
134744bfb21SJohn Baldwin d = ror32(d ^ a, 8); \
135744bfb21SJohn Baldwin c += d; \
136744bfb21SJohn Baldwin b = ror32(b ^ c, 7); \
137744bfb21SJohn Baldwin } while (0)
138744bfb21SJohn Baldwin
139744bfb21SJohn Baldwin #define ROUND(r) do { \
140744bfb21SJohn Baldwin G(r, 0, v[0], v[ 4], v[ 8], v[12]); \
141744bfb21SJohn Baldwin G(r, 1, v[1], v[ 5], v[ 9], v[13]); \
142744bfb21SJohn Baldwin G(r, 2, v[2], v[ 6], v[10], v[14]); \
143744bfb21SJohn Baldwin G(r, 3, v[3], v[ 7], v[11], v[15]); \
144744bfb21SJohn Baldwin G(r, 4, v[0], v[ 5], v[10], v[15]); \
145744bfb21SJohn Baldwin G(r, 5, v[1], v[ 6], v[11], v[12]); \
146744bfb21SJohn Baldwin G(r, 6, v[2], v[ 7], v[ 8], v[13]); \
147744bfb21SJohn Baldwin G(r, 7, v[3], v[ 4], v[ 9], v[14]); \
148744bfb21SJohn Baldwin } while (0)
149744bfb21SJohn Baldwin ROUND(0);
150744bfb21SJohn Baldwin ROUND(1);
151744bfb21SJohn Baldwin ROUND(2);
152744bfb21SJohn Baldwin ROUND(3);
153744bfb21SJohn Baldwin ROUND(4);
154744bfb21SJohn Baldwin ROUND(5);
155744bfb21SJohn Baldwin ROUND(6);
156744bfb21SJohn Baldwin ROUND(7);
157744bfb21SJohn Baldwin ROUND(8);
158744bfb21SJohn Baldwin ROUND(9);
159744bfb21SJohn Baldwin
160744bfb21SJohn Baldwin #undef G
161744bfb21SJohn Baldwin #undef ROUND
162744bfb21SJohn Baldwin
163744bfb21SJohn Baldwin for (i = 0; i < 8; ++i)
164744bfb21SJohn Baldwin state->h[i] ^= v[i] ^ v[i + 8];
165744bfb21SJohn Baldwin
166744bfb21SJohn Baldwin block += BLAKE2S_BLOCK_SIZE;
167744bfb21SJohn Baldwin --nblocks;
168744bfb21SJohn Baldwin }
169744bfb21SJohn Baldwin }
170744bfb21SJohn Baldwin
blake2s_update(struct blake2s_state * state,const uint8_t * in,size_t inlen)171744bfb21SJohn Baldwin void blake2s_update(struct blake2s_state *state, const uint8_t *in, size_t inlen)
172744bfb21SJohn Baldwin {
173744bfb21SJohn Baldwin const size_t fill = BLAKE2S_BLOCK_SIZE - state->buflen;
174744bfb21SJohn Baldwin
175744bfb21SJohn Baldwin if (!inlen)
176744bfb21SJohn Baldwin return;
177744bfb21SJohn Baldwin if (inlen > fill) {
178744bfb21SJohn Baldwin memcpy(state->buf + state->buflen, in, fill);
179744bfb21SJohn Baldwin blake2s_compress(state, state->buf, 1, BLAKE2S_BLOCK_SIZE);
180744bfb21SJohn Baldwin state->buflen = 0;
181744bfb21SJohn Baldwin in += fill;
182744bfb21SJohn Baldwin inlen -= fill;
183744bfb21SJohn Baldwin }
184744bfb21SJohn Baldwin if (inlen > BLAKE2S_BLOCK_SIZE) {
185744bfb21SJohn Baldwin const size_t nblocks = DIV_ROUND_UP(inlen, BLAKE2S_BLOCK_SIZE);
186744bfb21SJohn Baldwin /* Hash one less (full) block than strictly possible */
187744bfb21SJohn Baldwin blake2s_compress(state, in, nblocks - 1, BLAKE2S_BLOCK_SIZE);
188744bfb21SJohn Baldwin in += BLAKE2S_BLOCK_SIZE * (nblocks - 1);
189744bfb21SJohn Baldwin inlen -= BLAKE2S_BLOCK_SIZE * (nblocks - 1);
190744bfb21SJohn Baldwin }
191744bfb21SJohn Baldwin memcpy(state->buf + state->buflen, in, inlen);
192744bfb21SJohn Baldwin state->buflen += inlen;
193744bfb21SJohn Baldwin }
194744bfb21SJohn Baldwin
blake2s_final(struct blake2s_state * state,uint8_t * out)195744bfb21SJohn Baldwin void blake2s_final(struct blake2s_state *state, uint8_t *out)
196744bfb21SJohn Baldwin {
197744bfb21SJohn Baldwin blake2s_set_lastblock(state);
198744bfb21SJohn Baldwin memset(state->buf + state->buflen, 0,
199744bfb21SJohn Baldwin BLAKE2S_BLOCK_SIZE - state->buflen); /* Padding */
200744bfb21SJohn Baldwin blake2s_compress(state, state->buf, 1, state->buflen);
201744bfb21SJohn Baldwin cpu_to_le32_array(state->h, ARRAY_SIZE(state->h));
202744bfb21SJohn Baldwin memcpy(out, state->h, state->outlen);
203744bfb21SJohn Baldwin explicit_bzero(state, sizeof(*state));
204744bfb21SJohn Baldwin }
205744bfb21SJohn Baldwin #endif
206744bfb21SJohn Baldwin
/*
 * Completion callback installed on every request built in this file.  It
 * does no work of its own and always returns 0.
 */
static int
crypto_callback(struct cryptop *crp)
{
	(void)crp;

	return (0);
}
212744bfb21SJohn Baldwin
213*854d0662SJohn Baldwin int
chacha20poly1305_encrypt_mbuf(struct mbuf * m,const uint64_t nonce,const uint8_t key[CHACHA20POLY1305_KEY_SIZE])214*854d0662SJohn Baldwin chacha20poly1305_encrypt_mbuf(struct mbuf *m, const uint64_t nonce,
215*854d0662SJohn Baldwin const uint8_t key[CHACHA20POLY1305_KEY_SIZE])
216744bfb21SJohn Baldwin {
217*854d0662SJohn Baldwin static const char blank_tag[POLY1305_HASH_LEN];
218*854d0662SJohn Baldwin struct cryptop crp;
219*854d0662SJohn Baldwin int ret;
220*854d0662SJohn Baldwin
221*854d0662SJohn Baldwin if (!m_append(m, POLY1305_HASH_LEN, blank_tag))
222*854d0662SJohn Baldwin return (ENOMEM);
223*854d0662SJohn Baldwin crypto_initreq(&crp, chacha20_poly1305_sid);
224*854d0662SJohn Baldwin crp.crp_op = CRYPTO_OP_ENCRYPT | CRYPTO_OP_COMPUTE_DIGEST;
225*854d0662SJohn Baldwin crp.crp_flags = CRYPTO_F_IV_SEPARATE | CRYPTO_F_CBIMM;
226*854d0662SJohn Baldwin crypto_use_mbuf(&crp, m);
227*854d0662SJohn Baldwin crp.crp_payload_length = m->m_pkthdr.len - POLY1305_HASH_LEN;
228*854d0662SJohn Baldwin crp.crp_digest_start = crp.crp_payload_length;
229*854d0662SJohn Baldwin le64enc(crp.crp_iv, nonce);
230*854d0662SJohn Baldwin crp.crp_cipher_key = key;
231*854d0662SJohn Baldwin crp.crp_callback = crypto_callback;
232*854d0662SJohn Baldwin ret = crypto_dispatch(&crp);
233*854d0662SJohn Baldwin crypto_destroyreq(&crp);
234*854d0662SJohn Baldwin return (ret);
235744bfb21SJohn Baldwin }
236744bfb21SJohn Baldwin
237*854d0662SJohn Baldwin int
chacha20poly1305_decrypt_mbuf(struct mbuf * m,const uint64_t nonce,const uint8_t key[CHACHA20POLY1305_KEY_SIZE])238*854d0662SJohn Baldwin chacha20poly1305_decrypt_mbuf(struct mbuf *m, const uint64_t nonce,
239*854d0662SJohn Baldwin const uint8_t key[CHACHA20POLY1305_KEY_SIZE])
240744bfb21SJohn Baldwin {
241*854d0662SJohn Baldwin struct cryptop crp;
242*854d0662SJohn Baldwin int ret;
243*854d0662SJohn Baldwin
244*854d0662SJohn Baldwin if (m->m_pkthdr.len < POLY1305_HASH_LEN)
245*854d0662SJohn Baldwin return (EMSGSIZE);
246*854d0662SJohn Baldwin crypto_initreq(&crp, chacha20_poly1305_sid);
247*854d0662SJohn Baldwin crp.crp_op = CRYPTO_OP_DECRYPT | CRYPTO_OP_VERIFY_DIGEST;
248*854d0662SJohn Baldwin crp.crp_flags = CRYPTO_F_IV_SEPARATE | CRYPTO_F_CBIMM;
249*854d0662SJohn Baldwin crypto_use_mbuf(&crp, m);
250*854d0662SJohn Baldwin crp.crp_payload_length = m->m_pkthdr.len - POLY1305_HASH_LEN;
251*854d0662SJohn Baldwin crp.crp_digest_start = crp.crp_payload_length;
252*854d0662SJohn Baldwin le64enc(crp.crp_iv, nonce);
253*854d0662SJohn Baldwin crp.crp_cipher_key = key;
254*854d0662SJohn Baldwin crp.crp_callback = crypto_callback;
255*854d0662SJohn Baldwin ret = crypto_dispatch(&crp);
256*854d0662SJohn Baldwin crypto_destroyreq(&crp);
257*854d0662SJohn Baldwin if (ret)
258*854d0662SJohn Baldwin return (ret);
259*854d0662SJohn Baldwin m_adj(m, -POLY1305_HASH_LEN);
260*854d0662SJohn Baldwin return (0);
261744bfb21SJohn Baldwin }
262744bfb21SJohn Baldwin
263744bfb21SJohn Baldwin int
crypto_init(void)264744bfb21SJohn Baldwin crypto_init(void)
265744bfb21SJohn Baldwin {
266744bfb21SJohn Baldwin struct crypto_session_params csp = {
267744bfb21SJohn Baldwin .csp_mode = CSP_MODE_AEAD,
268744bfb21SJohn Baldwin .csp_ivlen = sizeof(uint64_t),
269744bfb21SJohn Baldwin .csp_cipher_alg = CRYPTO_CHACHA20_POLY1305,
270744bfb21SJohn Baldwin .csp_cipher_klen = CHACHA20POLY1305_KEY_SIZE,
271744bfb21SJohn Baldwin .csp_flags = CSP_F_SEPARATE_AAD | CSP_F_SEPARATE_OUTPUT
272744bfb21SJohn Baldwin };
273744bfb21SJohn Baldwin int ret = crypto_newsession(&chacha20_poly1305_sid, &csp, CRYPTOCAP_F_SOFTWARE);
274744bfb21SJohn Baldwin if (ret != 0)
275744bfb21SJohn Baldwin return (ret);
276744bfb21SJohn Baldwin return (0);
277744bfb21SJohn Baldwin }
278744bfb21SJohn Baldwin
279744bfb21SJohn Baldwin void
crypto_deinit(void)280744bfb21SJohn Baldwin crypto_deinit(void)
281744bfb21SJohn Baldwin {
282744bfb21SJohn Baldwin crypto_freesession(chacha20_poly1305_sid);
283744bfb21SJohn Baldwin }
284