xref: /openbsd-src/sys/crypto/blake2s.c (revision af293b3df26a0a176bba226b28d9800bfbd2b00a)
/*	$OpenBSD: blake2s.c,v 1.3 2023/02/03 18:31:16 miod Exp $	*/
/*
 * Copyright (C) 2012 Samuel Neves <sneves@dei.uc.pt>. All Rights Reserved.
 * Copyright (C) 2015-2020 Jason A. Donenfeld <Jason@zx2c4.com>. All Rights Reserved.
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 *
 * This is an implementation of the BLAKE2s hash and PRF functions.
 * Information: https://blake2.net/
 */
219960953dSdlg 
229960953dSdlg #include <sys/types.h>
239960953dSdlg #include <sys/systm.h>
249960953dSdlg 
259960953dSdlg #include <crypto/blake2s.h>
269960953dSdlg 
/*
 * Rotate a 32-bit word right by shift bits.
 *
 * Both shift counts are reduced modulo 32, so a count of 0 (or any
 * multiple of 32) returns the word unchanged instead of evaluating an
 * undefined full-width shift.  For counts 1..31 the result is the same as
 * the plain (word >> shift) | (word << (32 - shift)) formulation.
 */
static inline uint32_t
ror32(uint32_t word, unsigned int shift)
{
	return (word >> (shift & 31)) | (word << (-shift & 31));
}
329960953dSdlg 
/*
 * Initialization vector: eight 32-bit words.  They seed the chaining
 * value h[] in blake2s_init_param() and fill the upper half of the work
 * vector v[8..15] in blake2s_compress().
 */
static const uint32_t blake2s_iv[8] = {
	0x6a09e667U,
	0xbb67ae85U,
	0x3c6ef372U,
	0xa54ff53aU,
	0x510e527fU,
	0x9b05688cU,
	0x1f83d9abU,
	0x5be0cd19U
};
379960953dSdlg 
/*
 * Message word schedule: row r gives, for round r, the order in which the
 * sixteen message words m[0..15] are fed to the G mixing steps in
 * blake2s_compress().  Each row is a permutation of 0..15.
 */
static const uint8_t blake2s_sigma[10][16] = {
	/* round 0 */
	{  0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15 },
	/* round 1 */
	{ 14, 10,  4,  8,  9, 15, 13,  6,  1, 12,  0,  2, 11,  7,  5,  3 },
	/* round 2 */
	{ 11,  8, 12,  0,  5,  2, 15, 13, 10, 14,  3,  6,  7,  1,  9,  4 },
	/* round 3 */
	{  7,  9,  3,  1, 13, 12, 11, 14,  2,  6,  5, 10,  4,  0, 15,  8 },
	/* round 4 */
	{  9,  0,  5,  7,  2,  4, 10, 15, 14,  1, 11, 12,  6,  8,  3, 13 },
	/* round 5 */
	{  2, 12,  6, 10,  0, 11,  8,  3,  4, 13,  7,  5, 15, 14,  1,  9 },
	/* round 6 */
	{ 12,  5,  1, 15, 14, 13,  4, 10,  0,  7,  6,  3,  9,  2,  8, 11 },
	/* round 7 */
	{ 13, 11,  7, 14, 12,  1,  3,  9,  5,  0, 15,  4,  8,  6,  2, 10 },
	/* round 8 */
	{  6, 15, 14,  9, 11,  3,  0,  8, 12,  2, 13,  7,  1,  4, 10,  5 },
	/* round 9 */
	{ 10,  2,  8,  4,  7,  6,  1,  5, 15, 11,  9, 14,  3, 12, 13,  0 },
};
509960953dSdlg 
blake2s_set_lastblock(struct blake2s_state * state)519960953dSdlg static inline void blake2s_set_lastblock(struct blake2s_state *state)
529960953dSdlg {
539960953dSdlg 	state->f[0] = -1;
549960953dSdlg }
559960953dSdlg 
blake2s_increment_counter(struct blake2s_state * state,const uint32_t inc)569960953dSdlg static inline void blake2s_increment_counter(struct blake2s_state *state,
579960953dSdlg 					     const uint32_t inc)
589960953dSdlg {
599960953dSdlg 	state->t[0] += inc;
609960953dSdlg 	state->t[1] += (state->t[0] < inc);
619960953dSdlg }
629960953dSdlg 
blake2s_init_param(struct blake2s_state * state,const uint32_t param)639960953dSdlg static inline void blake2s_init_param(struct blake2s_state *state,
649960953dSdlg 				      const uint32_t param)
659960953dSdlg {
669960953dSdlg 	int i;
679960953dSdlg 
689960953dSdlg 	memset(state, 0, sizeof(*state));
699960953dSdlg 	for (i = 0; i < 8; ++i)
709960953dSdlg 		state->h[i] = blake2s_iv[i];
719960953dSdlg 	state->h[0] ^= param;
729960953dSdlg }
739960953dSdlg 
blake2s_init(struct blake2s_state * state,const size_t outlen)749960953dSdlg void blake2s_init(struct blake2s_state *state, const size_t outlen)
759960953dSdlg {
769960953dSdlg 	KASSERT(!(!outlen || outlen > BLAKE2S_HASH_SIZE));
779960953dSdlg 	blake2s_init_param(state, 0x01010000 | outlen);
789960953dSdlg 	state->outlen = outlen;
799960953dSdlg }
809960953dSdlg 
blake2s_init_key(struct blake2s_state * state,const size_t outlen,const void * key,const size_t keylen)819960953dSdlg void blake2s_init_key(struct blake2s_state *state, const size_t outlen,
829960953dSdlg 		      const void *key, const size_t keylen)
839960953dSdlg {
849960953dSdlg 	uint8_t block[BLAKE2S_BLOCK_SIZE] = { 0 };
859960953dSdlg 
869960953dSdlg 	KASSERT(!(!outlen || outlen > BLAKE2S_HASH_SIZE ||
879960953dSdlg 		  !key || !keylen || keylen > BLAKE2S_KEY_SIZE));
889960953dSdlg 
899960953dSdlg 	blake2s_init_param(state, 0x01010000 | keylen << 8 | outlen);
909960953dSdlg 	state->outlen = outlen;
919960953dSdlg 	memcpy(block, key, keylen);
929960953dSdlg 	blake2s_update(state, block, BLAKE2S_BLOCK_SIZE);
939960953dSdlg 	explicit_bzero(block, BLAKE2S_BLOCK_SIZE);
949960953dSdlg }
959960953dSdlg 
blake2s_compress(struct blake2s_state * state,const uint8_t * block,size_t nblocks,const uint32_t inc)969960953dSdlg static inline void blake2s_compress(struct blake2s_state *state,
979960953dSdlg 				    const uint8_t *block, size_t nblocks,
989960953dSdlg 				    const uint32_t inc)
999960953dSdlg {
1009960953dSdlg 	uint32_t m[16];
1019960953dSdlg 	uint32_t v[16];
1029960953dSdlg 	int i;
1039960953dSdlg 
1049960953dSdlg 	KASSERT(!((nblocks > 1 && inc != BLAKE2S_BLOCK_SIZE)));
1059960953dSdlg 
1069960953dSdlg 	while (nblocks > 0) {
1079960953dSdlg 		blake2s_increment_counter(state, inc);
1089960953dSdlg 		memcpy(m, block, BLAKE2S_BLOCK_SIZE);
1099960953dSdlg 		for (i = 0; i < 16; i++)
1109960953dSdlg 			m[i] = le32toh(m[i]);
1119960953dSdlg 		memcpy(v, state->h, 32);
1129960953dSdlg 		v[ 8] = blake2s_iv[0];
1139960953dSdlg 		v[ 9] = blake2s_iv[1];
1149960953dSdlg 		v[10] = blake2s_iv[2];
1159960953dSdlg 		v[11] = blake2s_iv[3];
1169960953dSdlg 		v[12] = blake2s_iv[4] ^ state->t[0];
1179960953dSdlg 		v[13] = blake2s_iv[5] ^ state->t[1];
1189960953dSdlg 		v[14] = blake2s_iv[6] ^ state->f[0];
1199960953dSdlg 		v[15] = blake2s_iv[7] ^ state->f[1];
1209960953dSdlg 
1219960953dSdlg #define G(r, i, a, b, c, d) do { \
1229960953dSdlg 	a += b + m[blake2s_sigma[r][2 * i + 0]]; \
1239960953dSdlg 	d = ror32(d ^ a, 16); \
1249960953dSdlg 	c += d; \
1259960953dSdlg 	b = ror32(b ^ c, 12); \
1269960953dSdlg 	a += b + m[blake2s_sigma[r][2 * i + 1]]; \
1279960953dSdlg 	d = ror32(d ^ a, 8); \
1289960953dSdlg 	c += d; \
1299960953dSdlg 	b = ror32(b ^ c, 7); \
1309960953dSdlg } while (0)
1319960953dSdlg 
1329960953dSdlg #define ROUND(r) do { \
1339960953dSdlg 	G(r, 0, v[0], v[ 4], v[ 8], v[12]); \
1349960953dSdlg 	G(r, 1, v[1], v[ 5], v[ 9], v[13]); \
1359960953dSdlg 	G(r, 2, v[2], v[ 6], v[10], v[14]); \
1369960953dSdlg 	G(r, 3, v[3], v[ 7], v[11], v[15]); \
1379960953dSdlg 	G(r, 4, v[0], v[ 5], v[10], v[15]); \
1389960953dSdlg 	G(r, 5, v[1], v[ 6], v[11], v[12]); \
1399960953dSdlg 	G(r, 6, v[2], v[ 7], v[ 8], v[13]); \
1409960953dSdlg 	G(r, 7, v[3], v[ 4], v[ 9], v[14]); \
1419960953dSdlg } while (0)
1429960953dSdlg 		ROUND(0);
1439960953dSdlg 		ROUND(1);
1449960953dSdlg 		ROUND(2);
1459960953dSdlg 		ROUND(3);
1469960953dSdlg 		ROUND(4);
1479960953dSdlg 		ROUND(5);
1489960953dSdlg 		ROUND(6);
1499960953dSdlg 		ROUND(7);
1509960953dSdlg 		ROUND(8);
1519960953dSdlg 		ROUND(9);
1529960953dSdlg 
1539960953dSdlg #undef G
1549960953dSdlg #undef ROUND
1559960953dSdlg 
1569960953dSdlg 		for (i = 0; i < 8; ++i)
1579960953dSdlg 			state->h[i] ^= v[i] ^ v[i + 8];
1589960953dSdlg 
1599960953dSdlg 		block += BLAKE2S_BLOCK_SIZE;
1609960953dSdlg 		--nblocks;
1619960953dSdlg 	}
1629960953dSdlg }
1639960953dSdlg 
blake2s_update(struct blake2s_state * state,const uint8_t * in,size_t inlen)1649960953dSdlg void blake2s_update(struct blake2s_state *state, const uint8_t *in, size_t inlen)
1659960953dSdlg {
1669960953dSdlg 	const size_t fill = BLAKE2S_BLOCK_SIZE - state->buflen;
1679960953dSdlg 
1689960953dSdlg 	if (!inlen)
1699960953dSdlg 		return;
1709960953dSdlg 	if (inlen > fill) {
1719960953dSdlg 		memcpy(state->buf + state->buflen, in, fill);
1729960953dSdlg 		blake2s_compress(state, state->buf, 1, BLAKE2S_BLOCK_SIZE);
1739960953dSdlg 		state->buflen = 0;
1749960953dSdlg 		in += fill;
1759960953dSdlg 		inlen -= fill;
1769960953dSdlg 	}
1779960953dSdlg 	if (inlen > BLAKE2S_BLOCK_SIZE) {
1789960953dSdlg 		const size_t nblocks =
1799960953dSdlg 			(inlen + BLAKE2S_BLOCK_SIZE - 1) / BLAKE2S_BLOCK_SIZE;
1809960953dSdlg 		/* Hash one less (full) block than strictly possible */
1819960953dSdlg 		blake2s_compress(state, in, nblocks - 1, BLAKE2S_BLOCK_SIZE);
1829960953dSdlg 		in += BLAKE2S_BLOCK_SIZE * (nblocks - 1);
1839960953dSdlg 		inlen -= BLAKE2S_BLOCK_SIZE * (nblocks - 1);
1849960953dSdlg 	}
1859960953dSdlg 	memcpy(state->buf + state->buflen, in, inlen);
1869960953dSdlg 	state->buflen += inlen;
1879960953dSdlg }
1889960953dSdlg 
blake2s_final(struct blake2s_state * state,uint8_t * out)1899960953dSdlg void blake2s_final(struct blake2s_state *state, uint8_t *out)
1909960953dSdlg {
1919960953dSdlg 	int i;
1929960953dSdlg 	blake2s_set_lastblock(state);
1939960953dSdlg 	memset(state->buf + state->buflen, 0,
1949960953dSdlg 	       BLAKE2S_BLOCK_SIZE - state->buflen); /* Padding */
1959960953dSdlg 	blake2s_compress(state, state->buf, 1, state->buflen);
1969960953dSdlg 	for (i = 0; i < 8; i++)
1979960953dSdlg 		state->h[i] = htole32(state->h[i]);
1989960953dSdlg 	memcpy(out, state->h, state->outlen);
1999960953dSdlg 	explicit_bzero(state, sizeof(*state));
2009960953dSdlg }
2019960953dSdlg 
blake2s_hmac(uint8_t * out,const uint8_t * in,const uint8_t * key,const size_t outlen,const size_t inlen,const size_t keylen)2029960953dSdlg void blake2s_hmac(uint8_t *out, const uint8_t *in, const uint8_t *key, const size_t outlen,
2039960953dSdlg 		  const size_t inlen, const size_t keylen)
2049960953dSdlg {
2059960953dSdlg 	struct blake2s_state state;
2069960953dSdlg 	uint8_t x_key[BLAKE2S_BLOCK_SIZE] __aligned(__alignof__(uint32_t)) = { 0 };
2079960953dSdlg 	uint8_t i_hash[BLAKE2S_HASH_SIZE] __aligned(__alignof__(uint32_t));
2089960953dSdlg 	int i;
2099960953dSdlg 
2109960953dSdlg 	if (keylen > BLAKE2S_BLOCK_SIZE) {
2119960953dSdlg 		blake2s_init(&state, BLAKE2S_HASH_SIZE);
2129960953dSdlg 		blake2s_update(&state, key, keylen);
2139960953dSdlg 		blake2s_final(&state, x_key);
2149960953dSdlg 	} else
2159960953dSdlg 		memcpy(x_key, key, keylen);
2169960953dSdlg 
2179960953dSdlg 	for (i = 0; i < BLAKE2S_BLOCK_SIZE; ++i)
2189960953dSdlg 		x_key[i] ^= 0x36;
2199960953dSdlg 
2209960953dSdlg 	blake2s_init(&state, BLAKE2S_HASH_SIZE);
2219960953dSdlg 	blake2s_update(&state, x_key, BLAKE2S_BLOCK_SIZE);
2229960953dSdlg 	blake2s_update(&state, in, inlen);
2239960953dSdlg 	blake2s_final(&state, i_hash);
2249960953dSdlg 
2259960953dSdlg 	for (i = 0; i < BLAKE2S_BLOCK_SIZE; ++i)
2269960953dSdlg 		x_key[i] ^= 0x5c ^ 0x36;
2279960953dSdlg 
2289960953dSdlg 	blake2s_init(&state, BLAKE2S_HASH_SIZE);
2299960953dSdlg 	blake2s_update(&state, x_key, BLAKE2S_BLOCK_SIZE);
2309960953dSdlg 	blake2s_update(&state, i_hash, BLAKE2S_HASH_SIZE);
2319960953dSdlg 	blake2s_final(&state, i_hash);
2329960953dSdlg 
2339960953dSdlg 	memcpy(out, i_hash, outlen);
2349960953dSdlg 	explicit_bzero(x_key, BLAKE2S_BLOCK_SIZE);
2359960953dSdlg 	explicit_bzero(i_hash, BLAKE2S_HASH_SIZE);
2369960953dSdlg }
237