/*	$OpenBSD: blake2s.c,v 1.3 2023/02/03 18:31:16 miod Exp $	*/
/*
 * Copyright (C) 2012 Samuel Neves <sneves@dei.uc.pt>. All Rights Reserved.
 * Copyright (C) 2015-2020 Jason A. Donenfeld <Jason@zx2c4.com>. All Rights Reserved.
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 *
 * This is an implementation of the BLAKE2s hash and PRF functions.
 * Information: https://blake2.net/
 */
210949a0d6SAaron LI
220949a0d6SAaron LI #include <sys/types.h>
230949a0d6SAaron LI #include <sys/systm.h>
2415b48a60SAaron LI #include <sys/endian.h>
250949a0d6SAaron LI
2615b48a60SAaron LI #include <crypto/blake2/blake2s.h>
270949a0d6SAaron LI
/*
 * Rotate a 32-bit word right by `shift` bit positions.
 *
 * Both shift counts are reduced modulo 32, so a rotation by 0 (or by any
 * multiple of 32) returns `word` unchanged.  Without the masking, a shift
 * of 0 would evaluate `word << 32`, which is undefined behaviour in C
 * because the shift count equals the width of the type.
 */
static inline uint32_t
ror32(uint32_t word, unsigned int shift)
{
	return (word >> (shift & 31)) | (word << ((32 - shift) & 31));
}
320949a0d6SAaron LI
/*
 * BLAKE2s initialization vector.  It seeds the chaining value h[] in
 * blake2s_init_param() and the upper half of the working vector in
 * blake2s_compress().
 */
static const uint32_t blake2s_iv[8] = {
	0x6A09E667UL,
	0xBB67AE85UL,
	0x3C6EF372UL,
	0xA54FF53AUL,
	0x510E527FUL,
	0x9B05688CUL,
	0x1F83D9ABUL,
	0x5BE0CD19UL
};
370949a0d6SAaron LI
/*
 * Message word schedule: row r lists, in order, the indices into the
 * 16-word message block m[] that the G function consumes during round r
 * of blake2s_compress().
 */
static const uint8_t blake2s_sigma[10][16] = {
	/* round 0 */
	{  0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15 },
	/* round 1 */
	{ 14, 10,  4,  8,  9, 15, 13,  6,  1, 12,  0,  2, 11,  7,  5,  3 },
	/* round 2 */
	{ 11,  8, 12,  0,  5,  2, 15, 13, 10, 14,  3,  6,  7,  1,  9,  4 },
	/* round 3 */
	{  7,  9,  3,  1, 13, 12, 11, 14,  2,  6,  5, 10,  4,  0, 15,  8 },
	/* round 4 */
	{  9,  0,  5,  7,  2,  4, 10, 15, 14,  1, 11, 12,  6,  8,  3, 13 },
	/* round 5 */
	{  2, 12,  6, 10,  0, 11,  8,  3,  4, 13,  7,  5, 15, 14,  1,  9 },
	/* round 6 */
	{ 12,  5,  1, 15, 14, 13,  4, 10,  0,  7,  6,  3,  9,  2,  8, 11 },
	/* round 7 */
	{ 13, 11,  7, 14, 12,  1,  3,  9,  5,  0, 15,  4,  8,  6,  2, 10 },
	/* round 8 */
	{  6, 15, 14,  9, 11,  3,  0,  8, 12,  2, 13,  7,  1,  4, 10,  5 },
	/* round 9 */
	{ 10,  2,  8,  4,  7,  6,  1,  5, 15, 11,  9, 14,  3, 12, 13,  0 }
};
500949a0d6SAaron LI
blake2s_set_lastblock(struct blake2s_state * state)510949a0d6SAaron LI static inline void blake2s_set_lastblock(struct blake2s_state *state)
520949a0d6SAaron LI {
530949a0d6SAaron LI state->f[0] = -1;
540949a0d6SAaron LI }
550949a0d6SAaron LI
blake2s_increment_counter(struct blake2s_state * state,uint32_t inc)560949a0d6SAaron LI static inline void blake2s_increment_counter(struct blake2s_state *state,
5704473dc8SAaron LI uint32_t inc)
580949a0d6SAaron LI {
590949a0d6SAaron LI state->t[0] += inc;
600949a0d6SAaron LI state->t[1] += (state->t[0] < inc);
610949a0d6SAaron LI }
620949a0d6SAaron LI
blake2s_init_param(struct blake2s_state * state,uint32_t param)630949a0d6SAaron LI static inline void blake2s_init_param(struct blake2s_state *state,
6404473dc8SAaron LI uint32_t param)
650949a0d6SAaron LI {
660949a0d6SAaron LI int i;
670949a0d6SAaron LI
680949a0d6SAaron LI memset(state, 0, sizeof(*state));
690949a0d6SAaron LI for (i = 0; i < 8; ++i)
700949a0d6SAaron LI state->h[i] = blake2s_iv[i];
710949a0d6SAaron LI state->h[0] ^= param;
720949a0d6SAaron LI }
730949a0d6SAaron LI
blake2s_init(struct blake2s_state * state,size_t outlen)7404473dc8SAaron LI void blake2s_init(struct blake2s_state *state, size_t outlen)
750949a0d6SAaron LI {
7601a03001SAaron LI KKASSERT(outlen > 0 && outlen <= BLAKE2S_HASH_SIZE);
7701a03001SAaron LI
780949a0d6SAaron LI blake2s_init_param(state, 0x01010000 | outlen);
790949a0d6SAaron LI state->outlen = outlen;
800949a0d6SAaron LI }
810949a0d6SAaron LI
blake2s_init_key(struct blake2s_state * state,size_t outlen,const void * key,size_t keylen)8204473dc8SAaron LI void blake2s_init_key(struct blake2s_state *state, size_t outlen,
8304473dc8SAaron LI const void *key, size_t keylen)
840949a0d6SAaron LI {
850949a0d6SAaron LI uint8_t block[BLAKE2S_BLOCK_SIZE] = { 0 };
860949a0d6SAaron LI
8701a03001SAaron LI KKASSERT(outlen > 0 && outlen <= BLAKE2S_HASH_SIZE);
88*acc7135cSAaron LI KKASSERT(key != NULL && keylen > 0 && keylen <= BLAKE2S_KEY_SIZE);
890949a0d6SAaron LI
900949a0d6SAaron LI blake2s_init_param(state, 0x01010000 | keylen << 8 | outlen);
910949a0d6SAaron LI state->outlen = outlen;
920949a0d6SAaron LI memcpy(block, key, keylen);
930949a0d6SAaron LI blake2s_update(state, block, BLAKE2S_BLOCK_SIZE);
940949a0d6SAaron LI explicit_bzero(block, BLAKE2S_BLOCK_SIZE);
950949a0d6SAaron LI }
960949a0d6SAaron LI
blake2s_compress(struct blake2s_state * state,const uint8_t * block,size_t nblocks,uint32_t inc)970949a0d6SAaron LI static inline void blake2s_compress(struct blake2s_state *state,
980949a0d6SAaron LI const uint8_t *block, size_t nblocks,
9904473dc8SAaron LI uint32_t inc)
1000949a0d6SAaron LI {
1010949a0d6SAaron LI uint32_t m[16];
1020949a0d6SAaron LI uint32_t v[16];
1030949a0d6SAaron LI int i;
1040949a0d6SAaron LI
10515b48a60SAaron LI KKASSERT(!((nblocks > 1 && inc != BLAKE2S_BLOCK_SIZE)));
1060949a0d6SAaron LI
1070949a0d6SAaron LI while (nblocks > 0) {
1080949a0d6SAaron LI blake2s_increment_counter(state, inc);
1090949a0d6SAaron LI memcpy(m, block, BLAKE2S_BLOCK_SIZE);
1100949a0d6SAaron LI for (i = 0; i < 16; i++)
1110949a0d6SAaron LI m[i] = le32toh(m[i]);
1120949a0d6SAaron LI memcpy(v, state->h, 32);
1130949a0d6SAaron LI v[ 8] = blake2s_iv[0];
1140949a0d6SAaron LI v[ 9] = blake2s_iv[1];
1150949a0d6SAaron LI v[10] = blake2s_iv[2];
1160949a0d6SAaron LI v[11] = blake2s_iv[3];
1170949a0d6SAaron LI v[12] = blake2s_iv[4] ^ state->t[0];
1180949a0d6SAaron LI v[13] = blake2s_iv[5] ^ state->t[1];
1190949a0d6SAaron LI v[14] = blake2s_iv[6] ^ state->f[0];
1200949a0d6SAaron LI v[15] = blake2s_iv[7] ^ state->f[1];
1210949a0d6SAaron LI
1220949a0d6SAaron LI #define G(r, i, a, b, c, d) do { \
1230949a0d6SAaron LI a += b + m[blake2s_sigma[r][2 * i + 0]]; \
1240949a0d6SAaron LI d = ror32(d ^ a, 16); \
1250949a0d6SAaron LI c += d; \
1260949a0d6SAaron LI b = ror32(b ^ c, 12); \
1270949a0d6SAaron LI a += b + m[blake2s_sigma[r][2 * i + 1]]; \
1280949a0d6SAaron LI d = ror32(d ^ a, 8); \
1290949a0d6SAaron LI c += d; \
1300949a0d6SAaron LI b = ror32(b ^ c, 7); \
1310949a0d6SAaron LI } while (0)
1320949a0d6SAaron LI
1330949a0d6SAaron LI #define ROUND(r) do { \
1340949a0d6SAaron LI G(r, 0, v[0], v[ 4], v[ 8], v[12]); \
1350949a0d6SAaron LI G(r, 1, v[1], v[ 5], v[ 9], v[13]); \
1360949a0d6SAaron LI G(r, 2, v[2], v[ 6], v[10], v[14]); \
1370949a0d6SAaron LI G(r, 3, v[3], v[ 7], v[11], v[15]); \
1380949a0d6SAaron LI G(r, 4, v[0], v[ 5], v[10], v[15]); \
1390949a0d6SAaron LI G(r, 5, v[1], v[ 6], v[11], v[12]); \
1400949a0d6SAaron LI G(r, 6, v[2], v[ 7], v[ 8], v[13]); \
1410949a0d6SAaron LI G(r, 7, v[3], v[ 4], v[ 9], v[14]); \
1420949a0d6SAaron LI } while (0)
1430949a0d6SAaron LI ROUND(0);
1440949a0d6SAaron LI ROUND(1);
1450949a0d6SAaron LI ROUND(2);
1460949a0d6SAaron LI ROUND(3);
1470949a0d6SAaron LI ROUND(4);
1480949a0d6SAaron LI ROUND(5);
1490949a0d6SAaron LI ROUND(6);
1500949a0d6SAaron LI ROUND(7);
1510949a0d6SAaron LI ROUND(8);
1520949a0d6SAaron LI ROUND(9);
1530949a0d6SAaron LI
1540949a0d6SAaron LI #undef G
1550949a0d6SAaron LI #undef ROUND
1560949a0d6SAaron LI
1570949a0d6SAaron LI for (i = 0; i < 8; ++i)
1580949a0d6SAaron LI state->h[i] ^= v[i] ^ v[i + 8];
1590949a0d6SAaron LI
1600949a0d6SAaron LI block += BLAKE2S_BLOCK_SIZE;
1610949a0d6SAaron LI --nblocks;
1620949a0d6SAaron LI }
1630949a0d6SAaron LI }
1640949a0d6SAaron LI
blake2s_update(struct blake2s_state * state,const uint8_t * in,size_t inlen)1650949a0d6SAaron LI void blake2s_update(struct blake2s_state *state, const uint8_t *in, size_t inlen)
1660949a0d6SAaron LI {
1670949a0d6SAaron LI const size_t fill = BLAKE2S_BLOCK_SIZE - state->buflen;
1680949a0d6SAaron LI
1690949a0d6SAaron LI if (!inlen)
1700949a0d6SAaron LI return;
1710949a0d6SAaron LI if (inlen > fill) {
1720949a0d6SAaron LI memcpy(state->buf + state->buflen, in, fill);
1730949a0d6SAaron LI blake2s_compress(state, state->buf, 1, BLAKE2S_BLOCK_SIZE);
1740949a0d6SAaron LI state->buflen = 0;
1750949a0d6SAaron LI in += fill;
1760949a0d6SAaron LI inlen -= fill;
1770949a0d6SAaron LI }
1780949a0d6SAaron LI if (inlen > BLAKE2S_BLOCK_SIZE) {
1790949a0d6SAaron LI const size_t nblocks =
1800949a0d6SAaron LI (inlen + BLAKE2S_BLOCK_SIZE - 1) / BLAKE2S_BLOCK_SIZE;
1810949a0d6SAaron LI /* Hash one less (full) block than strictly possible */
1820949a0d6SAaron LI blake2s_compress(state, in, nblocks - 1, BLAKE2S_BLOCK_SIZE);
1830949a0d6SAaron LI in += BLAKE2S_BLOCK_SIZE * (nblocks - 1);
1840949a0d6SAaron LI inlen -= BLAKE2S_BLOCK_SIZE * (nblocks - 1);
1850949a0d6SAaron LI }
1860949a0d6SAaron LI memcpy(state->buf + state->buflen, in, inlen);
1870949a0d6SAaron LI state->buflen += inlen;
1880949a0d6SAaron LI }
1890949a0d6SAaron LI
blake2s_final(struct blake2s_state * state,uint8_t * out)1900949a0d6SAaron LI void blake2s_final(struct blake2s_state *state, uint8_t *out)
1910949a0d6SAaron LI {
1920949a0d6SAaron LI int i;
19301a03001SAaron LI
1940949a0d6SAaron LI blake2s_set_lastblock(state);
1950949a0d6SAaron LI memset(state->buf + state->buflen, 0,
1960949a0d6SAaron LI BLAKE2S_BLOCK_SIZE - state->buflen); /* Padding */
1970949a0d6SAaron LI blake2s_compress(state, state->buf, 1, state->buflen);
1980949a0d6SAaron LI for (i = 0; i < 8; i++)
1990949a0d6SAaron LI state->h[i] = htole32(state->h[i]);
2000949a0d6SAaron LI memcpy(out, state->h, state->outlen);
2010949a0d6SAaron LI explicit_bzero(state, sizeof(*state));
2020949a0d6SAaron LI }
203