275 lines
7.3 KiB
C
275 lines
7.3 KiB
C
|
/*
   BLAKE2 reference source code package - optimized C implementations

   Written in 2012 by Samuel Neves <sneves@dei.uc.pt>

   To the extent possible under law, the author(s) have dedicated all copyright
   and related and neighboring rights to this software to the public domain
   worldwide. This software is distributed without any warranty.

   You should have received a copy of the CC0 Public Domain Dedication along with
   this software. If not, see <http://creativecommons.org/publicdomain/zero/1.0/>.
*/
|
||
|
|
||
|
#include <stdlib.h>
|
||
|
#include <string.h>
|
||
|
#include <stdio.h>
|
||
|
|
||
|
#if defined(_OPENMP)
|
||
|
#include <omp.h>
|
||
|
#endif
|
||
|
|
||
|
#include "blake2.h"
|
||
|
#include "blake2-impl.h"
|
||
|
|
||
|
#define PARALLELISM_DEGREE 8
|
||
|
|
||
|
/*
 * Initialise one leaf state of the BLAKE2sp tree.
 *
 * Builds a parameter block with fanout PARALLELISM_DEGREE, depth 2 and
 * node_depth 0, stores `offset` as the node offset, zeroes salt and
 * personalisation, and hands it to blake2s_init_param().
 *
 *   S       leaf state to initialise
 *   outlen  digest length recorded in the parameter block
 *   keylen  key length recorded in the parameter block
 *   offset  index of this leaf, written to node_offset
 *
 * Returns the result of blake2s_init_param(); callers in this file treat a
 * negative value as failure.
 */
static int blake2sp_init_leaf( blake2s_state *S, uint8_t outlen, uint8_t keylen, uint64_t offset )
{
  blake2s_param P[1];
  int err;

  P->digest_length = outlen;
  P->key_length = keylen;
  P->fanout = PARALLELISM_DEGREE;
  P->depth = 2;
  P->leaf_length = 0;
  store48( P->node_offset, offset );
  P->node_depth = 0;
  P->inner_length = BLAKE2S_OUTBYTES;
  memset( P->salt, 0, sizeof( P->salt ) );
  memset( P->personal, 0, sizeof( P->personal ) );

  /* Propagate the initialiser's status instead of unconditionally returning 0,
     so the `< 0` checks performed by the callers are meaningful. */
  err = blake2s_init_param( S, P );

  /* Leaves are finalised with BLAKE2S_OUTBYTES bytes elsewhere in this file,
     so the state's output length is set to inner_length, not digest_length. */
  S->outlen = P->inner_length;
  return err;
}
|
||
|
|
||
|
/*
 * Initialise the root state of the BLAKE2sp tree.
 *
 * Builds a parameter block with fanout PARALLELISM_DEGREE, depth 2,
 * node_depth 1 and node offset 0, zeroes salt and personalisation, and hands
 * it to blake2s_init_param().
 *
 *   S       root state to initialise
 *   outlen  digest length; also becomes the state's output length
 *   keylen  key length recorded in the parameter block
 *
 * Returns the result of blake2s_init_param(); callers in this file treat a
 * negative value as failure.
 */
static int blake2sp_init_root( blake2s_state *S, uint8_t outlen, uint8_t keylen )
{
  blake2s_param P[1];
  int err;

  P->digest_length = outlen;
  P->key_length = keylen;
  P->fanout = PARALLELISM_DEGREE;
  P->depth = 2;
  P->leaf_length = 0;
  store48( P->node_offset, 0ULL );
  P->node_depth = 1;
  P->inner_length = BLAKE2S_OUTBYTES;
  memset( P->salt, 0, sizeof( P->salt ) );
  memset( P->personal, 0, sizeof( P->personal ) );

  /* Propagate the initialiser's status instead of unconditionally returning 0,
     so the `< 0` checks performed by the callers are meaningful. */
  err = blake2s_init_param( S, P );
  S->outlen = P->digest_length;
  return err;
}
|
||
|
|
||
|
|
||
|
/*
 * Prepare an unkeyed BLAKE2sp streaming state.
 *
 *   S       state to initialise
 *   outlen  requested digest length, 1..BLAKE2S_OUTBYTES
 *
 * Clears the staging buffer, initialises the root and all
 * PARALLELISM_DEGREE leaves with key length 0, and flags the root and the
 * final leaf as last nodes.
 *
 * Returns 0 on success, -1 if outlen is out of range or a sub-state fails
 * to initialise.
 */
int blake2sp_init( blake2sp_state *S, size_t outlen )
{
  size_t leaf = 0;

  if( outlen == 0 || outlen > BLAKE2S_OUTBYTES )
    return -1;

  S->buflen = 0;
  memset( S->buf, 0, sizeof( S->buf ) );

  if( blake2sp_init_root( S->R, ( uint8_t ) outlen, 0 ) < 0 )
    return -1;

  while( leaf < PARALLELISM_DEGREE )
  {
    if( blake2sp_init_leaf( S->S[leaf], ( uint8_t ) outlen, 0, leaf ) < 0 )
      return -1;

    ++leaf;
  }

  S->outlen = ( uint8_t ) outlen;
  S->S[PARALLELISM_DEGREE - 1]->last_node = 1;
  S->R->last_node = 1;
  return 0;
}
|
||
|
|
||
|
/*
 * Prepare a keyed BLAKE2sp streaming state.
 *
 *   S       state to initialise
 *   outlen  requested digest length, 1..BLAKE2S_OUTBYTES
 *   key     key bytes, must not be NULL
 *   keylen  key length, 1..BLAKE2S_KEYBYTES
 *
 * Initialises the root and all PARALLELISM_DEGREE leaves with the given key
 * length, flags the root and the final leaf as last nodes, then feeds the
 * key, zero-padded to one full block, into every leaf.
 *
 * Returns 0 on success, -1 on an invalid argument or if a sub-state fails
 * to initialise.
 */
int blake2sp_init_key( blake2sp_state *S, size_t outlen, const void *key, size_t keylen )
{
  uint8_t padded_key[BLAKE2S_BLOCKBYTES];
  size_t leaf;

  if( outlen == 0 || outlen > BLAKE2S_OUTBYTES )
    return -1;

  if( key == NULL || keylen == 0 || keylen > BLAKE2S_KEYBYTES )
    return -1;

  S->buflen = 0;
  memset( S->buf, 0, sizeof( S->buf ) );

  if( blake2sp_init_root( S->R, ( uint8_t ) outlen, ( uint8_t ) keylen ) < 0 )
    return -1;

  leaf = 0;

  while( leaf < PARALLELISM_DEGREE )
  {
    if( blake2sp_init_leaf( S->S[leaf], ( uint8_t ) outlen, ( uint8_t ) keylen, leaf ) < 0 )
      return -1;

    ++leaf;
  }

  S->outlen = ( uint8_t ) outlen;
  S->S[PARALLELISM_DEGREE - 1]->last_node = 1;
  S->R->last_node = 1;

  /* The key occupies the start of an otherwise all-zero block. */
  memset( padded_key, 0, BLAKE2S_BLOCKBYTES );
  memcpy( padded_key, key, keylen );

  for( leaf = 0; leaf < PARALLELISM_DEGREE; ++leaf )
  {
    blake2s_update( S->S[leaf], padded_key, BLAKE2S_BLOCKBYTES );
  }

  /* Do not leave key material behind on the stack. */
  secure_zero_memory( padded_key, BLAKE2S_BLOCKBYTES );
  return 0;
}
|
||
|
|
||
|
|
||
|
/*
 * Absorb `inlen` bytes from `in` into a BLAKE2sp streaming state.
 *
 *   S      state previously set up by blake2sp_init() or blake2sp_init_key()
 *   in     input bytes; not read when inlen is 0
 *   inlen  number of input bytes
 *
 * Input is consumed in stripes of PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES
 * bytes; block i of each stripe is fed to leaf i. Bytes that do not complete
 * a stripe are kept in S->buf for a later call.
 *
 * Always returns 0.
 */
int blake2sp_update( blake2sp_state *S, const uint8_t *in, size_t inlen )
{
  size_t left = S->buflen;
  size_t fill = sizeof( S->buf ) - left;

  /* Nothing to absorb: the state is left untouched. Returning here also
     avoids doing pointer arithmetic on a possibly-NULL `in`. */
  if( inlen == 0 ) return 0;

  /* Top up a partially filled staging buffer and flush it as one stripe. */
  if( left && inlen >= fill )
  {
    memcpy( S->buf + left, in, fill );

    for( size_t i = 0; i < PARALLELISM_DEGREE; ++i )
      blake2s_update( S->S[i], S->buf + i * BLAKE2S_BLOCKBYTES, BLAKE2S_BLOCKBYTES );

    in += fill;
    inlen -= fill;
    left = 0;
  }

  /* One iteration per leaf. A work-shared loop is used instead of a bare
     parallel region indexed by thread number, so every leaf is processed
     even when the runtime provides fewer than PARALLELISM_DEGREE threads.
     The num_threads clause replaces omp_set_num_threads(), which would alter
     the caller's global thread setting. */
#if defined(_OPENMP)
  #pragma omp parallel for shared(S) num_threads(PARALLELISM_DEGREE)
#endif
  for( int lane = 0; lane < PARALLELISM_DEGREE; ++lane )
  {
    const size_t leaf = ( size_t ) lane;
    /* Integer offsets rather than pointers: a lane's starting position may
       lie beyond the end of a short input and must not be formed as a pointer
       unless it is actually read. */
    size_t offset = leaf * BLAKE2S_BLOCKBYTES;
    size_t remaining = inlen;

    while( remaining >= PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES )
    {
      blake2s_update( S->S[leaf], in + offset, BLAKE2S_BLOCKBYTES );
      offset += PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES;
      remaining -= PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES;
    }
  }

  /* Skip the whole stripes consumed above; keep the tail for later. */
  in += inlen - inlen % ( PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES );
  inlen %= PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES;

  if( inlen > 0 )
    memcpy( S->buf + left, in, inlen );

  S->buflen = ( uint32_t ) left + ( uint32_t ) inlen;
  return 0;
}
|
||
|
|
||
|
|
||
|
/*
 * Finish a BLAKE2sp streaming computation and write the digest.
 *
 *   S       state that has been initialised and updated
 *   out     destination for the digest; must not be NULL
 *   outlen  must equal the digest length the state was initialised with
 *
 * Each leaf absorbs its share of the bytes still held in S->buf and is
 * finalised to BLAKE2S_OUTBYTES bytes; the leaf digests are then fed, in
 * leaf order, to the root, which produces the final output.
 *
 * Returns -1 if out is NULL or outlen does not match S->outlen; otherwise
 * returns the result of finalising the root state.
 */
int blake2sp_final( blake2sp_state *S, uint8_t *out, size_t outlen )
{
  uint8_t hash[PARALLELISM_DEGREE][BLAKE2S_OUTBYTES];

  if( NULL == out ) return -1;

  if( S->outlen != outlen ) return -1;

  for( size_t i = 0; i < PARALLELISM_DEGREE; ++i )
  {
    /* Leaf i owns the i-th block-sized slice of the staging buffer. */
    if( S->buflen > i * BLAKE2S_BLOCKBYTES )
    {
      size_t left = S->buflen - i * BLAKE2S_BLOCKBYTES;

      if( left > BLAKE2S_BLOCKBYTES ) left = BLAKE2S_BLOCKBYTES;

      blake2s_update( S->S[i], S->buf + i * BLAKE2S_BLOCKBYTES, left );
    }

    blake2s_final( S->S[i], hash[i], BLAKE2S_OUTBYTES );
  }

  for( size_t i = 0; i < PARALLELISM_DEGREE; ++i )
    blake2s_update( S->R, hash[i], BLAKE2S_OUTBYTES );

  /* Report the root's status rather than a hard-coded 0, matching what the
     one-shot blake2sp() does. */
  return blake2s_final( S->R, out, outlen );
}
|
||
|
|
||
|
|
||
|
int blake2sp( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen )
|
||
|
{
|
||
|
uint8_t hash[PARALLELISM_DEGREE][BLAKE2S_OUTBYTES];
|
||
|
blake2s_state S[PARALLELISM_DEGREE][1];
|
||
|
blake2s_state FS[1];
|
||
|
|
||
|
/* Verify parameters */
|
||
|
if ( NULL == in && inlen > 0 ) return -1;
|
||
|
|
||
|
if ( NULL == out ) return -1;
|
||
|
|
||
|
if ( NULL == key && keylen > 0 ) return -1;
|
||
|
|
||
|
if( !outlen || outlen > BLAKE2S_OUTBYTES ) return -1;
|
||
|
|
||
|
if( keylen > BLAKE2S_KEYBYTES ) return -1;
|
||
|
|
||
|
for( size_t i = 0; i < PARALLELISM_DEGREE; ++i )
|
||
|
if( blake2sp_init_leaf( S[i], ( uint8_t ) outlen, ( uint8_t ) keylen, i ) < 0 )
|
||
|
return -1;
|
||
|
|
||
|
S[PARALLELISM_DEGREE - 1]->last_node = 1; // mark last node
|
||
|
|
||
|
if( keylen > 0 )
|
||
|
{
|
||
|
uint8_t block[BLAKE2S_BLOCKBYTES];
|
||
|
memset( block, 0, BLAKE2S_BLOCKBYTES );
|
||
|
memcpy( block, key, keylen );
|
||
|
|
||
|
for( size_t i = 0; i < PARALLELISM_DEGREE; ++i )
|
||
|
blake2s_update( S[i], block, BLAKE2S_BLOCKBYTES );
|
||
|
|
||
|
secure_zero_memory( block, BLAKE2S_BLOCKBYTES ); /* Burn the key from stack */
|
||
|
}
|
||
|
|
||
|
#if defined(_OPENMP)
|
||
|
omp_set_num_threads(PARALLELISM_DEGREE);
|
||
|
#pragma omp parallel shared(S,hash)
|
||
|
#else
|
||
|
|
||
|
for( size_t id__ = 0; id__ < PARALLELISM_DEGREE; ++id__ )
|
||
|
#endif
|
||
|
{
|
||
|
#if defined(_OPENMP)
|
||
|
size_t id__ = ( size_t ) omp_get_thread_num();
|
||
|
#endif
|
||
|
size_t inlen__ = inlen;
|
||
|
const uint8_t *in__ = ( const uint8_t * )in;
|
||
|
in__ += id__ * BLAKE2S_BLOCKBYTES;
|
||
|
|
||
|
while( inlen__ >= PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES )
|
||
|
{
|
||
|
blake2s_update( S[id__], in__, BLAKE2S_BLOCKBYTES );
|
||
|
in__ += PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES;
|
||
|
inlen__ -= PARALLELISM_DEGREE * BLAKE2S_BLOCKBYTES;
|
||
|
}
|
||
|
|
||
|
if( inlen__ > id__ * BLAKE2S_BLOCKBYTES )
|
||
|
{
|
||
|
const size_t left = inlen__ - id__ * BLAKE2S_BLOCKBYTES;
|
||
|
const size_t len = left <= BLAKE2S_BLOCKBYTES ? left : BLAKE2S_BLOCKBYTES;
|
||
|
blake2s_update( S[id__], in__, len );
|
||
|
}
|
||
|
|
||
|
blake2s_final( S[id__], hash[id__], BLAKE2S_OUTBYTES );
|
||
|
}
|
||
|
|
||
|
if( blake2sp_init_root( FS, ( uint8_t ) outlen, ( uint8_t ) keylen ) < 0 )
|
||
|
return -1;
|
||
|
|
||
|
FS->last_node = 1;
|
||
|
|
||
|
for( size_t i = 0; i < PARALLELISM_DEGREE; ++i )
|
||
|
blake2s_update( FS, hash[i], BLAKE2S_OUTBYTES );
|
||
|
|
||
|
return blake2s_final( FS, out, outlen );
|
||
|
}
|
||
|
|
||
|
|
||
|
|
||
|
|