2 BLAKE2 reference source code package - optimized C implementations
4 Written in 2012 by Samuel Neves <sneves@dei.uc.pt>
6 To the extent possible under law, the author(s) have dedicated all copyright
7 and related and neighboring rights to this software to the public domain
8 worldwide. This software is distributed without any warranty.
10 You should have received a copy of the CC0 Public Domain Dedication along with
11 this software. If not, see <http://creativecommons.org/publicdomain/zero/1.0/>.
14 #ifndef __BLAKE2_IMPL_H__
15 #define __BLAKE2_IMPL_H__
22 #define BLAKE2_IMPL_CAT(x,y) x ## y
23 #define BLAKE2_IMPL_EVAL(x,y) BLAKE2_IMPL_CAT(x,y)
24 #define BLAKE2_IMPL_NAME(fun) BLAKE2_IMPL_EVAL(fun, SUFFIX)
26 static inline uint32_t load32( const void *src )
28 #if defined(NATIVE_LITTLE_ENDIAN) && !defined(HAVE_ALIGNED_ACCESS_REQUIRED)
29 return *( uint32_t * )( src );
31 const uint8_t *p = ( uint8_t * )src;
33 w |= ( uint32_t )( *p++ ) << 8;
34 w |= ( uint32_t )( *p++ ) << 16;
35 w |= ( uint32_t )( *p++ ) << 24;
40 static inline uint64_t load64( const void *src )
42 #if defined(NATIVE_LITTLE_ENDIAN) && !defined(HAVE_ALIGNED_ACCESS_REQUIRED)
43 return *( uint64_t * )( src );
45 const uint8_t *p = ( uint8_t * )src;
47 w |= ( uint64_t )( *p++ ) << 8;
48 w |= ( uint64_t )( *p++ ) << 16;
49 w |= ( uint64_t )( *p++ ) << 24;
50 w |= ( uint64_t )( *p++ ) << 32;
51 w |= ( uint64_t )( *p++ ) << 40;
52 w |= ( uint64_t )( *p++ ) << 48;
53 w |= ( uint64_t )( *p++ ) << 56;
58 static inline void store32( void *dst, uint32_t w )
60 #if defined(NATIVE_LITTLE_ENDIAN) && !defined(HAVE_ALIGNED_ACCESS_REQUIRED)
61 *( uint32_t * )( dst ) = w;
63 uint8_t *p = ( uint8_t * )dst;
64 *p++ = ( uint8_t )w; w >>= 8;
65 *p++ = ( uint8_t )w; w >>= 8;
66 *p++ = ( uint8_t )w; w >>= 8;
71 static inline void store64( void *dst, uint64_t w )
73 #if defined(NATIVE_LITTLE_ENDIAN) && !defined(HAVE_ALIGNED_ACCESS_REQUIRED)
74 *( uint64_t * )( dst ) = w;
76 uint8_t *p = ( uint8_t * )dst;
77 *p++ = ( uint8_t )w; w >>= 8;
78 *p++ = ( uint8_t )w; w >>= 8;
79 *p++ = ( uint8_t )w; w >>= 8;
80 *p++ = ( uint8_t )w; w >>= 8;
81 *p++ = ( uint8_t )w; w >>= 8;
82 *p++ = ( uint8_t )w; w >>= 8;
83 *p++ = ( uint8_t )w; w >>= 8;
88 static inline uint64_t load48( const void *src )
90 const uint8_t *p = ( const uint8_t * )src;
92 w |= ( uint64_t )( *p++ ) << 8;
93 w |= ( uint64_t )( *p++ ) << 16;
94 w |= ( uint64_t )( *p++ ) << 24;
95 w |= ( uint64_t )( *p++ ) << 32;
96 w |= ( uint64_t )( *p++ ) << 40;
100 static inline void store48( void *dst, uint64_t w )
102 uint8_t *p = ( uint8_t * )dst;
103 *p++ = ( uint8_t )w; w >>= 8;
104 *p++ = ( uint8_t )w; w >>= 8;
105 *p++ = ( uint8_t )w; w >>= 8;
106 *p++ = ( uint8_t )w; w >>= 8;
107 *p++ = ( uint8_t )w; w >>= 8;
111 static inline uint32_t rotl32( const uint32_t w, const unsigned c )
113 return ( w << c ) | ( w >> ( 32 - c ) );
116 static inline uint64_t rotl64( const uint64_t w, const unsigned c )
118 return ( w << c ) | ( w >> ( 64 - c ) );
121 static inline uint32_t rotr32( const uint32_t w, const unsigned c )
123 return ( w >> c ) | ( w << ( 32 - c ) );
126 static inline uint64_t rotr64( const uint64_t w, const unsigned c )
128 return ( w >> c ) | ( w << ( 64 - c ) );
131 /* prevents compiler optimizing out memset() */
132 static inline void secure_zero_memory(void *v, size_t n)
135 explicit_bzero(v, n);
137 static void *(*const volatile memset_v)(void *, int, size_t) = &memset;