2 BLAKE2 reference source code package - optimized C implementations
4 Written in 2012 by Samuel Neves <sneves@dei.uc.pt>
6 To the extent possible under law, the author(s) have dedicated all copyright
7 and related and neighboring rights to this software to the public domain
8 worldwide. This software is distributed without any warranty.
10 You should have received a copy of the CC0 Public Domain Dedication along with
11 this software. If not, see <http://creativecommons.org/publicdomain/zero/1.0/>.
/* Architecture check: true for 32- and 64-bit x86 targets, tested through
   both the GCC/Clang-style macros (__x86_64__, __i386__) and the MSVC-style
   ones (_M_IX86, _M_X64).
   NOTE(review): the lines this condition guards are not visible in this
   excerpt; presumably it defines HAVE_X86, which later sections test - confirm. */
19 #if defined(__x86_64__) || defined(__i386__) || defined(_M_IX86) || defined(_M_X64)
/* Names for the CPU feature levels. Each entry is a fixed 8-byte char array,
   so a name can hold at most 7 characters plus the terminating NUL.
   The only use visible in this file is the commented-out debug fprintf in
   get_cpu_features(), which indexes the array by the detected feature. */
36 static const char feature_names[][8] =
/* Wrapper around the x86 CPUID instruction, written as GCC-style extended
   inline assembly (the instruction line itself is not visible in this excerpt).
   In:  *eax - value placed in EAX beforehand; it is the only input operand.
   Out: *eax, *ebx, *ecx, *edx - receive the four output operands.
   Note that *ecx is output-only: a value the caller stores there beforehand
   is not handed to the instruction. */
52 static inline void cpuid( uint32_t *eax, uint32_t *ebx, uint32_t *ecx, uint32_t *edx )
55 #if defined(__i386__) /* This is needed for -fPIC to work on i386 */
/* Copy the current EBX into ESI so it can be put back afterwards. */
56 "movl %%ebx, %%esi\n\t"
/* Swap the two registers: EBX gets the saved value back, ESI keeps the result. */
60 "xchgl %%ebx, %%esi\n\t"
/* i386 operand list: the value for *ebx is taken from ESI ("=S"). */
61 : "=a"( *eax ), "=S"( *ebx ), "=c"( *ecx ), "=d"( *edx ) : "a"( *eax ) );
/* Alternative operand list: the value for *ebx is taken from EBX ("=b"). */
63 : "=a"( *eax ), "=b"( *ebx ), "=c"( *ecx ), "=d"( *edx ) : "a"( *eax ) );
/* Returns a 64-bit value for the register index given in xcr.
   NOTE(review): only the signature and the return statement are visible in
   this excerpt; presumably a and d are filled by an XGETBV instruction with
   the low and high halves of the selected extended control register - confirm. */
67 static inline uint64_t xgetbv(uint32_t xcr)
/* d is shifted into bits 63..32 and OR-ed with a. */
75 return ((uint64_t)d << 32) | a;
78 #elif defined(_MSC_VER)
/* MSVC variant of cpuid(): same signature as the inline-assembly version,
   built on the __cpuid intrinsic.
   NOTE(review): the declaration of regs and the code that copies it back into
   the four out-parameters are not visible in this excerpt. */
80 static inline void cpuid( uint32_t *eax, uint32_t *ebx, uint32_t *ecx, uint32_t *edx )
/* Query the leaf number held in *eax; the intrinsic writes its results to regs. */
83 __cpuid( regs, *eax );
/* No supported compiler branch matched: stop the build instead of continuing
   without a cpuid() implementation. */
90 #error "Don't know how to call cpuid on this compiler!"
/* Determines the instruction-set level used to index the dispatch tables and
   returns it as a cpu_feature_t.
   State is kept in two function-local statics: `feature` (starts as NONE) and
   `initialized` (starts as 0).
   NOTE(review): this excerpt omits several lines of the body, including the
   statement controlled by each `if`, the code that loads the CPUID leaf into
   eax, and the code that reads and sets `initialized`. The per-test comments
   below name the CPU flag that each bit position corresponds to, assuming
   leaf 1 is queried first and extended leaf 0x80000001 second - confirm
   against the full file.
   NOTE(review): whether the cpuid() call that follows the "For future
   architectures" comment is live or part of a disabled section cannot be
   determined from this excerpt.
   NOTE(review): `initialized` is volatile rather than atomic and no locking is
   visible here; check whether concurrent first calls matter to callers. */
95 static inline cpu_feature_t get_cpu_features( void )
98 static volatile int initialized = 0;
99 static cpu_feature_t feature = NONE; // Safe default
100 uint32_t eax, ecx, edx, ebx;
106 cpuid( &eax, &ebx, &ecx, &edx );
/* EDX bit 26: SSE2 (leaf 1 assumed). */
108 if( 1 & ( edx >> 26 ) )
/* ECX bit 9: SSSE3 (leaf 1 assumed). */
111 if( 1 & ( ecx >> 9 ) )
/* ECX bit 19: SSE4.1 (leaf 1 assumed). */
114 if( 1 & ( ecx >> 19 ) )
117 #if defined(WIN32) /* Work around the fact that Windows <7 does NOT support AVX... */
118 if( IsProcessorFeaturePresent(17) ) /* Some environments don't know about PF_XSAVE_ENABLED */
121 /* check for AVX and OSXSAVE bits */
/* Bit 0 of ( ecx >> 28 ) & ( ecx >> 27 ) is set only when ECX bit 28 (AVX)
   and ECX bit 27 (OSXSAVE) are both set. */
122 if( 1 & ( ecx >> 28 ) & (ecx >> 27) ) {
123 #if !defined(WIN32) /* Already checked for this in WIN32 */
/* Mask 6 selects bits 1 and 2 of the value returned for register 0; both
   must be set (SSE and AVX register state enabled, per the XCR0 layout). */
124 if( (xgetbv(0) & 6) == 6 ) /* XCR0 */
/* Second CPUID query (extended leaf 0x80000001 assumed). */
131 cpuid( &eax, &ebx, &ecx, &edx );
/* ECX bit 11: XOP (extended leaf assumed). */
133 if( 1 & ( ecx >> 11 ) )
137 /* For future architectures */
140 cpuid(&eax, &ebx, &ecx, &edx);
145 /* fprintf( stderr, "Using %s engine\n", feature_names[feature] ); */
/* Prototypes of the "_ref" BLAKE2b implementation: one function per public
   blake2b* entry point, with the same parameter lists as the blake2b_*_fn
   pointer types declared further down. They are declared outside the
   HAVE_X86 guard, so they exist on every target.
   Only declarations appear here; the definitions are not part of this excerpt.
   NOTE(review): the line guarded by the __cplusplus test is not visible;
   presumably it opens an extern "C" block - confirm. */
155 #if defined(__cplusplus)
158 int blake2b_init_ref( blake2b_state *S, size_t outlen );
159 int blake2b_init_key_ref( blake2b_state *S, size_t outlen, const void *key, size_t keylen );
160 int blake2b_init_param_ref( blake2b_state *S, const blake2b_param *P );
161 int blake2b_update_ref( blake2b_state *S, const uint8_t *in, size_t inlen );
162 int blake2b_final_ref( blake2b_state *S, uint8_t *out, size_t outlen );
163 int blake2b_ref( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* Prototypes of the x86-only BLAKE2b implementations, compiled in only when
   HAVE_X86 is defined. Each suffix (sse2, ssse3, sse41, avx, xop) provides the
   same six functions, with the same signatures as the "_ref" set.
   Only declarations appear here; the definitions are not part of this excerpt. */
165 #if defined(HAVE_X86)
/* sse2 variant */
167 int blake2b_init_sse2( blake2b_state *S, size_t outlen );
168 int blake2b_init_key_sse2( blake2b_state *S, size_t outlen, const void *key, size_t keylen );
169 int blake2b_init_param_sse2( blake2b_state *S, const blake2b_param *P );
170 int blake2b_update_sse2( blake2b_state *S, const uint8_t *in, size_t inlen );
171 int blake2b_final_sse2( blake2b_state *S, uint8_t *out, size_t outlen );
172 int blake2b_sse2( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* ssse3 variant */
174 int blake2b_init_ssse3( blake2b_state *S, size_t outlen );
175 int blake2b_init_key_ssse3( blake2b_state *S, size_t outlen, const void *key, size_t keylen );
176 int blake2b_init_param_ssse3( blake2b_state *S, const blake2b_param *P );
177 int blake2b_update_ssse3( blake2b_state *S, const uint8_t *in, size_t inlen );
178 int blake2b_final_ssse3( blake2b_state *S, uint8_t *out, size_t outlen );
179 int blake2b_ssse3( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* sse41 variant */
181 int blake2b_init_sse41( blake2b_state *S, size_t outlen );
182 int blake2b_init_key_sse41( blake2b_state *S, size_t outlen, const void *key, size_t keylen );
183 int blake2b_init_param_sse41( blake2b_state *S, const blake2b_param *P );
184 int blake2b_update_sse41( blake2b_state *S, const uint8_t *in, size_t inlen );
185 int blake2b_final_sse41( blake2b_state *S, uint8_t *out, size_t outlen );
186 int blake2b_sse41( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* avx variant */
188 int blake2b_init_avx( blake2b_state *S, size_t outlen );
189 int blake2b_init_key_avx( blake2b_state *S, size_t outlen, const void *key, size_t keylen );
190 int blake2b_init_param_avx( blake2b_state *S, const blake2b_param *P );
191 int blake2b_update_avx( blake2b_state *S, const uint8_t *in, size_t inlen );
192 int blake2b_final_avx( blake2b_state *S, uint8_t *out, size_t outlen );
193 int blake2b_avx( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* xop variant */
195 int blake2b_init_xop( blake2b_state *S, size_t outlen );
196 int blake2b_init_key_xop( blake2b_state *S, size_t outlen, const void *key, size_t keylen );
197 int blake2b_init_param_xop( blake2b_state *S, const blake2b_param *P );
198 int blake2b_update_xop( blake2b_state *S, const uint8_t *in, size_t inlen );
199 int blake2b_final_xop( blake2b_state *S, uint8_t *out, size_t outlen );
200 int blake2b_xop( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
202 #endif /* HAVE_X86 */
/* Prototypes of the "_ref" BLAKE2s implementation: one function per public
   blake2s* entry point, with the same parameter lists as the blake2s_*_fn
   pointer types declared further down. They are declared outside the
   HAVE_X86 guard, so they exist on every target.
   Only declarations appear here; the definitions are not part of this excerpt. */
204 int blake2s_init_ref( blake2s_state *S, size_t outlen );
205 int blake2s_init_key_ref( blake2s_state *S, size_t outlen, const void *key, size_t keylen );
206 int blake2s_init_param_ref( blake2s_state *S, const blake2s_param *P );
207 int blake2s_update_ref( blake2s_state *S, const uint8_t *in, size_t inlen );
208 int blake2s_final_ref( blake2s_state *S, uint8_t *out, size_t outlen );
209 int blake2s_ref( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* Prototypes of the x86-only BLAKE2s implementations, compiled in only when
   HAVE_X86 is defined. Each suffix (sse2, ssse3, sse41, avx, xop) provides the
   same six functions, with the same signatures as the "_ref" set.
   Only declarations appear here; the definitions are not part of this excerpt.
   NOTE(review): the line guarded by the trailing __cplusplus test is not
   visible; presumably it closes an extern "C" block - confirm. */
211 #if defined(HAVE_X86)
/* sse2 variant */
213 int blake2s_init_sse2( blake2s_state *S, size_t outlen );
214 int blake2s_init_key_sse2( blake2s_state *S, size_t outlen, const void *key, size_t keylen );
215 int blake2s_init_param_sse2( blake2s_state *S, const blake2s_param *P );
216 int blake2s_update_sse2( blake2s_state *S, const uint8_t *in, size_t inlen );
217 int blake2s_final_sse2( blake2s_state *S, uint8_t *out, size_t outlen );
218 int blake2s_sse2( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* ssse3 variant */
220 int blake2s_init_ssse3( blake2s_state *S, size_t outlen );
221 int blake2s_init_key_ssse3( blake2s_state *S, size_t outlen, const void *key, size_t keylen );
222 int blake2s_init_param_ssse3( blake2s_state *S, const blake2s_param *P );
223 int blake2s_update_ssse3( blake2s_state *S, const uint8_t *in, size_t inlen );
224 int blake2s_final_ssse3( blake2s_state *S, uint8_t *out, size_t outlen );
225 int blake2s_ssse3( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* sse41 variant */
227 int blake2s_init_sse41( blake2s_state *S, size_t outlen );
228 int blake2s_init_key_sse41( blake2s_state *S, size_t outlen, const void *key, size_t keylen );
229 int blake2s_init_param_sse41( blake2s_state *S, const blake2s_param *P );
230 int blake2s_update_sse41( blake2s_state *S, const uint8_t *in, size_t inlen );
231 int blake2s_final_sse41( blake2s_state *S, uint8_t *out, size_t outlen );
232 int blake2s_sse41( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* avx variant */
234 int blake2s_init_avx( blake2s_state *S, size_t outlen );
235 int blake2s_init_key_avx( blake2s_state *S, size_t outlen, const void *key, size_t keylen );
236 int blake2s_init_param_avx( blake2s_state *S, const blake2s_param *P );
237 int blake2s_update_avx( blake2s_state *S, const uint8_t *in, size_t inlen );
238 int blake2s_final_avx( blake2s_state *S, uint8_t *out, size_t outlen );
239 int blake2s_avx( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
/* xop variant */
241 int blake2s_init_xop( blake2s_state *S, size_t outlen );
242 int blake2s_init_key_xop( blake2s_state *S, size_t outlen, const void *key, size_t keylen );
243 int blake2s_init_param_xop( blake2s_state *S, const blake2s_param *P );
244 int blake2s_update_xop( blake2s_state *S, const uint8_t *in, size_t inlen );
245 int blake2s_final_xop( blake2s_state *S, uint8_t *out, size_t outlen );
246 int blake2s_xop( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
248 #endif /* HAVE_X86 */
250 #if defined(__cplusplus)
/* Function-pointer types, one per public entry point. They are the element
   types of the dispatch tables and the types of the blake2*_ptr variables
   defined later in this file. */

/* BLAKE2b entry points. */
254 typedef int ( *blake2b_init_fn )( blake2b_state *, size_t );
255 typedef int ( *blake2b_init_key_fn )( blake2b_state *, size_t, const void *, size_t );
256 typedef int ( *blake2b_init_param_fn )( blake2b_state *, const blake2b_param * );
257 typedef int ( *blake2b_update_fn )( blake2b_state *, const uint8_t *, size_t );
258 typedef int ( *blake2b_final_fn )( blake2b_state *, uint8_t *, size_t );
259 typedef int ( *blake2b_fn )( uint8_t *, const void *, const void *, size_t, size_t, size_t );
/* BLAKE2s entry points: same shapes, with the blake2s state and param types. */
261 typedef int ( *blake2s_init_fn )( blake2s_state *, size_t );
262 typedef int ( *blake2s_init_key_fn )( blake2s_state *, size_t, const void *, size_t );
263 typedef int ( *blake2s_init_param_fn )( blake2s_state *, const blake2s_param * );
264 typedef int ( *blake2s_update_fn )( blake2s_state *, const uint8_t *, size_t );
265 typedef int ( *blake2s_final_fn )( blake2s_state *, uint8_t *, size_t );
266 typedef int ( *blake2s_fn )( uint8_t *, const void *, const void *, size_t, size_t, size_t );
/* Implementations of blake2b_init, indexed by the value get_cpu_features()
   returns (see blake2b_init_dispatch). The entries themselves are not visible
   in this excerpt; the HAVE_X86 guard makes part of the list x86-only. */
268 static const blake2b_init_fn blake2b_init_table[] =
271 #if defined(HAVE_X86)
/* Implementations of blake2b_init_key, indexed by the value
   get_cpu_features() returns (see blake2b_init_key_dispatch).
   Visible entries, in order: ref, then (x86 only) sse2, ssse3, sse41, avx.
   Any entries after avx are cut off in this excerpt. */
280 static const blake2b_init_key_fn blake2b_init_key_table[] =
282 blake2b_init_key_ref,
283 #if defined(HAVE_X86)
284 blake2b_init_key_sse2,
285 blake2b_init_key_ssse3,
286 blake2b_init_key_sse41,
287 blake2b_init_key_avx,
/* Implementations of blake2b_init_param, indexed by the value
   get_cpu_features() returns (see blake2b_init_param_dispatch).
   Entries, in order: ref, then (x86 only) sse2, ssse3, sse41, avx, xop. */
292 static const blake2b_init_param_fn blake2b_init_param_table[] =
294 blake2b_init_param_ref,
295 #if defined(HAVE_X86)
296 blake2b_init_param_sse2,
297 blake2b_init_param_ssse3,
298 blake2b_init_param_sse41,
299 blake2b_init_param_avx,
300 blake2b_init_param_xop
/* Implementations of blake2b_update, indexed by the value get_cpu_features()
   returns (see blake2b_update_dispatch). Only the ssse3 and sse41 entries of
   the x86-only part are visible in this excerpt. */
304 static const blake2b_update_fn blake2b_update_table[] =
307 #if defined(HAVE_X86)
309 blake2b_update_ssse3,
310 blake2b_update_sse41,
/* Implementations of blake2b_final, indexed by the value get_cpu_features()
   returns (see blake2b_final_dispatch). The entries themselves are not visible
   in this excerpt; the HAVE_X86 guard makes part of the list x86-only. */
316 static const blake2b_final_fn blake2b_final_table[] =
319 #if defined(HAVE_X86)
/* Implementations of the one-shot blake2b function, indexed by the value
   get_cpu_features() returns (see blake2b_dispatch). The entries themselves
   are not visible in this excerpt; the HAVE_X86 guard makes part of the list
   x86-only. */
328 static const blake2b_fn blake2b_table[] =
331 #if defined(HAVE_X86)
/* Implementations of blake2s_init, indexed by the value get_cpu_features()
   returns (see blake2s_init_dispatch). The entries themselves are not visible
   in this excerpt; the HAVE_X86 guard makes part of the list x86-only. */
340 static const blake2s_init_fn blake2s_init_table[] =
343 #if defined(HAVE_X86)
/* Implementations of blake2s_init_key, indexed by the value
   get_cpu_features() returns (see blake2s_init_key_dispatch).
   Visible entries, in order: ref, then (x86 only) sse2, ssse3, sse41, avx.
   Any entries after avx are cut off in this excerpt. */
352 static const blake2s_init_key_fn blake2s_init_key_table[] =
354 blake2s_init_key_ref,
355 #if defined(HAVE_X86)
356 blake2s_init_key_sse2,
357 blake2s_init_key_ssse3,
358 blake2s_init_key_sse41,
359 blake2s_init_key_avx,
/* Implementations of blake2s_init_param, indexed by the value
   get_cpu_features() returns (see blake2s_init_param_dispatch).
   Entries, in order: ref, then (x86 only) sse2, ssse3, sse41, avx, xop. */
364 static const blake2s_init_param_fn blake2s_init_param_table[] =
366 blake2s_init_param_ref,
367 #if defined(HAVE_X86)
368 blake2s_init_param_sse2,
369 blake2s_init_param_ssse3,
370 blake2s_init_param_sse41,
371 blake2s_init_param_avx,
372 blake2s_init_param_xop
/* Implementations of blake2s_update, indexed by the value get_cpu_features()
   returns (see blake2s_update_dispatch). Only the ssse3 and sse41 entries of
   the x86-only part are visible in this excerpt. */
376 static const blake2s_update_fn blake2s_update_table[] =
379 #if defined(HAVE_X86)
381 blake2s_update_ssse3,
382 blake2s_update_sse41,
/* Implementations of blake2s_final, indexed by the value get_cpu_features()
   returns (see blake2s_final_dispatch). The entries themselves are not visible
   in this excerpt; the HAVE_X86 guard makes part of the list x86-only. */
388 static const blake2s_final_fn blake2s_final_table[] =
391 #if defined(HAVE_X86)
/* Implementations of the one-shot blake2s function, indexed by the value
   get_cpu_features() returns (see blake2s_dispatch). The entries themselves
   are not visible in this excerpt; the HAVE_X86 guard makes part of the list
   x86-only. */
400 static const blake2s_fn blake2s_table[] =
403 #if defined(HAVE_X86)
/* Forward declarations of the *_dispatch resolvers, needed because the
   blake2*_ptr variables defined right after this section are initialised with
   their addresses before the resolvers themselves are defined.
   NOTE(review): the lines guarded by the two __cplusplus tests are not
   visible; presumably they open and close an extern "C" block - confirm. */
412 #if defined(__cplusplus)
415 int blake2b_init_dispatch( blake2b_state *S, size_t outlen );
416 int blake2b_init_key_dispatch( blake2b_state *S, size_t outlen, const void *key, size_t keylen );
417 int blake2b_init_param_dispatch( blake2b_state *S, const blake2b_param *P );
418 int blake2b_update_dispatch( blake2b_state *S, const uint8_t *in, size_t inlen );
419 int blake2b_final_dispatch( blake2b_state *S, uint8_t *out, size_t outlen );
420 int blake2b_dispatch( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
422 int blake2s_init_dispatch( blake2s_state *S, size_t outlen );
423 int blake2s_init_key_dispatch( blake2s_state *S, size_t outlen, const void *key, size_t keylen );
424 int blake2s_init_param_dispatch( blake2s_state *S, const blake2s_param *P );
425 int blake2s_update_dispatch( blake2s_state *S, const uint8_t *in, size_t inlen );
426 int blake2s_final_dispatch( blake2s_state *S, uint8_t *out, size_t outlen );
427 int blake2s_dispatch( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen );
428 #if defined(__cplusplus)
/* Current target of each public entry point. Every pointer starts out aimed
   at its *_dispatch resolver. When a resolver runs it overwrites its own
   pointer with the table entry selected by get_cpu_features(), so later calls
   through that pointer reach the chosen implementation directly.
   Each pointer is resolved independently of the others. */

/* BLAKE2b */
432 static blake2b_init_fn blake2b_init_ptr = blake2b_init_dispatch;
433 static blake2b_init_key_fn blake2b_init_key_ptr = blake2b_init_key_dispatch;
434 static blake2b_init_param_fn blake2b_init_param_ptr = blake2b_init_param_dispatch;
435 static blake2b_update_fn blake2b_update_ptr = blake2b_update_dispatch;
436 static blake2b_final_fn blake2b_final_ptr = blake2b_final_dispatch;
437 static blake2b_fn blake2b_ptr = blake2b_dispatch;
/* BLAKE2s */
439 static blake2s_init_fn blake2s_init_ptr = blake2s_init_dispatch;
440 static blake2s_init_key_fn blake2s_init_key_ptr = blake2s_init_key_dispatch;
441 static blake2s_init_param_fn blake2s_init_param_ptr = blake2s_init_param_dispatch;
442 static blake2s_update_fn blake2s_update_ptr = blake2s_update_dispatch;
443 static blake2s_final_fn blake2s_final_ptr = blake2s_final_dispatch;
444 static blake2s_fn blake2s_ptr = blake2s_dispatch;
446 int blake2b_init_dispatch( blake2b_state *S, size_t outlen )
448 blake2b_init_ptr = blake2b_init_table[get_cpu_features()];
449 return blake2b_init_ptr( S, outlen );
452 int blake2b_init_key_dispatch( blake2b_state *S, size_t outlen, const void *key, size_t keylen )
454 blake2b_init_key_ptr = blake2b_init_key_table[get_cpu_features()];
455 return blake2b_init_key_ptr( S, outlen, key, keylen );
458 int blake2b_init_param_dispatch( blake2b_state *S, const blake2b_param *P )
460 blake2b_init_param_ptr = blake2b_init_param_table[get_cpu_features()];
461 return blake2b_init_param_ptr( S, P );
464 int blake2b_update_dispatch( blake2b_state *S, const uint8_t *in, size_t inlen )
466 blake2b_update_ptr = blake2b_update_table[get_cpu_features()];
467 return blake2b_update_ptr( S, in, inlen );
470 int blake2b_final_dispatch( blake2b_state *S, uint8_t *out, size_t outlen )
472 blake2b_final_ptr = blake2b_final_table[get_cpu_features()];
473 return blake2b_final_ptr( S, out, outlen );
476 int blake2b_dispatch( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen )
478 blake2b_ptr = blake2b_table[get_cpu_features()];
479 return blake2b_ptr( out, in, key, outlen, inlen, keylen );
482 BLAKE2_API int blake2b_init( blake2b_state *S, size_t outlen )
484 return blake2b_init_ptr( S, outlen );
487 BLAKE2_API int blake2b_init_key( blake2b_state *S, size_t outlen, const void *key, size_t keylen )
489 return blake2b_init_key_ptr( S, outlen, key, keylen );
492 BLAKE2_API int blake2b_init_param( blake2b_state *S, const blake2b_param *P )
494 return blake2b_init_param_ptr( S, P );
497 BLAKE2_API int blake2b_update( blake2b_state *S, const uint8_t *in, size_t inlen )
499 return blake2b_update_ptr( S, in, inlen );
502 BLAKE2_API int blake2b_final( blake2b_state *S, uint8_t *out, size_t outlen )
504 return blake2b_final_ptr( S, out, outlen );
507 BLAKE2_API int blake2b( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen )
509 return blake2b_ptr( out, in, key, outlen, inlen, keylen );
512 int blake2s_init_dispatch( blake2s_state *S, size_t outlen )
514 blake2s_init_ptr = blake2s_init_table[get_cpu_features()];
515 return blake2s_init_ptr( S, outlen );
518 int blake2s_init_key_dispatch( blake2s_state *S, size_t outlen, const void *key, size_t keylen )
520 blake2s_init_key_ptr = blake2s_init_key_table[get_cpu_features()];
521 return blake2s_init_key_ptr( S, outlen, key, keylen );
524 int blake2s_init_param_dispatch( blake2s_state *S, const blake2s_param *P )
526 blake2s_init_param_ptr = blake2s_init_param_table[get_cpu_features()];
527 return blake2s_init_param_ptr( S, P );
530 int blake2s_update_dispatch( blake2s_state *S, const uint8_t *in, size_t inlen )
532 blake2s_update_ptr = blake2s_update_table[get_cpu_features()];
533 return blake2s_update_ptr( S, in, inlen );
536 int blake2s_final_dispatch( blake2s_state *S, uint8_t *out, size_t outlen )
538 blake2s_final_ptr = blake2s_final_table[get_cpu_features()];
539 return blake2s_final_ptr( S, out, outlen );
542 int blake2s_dispatch( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen )
544 blake2s_ptr = blake2s_table[get_cpu_features()];
545 return blake2s_ptr( out, in, key, outlen, inlen, keylen );
548 BLAKE2_API int blake2s_init( blake2s_state *S, size_t outlen )
550 return blake2s_init_ptr( S, outlen );
553 BLAKE2_API int blake2s_init_key( blake2s_state *S, size_t outlen, const void *key, size_t keylen )
555 return blake2s_init_key_ptr( S, outlen, key, keylen );
558 BLAKE2_API int blake2s_init_param( blake2s_state *S, const blake2s_param *P )
560 return blake2s_init_param_ptr( S, P );
563 BLAKE2_API int blake2s_update( blake2s_state *S, const uint8_t *in, size_t inlen )
565 return blake2s_update_ptr( S, in, inlen );
568 BLAKE2_API int blake2s_final( blake2s_state *S, uint8_t *out, size_t outlen )
570 return blake2s_final_ptr( S, out, outlen );
573 BLAKE2_API int blake2s( uint8_t *out, const void *in, const void *key, size_t outlen, size_t inlen, size_t keylen )
575 return blake2s_ptr( out, in, key, outlen, inlen, keylen );