util/storage/lookup3.c

   1 /*
   2   February 2013(Wouter) patch defines for BSD endianness, from Brad Smith.
   3   January 2012(Wouter) added randomised initial value, fallout from 28c3.
   4   March 2007(Wouter) adapted from lookup3.c original, add config.h include.
   5      added #ifdef VALGRIND to remove 298,384,660 'unused variable k8' warnings.
   6      added include of lookup3.h to check definitions match declarations.
   7      removed include of stdint - config.h takes care of platform independence.
   8   url http://burtleburtle.net/bob/hash/index.html.
   9 */
  10 /*
  11 -------------------------------------------------------------------------------
  12 lookup3.c, by Bob Jenkins, May 2006, Public Domain.
  13
  14 These are functions for producing 32-bit hashes for hash table lookup.
  15 hashword(), hashlittle(), hashlittle2(), hashbig(), mix(), and final()
  16 are externally useful functions.  Routines to test the hash are included
  17 if SELF_TEST is defined.  You can use this free for any purpose.  It's in
  18 the public domain.  It has no warranty.
  19
  20 You probably want to use hashlittle().  hashlittle() and hashbig()
  21 hash byte arrays.  hashlittle() is is faster than hashbig() on
  22 little-endian machines.  Intel and AMD are little-endian machines.
  23 On second thought, you probably want hashlittle2(), which is identical to
  24 hashlittle() except it returns two 32-bit hashes for the price of one.
  25 You could implement hashbig2() if you wanted but I haven't bothered here.
  26
  27 If you want to find a hash of, say, exactly 7 integers, do
  28   a = i1;  b = i2;  c = i3;
  29   mix(a,b,c);
  30   a += i4; b += i5; c += i6;
  31   mix(a,b,c);
  32   a += i7;
  33   final(a,b,c);
  34 then use c as the hash value.  If you have a variable length array of
  35 4-byte integers to hash, use hashword().  If you have a byte array (like
  36 a character string), use hashlittle().  If you have several byte arrays, or
  37 a mix of things, see the comments above hashlittle().
  38
  39 Why is this so big?  I read 12 bytes at a time into 3 4-byte integers,
  40 then mix those integers.  This is fast (you can do a lot more thorough
  41 mixing with 12*3 instructions on 3 integers than you can with 3 instructions
  42 on 1 byte), but shoehorning those bytes into integers efficiently is messy.
  43 -------------------------------------------------------------------------------
  44 */
  45 /*#define SELF_TEST 1*/
  46
  47 #include "config.h"
  48 #include "util/storage/lookup3.h"
  49 #include <stdio.h>      /* defines printf for tests */
  50 #include <time.h>       /* defines time_t for timings in the test */
  51 /*#include <stdint.h>     defines uint32_t etc  (from config.h) */
  52 #include <sys/param.h>  /* attempt to define endianness */
  53 #ifdef HAVE_SYS_TYPES_H
  54 # include <sys/types.h> /* attempt to define endianness (solaris) */
  55 #endif
  56 #ifdef linux
  57 # include <endian.h>    /* attempt to define endianness */
  58 #endif
  59 #if defined(__FreeBSD__) || defined(__NetBSD__) || defined(__DragonFly__)
  60 #include <sys/endian.h> /* attempt to define endianness */
  61 #endif
  62 #ifdef __OpenBSD__
  63 #include <machine/endian.h> /* attempt to define endianness */
  64 #endif
  65
  66 /* random initial value */
  67 static uint32_t raninit = (uint32_t)0xdeadbeef;
  68
  69 void
  70 hash_set_raninit(uint32_t v)
  71 {
  72         raninit = v;
  73 }
  74
  75 /*
  76  * My best guess at if you are big-endian or little-endian.  This may
  77  * need adjustment.
  78  */
  79 #if (defined(__BYTE_ORDER) && defined(__LITTLE_ENDIAN) && \
  80      __BYTE_ORDER == __LITTLE_ENDIAN) || \
  81     (defined(i386) || defined(__i386__) || defined(__i486__) || \
  82      defined(__i586__) || defined(__i686__) || defined(vax) || defined(MIPSEL) || defined(__x86))
  83 # define HASH_LITTLE_ENDIAN 1
  84 # define HASH_BIG_ENDIAN 0
  85 #elif (defined(__BYTE_ORDER) && defined(__BIG_ENDIAN) && \
  86        __BYTE_ORDER == __BIG_ENDIAN) || \
  87       (defined(sparc) || defined(__sparc) || defined(__sparc__) || defined(POWERPC) || defined(mc68000) || defined(sel))
  88 # define HASH_LITTLE_ENDIAN 0
  89 # define HASH_BIG_ENDIAN 1
  90 #elif defined(_MACHINE_ENDIAN_H_)
  91 /* test for machine_endian_h protects failure if some are empty strings */
  92 # if defined(_BYTE_ORDER) && defined(_BIG_ENDIAN) && _BYTE_ORDER == _BIG_ENDIAN
  93 #  define HASH_LITTLE_ENDIAN 0
  94 #  define HASH_BIG_ENDIAN 1
  95 # endif
  96 # if defined(_BYTE_ORDER) && defined(_LITTLE_ENDIAN) && _BYTE_ORDER == _LITTLE_ENDIAN
  97 #  define HASH_LITTLE_ENDIAN 1
  98 #  define HASH_BIG_ENDIAN 0
  99 # endif /* _MACHINE_ENDIAN_H_ */
 100 #else
 101 # define HASH_LITTLE_ENDIAN 0
 102 # define HASH_BIG_ENDIAN 0
 103 #endif
 104
 105 #define hashsize(n) ((uint32_t)1<<(n))
 106 #define hashmask(n) (hashsize(n)-1)
 107 #define rot(x,k) (((x)<<(k)) | ((x)>>(32-(k))))
 108
 109 /*
 110 -------------------------------------------------------------------------------
 111 mix -- mix 3 32-bit values reversibly.
 112
 113 This is reversible, so any information in (a,b,c) before mix() is
 114 still in (a,b,c) after mix().
 115
 116 If four pairs of (a,b,c) inputs are run through mix(), or through
 117 mix() in reverse, there are at least 32 bits of the output that
 118 are sometimes the same for one pair and different for another pair.
 119 This was tested for:
 120 * pairs that differed by one bit, by two bits, in any combination
 121   of top bits of (a,b,c), or in any combination of bottom bits of
 122   (a,b,c).
 123 * "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
 124   the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
 125   is commonly produced by subtraction) look like a single 1-bit
 126   difference.
 127 * the base values were pseudorandom, all zero but one bit set, or
 128   all zero plus a counter that starts at zero.
 129
 130 Some k values for my "a-=c; a^=rot(c,k); c+=b;" arrangement that
 131 satisfy this are
 132     4  6  8 16 19  4
 133     9 15  3 18 27 15
 134    14  9  3  7 17  3
 135 Well, "9 15 3 18 27 15" didn't quite get 32 bits diffing
 136 for "differ" defined as + with a one-bit base and a two-bit delta.  I
 137 used http://burtleburtle.net/bob/hash/avalanche.html to choose
 138 the operations, constants, and arrangements of the variables.
 139
 140 This does not achieve avalanche.  There are input bits of (a,b,c)
 141 that fail to affect some output bits of (a,b,c), especially of a.  The
 142 most thoroughly mixed value is c, but it doesn't really even achieve
 143 avalanche in c.
 144
 145 This allows some parallelism.  Read-after-writes are good at doubling
 146 the number of bits affected, so the goal of mixing pulls in the opposite
 147 direction as the goal of parallelism.  I did what I could.  Rotates
 148 seem to cost as much as shifts on every machine I could lay my hands
 149 on, and rotates are much kinder to the top and bottom bits, so I used
 150 rotates.
 151 -------------------------------------------------------------------------------
 152 */
 153 #define mix(a,b,c) \
 154 { \
 155   a -= c;  a ^= rot(c, 4);  c += b; \
 156   b -= a;  b ^= rot(a, 6);  a += c; \
 157   c -= b;  c ^= rot(b, 8);  b += a; \
 158   a -= c;  a ^= rot(c,16);  c += b; \
 159   b -= a;  b ^= rot(a,19);  a += c; \
 160   c -= b;  c ^= rot(b, 4);  b += a; \
 161 }
 162
 163 /*
 164 -------------------------------------------------------------------------------
 165 final -- final mixing of 3 32-bit values (a,b,c) into c
 166
 167 Pairs of (a,b,c) values differing in only a few bits will usually
 168 produce values of c that look totally different.  This was tested for
 169 * pairs that differed by one bit, by two bits, in any combination
 170   of top bits of (a,b,c), or in any combination of bottom bits of
 171   (a,b,c).
 172 * "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
 173   the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
 174   is commonly produced by subtraction) look like a single 1-bit
 175   difference.
 176 * the base values were pseudorandom, all zero but one bit set, or
 177   all zero plus a counter that starts at zero.
 178
 179 These constants passed:
 180  14 11 25 16 4 14 24
 181  12 14 25 16 4 14 24
 182 and these came close:
 183   4  8 15 26 3 22 24
 184  10  8 15 26 3 22 24
 185  11  8 15 26 3 22 24
 186 -------------------------------------------------------------------------------
 187 */
 188 #define final(a,b,c) \
 189 { \
 190   c ^= b; c -= rot(b,14); \
 191   a ^= c; a -= rot(c,11); \
 192   b ^= a; b -= rot(a,25); \
 193   c ^= b; c -= rot(b,16); \
 194   a ^= c; a -= rot(c,4);  \
 195   b ^= a; b -= rot(a,14); \
 196   c ^= b; c -= rot(b,24); \
 197 }
 198
 199 /*
 200 --------------------------------------------------------------------
 201  This works on all machines.  To be useful, it requires
 202  -- that the key be an array of uint32_t's, and
 203  -- that the length be the number of uint32_t's in the key
 204
 205  The function hashword() is identical to hashlittle() on little-endian
 206  machines, and identical to hashbig() on big-endian machines,
 207  except that the length has to be measured in uint32_ts rather than in
 208  bytes.  hashlittle() is more complicated than hashword() only because
 209  hashlittle() has to dance around fitting the key bytes into registers.
 210 --------------------------------------------------------------------
 211 */
 212 uint32_t hashword(
 213 const uint32_t *k,                   /* the key, an array of uint32_t values */
 214 size_t          length,               /* the length of the key, in uint32_ts */
 215 uint32_t        initval)         /* the previous hash, or an arbitrary value */
 216 {
 217   uint32_t a,b,c;
 218
 219   /* Set up the internal state */
 220   a = b = c = raninit + (((uint32_t)length)<<2) + initval;
 221
 222   /*------------------------------------------------- handle most of the key */
 223   while (length > 3)
 224   {
 225     a += k[0];
 226     b += k[1];
 227     c += k[2];
 228     mix(a,b,c);
 229     length -= 3;
 230     k += 3;
 231   }
 232
 233   /*------------------------------------------- handle the last 3 uint32_t's */
 234   switch(length)                     /* all the case statements fall through */
 235   {
 236   case 3 : c+=k[2];
 237   case 2 : b+=k[1];
 238   case 1 : a+=k[0];
 239     final(a,b,c);
 240   case 0:     /* case 0: nothing left to add */
 241     break;
 242   }
 243   /*------------------------------------------------------ report the result */
 244   return c;
 245 }
 246
 247
 248 #ifdef SELF_TEST
 249
 250 /*
 251 --------------------------------------------------------------------
 252 hashword2() -- same as hashword(), but take two seeds and return two
 253 32-bit values.  pc and pb must both be nonnull, and *pc and *pb must
 254 both be initialized with seeds.  If you pass in (*pb)==0, the output
 255 (*pc) will be the same as the return value from hashword().
 256 --------------------------------------------------------------------
 257 */
 258 void hashword2 (
 259 const uint32_t *k,                   /* the key, an array of uint32_t values */
 260 size_t          length,               /* the length of the key, in uint32_ts */
 261 uint32_t       *pc,                      /* IN: seed OUT: primary hash value */
 262 uint32_t       *pb)               /* IN: more seed OUT: secondary hash value */
 263 {
 264   uint32_t a,b,c;
 265
 266   /* Set up the internal state */
 267   a = b = c = raninit + ((uint32_t)(length<<2)) + *pc;
 268   c += *pb;
 269
 270   /*------------------------------------------------- handle most of the key */
 271   while (length > 3)
 272   {
 273     a += k[0];
 274     b += k[1];
 275     c += k[2];
 276     mix(a,b,c);
 277     length -= 3;
 278     k += 3;
 279   }
 280
 281   /*------------------------------------------- handle the last 3 uint32_t's */
 282   switch(length)                     /* all the case statements fall through */
 283   {
 284   case 3 : c+=k[2];
 285   case 2 : b+=k[1];
 286   case 1 : a+=k[0];
 287     final(a,b,c);
 288   case 0:     /* case 0: nothing left to add */
 289     break;
 290   }
 291   /*------------------------------------------------------ report the result */
 292   *pc=c; *pb=b;
 293 }
 294
 295 #endif /* SELF_TEST */
 296
 297 /*
 298 -------------------------------------------------------------------------------
 299 hashlittle() -- hash a variable-length key into a 32-bit value
 300   k       : the key (the unaligned variable-length array of bytes)
 301   length  : the length of the key, counting by bytes
 302   initval : can be any 4-byte value
 303 Returns a 32-bit value.  Every bit of the key affects every bit of
 304 the return value.  Two keys differing by one or two bits will have
 305 totally different hash values.
 306
 307 The best hash table sizes are powers of 2.  There is no need to do
 308 mod a prime (mod is sooo slow!).  If you need less than 32 bits,
 309 use a bitmask.  For example, if you need only 10 bits, do
 310   h = (h & hashmask(10));
 311 In which case, the hash table should have hashsize(10) elements.
 312
 313 If you are hashing n strings (uint8_t **)k, do it like this:
 314   for (i=0, h=0; i<n; ++i) h = hashlittle( k[i], len[i], h);
 315
 316 By Bob Jenkins, 2006.  bob_jenkins@burtleburtle.net.  You may use this
 317 code any way you wish, private, educational, or commercial.  It's free.
 318
 319 Use for hash table lookup, or anything where one collision in 2^^32 is
 320 acceptable.  Do NOT use for cryptographic purposes.
 321 -------------------------------------------------------------------------------
 322 */
 323
 324 uint32_t hashlittle( const void *key, size_t length, uint32_t initval)
 325 {
 326   uint32_t a,b,c;                                          /* internal state */
 327   union { const void *ptr; size_t i; } u;     /* needed for Mac Powerbook G4 */
 328
 329   /* Set up the internal state */
 330   a = b = c = raninit + ((uint32_t)length) + initval;
 331
 332   u.ptr = key;
 333   if (HASH_LITTLE_ENDIAN && ((u.i & 0x3) == 0)) {
 334     const uint32_t *k = (const uint32_t *)key;         /* read 32-bit chunks */
 335 #ifdef VALGRIND
 336     const uint8_t  *k8;
 337 #endif
 338
 339     /*------ all but last block: aligned reads and affect 32 bits of (a,b,c) */
 340     while (length > 12)
 341     {
 342       a += k[0];
 343       b += k[1];
 344       c += k[2];
 345       mix(a,b,c);
 346       length -= 12;
 347       k += 3;
 348     }
 349
 350     /*----------------------------- handle the last (probably partial) block */
 351     /*
 352      * "k[2]&0xffffff" actually reads beyond the end of the string, but
 353      * then masks off the part it's not allowed to read.  Because the
 354      * string is aligned, the masked-off tail is in the same word as the
 355      * rest of the string.  Every machine with memory protection I've seen
 356      * does it on word boundaries, so is OK with this.  But VALGRIND will
 357      * still catch it and complain.  The masking trick does make the hash
 358      * noticably faster for short strings (like English words).
 359      */
 360 #ifndef VALGRIND
 361
 362     switch(length)
 363     {
 364     case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
 365     case 11: c+=k[2]&0xffffff; b+=k[1]; a+=k[0]; break;
 366     case 10: c+=k[2]&0xffff; b+=k[1]; a+=k[0]; break;
 367     case 9 : c+=k[2]&0xff; b+=k[1]; a+=k[0]; break;
 368     case 8 : b+=k[1]; a+=k[0]; break;
 369     case 7 : b+=k[1]&0xffffff; a+=k[0]; break;
 370     case 6 : b+=k[1]&0xffff; a+=k[0]; break;
 371     case 5 : b+=k[1]&0xff; a+=k[0]; break;
 372     case 4 : a+=k[0]; break;
 373     case 3 : a+=k[0]&0xffffff; break;
 374     case 2 : a+=k[0]&0xffff; break;
 375     case 1 : a+=k[0]&0xff; break;
 376     case 0 : return c;              /* zero length strings require no mixing */
 377     }
 378
 379 #else /* make valgrind happy */
 380
 381     k8 = (const uint8_t *)k;
 382     switch(length)
 383     {
 384     case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
 385     case 11: c+=((uint32_t)k8[10])<<16;  /* fall through */
 386     case 10: c+=((uint32_t)k8[9])<<8;    /* fall through */
 387     case 9 : c+=k8[8];                   /* fall through */
 388     case 8 : b+=k[1]; a+=k[0]; break;
 389     case 7 : b+=((uint32_t)k8[6])<<16;   /* fall through */
 390     case 6 : b+=((uint32_t)k8[5])<<8;    /* fall through */
 391     case 5 : b+=k8[4];                   /* fall through */
 392     case 4 : a+=k[0]; break;
 393     case 3 : a+=((uint32_t)k8[2])<<16;   /* fall through */
 394     case 2 : a+=((uint32_t)k8[1])<<8;    /* fall through */
 395     case 1 : a+=k8[0]; break;
 396     case 0 : return c;
 397     }
 398
 399 #endif /* !valgrind */
 400
 401   } else if (HASH_LITTLE_ENDIAN && ((u.i & 0x1) == 0)) {
 402     const uint16_t *k = (const uint16_t *)key;         /* read 16-bit chunks */
 403     const uint8_t  *k8;
 404
 405     /*--------------- all but last block: aligned reads and different mixing */
 406     while (length > 12)
 407     {
 408       a += k[0] + (((uint32_t)k[1])<<16);
 409       b += k[2] + (((uint32_t)k[3])<<16);
 410       c += k[4] + (((uint32_t)k[5])<<16);
 411       mix(a,b,c);
 412       length -= 12;
 413       k += 6;
 414     }
 415
 416     /*----------------------------- handle the last (probably partial) block */
 417     k8 = (const uint8_t *)k;
 418     switch(length)
 419     {
 420     case 12: c+=k[4]+(((uint32_t)k[5])<<16);
 421              b+=k[2]+(((uint32_t)k[3])<<16);
 422              a+=k[0]+(((uint32_t)k[1])<<16);
 423              break;
 424     case 11: c+=((uint32_t)k8[10])<<16;     /* fall through */
 425     case 10: c+=k[4];
 426              b+=k[2]+(((uint32_t)k[3])<<16);
 427              a+=k[0]+(((uint32_t)k[1])<<16);
 428              break;
 429     case 9 : c+=k8[8];                      /* fall through */
 430     case 8 : b+=k[2]+(((uint32_t)k[3])<<16);
 431              a+=k[0]+(((uint32_t)k[1])<<16);
 432              break;
 433     case 7 : b+=((uint32_t)k8[6])<<16;      /* fall through */
 434     case 6 : b+=k[2];
 435              a+=k[0]+(((uint32_t)k[1])<<16);
 436              break;
 437     case 5 : b+=k8[4];                      /* fall through */
 438     case 4 : a+=k[0]+(((uint32_t)k[1])<<16);
 439              break;
 440     case 3 : a+=((uint32_t)k8[2])<<16;      /* fall through */
 441     case 2 : a+=k[0];
 442              break;
 443     case 1 : a+=k8[0];
 444              break;
 445     case 0 : return c;                     /* zero length requires no mixing */
 446     }
 447
 448   } else {                        /* need to read the key one byte at a time */
 449     const uint8_t *k = (const uint8_t *)key;
 450
 451     /*--------------- all but the last block: affect some 32 bits of (a,b,c) */
 452     while (length > 12)
 453     {
 454       a += k[0];
 455       a += ((uint32_t)k[1])<<8;
 456       a += ((uint32_t)k[2])<<16;
 457       a += ((uint32_t)k[3])<<24;
 458       b += k[4];
 459       b += ((uint32_t)k[5])<<8;
 460       b += ((uint32_t)k[6])<<16;
 461       b += ((uint32_t)k[7])<<24;
 462       c += k[8];
 463       c += ((uint32_t)k[9])<<8;
 464       c += ((uint32_t)k[10])<<16;
 465       c += ((uint32_t)k[11])<<24;
 466       mix(a,b,c);
 467       length -= 12;
 468       k += 12;
 469     }
 470
 471     /*-------------------------------- last block: affect all 32 bits of (c) */
 472     switch(length)                   /* all the case statements fall through */
 473     {
 474     case 12: c+=((uint32_t)k[11])<<24;
 475     case 11: c+=((uint32_t)k[10])<<16;
 476     case 10: c+=((uint32_t)k[9])<<8;
 477     case 9 : c+=k[8];
 478     case 8 : b+=((uint32_t)k[7])<<24;
 479     case 7 : b+=((uint32_t)k[6])<<16;
 480     case 6 : b+=((uint32_t)k[5])<<8;
 481     case 5 : b+=k[4];
 482     case 4 : a+=((uint32_t)k[3])<<24;
 483     case 3 : a+=((uint32_t)k[2])<<16;
 484     case 2 : a+=((uint32_t)k[1])<<8;
 485     case 1 : a+=k[0];
 486              break;
 487     case 0 : return c;
 488     }
 489   }
 490
 491   final(a,b,c);
 492   return c;
 493 }
 494
 495 #ifdef SELF_TEST
 496
 497 /*
 498  * hashlittle2: return 2 32-bit hash values
 499  *
 500  * This is identical to hashlittle(), except it returns two 32-bit hash
 501  * values instead of just one.  This is good enough for hash table
 502  * lookup with 2^^64 buckets, or if you want a second hash if you're not
 503  * happy with the first, or if you want a probably-unique 64-bit ID for
 504  * the key.  *pc is better mixed than *pb, so use *pc first.  If you want
 505  * a 64-bit value do something like "*pc + (((uint64_t)*pb)<<32)".
 506  */
 507 void hashlittle2(
 508   const void *key,       /* the key to hash */
 509   size_t      length,    /* length of the key */
 510   uint32_t   *pc,        /* IN: primary initval, OUT: primary hash */
 511   uint32_t   *pb)        /* IN: secondary initval, OUT: secondary hash */
 512 {
 513   uint32_t a,b,c;                                          /* internal state */
 514   union { const void *ptr; size_t i; } u;     /* needed for Mac Powerbook G4 */
 515
 516   /* Set up the internal state */
 517   a = b = c = raninit + ((uint32_t)length) + *pc;
 518   c += *pb;
 519
 520   u.ptr = key;
 521   if (HASH_LITTLE_ENDIAN && ((u.i & 0x3) == 0)) {
 522     const uint32_t *k = (const uint32_t *)key;         /* read 32-bit chunks */
 523 #ifdef VALGRIND
 524     const uint8_t  *k8;
 525 #endif
 526
 527     /*------ all but last block: aligned reads and affect 32 bits of (a,b,c) */
 528     while (length > 12)
 529     {
 530       a += k[0];
 531       b += k[1];
 532       c += k[2];
 533       mix(a,b,c);
 534       length -= 12;
 535       k += 3;
 536     }
 537
 538     /*----------------------------- handle the last (probably partial) block */
 539     /*
 540      * "k[2]&0xffffff" actually reads beyond the end of the string, but
 541      * then masks off the part it's not allowed to read.  Because the
 542      * string is aligned, the masked-off tail is in the same word as the
 543      * rest of the string.  Every machine with memory protection I've seen
 544      * does it on word boundaries, so is OK with this.  But VALGRIND will
 545      * still catch it and complain.  The masking trick does make the hash
 546      * noticably faster for short strings (like English words).
 547      */
 548 #ifndef VALGRIND
 549
 550     switch(length)
 551     {
 552     case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
 553     case 11: c+=k[2]&0xffffff; b+=k[1]; a+=k[0]; break;
 554     case 10: c+=k[2]&0xffff; b+=k[1]; a+=k[0]; break;
 555     case 9 : c+=k[2]&0xff; b+=k[1]; a+=k[0]; break;
 556     case 8 : b+=k[1]; a+=k[0]; break;
 557     case 7 : b+=k[1]&0xffffff; a+=k[0]; break;
 558     case 6 : b+=k[1]&0xffff; a+=k[0]; break;
 559     case 5 : b+=k[1]&0xff; a+=k[0]; break;
 560     case 4 : a+=k[0]; break;
 561     case 3 : a+=k[0]&0xffffff; break;
 562     case 2 : a+=k[0]&0xffff; break;
 563     case 1 : a+=k[0]&0xff; break;
 564     case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
 565     }
 566
 567 #else /* make valgrind happy */
 568
 569     k8 = (const uint8_t *)k;
 570     switch(length)
 571     {
 572     case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
 573     case 11: c+=((uint32_t)k8[10])<<16;  /* fall through */
 574     case 10: c+=((uint32_t)k8[9])<<8;    /* fall through */
 575     case 9 : c+=k8[8];                   /* fall through */
 576     case 8 : b+=k[1]; a+=k[0]; break;
 577     case 7 : b+=((uint32_t)k8[6])<<16;   /* fall through */
 578     case 6 : b+=((uint32_t)k8[5])<<8;    /* fall through */
 579     case 5 : b+=k8[4];                   /* fall through */
 580     case 4 : a+=k[0]; break;
 581     case 3 : a+=((uint32_t)k8[2])<<16;   /* fall through */
 582     case 2 : a+=((uint32_t)k8[1])<<8;    /* fall through */
 583     case 1 : a+=k8[0]; break;
 584     case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
 585     }
 586
 587 #endif /* !valgrind */
 588
 589   } else if (HASH_LITTLE_ENDIAN && ((u.i & 0x1) == 0)) {
 590     const uint16_t *k = (const uint16_t *)key;         /* read 16-bit chunks */
 591     const uint8_t  *k8;
 592
 593     /*--------------- all but last block: aligned reads and different mixing */
 594     while (length > 12)
 595     {
 596       a += k[0] + (((uint32_t)k[1])<<16);
 597       b += k[2] + (((uint32_t)k[3])<<16);
 598       c += k[4] + (((uint32_t)k[5])<<16);
 599       mix(a,b,c);
 600       length -= 12;
 601       k += 6;
 602     }
 603
 604     /*----------------------------- handle the last (probably partial) block */
 605     k8 = (const uint8_t *)k;
 606     switch(length)
 607     {
 608     case 12: c+=k[4]+(((uint32_t)k[5])<<16);
 609              b+=k[2]+(((uint32_t)k[3])<<16);
 610              a+=k[0]+(((uint32_t)k[1])<<16);
 611              break;
 612     case 11: c+=((uint32_t)k8[10])<<16;     /* fall through */
 613     case 10: c+=k[4];
 614              b+=k[2]+(((uint32_t)k[3])<<16);
 615              a+=k[0]+(((uint32_t)k[1])<<16);
 616              break;
 617     case 9 : c+=k8[8];                      /* fall through */
 618     case 8 : b+=k[2]+(((uint32_t)k[3])<<16);
 619              a+=k[0]+(((uint32_t)k[1])<<16);
 620              break;
 621     case 7 : b+=((uint32_t)k8[6])<<16;      /* fall through */
 622     case 6 : b+=k[2];
 623              a+=k[0]+(((uint32_t)k[1])<<16);
 624              break;
 625     case 5 : b+=k8[4];                      /* fall through */
 626     case 4 : a+=k[0]+(((uint32_t)k[1])<<16);
 627              break;
 628     case 3 : a+=((uint32_t)k8[2])<<16;      /* fall through */
 629     case 2 : a+=k[0];
 630              break;
 631     case 1 : a+=k8[0];
 632              break;
 633     case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
 634     }
 635
 636   } else {                        /* need to read the key one byte at a time */
 637     const uint8_t *k = (const uint8_t *)key;
 638
 639     /*--------------- all but the last block: affect some 32 bits of (a,b,c) */
 640     while (length > 12)
 641     {
 642       a += k[0];
 643       a += ((uint32_t)k[1])<<8;
 644       a += ((uint32_t)k[2])<<16;
 645       a += ((uint32_t)k[3])<<24;
 646       b += k[4];
 647       b += ((uint32_t)k[5])<<8;
 648       b += ((uint32_t)k[6])<<16;
 649       b += ((uint32_t)k[7])<<24;
 650       c += k[8];
 651       c += ((uint32_t)k[9])<<8;
 652       c += ((uint32_t)k[10])<<16;
 653       c += ((uint32_t)k[11])<<24;
 654       mix(a,b,c);
 655       length -= 12;
 656       k += 12;
 657     }
 658
 659     /*-------------------------------- last block: affect all 32 bits of (c) */
 660     switch(length)                   /* all the case statements fall through */
 661     {
 662     case 12: c+=((uint32_t)k[11])<<24;
 663     case 11: c+=((uint32_t)k[10])<<16;
 664     case 10: c+=((uint32_t)k[9])<<8;
 665     case 9 : c+=k[8];
 666     case 8 : b+=((uint32_t)k[7])<<24;
 667     case 7 : b+=((uint32_t)k[6])<<16;
 668     case 6 : b+=((uint32_t)k[5])<<8;
 669     case 5 : b+=k[4];
 670     case 4 : a+=((uint32_t)k[3])<<24;
 671     case 3 : a+=((uint32_t)k[2])<<16;
 672     case 2 : a+=((uint32_t)k[1])<<8;
 673     case 1 : a+=k[0];
 674              break;
 675     case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
 676     }
 677   }
 678
 679   final(a,b,c);
 680   *pc=c; *pb=b;
 681 }
 682
 683 #endif /* SELF_TEST */
 684
 685 #if 0   /* currently not used */
 686
 687 /*
 688  * hashbig():
 689  * This is the same as hashword() on big-endian machines.  It is different
 690  * from hashlittle() on all machines.  hashbig() takes advantage of
 691  * big-endian byte ordering.
 692  */
 693 uint32_t hashbig( const void *key, size_t length, uint32_t initval)
 694 {
 695   uint32_t a,b,c;
 696   union { const void *ptr; size_t i; } u; /* to cast key to (size_t) happily */
 697
 698   /* Set up the internal state */
 699   a = b = c = raninit + ((uint32_t)length) + initval;
 700
 701   u.ptr = key;
 702   if (HASH_BIG_ENDIAN && ((u.i & 0x3) == 0)) {
 703     const uint32_t *k = (const uint32_t *)key;         /* read 32-bit chunks */
 704 #ifdef VALGRIND
 705     const uint8_t  *k8;
 706 #endif
 707
 708     /*------ all but last block: aligned reads and affect 32 bits of (a,b,c) */
 709     while (length > 12)
 710     {
 711       a += k[0];
 712       b += k[1];
 713       c += k[2];
 714       mix(a,b,c);
 715       length -= 12;
 716       k += 3;
 717     }
 718
 719     /*----------------------------- handle the last (probably partial) block */
 720     /*
 721      * "k[2]<<8" actually reads beyond the end of the string, but
 722      * then shifts out the part it's not allowed to read.  Because the
 723      * string is aligned, the illegal read is in the same word as the
 724      * rest of the string.  Every machine with memory protection I've seen
 725      * does it on word boundaries, so is OK with this.  But VALGRIND will
 726      * still catch it and complain.  The masking trick does make the hash
 727      * noticably faster for short strings (like English words).
 728      */
 729 #ifndef VALGRIND
 730
 731     switch(length)
 732     {
 733     case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
 734     case 11: c+=k[2]&0xffffff00; b+=k[1]; a+=k[0]; break;
 735     case 10: c+=k[2]&0xffff0000; b+=k[1]; a+=k[0]; break;
 736     case 9 : c+=k[2]&0xff000000; b+=k[1]; a+=k[0]; break;
 737     case 8 : b+=k[1]; a+=k[0]; break;
 738     case 7 : b+=k[1]&0xffffff00; a+=k[0]; break;
 739     case 6 : b+=k[1]&0xffff0000; a+=k[0]; break;
 740     case 5 : b+=k[1]&0xff000000; a+=k[0]; break;
 741     case 4 : a+=k[0]; break;
 742     case 3 : a+=k[0]&0xffffff00; break;
 743     case 2 : a+=k[0]&0xffff0000; break;
 744     case 1 : a+=k[0]&0xff000000; break;
 745     case 0 : return c;              /* zero length strings require no mixing */
 746     }
 747
 748 #else  /* make valgrind happy */
 749
 750     k8 = (const uint8_t *)k;
 751     switch(length)                   /* all the case statements fall through */
 752     {
 753     case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
 754     case 11: c+=((uint32_t)k8[10])<<8;  /* fall through */
 755     case 10: c+=((uint32_t)k8[9])<<16;  /* fall through */
 756     case 9 : c+=((uint32_t)k8[8])<<24;  /* fall through */
 757     case 8 : b+=k[1]; a+=k[0]; break;
 758     case 7 : b+=((uint32_t)k8[6])<<8;   /* fall through */
 759     case 6 : b+=((uint32_t)k8[5])<<16;  /* fall through */
 760     case 5 : b+=((uint32_t)k8[4])<<24;  /* fall through */
 761     case 4 : a+=k[0]; break;
 762     case 3 : a+=((uint32_t)k8[2])<<8;   /* fall through */
 763     case 2 : a+=((uint32_t)k8[1])<<16;  /* fall through */
 764     case 1 : a+=((uint32_t)k8[0])<<24; break;
 765     case 0 : return c;
 766     }
 767
 768 #endif /* !VALGRIND */
 769
 770   } else {                        /* need to read the key one byte at a time */
 771     const uint8_t *k = (const uint8_t *)key;
 772
 773     /*--------------- all but the last block: affect some 32 bits of (a,b,c) */
 774     while (length > 12)
 775     {
 776       a += ((uint32_t)k[0])<<24;
 777       a += ((uint32_t)k[1])<<16;
 778       a += ((uint32_t)k[2])<<8;
 779       a += ((uint32_t)k[3]);
 780       b += ((uint32_t)k[4])<<24;
 781       b += ((uint32_t)k[5])<<16;
 782       b += ((uint32_t)k[6])<<8;
 783       b += ((uint32_t)k[7]);
 784       c += ((uint32_t)k[8])<<24;
 785       c += ((uint32_t)k[9])<<16;
 786       c += ((uint32_t)k[10])<<8;
 787       c += ((uint32_t)k[11]);
 788       mix(a,b,c);
 789       length -= 12;
 790       k += 12;
 791     }
 792
 793     /*-------------------------------- last block: affect all 32 bits of (c) */
 794     switch(length)                   /* all the case statements fall through */
 795     {
 796     case 12: c+=k[11];
 797     case 11: c+=((uint32_t)k[10])<<8;
 798     case 10: c+=((uint32_t)k[9])<<16;
 799     case 9 : c+=((uint32_t)k[8])<<24;
 800     case 8 : b+=k[7];
 801     case 7 : b+=((uint32_t)k[6])<<8;
 802     case 6 : b+=((uint32_t)k[5])<<16;
 803     case 5 : b+=((uint32_t)k[4])<<24;
 804     case 4 : a+=k[3];
 805     case 3 : a+=((uint32_t)k[2])<<8;
 806     case 2 : a+=((uint32_t)k[1])<<16;
 807     case 1 : a+=((uint32_t)k[0])<<24;
 808              break;
 809     case 0 : return c;
 810     }
 811   }
 812
 813   final(a,b,c);
 814   return c;
 815 }
 816
 817 #endif /* 0 == currently not used */
 818
 819 #ifdef SELF_TEST
 820
 821 /* used for timings */
 822 void driver1()
 823 {
 824   uint8_t buf[256];
 825   uint32_t i;
 826   uint32_t h=0;
 827   time_t a,z;
 828
 829   time(&a);
 830   for (i=0; i<256; ++i) buf[i] = 'x';
 831   for (i=0; i<1; ++i)
 832   {
 833     h = hashlittle(&buf[0],1,h);
 834   }
 835   time(&z);
 836   if (z-a > 0) printf("time %d %.8x\n", z-a, h);
 837 }
 838
 839 /* check that every input bit changes every output bit half the time */
 840 #define HASHSTATE 1
 841 #define HASHLEN   1
 842 #define MAXPAIR 60
 843 #define MAXLEN  70
 844 void driver2()
 845 {
 846   uint8_t qa[MAXLEN+1], qb[MAXLEN+2], *a = &qa[0], *b = &qb[1];
 847   uint32_t c[HASHSTATE], d[HASHSTATE], i=0, j=0, k, l, m=0, z;
 848   uint32_t e[HASHSTATE],f[HASHSTATE],g[HASHSTATE],h[HASHSTATE];
 849   uint32_t x[HASHSTATE],y[HASHSTATE];
 850   uint32_t hlen;
 851
 852   printf("No more than %d trials should ever be needed \n",MAXPAIR/2);
 853   for (hlen=0; hlen < MAXLEN; ++hlen)
 854   {
 855     z=0;
 856     for (i=0; i<hlen; ++i)  /*----------------------- for each input byte, */
 857     {
 858       for (j=0; j<8; ++j)   /*------------------------ for each input bit, */
 859       {
 860         for (m=1; m<8; ++m) /*------------ for serveral possible initvals, */
 861         {
 862           for (l=0; l<HASHSTATE; ++l)
 863             e[l]=f[l]=g[l]=h[l]=x[l]=y[l]=~((uint32_t)0);
 864
 865           /*---- check that every output bit is affected by that input bit */
 866           for (k=0; k<MAXPAIR; k+=2)
 867           {
 868             uint32_t finished=1;
 869             /* keys have one bit different */
 870             for (l=0; l<hlen+1; ++l) {a[l] = b[l] = (uint8_t)0;}
 871             /* have a and b be two keys differing in only one bit */
 872             a[i] ^= (k<<j);
 873             a[i] ^= (k>>(8-j));
 874              c[0] = hashlittle(a, hlen, m);
 875             b[i] ^= ((k+1)<<j);
 876             b[i] ^= ((k+1)>>(8-j));
 877              d[0] = hashlittle(b, hlen, m);
 878             /* check every bit is 1, 0, set, and not set at least once */
 879             for (l=0; l<HASHSTATE; ++l)
 880             {
 881               e[l] &= (c[l]^d[l]);
 882               f[l] &= ~(c[l]^d[l]);
 883               g[l] &= c[l];
 884               h[l] &= ~c[l];
 885               x[l] &= d[l];
 886               y[l] &= ~d[l];
 887               if (e[l]|f[l]|g[l]|h[l]|x[l]|y[l]) finished=0;
 888             }
 889             if (finished) break;
 890           }
 891           if (k>z) z=k;
 892           if (k==MAXPAIR)
 893           {
 894              printf("Some bit didn't change: ");
 895              printf("%.8x %.8x %.8x %.8x %.8x %.8x  ",
 896                     e[0],f[0],g[0],h[0],x[0],y[0]);
 897              printf("i %d j %d m %d len %d\n", i, j, m, hlen);
 898           }
 899           if (z==MAXPAIR) goto done;
 900         }
 901       }
 902     }
 903    done:
 904     if (z < MAXPAIR)
 905     {
 906       printf("Mix success  %2d bytes  %2d initvals  ",i,m);
 907       printf("required  %d  trials\n", z/2);
 908     }
 909   }
 910   printf("\n");
 911 }
 912
 913 /* Check for reading beyond the end of the buffer and alignment problems */
 914 void driver3()
 915 {
 916   uint8_t buf[MAXLEN+20], *b;
 917   uint32_t len;
 918   uint8_t q[] = "This is the time for all good men to come to the aid of their country...";
 919   uint32_t h;
 920   uint8_t qq[] = "xThis is the time for all good men to come to the aid of their country...";
 921   uint32_t i;
 922   uint8_t qqq[] = "xxThis is the time for all good men to come to the aid of their country...";
 923   uint32_t j;
 924   uint8_t qqqq[] = "xxxThis is the time for all good men to come to the aid of their country...";
 925   uint32_t ref,x,y;
 926   uint8_t *p;
 927
 928   printf("Endianness.  These lines should all be the same (for values filled in):\n");
 929   printf("%.8x                            %.8x                            %.8x\n",
 930          hashword((const uint32_t *)q, (sizeof(q)-1)/4, 13),
 931          hashword((const uint32_t *)q, (sizeof(q)-5)/4, 13),
 932          hashword((const uint32_t *)q, (sizeof(q)-9)/4, 13));
 933   p = q;
 934   printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
 935          hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
 936          hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
 937          hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
 938          hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
 939          hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
 940          hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
 941   p = &qq[1];
 942   printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
 943          hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
 944          hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
 945          hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
 946          hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
 947          hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
 948          hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
 949   p = &qqq[2];
 950   printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
 951          hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
 952          hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
 953          hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
 954          hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
 955          hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
 956          hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
 957   p = &qqqq[3];
 958   printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
 959          hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
 960          hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
 961          hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
 962          hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
 963          hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
 964          hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
 965   printf("\n");
 966
 967   /* check that hashlittle2 and hashlittle produce the same results */
 968   i=47; j=0;
 969   hashlittle2(q, sizeof(q), &i, &j);
 970   if (hashlittle(q, sizeof(q), 47) != i)
 971     printf("hashlittle2 and hashlittle mismatch\n");
 972
 973   /* check that hashword2 and hashword produce the same results */
 974   len = raninit;
 975   i=47, j=0;
 976   hashword2(&len, 1, &i, &j);
 977   if (hashword(&len, 1, 47) != i)
 978     printf("hashword2 and hashword mismatch %x %x\n",
 979            i, hashword(&len, 1, 47));
 980
 981   /* check hashlittle doesn't read before or after the ends of the string */
 982   for (h=0, b=buf+1; h<8; ++h, ++b)
 983   {
 984     for (i=0; i<MAXLEN; ++i)
 985     {
 986       len = i;
 987       for (j=0; j<i; ++j) *(b+j)=0;
 988
 989       /* these should all be equal */
 990       ref = hashlittle(b, len, (uint32_t)1);
 991       *(b+i)=(uint8_t)~0;
 992       *(b-1)=(uint8_t)~0;
 993       x = hashlittle(b, len, (uint32_t)1);
 994       y = hashlittle(b, len, (uint32_t)1);
 995       if ((ref != x) || (ref != y))
 996       {
 997         printf("alignment error: %.8x %.8x %.8x %d %d\n",ref,x,y,
 998                h, i);
 999       }
1000     }
1001   }
1002 }
1003
1004 /* check for problems with nulls */
1005  void driver4()
1006 {
1007   uint8_t buf[1];
1008   uint32_t h,i,state[HASHSTATE];
1009
1010
1011   buf[0] = ~0;
1012   for (i=0; i<HASHSTATE; ++i) state[i] = 1;
1013   printf("These should all be different\n");
1014   for (i=0, h=0; i<8; ++i)
1015   {
1016     h = hashlittle(buf, 0, h);
1017     printf("%2ld  0-byte strings, hash is  %.8x\n", i, h);
1018   }
1019 }
1020
1021
1022 int main()
1023 {
1024   driver1();   /* test that the key is hashed: used for timings */
1025   driver2();   /* test that whole key is hashed thoroughly */
1026   driver3();   /* test that nothing but the key is hashed */
1027   driver4();   /* test hashing multiple buffers (all buffers are null) */
1028   return 1;
1029 }
1030
1031 #endif  /* SELF_TEST */