/* sys/libkern/jenkins_hash.c */

#ifndef __LIBKERN_JENKINS_H__
#define __LIBKERN_JENKINS_H__
/*
 * Taken from http://burtleburtle.net/bob/c/lookup3.c
 * $FreeBSD: head/sys/libkern/jenkins.h 218965 2011-02-23 09:22:33Z brucec $
 */
123445Sjkoshy
/*
-------------------------------------------------------------------------------
  lookup3.c, by Bob Jenkins, May 2006, Public Domain.

  These are functions for producing 32-bit hashes for hash table lookup.
  hashword(), hashlittle(), hashlittle2(), hashbig(), mix(), and final()
  are externally useful functions.  Routines to test the hash are included
  if SELF_TEST is defined.  You can use this free for any purpose.  It's in
  the public domain.  It has no warranty.

  You probably want to use hashlittle().  hashlittle() and hashbig()
  hash byte arrays.  hashlittle() is faster than hashbig() on
  little-endian machines.  Intel and AMD are little-endian machines.
  On second thought, you probably want hashlittle2(), which is identical to
  hashlittle() except it returns two 32-bit hashes for the price of one.
  You could implement hashbig2() if you wanted but I haven't bothered here.

  If you want to find a hash of, say, exactly 7 integers, do
    a = i1;  b = i2;  c = i3;
    mix(a,b,c);
    a += i4; b += i5; c += i6;
    mix(a,b,c);
    a += i7;
    final(a,b,c);
  then use c as the hash value.  If you have a variable length array of
  4-byte integers to hash, use hashword().  If you have a byte array (like
  a character string), use hashlittle().  If you have several byte arrays, or
  a mix of things, see the comments above hashlittle().

  Why is this so big?  I read 12 bytes at a time into 3 4-byte integers,
  then mix those integers.  This is fast (you can do a lot more thorough
  mixing with 12*3 instructions on 3 integers than you can with 3 instructions
  on 1 byte), but shoehorning those bytes into integers efficiently is messy.
-------------------------------------------------------------------------------
*/
123445Sjkoshy
/*
 * rot -- rotate x left by k bit positions within a 32-bit word.
 *
 * x is expected to be an unsigned 32-bit value; a wider operand would not
 * wrap at bit 32.  k must be in the range 1..31: with k == 0 the right
 * shift count becomes 32, which is undefined for a 32-bit operand.
 * Both arguments are expanded twice, so they must be free of side effects.
 */
#define rot(x,k) (((x)<<(k)) | ((x)>>(32-(k))))
123445Sjkoshy
/*
-------------------------------------------------------------------------------
mix -- mix 3 32-bit values reversibly.

This is reversible, so any information in (a,b,c) before mix() is
still in (a,b,c) after mix().

If four pairs of (a,b,c) inputs are run through mix(), or through
mix() in reverse, there are at least 32 bits of the output that
are sometimes the same for one pair and different for another pair.
This was tested for:
* pairs that differed by one bit, by two bits, in any combination
  of top bits of (a,b,c), or in any combination of bottom bits of
  (a,b,c).
* "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
  the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
  is commonly produced by subtraction) look like a single 1-bit
  difference.
* the base values were pseudorandom, all zero but one bit set, or
  all zero plus a counter that starts at zero.

Some k values for my "a-=c; a^=rot(c,k); c+=b;" arrangement that
satisfy this are
    4  6  8 16 19  4
    9 15  3 18 27 15
   14  9  3  7 17  3
Well, "9 15 3 18 27 15" didn't quite get 32 bits diffing
for "differ" defined as + with a one-bit base and a two-bit delta.  I
used http://burtleburtle.net/bob/hash/avalanche.html to choose
the operations, constants, and arrangements of the variables.

This does not achieve avalanche.  There are input bits of (a,b,c)
that fail to affect some output bits of (a,b,c), especially of a.  The
most thoroughly mixed value is c, but it doesn't really even achieve
avalanche in c.

This allows some parallelism.  Read-after-writes are good at doubling
the number of bits affected, so the goal of mixing pulls in the opposite
direction as the goal of parallelism.  I did what I could.  Rotates
seem to cost as much as shifts on every machine I could lay my hands
on, and rotates are much kinder to the top and bottom bits, so I used
rotates.
-------------------------------------------------------------------------------
*/
/*
 * mix(a,b,c) -- update the three 32-bit lvalues a, b and c in place using
 * six subtract / xor-with-rotate / add rounds (rotation counts
 * 4, 6, 8, 16, 19, 4).
 *
 * The body is wrapped in do { ... } while (0) so that "mix(a,b,c);" is a
 * single statement and stays correct as the unbraced body of an if/else.
 * Each argument is expanded many times and assigned to, so pass plain
 * variables only.  Requires rot() to be defined at the point of use.
 */
#define mix(a,b,c) \
do { \
  (a) -= (c);  (a) ^= rot((c), 4);  (c) += (b); \
  (b) -= (a);  (b) ^= rot((a), 6);  (a) += (c); \
  (c) -= (b);  (c) ^= rot((b), 8);  (b) += (a); \
  (a) -= (c);  (a) ^= rot((c),16);  (c) += (b); \
  (b) -= (a);  (b) ^= rot((a),19);  (a) += (c); \
  (c) -= (b);  (c) ^= rot((b), 4);  (b) += (a); \
} while (0)

/*
-------------------------------------------------------------------------------
final -- final mixing of 3 32-bit values (a,b,c) into c

Pairs of (a,b,c) values differing in only a few bits will usually
produce values of c that look totally different.  This was tested for
* pairs that differed by one bit, by two bits, in any combination
  of top bits of (a,b,c), or in any combination of bottom bits of
  (a,b,c).
* "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
  the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
  is commonly produced by subtraction) look like a single 1-bit
  difference.
* the base values were pseudorandom, all zero but one bit set, or
  all zero plus a counter that starts at zero.

These constants passed:
 14 11 25 16 4 14 24
 12 14 25 16 4 14 24
and these came close:
  4  8 15 26 3 22 24
 10  8 15 26 3 22 24
 11  8 15 26 3 22 24
-------------------------------------------------------------------------------
*/
/*
 * final(a,b,c) -- run seven xor / subtract-rotate rounds over the three
 * 32-bit lvalues a, b and c in place (rotation counts
 * 14, 11, 25, 16, 4, 14, 24); callers take c as the hash result.
 *
 * The body is wrapped in do { ... } while (0) so that "final(a,b,c);" is a
 * single statement and stays correct as the unbraced body of an if/else.
 * Each argument is expanded many times and assigned to, so pass plain
 * variables only.  Requires rot() to be defined at the point of use.
 */
#define final(a,b,c) \
do { \
  (c) ^= (b); (c) -= rot((b),14); \
  (a) ^= (c); (a) -= rot((c),11); \
  (b) ^= (a); (b) -= rot((a),25); \
  (c) ^= (b); (c) -= rot((b),16); \
  (a) ^= (c); (a) -= rot((c),4);  \
  (b) ^= (a); (b) -= rot((a),14); \
  (c) ^= (b); (c) -= rot((b),24); \
} while (0)

/*
--------------------------------------------------------------------
 This works on all machines.  To be useful, it requires
 -- that the key be an array of uint32_t's, and
 -- that the length be the number of uint32_t's in the key

 The function hashword() is identical to hashlittle() on little-endian
 machines, and identical to hashbig() on big-endian machines,
 except that the length has to be measured in uint32_ts rather than in
 bytes.  hashlittle() is more complicated than hashword() only because
 hashlittle() has to dance around fitting the key bytes into registers.
--------------------------------------------------------------------
*/
/*
 * Hash an array of 32-bit words into a single 32-bit value.
 *
 *   k        the key: an array of `length` uint32_t values
 *   length   number of uint32_t elements in k (not bytes)
 *   initval  a previous hash to chain from, or any arbitrary seed
 *
 * Full groups of three words are folded in with mix(); the trailing one to
 * three words are folded in with final().  When length is 0 no word is read
 * and the seed value (0xdeadbeef + initval) is returned unchanged.
 */
static uint32_t
jenkins_hashword(
                const uint32_t *k,
                size_t length,
                uint32_t initval
)
{
  /* All three lanes start from the same length- and seed-dependent value. */
  const uint32_t seed = 0xdeadbeef + (((uint32_t)length)<<2) + initval;
  uint32_t x = seed;
  uint32_t y = seed;
  uint32_t z = seed;
  const uint32_t *word = k;
  size_t remaining = length;

  /* Consume three words per round while more than three remain. */
  for (; remaining > 3; remaining -= 3, word += 3)
  {
    x += word[0];
    y += word[1];
    z += word[2];
    mix(x,y,z);
  }

  /* Nothing left over: the state is returned without a final() pass. */
  if (remaining == 0)
  {
    return z;
  }

  /* One to three words remain; add them highest index first, then finalize. */
  if (remaining >= 3)
  {
    z += word[2];
  }
  if (remaining >= 2)
  {
    y += word[1];
  }
  x += word[0];
  final(x,y,z);

  return z;
}
#endif