/* hash_func.c revision 1574 */
1/*- 2 * Copyright (c) 1990, 1993 3 * The Regents of the University of California. All rights reserved. 4 * 5 * This code is derived from software contributed to Berkeley by 6 * Margo Seltzer. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 1. Redistributions of source code must retain the above copyright 12 * notice, this list of conditions and the following disclaimer. 13 * 2. Redistributions in binary form must reproduce the above copyright 14 * notice, this list of conditions and the following disclaimer in the 15 * documentation and/or other materials provided with the distribution. 16 * 3. All advertising materials mentioning features or use of this software 17 * must display the following acknowledgement: 18 * This product includes software developed by the University of 19 * California, Berkeley and its contributors. 20 * 4. Neither the name of the University nor the names of its contributors 21 * may be used to endorse or promote products derived from this software 22 * without specific prior written permission. 23 * 24 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 25 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 27 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 28 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 29 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 30 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 32 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 33 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 34 * SUCH DAMAGE. 
35 */ 36 37#if defined(LIBC_SCCS) && !defined(lint) 38static char sccsid[] = "@(#)hash_func.c 8.2 (Berkeley) 2/21/94"; 39#endif /* LIBC_SCCS and not lint */ 40 41#include <sys/types.h> 42 43#include <db.h> 44#include "hash.h" 45#include "page.h" 46#include "extern.h" 47 48static u_int32_t hash1 __P((const void *, size_t)); 49static u_int32_t hash2 __P((const void *, size_t)); 50static u_int32_t hash3 __P((const void *, size_t)); 51static u_int32_t hash4 __P((const void *, size_t)); 52 53/* Global default hash function */ 54u_int32_t (*__default_hash) __P((const void *, size_t)) = hash4; 55 56/* 57 * HASH FUNCTIONS 58 * 59 * Assume that we've already split the bucket to which this key hashes, 60 * calculate that bucket, and check that in fact we did already split it. 61 * 62 * This came from ejb's hsearch. 63 */ 64 65#define PRIME1 37 66#define PRIME2 1048583 67 68static u_int32_t 69hash1(keyarg, len) 70 const void *keyarg; 71 register size_t len; 72{ 73 register const u_char *key; 74 register u_int32_t h; 75 76 /* Convert string to integer */ 77 for (key = keyarg, h = 0; len--;) 78 h = h * PRIME1 ^ (*key++ - ' '); 79 h %= PRIME2; 80 return (h); 81} 82 83/* 84 * Phong's linear congruential hash 85 */ 86#define dcharhash(h, c) ((h) = 0x63c63cd9*(h) + 0x9c39c33d + (c)) 87 88static u_int32_t 89hash2(keyarg, len) 90 const void *keyarg; 91 size_t len; 92{ 93 register const u_char *e, *key; 94 register u_int32_t h; 95 register u_char c; 96 97 key = keyarg; 98 e = key + len; 99 for (h = 0; key != e;) { 100 c = *key++; 101 if (!c && key > e) 102 break; 103 dcharhash(h, c); 104 } 105 return (h); 106} 107 108/* 109 * This is INCREDIBLY ugly, but fast. We break the string up into 8 byte 110 * units. On the first time through the loop we get the "leftover bytes" 111 * (strlen % 8). On every other iteration, we perform 8 HASHC's so we handle 112 * all 8 bytes. Essentially, this saves us 7 cmp & branch instructions. 
If 113 * this routine is heavily used enough, it's worth the ugly coding. 114 * 115 * OZ's original sdbm hash 116 */ 117static u_int32_t 118hash3(keyarg, len) 119 const void *keyarg; 120 register size_t len; 121{ 122 register const u_char *key; 123 register size_t loop; 124 register u_int32_t h; 125 126#define HASHC h = *key++ + 65599 * h 127 128 h = 0; 129 key = keyarg; 130 if (len > 0) { 131 loop = (len + 8 - 1) >> 3; 132 133 switch (len & (8 - 1)) { 134 case 0: 135 do { 136 HASHC; 137 /* FALLTHROUGH */ 138 case 7: 139 HASHC; 140 /* FALLTHROUGH */ 141 case 6: 142 HASHC; 143 /* FALLTHROUGH */ 144 case 5: 145 HASHC; 146 /* FALLTHROUGH */ 147 case 4: 148 HASHC; 149 /* FALLTHROUGH */ 150 case 3: 151 HASHC; 152 /* FALLTHROUGH */ 153 case 2: 154 HASHC; 155 /* FALLTHROUGH */ 156 case 1: 157 HASHC; 158 } while (--loop); 159 } 160 } 161 return (h); 162} 163 164/* Hash function from Chris Torek. */ 165static u_int32_t 166hash4(keyarg, len) 167 const void *keyarg; 168 register size_t len; 169{ 170 register const u_char *key; 171 register size_t loop; 172 register u_int32_t h; 173 174#define HASH4a h = (h << 5) - h + *key++; 175#define HASH4b h = (h << 5) + h + *key++; 176#define HASH4 HASH4b 177 178 h = 0; 179 key = keyarg; 180 if (len > 0) { 181 loop = (len + 8 - 1) >> 3; 182 183 switch (len & (8 - 1)) { 184 case 0: 185 do { 186 HASH4; 187 /* FALLTHROUGH */ 188 case 7: 189 HASH4; 190 /* FALLTHROUGH */ 191 case 6: 192 HASH4; 193 /* FALLTHROUGH */ 194 case 5: 195 HASH4; 196 /* FALLTHROUGH */ 197 case 4: 198 HASH4; 199 /* FALLTHROUGH */ 200 case 3: 201 HASH4; 202 /* FALLTHROUGH */ 203 case 2: 204 HASH4; 205 /* FALLTHROUGH */ 206 case 1: 207 HASH4; 208 } while (--loop); 209 } 210 } 211 return (h); 212} 213