10SN/A/* Licensed to the Apache Software Foundation (ASF) under one or more 211784Sdarcy * contributor license agreements. See the NOTICE file distributed with 30SN/A * this work for additional information regarding copyright ownership. 40SN/A * The ASF licenses this file to You under the Apache License, Version 2.0 50SN/A * (the "License"); you may not use this file except in compliance with 60SN/A * the License. You may obtain a copy of the License at 72362SN/A * 80SN/A * http://www.apache.org/licenses/LICENSE-2.0 92362SN/A * 100SN/A * Unless required by applicable law or agreed to in writing, software 110SN/A * distributed under the License is distributed on an "AS IS" BASIS, 120SN/A * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 130SN/A * See the License for the specific language governing permissions and 140SN/A * limitations under the License. 150SN/A */ 160SN/A 170SN/A/* 180SN/A * sdbm - ndbm work-alike hashed database library 190SN/A * based on Per-Aake Larson's Dynamic Hashing algorithms. BIT 18 (1978). 200SN/A * author: oz@nexus.yorku.ca 212362SN/A * ex-public domain, ported to APR for Apache 2 222362SN/A * core routines 232362SN/A */ 240SN/A 250SN/A#include "apr.h" 260SN/A#include "apr_file_io.h" 270SN/A#include "apr_strings.h" 280SN/A#include "apr_errno.h" 290SN/A#include "apr_sdbm.h" 300SN/A 310SN/A#include "sdbm_tune.h" 320SN/A#include "sdbm_pair.h" 330SN/A#include "sdbm_private.h" 340SN/A 350SN/A#include <string.h> /* for memset() */ 360SN/A#include <stdlib.h> /* for malloc() and free() */ 370SN/A 380SN/A/* 390SN/A * forward 400SN/A */ 410SN/Astatic int getdbit (apr_sdbm_t *, long); 420SN/Astatic apr_status_t setdbit(apr_sdbm_t *, long); 430SN/Astatic apr_status_t getpage(apr_sdbm_t *db, long); 440SN/Astatic apr_status_t getnext(apr_sdbm_datum_t *key, apr_sdbm_t *db); 450SN/Astatic apr_status_t makroom(apr_sdbm_t *, long, int); 4611784Sdarcy 470SN/A/* 480SN/A * useful macros 490SN/A */ 500SN/A#define bad(x) ((x).dptr == NULL || (x).dsize <= 0) 510SN/A#define exhash(item) sdbm_hash((item).dptr, (item).dsize) 520SN/A 530SN/A#define OFF_PAG(off) (apr_off_t) (off) * PBLKSIZ 540SN/A#define OFF_DIR(off) (apr_off_t) (off) * DBLKSIZ 550SN/A 560SN/Astatic const long masks[] = { 570SN/A 000000000000, 000000000001, 000000000003, 000000000007, 580SN/A 000000000017, 000000000037, 000000000077, 000000000177, 590SN/A 000000000377, 000000000777, 000000001777, 000000003777, 600SN/A 000000007777, 000000017777, 000000037777, 000000077777, 6111784Sdarcy 000000177777, 000000377777, 000000777777, 000001777777, 6211784Sdarcy 000003777777, 000007777777, 000017777777, 000037777777, 630SN/A 000077777777, 000177777777, 000377777777, 000777777777, 640SN/A 001777777777, 003777777777, 007777777777, 017777777777 650SN/A}; 660SN/A 670SN/Aconst apr_sdbm_datum_t sdbm_nullitem = { NULL, 0 }; 680SN/A 690SN/Astatic apr_status_t database_cleanup(void *data) 700SN/A{ 710SN/A apr_sdbm_t *db = data; 720SN/A 730SN/A /* 740SN/A * Can't rely on apr_sdbm_unlock, since it will merely 750SN/A * decrement the refcnt if several locks are held. 760SN/A */ 770SN/A if (db->flags & (SDBM_SHARED_LOCK | SDBM_EXCLUSIVE_LOCK)) 780SN/A (void) apr_file_unlock(db->dirf); 790SN/A (void) apr_file_close(db->dirf); 800SN/A (void) apr_file_close(db->pagf); 810SN/A free(db); 820SN/A 830SN/A return APR_SUCCESS; 840SN/A} 850SN/A 860SN/Astatic apr_status_t prep(apr_sdbm_t **pdb, const char *dirname, const char *pagname, 870SN/A apr_int32_t flags, apr_fileperms_t perms, apr_pool_t *p) 880SN/A{ 890SN/A apr_sdbm_t *db; 900SN/A apr_status_t status; 910SN/A 920SN/A *pdb = NULL; 930SN/A 940SN/A db = malloc(sizeof(*db)); 950SN/A memset(db, 0, sizeof(*db)); 960SN/A 970SN/A db->pool = p; 980SN/A 990SN/A /* 1000SN/A * adjust user flags so that WRONLY becomes RDWR, 1010SN/A * as required by this package. Also set our internal 1020SN/A * flag for RDONLY if needed. 1030SN/A */ 1040SN/A if (!(flags & APR_FOPEN_WRITE)) { 1050SN/A db->flags |= SDBM_RDONLY; 1060SN/A } 1070SN/A 1080SN/A /* 1090SN/A * adjust the file open flags so that we handle locking 1100SN/A * on our own (don't rely on any locking behavior within 1110SN/A * an apr_file_t, in case it's ever introduced, and set 1120SN/A * our own flag. 1130SN/A */ 1140SN/A if (flags & APR_FOPEN_SHARELOCK) { 1150SN/A db->flags |= SDBM_SHARED; 1160SN/A flags &= ~APR_FOPEN_SHARELOCK; 1170SN/A } 1180SN/A 1190SN/A flags |= APR_FOPEN_BINARY | APR_FOPEN_READ; 1200SN/A 1210SN/A /* 1220SN/A * open the files in sequence, and stat the dirfile. 123 * If we fail anywhere, undo everything, return NULL. 124 */ 125 126 if ((status = apr_file_open(&db->dirf, dirname, flags, perms, p)) 127 != APR_SUCCESS) 128 goto error; 129 130 if ((status = apr_file_open(&db->pagf, pagname, flags, perms, p)) 131 != APR_SUCCESS) 132 goto error; 133 134 if ((status = apr_sdbm_lock(db, (db->flags & SDBM_RDONLY) 135 ? APR_FLOCK_SHARED 136 : APR_FLOCK_EXCLUSIVE)) 137 != APR_SUCCESS) 138 goto error; 139 140 /* apr_pcalloc zeroed the buffers 141 * apr_sdbm_lock stated the dirf->size and invalidated the cache 142 */ 143 144 /* 145 * if we are opened in SHARED mode, unlock ourself 146 */ 147 if (db->flags & SDBM_SHARED) 148 if ((status = apr_sdbm_unlock(db)) != APR_SUCCESS) 149 goto error; 150 151 /* make sure that we close the database at some point */ 152 apr_pool_cleanup_register(p, db, database_cleanup, apr_pool_cleanup_null); 153 154 /* Done! */ 155 *pdb = db; 156 return APR_SUCCESS; 157 158error: 159 if (db->dirf && db->pagf) 160 (void) apr_sdbm_unlock(db); 161 if (db->dirf != NULL) 162 (void) apr_file_close(db->dirf); 163 if (db->pagf != NULL) { 164 (void) apr_file_close(db->pagf); 165 } 166 free(db); 167 return status; 168} 169 170APU_DECLARE(apr_status_t) apr_sdbm_open(apr_sdbm_t **db, const char *file, 171 apr_int32_t flags, 172 apr_fileperms_t perms, apr_pool_t *p) 173{ 174 char *dirname = apr_pstrcat(p, file, APR_SDBM_DIRFEXT, NULL); 175 char *pagname = apr_pstrcat(p, file, APR_SDBM_PAGFEXT, NULL); 176 177 return prep(db, dirname, pagname, flags, perms, p); 178} 179 180APU_DECLARE(apr_status_t) apr_sdbm_close(apr_sdbm_t *db) 181{ 182 return apr_pool_cleanup_run(db->pool, db, database_cleanup); 183} 184 185APU_DECLARE(apr_status_t) apr_sdbm_fetch(apr_sdbm_t *db, apr_sdbm_datum_t *val, 186 apr_sdbm_datum_t key) 187{ 188 apr_status_t status; 189 190 if (db == NULL || bad(key)) 191 return APR_EINVAL; 192 193 if ((status = apr_sdbm_lock(db, APR_FLOCK_SHARED)) != APR_SUCCESS) 194 return status; 195 196 if ((status = getpage(db, exhash(key))) == APR_SUCCESS) { 197 *val = getpair(db->pagbuf, key); 198 /* ### do we want a not-found result? */ 199 } 200 201 (void) apr_sdbm_unlock(db); 202 203 return status; 204} 205 206static apr_status_t write_page(apr_sdbm_t *db, const char *buf, long pagno) 207{ 208 apr_status_t status; 209 apr_off_t off = OFF_PAG(pagno); 210 211 if ((status = apr_file_seek(db->pagf, APR_SET, &off)) == APR_SUCCESS) 212 status = apr_file_write_full(db->pagf, buf, PBLKSIZ, NULL); 213 214 return status; 215} 216 217APU_DECLARE(apr_status_t) apr_sdbm_delete(apr_sdbm_t *db, 218 const apr_sdbm_datum_t key) 219{ 220 apr_status_t status; 221 222 if (db == NULL || bad(key)) 223 return APR_EINVAL; 224 if (apr_sdbm_rdonly(db)) 225 return APR_EINVAL; 226 227 if ((status = apr_sdbm_lock(db, APR_FLOCK_EXCLUSIVE)) != APR_SUCCESS) 228 return status; 229 230 if ((status = getpage(db, exhash(key))) == APR_SUCCESS) { 231 if (!delpair(db->pagbuf, key)) 232 /* ### should we define some APRUTIL codes? */ 233 status = APR_EGENERAL; 234 else 235 status = write_page(db, db->pagbuf, db->pagbno); 236 } 237 238 (void) apr_sdbm_unlock(db); 239 240 return status; 241} 242 243APU_DECLARE(apr_status_t) apr_sdbm_store(apr_sdbm_t *db, apr_sdbm_datum_t key, 244 apr_sdbm_datum_t val, int flags) 245{ 246 int need; 247 register long hash; 248 apr_status_t status; 249 250 if (db == NULL || bad(key)) 251 return APR_EINVAL; 252 if (apr_sdbm_rdonly(db)) 253 return APR_EINVAL; 254 need = key.dsize + val.dsize; 255 /* 256 * is the pair too big (or too small) for this database ?? 257 */ 258 if (need < 0 || need > PAIRMAX) 259 return APR_EINVAL; 260 261 if ((status = apr_sdbm_lock(db, APR_FLOCK_EXCLUSIVE)) != APR_SUCCESS) 262 return status; 263 264 if ((status = getpage(db, (hash = exhash(key)))) == APR_SUCCESS) { 265 266 /* 267 * if we need to replace, delete the key/data pair 268 * first. If it is not there, ignore. 269 */ 270 if (flags == APR_SDBM_REPLACE) 271 (void) delpair(db->pagbuf, key); 272 else if (!(flags & APR_SDBM_INSERTDUP) && duppair(db->pagbuf, key)) { 273 status = APR_EEXIST; 274 goto error; 275 } 276 /* 277 * if we do not have enough room, we have to split. 278 */ 279 if (!fitpair(db->pagbuf, need)) 280 if ((status = makroom(db, hash, need)) != APR_SUCCESS) 281 goto error; 282 /* 283 * we have enough room or split is successful. insert the key, 284 * and update the page file. 285 */ 286 (void) putpair(db->pagbuf, key, val); 287 288 status = write_page(db, db->pagbuf, db->pagbno); 289 } 290 291error: 292 (void) apr_sdbm_unlock(db); 293 294 return status; 295} 296 297/* 298 * makroom - make room by splitting the overfull page 299 * this routine will attempt to make room for SPLTMAX times before 300 * giving up. 301 */ 302static apr_status_t makroom(apr_sdbm_t *db, long hash, int need) 303{ 304 long newp; 305 char twin[PBLKSIZ]; 306 char *pag = db->pagbuf; 307 char *new = twin; 308 register int smax = SPLTMAX; 309 apr_status_t status; 310 311 do { 312 /* 313 * split the current page 314 */ 315 (void) splpage(pag, new, db->hmask + 1); 316 /* 317 * address of the new page 318 */ 319 newp = (hash & db->hmask) | (db->hmask + 1); 320 321 /* 322 * write delay, read avoidence/cache shuffle: 323 * select the page for incoming pair: if key is to go to the new page, 324 * write out the previous one, and copy the new one over, thus making 325 * it the current page. If not, simply write the new page, and we are 326 * still looking at the page of interest. current page is not updated 327 * here, as sdbm_store will do so, after it inserts the incoming pair. 328 */ 329 if (hash & (db->hmask + 1)) { 330 if ((status = write_page(db, db->pagbuf, db->pagbno)) 331 != APR_SUCCESS) 332 return status; 333 334 db->pagbno = newp; 335 (void) memcpy(pag, new, PBLKSIZ); 336 } 337 else { 338 if ((status = write_page(db, new, newp)) != APR_SUCCESS) 339 return status; 340 } 341 342 if ((status = setdbit(db, db->curbit)) != APR_SUCCESS) 343 return status; 344 /* 345 * see if we have enough room now 346 */ 347 if (fitpair(pag, need)) 348 return APR_SUCCESS; 349 /* 350 * try again... update curbit and hmask as getpage would have 351 * done. because of our update of the current page, we do not 352 * need to read in anything. BUT we have to write the current 353 * [deferred] page out, as the window of failure is too great. 354 */ 355 db->curbit = 2 * db->curbit 356 + ((hash & (db->hmask + 1)) ? 2 : 1); 357 db->hmask |= db->hmask + 1; 358 359 if ((status = write_page(db, db->pagbuf, db->pagbno)) 360 != APR_SUCCESS) 361 return status; 362 363 } while (--smax); 364 365 /* 366 * if we are here, this is real bad news. After SPLTMAX splits, 367 * we still cannot fit the key. say goodnight. 368 */ 369#if 0 370 (void) write(2, "sdbm: cannot insert after SPLTMAX attempts.\n", 44); 371#endif 372 /* ### ENOSPC not really appropriate but better than nothing */ 373 return APR_ENOSPC; 374 375} 376 377/* Reads 'len' bytes from file 'f' at offset 'off' into buf. 378 * 'off' is given relative to the start of the file. 379 * If EOF is returned while reading, this is taken as success. 380 */ 381static apr_status_t read_from(apr_file_t *f, void *buf, 382 apr_off_t off, apr_size_t len) 383{ 384 apr_status_t status; 385 386 if ((status = apr_file_seek(f, APR_SET, &off)) != APR_SUCCESS || 387 ((status = apr_file_read_full(f, buf, len, NULL)) != APR_SUCCESS)) { 388 /* if EOF is reached, pretend we read all zero's */ 389 if (status == APR_EOF) { 390 memset(buf, 0, len); 391 status = APR_SUCCESS; 392 } 393 } 394 395 return status; 396} 397 398/* 399 * the following two routines will break if 400 * deletions aren't taken into account. (ndbm bug) 401 */ 402APU_DECLARE(apr_status_t) apr_sdbm_firstkey(apr_sdbm_t *db, 403 apr_sdbm_datum_t *key) 404{ 405 apr_status_t status; 406 407 if ((status = apr_sdbm_lock(db, APR_FLOCK_SHARED)) != APR_SUCCESS) 408 return status; 409 410 /* 411 * start at page 0 412 */ 413 if ((status = read_from(db->pagf, db->pagbuf, OFF_PAG(0), PBLKSIZ)) 414 == APR_SUCCESS) { 415 db->pagbno = 0; 416 db->blkptr = 0; 417 db->keyptr = 0; 418 status = getnext(key, db); 419 } 420 421 (void) apr_sdbm_unlock(db); 422 423 return status; 424} 425 426APU_DECLARE(apr_status_t) apr_sdbm_nextkey(apr_sdbm_t *db, 427 apr_sdbm_datum_t *key) 428{ 429 apr_status_t status; 430 431 if ((status = apr_sdbm_lock(db, APR_FLOCK_SHARED)) != APR_SUCCESS) 432 return status; 433 434 status = getnext(key, db); 435 436 (void) apr_sdbm_unlock(db); 437 438 return status; 439} 440 441/* 442 * all important binary tree traversal 443 */ 444static apr_status_t getpage(apr_sdbm_t *db, long hash) 445{ 446 register int hbit; 447 register long dbit; 448 register long pagb; 449 apr_status_t status; 450 451 dbit = 0; 452 hbit = 0; 453 while (dbit < db->maxbno && getdbit(db, dbit)) 454 dbit = 2 * dbit + ((hash & (1 << hbit++)) ? 2 : 1); 455 456 debug(("dbit: %d...", dbit)); 457 458 db->curbit = dbit; 459 db->hmask = masks[hbit]; 460 461 pagb = hash & db->hmask; 462 /* 463 * see if the block we need is already in memory. 464 * note: this lookaside cache has about 10% hit rate. 465 */ 466 if (pagb != db->pagbno) { 467 /* 468 * note: here, we assume a "hole" is read as 0s. 469 * if not, must zero pagbuf first. 470 * ### joe: this assumption was surely never correct? but 471 * ### we make it so in read_from anyway. 472 */ 473 if ((status = read_from(db->pagf, db->pagbuf, OFF_PAG(pagb), PBLKSIZ)) 474 != APR_SUCCESS) 475 return status; 476 477 if (!chkpage(db->pagbuf)) 478 return APR_ENOSPC; /* ### better error? */ 479 db->pagbno = pagb; 480 481 debug(("pag read: %d\n", pagb)); 482 } 483 return APR_SUCCESS; 484} 485 486static int getdbit(apr_sdbm_t *db, long dbit) 487{ 488 register long c; 489 register long dirb; 490 491 c = dbit / BYTESIZ; 492 dirb = c / DBLKSIZ; 493 494 if (dirb != db->dirbno) { 495 if (read_from(db->dirf, db->dirbuf, OFF_DIR(dirb), DBLKSIZ) 496 != APR_SUCCESS) 497 return 0; 498 499 db->dirbno = dirb; 500 501 debug(("dir read: %d\n", dirb)); 502 } 503 504 return db->dirbuf[c % DBLKSIZ] & (1 << dbit % BYTESIZ); 505} 506 507static apr_status_t setdbit(apr_sdbm_t *db, long dbit) 508{ 509 register long c; 510 register long dirb; 511 apr_status_t status; 512 apr_off_t off; 513 514 c = dbit / BYTESIZ; 515 dirb = c / DBLKSIZ; 516 517 if (dirb != db->dirbno) { 518 if ((status = read_from(db->dirf, db->dirbuf, OFF_DIR(dirb), DBLKSIZ)) 519 != APR_SUCCESS) 520 return status; 521 522 db->dirbno = dirb; 523 524 debug(("dir read: %d\n", dirb)); 525 } 526 527 db->dirbuf[c % DBLKSIZ] |= (1 << dbit % BYTESIZ); 528 529 if (dbit >= db->maxbno) 530 db->maxbno += DBLKSIZ * BYTESIZ; 531 532 off = OFF_DIR(dirb); 533 if ((status = apr_file_seek(db->dirf, APR_SET, &off)) == APR_SUCCESS) 534 status = apr_file_write_full(db->dirf, db->dirbuf, DBLKSIZ, NULL); 535 536 return status; 537} 538 539/* 540* getnext - get the next key in the page, and if done with 541* the page, try the next page in sequence 542*/ 543static apr_status_t getnext(apr_sdbm_datum_t *key, apr_sdbm_t *db) 544{ 545 apr_status_t status; 546 for (;;) { 547 db->keyptr++; 548 *key = getnkey(db->pagbuf, db->keyptr); 549 if (key->dptr != NULL) 550 return APR_SUCCESS; 551 /* 552 * we either run out, or there is nothing on this page.. 553 * try the next one... If we lost our position on the 554 * file, we will have to seek. 555 */ 556 db->keyptr = 0; 557 if (db->pagbno != db->blkptr++) { 558 apr_off_t off = OFF_PAG(db->blkptr); 559 if ((status = apr_file_seek(db->pagf, APR_SET, &off)) 560 != APR_SUCCESS) 561 return status; 562 } 563 564 db->pagbno = db->blkptr; 565 /* ### EOF acceptable here too? */ 566 if ((status = apr_file_read_full(db->pagf, db->pagbuf, PBLKSIZ, NULL)) 567 != APR_SUCCESS) 568 return status; 569 if (!chkpage(db->pagbuf)) 570 return APR_EGENERAL; /* ### need better error */ 571 } 572 573 /* NOTREACHED */ 574} 575 576 577APU_DECLARE(int) apr_sdbm_rdonly(apr_sdbm_t *db) 578{ 579 /* ### Should we return true if the first lock is a share lock, 580 * to reflect that apr_sdbm_store and apr_sdbm_delete will fail? 581 */ 582 return (db->flags & SDBM_RDONLY) != 0; 583} 584 585