ref: b24fd14c329aa00b0d9703864f875258164216c4
dir: /util/htab.c/
#include <stdlib.h> #include <stdio.h> #include <stdarg.h> #include <inttypes.h> #include <assert.h> #include <limits.h> #include <string.h> #include "util.h" #define Initsz 16 #define Seed 2928213749 ulong murmurhash2(void *key, size_t len); /* Creates a new empty hash table, using 'hash' as the * hash funciton, and 'cmp' to verify that there are no * hash collisions. */ Htab *mkht(ulong (*hash)(void *key), int (*cmp)(void *k1, void *k2)) { Htab *ht; ht = xalloc(sizeof(Htab)); ht->nelt = 0; ht->ndead = 0; ht->sz = Initsz; ht->hash = hash; ht->cmp = cmp; ht->keys = zalloc(Initsz * sizeof(void *)); ht->vals = zalloc(Initsz * sizeof(void *)); ht->hashes = zalloc(Initsz * sizeof(void *)); ht->dead = zalloc(Initsz * sizeof(char)); return ht; } /* Frees a hash table. Passing this function * NULL is a no-op. */ void htfree(Htab *ht) { if (!ht) return; free(ht->keys); free(ht->vals); free(ht->hashes); free(ht->dead); free(ht); } /* Offsets the hash so that '0' can be * used as a 'no valid value */ static ulong hash(Htab *ht, void *k) { ulong h; h = ht->hash(k); if (h == 0) return 1; else return h; } /* Resizes the hash table by copying all * the old keys into the right slots in a * new table. */ static void grow(Htab *ht, int sz) { void **oldk; void **oldv; ulong *oldh; char *oldd; int oldsz; int i; oldk = ht->keys; oldv = ht->vals; oldh = ht->hashes; oldd = ht->dead; oldsz = ht->sz; ht->nelt = 0; ht->ndead = 0; ht->sz = sz; ht->keys = zalloc(sz * sizeof(void *)); ht->vals = zalloc(sz * sizeof(void *)); ht->hashes = zalloc(sz * sizeof(void *)); ht->dead = zalloc(sz * sizeof(void *)); for (i = 0; i < oldsz; i++) if (oldh[i] && !oldd[i]) htput(ht, oldk[i], oldv[i]); free(oldh); free(oldk); free(oldv); free(oldd); } /* Inserts 'k' into the hash table, possibly * killing any previous key that compares * as equal. */ int htput(Htab *ht, void *k, void *v) { int i; ulong h; int di; di = 0; h = hash(ht, k); i = h & (ht->sz - 1); while (ht->hashes[i] && !ht->dead[i]) { /* second insertion overwrites first. nb, we shouldn't touch the * keys for dead values */ if (ht->hashes[i] == h) { if (ht->dead[i]) break; else if (ht->cmp(ht->keys[i], k)) goto conflicted; } di++; i = (h + di) & (ht->sz - 1); } ht->nelt++; conflicted: if (ht->dead[i]) ht->ndead--; ht->hashes[i] = h; ht->keys[i] = k; ht->vals[i] = v; ht->dead[i] = 0; if (ht->sz < ht->nelt * 2) grow(ht, ht->sz * 2); if (ht->sz < ht->ndead * 4) grow(ht, ht->sz); return 1; } /* Finds the index that we would insert * the key into */ static ssize_t htidx(Htab *ht, void *k) { ssize_t i; ulong h; int di; di = 0; h = hash(ht, k); i = h & (ht->sz - 1); while (ht->hashes[i] && !ht->dead[i] && ht->hashes[i] != h) { searchmore: di++; i = (h + di) & (ht->sz - 1); } if (!ht->hashes[i]) return -1; if ((ht->hashes[i] == h && ht->dead[i]) || !ht->cmp(ht->keys[i], k)) goto searchmore; /* collision */ return i; } /* Looks up a key, returning NULL if * the value is not present. Note, * if NULL is a valid value, you need * to check with hthas() to see if it's * not there */ void *htget(Htab *ht, void *k) { ssize_t i; i = htidx(ht, k); if (i < 0) return NULL; else return ht->vals[i]; } void htdel(Htab *ht, void *k) { ssize_t i; i = htidx(ht, k); if (i < 0) return; assert(!ht->dead[i]); assert(ht->hashes[i]); ht->dead[i] = 1; ht->nelt--; ht->ndead++; } /* Tests for 'k's presence in 'ht' */ int hthas(Htab *ht, void *k) { return htidx(ht, k) >= 0; } /* Returns a list of all keys in the hash * table, storing the size of the returned * array in 'nkeys'. NB: the value returned * is allocated on the heap, and it is the * job of the caller to free it */ void **htkeys(Htab *ht, size_t *nkeys) { void **k; size_t i, j; j = 0; k = xalloc(sizeof(void *) * ht->nelt); for (i = 0; i < ht->sz; i++) if (ht->hashes[i] && !ht->dead[i]) k[j++] = ht->keys[i]; *nkeys = ht->nelt; return k; } ulong strhash(void *_s) { char *s; s = _s; if (!s) return Seed; return murmurhash2(_s, strlen(_s)); } int streq(void *a, void *b) { if (a == b) return 1; if (a == NULL || b == NULL) return 0; return !strcmp(a, b); } ulong strlithash(void *_s) { Str *s; s = _s; if (!s) return Seed; return murmurhash2(s->buf, s->len); } int strliteq(void *_a, void *_b) { Str *a, *b; a = _a; b = _b; if (a == b) return 1; if (a == NULL || b == NULL) return 0; if (a->len != b->len) return 0; return !memcmp(a->buf, b->buf, a->len); } ulong ptrhash(void *key) { return inthash((uintptr_t)key); } ulong inthash(uint64_t key) { return murmurhash2(&key, sizeof key); } int inteq(uint64_t a, uint64_t b) { return a == b; } int ptreq(void *a, void *b) { return a == b; } ulong murmurhash2 (void *ptr, size_t len) { uint32_t m = 0x5bd1e995; uint32_t r = 24; uint32_t h, k; uint32_t *data; char *buf; buf = ptr; data = (uint32_t*)buf; h = Seed ^ len; while (len >= 4) { k = *data; k *= m; k ^= k >> r; k *= m; h *= m; h ^= k; data++; len -= sizeof(*data); } switch (len) { case 3: h ^= buf[2] << 16; case 2: h ^= buf[1] << 8; case 1: h ^= buf[0] << 0; default: break; }; h *= m; h ^= h >> 13; h *= m; h ^= h >> 15; return h; }