/* $Id: compat_ohash.c,v 1.7 2020/06/15 01:37:15 schwarze Exp $ */
/* $OpenBSD: ohash.c,v 1.1 2014/06/02 18:52:03 deraadt Exp $ */

/* Copyright (c) 1999, 2004 Marc Espie <espie@openbsd.org>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
18*6d38604fSBaptiste Daroussin #include "config.h"
1961d06d6bSBaptiste Daroussin
2061d06d6bSBaptiste Daroussin #include <sys/types.h>
2161d06d6bSBaptiste Daroussin #include <stddef.h>
2261d06d6bSBaptiste Daroussin #include <stdint.h>
2361d06d6bSBaptiste Daroussin #include <stdlib.h>
2461d06d6bSBaptiste Daroussin #include <string.h>
2561d06d6bSBaptiste Daroussin #include <limits.h>
2661d06d6bSBaptiste Daroussin #include "compat_ohash.h"
2761d06d6bSBaptiste Daroussin
/*
 * One slot of the open-addressing table: the full hash value of the
 * entry and a pointer to the entry itself.  A slot whose p is NULL has
 * never been used; a slot whose p equals DELETED is a tombstone left
 * behind by a removal.
 */
struct _ohash_record {
	uint32_t	 hv;
	const char	*p;
};
3261d06d6bSBaptiste Daroussin
/*
 * Slot markers.  Both macros expand to an expression that uses a
 * variable named `h', so they only work where a `struct ohash *h' is
 * in scope.
 *
 * DELETED is the address of the table itself, stored as the p value of
 * a slot whose entry was removed.  NONE is h->size, i.e. one past the
 * last valid slot index, used to mean "no slot remembered".
 */
#define DELETED		((const char *)h)
#define NONE		(h->size)

/* Don't bother changing the hash table if the change is small enough. */
#define MINSIZE		(1UL << 4)
#define MINDELETED	4
3961d06d6bSBaptiste Daroussin
/* Forward declaration: ohash_remove() and ohash_insert() call this. */
static void		 ohash_resize(struct ohash *);
4161d06d6bSBaptiste Daroussin
4261d06d6bSBaptiste Daroussin
4361d06d6bSBaptiste Daroussin /* This handles the common case of variable length keys, where the
4461d06d6bSBaptiste Daroussin * key is stored at the end of the record.
4561d06d6bSBaptiste Daroussin */
4661d06d6bSBaptiste Daroussin void *
ohash_create_entry(struct ohash_info * i,const char * start,const char ** end)4761d06d6bSBaptiste Daroussin ohash_create_entry(struct ohash_info *i, const char *start, const char **end)
4861d06d6bSBaptiste Daroussin {
4961d06d6bSBaptiste Daroussin char *p;
5061d06d6bSBaptiste Daroussin
5161d06d6bSBaptiste Daroussin if (!*end)
5261d06d6bSBaptiste Daroussin *end = start + strlen(start);
5361d06d6bSBaptiste Daroussin p = (i->alloc)(i->key_offset + (*end - start) + 1, i->data);
5461d06d6bSBaptiste Daroussin if (p) {
5561d06d6bSBaptiste Daroussin memcpy(p+i->key_offset, start, *end-start);
5661d06d6bSBaptiste Daroussin p[i->key_offset + (*end - start)] = '\0';
5761d06d6bSBaptiste Daroussin }
5861d06d6bSBaptiste Daroussin return (void *)p;
5961d06d6bSBaptiste Daroussin }
6061d06d6bSBaptiste Daroussin
6161d06d6bSBaptiste Daroussin /* hash_delete only frees the hash structure. Use hash_first/hash_next
6261d06d6bSBaptiste Daroussin * to free entries as well. */
6361d06d6bSBaptiste Daroussin void
ohash_delete(struct ohash * h)6461d06d6bSBaptiste Daroussin ohash_delete(struct ohash *h)
6561d06d6bSBaptiste Daroussin {
6661d06d6bSBaptiste Daroussin (h->info.free)(h->t, h->info.data);
6761d06d6bSBaptiste Daroussin #ifndef NDEBUG
6861d06d6bSBaptiste Daroussin h->t = NULL;
6961d06d6bSBaptiste Daroussin #endif
7061d06d6bSBaptiste Daroussin }
7161d06d6bSBaptiste Daroussin
7261d06d6bSBaptiste Daroussin static void
ohash_resize(struct ohash * h)7361d06d6bSBaptiste Daroussin ohash_resize(struct ohash *h)
7461d06d6bSBaptiste Daroussin {
7561d06d6bSBaptiste Daroussin struct _ohash_record *n;
7661d06d6bSBaptiste Daroussin size_t ns;
7761d06d6bSBaptiste Daroussin unsigned int j;
7861d06d6bSBaptiste Daroussin unsigned int i, incr;
7961d06d6bSBaptiste Daroussin
8061d06d6bSBaptiste Daroussin if (4 * h->deleted < h->total) {
8161d06d6bSBaptiste Daroussin if (h->size >= (UINT_MAX >> 1U))
8261d06d6bSBaptiste Daroussin ns = UINT_MAX;
8361d06d6bSBaptiste Daroussin else
8461d06d6bSBaptiste Daroussin ns = h->size << 1U;
8561d06d6bSBaptiste Daroussin } else if (3 * h->deleted > 2 * h->total)
8661d06d6bSBaptiste Daroussin ns = h->size >> 1U;
8761d06d6bSBaptiste Daroussin else
8861d06d6bSBaptiste Daroussin ns = h->size;
8961d06d6bSBaptiste Daroussin if (ns < MINSIZE)
9061d06d6bSBaptiste Daroussin ns = MINSIZE;
9161d06d6bSBaptiste Daroussin #ifdef STATS_HASH
9261d06d6bSBaptiste Daroussin STAT_HASH_EXPAND++;
9361d06d6bSBaptiste Daroussin STAT_HASH_SIZE += ns - h->size;
9461d06d6bSBaptiste Daroussin #endif
9561d06d6bSBaptiste Daroussin
9661d06d6bSBaptiste Daroussin n = (h->info.calloc)(ns, sizeof(struct _ohash_record), h->info.data);
9761d06d6bSBaptiste Daroussin if (!n)
9861d06d6bSBaptiste Daroussin return;
9961d06d6bSBaptiste Daroussin
10061d06d6bSBaptiste Daroussin for (j = 0; j < h->size; j++) {
10161d06d6bSBaptiste Daroussin if (h->t[j].p != NULL && h->t[j].p != DELETED) {
10261d06d6bSBaptiste Daroussin i = h->t[j].hv % ns;
10361d06d6bSBaptiste Daroussin incr = ((h->t[j].hv % (ns - 2)) & ~1) + 1;
10461d06d6bSBaptiste Daroussin while (n[i].p != NULL) {
10561d06d6bSBaptiste Daroussin i += incr;
10661d06d6bSBaptiste Daroussin if (i >= ns)
10761d06d6bSBaptiste Daroussin i -= ns;
10861d06d6bSBaptiste Daroussin }
10961d06d6bSBaptiste Daroussin n[i].hv = h->t[j].hv;
11061d06d6bSBaptiste Daroussin n[i].p = h->t[j].p;
11161d06d6bSBaptiste Daroussin }
11261d06d6bSBaptiste Daroussin }
11361d06d6bSBaptiste Daroussin (h->info.free)(h->t, h->info.data);
11461d06d6bSBaptiste Daroussin h->t = n;
11561d06d6bSBaptiste Daroussin h->size = ns;
11661d06d6bSBaptiste Daroussin h->total -= h->deleted;
11761d06d6bSBaptiste Daroussin h->deleted = 0;
11861d06d6bSBaptiste Daroussin }
11961d06d6bSBaptiste Daroussin
12061d06d6bSBaptiste Daroussin void *
ohash_remove(struct ohash * h,unsigned int i)12161d06d6bSBaptiste Daroussin ohash_remove(struct ohash *h, unsigned int i)
12261d06d6bSBaptiste Daroussin {
12361d06d6bSBaptiste Daroussin void *result = (void *)h->t[i].p;
12461d06d6bSBaptiste Daroussin
12561d06d6bSBaptiste Daroussin if (result == NULL || result == DELETED)
12661d06d6bSBaptiste Daroussin return NULL;
12761d06d6bSBaptiste Daroussin
12861d06d6bSBaptiste Daroussin #ifdef STATS_HASH
12961d06d6bSBaptiste Daroussin STAT_HASH_ENTRIES--;
13061d06d6bSBaptiste Daroussin #endif
13161d06d6bSBaptiste Daroussin h->t[i].p = DELETED;
13261d06d6bSBaptiste Daroussin h->deleted++;
13361d06d6bSBaptiste Daroussin if (h->deleted >= MINDELETED && 4 * h->deleted > h->total)
13461d06d6bSBaptiste Daroussin ohash_resize(h);
13561d06d6bSBaptiste Daroussin return result;
13661d06d6bSBaptiste Daroussin }
13761d06d6bSBaptiste Daroussin
13861d06d6bSBaptiste Daroussin void *
ohash_find(struct ohash * h,unsigned int i)13961d06d6bSBaptiste Daroussin ohash_find(struct ohash *h, unsigned int i)
14061d06d6bSBaptiste Daroussin {
14161d06d6bSBaptiste Daroussin if (h->t[i].p == DELETED)
14261d06d6bSBaptiste Daroussin return NULL;
14361d06d6bSBaptiste Daroussin else
14461d06d6bSBaptiste Daroussin return (void *)h->t[i].p;
14561d06d6bSBaptiste Daroussin }
14661d06d6bSBaptiste Daroussin
14761d06d6bSBaptiste Daroussin void *
ohash_insert(struct ohash * h,unsigned int i,void * p)14861d06d6bSBaptiste Daroussin ohash_insert(struct ohash *h, unsigned int i, void *p)
14961d06d6bSBaptiste Daroussin {
15061d06d6bSBaptiste Daroussin #ifdef STATS_HASH
15161d06d6bSBaptiste Daroussin STAT_HASH_ENTRIES++;
15261d06d6bSBaptiste Daroussin #endif
15361d06d6bSBaptiste Daroussin if (h->t[i].p == DELETED) {
15461d06d6bSBaptiste Daroussin h->deleted--;
15561d06d6bSBaptiste Daroussin h->t[i].p = p;
15661d06d6bSBaptiste Daroussin } else {
15761d06d6bSBaptiste Daroussin h->t[i].p = p;
15861d06d6bSBaptiste Daroussin /* Arbitrary resize boundary. Tweak if not efficient enough. */
15961d06d6bSBaptiste Daroussin if (++h->total * 4 > h->size * 3)
16061d06d6bSBaptiste Daroussin ohash_resize(h);
16161d06d6bSBaptiste Daroussin }
16261d06d6bSBaptiste Daroussin return p;
16361d06d6bSBaptiste Daroussin }
16461d06d6bSBaptiste Daroussin
16561d06d6bSBaptiste Daroussin unsigned int
ohash_entries(struct ohash * h)16661d06d6bSBaptiste Daroussin ohash_entries(struct ohash *h)
16761d06d6bSBaptiste Daroussin {
16861d06d6bSBaptiste Daroussin return h->total - h->deleted;
16961d06d6bSBaptiste Daroussin }
17061d06d6bSBaptiste Daroussin
/*
 * Start an iteration over h: reset *pos to 0 and return the first live
 * entry, or NULL if the table holds none.  Continue with ohash_next()
 * using the same pos.
 */
void *
ohash_first(struct ohash *h, unsigned int *pos)
{
	*pos = 0;
	return ohash_next(h, pos);
}
17761d06d6bSBaptiste Daroussin
17861d06d6bSBaptiste Daroussin void *
ohash_next(struct ohash * h,unsigned int * pos)17961d06d6bSBaptiste Daroussin ohash_next(struct ohash *h, unsigned int *pos)
18061d06d6bSBaptiste Daroussin {
18161d06d6bSBaptiste Daroussin for (; *pos < h->size; (*pos)++)
18261d06d6bSBaptiste Daroussin if (h->t[*pos].p != DELETED && h->t[*pos].p != NULL)
18361d06d6bSBaptiste Daroussin return (void *)h->t[(*pos)++].p;
18461d06d6bSBaptiste Daroussin return NULL;
18561d06d6bSBaptiste Daroussin }
18661d06d6bSBaptiste Daroussin
18761d06d6bSBaptiste Daroussin void
ohash_init(struct ohash * h,unsigned int size,struct ohash_info * info)18861d06d6bSBaptiste Daroussin ohash_init(struct ohash *h, unsigned int size, struct ohash_info *info)
18961d06d6bSBaptiste Daroussin {
19061d06d6bSBaptiste Daroussin h->size = 1UL << size;
19161d06d6bSBaptiste Daroussin if (h->size < MINSIZE)
19261d06d6bSBaptiste Daroussin h->size = MINSIZE;
19361d06d6bSBaptiste Daroussin #ifdef STATS_HASH
19461d06d6bSBaptiste Daroussin STAT_HASH_CREATION++;
19561d06d6bSBaptiste Daroussin STAT_HASH_SIZE += h->size;
19661d06d6bSBaptiste Daroussin #endif
19761d06d6bSBaptiste Daroussin /* Copy info so that caller may free it. */
19861d06d6bSBaptiste Daroussin h->info.key_offset = info->key_offset;
19961d06d6bSBaptiste Daroussin h->info.calloc = info->calloc;
20061d06d6bSBaptiste Daroussin h->info.free = info->free;
20161d06d6bSBaptiste Daroussin h->info.alloc = info->alloc;
20261d06d6bSBaptiste Daroussin h->info.data = info->data;
20361d06d6bSBaptiste Daroussin h->t = (h->info.calloc)(h->size, sizeof(struct _ohash_record),
20461d06d6bSBaptiste Daroussin h->info.data);
20561d06d6bSBaptiste Daroussin h->total = h->deleted = 0;
20661d06d6bSBaptiste Daroussin }
20761d06d6bSBaptiste Daroussin
/*
 * Compute the 32-bit hash of the byte range [s, *e).
 *
 * If *e is NULL, the range is the NUL-terminated string at s, and *e is
 * updated to point at its terminator.  The hash starts as the first
 * byte (0 for an empty range); every further byte is XORed in after
 * rotating the accumulator left by two bits.
 *
 * Bytes are read through plain char, so for bytes above 0x7f the result
 * depends on whether char is signed on the platform.
 */
uint32_t
ohash_interval(const char *s, const char **e)
{
	uint32_t	 k;

	if (!*e)
		*e = s + strlen(s);
	if (s == *e)
		k = 0;
	else
		k = *s++;
	while (s != *e)
		k = ((k << 2) | (k >> 30)) ^ *s++;
	return k;
}
22361d06d6bSBaptiste Daroussin
22461d06d6bSBaptiste Daroussin unsigned int
ohash_lookup_interval(struct ohash * h,const char * start,const char * end,uint32_t hv)22561d06d6bSBaptiste Daroussin ohash_lookup_interval(struct ohash *h, const char *start, const char *end,
22661d06d6bSBaptiste Daroussin uint32_t hv)
22761d06d6bSBaptiste Daroussin {
22861d06d6bSBaptiste Daroussin unsigned int i, incr;
22961d06d6bSBaptiste Daroussin unsigned int empty;
23061d06d6bSBaptiste Daroussin
23161d06d6bSBaptiste Daroussin #ifdef STATS_HASH
23261d06d6bSBaptiste Daroussin STAT_HASH_LOOKUP++;
23361d06d6bSBaptiste Daroussin #endif
23461d06d6bSBaptiste Daroussin empty = NONE;
23561d06d6bSBaptiste Daroussin i = hv % h->size;
23661d06d6bSBaptiste Daroussin incr = ((hv % (h->size-2)) & ~1) + 1;
23761d06d6bSBaptiste Daroussin while (h->t[i].p != NULL) {
23861d06d6bSBaptiste Daroussin #ifdef STATS_HASH
23961d06d6bSBaptiste Daroussin STAT_HASH_LENGTH++;
24061d06d6bSBaptiste Daroussin #endif
24161d06d6bSBaptiste Daroussin if (h->t[i].p == DELETED) {
24261d06d6bSBaptiste Daroussin if (empty == NONE)
24361d06d6bSBaptiste Daroussin empty = i;
24461d06d6bSBaptiste Daroussin } else if (h->t[i].hv == hv &&
24561d06d6bSBaptiste Daroussin strncmp(h->t[i].p+h->info.key_offset, start,
24661d06d6bSBaptiste Daroussin end - start) == 0 &&
24761d06d6bSBaptiste Daroussin (h->t[i].p+h->info.key_offset)[end-start] == '\0') {
24861d06d6bSBaptiste Daroussin if (empty != NONE) {
24961d06d6bSBaptiste Daroussin h->t[empty].hv = hv;
25061d06d6bSBaptiste Daroussin h->t[empty].p = h->t[i].p;
25161d06d6bSBaptiste Daroussin h->t[i].p = DELETED;
25261d06d6bSBaptiste Daroussin return empty;
25361d06d6bSBaptiste Daroussin } else {
25461d06d6bSBaptiste Daroussin #ifdef STATS_HASH
25561d06d6bSBaptiste Daroussin STAT_HASH_POSITIVE++;
25661d06d6bSBaptiste Daroussin #endif
25761d06d6bSBaptiste Daroussin return i;
25861d06d6bSBaptiste Daroussin }
25961d06d6bSBaptiste Daroussin }
26061d06d6bSBaptiste Daroussin i += incr;
26161d06d6bSBaptiste Daroussin if (i >= h->size)
26261d06d6bSBaptiste Daroussin i -= h->size;
26361d06d6bSBaptiste Daroussin }
26461d06d6bSBaptiste Daroussin
26561d06d6bSBaptiste Daroussin /* Found an empty position. */
26661d06d6bSBaptiste Daroussin if (empty != NONE)
26761d06d6bSBaptiste Daroussin i = empty;
26861d06d6bSBaptiste Daroussin h->t[i].hv = hv;
26961d06d6bSBaptiste Daroussin return i;
27061d06d6bSBaptiste Daroussin }
27161d06d6bSBaptiste Daroussin
27261d06d6bSBaptiste Daroussin unsigned int
ohash_lookup_memory(struct ohash * h,const char * k,size_t size,uint32_t hv)27361d06d6bSBaptiste Daroussin ohash_lookup_memory(struct ohash *h, const char *k, size_t size, uint32_t hv)
27461d06d6bSBaptiste Daroussin {
27561d06d6bSBaptiste Daroussin unsigned int i, incr;
27661d06d6bSBaptiste Daroussin unsigned int empty;
27761d06d6bSBaptiste Daroussin
27861d06d6bSBaptiste Daroussin #ifdef STATS_HASH
27961d06d6bSBaptiste Daroussin STAT_HASH_LOOKUP++;
28061d06d6bSBaptiste Daroussin #endif
28161d06d6bSBaptiste Daroussin empty = NONE;
28261d06d6bSBaptiste Daroussin i = hv % h->size;
28361d06d6bSBaptiste Daroussin incr = ((hv % (h->size-2)) & ~1) + 1;
28461d06d6bSBaptiste Daroussin while (h->t[i].p != NULL) {
28561d06d6bSBaptiste Daroussin #ifdef STATS_HASH
28661d06d6bSBaptiste Daroussin STAT_HASH_LENGTH++;
28761d06d6bSBaptiste Daroussin #endif
28861d06d6bSBaptiste Daroussin if (h->t[i].p == DELETED) {
28961d06d6bSBaptiste Daroussin if (empty == NONE)
29061d06d6bSBaptiste Daroussin empty = i;
29161d06d6bSBaptiste Daroussin } else if (h->t[i].hv == hv &&
29261d06d6bSBaptiste Daroussin memcmp(h->t[i].p+h->info.key_offset, k, size) == 0) {
29361d06d6bSBaptiste Daroussin if (empty != NONE) {
29461d06d6bSBaptiste Daroussin h->t[empty].hv = hv;
29561d06d6bSBaptiste Daroussin h->t[empty].p = h->t[i].p;
29661d06d6bSBaptiste Daroussin h->t[i].p = DELETED;
29761d06d6bSBaptiste Daroussin return empty;
29861d06d6bSBaptiste Daroussin } else {
29961d06d6bSBaptiste Daroussin #ifdef STATS_HASH
30061d06d6bSBaptiste Daroussin STAT_HASH_POSITIVE++;
30161d06d6bSBaptiste Daroussin #endif
30261d06d6bSBaptiste Daroussin } return i;
30361d06d6bSBaptiste Daroussin }
30461d06d6bSBaptiste Daroussin i += incr;
30561d06d6bSBaptiste Daroussin if (i >= h->size)
30661d06d6bSBaptiste Daroussin i -= h->size;
30761d06d6bSBaptiste Daroussin }
30861d06d6bSBaptiste Daroussin
30961d06d6bSBaptiste Daroussin /* Found an empty position. */
31061d06d6bSBaptiste Daroussin if (empty != NONE)
31161d06d6bSBaptiste Daroussin i = empty;
31261d06d6bSBaptiste Daroussin h->t[i].hv = hv;
31361d06d6bSBaptiste Daroussin return i;
31461d06d6bSBaptiste Daroussin }
31561d06d6bSBaptiste Daroussin
/*
 * Look up the NUL-terminated string s in h, computing its hash value
 * here.  Returns the slot index produced by ohash_qlookupi().
 */
unsigned int
ohash_qlookup(struct ohash *h, const char *s)
{
	/* A NULL end pointer makes the callee measure the string itself. */
	const char *e = NULL;
	return ohash_qlookupi(h, s, &e);
}
32261d06d6bSBaptiste Daroussin
/*
 * Look up the key [s, *e) in h, computing its hash value here.
 *
 * If *e is NULL on entry, ohash_interval() sets it to the end of the
 * NUL-terminated string at s.  Returns the slot index produced by
 * ohash_lookup_interval().
 */
unsigned int
ohash_qlookupi(struct ohash *h, const char *s, const char **e)
{
	uint32_t	hv;

	hv = ohash_interval(s, e);
	return ohash_lookup_interval(h, s, *e, hv);
}
331