1 bbcba3ed 2022-01-10 op /* $OpenBSD: ohash.c,v 1.1 2014/06/02 18:52:03 deraadt Exp $ */
3 bbcba3ed 2022-01-10 op /* Copyright (c) 1999, 2004 Marc Espie <espie@openbsd.org>
5 bbcba3ed 2022-01-10 op * Permission to use, copy, modify, and distribute this software for any
6 bbcba3ed 2022-01-10 op * purpose with or without fee is hereby granted, provided that the above
7 bbcba3ed 2022-01-10 op * copyright notice and this permission notice appear in all copies.
9 bbcba3ed 2022-01-10 op * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10 bbcba3ed 2022-01-10 op * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11 bbcba3ed 2022-01-10 op * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12 bbcba3ed 2022-01-10 op * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13 bbcba3ed 2022-01-10 op * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14 bbcba3ed 2022-01-10 op * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15 bbcba3ed 2022-01-10 op * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18 bbcba3ed 2022-01-10 op #include "compat.h"
20 bbcba3ed 2022-01-10 op #include <stddef.h>
21 bbcba3ed 2022-01-10 op #include <stdint.h>
22 bbcba3ed 2022-01-10 op #include <stdlib.h>
23 bbcba3ed 2022-01-10 op #include <string.h>
24 bbcba3ed 2022-01-10 op #include <limits.h>
25 bbcba3ed 2022-01-10 op #include "ohash.h"
/*
 * One slot of the table array h->t.  Besides p, the code in this file also
 * reads and writes a per-slot hash value through a member named hv
 * (for example h->t[i].hv).
 * NOTE(review): the declaration of hv and the closing brace of this struct
 * are not among the lines shown in this listing.
 */
27 bbcba3ed 2022-01-10 op struct _ohash_record {
/* Pointer to the stored entry; NULL or DELETED mean the slot holds no live entry. */
29 bbcba3ed 2022-01-10 op const char *p;
/*
 * Slot marker for a removed entry: the address of the table header itself,
 * cast to the type of the slot pointer.  The macro expands to the identifier
 * h, so it can only be used where a variable of that name is in scope.
 */
32 bbcba3ed 2022-01-10 op #define DELETED ((const char *)h)
/*
 * Sentinel index meaning no slot, used for the empty variable of the lookup
 * functions.  It is h->size, which the loops in this file treat as one past
 * the last slot.  Also relies on a variable named h being in scope.
 */
33 bbcba3ed 2022-01-10 op #define NONE (h->size)
35 bbcba3ed 2022-01-10 op /* Don't bother changing the hash table if the change is small enough. */
/* Lower bound applied to the number of slots (16). */
36 bbcba3ed 2022-01-10 op #define MINSIZE (1UL << 4)
/* ohash_remove only considers a resize once at least this many slots are DELETED. */
37 bbcba3ed 2022-01-10 op #define MINDELETED 4
/* File-local helper that rebuilds the slot array at a new size. */
39 bbcba3ed 2022-01-10 op static void ohash_resize(struct ohash *);
/*
 * ohash_create_entry: build a new record for the key that starts at start
 * and ends just before *end.
 *
 * Visible steps: *end is assigned start + strlen(start); a buffer of
 * key_offset + key length + 1 bytes is requested from the alloc callback in
 * i (with i->data passed along); the key bytes are copied to offset
 * key_offset of that buffer and a terminating NUL is written right after
 * them; the buffer is returned as void *.  The visible statements write
 * nothing in front of key_offset.
 *
 * NOTE(review): this listing omits some lines of the function (return type,
 * braces, the declaration of p, and whatever guards the strlen assignment
 * and the copy).  Presumably *end is only computed when the caller passed
 * NULL and the copy is skipped when allocation fails; confirm against the
 * full file.
 */
42 bbcba3ed 2022-01-10 op /* This handles the common case of variable length keys, where the
43 bbcba3ed 2022-01-10 op * key is stored at the end of the record.
46 bbcba3ed 2022-01-10 op ohash_create_entry(struct ohash_info *i, const char *start, const char **end)
51 bbcba3ed 2022-01-10 op *end = start + strlen(start);
52 bbcba3ed 2022-01-10 op p = (i->alloc)(i->key_offset + (*end - start) + 1, i->data);
54 bbcba3ed 2022-01-10 op memcpy(p+i->key_offset, start, *end-start);
55 bbcba3ed 2022-01-10 op p[i->key_offset + (*end - start)] = '\0';
57 bbcba3ed 2022-01-10 op return (void *)p;
60 bbcba3ed 2022-01-10 op /* ohash_delete only frees the hash table's slot array (h->t). Use
61 bbcba3ed 2022-01-10 op * ohash_first/ohash_next to free entries as well. */
63 bbcba3ed 2022-01-10 op ohash_delete(struct ohash *h)
/* Release the slot array through the free callback kept in h->info, passing h->info.data along. */
65 bbcba3ed 2022-01-10 op (h->info.free)(h->t, h->info.data);
/* Section compiled only when NDEBUG is not defined; the guarded statement is not visible in this listing. */
66 bbcba3ed 2022-01-10 op #ifndef NDEBUG
/*
 * ohash_resize: move every live entry into a freshly allocated slot array of
 * a new size ns, leaving the DELETED markers behind.
 *
 * NOTE(review): this listing omits some lines of the function (braces, the
 * declaration of ns, else/return lines, the body of the probe loop, the
 * statement that installs the new array in h); the comments below describe
 * only the statements that are visible.
 */
72 bbcba3ed 2022-01-10 op ohash_resize(struct ohash *h)
74 bbcba3ed 2022-01-10 op struct _ohash_record *n;
76 bbcba3ed 2022-01-10 op unsigned int j;
77 bbcba3ed 2022-01-10 op unsigned int i, incr;
/* Fewer than a quarter of the used slots are DELETED: pick a larger size. */
79 bbcba3ed 2022-01-10 op if (4 * h->deleted < h->total) {
/* h->size is already at least half of UINT_MAX: use UINT_MAX rather than doubling. */
80 bbcba3ed 2022-01-10 op if (h->size >= (UINT_MAX >> 1U))
81 bbcba3ed 2022-01-10 op ns = UINT_MAX;
/* Double the size. */
83 bbcba3ed 2022-01-10 op ns = h->size << 1U;
/* More than two thirds of the used slots are DELETED: halve the size. */
84 bbcba3ed 2022-01-10 op } else if (3 * h->deleted > 2 * h->total)
85 bbcba3ed 2022-01-10 op ns = h->size >> 1U;
/* Lower bound on the new size; presumably ns is raised to MINSIZE here (statement not visible). */
88 bbcba3ed 2022-01-10 op if (ns < MINSIZE)
90 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
91 bbcba3ed 2022-01-10 op STAT_HASH_EXPAND++;
92 bbcba3ed 2022-01-10 op STAT_HASH_SIZE += ns - h->size;
/* New slot array from the calloc callback; the probe loop below relies on unused slots having p == NULL. */
95 bbcba3ed 2022-01-10 op n = (h->info.calloc)(ns, sizeof(struct _ohash_record), h->info.data);
/* Walk the old array and re-insert each live slot (neither NULL nor DELETED). */
99 bbcba3ed 2022-01-10 op for (j = 0; j < h->size; j++) {
100 bbcba3ed 2022-01-10 op if (h->t[j].p != NULL && h->t[j].p != DELETED) {
/* Same probing scheme as the lookup functions: start at hv % ns, with a step that (x & ~1) + 1 makes odd. */
101 bbcba3ed 2022-01-10 op i = h->t[j].hv % ns;
102 bbcba3ed 2022-01-10 op incr = ((h->t[j].hv % (ns - 2)) & ~1) + 1;
/* Skip slots that are already taken in the new array. */
103 bbcba3ed 2022-01-10 op while (n[i].p != NULL) {
/* Copy the stored hash value and the entry pointer into the new slot. */
108 bbcba3ed 2022-01-10 op n[i].hv = h->t[j].hv;
109 bbcba3ed 2022-01-10 op n[i].p = h->t[j].p;
/* Release the old slot array through the free callback. */
112 bbcba3ed 2022-01-10 op (h->info.free)(h->t, h->info.data);
114 bbcba3ed 2022-01-10 op h->size = ns;
/* DELETED slots were not copied, so they no longer count towards total. */
115 bbcba3ed 2022-01-10 op h->total -= h->deleted;
116 bbcba3ed 2022-01-10 op h->deleted = 0;
/*
 * ohash_remove: take the entry out of slot i and return the pointer that was
 * stored there.
 *
 * NOTE(review): some lines of this function (return type, braces, the
 * statement run when the slot holds no entry, #endif) are missing from this
 * listing; the comments cover the visible statements only.
 */
120 bbcba3ed 2022-01-10 op ohash_remove(struct ohash *h, unsigned int i)
122 bbcba3ed 2022-01-10 op void *result = (void *)h->t[i].p;
/* Slot holds no live entry. */
124 bbcba3ed 2022-01-10 op if (result == NULL || result == DELETED)
127 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
128 bbcba3ed 2022-01-10 op STAT_HASH_ENTRIES--;
/*
 * Mark the slot DELETED instead of resetting it to NULL: the lookup loops in
 * this file stop probing at a NULL slot but continue past a DELETED one.
 */
130 bbcba3ed 2022-01-10 op h->t[i].p = DELETED;
131 bbcba3ed 2022-01-10 op h->deleted++;
/* Rebuild once there are at least MINDELETED markers and they exceed a quarter of total. */
132 bbcba3ed 2022-01-10 op if (h->deleted >= MINDELETED && 4 * h->deleted > h->total)
133 bbcba3ed 2022-01-10 op ohash_resize(h);
134 bbcba3ed 2022-01-10 op return result;
/*
 * ohash_find: return the entry pointer stored in slot i of the table.
 * NOTE(review): the statement executed when the slot is DELETED is not
 * visible in this listing; presumably it returns NULL -- confirm against the
 * full file.
 */
138 bbcba3ed 2022-01-10 op ohash_find(struct ohash *h, unsigned int i)
/* A DELETED marker is not an entry and is handled separately. */
140 bbcba3ed 2022-01-10 op if (h->t[i].p == DELETED)
143 bbcba3ed 2022-01-10 op return (void *)h->t[i].p;
/*
 * ohash_insert: store entry pointer p in slot i.  The visible statements
 * write only the p member of the slot; the hv member is written by the
 * lookup functions in this file.
 *
 * NOTE(review): braces, the else line, #endif and the return statement are
 * missing from this listing, so the exact scope of the two assignments and of
 * the resize check cannot be read from it.
 */
147 bbcba3ed 2022-01-10 op ohash_insert(struct ohash *h, unsigned int i, void *p)
149 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
150 bbcba3ed 2022-01-10 op STAT_HASH_ENTRIES++;
/* Reusing a DELETED slot: one marker fewer. */
152 bbcba3ed 2022-01-10 op if (h->t[i].p == DELETED) {
153 bbcba3ed 2022-01-10 op h->deleted--;
154 bbcba3ed 2022-01-10 op h->t[i].p = p;
156 bbcba3ed 2022-01-10 op h->t[i].p = p;
157 bbcba3ed 2022-01-10 op /* Arbitrary resize boundary. Tweak if not efficient enough. */
/* Count the newly used slot, then rebuild once total exceeds three quarters of size. */
158 bbcba3ed 2022-01-10 op if (++h->total * 4 > h->size * 3)
159 bbcba3ed 2022-01-10 op ohash_resize(h);
/*
 * ohash_entries: number of live entries, computed as total minus the slots
 * currently marked DELETED (ohash_remove bumps deleted without lowering
 * total).
 */
165 bbcba3ed 2022-01-10 op ohash_entries(struct ohash *h)
167 bbcba3ed 2022-01-10 op return h->total - h->deleted;
/*
 * ohash_first: start an iteration over the table; the search itself is
 * delegated to ohash_next with the same position cursor.
 * NOTE(review): no initialisation of *pos is visible in this listing;
 * presumably it is reset to 0 before the call -- confirm against the full
 * file.
 */
171 bbcba3ed 2022-01-10 op ohash_first(struct ohash *h, unsigned int *pos)
174 bbcba3ed 2022-01-10 op return ohash_next(h, pos);
/*
 * ohash_next: continue an iteration.  Scans forward from slot *pos for a slot
 * holding a live entry (neither DELETED nor NULL), returns that entry and
 * leaves *pos on the following slot so that the next call resumes there.
 * NOTE(review): the return taken once the scan reaches h->size is not visible
 * in this listing.
 */
178 bbcba3ed 2022-01-10 op ohash_next(struct ohash *h, unsigned int *pos)
180 bbcba3ed 2022-01-10 op for (; *pos < h->size; (*pos)++)
181 bbcba3ed 2022-01-10 op if (h->t[*pos].p != DELETED && h->t[*pos].p != NULL)
/* Post-increment: hand out this slot and step the cursor past it. */
182 bbcba3ed 2022-01-10 op return (void *)h->t[(*pos)++].p;
/*
 * ohash_init: set up table h with 2^size slots (at least MINSIZE), copy the
 * callbacks and settings from info, and allocate the slot array.
 *
 * NOTE(review): return type, braces and #endif are missing from this
 * listing; the comments cover the visible statements only.
 */
187 bbcba3ed 2022-01-10 op ohash_init(struct ohash *h, unsigned int size, struct ohash_info *info)
/*
 * size is an exponent, not a slot count.  NOTE(review): it is not range
 * checked here; a shift count at or above the width of unsigned long is
 * undefined behaviour in C.
 */
189 bbcba3ed 2022-01-10 op h->size = 1UL << size;
190 bbcba3ed 2022-01-10 op if (h->size < MINSIZE)
191 bbcba3ed 2022-01-10 op h->size = MINSIZE;
192 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
193 bbcba3ed 2022-01-10 op STAT_HASH_CREATION++;
194 bbcba3ed 2022-01-10 op STAT_HASH_SIZE += h->size;
196 bbcba3ed 2022-01-10 op /* Copy info so that caller may free it. */
197 bbcba3ed 2022-01-10 op h->info.key_offset = info->key_offset;
198 bbcba3ed 2022-01-10 op h->info.calloc = info->calloc;
199 bbcba3ed 2022-01-10 op h->info.free = info->free;
200 bbcba3ed 2022-01-10 op h->info.alloc = info->alloc;
201 bbcba3ed 2022-01-10 op h->info.data = info->data;
/*
 * Initial slot array, obtained through the supplied calloc callback.
 * NOTE(review): no check of the result is visible in this listing.
 */
202 bbcba3ed 2022-01-10 op h->t = (h->info.calloc)(h->size, sizeof(struct _ohash_record),
203 bbcba3ed 2022-01-10 op h->info.data);
/* Empty table: no used slots and no DELETED markers. */
204 bbcba3ed 2022-01-10 op h->total = h->deleted = 0;
/*
 * ohash_interval: compute the hash value of the key that starts at s and ends
 * just before *e.
 *
 * NOTE(review): the return type, the declaration and initial value of k, the
 * guard in front of the strlen assignment and the return statement are not
 * visible in this listing.
 */
208 bbcba3ed 2022-01-10 op ohash_interval(const char *s, const char **e)
/* End of key taken as the terminating NUL of s (guarding condition not visible; presumably only when *e is NULL). */
213 bbcba3ed 2022-01-10 op *e = s + strlen(s);
/*
 * For every remaining byte: combine k << 2 with k >> 30 (a rotation by two
 * bits if k is 32 bits wide -- presumably uint32_t, TODO confirm) and XOR in
 * the byte.  *s is a plain char, so bytes with the top bit set are promoted
 * according to the signedness of char on the platform.
 */
218 bbcba3ed 2022-01-10 op while (s != *e)
219 bbcba3ed 2022-01-10 op k = ((k << 2) | (k >> 30)) ^ *s++;
/*
 * ohash_lookup_interval: locate the slot for the key that starts at start and
 * ends just before end, given its hash value hv.
 *
 * A stored entry matches when its slot hash equals hv, the first end - start
 * bytes of its key (found at offset info.key_offset inside the entry) equal
 * the searched key, and the stored key is NUL-terminated right after them.
 *
 * Probing starts at hv % size and uses a step derived from hv that the
 * expression (x & ~1) + 1 makes odd; it ends at the first slot whose p is
 * NULL.
 *
 * NOTE(review): several lines are missing from this listing (the rest of the
 * parameter list, braces, #endif, the assignments to empty and i, the step
 * that advances i, the final return); the comments cover the visible
 * statements only.
 */
224 bbcba3ed 2022-01-10 op ohash_lookup_interval(struct ohash *h, const char *start, const char *end,
227 bbcba3ed 2022-01-10 op unsigned int i, incr;
228 bbcba3ed 2022-01-10 op unsigned int empty;
230 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
231 bbcba3ed 2022-01-10 op STAT_HASH_LOOKUP++;
/* No DELETED slot seen yet. */
233 bbcba3ed 2022-01-10 op empty = NONE;
234 bbcba3ed 2022-01-10 op i = hv % h->size;
235 bbcba3ed 2022-01-10 op incr = ((hv % (h->size-2)) & ~1) + 1;
236 bbcba3ed 2022-01-10 op while (h->t[i].p != NULL) {
237 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
238 bbcba3ed 2022-01-10 op STAT_HASH_LENGTH++;
/* DELETED slot: keep probing; presumably the first such slot is recorded in empty (assignment not visible). */
240 bbcba3ed 2022-01-10 op if (h->t[i].p == DELETED) {
241 bbcba3ed 2022-01-10 op if (empty == NONE)
/* Cheap hash comparison first, then the key bytes, then the terminator check. */
243 bbcba3ed 2022-01-10 op } else if (h->t[i].hv == hv &&
244 bbcba3ed 2022-01-10 op strncmp(h->t[i].p+h->info.key_offset, start,
245 bbcba3ed 2022-01-10 op end - start) == 0 &&
246 bbcba3ed 2022-01-10 op (h->t[i].p+h->info.key_offset)[end-start] == '\0') {
/*
 * Match found after passing a DELETED slot: move the entry into that earlier
 * slot and leave a DELETED marker where it was.  The number of DELETED slots
 * is unchanged by the swap.
 */
247 bbcba3ed 2022-01-10 op if (empty != NONE) {
248 bbcba3ed 2022-01-10 op h->t[empty].hv = hv;
249 bbcba3ed 2022-01-10 op h->t[empty].p = h->t[i].p;
250 bbcba3ed 2022-01-10 op h->t[i].p = DELETED;
251 bbcba3ed 2022-01-10 op return empty;
253 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
254 bbcba3ed 2022-01-10 op STAT_HASH_POSITIVE++;
/* Wrap the probe index around the end of the table. */
260 bbcba3ed 2022-01-10 op if (i >= h->size)
261 bbcba3ed 2022-01-10 op i -= h->size;
264 bbcba3ed 2022-01-10 op /* Found an empty position. */
/* A DELETED slot was met on the way; presumably it is preferred over the NULL slot (statement not visible). */
265 bbcba3ed 2022-01-10 op if (empty != NONE)
/* Store the hash value in the chosen slot now; ohash_insert only writes p. */
267 bbcba3ed 2022-01-10 op h->t[i].hv = hv;
/*
 * ohash_lookup_memory: locate the slot for a key given as size bytes at k,
 * with hash value hv.
 *
 * A stored entry matches when its slot hash equals hv and the size bytes at
 * offset info.key_offset inside the entry compare equal to k with memcmp; no
 * terminator is examined.
 *
 * Probing starts at hv % size and uses a step derived from hv that the
 * expression (x & ~1) + 1 makes odd; it ends at the first slot whose p is
 * NULL.
 *
 * NOTE(review): several lines are missing from this listing (return type,
 * braces, #endif, the assignments to empty and i, the step that advances i,
 * the final return); the comments cover the visible statements only.
 */
272 bbcba3ed 2022-01-10 op ohash_lookup_memory(struct ohash *h, const char *k, size_t size, uint32_t hv)
274 bbcba3ed 2022-01-10 op unsigned int i, incr;
275 bbcba3ed 2022-01-10 op unsigned int empty;
277 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
278 bbcba3ed 2022-01-10 op STAT_HASH_LOOKUP++;
/* No DELETED slot seen yet. */
280 bbcba3ed 2022-01-10 op empty = NONE;
281 bbcba3ed 2022-01-10 op i = hv % h->size;
282 bbcba3ed 2022-01-10 op incr = ((hv % (h->size-2)) & ~1) + 1;
283 bbcba3ed 2022-01-10 op while (h->t[i].p != NULL) {
284 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
285 bbcba3ed 2022-01-10 op STAT_HASH_LENGTH++;
/* DELETED slot: keep probing; presumably the first such slot is recorded in empty (assignment not visible). */
287 bbcba3ed 2022-01-10 op if (h->t[i].p == DELETED) {
288 bbcba3ed 2022-01-10 op if (empty == NONE)
/* Cheap hash comparison first, then the key bytes. */
290 bbcba3ed 2022-01-10 op } else if (h->t[i].hv == hv &&
291 bbcba3ed 2022-01-10 op memcmp(h->t[i].p+h->info.key_offset, k, size) == 0) {
/*
 * Match found after passing a DELETED slot: move the entry into that earlier
 * slot and leave a DELETED marker where it was.  The number of DELETED slots
 * is unchanged by the swap.
 */
292 bbcba3ed 2022-01-10 op if (empty != NONE) {
293 bbcba3ed 2022-01-10 op h->t[empty].hv = hv;
294 bbcba3ed 2022-01-10 op h->t[empty].p = h->t[i].p;
295 bbcba3ed 2022-01-10 op h->t[i].p = DELETED;
296 bbcba3ed 2022-01-10 op return empty;
298 bbcba3ed 2022-01-10 op #ifdef STATS_HASH
299 bbcba3ed 2022-01-10 op STAT_HASH_POSITIVE++;
/* Wrap the probe index around the end of the table. */
304 bbcba3ed 2022-01-10 op if (i >= h->size)
305 bbcba3ed 2022-01-10 op i -= h->size;
308 bbcba3ed 2022-01-10 op /* Found an empty position. */
/* A DELETED slot was met on the way; presumably it is preferred over the NULL slot (statement not visible). */
309 bbcba3ed 2022-01-10 op if (empty != NONE)
/* Store the hash value in the chosen slot now; ohash_insert only writes p. */
311 bbcba3ed 2022-01-10 op h->t[i].hv = hv;
/*
 * ohash_qlookup: convenience lookup for a key given as the C string s.
 * Calls ohash_qlookupi with a local end pointer that starts out as NULL and
 * returns whatever that call returns.
 */
316 bbcba3ed 2022-01-10 op ohash_qlookup(struct ohash *h, const char *s)
318 bbcba3ed 2022-01-10 op const char *e = NULL;
319 bbcba3ed 2022-01-10 op return ohash_qlookupi(h, s, &e);
/*
 * ohash_qlookupi: hash the key that starts at s with ohash_interval (which
 * receives e and may assign *e), then look up its slot with
 * ohash_lookup_interval using s, *e and the computed hash.
 * NOTE(review): the return type and the declaration of hv are not visible in
 * this listing.
 */
323 bbcba3ed 2022-01-10 op ohash_qlookupi(struct ohash *h, const char *s, const char **e)
327 bbcba3ed 2022-01-10 op hv = ohash_interval(s, e);
328 bbcba3ed 2022-01-10 op return ohash_lookup_interval(h, s, *e, hv);