1 /* Copyright 2002 Christopher Clark */
2 /* Copyright 2005-2012 Nick Mathewson */
3 /* Copyright 2009-2012 Niels Provos and Nick Mathewson */
4 /* See license at end. */
5
6 /* Based on ideas by Christopher Clark and interfaces from Niels Provos. */
7
8 #ifndef HT_INTERNAL_H_INCLUDED_
9 #define HT_INTERNAL_H_INCLUDED_
10
11 #define HT_HEAD(name, type) \
12 struct name { \
13 /* The hash table itself. */ \
14 struct type **hth_table; \
15 /* How long is the hash table? */ \
16 unsigned hth_table_length; \
17 /* How many elements does the table contain? */ \
18 unsigned hth_n_entries; \
19 /* How many elements will we allow in the table before resizing it? */ \
20 unsigned hth_load_limit; \
21 /* Position of hth_table_length in the primes table. */ \
22 int hth_prime_idx; \
23 }
24
25 #define HT_INITIALIZER() \
26 { NULL, 0, 0, 0, -1 }
27
28 #ifdef HT_NO_CACHE_HASH_VALUES
29 #define HT_ENTRY(type) \
30 struct { \
31 struct type *hte_next; \
32 }
33 #else
34 #define HT_ENTRY(type) \
35 struct { \
36 struct type *hte_next; \
37 unsigned hte_hash; \
38 }
39 #endif
40
41 #define HT_EMPTY(head) \
42 ((head)->hth_n_entries == 0)
43
44 /* How many elements in 'head'? */
45 #define HT_SIZE(head) \
46 ((head)->hth_n_entries)
47
48 /* Return memory usage for a hashtable (not counting the entries themselves) */
49 #define HT_MEM_USAGE(head) \
50 (sizeof(*head) + (head)->hth_table_length * sizeof(void*))
51
52 #define HT_FIND(name, head, elm) name##_HT_FIND((head), (elm))
53 #define HT_INSERT(name, head, elm) name##_HT_INSERT((head), (elm))
54 #define HT_REPLACE(name, head, elm) name##_HT_REPLACE((head), (elm))
55 #define HT_REMOVE(name, head, elm) name##_HT_REMOVE((head), (elm))
56 #define HT_START(name, head) name##_HT_START(head)
57 #define HT_NEXT(name, head, elm) name##_HT_NEXT((head), (elm))
58 #define HT_NEXT_RMV(name, head, elm) name##_HT_NEXT_RMV((head), (elm))
59 #define HT_CLEAR(name, head) name##_HT_CLEAR(head)
60 #define HT_INIT(name, head) name##_HT_INIT(head)
61 /* Helper: */
62 static inline unsigned
ht_improve_hash_(unsigned h)63 ht_improve_hash_(unsigned h)
64 {
65 /* Aim to protect against poor hash functions by adding logic here
66 * - logic taken from java 1.4 hashtable source */
67 h += ~(h << 9);
68 h ^= ((h >> 14) | (h << 18)); /* >>> */
69 h += (h << 4);
70 h ^= ((h >> 10) | (h << 22)); /* >>> */
71 return h;
72 }
73
74 #if 0
75 /** Basic string hash function, from Java standard String.hashCode(). */
76 static inline unsigned
77 ht_string_hash_(const char *s)
78 {
79 unsigned h = 0;
80 int m = 1;
81 while (*s) {
82 h += ((signed char)*s++)*m;
83 m = (m<<5)-1; /* m *= 31 */
84 }
85 return h;
86 }
87 #endif
88
89 /** Basic string hash function, from Python's str.__hash__() */
90 static inline unsigned
ht_string_hash_(const char * s)91 ht_string_hash_(const char *s)
92 {
93 unsigned h;
94 const unsigned char *cp = (const unsigned char *)s;
95 h = *cp << 7;
96 while (*cp) {
97 h = (1000003*h) ^ *cp++;
98 }
99 /* This conversion truncates the length of the string, but that's ok. */
100 h ^= (unsigned)(cp-(const unsigned char*)s);
101 return h;
102 }
103
104 #ifndef HT_NO_CACHE_HASH_VALUES
105 #define HT_SET_HASH_(elm, field, hashfn) \
106 do { (elm)->field.hte_hash = hashfn(elm); } while (0)
107 #define HT_SET_HASHVAL_(elm, field, val) \
108 do { (elm)->field.hte_hash = (val); } while (0)
109 #define HT_ELT_HASH_(elm, field, hashfn) \
110 ((elm)->field.hte_hash)
111 #else
112 #define HT_SET_HASH_(elm, field, hashfn) \
113 ((void)0)
114 #define HT_ELT_HASH_(elm, field, hashfn) \
115 (hashfn(elm))
116 #define HT_SET_HASHVAL_(elm, field, val) \
117 ((void)0)
118 #endif
119
120 /* Helper: alias for the bucket containing 'elm'. */
121 #define HT_BUCKET_(head, field, elm, hashfn) \
122 ((head)->hth_table[HT_ELT_HASH_(elm,field,hashfn) % head->hth_table_length])
123
124 #define HT_FOREACH(x, name, head) \
125 for ((x) = HT_START(name, head); \
126 (x) != NULL; \
127 (x) = HT_NEXT(name, head, x))
128
129 #define HT_PROTOTYPE(name, type, field, hashfn, eqfn) \
130 int name##_HT_GROW(struct name *ht, unsigned min_capacity); \
131 void name##_HT_CLEAR(struct name *ht); \
132 int name##_HT_REP_IS_BAD_(const struct name *ht); \
133 static inline void \
134 name##_HT_INIT(struct name *head) { \
135 head->hth_table_length = 0; \
136 head->hth_table = NULL; \
137 head->hth_n_entries = 0; \
138 head->hth_load_limit = 0; \
139 head->hth_prime_idx = -1; \
140 } \
141 /* Helper: returns a pointer to the right location in the table \
142 * 'head' to find or insert the element 'elm'. */ \
143 static inline struct type ** \
144 name##_HT_FIND_P_(struct name *head, struct type *elm) \
145 { \
146 struct type **p; \
147 if (!head->hth_table) \
148 return NULL; \
149 p = &HT_BUCKET_(head, field, elm, hashfn); \
150 while (*p) { \
151 if (eqfn(*p, elm)) \
152 return p; \
153 p = &(*p)->field.hte_next; \
154 } \
155 return p; \
156 } \
157 /* Return a pointer to the element in the table 'head' matching 'elm', \
158 * or NULL if no such element exists */ \
159 static inline struct type * \
160 name##_HT_FIND(const struct name *head, struct type *elm) \
161 { \
162 struct type **p; \
163 struct name *h = (struct name *) head; \
164 HT_SET_HASH_(elm, field, hashfn); \
165 p = name##_HT_FIND_P_(h, elm); \
166 return p ? *p : NULL; \
167 } \
168 /* Insert the element 'elm' into the table 'head'. Do not call this \
169 * function if the table might already contain a matching element. */ \
170 static inline void \
171 name##_HT_INSERT(struct name *head, struct type *elm) \
172 { \
173 struct type **p; \
174 if (!head->hth_table || head->hth_n_entries >= head->hth_load_limit) \
175 name##_HT_GROW(head, head->hth_n_entries+1); \
176 ++head->hth_n_entries; \
177 HT_SET_HASH_(elm, field, hashfn); \
178 p = &HT_BUCKET_(head, field, elm, hashfn); \
179 elm->field.hte_next = *p; \
180 *p = elm; \
181 } \
182 /* Insert the element 'elm' into the table 'head'. If there already \
183 * a matching element in the table, replace that element and return \
184 * it. */ \
185 static inline struct type * \
186 name##_HT_REPLACE(struct name *head, struct type *elm) \
187 { \
188 struct type **p, *r; \
189 if (!head->hth_table || head->hth_n_entries >= head->hth_load_limit) \
190 name##_HT_GROW(head, head->hth_n_entries+1); \
191 HT_SET_HASH_(elm, field, hashfn); \
192 p = name##_HT_FIND_P_(head, elm); \
193 r = *p; \
194 *p = elm; \
195 if (r && (r!=elm)) { \
196 elm->field.hte_next = r->field.hte_next; \
197 r->field.hte_next = NULL; \
198 return r; \
199 } else { \
200 ++head->hth_n_entries; \
201 return NULL; \
202 } \
203 } \
204 /* Remove any element matching 'elm' from the table 'head'. If such \
205 * an element is found, return it; otherwise return NULL. */ \
206 static inline struct type * \
207 name##_HT_REMOVE(struct name *head, struct type *elm) \
208 { \
209 struct type **p, *r; \
210 HT_SET_HASH_(elm, field, hashfn); \
211 p = name##_HT_FIND_P_(head,elm); \
212 if (!p || !*p) \
213 return NULL; \
214 r = *p; \
215 *p = r->field.hte_next; \
216 r->field.hte_next = NULL; \
217 --head->hth_n_entries; \
218 return r; \
219 } \
220 /* Invoke the function 'fn' on every element of the table 'head', \
221 * using 'data' as its second argument. If the function returns \
222 * nonzero, remove the most recently examined element before invoking \
223 * the function again. */ \
224 static inline void \
225 name##_HT_FOREACH_FN(struct name *head, \
226 int (*fn)(struct type *, void *), \
227 void *data) \
228 { \
229 unsigned idx; \
230 struct type **p, **nextp, *next; \
231 if (!head->hth_table) \
232 return; \
233 for (idx=0; idx < head->hth_table_length; ++idx) { \
234 p = &head->hth_table[idx]; \
235 while (*p) { \
236 nextp = &(*p)->field.hte_next; \
237 next = *nextp; \
238 if (fn(*p, data)) { \
239 --head->hth_n_entries; \
240 *p = next; \
241 } else { \
242 p = nextp; \
243 } \
244 } \
245 } \
246 } \
247 /* Return a pointer to the first element in the table 'head', under \
248 * an arbitrary order. This order is stable under remove operations, \
249 * but not under others. If the table is empty, return NULL. */ \
250 static inline struct type ** \
251 name##_HT_START(struct name *head) \
252 { \
253 unsigned b = 0; \
254 while (b < head->hth_table_length) { \
255 if (head->hth_table[b]) \
256 return &head->hth_table[b]; \
257 ++b; \
258 } \
259 return NULL; \
260 } \
261 /* Return the next element in 'head' after 'elm', under the arbitrary \
262 * order used by HT_START. If there are no more elements, return \
263 * NULL. If 'elm' is to be removed from the table, you must call \
264 * this function for the next value before you remove it. \
265 */ \
266 static inline struct type ** \
267 name##_HT_NEXT(struct name *head, struct type **elm) \
268 { \
269 if ((*elm)->field.hte_next) { \
270 return &(*elm)->field.hte_next; \
271 } else { \
272 unsigned b = (HT_ELT_HASH_(*elm, field, hashfn) % head->hth_table_length)+1; \
273 while (b < head->hth_table_length) { \
274 if (head->hth_table[b]) \
275 return &head->hth_table[b]; \
276 ++b; \
277 } \
278 return NULL; \
279 } \
280 } \
281 static inline struct type ** \
282 name##_HT_NEXT_RMV(struct name *head, struct type **elm) \
283 { \
284 unsigned h = HT_ELT_HASH_(*elm, field, hashfn); \
285 *elm = (*elm)->field.hte_next; \
286 --head->hth_n_entries; \
287 if (*elm) { \
288 return elm; \
289 } else { \
290 unsigned b = (h % head->hth_table_length)+1; \
291 while (b < head->hth_table_length) { \
292 if (head->hth_table[b]) \
293 return &head->hth_table[b]; \
294 ++b; \
295 } \
296 return NULL; \
297 } \
298 }
299
300 #define HT_GENERATE(name, type, field, hashfn, eqfn, load, mallocfn, \
301 reallocfn, freefn) \
302 static unsigned name##_PRIMES[] = { \
303 53, 97, 193, 389, \
304 769, 1543, 3079, 6151, \
305 12289, 24593, 49157, 98317, \
306 196613, 393241, 786433, 1572869, \
307 3145739, 6291469, 12582917, 25165843, \
308 50331653, 100663319, 201326611, 402653189, \
309 805306457, 1610612741 \
310 }; \
311 static unsigned name##_N_PRIMES = \
312 (unsigned)(sizeof(name##_PRIMES)/sizeof(name##_PRIMES[0])); \
313 /* Expand the internal table of 'head' until it is large enough to \
314 * hold 'size' elements. Return 0 on success, -1 on allocation \
315 * failure. */ \
316 int \
317 name##_HT_GROW(struct name *head, unsigned size) \
318 { \
319 unsigned new_len, new_load_limit; \
320 int prime_idx; \
321 struct type **new_table; \
322 if (head->hth_prime_idx == (int)name##_N_PRIMES - 1) \
323 return 0; \
324 if (head->hth_load_limit > size) \
325 return 0; \
326 prime_idx = head->hth_prime_idx; \
327 do { \
328 new_len = name##_PRIMES[++prime_idx]; \
329 new_load_limit = (unsigned)(load*new_len); \
330 } while (new_load_limit <= size && \
331 prime_idx < (int)name##_N_PRIMES); \
332 if ((new_table = mallocfn(new_len*sizeof(struct type*)))) { \
333 unsigned b; \
334 memset(new_table, 0, new_len*sizeof(struct type*)); \
335 for (b = 0; b < head->hth_table_length; ++b) { \
336 struct type *elm, *next; \
337 unsigned b2; \
338 elm = head->hth_table[b]; \
339 while (elm) { \
340 next = elm->field.hte_next; \
341 b2 = HT_ELT_HASH_(elm, field, hashfn) % new_len; \
342 elm->field.hte_next = new_table[b2]; \
343 new_table[b2] = elm; \
344 elm = next; \
345 } \
346 } \
347 if (head->hth_table) \
348 freefn(head->hth_table); \
349 head->hth_table = new_table; \
350 } else { \
351 unsigned b, b2; \
352 new_table = reallocfn(head->hth_table, new_len*sizeof(struct type*)); \
353 if (!new_table) return -1; \
354 memset(new_table + head->hth_table_length, 0, \
355 (new_len - head->hth_table_length)*sizeof(struct type*)); \
356 for (b=0; b < head->hth_table_length; ++b) { \
357 struct type *e, **pE; \
358 for (pE = &new_table[b], e = *pE; e != NULL; e = *pE) { \
359 b2 = HT_ELT_HASH_(e, field, hashfn) % new_len; \
360 if (b2 == b) { \
361 pE = &e->field.hte_next; \
362 } else { \
363 *pE = e->field.hte_next; \
364 e->field.hte_next = new_table[b2]; \
365 new_table[b2] = e; \
366 } \
367 } \
368 } \
369 head->hth_table = new_table; \
370 } \
371 head->hth_table_length = new_len; \
372 head->hth_prime_idx = prime_idx; \
373 head->hth_load_limit = new_load_limit; \
374 return 0; \
375 } \
376 /* Free all storage held by 'head'. Does not free 'head' itself, or \
377 * individual elements. */ \
378 void \
379 name##_HT_CLEAR(struct name *head) \
380 { \
381 if (head->hth_table) \
382 freefn(head->hth_table); \
383 name##_HT_INIT(head); \
384 } \
385 /* Debugging helper: return false iff the representation of 'head' is \
386 * internally consistent. */ \
387 int \
388 name##_HT_REP_IS_BAD_(const struct name *head) \
389 { \
390 unsigned n, i; \
391 struct type *elm; \
392 if (!head->hth_table_length) { \
393 if (!head->hth_table && !head->hth_n_entries && \
394 !head->hth_load_limit && head->hth_prime_idx == -1) \
395 return 0; \
396 else \
397 return 1; \
398 } \
399 if (!head->hth_table || head->hth_prime_idx < 0 || \
400 !head->hth_load_limit) \
401 return 2; \
402 if (head->hth_n_entries > head->hth_load_limit) \
403 return 3; \
404 if (head->hth_table_length != name##_PRIMES[head->hth_prime_idx]) \
405 return 4; \
406 if (head->hth_load_limit != (unsigned)(load*head->hth_table_length)) \
407 return 5; \
408 for (n = i = 0; i < head->hth_table_length; ++i) { \
409 for (elm = head->hth_table[i]; elm; elm = elm->field.hte_next) { \
410 if (HT_ELT_HASH_(elm, field, hashfn) != hashfn(elm)) \
411 return 1000 + i; \
412 if ((HT_ELT_HASH_(elm, field, hashfn) % head->hth_table_length) != i) \
413 return 10000 + i; \
414 ++n; \
415 } \
416 } \
417 if (n != head->hth_n_entries) \
418 return 6; \
419 return 0; \
420 }
421
422 /** Implements an over-optimized "find and insert if absent" block;
423 * not meant for direct usage by typical code, or usage outside the critical
424 * path.*/
425 #define HT_FIND_OR_INSERT_(name, field, hashfn, head, eltype, elm, var, y, n) \
426 { \
427 struct name *var##_head_ = head; \
428 struct eltype **var; \
429 if (!var##_head_->hth_table || \
430 var##_head_->hth_n_entries >= var##_head_->hth_load_limit) \
431 name##_HT_GROW(var##_head_, var##_head_->hth_n_entries+1); \
432 HT_SET_HASH_((elm), field, hashfn); \
433 var = name##_HT_FIND_P_(var##_head_, (elm)); \
434 if (*var) { \
435 y; \
436 } else { \
437 n; \
438 } \
439 }
440 #define HT_FOI_INSERT_(field, head, elm, newent, var) \
441 { \
442 HT_SET_HASHVAL_(newent, field, (elm)->field.hte_hash); \
443 newent->field.hte_next = NULL; \
444 *var = newent; \
445 ++((head)->hth_n_entries); \
446 }
447
448 /*
449 * Copyright 2005, Nick Mathewson. Implementation logic is adapted from code
450 * by Christopher Clark, retrofit to allow drop-in memory management, and to
451 * use the same interface as Niels Provos's tree.h. This is probably still
452 * a derived work, so the original license below still applies.
453 *
454 * Copyright (c) 2002, Christopher Clark
455 * All rights reserved.
456 *
457 * Redistribution and use in source and binary forms, with or without
458 * modification, are permitted provided that the following conditions
459 * are met:
460 *
461 * * Redistributions of source code must retain the above copyright
462 * notice, this list of conditions and the following disclaimer.
463 *
464 * * Redistributions in binary form must reproduce the above copyright
465 * notice, this list of conditions and the following disclaimer in the
466 * documentation and/or other materials provided with the distribution.
467 *
468 * * Neither the name of the original author; nor the names of any contributors
469 * may be used to endorse or promote products derived from this software
470 * without specific prior written permission.
471 *
472 *
473 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
474 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
475 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
476 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
477 * OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
478 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
479 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
480 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
481 * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
482 * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
483 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
484 */
485
486 #endif
487
488