]> git.saurik.com Git - apple/xnu.git/blob - libkern/kxld/kxld_dict.c
xnu-3247.1.106.tar.gz
[apple/xnu.git] / libkern / kxld / kxld_dict.c
1 /*
2 * Copyright (c) 2007-2008 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 #include <string.h>
29 #include <sys/types.h>
30
31 #define DEBUG_ASSERT_COMPONENT_NAME_STRING "kxld"
32 #include <AssertMacros.h>
33
34 #include "kxld_dict.h"
35 #include "kxld_util.h"
36
37 /*******************************************************************************
38 * Types and macros
39 *******************************************************************************/
40
41 /* Ratio of num_entries:num_buckets that will cause a resize */
42 #define RESIZE_NUMER 7
43 #define RESIZE_DENOM 10
44 #define RESIZE_THRESHOLD(x) (((x)*RESIZE_NUMER) / RESIZE_DENOM)
45 #define MIN_BUCKETS(x) (((x)*RESIZE_DENOM) / RESIZE_NUMER)
46
47 /* Selected for good scaling qualities when resizing dictionary
48 * ... see: http://www.concentric.net/~ttwang/tech/hashsize.htm
49 */
50 #define DEFAULT_DICT_SIZE 89
51
52 typedef struct dict_entry DictEntry;
53
54 typedef enum {
55 EMPTY = 0,
56 USED = 1,
57 DELETED = 2
58 } DictEntryState;
59
60 struct dict_entry {
61 const void *key;
62 void *value;
63 DictEntryState state;
64 };
65
66 /*******************************************************************************
67 * Function prototypes
68 *******************************************************************************/
69
70 static kern_return_t get_locate_index(const KXLDDict *dict, const void *key,
71 u_int *idx);
72 static kern_return_t get_insert_index(const KXLDDict *dict, const void *key,
73 u_int *idx);
74 static kern_return_t resize_dict(KXLDDict *dict);
75
76 /*******************************************************************************
77 *******************************************************************************/
78 kern_return_t
79 kxld_dict_init(KXLDDict * dict, kxld_dict_hash hash, kxld_dict_cmp cmp,
80 u_int num_entries)
81 {
82 kern_return_t rval = KERN_FAILURE;
83 u_int min_buckets = MIN_BUCKETS(num_entries);
84 u_int num_buckets = DEFAULT_DICT_SIZE;
85
86 check(dict);
87 check(hash);
88 check(cmp);
89
90 /* We want the number of allocated buckets to be at least twice that of the
91 * number to be inserted.
92 */
93 while (min_buckets > num_buckets) {
94 num_buckets *= 2;
95 num_buckets++;
96 }
97
98 /* Allocate enough buckets for the anticipated number of entries */
99 rval = kxld_array_init(&dict->buckets, sizeof(DictEntry), num_buckets);
100 require_noerr(rval, finish);
101
102 /* Initialize */
103 dict->hash = hash;
104 dict->cmp = cmp;
105 dict->num_entries = 0;
106 dict->resize_threshold = RESIZE_THRESHOLD(num_buckets);
107
108 rval = KERN_SUCCESS;
109
110 finish:
111 return rval;
112 }
113
114 /*******************************************************************************
115 *******************************************************************************/
116 void
117 kxld_dict_clear(KXLDDict *dict)
118 {
119 check(dict);
120
121 dict->hash = NULL;
122 dict->cmp = NULL;
123 dict->num_entries = 0;
124 dict->resize_threshold = 0;
125 kxld_array_clear(&dict->buckets);
126 kxld_array_clear(&dict->resize_buckets);
127 }
128
129 /*******************************************************************************
130 *******************************************************************************/
131 void
132 kxld_dict_iterator_init(KXLDDictIterator *iter, const KXLDDict *dict)
133 {
134 check(iter);
135 check(dict);
136
137 iter->idx = 0;
138 iter->dict = dict;
139 }
140
141 /*******************************************************************************
142 *******************************************************************************/
143 void
144 kxld_dict_deinit(KXLDDict *dict)
145 {
146 check(dict);
147
148 kxld_array_deinit(&dict->buckets);
149 kxld_array_deinit(&dict->resize_buckets);
150 }
151
152 /*******************************************************************************
153 *******************************************************************************/
154 u_int
155 kxld_dict_get_num_entries(const KXLDDict *dict)
156 {
157 check(dict);
158
159 return dict->num_entries;
160 }
161
162 /*******************************************************************************
163 *******************************************************************************/
164 void *
165 kxld_dict_find(const KXLDDict *dict, const void *key)
166 {
167 kern_return_t rval = KERN_FAILURE;
168 DictEntry *entry = NULL;
169 u_int idx = 0;
170
171 check(dict);
172 check(key);
173
174 rval = get_locate_index(dict, key, &idx);
175 if (rval) return NULL;
176
177 entry = kxld_array_get_item(&dict->buckets, idx);
178
179 return entry->value;
180 }
181
182 /*******************************************************************************
183 * This dictionary uses linear probing, which means that when there is a
184 * collision, we just walk along the buckets until a free bucket shows up.
185 * A consequence of this is that when looking up an item, items that lie between
186 * its hash value and its actual bucket may have been deleted since it was
187 * inserted. Thus, we should only stop a lookup when we've wrapped around the
188 * dictionary or encountered an EMPTY bucket.
189 ********************************************************************************/
190 static kern_return_t
191 get_locate_index(const KXLDDict *dict, const void *key, u_int *_idx)
192 {
193 kern_return_t rval = KERN_FAILURE;
194 DictEntry *entry = NULL;
195 u_int base, idx;
196
197 base = idx = dict->hash(dict, key);
198
199 /* Iterate until we match the key, wrap, or hit an empty bucket */
200 entry = kxld_array_get_item(&dict->buckets, idx);
201 while (!dict->cmp(entry->key, key)) {
202 if (entry->state == EMPTY) goto finish;
203
204 idx = (idx + 1) % dict->buckets.nitems;
205 if (idx == base) goto finish;
206
207 entry = kxld_array_get_item(&dict->buckets, idx);
208 }
209
210 check(idx < dict->buckets.nitems);
211
212 *_idx = idx;
213 rval = KERN_SUCCESS;
214
215 finish:
216 return rval;
217 }
218
219 /*******************************************************************************
220 *******************************************************************************/
221 kern_return_t
222 kxld_dict_insert(KXLDDict *dict, const void *key, void *value)
223 {
224 kern_return_t rval = KERN_FAILURE;
225 DictEntry *entry = NULL;
226 u_int idx = 0;
227
228 check(dict);
229 check(key);
230 check(value);
231
232 /* Resize if we are greater than the capacity threshold.
233 * Note: this is expensive, but the dictionary can be sized correctly at
234 * construction to avoid ever having to do this.
235 */
236 while (dict->num_entries > dict->resize_threshold) {
237 rval = resize_dict(dict);
238 require_noerr(rval, finish);
239 }
240
241 /* If this function returns FULL after we've already resized appropriately
242 * something is very wrong and we should return an error.
243 */
244 rval = get_insert_index(dict, key, &idx);
245 require_noerr(rval, finish);
246
247 /* Insert the new key-value pair into the bucket, but only count it as a
248 * new entry if we are not overwriting an existing entry.
249 */
250 entry = kxld_array_get_item(&dict->buckets, idx);
251 if (entry->state != USED) {
252 dict->num_entries++;
253 entry->key = key;
254 entry->state = USED;
255 }
256 entry->value = value;
257
258 rval = KERN_SUCCESS;
259
260 finish:
261 return rval;
262 }
263
264 /*******************************************************************************
265 * Increases the hash table's capacity by 2N+1. Uses dictionary API. Not
266 * fast; just correct.
267 *******************************************************************************/
268 static kern_return_t
269 resize_dict(KXLDDict *dict)
270 {
271 kern_return_t rval = KERN_FAILURE;
272 KXLDArray tmparray;
273 DictEntry *entry = NULL;
274 u_int nbuckets = (dict->buckets.nitems * 2 + 1);
275 u_int i = 0;
276
277 check(dict);
278
279 /* Initialize a new set of buckets to hold more entries */
280 rval = kxld_array_init(&dict->resize_buckets, sizeof(DictEntry), nbuckets);
281 require_noerr(rval, finish);
282
283 /* Swap the new buckets with the old buckets */
284 tmparray = dict->buckets;
285 dict->buckets = dict->resize_buckets;
286 dict->resize_buckets = tmparray;
287
288 /* Reset dictionary parameters */
289 dict->num_entries = 0;
290 dict->resize_threshold = RESIZE_THRESHOLD(dict->buckets.nitems);
291
292 /* Rehash all of the entries */
293 for (i = 0; i < dict->resize_buckets.nitems; ++i) {
294 entry = kxld_array_get_item(&dict->resize_buckets, i);
295 if (entry->state == USED) {
296 rval = kxld_dict_insert(dict, entry->key, entry->value);
297 require_noerr(rval, finish);
298 }
299 }
300
301 /* Clear the old buckets */
302 kxld_array_clear(&dict->resize_buckets);
303
304 rval = KERN_SUCCESS;
305
306 finish:
307 return rval;
308 }
309
310 /*******************************************************************************
311 * Simple function to find the first empty cell
312 *******************************************************************************/
313 static kern_return_t
314 get_insert_index(const KXLDDict *dict, const void *key, u_int *r_index)
315 {
316 kern_return_t rval = KERN_FAILURE;
317 DictEntry *entry = NULL;
318 u_int base, idx;
319
320 base = idx = dict->hash(dict, key);
321
322 /* Iterate through the buckets until we find an EMPTY bucket, a DELETED
323 * bucket, or a key match.
324 */
325 entry = kxld_array_get_item(&dict->buckets, idx);
326 while (entry->state == USED && !dict->cmp(entry->key, key)) {
327 idx = (idx + 1) % dict->buckets.nitems;
328 require_action(base != idx, finish, rval=KERN_FAILURE);
329 entry = kxld_array_get_item(&dict->buckets, idx);
330 }
331
332 *r_index = idx;
333 rval = KERN_SUCCESS;
334
335 finish:
336 return rval;
337 }
338
339 /*******************************************************************************
340 *******************************************************************************/
341 void
342 kxld_dict_remove(KXLDDict *dict, const void *key, void **value)
343 {
344 kern_return_t rval = KERN_FAILURE;
345 DictEntry *entry = NULL;
346 u_int idx = 0;
347
348 check(dict);
349 check(key);
350
351 /* Find the item */
352 rval = get_locate_index(dict, key, &idx);
353 if (rval) {
354 if (value) *value = NULL;
355 return;
356 }
357
358 entry = kxld_array_get_item(&dict->buckets, idx);
359
360 /* Save the value if requested */
361 if (value) *value = entry->value;
362
363 /* Delete the item from the dictionary */
364 entry->key = NULL;
365 entry->value = NULL;
366 entry->state = DELETED;
367 dict->num_entries--;
368 }
369
370 /*******************************************************************************
371 *******************************************************************************/
372 void
373 kxld_dict_iterator_get_next(KXLDDictIterator *iter, const void **key,
374 void **value)
375 {
376 DictEntry *entry = NULL;
377
378 check(iter);
379 check(key);
380 check(value);
381
382 *key = NULL;
383 *value = NULL;
384
385 /* Walk over the dictionary looking for USED buckets */
386 for (; iter->idx < iter->dict->buckets.nitems; ++(iter->idx)) {
387 entry = kxld_array_get_item(&iter->dict->buckets, iter->idx);
388 if (entry->state == USED) {
389 *key = entry->key;
390 *value = entry->value;
391 ++(iter->idx);
392 break;
393 }
394 }
395 }
396
397 /*******************************************************************************
398 *******************************************************************************/
399 void
400 kxld_dict_iterator_reset(KXLDDictIterator *iter)
401 {
402 iter->idx = 0;
403 }
404
405 /*******************************************************************************
406 * This is Daniel Bernstein's hash algorithm from comp.lang.c
407 * It's fast and distributes well. Returns an idx into the symbol hash table.
408 * NOTE: Will not check for a valid pointer - performance
409 *******************************************************************************/
410 u_int
411 kxld_dict_string_hash(const KXLDDict *dict, const void *_key)
412 {
413 const char *key = _key;
414 u_int c = 0;
415 u_int hash_val = 5381;
416
417 check(dict);
418 check(_key);
419
420 while ((c = *key++)) {
421 /* hash(i) = hash(i-1) *33 ^ name[i] */
422 hash_val = ((hash_val << 5) + hash_val) ^ c;
423 }
424
425 return (hash_val % dict->buckets.nitems);
426 }
427
428 u_int
429 kxld_dict_uint32_hash(const KXLDDict *dict, const void *_key)
430 {
431 uint32_t key = *(const uint32_t *) _key;
432
433 check(_key);
434
435 return (u_int) (key % dict->buckets.nitems);
436 }
437
438 u_int
439 kxld_dict_kxldaddr_hash(const KXLDDict *dict, const void *_key)
440 {
441 kxld_addr_t key = *(const kxld_addr_t *) _key;
442
443 check(_key);
444
445 return (u_int) (key % dict->buckets.nitems);
446 }
447
448 u_int
449 kxld_dict_string_cmp(const void *key1, const void *key2)
450 {
451 return streq(key1, key2);
452 }
453
454 u_int
455 kxld_dict_uint32_cmp(const void *key1, const void *key2)
456 {
457 const uint32_t *a = key1;
458 const uint32_t *b = key2;
459
460 return (a && b && (*a == *b));
461 }
462
463 u_int
464 kxld_dict_kxldaddr_cmp(const void *key1, const void *key2)
465 {
466 const kxld_addr_t *a = key1;
467 const kxld_addr_t *b = key2;
468
469 return (a && b && (*a == *b));
470 }
471