1 /* hash - hashing table processing. 
   3    Copyright (C) 1998, 1999, 2000, 2001, 2002, 2003 Free Software 
   6    Written by Jim Meyering, 1992. 
   8    This program is free software; you can redistribute it and/or modify 
   9    it under the terms of the GNU General Public License as published by 
  10    the Free Software Foundation; either version 2, or (at your option) 
  13    This program is distributed in the hope that it will be useful, 
  14    but WITHOUT ANY WARRANTY; without even the implied warranty of 
  15    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the 
  16    GNU General Public License for more details. 
  18    You should have received a copy of the GNU General Public License 
  19    along with this program; if not, write to the Free Software Foundation, 
  20    Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.  */ 
  22 /* A generic hash table package.  */ 
  24 /* Define USE_OBSTACK to 1 if you want the allocator to use obstacks instead 
  25    of malloc.  If you change USE_OBSTACK, you have to recompile!  */ 
  37 #ifndef HAVE_DECL_FREE 
  38 "this configure-time declaration test was not run" 
  44 #ifndef HAVE_DECL_MALLOC 
  45 "this configure-time declaration test was not run" 
  53 # ifndef obstack_chunk_alloc 
  54 #  define obstack_chunk_alloc malloc 
  56 # ifndef obstack_chunk_free 
  57 #  define obstack_chunk_free free 
  65     /* The array of buckets starts at BUCKET and extends to BUCKET_LIMIT-1, 
  66        for a possibility of N_BUCKETS.  Among those, N_BUCKETS_USED buckets 
  67        are not empty, there are N_ENTRIES active entries in the table.  */ 
  68     struct hash_entry 
*bucket
; 
  69     struct hash_entry 
*bucket_limit
; 
  71     unsigned n_buckets_used
; 
  74     /* Tuning arguments, kept in a physicaly separate structure.  */ 
  75     const Hash_tuning 
*tuning
; 
  77     /* Three functions are given to `hash_initialize', see the documentation 
  78        block for this function.  In a word, HASHER randomizes a user entry 
  79        into a number up from 0 up to some maximum minus 1; COMPARATOR returns 
  80        true if two user entries compare equally; and DATA_FREER is the cleanup 
  81        function for a user entry.  */ 
  83     Hash_comparator comparator
; 
  84     Hash_data_freer data_freer
; 
  86     /* A linked list of freed struct hash_entry structs.  */ 
  87     struct hash_entry 
*free_entry_list
; 
  90     /* Whenever obstacks are used, it is possible to allocate all overflowed 
  91        entries into a single stack, so they all can be freed in a single 
  92        operation.  It is not clear if the speedup is worth the trouble.  */ 
  93     struct obstack entry_stack
; 
  97 /* A hash table contains many internal entries, each holding a pointer to 
  98    some user provided data (also called a user entry).  An entry indistinctly 
  99    refers to both the internal entry and its associated user entry.  A user 
 100    entry contents may be hashed by a randomization function (the hashing 
 101    function, or just `hasher' for short) into a number (or `slot') between 0 
 102    and the current table size.  At each slot position in the hash table, 
 103    starts a linked chain of entries for which the user data all hash to this 
 104    slot.  A bucket is the collection of all entries hashing to the same slot. 
 106    A good `hasher' function will distribute entries rather evenly in buckets. 
 107    In the ideal case, the length of each bucket is roughly the number of 
 108    entries divided by the table size.  Finding the slot for a data is usually 
 109    done in constant time by the `hasher', and the later finding of a precise 
 110    entry is linear in time with the size of the bucket.  Consequently, a 
 111    larger hash table size (that is, a larger number of buckets) is prone to 
 112    yielding shorter chains, *given* the `hasher' function behaves properly. 
 114    Long buckets slow down the lookup algorithm.  One might use big hash table 
 115    sizes in hope to reduce the average length of buckets, but this might 
 116    become inordinate, as unused slots in the hash table take some space.  The 
 117    best bet is to make sure you are using a good `hasher' function (beware 
 118    that those are not that easy to write! :-), and to use a table size 
 119    larger than the actual number of entries.  */ 
 121 /* If an insertion makes the ratio of nonempty buckets to table size larger 
 122    than the growth threshold (a number between 0.0 and 1.0), then increase 
 123    the table size by multiplying by the growth factor (a number greater than 
 124    1.0).  The growth threshold defaults to 0.8, and the growth factor 
 125    defaults to 1.414, meaning that the table will have doubled its size 
 126    every second time 80% of the buckets get used.  */ 
 127 #define DEFAULT_GROWTH_THRESHOLD 0.8 
 128 #define DEFAULT_GROWTH_FACTOR 1.414 
 130 /* If a deletion empties a bucket and causes the ratio of used buckets to 
 131    table size to become smaller than the shrink threshold (a number between 
 132    0.0 and 1.0), then shrink the table by multiplying by the shrink factor (a 
 133    number greater than the shrink threshold but smaller than 1.0).  The shrink 
 134    threshold and factor default to 0.0 and 1.0, meaning that the table never 
 136 #define DEFAULT_SHRINK_THRESHOLD 0.0 
 137 #define DEFAULT_SHRINK_FACTOR 1.0 
 139 /* Use this to initialize or reset a TUNING structure to 
 140    some sensible values. */ 
 141 static const Hash_tuning default_tuning 
= 
 143     DEFAULT_SHRINK_THRESHOLD
, 
 144     DEFAULT_SHRINK_FACTOR
, 
 145     DEFAULT_GROWTH_THRESHOLD
, 
 146     DEFAULT_GROWTH_FACTOR
, 
 150 /* Information and lookup.  */ 
 152 /* The following few functions provide information about the overall hash 
 153    table organization: the number of entries, number of buckets and maximum 
 154    length of buckets.  */ 
 156 /* Return the number of buckets in the hash table.  The table size, the total 
 157    number of buckets (used plus unused), or the maximum number of slots, are 
 158    the same quantity.  */ 
 161 hash_get_n_buckets (const Hash_table 
*table
) 
 163   return table
->n_buckets
; 
 166 /* Return the number of slots in use (non-empty buckets).  */ 
 169 hash_get_n_buckets_used (const Hash_table 
*table
) 
 171   return table
->n_buckets_used
; 
 174 /* Return the number of active entries.  */ 
 177 hash_get_n_entries (const Hash_table 
*table
) 
 179   return table
->n_entries
; 
 182 /* Return the length of the longest chain (bucket).  */ 
 185 hash_get_max_bucket_length (const Hash_table 
*table
) 
 187   struct hash_entry 
*bucket
; 
 188   unsigned max_bucket_length 
= 0; 
 190   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 194           struct hash_entry 
*cursor 
= bucket
; 
 195           unsigned bucket_length 
= 1; 
 197           while (cursor 
= cursor
->next
, cursor
) 
 200           if (bucket_length 
> max_bucket_length
) 
 201             max_bucket_length 
= bucket_length
; 
 205   return max_bucket_length
; 
 208 /* Do a mild validation of a hash table, by traversing it and checking two 
 212 hash_table_ok (const Hash_table 
*table
) 
 214   struct hash_entry 
*bucket
; 
 215   unsigned n_buckets_used 
= 0; 
 216   unsigned n_entries 
= 0; 
 218   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 222           struct hash_entry 
*cursor 
= bucket
; 
 224           /* Count bucket head.  */ 
 228           /* Count bucket overflow.  */ 
 229           while (cursor 
= cursor
->next
, cursor
) 
 234   if (n_buckets_used 
== table
->n_buckets_used 
&& n_entries 
== table
->n_entries
) 
 241 hash_print_statistics (const Hash_table 
*table
, FILE *stream
) 
 243   unsigned n_entries 
= hash_get_n_entries (table
); 
 244   unsigned n_buckets 
= hash_get_n_buckets (table
); 
 245   unsigned n_buckets_used 
= hash_get_n_buckets_used (table
); 
 246   unsigned max_bucket_length 
= hash_get_max_bucket_length (table
); 
 248   fprintf (stream
, "# entries:         %u\n", n_entries
); 
 249   fprintf (stream
, "# buckets:         %u\n", n_buckets
); 
 250   fprintf (stream
, "# buckets used:    %u (%.2f%%)\n", n_buckets_used
, 
 251            (100.0 * n_buckets_used
) / n_buckets
); 
 252   fprintf (stream
, "max bucket length: %u\n", max_bucket_length
); 
 255 /* If ENTRY matches an entry already in the hash table, return the 
 256    entry from the table.  Otherwise, return NULL.  */ 
 259 hash_lookup (const Hash_table 
*table
, const void *entry
) 
 261   struct hash_entry 
*bucket
 
 262     = table
->bucket 
+ table
->hasher (entry
, table
->n_buckets
); 
 263   struct hash_entry 
*cursor
; 
 265   if (! (bucket 
< table
->bucket_limit
)) 
 268   if (bucket
->data 
== NULL
) 
 271   for (cursor 
= bucket
; cursor
; cursor 
= cursor
->next
) 
 272     if (table
->comparator (entry
, cursor
->data
)) 
 280 /* The functions in this page traverse the hash table and process the 
 281    contained entries.  For the traversal to work properly, the hash table 
 282    should not be resized nor modified while any particular entry is being 
 283    processed.  In particular, entries should not be added or removed.  */ 
 285 /* Return the first data in the table, or NULL if the table is empty.  */ 
 288 hash_get_first (const Hash_table 
*table
) 
 290   struct hash_entry 
*bucket
; 
 292   if (table
->n_entries 
== 0) 
 295   for (bucket 
= table
->bucket
; ; bucket
++) 
 296     if (! (bucket 
< table
->bucket_limit
)) 
 298     else if (bucket
->data
) 
 302 /* Return the user data for the entry following ENTRY, where ENTRY has been 
 303    returned by a previous call to either `hash_get_first' or `hash_get_next'. 
 304    Return NULL if there are no more entries.  */ 
 307 hash_get_next (const Hash_table 
*table
, const void *entry
) 
 309   struct hash_entry 
*bucket
 
 310     = table
->bucket 
+ table
->hasher (entry
, table
->n_buckets
); 
 311   struct hash_entry 
*cursor
; 
 313   if (! (bucket 
< table
->bucket_limit
)) 
 316   /* Find next entry in the same bucket.  */ 
 317   for (cursor 
= bucket
; cursor
; cursor 
= cursor
->next
) 
 318     if (cursor
->data 
== entry 
&& cursor
->next
) 
 319       return cursor
->next
->data
; 
 321   /* Find first entry in any subsequent bucket.  */ 
 322   while (++bucket 
< table
->bucket_limit
) 
 330 /* Fill BUFFER with pointers to active user entries in the hash table, then 
 331    return the number of pointers copied.  Do not copy more than BUFFER_SIZE 
 335 hash_get_entries (const Hash_table 
*table
, void **buffer
, 
 336                   unsigned buffer_size
) 
 338   unsigned counter 
= 0; 
 339   struct hash_entry 
*bucket
; 
 340   struct hash_entry 
*cursor
; 
 342   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 346           for (cursor 
= bucket
; cursor
; cursor 
= cursor
->next
) 
 348               if (counter 
>= buffer_size
) 
 350               buffer
[counter
++] = cursor
->data
; 
 358 /* Call a PROCESSOR function for each entry of a hash table, and return the 
 359    number of entries for which the processor function returned success.  A 
 360    pointer to some PROCESSOR_DATA which will be made available to each call to 
 361    the processor function.  The PROCESSOR accepts two arguments: the first is 
 362    the user entry being walked into, the second is the value of PROCESSOR_DATA 
 363    as received.  The walking continue for as long as the PROCESSOR function 
 364    returns nonzero.  When it returns zero, the walking is interrupted.  */ 
 367 hash_do_for_each (const Hash_table 
*table
, Hash_processor processor
, 
 368                   void *processor_data
) 
 370   unsigned counter 
= 0; 
 371   struct hash_entry 
*bucket
; 
 372   struct hash_entry 
*cursor
; 
 374   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 378           for (cursor 
= bucket
; cursor
; cursor 
= cursor
->next
) 
 380               if (!(*processor
) (cursor
->data
, processor_data
)) 
 390 /* Allocation and clean-up.  */ 
 392 /* Return a hash index for a NUL-terminated STRING between 0 and N_BUCKETS-1. 
 393    This is a convenience routine for constructing other hashing functions.  */ 
 397 /* About hashings, Paul Eggert writes to me (FP), on 1994-01-01: "Please see 
 398    B. J. McKenzie, R. Harries & T. Bell, Selecting a hashing algorithm, 
 399    Software--practice & experience 20, 2 (Feb 1990), 209-224.  Good hash 
 400    algorithms tend to be domain-specific, so what's good for [diffutils'] io.c 
 401    may not be good for your application."  */ 
 404 hash_string (const char *string
, unsigned n_buckets
) 
 409 # define ROTATE_LEFT(Value, Shift) \ 
 410   ((Value) << (Shift) | (Value) >> ((sizeof (unsigned) * CHAR_BIT) - (Shift))) 
 411 # define HASH_ONE_CHAR(Value, Byte) \ 
 412   ((Byte) + ROTATE_LEFT (Value, 7)) 
 416   for (; *string
; string
++) 
 417     value 
= HASH_ONE_CHAR (value
, *(const unsigned char *) string
); 
 418   return value 
% n_buckets
; 
 421 # undef HASH_ONE_CHAR 
 424 #else /* not USE_DIFF_HASH */ 
 426 /* This one comes from `recode', and performs a bit better than the above as 
 427    per a few experiments.  It is inspired from a hashing routine found in the 
 428    very old Cyber `snoop', itself written in typical Greg Mansfield style. 
 429    (By the way, what happened to this excellent man?  Is he still alive?)  */ 
 432 hash_string (const char *string
, unsigned n_buckets
) 
 437     value 
= ((value 
* 31 + (int) *(const unsigned char *) string
++) 
 442 #endif /* not USE_DIFF_HASH */ 
 444 /* Return true if CANDIDATE is a prime number.  CANDIDATE should be an odd 
 445    number at least equal to 11.  */ 
 448 is_prime (unsigned long candidate
) 
 450   unsigned long divisor 
= 3; 
 451   unsigned long square 
= divisor 
* divisor
; 
 453   while (square 
< candidate 
&& (candidate 
% divisor
)) 
 456       square 
+= 4 * divisor
; 
 460   return (candidate 
% divisor 
? true : false); 
 463 /* Round a given CANDIDATE number up to the nearest prime, and return that 
 464    prime.  Primes lower than 10 are merely skipped.  */ 
 467 next_prime (unsigned long candidate
) 
 469   /* Skip small primes.  */ 
 473   /* Make it definitely odd.  */ 
 476   while (!is_prime (candidate
)) 
 483 hash_reset_tuning (Hash_tuning 
*tuning
) 
 485   *tuning 
= default_tuning
; 
 488 /* For the given hash TABLE, check the user supplied tuning structure for 
 489    reasonable values, and return true if there is no gross error with it. 
 490    Otherwise, definitively reset the TUNING field to some acceptable default 
 491    in the hash table (that is, the user loses the right of further modifying 
 492    tuning arguments), and return false.  */ 
 495 check_tuning (Hash_table 
*table
) 
 497   const Hash_tuning 
*tuning 
= table
->tuning
; 
 499   if (tuning
->growth_threshold 
> 0.0 
 500       && tuning
->growth_threshold 
< 1.0 
 501       && tuning
->growth_factor 
> 1.0 
 502       && tuning
->shrink_threshold 
>= 0.0 
 503       && tuning
->shrink_threshold 
< 1.0 
 504       && tuning
->shrink_factor 
> tuning
->shrink_threshold
 
 505       && tuning
->shrink_factor 
<= 1.0 
 506       && tuning
->shrink_threshold 
< tuning
->growth_threshold
) 
 509   table
->tuning 
= &default_tuning
; 
 513 /* Allocate and return a new hash table, or NULL upon failure.  The initial 
 514    number of buckets is automatically selected so as to _guarantee_ that you 
 515    may insert at least CANDIDATE different user entries before any growth of 
 516    the hash table size occurs.  So, if have a reasonably tight a-priori upper 
 517    bound on the number of entries you intend to insert in the hash table, you 
 518    may save some table memory and insertion time, by specifying it here.  If 
 519    the IS_N_BUCKETS field of the TUNING structure is true, the CANDIDATE 
 520    argument has its meaning changed to the wanted number of buckets. 
 522    TUNING points to a structure of user-supplied values, in case some fine 
 523    tuning is wanted over the default behavior of the hasher.  If TUNING is 
 524    NULL, the default tuning parameters are used instead. 
 526    The user-supplied HASHER function should be provided.  It accepts two 
 527    arguments ENTRY and TABLE_SIZE.  It computes, by hashing ENTRY contents, a 
 528    slot number for that entry which should be in the range 0..TABLE_SIZE-1. 
 529    This slot number is then returned. 
 531    The user-supplied COMPARATOR function should be provided.  It accepts two 
 532    arguments pointing to user data, it then returns true for a pair of entries 
 533    that compare equal, or false otherwise.  This function is internally called 
 534    on entries which are already known to hash to the same bucket index. 
 536    The user-supplied DATA_FREER function, when not NULL, may be later called 
 537    with the user data as an argument, just before the entry containing the 
 538    data gets freed.  This happens from within `hash_free' or `hash_clear'. 
 539    You should specify this function only if you want these functions to free 
 540    all of your `data' data.  This is typically the case when your data is 
 541    simply an auxiliary struct that you have malloc'd to aggregate several 
 545 hash_initialize (unsigned candidate
, const Hash_tuning 
*tuning
, 
 546                  Hash_hasher hasher
, Hash_comparator comparator
, 
 547                  Hash_data_freer data_freer
) 
 550   struct hash_entry 
*bucket
; 
 552   if (hasher 
== NULL 
|| comparator 
== NULL
) 
 555   table 
= (Hash_table 
*) malloc (sizeof (Hash_table
)); 
 560     tuning 
= &default_tuning
; 
 561   table
->tuning 
= tuning
; 
 562   if (!check_tuning (table
)) 
 564       /* Fail if the tuning options are invalid.  This is the only occasion 
 565          when the user gets some feedback about it.  Once the table is created, 
 566          if the user provides invalid tuning options, we silently revert to 
 567          using the defaults, and ignore further request to change the tuning 
 574     = next_prime (tuning
->is_n_buckets 
? candidate
 
 575                   : (unsigned) (candidate 
/ tuning
->growth_threshold
)); 
 577   table
->bucket 
= (struct hash_entry 
*) 
 578     malloc (table
->n_buckets 
* sizeof (struct hash_entry
)); 
 579   if (table
->bucket 
== NULL
) 
 584   table
->bucket_limit 
= table
->bucket 
+ table
->n_buckets
; 
 586   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 591   table
->n_buckets_used 
= 0; 
 592   table
->n_entries 
= 0; 
 594   table
->hasher 
= hasher
; 
 595   table
->comparator 
= comparator
; 
 596   table
->data_freer 
= data_freer
; 
 598   table
->free_entry_list 
= NULL
; 
 600   obstack_init (&table
->entry_stack
); 
 605 /* Make all buckets empty, placing any chained entries on the free list. 
 606    Apply the user-specified function data_freer (if any) to the datas of any 
 610 hash_clear (Hash_table 
*table
) 
 612   struct hash_entry 
*bucket
; 
 614   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 618           struct hash_entry 
*cursor
; 
 619           struct hash_entry 
*next
; 
 621           /* Free the bucket overflow.  */ 
 622           for (cursor 
= bucket
->next
; cursor
; cursor 
= next
) 
 624               if (table
->data_freer
) 
 625                 (*table
->data_freer
) (cursor
->data
); 
 629               /* Relinking is done one entry at a time, as it is to be expected 
 630                  that overflows are either rare or short.  */ 
 631               cursor
->next 
= table
->free_entry_list
; 
 632               table
->free_entry_list 
= cursor
; 
 635           /* Free the bucket head.  */ 
 636           if (table
->data_freer
) 
 637             (*table
->data_freer
) (bucket
->data
); 
 643   table
->n_buckets_used 
= 0; 
 644   table
->n_entries 
= 0; 
 647 /* Reclaim all storage associated with a hash table.  If a data_freer 
 648    function has been supplied by the user when the hash table was created, 
 649    this function applies it to the data of each entry before freeing that 
 653 hash_free (Hash_table 
*table
) 
 655   struct hash_entry 
*bucket
; 
 656   struct hash_entry 
*cursor
; 
 657   struct hash_entry 
*next
; 
 659   /* Call the user data_freer function.  */ 
 660   if (table
->data_freer 
&& table
->n_entries
) 
 662       for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 666               for (cursor 
= bucket
; cursor
; cursor 
= cursor
->next
) 
 668                   (*table
->data_freer
) (cursor
->data
); 
 676   obstack_free (&table
->entry_stack
, NULL
); 
 680   /* Free all bucket overflowed entries.  */ 
 681   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 683       for (cursor 
= bucket
->next
; cursor
; cursor 
= next
) 
 690   /* Also reclaim the internal list of previously freed entries.  */ 
 691   for (cursor 
= table
->free_entry_list
; cursor
; cursor 
= next
) 
 699   /* Free the remainder of the hash table structure.  */ 
 700   free (table
->bucket
); 
 704 /* Insertion and deletion.  */ 
 706 /* Get a new hash entry for a bucket overflow, possibly by reclying a 
 707    previously freed one.  If this is not possible, allocate a new one.  */ 
 709 static struct hash_entry 
* 
 710 allocate_entry (Hash_table 
*table
) 
 712   struct hash_entry 
*new; 
 714   if (table
->free_entry_list
) 
 716       new = table
->free_entry_list
; 
 717       table
->free_entry_list 
= new->next
; 
 722       new = (struct hash_entry 
*) 
 723         obstack_alloc (&table
->entry_stack
, sizeof (struct hash_entry
)); 
 725       new = (struct hash_entry 
*) malloc (sizeof (struct hash_entry
)); 
 732 /* Free a hash entry which was part of some bucket overflow, 
 733    saving it for later recycling.  */ 
 736 free_entry (Hash_table 
*table
, struct hash_entry 
*entry
) 
 739   entry
->next 
= table
->free_entry_list
; 
 740   table
->free_entry_list 
= entry
; 
 743 /* This private function is used to help with insertion and deletion.  When 
 744    ENTRY matches an entry in the table, return a pointer to the corresponding 
 745    user data and set *BUCKET_HEAD to the head of the selected bucket. 
 746    Otherwise, return NULL.  When DELETE is true and ENTRY matches an entry in 
 747    the table, unlink the matching entry.  */ 
 750 hash_find_entry (Hash_table 
*table
, const void *entry
, 
 751                  struct hash_entry 
**bucket_head
, bool delete) 
 753   struct hash_entry 
*bucket
 
 754     = table
->bucket 
+ table
->hasher (entry
, table
->n_buckets
); 
 755   struct hash_entry 
*cursor
; 
 757   if (! (bucket 
< table
->bucket_limit
)) 
 760   *bucket_head 
= bucket
; 
 762   /* Test for empty bucket.  */ 
 763   if (bucket
->data 
== NULL
) 
 766   /* See if the entry is the first in the bucket.  */ 
 767   if ((*table
->comparator
) (entry
, bucket
->data
)) 
 769       void *data 
= bucket
->data
; 
 775               struct hash_entry 
*next 
= bucket
->next
; 
 777               /* Bump the first overflow entry into the bucket head, then save 
 778                  the previous first overflow entry for later recycling.  */ 
 780               free_entry (table
, next
); 
 791   /* Scan the bucket overflow.  */ 
 792   for (cursor 
= bucket
; cursor
->next
; cursor 
= cursor
->next
) 
 794       if ((*table
->comparator
) (entry
, cursor
->next
->data
)) 
 796           void *data 
= cursor
->next
->data
; 
 800               struct hash_entry 
*next 
= cursor
->next
; 
 802               /* Unlink the entry to delete, then save the freed entry for later 
 804               cursor
->next 
= next
->next
; 
 805               free_entry (table
, next
); 
 812   /* No entry found.  */ 
 816 /* For an already existing hash table, change the number of buckets through 
 817    specifying CANDIDATE.  The contents of the hash table are preserved.  The 
 818    new number of buckets is automatically selected so as to _guarantee_ that 
 819    the table may receive at least CANDIDATE different user entries, including 
 820    those already in the table, before any other growth of the hash table size 
 821    occurs.  If TUNING->IS_N_BUCKETS is true, then CANDIDATE specifies the 
 822    exact number of buckets desired.  */ 
 825 hash_rehash (Hash_table 
*table
, unsigned candidate
) 
 827   Hash_table 
*new_table
; 
 828   struct hash_entry 
*bucket
; 
 829   struct hash_entry 
*cursor
; 
 830   struct hash_entry 
*next
; 
 832   new_table 
= hash_initialize (candidate
, table
->tuning
, table
->hasher
, 
 833                                table
->comparator
, table
->data_freer
); 
 834   if (new_table 
== NULL
) 
 837   /* Merely reuse the extra old space into the new table.  */ 
 839   obstack_free (&new_table
->entry_stack
, NULL
); 
 840   new_table
->entry_stack 
= table
->entry_stack
; 
 842   new_table
->free_entry_list 
= table
->free_entry_list
; 
 844   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
 846       for (cursor 
= bucket
; cursor
; cursor 
= next
) 
 848           void *data 
= cursor
->data
; 
 849           struct hash_entry 
*new_bucket
 
 851                + new_table
->hasher (data
, new_table
->n_buckets
)); 
 853           if (! (new_bucket 
< new_table
->bucket_limit
)) 
 858           if (new_bucket
->data
) 
 860               if (cursor 
== bucket
) 
 862                   /* Allocate or recycle an entry, when moving from a bucket 
 863                      header into a bucket overflow.  */ 
 864                   struct hash_entry 
*new_entry 
= allocate_entry (new_table
); 
 866                   if (new_entry 
== NULL
) 
 869                   new_entry
->data 
= data
; 
 870                   new_entry
->next 
= new_bucket
->next
; 
 871                   new_bucket
->next 
= new_entry
; 
 875                   /* Merely relink an existing entry, when moving from a 
 876                      bucket overflow into a bucket overflow.  */ 
 877                   cursor
->next 
= new_bucket
->next
; 
 878                   new_bucket
->next 
= cursor
; 
 883               /* Free an existing entry, when moving from a bucket 
 884                  overflow into a bucket header.  Also take care of the 
 885                  simple case of moving from a bucket header into a bucket 
 887               new_bucket
->data 
= data
; 
 888               new_table
->n_buckets_used
++; 
 889               if (cursor 
!= bucket
) 
 890                 free_entry (new_table
, cursor
); 
 894   free (table
->bucket
); 
 895   table
->bucket 
= new_table
->bucket
; 
 896   table
->bucket_limit 
= new_table
->bucket_limit
; 
 897   table
->n_buckets 
= new_table
->n_buckets
; 
 898   table
->n_buckets_used 
= new_table
->n_buckets_used
; 
 899   table
->free_entry_list 
= new_table
->free_entry_list
; 
 900   /* table->n_entries already holds its value.  */ 
 902   table
->entry_stack 
= new_table
->entry_stack
; 
 909 /* If ENTRY matches an entry already in the hash table, return the pointer 
 910    to the entry from the table.  Otherwise, insert ENTRY and return ENTRY. 
 911    Return NULL if the storage required for insertion cannot be allocated.  */ 
 914 hash_insert (Hash_table 
*table
, const void *entry
) 
 917   struct hash_entry 
*bucket
; 
 919   /* The caller cannot insert a NULL entry.  */ 
 923   /* If there's a matching entry already in the table, return that.  */ 
 924   if ((data 
= hash_find_entry (table
, entry
, &bucket
, false)) != NULL
) 
 927   /* ENTRY is not matched, it should be inserted.  */ 
 931       struct hash_entry 
*new_entry 
= allocate_entry (table
); 
 933       if (new_entry 
== NULL
) 
 936       /* Add ENTRY in the overflow of the bucket.  */ 
 938       new_entry
->data 
= (void *) entry
; 
 939       new_entry
->next 
= bucket
->next
; 
 940       bucket
->next 
= new_entry
; 
 942       return (void *) entry
; 
 945   /* Add ENTRY right in the bucket head.  */ 
 947   bucket
->data 
= (void *) entry
; 
 949   table
->n_buckets_used
++; 
 951   /* If the growth threshold of the buckets in use has been reached, increase 
 952      the table size and rehash.  There's no point in checking the number of 
 953      entries:  if the hashing function is ill-conditioned, rehashing is not 
 954      likely to improve it.  */ 
 956   if (table
->n_buckets_used
 
 957       > table
->tuning
->growth_threshold 
* table
->n_buckets
) 
 959       /* Check more fully, before starting real work.  If tuning arguments 
 960          became invalid, the second check will rely on proper defaults.  */ 
 961       check_tuning (table
); 
 962       if (table
->n_buckets_used
 
 963           > table
->tuning
->growth_threshold 
* table
->n_buckets
) 
 965           const Hash_tuning 
*tuning 
= table
->tuning
; 
 967             = (unsigned) (tuning
->is_n_buckets
 
 968                           ? (table
->n_buckets 
* tuning
->growth_factor
) 
 969                           : (table
->n_buckets 
* tuning
->growth_factor
 
 970                              * tuning
->growth_threshold
)); 
 972           /* If the rehash fails, arrange to return NULL.  */ 
 973           if (!hash_rehash (table
, candidate
)) 
 978   return (void *) entry
; 
 981 /* If ENTRY is already in the table, remove it and return the just-deleted 
 982    data (the user may want to deallocate its storage).  If ENTRY is not in the 
 983    table, don't modify the table and return NULL.  */ 
 986 hash_delete (Hash_table 
*table
, const void *entry
) 
 989   struct hash_entry 
*bucket
; 
 991   data 
= hash_find_entry (table
, entry
, &bucket
, true); 
 998       table
->n_buckets_used
--; 
1000       /* If the shrink threshold of the buckets in use has been reached, 
1001          rehash into a smaller table.  */ 
1003       if (table
->n_buckets_used
 
1004           < table
->tuning
->shrink_threshold 
* table
->n_buckets
) 
1006           /* Check more fully, before starting real work.  If tuning arguments 
1007              became invalid, the second check will rely on proper defaults.  */ 
1008           check_tuning (table
); 
1009           if (table
->n_buckets_used
 
1010               < table
->tuning
->shrink_threshold 
* table
->n_buckets
) 
1012               const Hash_tuning 
*tuning 
= table
->tuning
; 
1014                 = (unsigned) (tuning
->is_n_buckets
 
1015                               ? table
->n_buckets 
* tuning
->shrink_factor
 
1016                               : (table
->n_buckets 
* tuning
->shrink_factor
 
1017                                  * tuning
->growth_threshold
)); 
1019               hash_rehash (table
, candidate
); 
1032 hash_print (const Hash_table 
*table
) 
1034   struct hash_entry 
*bucket
; 
1036   for (bucket 
= table
->bucket
; bucket 
< table
->bucket_limit
; bucket
++) 
1038       struct hash_entry 
*cursor
; 
1041         printf ("%d:\n", bucket 
- table
->bucket
); 
1043       for (cursor 
= bucket
; cursor
; cursor 
= cursor
->next
) 
1045           char *s 
= (char *) cursor
->data
; 
1048             printf ("  %s\n", s
); 
1053 #endif /* TESTING */