1 /************************************************************************
2 Copyright 1988, 1991 by Carnegie Mellon University
6 Permission to use, copy, modify, and distribute this software and its
7 documentation for any purpose and without fee is hereby granted, provided
8 that the above copyright notice appear in all copies and that both that
9 copyright notice and this permission notice appear in supporting
10 documentation, and that the name of Carnegie Mellon University not be used
11 in advertising or publicity pertaining to distribution of the software
12 without specific, written prior permission.
14 CARNEGIE MELLON UNIVERSITY DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS
15 SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS.
16 IN NO EVENT SHALL CMU BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
17 DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
18 PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
19 ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
21 ************************************************************************/
23 #include <sys/cdefs.h>
25 __RCSID("$NetBSD: hash.c,v 1.6 2002/07/14 00:30:02 wiz Exp $");
30 * Generalized hash table ADT
32 * Provides multiple, dynamically-allocated, variable-sized hash tables on
33 * various data and keys.
35 * This package attempts to follow some of the coding conventions suggested
36 * by Bob Sidebotham and the AFS Clean Code Committee of the
37 * Information Technology Center at Carnegie Mellon.
41 #include <sys/types.h>
54 * This can be changed to make internal routines visible to debuggers, etc.
57 #define PRIVATE static
60 PRIVATE
void hashi_FreeMembers(hash_member
*, hash_freefp
);
66 * Hash table initialization routine.
68 * This routine creates and intializes a hash table of size "tablesize"
69 * entries. Successful calls return a pointer to the hash table (which must
70 * be passed to other hash routines to identify the hash table). Failed
75 hash_Init(unsigned int tablesize
)
81 totalsize
= sizeof(hash_tbl
)
82 + sizeof(hash_member
*) * (tablesize
- 1);
83 hashtblptr
= (hash_tbl
*) malloc(totalsize
);
85 bzero((char *) hashtblptr
, totalsize
);
86 hashtblptr
->size
= tablesize
; /* Success! */
87 hashtblptr
->bucketnum
= 0;
88 hashtblptr
->member
= (hashtblptr
->table
)[0];
91 hashtblptr
= NULL
; /* Disallow zero-length tables */
93 return hashtblptr
; /* NULL if failure */
99 * Frees an entire linked list of bucket members (used in the open
100 * hashing scheme). Does nothing if the passed pointer is NULL.
104 hashi_FreeMembers(hash_member
*bucketptr
, hash_freefp free_data
)
106 hash_member
*nextbucket
;
108 nextbucket
= bucketptr
->next
;
109 (*free_data
) (bucketptr
->data
);
110 free((char *) bucketptr
);
111 bucketptr
= nextbucket
;
119 * This routine re-initializes the hash table. It frees all the allocated
120 * memory and resets all bucket pointers to NULL.
124 hash_Reset(hash_tbl
*hashtable
, hash_freefp free_data
)
126 hash_member
**bucketptr
;
129 bucketptr
= hashtable
->table
;
130 for (i
= 0; i
< hashtable
->size
; i
++) {
131 hashi_FreeMembers(*bucketptr
, free_data
);
134 hashtable
->bucketnum
= 0;
135 hashtable
->member
= (hashtable
->table
)[0];
141 * Generic hash function to calculate a hash code from the given string.
143 * For each byte of the string, this function left-shifts the value in an
144 * accumulator and then adds the byte into the accumulator. The contents of
145 * the accumulator is returned after the entire string has been processed.
146 * It is assumed that this result will be used as the "hashcode" parameter in
147 * calls to other functions in this package. These functions automatically
148 * adjust the hashcode for the size of each hashtable.
150 * This algorithm probably works best when the hash table size is a prime
153 * Hopefully, this function is better than the previous one which returned
154 * the sum of the squares of all the bytes. I'm still open to other
155 * suggestions for a default hash function. The programmer is more than
156 * welcome to supply his/her own hash function as that is one of the design
157 * features of this package.
161 hash_HashFunction(unsigned char *string
, unsigned int len
)
166 for (; len
> 0; len
--) {
168 accum
+= (unsigned) (*string
++ & 0xFF);
176 * Returns TRUE if at least one entry for the given key exists; FALSE
181 hash_Exists(hash_tbl
*hashtable
, unsigned int hashcode
, hash_cmpfp compare
,
184 hash_member
*memberptr
;
186 memberptr
= (hashtable
->table
)[hashcode
% (hashtable
->size
)];
188 if ((*compare
) (key
, memberptr
->data
)) {
189 return TRUE
; /* Entry does exist */
191 memberptr
= memberptr
->next
;
193 return FALSE
; /* Entry does not exist */
199 * Insert the data item "element" into the hash table using "hashcode"
200 * to determine the bucket number, and "compare" and "key" to determine
203 * If the insertion is successful 0 is returned. If a matching entry
204 * already exists in the given bucket of the hash table, or some other error
205 * occurs, -1 is returned and the insertion is not done.
209 hash_Insert(hash_tbl
*hashtable
, unsigned int hashcode
, hash_cmpfp compare
,
210 hash_datum
*key
, hash_datum
*element
)
214 hashcode
%= hashtable
->size
;
215 if (hash_Exists(hashtable
, hashcode
, compare
, key
)) {
216 return -1; /* At least one entry already exists */
218 temp
= (hash_member
*) malloc(sizeof(hash_member
));
220 return -1; /* malloc failed! */
222 temp
->data
= element
;
223 temp
->next
= (hashtable
->table
)[hashcode
];
224 (hashtable
->table
)[hashcode
] = temp
;
225 return 0; /* Success */
231 * Delete all data elements which match the given key. If at least one
232 * element is found and the deletion is successful, 0 is returned.
233 * If no matching elements can be found in the hash table, -1 is returned.
237 hash_Delete(hash_tbl
*hashtable
, unsigned int hashcode
, hash_cmpfp compare
,
238 hash_datum
*key
, hash_freefp free_data
)
240 hash_member
*memberptr
, *tempptr
;
241 hash_member
*previous
= NULL
;
245 hashcode
%= hashtable
->size
;
248 * Delete the first member of the list if it matches. Since this moves
249 * the second member into the first position we have to keep doing this
250 * over and over until it no longer matches.
252 memberptr
= (hashtable
->table
)[hashcode
];
253 while (memberptr
&& (*compare
) (key
, memberptr
->data
)) {
254 (hashtable
->table
)[hashcode
] = memberptr
->next
;
256 * Stop hashi_FreeMembers() from deleting the whole list!
258 memberptr
->next
= NULL
;
259 hashi_FreeMembers(memberptr
, free_data
);
260 memberptr
= (hashtable
->table
)[hashcode
];
265 * Now traverse the rest of the list
268 previous
= memberptr
;
269 memberptr
= memberptr
->next
;
272 if ((*compare
) (key
, memberptr
->data
)) {
274 previous
->next
= memberptr
= memberptr
->next
;
276 * Put the brakes on hashi_FreeMembers(). . . .
278 tempptr
->next
= NULL
;
279 hashi_FreeMembers(tempptr
, free_data
);
282 previous
= memberptr
;
283 memberptr
= memberptr
->next
;
292 * Locate and return the data entry associated with the given key.
294 * If the data entry is found, a pointer to it is returned. Otherwise,
299 hash_Lookup(hash_tbl
*hashtable
, unsigned int hashcode
, hash_cmpfp compare
,
302 hash_member
*memberptr
;
304 memberptr
= (hashtable
->table
)[hashcode
% (hashtable
->size
)];
306 if ((*compare
) (key
, memberptr
->data
)) {
307 return (memberptr
->data
);
309 memberptr
= memberptr
->next
;
317 * Return the next available entry in the hashtable for a linear search
321 hash_NextEntry(hash_tbl
*hashtable
)
324 hash_member
*memberptr
;
327 * First try to pick up where we left off.
329 memberptr
= hashtable
->member
;
331 hashtable
->member
= memberptr
->next
; /* Set up for next call */
332 return memberptr
->data
; /* Return the data */
335 * We hit the end of a chain, so look through the array of buckets
336 * until we find a new chain (non-empty bucket) or run out of buckets.
338 bucket
= hashtable
->bucketnum
+ 1;
339 while ((bucket
< hashtable
->size
) &&
340 !(memberptr
= (hashtable
->table
)[bucket
])) {
345 * Check to see if we ran out of buckets.
347 if (bucket
>= hashtable
->size
) {
349 * Reset to top of table for next call.
351 hashtable
->bucketnum
= 0;
352 hashtable
->member
= (hashtable
->table
)[0];
354 * But return end-of-table indication to the caller this time.
359 * Must have found a non-empty bucket.
361 hashtable
->bucketnum
= bucket
;
362 hashtable
->member
= memberptr
->next
; /* Set up for next call */
363 return memberptr
->data
; /* Return the data */
369 * Return the first entry in a hash table for a linear search
373 hash_FirstEntry(hash_tbl
*hashtable
)
375 hashtable
->bucketnum
= 0;
376 hashtable
->member
= (hashtable
->table
)[0];
377 return hash_NextEntry(hashtable
);
384 * c-argdecl-indent: 4
385 * c-continued-statement-offset: 4
386 * c-continued-brace-offset: -4