144099b7bSPaul Traina /************************************************************************
244099b7bSPaul Traina Copyright 1988, 1991 by Carnegie Mellon University
344099b7bSPaul Traina
444099b7bSPaul Traina All Rights Reserved
544099b7bSPaul Traina
644099b7bSPaul Traina Permission to use, copy, modify, and distribute this software and its
744099b7bSPaul Traina documentation for any purpose and without fee is hereby granted, provided
844099b7bSPaul Traina that the above copyright notice appear in all copies and that both that
944099b7bSPaul Traina copyright notice and this permission notice appear in supporting
1044099b7bSPaul Traina documentation, and that the name of Carnegie Mellon University not be used
1144099b7bSPaul Traina in advertising or publicity pertaining to distribution of the software
1244099b7bSPaul Traina without specific, written prior permission.
1344099b7bSPaul Traina
1444099b7bSPaul Traina CARNEGIE MELLON UNIVERSITY DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS
1544099b7bSPaul Traina SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS.
1644099b7bSPaul Traina IN NO EVENT SHALL CMU BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
1744099b7bSPaul Traina DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
1844099b7bSPaul Traina PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
1944099b7bSPaul Traina ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
2044099b7bSPaul Traina SOFTWARE.
21148531efSWolfram Schneider
2244099b7bSPaul Traina ************************************************************************/
2344099b7bSPaul Traina
2444099b7bSPaul Traina /*
2544099b7bSPaul Traina * Generalized hash table ADT
2644099b7bSPaul Traina *
2744099b7bSPaul Traina * Provides multiple, dynamically-allocated, variable-sized hash tables on
2844099b7bSPaul Traina * various data and keys.
2944099b7bSPaul Traina *
3044099b7bSPaul Traina * This package attempts to follow some of the coding conventions suggested
3144099b7bSPaul Traina * by Bob Sidebotham and the AFS Clean Code Committee of the
3244099b7bSPaul Traina * Information Technology Center at Carnegie Mellon.
3344099b7bSPaul Traina */
3444099b7bSPaul Traina
3544099b7bSPaul Traina
3644099b7bSPaul Traina #include <sys/types.h>
3744099b7bSPaul Traina #include <stdlib.h>
38cfb9be50SKyle Evans #include <strings.h>
3944099b7bSPaul Traina
4044099b7bSPaul Traina #include "hash.h"
4144099b7bSPaul Traina
4244099b7bSPaul Traina #define TRUE 1
4344099b7bSPaul Traina #define FALSE 0
4444099b7bSPaul Traina #ifndef NULL
4544099b7bSPaul Traina #define NULL 0
4644099b7bSPaul Traina #endif
4744099b7bSPaul Traina
4844099b7bSPaul Traina /*
4944099b7bSPaul Traina * This can be changed to make internal routines visible to debuggers, etc.
5044099b7bSPaul Traina */
5144099b7bSPaul Traina #ifndef PRIVATE
5244099b7bSPaul Traina #define PRIVATE static
5344099b7bSPaul Traina #endif
5444099b7bSPaul Traina
55f19d047aSAlfred Perlstein PRIVATE void hashi_FreeMembers(hash_member *, hash_freefp);
5644099b7bSPaul Traina
5744099b7bSPaul Traina
5844099b7bSPaul Traina
5944099b7bSPaul Traina
6044099b7bSPaul Traina /*
6144099b7bSPaul Traina * Hash table initialization routine.
6244099b7bSPaul Traina *
6344099b7bSPaul Traina * This routine creates and intializes a hash table of size "tablesize"
6444099b7bSPaul Traina * entries. Successful calls return a pointer to the hash table (which must
6544099b7bSPaul Traina * be passed to other hash routines to identify the hash table). Failed
6644099b7bSPaul Traina * calls return NULL.
6744099b7bSPaul Traina */
6844099b7bSPaul Traina
6944099b7bSPaul Traina hash_tbl *
hash_Init(unsigned tablesize)70*8b356c88SJohn Baldwin hash_Init(unsigned tablesize)
7144099b7bSPaul Traina {
7207ee9f80SPedro F. Giffuni hash_tbl *hashtblptr;
7307ee9f80SPedro F. Giffuni unsigned totalsize;
7444099b7bSPaul Traina
7544099b7bSPaul Traina if (tablesize > 0) {
7644099b7bSPaul Traina totalsize = sizeof(hash_tbl)
7744099b7bSPaul Traina + sizeof(hash_member *) * (tablesize - 1);
7844099b7bSPaul Traina hashtblptr = (hash_tbl *) malloc(totalsize);
7944099b7bSPaul Traina if (hashtblptr) {
8044099b7bSPaul Traina bzero((char *) hashtblptr, totalsize);
8144099b7bSPaul Traina hashtblptr->size = tablesize; /* Success! */
8244099b7bSPaul Traina hashtblptr->bucketnum = 0;
8344099b7bSPaul Traina hashtblptr->member = (hashtblptr->table)[0];
8444099b7bSPaul Traina }
8544099b7bSPaul Traina } else {
8644099b7bSPaul Traina hashtblptr = NULL; /* Disallow zero-length tables */
8744099b7bSPaul Traina }
8844099b7bSPaul Traina return hashtblptr; /* NULL if failure */
8944099b7bSPaul Traina }
9044099b7bSPaul Traina
9144099b7bSPaul Traina
9244099b7bSPaul Traina
9344099b7bSPaul Traina /*
9444099b7bSPaul Traina * Frees an entire linked list of bucket members (used in the open
9544099b7bSPaul Traina * hashing scheme). Does nothing if the passed pointer is NULL.
9644099b7bSPaul Traina */
9744099b7bSPaul Traina
9844099b7bSPaul Traina PRIVATE void
hashi_FreeMembers(hash_member * bucketptr,hash_freefp free_data)99*8b356c88SJohn Baldwin hashi_FreeMembers(hash_member *bucketptr, hash_freefp free_data)
10044099b7bSPaul Traina {
10144099b7bSPaul Traina hash_member *nextbucket;
10244099b7bSPaul Traina while (bucketptr) {
10344099b7bSPaul Traina nextbucket = bucketptr->next;
10444099b7bSPaul Traina (*free_data) (bucketptr->data);
10544099b7bSPaul Traina free((char *) bucketptr);
10644099b7bSPaul Traina bucketptr = nextbucket;
10744099b7bSPaul Traina }
10844099b7bSPaul Traina }
10944099b7bSPaul Traina
11044099b7bSPaul Traina
11144099b7bSPaul Traina
11244099b7bSPaul Traina
11344099b7bSPaul Traina /*
11444099b7bSPaul Traina * This routine re-initializes the hash table. It frees all the allocated
11544099b7bSPaul Traina * memory and resets all bucket pointers to NULL.
11644099b7bSPaul Traina */
11744099b7bSPaul Traina
11844099b7bSPaul Traina void
hash_Reset(hash_tbl * hashtable,hash_freefp free_data)119*8b356c88SJohn Baldwin hash_Reset(hash_tbl *hashtable, hash_freefp free_data)
12044099b7bSPaul Traina {
12144099b7bSPaul Traina hash_member **bucketptr;
12244099b7bSPaul Traina unsigned i;
12344099b7bSPaul Traina
12444099b7bSPaul Traina bucketptr = hashtable->table;
12544099b7bSPaul Traina for (i = 0; i < hashtable->size; i++) {
12644099b7bSPaul Traina hashi_FreeMembers(*bucketptr, free_data);
12744099b7bSPaul Traina *bucketptr++ = NULL;
12844099b7bSPaul Traina }
12944099b7bSPaul Traina hashtable->bucketnum = 0;
13044099b7bSPaul Traina hashtable->member = (hashtable->table)[0];
13144099b7bSPaul Traina }
13244099b7bSPaul Traina
13344099b7bSPaul Traina
13444099b7bSPaul Traina
13544099b7bSPaul Traina /*
13644099b7bSPaul Traina * Generic hash function to calculate a hash code from the given string.
13744099b7bSPaul Traina *
13844099b7bSPaul Traina * For each byte of the string, this function left-shifts the value in an
13944099b7bSPaul Traina * accumulator and then adds the byte into the accumulator. The contents of
14044099b7bSPaul Traina * the accumulator is returned after the entire string has been processed.
14144099b7bSPaul Traina * It is assumed that this result will be used as the "hashcode" parameter in
14244099b7bSPaul Traina * calls to other functions in this package. These functions automatically
14344099b7bSPaul Traina * adjust the hashcode for the size of each hashtable.
14444099b7bSPaul Traina *
14544099b7bSPaul Traina * This algorithm probably works best when the hash table size is a prime
14644099b7bSPaul Traina * number.
14744099b7bSPaul Traina *
14844099b7bSPaul Traina * Hopefully, this function is better than the previous one which returned
14944099b7bSPaul Traina * the sum of the squares of all the bytes. I'm still open to other
15044099b7bSPaul Traina * suggestions for a default hash function. The programmer is more than
15144099b7bSPaul Traina * welcome to supply his/her own hash function as that is one of the design
15244099b7bSPaul Traina * features of this package.
15344099b7bSPaul Traina */
15444099b7bSPaul Traina
15544099b7bSPaul Traina unsigned
hash_HashFunction(unsigned char * string,unsigned len)156*8b356c88SJohn Baldwin hash_HashFunction(unsigned char *string, unsigned len)
15744099b7bSPaul Traina {
15807ee9f80SPedro F. Giffuni unsigned accum;
15944099b7bSPaul Traina
16044099b7bSPaul Traina accum = 0;
16144099b7bSPaul Traina for (; len > 0; len--) {
16244099b7bSPaul Traina accum <<= 1;
16344099b7bSPaul Traina accum += (unsigned) (*string++ & 0xFF);
16444099b7bSPaul Traina }
16544099b7bSPaul Traina return accum;
16644099b7bSPaul Traina }
16744099b7bSPaul Traina
16844099b7bSPaul Traina
16944099b7bSPaul Traina
17044099b7bSPaul Traina /*
17144099b7bSPaul Traina * Returns TRUE if at least one entry for the given key exists; FALSE
17244099b7bSPaul Traina * otherwise.
17344099b7bSPaul Traina */
17444099b7bSPaul Traina
17544099b7bSPaul Traina int
hash_Exists(hash_tbl * hashtable,unsigned hashcode,hash_cmpfp compare,hash_datum * key)176*8b356c88SJohn Baldwin hash_Exists(hash_tbl *hashtable, unsigned hashcode, hash_cmpfp compare,
177*8b356c88SJohn Baldwin hash_datum *key)
17844099b7bSPaul Traina {
17907ee9f80SPedro F. Giffuni hash_member *memberptr;
18044099b7bSPaul Traina
18144099b7bSPaul Traina memberptr = (hashtable->table)[hashcode % (hashtable->size)];
18244099b7bSPaul Traina while (memberptr) {
18344099b7bSPaul Traina if ((*compare) (key, memberptr->data)) {
18444099b7bSPaul Traina return TRUE; /* Entry does exist */
18544099b7bSPaul Traina }
18644099b7bSPaul Traina memberptr = memberptr->next;
18744099b7bSPaul Traina }
18844099b7bSPaul Traina return FALSE; /* Entry does not exist */
18944099b7bSPaul Traina }
19044099b7bSPaul Traina
19144099b7bSPaul Traina
19244099b7bSPaul Traina
19344099b7bSPaul Traina /*
19444099b7bSPaul Traina * Insert the data item "element" into the hash table using "hashcode"
19544099b7bSPaul Traina * to determine the bucket number, and "compare" and "key" to determine
19644099b7bSPaul Traina * its uniqueness.
19744099b7bSPaul Traina *
19844099b7bSPaul Traina * If the insertion is successful 0 is returned. If a matching entry
19944099b7bSPaul Traina * already exists in the given bucket of the hash table, or some other error
20044099b7bSPaul Traina * occurs, -1 is returned and the insertion is not done.
20144099b7bSPaul Traina */
20244099b7bSPaul Traina
20344099b7bSPaul Traina int
hash_Insert(hash_tbl * hashtable,unsigned hashcode,hash_cmpfp compare,hash_datum * key,hash_datum * element)204*8b356c88SJohn Baldwin hash_Insert(hash_tbl *hashtable, unsigned hashcode, hash_cmpfp compare,
205*8b356c88SJohn Baldwin hash_datum *key, hash_datum *element)
20644099b7bSPaul Traina {
20744099b7bSPaul Traina hash_member *temp;
20844099b7bSPaul Traina
20944099b7bSPaul Traina hashcode %= hashtable->size;
21044099b7bSPaul Traina if (hash_Exists(hashtable, hashcode, compare, key)) {
21144099b7bSPaul Traina return -1; /* At least one entry already exists */
21244099b7bSPaul Traina }
21344099b7bSPaul Traina temp = (hash_member *) malloc(sizeof(hash_member));
21444099b7bSPaul Traina if (!temp)
21544099b7bSPaul Traina return -1; /* malloc failed! */
21644099b7bSPaul Traina
21744099b7bSPaul Traina temp->data = element;
21844099b7bSPaul Traina temp->next = (hashtable->table)[hashcode];
21944099b7bSPaul Traina (hashtable->table)[hashcode] = temp;
22044099b7bSPaul Traina return 0; /* Success */
22144099b7bSPaul Traina }
22244099b7bSPaul Traina
22344099b7bSPaul Traina
22444099b7bSPaul Traina
22544099b7bSPaul Traina /*
22644099b7bSPaul Traina * Delete all data elements which match the given key. If at least one
22744099b7bSPaul Traina * element is found and the deletion is successful, 0 is returned.
22844099b7bSPaul Traina * If no matching elements can be found in the hash table, -1 is returned.
22944099b7bSPaul Traina */
23044099b7bSPaul Traina
23144099b7bSPaul Traina int
hash_Delete(hash_tbl * hashtable,unsigned hashcode,hash_cmpfp compare,hash_datum * key,hash_freefp free_data)232*8b356c88SJohn Baldwin hash_Delete(hash_tbl *hashtable, unsigned hashcode, hash_cmpfp compare,
233*8b356c88SJohn Baldwin hash_datum *key, hash_freefp free_data)
23444099b7bSPaul Traina {
23544099b7bSPaul Traina hash_member *memberptr, *tempptr;
23644099b7bSPaul Traina hash_member *previous = NULL;
23744099b7bSPaul Traina int retval;
23844099b7bSPaul Traina
23944099b7bSPaul Traina retval = -1;
24044099b7bSPaul Traina hashcode %= hashtable->size;
24144099b7bSPaul Traina
24244099b7bSPaul Traina /*
24344099b7bSPaul Traina * Delete the first member of the list if it matches. Since this moves
24444099b7bSPaul Traina * the second member into the first position we have to keep doing this
24544099b7bSPaul Traina * over and over until it no longer matches.
24644099b7bSPaul Traina */
24744099b7bSPaul Traina memberptr = (hashtable->table)[hashcode];
24844099b7bSPaul Traina while (memberptr && (*compare) (key, memberptr->data)) {
24944099b7bSPaul Traina (hashtable->table)[hashcode] = memberptr->next;
25044099b7bSPaul Traina /*
25144099b7bSPaul Traina * Stop hashi_FreeMembers() from deleting the whole list!
25244099b7bSPaul Traina */
25344099b7bSPaul Traina memberptr->next = NULL;
25444099b7bSPaul Traina hashi_FreeMembers(memberptr, free_data);
25544099b7bSPaul Traina memberptr = (hashtable->table)[hashcode];
25644099b7bSPaul Traina retval = 0;
25744099b7bSPaul Traina }
25844099b7bSPaul Traina
25944099b7bSPaul Traina /*
26044099b7bSPaul Traina * Now traverse the rest of the list
26144099b7bSPaul Traina */
26244099b7bSPaul Traina if (memberptr) {
26344099b7bSPaul Traina previous = memberptr;
26444099b7bSPaul Traina memberptr = memberptr->next;
26544099b7bSPaul Traina }
26644099b7bSPaul Traina while (memberptr) {
26744099b7bSPaul Traina if ((*compare) (key, memberptr->data)) {
26844099b7bSPaul Traina tempptr = memberptr;
26944099b7bSPaul Traina previous->next = memberptr = memberptr->next;
27044099b7bSPaul Traina /*
27144099b7bSPaul Traina * Put the brakes on hashi_FreeMembers(). . . .
27244099b7bSPaul Traina */
27344099b7bSPaul Traina tempptr->next = NULL;
27444099b7bSPaul Traina hashi_FreeMembers(tempptr, free_data);
27544099b7bSPaul Traina retval = 0;
27644099b7bSPaul Traina } else {
27744099b7bSPaul Traina previous = memberptr;
27844099b7bSPaul Traina memberptr = memberptr->next;
27944099b7bSPaul Traina }
28044099b7bSPaul Traina }
28144099b7bSPaul Traina return retval;
28244099b7bSPaul Traina }
28344099b7bSPaul Traina
28444099b7bSPaul Traina
28544099b7bSPaul Traina
28644099b7bSPaul Traina /*
28744099b7bSPaul Traina * Locate and return the data entry associated with the given key.
28844099b7bSPaul Traina *
28944099b7bSPaul Traina * If the data entry is found, a pointer to it is returned. Otherwise,
29044099b7bSPaul Traina * NULL is returned.
29144099b7bSPaul Traina */
29244099b7bSPaul Traina
29344099b7bSPaul Traina hash_datum *
hash_Lookup(hash_tbl * hashtable,unsigned hashcode,hash_cmpfp compare,hash_datum * key)294*8b356c88SJohn Baldwin hash_Lookup(hash_tbl *hashtable, unsigned hashcode, hash_cmpfp compare,
295*8b356c88SJohn Baldwin hash_datum *key)
29644099b7bSPaul Traina {
29744099b7bSPaul Traina hash_member *memberptr;
29844099b7bSPaul Traina
29944099b7bSPaul Traina memberptr = (hashtable->table)[hashcode % (hashtable->size)];
30044099b7bSPaul Traina while (memberptr) {
30144099b7bSPaul Traina if ((*compare) (key, memberptr->data)) {
30244099b7bSPaul Traina return (memberptr->data);
30344099b7bSPaul Traina }
30444099b7bSPaul Traina memberptr = memberptr->next;
30544099b7bSPaul Traina }
30644099b7bSPaul Traina return NULL;
30744099b7bSPaul Traina }
30844099b7bSPaul Traina
30944099b7bSPaul Traina
31044099b7bSPaul Traina
31144099b7bSPaul Traina /*
31244099b7bSPaul Traina * Return the next available entry in the hashtable for a linear search
31344099b7bSPaul Traina */
31444099b7bSPaul Traina
31544099b7bSPaul Traina hash_datum *
hash_NextEntry(hash_tbl * hashtable)316*8b356c88SJohn Baldwin hash_NextEntry(hash_tbl *hashtable)
31744099b7bSPaul Traina {
31807ee9f80SPedro F. Giffuni unsigned bucket;
31907ee9f80SPedro F. Giffuni hash_member *memberptr;
32044099b7bSPaul Traina
32144099b7bSPaul Traina /*
32244099b7bSPaul Traina * First try to pick up where we left off.
32344099b7bSPaul Traina */
32444099b7bSPaul Traina memberptr = hashtable->member;
32544099b7bSPaul Traina if (memberptr) {
32644099b7bSPaul Traina hashtable->member = memberptr->next; /* Set up for next call */
32744099b7bSPaul Traina return memberptr->data; /* Return the data */
32844099b7bSPaul Traina }
32944099b7bSPaul Traina /*
33044099b7bSPaul Traina * We hit the end of a chain, so look through the array of buckets
33144099b7bSPaul Traina * until we find a new chain (non-empty bucket) or run out of buckets.
33244099b7bSPaul Traina */
33344099b7bSPaul Traina bucket = hashtable->bucketnum + 1;
33444099b7bSPaul Traina while ((bucket < hashtable->size) &&
33544099b7bSPaul Traina !(memberptr = (hashtable->table)[bucket])) {
33644099b7bSPaul Traina bucket++;
33744099b7bSPaul Traina }
33844099b7bSPaul Traina
33944099b7bSPaul Traina /*
34044099b7bSPaul Traina * Check to see if we ran out of buckets.
34144099b7bSPaul Traina */
34244099b7bSPaul Traina if (bucket >= hashtable->size) {
34344099b7bSPaul Traina /*
34444099b7bSPaul Traina * Reset to top of table for next call.
34544099b7bSPaul Traina */
34644099b7bSPaul Traina hashtable->bucketnum = 0;
34744099b7bSPaul Traina hashtable->member = (hashtable->table)[0];
34844099b7bSPaul Traina /*
34944099b7bSPaul Traina * But return end-of-table indication to the caller this time.
35044099b7bSPaul Traina */
35144099b7bSPaul Traina return NULL;
35244099b7bSPaul Traina }
35344099b7bSPaul Traina /*
35444099b7bSPaul Traina * Must have found a non-empty bucket.
35544099b7bSPaul Traina */
35644099b7bSPaul Traina hashtable->bucketnum = bucket;
35744099b7bSPaul Traina hashtable->member = memberptr->next; /* Set up for next call */
35844099b7bSPaul Traina return memberptr->data; /* Return the data */
35944099b7bSPaul Traina }
36044099b7bSPaul Traina
36144099b7bSPaul Traina
36244099b7bSPaul Traina
36344099b7bSPaul Traina /*
36444099b7bSPaul Traina * Return the first entry in a hash table for a linear search
36544099b7bSPaul Traina */
36644099b7bSPaul Traina
36744099b7bSPaul Traina hash_datum *
hash_FirstEntry(hash_tbl * hashtable)368*8b356c88SJohn Baldwin hash_FirstEntry(hash_tbl *hashtable)
36944099b7bSPaul Traina {
37044099b7bSPaul Traina hashtable->bucketnum = 0;
37144099b7bSPaul Traina hashtable->member = (hashtable->table)[0];
37244099b7bSPaul Traina return hash_NextEntry(hashtable);
37344099b7bSPaul Traina }
37444099b7bSPaul Traina
37544099b7bSPaul Traina /*
37644099b7bSPaul Traina * Local Variables:
37744099b7bSPaul Traina * tab-width: 4
37844099b7bSPaul Traina * c-indent-level: 4
37944099b7bSPaul Traina * c-argdecl-indent: 4
38044099b7bSPaul Traina * c-continued-statement-offset: 4
38144099b7bSPaul Traina * c-continued-brace-offset: -4
38244099b7bSPaul Traina * c-label-offset: -4
38344099b7bSPaul Traina * c-brace-offset: 0
38444099b7bSPaul Traina * End:
38544099b7bSPaul Traina */
386