144099b7bSPaul Traina /************************************************************************ 244099b7bSPaul Traina Copyright 1988, 1991 by Carnegie Mellon University 344099b7bSPaul Traina 444099b7bSPaul Traina All Rights Reserved 544099b7bSPaul Traina 644099b7bSPaul Traina Permission to use, copy, modify, and distribute this software and its 744099b7bSPaul Traina documentation for any purpose and without fee is hereby granted, provided 844099b7bSPaul Traina that the above copyright notice appear in all copies and that both that 944099b7bSPaul Traina copyright notice and this permission notice appear in supporting 1044099b7bSPaul Traina documentation, and that the name of Carnegie Mellon University not be used 1144099b7bSPaul Traina in advertising or publicity pertaining to distribution of the software 1244099b7bSPaul Traina without specific, written prior permission. 1344099b7bSPaul Traina 1444099b7bSPaul Traina CARNEGIE MELLON UNIVERSITY DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS 1544099b7bSPaul Traina SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. 1644099b7bSPaul Traina IN NO EVENT SHALL CMU BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL 1744099b7bSPaul Traina DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR 1844099b7bSPaul Traina PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS 1944099b7bSPaul Traina ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS 2044099b7bSPaul Traina SOFTWARE. 21148531efSWolfram Schneider 22148531efSWolfram Schneider $Id$ 23148531efSWolfram Schneider 2444099b7bSPaul Traina ************************************************************************/ 2544099b7bSPaul Traina 2644099b7bSPaul Traina /* 2744099b7bSPaul Traina * Generalized hash table ADT 2844099b7bSPaul Traina * 2944099b7bSPaul Traina * Provides multiple, dynamically-allocated, variable-sized hash tables on 3044099b7bSPaul Traina * various data and keys. 3144099b7bSPaul Traina * 3244099b7bSPaul Traina * This package attempts to follow some of the coding conventions suggested 3344099b7bSPaul Traina * by Bob Sidebotham and the AFS Clean Code Committee of the 3444099b7bSPaul Traina * Information Technology Center at Carnegie Mellon. 3544099b7bSPaul Traina */ 3644099b7bSPaul Traina 3744099b7bSPaul Traina 3844099b7bSPaul Traina #include <sys/types.h> 3944099b7bSPaul Traina #include <stdlib.h> 4044099b7bSPaul Traina 4144099b7bSPaul Traina #ifndef USE_BFUNCS 4244099b7bSPaul Traina #include <memory.h> 4344099b7bSPaul Traina /* Yes, memcpy is OK here (no overlapped copies). */ 4444099b7bSPaul Traina #define bcopy(a,b,c) memcpy(b,a,c) 4544099b7bSPaul Traina #define bzero(p,l) memset(p,0,l) 4644099b7bSPaul Traina #define bcmp(a,b,c) memcmp(a,b,c) 4744099b7bSPaul Traina #endif 4844099b7bSPaul Traina 4944099b7bSPaul Traina #include "hash.h" 5044099b7bSPaul Traina 5144099b7bSPaul Traina #define TRUE 1 5244099b7bSPaul Traina #define FALSE 0 5344099b7bSPaul Traina #ifndef NULL 5444099b7bSPaul Traina #define NULL 0 5544099b7bSPaul Traina #endif 5644099b7bSPaul Traina 5744099b7bSPaul Traina /* 5844099b7bSPaul Traina * This can be changed to make internal routines visible to debuggers, etc. 5944099b7bSPaul Traina */ 6044099b7bSPaul Traina #ifndef PRIVATE 6144099b7bSPaul Traina #define PRIVATE static 6244099b7bSPaul Traina #endif 6344099b7bSPaul Traina 6444099b7bSPaul Traina #ifdef __STDC__ 6544099b7bSPaul Traina #define P(args) args 6644099b7bSPaul Traina #else 6744099b7bSPaul Traina #define P(args) () 6844099b7bSPaul Traina #endif 6944099b7bSPaul Traina 7044099b7bSPaul Traina PRIVATE void hashi_FreeMembers P((hash_member *, hash_freefp)); 7144099b7bSPaul Traina 7244099b7bSPaul Traina #undef P 7344099b7bSPaul Traina 7444099b7bSPaul Traina 7544099b7bSPaul Traina 7644099b7bSPaul Traina /* 7744099b7bSPaul Traina * Hash table initialization routine. 7844099b7bSPaul Traina * 7944099b7bSPaul Traina * This routine creates and intializes a hash table of size "tablesize" 8044099b7bSPaul Traina * entries. Successful calls return a pointer to the hash table (which must 8144099b7bSPaul Traina * be passed to other hash routines to identify the hash table). Failed 8244099b7bSPaul Traina * calls return NULL. 8344099b7bSPaul Traina */ 8444099b7bSPaul Traina 8544099b7bSPaul Traina hash_tbl * 8644099b7bSPaul Traina hash_Init(tablesize) 8744099b7bSPaul Traina unsigned tablesize; 8844099b7bSPaul Traina { 8944099b7bSPaul Traina register hash_tbl *hashtblptr; 9044099b7bSPaul Traina register unsigned totalsize; 9144099b7bSPaul Traina 9244099b7bSPaul Traina if (tablesize > 0) { 9344099b7bSPaul Traina totalsize = sizeof(hash_tbl) 9444099b7bSPaul Traina + sizeof(hash_member *) * (tablesize - 1); 9544099b7bSPaul Traina hashtblptr = (hash_tbl *) malloc(totalsize); 9644099b7bSPaul Traina if (hashtblptr) { 9744099b7bSPaul Traina bzero((char *) hashtblptr, totalsize); 9844099b7bSPaul Traina hashtblptr->size = tablesize; /* Success! */ 9944099b7bSPaul Traina hashtblptr->bucketnum = 0; 10044099b7bSPaul Traina hashtblptr->member = (hashtblptr->table)[0]; 10144099b7bSPaul Traina } 10244099b7bSPaul Traina } else { 10344099b7bSPaul Traina hashtblptr = NULL; /* Disallow zero-length tables */ 10444099b7bSPaul Traina } 10544099b7bSPaul Traina return hashtblptr; /* NULL if failure */ 10644099b7bSPaul Traina } 10744099b7bSPaul Traina 10844099b7bSPaul Traina 10944099b7bSPaul Traina 11044099b7bSPaul Traina /* 11144099b7bSPaul Traina * Frees an entire linked list of bucket members (used in the open 11244099b7bSPaul Traina * hashing scheme). Does nothing if the passed pointer is NULL. 11344099b7bSPaul Traina */ 11444099b7bSPaul Traina 11544099b7bSPaul Traina PRIVATE void 11644099b7bSPaul Traina hashi_FreeMembers(bucketptr, free_data) 11744099b7bSPaul Traina hash_member *bucketptr; 11844099b7bSPaul Traina hash_freefp free_data; 11944099b7bSPaul Traina { 12044099b7bSPaul Traina hash_member *nextbucket; 12144099b7bSPaul Traina while (bucketptr) { 12244099b7bSPaul Traina nextbucket = bucketptr->next; 12344099b7bSPaul Traina (*free_data) (bucketptr->data); 12444099b7bSPaul Traina free((char *) bucketptr); 12544099b7bSPaul Traina bucketptr = nextbucket; 12644099b7bSPaul Traina } 12744099b7bSPaul Traina } 12844099b7bSPaul Traina 12944099b7bSPaul Traina 13044099b7bSPaul Traina 13144099b7bSPaul Traina 13244099b7bSPaul Traina /* 13344099b7bSPaul Traina * This routine re-initializes the hash table. It frees all the allocated 13444099b7bSPaul Traina * memory and resets all bucket pointers to NULL. 13544099b7bSPaul Traina */ 13644099b7bSPaul Traina 13744099b7bSPaul Traina void 13844099b7bSPaul Traina hash_Reset(hashtable, free_data) 13944099b7bSPaul Traina hash_tbl *hashtable; 14044099b7bSPaul Traina hash_freefp free_data; 14144099b7bSPaul Traina { 14244099b7bSPaul Traina hash_member **bucketptr; 14344099b7bSPaul Traina unsigned i; 14444099b7bSPaul Traina 14544099b7bSPaul Traina bucketptr = hashtable->table; 14644099b7bSPaul Traina for (i = 0; i < hashtable->size; i++) { 14744099b7bSPaul Traina hashi_FreeMembers(*bucketptr, free_data); 14844099b7bSPaul Traina *bucketptr++ = NULL; 14944099b7bSPaul Traina } 15044099b7bSPaul Traina hashtable->bucketnum = 0; 15144099b7bSPaul Traina hashtable->member = (hashtable->table)[0]; 15244099b7bSPaul Traina } 15344099b7bSPaul Traina 15444099b7bSPaul Traina 15544099b7bSPaul Traina 15644099b7bSPaul Traina /* 15744099b7bSPaul Traina * Generic hash function to calculate a hash code from the given string. 15844099b7bSPaul Traina * 15944099b7bSPaul Traina * For each byte of the string, this function left-shifts the value in an 16044099b7bSPaul Traina * accumulator and then adds the byte into the accumulator. The contents of 16144099b7bSPaul Traina * the accumulator is returned after the entire string has been processed. 16244099b7bSPaul Traina * It is assumed that this result will be used as the "hashcode" parameter in 16344099b7bSPaul Traina * calls to other functions in this package. These functions automatically 16444099b7bSPaul Traina * adjust the hashcode for the size of each hashtable. 16544099b7bSPaul Traina * 16644099b7bSPaul Traina * This algorithm probably works best when the hash table size is a prime 16744099b7bSPaul Traina * number. 16844099b7bSPaul Traina * 16944099b7bSPaul Traina * Hopefully, this function is better than the previous one which returned 17044099b7bSPaul Traina * the sum of the squares of all the bytes. I'm still open to other 17144099b7bSPaul Traina * suggestions for a default hash function. The programmer is more than 17244099b7bSPaul Traina * welcome to supply his/her own hash function as that is one of the design 17344099b7bSPaul Traina * features of this package. 17444099b7bSPaul Traina */ 17544099b7bSPaul Traina 17644099b7bSPaul Traina unsigned 17744099b7bSPaul Traina hash_HashFunction(string, len) 17844099b7bSPaul Traina unsigned char *string; 17944099b7bSPaul Traina register unsigned len; 18044099b7bSPaul Traina { 18144099b7bSPaul Traina register unsigned accum; 18244099b7bSPaul Traina 18344099b7bSPaul Traina accum = 0; 18444099b7bSPaul Traina for (; len > 0; len--) { 18544099b7bSPaul Traina accum <<= 1; 18644099b7bSPaul Traina accum += (unsigned) (*string++ & 0xFF); 18744099b7bSPaul Traina } 18844099b7bSPaul Traina return accum; 18944099b7bSPaul Traina } 19044099b7bSPaul Traina 19144099b7bSPaul Traina 19244099b7bSPaul Traina 19344099b7bSPaul Traina /* 19444099b7bSPaul Traina * Returns TRUE if at least one entry for the given key exists; FALSE 19544099b7bSPaul Traina * otherwise. 19644099b7bSPaul Traina */ 19744099b7bSPaul Traina 19844099b7bSPaul Traina int 19944099b7bSPaul Traina hash_Exists(hashtable, hashcode, compare, key) 20044099b7bSPaul Traina hash_tbl *hashtable; 20144099b7bSPaul Traina unsigned hashcode; 20244099b7bSPaul Traina hash_cmpfp compare; 20344099b7bSPaul Traina hash_datum *key; 20444099b7bSPaul Traina { 20544099b7bSPaul Traina register hash_member *memberptr; 20644099b7bSPaul Traina 20744099b7bSPaul Traina memberptr = (hashtable->table)[hashcode % (hashtable->size)]; 20844099b7bSPaul Traina while (memberptr) { 20944099b7bSPaul Traina if ((*compare) (key, memberptr->data)) { 21044099b7bSPaul Traina return TRUE; /* Entry does exist */ 21144099b7bSPaul Traina } 21244099b7bSPaul Traina memberptr = memberptr->next; 21344099b7bSPaul Traina } 21444099b7bSPaul Traina return FALSE; /* Entry does not exist */ 21544099b7bSPaul Traina } 21644099b7bSPaul Traina 21744099b7bSPaul Traina 21844099b7bSPaul Traina 21944099b7bSPaul Traina /* 22044099b7bSPaul Traina * Insert the data item "element" into the hash table using "hashcode" 22144099b7bSPaul Traina * to determine the bucket number, and "compare" and "key" to determine 22244099b7bSPaul Traina * its uniqueness. 22344099b7bSPaul Traina * 22444099b7bSPaul Traina * If the insertion is successful 0 is returned. If a matching entry 22544099b7bSPaul Traina * already exists in the given bucket of the hash table, or some other error 22644099b7bSPaul Traina * occurs, -1 is returned and the insertion is not done. 22744099b7bSPaul Traina */ 22844099b7bSPaul Traina 22944099b7bSPaul Traina int 23044099b7bSPaul Traina hash_Insert(hashtable, hashcode, compare, key, element) 23144099b7bSPaul Traina hash_tbl *hashtable; 23244099b7bSPaul Traina unsigned hashcode; 23344099b7bSPaul Traina hash_cmpfp compare; 23444099b7bSPaul Traina hash_datum *key, *element; 23544099b7bSPaul Traina { 23644099b7bSPaul Traina hash_member *temp; 23744099b7bSPaul Traina 23844099b7bSPaul Traina hashcode %= hashtable->size; 23944099b7bSPaul Traina if (hash_Exists(hashtable, hashcode, compare, key)) { 24044099b7bSPaul Traina return -1; /* At least one entry already exists */ 24144099b7bSPaul Traina } 24244099b7bSPaul Traina temp = (hash_member *) malloc(sizeof(hash_member)); 24344099b7bSPaul Traina if (!temp) 24444099b7bSPaul Traina return -1; /* malloc failed! */ 24544099b7bSPaul Traina 24644099b7bSPaul Traina temp->data = element; 24744099b7bSPaul Traina temp->next = (hashtable->table)[hashcode]; 24844099b7bSPaul Traina (hashtable->table)[hashcode] = temp; 24944099b7bSPaul Traina return 0; /* Success */ 25044099b7bSPaul Traina } 25144099b7bSPaul Traina 25244099b7bSPaul Traina 25344099b7bSPaul Traina 25444099b7bSPaul Traina /* 25544099b7bSPaul Traina * Delete all data elements which match the given key. If at least one 25644099b7bSPaul Traina * element is found and the deletion is successful, 0 is returned. 25744099b7bSPaul Traina * If no matching elements can be found in the hash table, -1 is returned. 25844099b7bSPaul Traina */ 25944099b7bSPaul Traina 26044099b7bSPaul Traina int 26144099b7bSPaul Traina hash_Delete(hashtable, hashcode, compare, key, free_data) 26244099b7bSPaul Traina hash_tbl *hashtable; 26344099b7bSPaul Traina unsigned hashcode; 26444099b7bSPaul Traina hash_cmpfp compare; 26544099b7bSPaul Traina hash_datum *key; 26644099b7bSPaul Traina hash_freefp free_data; 26744099b7bSPaul Traina { 26844099b7bSPaul Traina hash_member *memberptr, *tempptr; 26944099b7bSPaul Traina hash_member *previous = NULL; 27044099b7bSPaul Traina int retval; 27144099b7bSPaul Traina 27244099b7bSPaul Traina retval = -1; 27344099b7bSPaul Traina hashcode %= hashtable->size; 27444099b7bSPaul Traina 27544099b7bSPaul Traina /* 27644099b7bSPaul Traina * Delete the first member of the list if it matches. Since this moves 27744099b7bSPaul Traina * the second member into the first position we have to keep doing this 27844099b7bSPaul Traina * over and over until it no longer matches. 27944099b7bSPaul Traina */ 28044099b7bSPaul Traina memberptr = (hashtable->table)[hashcode]; 28144099b7bSPaul Traina while (memberptr && (*compare) (key, memberptr->data)) { 28244099b7bSPaul Traina (hashtable->table)[hashcode] = memberptr->next; 28344099b7bSPaul Traina /* 28444099b7bSPaul Traina * Stop hashi_FreeMembers() from deleting the whole list! 28544099b7bSPaul Traina */ 28644099b7bSPaul Traina memberptr->next = NULL; 28744099b7bSPaul Traina hashi_FreeMembers(memberptr, free_data); 28844099b7bSPaul Traina memberptr = (hashtable->table)[hashcode]; 28944099b7bSPaul Traina retval = 0; 29044099b7bSPaul Traina } 29144099b7bSPaul Traina 29244099b7bSPaul Traina /* 29344099b7bSPaul Traina * Now traverse the rest of the list 29444099b7bSPaul Traina */ 29544099b7bSPaul Traina if (memberptr) { 29644099b7bSPaul Traina previous = memberptr; 29744099b7bSPaul Traina memberptr = memberptr->next; 29844099b7bSPaul Traina } 29944099b7bSPaul Traina while (memberptr) { 30044099b7bSPaul Traina if ((*compare) (key, memberptr->data)) { 30144099b7bSPaul Traina tempptr = memberptr; 30244099b7bSPaul Traina previous->next = memberptr = memberptr->next; 30344099b7bSPaul Traina /* 30444099b7bSPaul Traina * Put the brakes on hashi_FreeMembers(). . . . 30544099b7bSPaul Traina */ 30644099b7bSPaul Traina tempptr->next = NULL; 30744099b7bSPaul Traina hashi_FreeMembers(tempptr, free_data); 30844099b7bSPaul Traina retval = 0; 30944099b7bSPaul Traina } else { 31044099b7bSPaul Traina previous = memberptr; 31144099b7bSPaul Traina memberptr = memberptr->next; 31244099b7bSPaul Traina } 31344099b7bSPaul Traina } 31444099b7bSPaul Traina return retval; 31544099b7bSPaul Traina } 31644099b7bSPaul Traina 31744099b7bSPaul Traina 31844099b7bSPaul Traina 31944099b7bSPaul Traina /* 32044099b7bSPaul Traina * Locate and return the data entry associated with the given key. 32144099b7bSPaul Traina * 32244099b7bSPaul Traina * If the data entry is found, a pointer to it is returned. Otherwise, 32344099b7bSPaul Traina * NULL is returned. 32444099b7bSPaul Traina */ 32544099b7bSPaul Traina 32644099b7bSPaul Traina hash_datum * 32744099b7bSPaul Traina hash_Lookup(hashtable, hashcode, compare, key) 32844099b7bSPaul Traina hash_tbl *hashtable; 32944099b7bSPaul Traina unsigned hashcode; 33044099b7bSPaul Traina hash_cmpfp compare; 33144099b7bSPaul Traina hash_datum *key; 33244099b7bSPaul Traina { 33344099b7bSPaul Traina hash_member *memberptr; 33444099b7bSPaul Traina 33544099b7bSPaul Traina memberptr = (hashtable->table)[hashcode % (hashtable->size)]; 33644099b7bSPaul Traina while (memberptr) { 33744099b7bSPaul Traina if ((*compare) (key, memberptr->data)) { 33844099b7bSPaul Traina return (memberptr->data); 33944099b7bSPaul Traina } 34044099b7bSPaul Traina memberptr = memberptr->next; 34144099b7bSPaul Traina } 34244099b7bSPaul Traina return NULL; 34344099b7bSPaul Traina } 34444099b7bSPaul Traina 34544099b7bSPaul Traina 34644099b7bSPaul Traina 34744099b7bSPaul Traina /* 34844099b7bSPaul Traina * Return the next available entry in the hashtable for a linear search 34944099b7bSPaul Traina */ 35044099b7bSPaul Traina 35144099b7bSPaul Traina hash_datum * 35244099b7bSPaul Traina hash_NextEntry(hashtable) 35344099b7bSPaul Traina hash_tbl *hashtable; 35444099b7bSPaul Traina { 35544099b7bSPaul Traina register unsigned bucket; 35644099b7bSPaul Traina register hash_member *memberptr; 35744099b7bSPaul Traina 35844099b7bSPaul Traina /* 35944099b7bSPaul Traina * First try to pick up where we left off. 36044099b7bSPaul Traina */ 36144099b7bSPaul Traina memberptr = hashtable->member; 36244099b7bSPaul Traina if (memberptr) { 36344099b7bSPaul Traina hashtable->member = memberptr->next; /* Set up for next call */ 36444099b7bSPaul Traina return memberptr->data; /* Return the data */ 36544099b7bSPaul Traina } 36644099b7bSPaul Traina /* 36744099b7bSPaul Traina * We hit the end of a chain, so look through the array of buckets 36844099b7bSPaul Traina * until we find a new chain (non-empty bucket) or run out of buckets. 36944099b7bSPaul Traina */ 37044099b7bSPaul Traina bucket = hashtable->bucketnum + 1; 37144099b7bSPaul Traina while ((bucket < hashtable->size) && 37244099b7bSPaul Traina !(memberptr = (hashtable->table)[bucket])) { 37344099b7bSPaul Traina bucket++; 37444099b7bSPaul Traina } 37544099b7bSPaul Traina 37644099b7bSPaul Traina /* 37744099b7bSPaul Traina * Check to see if we ran out of buckets. 37844099b7bSPaul Traina */ 37944099b7bSPaul Traina if (bucket >= hashtable->size) { 38044099b7bSPaul Traina /* 38144099b7bSPaul Traina * Reset to top of table for next call. 38244099b7bSPaul Traina */ 38344099b7bSPaul Traina hashtable->bucketnum = 0; 38444099b7bSPaul Traina hashtable->member = (hashtable->table)[0]; 38544099b7bSPaul Traina /* 38644099b7bSPaul Traina * But return end-of-table indication to the caller this time. 38744099b7bSPaul Traina */ 38844099b7bSPaul Traina return NULL; 38944099b7bSPaul Traina } 39044099b7bSPaul Traina /* 39144099b7bSPaul Traina * Must have found a non-empty bucket. 39244099b7bSPaul Traina */ 39344099b7bSPaul Traina hashtable->bucketnum = bucket; 39444099b7bSPaul Traina hashtable->member = memberptr->next; /* Set up for next call */ 39544099b7bSPaul Traina return memberptr->data; /* Return the data */ 39644099b7bSPaul Traina } 39744099b7bSPaul Traina 39844099b7bSPaul Traina 39944099b7bSPaul Traina 40044099b7bSPaul Traina /* 40144099b7bSPaul Traina * Return the first entry in a hash table for a linear search 40244099b7bSPaul Traina */ 40344099b7bSPaul Traina 40444099b7bSPaul Traina hash_datum * 40544099b7bSPaul Traina hash_FirstEntry(hashtable) 40644099b7bSPaul Traina hash_tbl *hashtable; 40744099b7bSPaul Traina { 40844099b7bSPaul Traina hashtable->bucketnum = 0; 40944099b7bSPaul Traina hashtable->member = (hashtable->table)[0]; 41044099b7bSPaul Traina return hash_NextEntry(hashtable); 41144099b7bSPaul Traina } 41244099b7bSPaul Traina 41344099b7bSPaul Traina /* 41444099b7bSPaul Traina * Local Variables: 41544099b7bSPaul Traina * tab-width: 4 41644099b7bSPaul Traina * c-indent-level: 4 41744099b7bSPaul Traina * c-argdecl-indent: 4 41844099b7bSPaul Traina * c-continued-statement-offset: 4 41944099b7bSPaul Traina * c-continued-brace-offset: -4 42044099b7bSPaul Traina * c-label-offset: -4 42144099b7bSPaul Traina * c-brace-offset: 0 42244099b7bSPaul Traina * End: 42344099b7bSPaul Traina */ 424