/* * Copyright 2011 Steven Gribble * * This file is part of the UW CSE 333 course project sequence * (333proj). * * 333proj is free software: you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * 333proj is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with 333proj. If not, see . */ #ifndef HW1_HASHTABLE_H_ #define HW1_HASHTABLE_H_ #include // for bool, true, false #include // so we can use uint64_t, etc. // A HashTable is a simple chained hash table with a static number of buckets. // We provide the interface; your job is to provide the implementation. // // To hide the implementation of HashTable, we declare the "struct htrec" // structure here, but we define the structure in the internal header // HashTable_priv.h. This lets us define a pointer to the HashTableRecord as // a new "HashTable" type, but leave the implementation details of HashTable // opaque to the customer. struct htrec; typedef struct htrec *HashTable; // When freeing a HashTable, customers need to pass a pointer to a function // that frees the payload. The pointed-to function is invoked once for each // value in the HashTable. typedef void(*ValueFreeFnPtr)(void *value); // Allocate and return a new HashTable. // // Arguments: // // - num_buckets: the number of buckets the hash table should // initially contain. Remember that this is a chained hash // table, so as the load factor approaches 1, linked lists hanging // off of each bucket will start to grow. This implementation // will dynamically resize the hashtable when the load factor // exceeds 3. It will multiple the number of buckets in the // hashtable by 3, so that post-resize load factor is 1/3. // // Returns NULL on error, non-NULL on success. HashTable AllocateHashTable(uint32_t num_buckets); // Free a HashTable. // // Arguments: // // - table: the HashTable to free. It is unsafe to use table // after this function returns. // // - value_free_function: this argument is a pointer to a value // freeing function; see above for details. void FreeHashTable(HashTable table, ValueFreeFnPtr value_free_function); // Figure out the number of elements in the hash table. // // Arguments: // // - table: the table to query // // Returns: // // - table size (>=0); note that this is an unsigned 64-bit integer. uint64_t NumElementsInHashTable(HashTable table); // HashTables store key/value pairs. We'll define a key to be an // unsigned 64-bit integer; it's up to the customer to figure out how // to produce an appropriate hash key, but below we provide an // implementation of FNV hashing to help them out. We'll define // a value to be a (void *), so that customers can pass in pointers to // arbitrary structs as values, but of course we have to worry about // memory management as a side-effect. typedef uint64_t HTKey_t; // hash table key type typedef void* HTValue_t; // hash table value type typedef struct { HTKey_t key; // the key in the key/value pair HTValue_t value; // the value in the key/value pair } HTKeyValue, *HTKeyValuePtr; // This is an implementation of FNV hashing. Customers // can use it to hash an arbitrary sequence of bytes into // a 64-bit key suitable for using as a hash key. // // If you're curious, you can read about FNV hashing here: // // http://en.wikipedia.org/wiki/Fowler–Noll–Vo_hash_function // // Arguments: // // - buffer: a pointer to a len-size buffer of unsigned chars // // - len: how many bytes are in the buffer // // Returns: // // - a nicely distributed 64-bit hash value suitable for // use in a HTKeyValue uint64_t FNVHash64(unsigned char *buffer, unsigned int len); // This is a convenience routine to produce a nice, evenly // distributed 64-bit hash key from a potentially poorly // distributed 64 bit number. It uses FNVHash64 to get its // job done. // // Arguments: // // - hashme: a 64-bit integer to hash // // Returns: // // - a nicely distributed 64-bit hash value suitable for // use in a HTKeyValue uint64_t FNVHashInt64(uint64_t hashme); // Inserts a key,value pair into the HashTable. // // Arguments: // // - table: the HashTable to insert into // // - newkeyvalue: the HTKeyValue to insert into the table // // - oldkeyval: if the key in newkeyvalue is already present // in the HashTable, that old key/value is replaced with // newkeyvalue. In that case, the old key/value is returned via // this return parameter to the caller. It's up to the caller // to free any allocated memory associated with oldkeyvalue->value. // // Returns: // // - 0 on failure (e.g., out of memory) // // - +1 if the newkeyvalue was inserted and there was no // existing key/value with that key // // - +2 if the newkeyvalue was inserted and an old key/value // with the same key was replaced and returned through // the oldkeyval return parameter. In this case, the caller assumes // ownership of oldkeyvalue. int InsertHashTable(HashTable table, HTKeyValue newkeyvalue, HTKeyValue *oldkeyvalue); // Looks up a key in the HashTable, and if it is // present, returns the key/value associated with it. // // Arguments: // // - table: the HashTable to look in // // - key: the key to look up // // - keyvalue: if the key is present, a copy of the key/value is // returned to the caller via this return parameter. Note that the // key/value is left in the HashTable, so it is not safe for the // caller to free keyvalue->value. // // Returns: // // - -1 if there was an error (e.g., out of memory) // // - 0 if the key wasn't found in the HashTable // // - +1 if the key was found, and therefore the associated key/value // was returned to the caller via that keyvalue return parameter. int LookupHashTable(HashTable table, uint64_t key, HTKeyValue *keyvalue); // Removes a key/value from the HashTable and returns it to the // caller. // // Arguments: // // - table: the HashTable to look in // // - key: the key to look up // // - keyvalue: if the key is present, a copy of key/value is returned // to the caller via this return parameter and the key/value is // removed from the HashTable. Note that the caller is responsible // for managing the memory associated with keyvalue->value from // this point on. // // Returns: // - -1 on error (e.g., out of memory) // // - 0 if the key wasn't found in the HashTable // // - +1 if the key was found, and therefore (a) the associated // key/value was returned to the caller via that keyvalue return // parameter, and (b) that key/value was removed from the // HashTable. int RemoveFromHashTable(HashTable table, uint64_t key, HTKeyValue *keyvalue); // HashTables support the notion of an iterator, similar to // Java iterators. You use an iterator to iterate forward // through the HashTable. The order in which the iterator // goes through the HashTable is undefined, and not necessarily // deterministic; all that is promised is that each key/value // is visited exactly once. Also, if the customer uses a // HashTable function to mutate the hash table, any existing // iterators become dangerous to use and should be freed. struct ht_itrec; typedef struct ht_itrec *HTIter; // same trick to hide implementation. // Manufacture an iterator for the table. If there are // elements in the hash table, the iterator is initialized // to point at the "first" one. If there are no elements // in the hash table, the iterator is unusable and // // Arguments: // // - table: the table from which to return an iterator // // Returns NULL on failure, non-NULL on success. HTIter HashTableMakeIterator(HashTable table); // When you're done with a hash table iterator, you need to free it // by calling this function. // // Arguments: // // - iter: the iterator to free. It is not safe to use // the iterator after freeing it. void HTIteratorFree(HTIter iter); // Move the iterator to the next element of the table. // // Arguments: // // - iter: the iterator to move // // Returns: // // - +1 on success // // - 0 if the iterator cannot be moved forward to the next // valid element, either because the table is empty, or // because the iterator (after moving it forward) is past the // end of the table. In either case, the iterator is no // longer usable. int HTIteratorNext(HTIter iter); // Tests to see whether the iterator is past the end // of the table. // // Arguments: // // - iter: the iterator to test // // Returns: // // - +1 if iter is past the end of the table or the table is empty. // // - 0 if iter is not at the end of the table (and therefore // the table is non-empty). int HTIteratorPastEnd(HTIter iter); // Returns a copy of the key/value that the iterator is currently // pointing at. // // Arguments: // // - iter: the iterator to fetch the key/value from // // - keyvalue: a return parameter through which the key/value // is returned. // // Returns: // // - 0 if the iterator is not valid or the table is empty // // - +1 on success. int HTIteratorGet(HTIter iter, HTKeyValue *keyvalue); // Returns a copy of key/value that the iterator is currently // pointing at, and removes that key/value from the // hashtable. The caller assumes ownership of any memory // pointed to by the value. As well, this advances // the iterator to the next element in the hashtable. // // Arguments: // // - iter: the iterator to fetch the key/value from // // - keyvalue: a return parameter through which the key/value // is returned. // // Returns: // // - 0 if the iterator is not valid or the table is empty // // - +1 on success, and the iterator is still valid. // // - +2 on success, but the iterator is now invalid because // it has advanced past the end of the hash table. int HTIteratorDelete(HTIter iter, HTKeyValue *keyvalue); #endif // HW1_HASHTABLE_H_