/* -*- coding: utf-8 -*- * ---------------------------------------------------------------------- * Copyright © 2011-2013, RedJack, LLC. * All rights reserved. * * Please see the COPYING file in this distribution for license * details. * ---------------------------------------------------------------------- */ #include #include #include "libcork/core/callbacks.h" #include "libcork/core/hash.h" #include "libcork/core/mempool.h" #include "libcork/core/types.h" #include "libcork/ds/dllist.h" #include "libcork/ds/hash-table.h" #include "libcork/helpers/errors.h" #ifndef CORK_HASH_TABLE_DEBUG #define CORK_HASH_TABLE_DEBUG 0 #endif #if CORK_HASH_TABLE_DEBUG #include #define DEBUG(...) \ do { \ fprintf(stderr, __VA_ARGS__); \ fprintf(stderr, "\n"); \ } while (0) #else #define DEBUG(...) /* nothing */ #endif /*----------------------------------------------------------------------- * Hash tables */ struct cork_hash_table_entry_priv { struct cork_hash_table_entry public; struct cork_dllist_item in_bucket; struct cork_dllist_item insertion_order; }; struct cork_hash_table { struct cork_dllist *bins; struct cork_dllist insertion_order; size_t bin_count; size_t bin_mask; size_t entry_count; struct cork_mempool *pool; void *user_data; cork_free_f free_user_data; cork_hash_f hash; cork_equals_f equals; cork_free_f free_key; cork_free_f free_value; }; static cork_hash cork_hash_table__default_hash(void *user_data, const void *key) { return (cork_hash) (uintptr_t) key; } static bool cork_hash_table__default_equals(void *user_data, const void *key1, const void *key2) { return key1 == key2; } /* The default initial number of bins to allocate in a new table. */ #define CORK_HASH_TABLE_DEFAULT_INITIAL_SIZE 8 /* The default number of entries per bin to allow before increasing the * number of bins. */ #define CORK_HASH_TABLE_MAX_DENSITY 5 /* Return a power-of-2 bin count that's at least as big as the given requested * size. */ static inline size_t cork_hash_table_new_size(size_t desired_count) { size_t v = desired_count; size_t r = 1; while (v >>= 1) { r <<= 1; } if (r != desired_count) { r <<= 1; } return r; } #define bin_index(table, hash) ((hash) & (table)->bin_mask) /* Allocates a new bins array in a hash table. We overwrite the old * array, so make sure to stash it away somewhere safe first. */ static void cork_hash_table_allocate_bins(struct cork_hash_table *table, size_t desired_count) { size_t i; table->bin_count = cork_hash_table_new_size(desired_count); table->bin_mask = table->bin_count - 1; DEBUG("Allocate %zu bins", table->bin_count); table->bins = cork_calloc(table->bin_count, sizeof(struct cork_dllist)); for (i = 0; i < table->bin_count; i++) { cork_dllist_init(&table->bins[i]); } } static struct cork_hash_table_entry_priv * cork_hash_table_new_entry(struct cork_hash_table *table, cork_hash hash, void *key, void *value) { struct cork_hash_table_entry_priv *entry = cork_mempool_new_object(table->pool); cork_dllist_add(&table->insertion_order, &entry->insertion_order); entry->public.hash = hash; entry->public.key = key; entry->public.value = value; return entry; } static void cork_hash_table_free_entry(struct cork_hash_table *table, struct cork_hash_table_entry_priv *entry) { if (table->free_key != NULL) { table->free_key(entry->public.key); } if (table->free_value != NULL) { table->free_value(entry->public.value); } cork_dllist_remove(&entry->insertion_order); cork_mempool_free_object(table->pool, entry); } struct cork_hash_table * cork_hash_table_new(size_t initial_size, unsigned int flags) { struct cork_hash_table *table = cork_new(struct cork_hash_table); table->entry_count = 0; table->user_data = NULL; table->free_user_data = NULL; table->hash = cork_hash_table__default_hash; table->equals = cork_hash_table__default_equals; table->free_key = NULL; table->free_value = NULL; table->pool = cork_mempool_new(struct cork_hash_table_entry_priv); cork_dllist_init(&table->insertion_order); if (initial_size < CORK_HASH_TABLE_DEFAULT_INITIAL_SIZE) { initial_size = CORK_HASH_TABLE_DEFAULT_INITIAL_SIZE; } cork_hash_table_allocate_bins(table, initial_size); return table; } void cork_hash_table_clear(struct cork_hash_table *table) { size_t i; struct cork_dllist_item *curr; struct cork_dllist_item *next; DEBUG("(clear) Remove all entries"); for (curr = cork_dllist_start(&table->insertion_order); !cork_dllist_is_end(&table->insertion_order, curr); curr = next) { struct cork_hash_table_entry_priv *entry = cork_container_of (curr, struct cork_hash_table_entry_priv, insertion_order); next = curr->next; cork_hash_table_free_entry(table, entry); } cork_dllist_init(&table->insertion_order); DEBUG("(clear) Clear bins"); for (i = 0; i < table->bin_count; i++) { DEBUG(" Bin %zu", i); cork_dllist_init(&table->bins[i]); } table->entry_count = 0; } void cork_hash_table_free(struct cork_hash_table *table) { cork_hash_table_clear(table); cork_mempool_free(table->pool); free(table->bins); free(table); } size_t cork_hash_table_size(const struct cork_hash_table *table) { return table->entry_count; } void cork_hash_table_set_user_data(struct cork_hash_table *table, void *user_data, cork_free_f free_user_data) { table->user_data = user_data; table->free_user_data = free_user_data; } void cork_hash_table_set_hash(struct cork_hash_table *table, cork_hash_f hash) { table->hash = hash; } void cork_hash_table_set_equals(struct cork_hash_table *table, cork_equals_f equals) { table->equals = equals; } void cork_hash_table_set_free_key(struct cork_hash_table *table, cork_free_f free) { table->free_key = free; } void cork_hash_table_set_free_value(struct cork_hash_table *table, cork_free_f free) { table->free_value = free; } void cork_hash_table_ensure_size(struct cork_hash_table *table, size_t desired_count) { if (desired_count > table->bin_count) { struct cork_dllist *old_bins = table->bins; size_t old_bin_count = table->bin_count; cork_hash_table_allocate_bins(table, desired_count); if (old_bins != NULL) { size_t i; for (i = 0; i < old_bin_count; i++) { struct cork_dllist *bin = &old_bins[i]; struct cork_dllist_item *curr = cork_dllist_start(bin); while (!cork_dllist_is_end(bin, curr)) { struct cork_hash_table_entry_priv *entry = cork_container_of (curr, struct cork_hash_table_entry_priv, in_bucket); struct cork_dllist_item *next = curr->next; size_t bin_index = bin_index(table, entry->public.hash); DEBUG(" Rehash %p from bin %zu to bin %zu", entry, i, bin_index); cork_dllist_add(&table->bins[bin_index], curr); curr = next; } } free(old_bins); } } } static void cork_hash_table_rehash(struct cork_hash_table *table) { DEBUG(" Reached maximum density; rehash"); cork_hash_table_ensure_size(table, table->bin_count + 1); } struct cork_hash_table_entry * cork_hash_table_get_entry_hash(const struct cork_hash_table *table, cork_hash hash, const void *key) { size_t bin_index; struct cork_dllist *bin; struct cork_dllist_item *curr; if (table->bin_count == 0) { DEBUG("(get) Empty table when searching for key %p " "(hash 0x%08" PRIx32 ")", key, hash); return NULL; } bin_index = bin_index(table, hash); DEBUG("(get) Search for key %p (hash 0x%08" PRIx32 ", bin %zu)", key, hash, bin_index); bin = &table->bins[bin_index]; curr = cork_dllist_start(bin); while (!cork_dllist_is_end(bin, curr)) { struct cork_hash_table_entry_priv *entry = cork_container_of (curr, struct cork_hash_table_entry_priv, in_bucket); DEBUG(" Check entry %p", entry); if (table->equals(table->user_data, key, entry->public.key)) { DEBUG(" Match"); return &entry->public; } curr = curr->next; } DEBUG(" Entry not found"); return NULL; } struct cork_hash_table_entry * cork_hash_table_get_entry(const struct cork_hash_table *table, const void *key) { cork_hash hash = table->hash(table->user_data, key); return cork_hash_table_get_entry_hash(table, hash, key); } void * cork_hash_table_get_hash(const struct cork_hash_table *table, cork_hash hash, const void *key) { struct cork_hash_table_entry *entry = cork_hash_table_get_entry_hash(table, hash, key); if (entry == NULL) { return NULL; } else { DEBUG(" Extract value pointer %p", entry->value); return entry->value; } } void * cork_hash_table_get(const struct cork_hash_table *table, const void *key) { struct cork_hash_table_entry *entry = cork_hash_table_get_entry(table, key); if (entry == NULL) { return NULL; } else { DEBUG(" Extract value pointer %p", entry->value); return entry->value; } } struct cork_hash_table_entry * cork_hash_table_get_or_create_hash(struct cork_hash_table *table, cork_hash hash, void *key, bool *is_new) { struct cork_hash_table_entry_priv *entry; size_t bin_index; if (table->bin_count > 0) { struct cork_dllist *bin; struct cork_dllist_item *curr; bin_index = bin_index(table, hash); DEBUG("(get_or_create) Search for key %p " "(hash 0x%08" PRIx32 ", bin %zu)", key, hash, bin_index); bin = &table->bins[bin_index]; curr = cork_dllist_start(bin); while (!cork_dllist_is_end(bin, curr)) { struct cork_hash_table_entry_priv *entry = cork_container_of (curr, struct cork_hash_table_entry_priv, in_bucket); DEBUG(" Check entry %p", entry); if (table->equals(table->user_data, key, entry->public.key)) { DEBUG(" Match"); DEBUG(" Return value pointer %p", entry->public.value); *is_new = false; return &entry->public; } curr = curr->next; } /* create a new entry */ DEBUG(" Entry not found"); if ((table->entry_count / table->bin_count) > CORK_HASH_TABLE_MAX_DENSITY) { cork_hash_table_rehash(table); bin_index = bin_index(table, hash); } } else { DEBUG("(get_or_create) Search for key %p (hash 0x%08" PRIx32 ")", key, hash); DEBUG(" Empty table"); cork_hash_table_rehash(table); bin_index = bin_index(table, hash); } DEBUG(" Allocate new entry"); entry = cork_hash_table_new_entry(table, hash, key, NULL); DEBUG(" Created new entry %p", entry); DEBUG(" Add entry into bin %zu", bin_index); cork_dllist_add(&table->bins[bin_index], &entry->in_bucket); table->entry_count++; *is_new = true; return &entry->public; } struct cork_hash_table_entry * cork_hash_table_get_or_create(struct cork_hash_table *table, void *key, bool *is_new) { cork_hash hash = table->hash(table->user_data, key); return cork_hash_table_get_or_create_hash(table, hash, key, is_new); } void cork_hash_table_put_hash(struct cork_hash_table *table, cork_hash hash, void *key, void *value, bool *is_new, void **old_key, void **old_value) { struct cork_hash_table_entry_priv *entry; size_t bin_index; if (table->bin_count > 0) { struct cork_dllist *bin; struct cork_dllist_item *curr; bin_index = bin_index(table, hash); DEBUG("(put) Search for key %p (hash 0x%08" PRIx32 ", bin %zu)", key, hash, bin_index); bin = &table->bins[bin_index]; curr = cork_dllist_start(bin); while (!cork_dllist_is_end(bin, curr)) { struct cork_hash_table_entry_priv *entry = cork_container_of (curr, struct cork_hash_table_entry_priv, in_bucket); DEBUG(" Check entry %p", entry); if (table->equals(table->user_data, key, entry->public.key)) { DEBUG(" Found existing entry; overwriting"); DEBUG(" Return old key %p", entry->public.key); if (old_key != NULL) { *old_key = entry->public.key; } DEBUG(" Return old value %p", entry->public.value); if (old_value != NULL) { *old_value = entry->public.value; } DEBUG(" Copy key %p into entry", key); entry->public.key = key; DEBUG(" Copy value %p into entry", value); entry->public.value = value; if (is_new != NULL) { *is_new = false; } return; } curr = curr->next; } /* create a new entry */ DEBUG(" Entry not found"); if ((table->entry_count / table->bin_count) > CORK_HASH_TABLE_MAX_DENSITY) { cork_hash_table_rehash(table); bin_index = bin_index(table, hash); } } else { DEBUG("(put) Search for key %p (hash 0x%08" PRIx32 ")", key, hash); DEBUG(" Empty table"); cork_hash_table_rehash(table); bin_index = bin_index(table, hash); } DEBUG(" Allocate new entry"); entry = cork_hash_table_new_entry(table, hash, key, value); DEBUG(" Created new entry %p", entry); DEBUG(" Add entry into bin %zu", bin_index); cork_dllist_add(&table->bins[bin_index], &entry->in_bucket); table->entry_count++; if (old_key != NULL) { *old_key = NULL; } if (old_value != NULL) { *old_value = NULL; } if (is_new != NULL) { *is_new = true; } } void cork_hash_table_put(struct cork_hash_table *table, void *key, void *value, bool *is_new, void **old_key, void **old_value) { cork_hash hash = table->hash(table->user_data, key); cork_hash_table_put_hash (table, hash, key, value, is_new, old_key, old_value); } void cork_hash_table_delete_entry(struct cork_hash_table *table, struct cork_hash_table_entry *ventry) { struct cork_hash_table_entry_priv *entry = cork_container_of(ventry, struct cork_hash_table_entry_priv, public); cork_dllist_remove(&entry->in_bucket); table->entry_count--; cork_hash_table_free_entry(table, entry); } bool cork_hash_table_delete_hash(struct cork_hash_table *table, cork_hash hash, const void *key, void **deleted_key, void **deleted_value) { size_t bin_index; struct cork_dllist *bin; struct cork_dllist_item *curr; if (table->bin_count == 0) { DEBUG("(delete) Empty table when searching for key %p " "(hash 0x%08" PRIx32 ")", key, hash); return false; } bin_index = bin_index(table, hash); DEBUG("(delete) Search for key %p (hash 0x%08" PRIx32 ", bin %zu)", key, hash, bin_index); bin = &table->bins[bin_index]; curr = cork_dllist_start(bin); while (!cork_dllist_is_end(bin, curr)) { struct cork_hash_table_entry_priv *entry = cork_container_of (curr, struct cork_hash_table_entry_priv, in_bucket); DEBUG(" Check entry %p", entry); if (table->equals(table->user_data, key, entry->public.key)) { DEBUG(" Match"); if (deleted_key != NULL) { *deleted_key = entry->public.key; } if (deleted_value != NULL) { *deleted_value = entry->public.value; } DEBUG(" Remove entry from hash bin %zu", bin_index); cork_dllist_remove(curr); table->entry_count--; DEBUG(" Free entry %p", entry); cork_hash_table_free_entry(table, entry); return true; } curr = curr->next; } DEBUG(" Entry not found"); return false; } bool cork_hash_table_delete(struct cork_hash_table *table, const void *key, void **deleted_key, void **deleted_value) { cork_hash hash = table->hash(table->user_data, key); return cork_hash_table_delete_hash (table, hash, key, deleted_key, deleted_value); } void cork_hash_table_map(struct cork_hash_table *table, void *user_data, cork_hash_table_map_f map) { struct cork_dllist_item *curr; DEBUG("Map across hash table"); curr = cork_dllist_start(&table->insertion_order); while (!cork_dllist_is_end(&table->insertion_order, curr)) { struct cork_hash_table_entry_priv *entry = cork_container_of (curr, struct cork_hash_table_entry_priv, insertion_order); struct cork_dllist_item *next = curr->next; enum cork_hash_table_map_result result; DEBUG(" Apply function to entry %p", entry); result = map(user_data, &entry->public); if (result == CORK_HASH_TABLE_MAP_ABORT) { return; } else if (result == CORK_HASH_TABLE_MAP_DELETE) { DEBUG(" Delete requested"); cork_dllist_remove(curr); table->entry_count--; cork_hash_table_free_entry(table, entry); } curr = next; } } void cork_hash_table_iterator_init(struct cork_hash_table *table, struct cork_hash_table_iterator *iterator) { DEBUG("Iterate through hash table"); iterator->table = table; iterator->priv = cork_dllist_start(&table->insertion_order); } struct cork_hash_table_entry * cork_hash_table_iterator_next(struct cork_hash_table_iterator *iterator) { struct cork_hash_table *table = iterator->table; struct cork_dllist_item *curr = iterator->priv; struct cork_hash_table_entry_priv *entry; if (cork_dllist_is_end(&table->insertion_order, curr)) { return NULL; } entry = cork_container_of (curr, struct cork_hash_table_entry_priv, insertion_order); DEBUG(" Return entry %p", entry); iterator->priv = curr->next; return &entry->public; } /*----------------------------------------------------------------------- * Built-in key types */ static cork_hash string_hash(void *user_data, const void *vk) { const char *k = vk; size_t len = strlen(k); return cork_hash_buffer(0, k, len); } static bool string_equals(void *user_data, const void *vk1, const void *vk2) { const char *k1 = vk1; const char *k2 = vk2; return strcmp(k1, k2) == 0; } struct cork_hash_table * cork_string_hash_table_new(size_t initial_size, unsigned int flags) { struct cork_hash_table *table = cork_hash_table_new(initial_size, flags); cork_hash_table_set_hash(table, string_hash); cork_hash_table_set_equals(table, string_equals); return table; } struct cork_hash_table * cork_pointer_hash_table_new(size_t initial_size, unsigned int flags) { return cork_hash_table_new(initial_size, flags); }