/* * hash.c * * Copyright (C) 1995-1997 Peter Mattis, Spencer Kimball and Josh MacDonald * 2003 Bastian Blank * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . */ #include #include #include #include #include typedef struct di_hash_node di_hash_node; /** * @addtogroup di_hash_table * @{ */ /** * @internal * @brief Hash table */ struct di_hash_table { size_t size; /**< the overall size */ size_t nnodes; /**< number of nodes */ di_hash_node **nodes; /**< nodes */ di_mem_chunk *mem_chunk; /**< di_mem_chunk for allocating the nodes (di_hash_node) */ di_hash_func *hash_func; /**< hashing function */ di_equal_func *key_equal_func; /**< key compare function */ di_destroy_notify *key_destroy_func; /**< key destroy function, may NULL */ di_destroy_notify *value_destroy_func; /**< value destroy function, may NULL */ }; /** * @internal * @brief Node of a hash table */ struct di_hash_node { void *key; /**< key */ void *value; /**< value */ di_hash_node *next; /**< the next node */ }; /** * @internal * Defines if a resize is necessary * * @param hash_table a di_hash_table */ #define HASH_TABLE_RESIZE(hash_table) \ if ((hash_table->size >= 3 * hash_table->nnodes && \ hash_table->size > HASH_TABLE_MIN_SIZE) || \ (3 * hash_table->size <= hash_table->nnodes && \ hash_table->size < HASH_TABLE_MAX_SIZE)) \ internal_di_hash_table_resize (hash_table); /** * @internal * The minimal hash table size */ #define HASH_TABLE_MIN_SIZE 11 /** * @internal * The maximal hash table size */ #define HASH_TABLE_MAX_SIZE 13845163 /** * @internal * @param x value * @param low low bound * @param high high bound * * @return a value between low and high */ #define CLAMP(x, low, high) (((x) > (high)) ? (high) : (((x) < (low)) ? (low) : (x))) static void internal_di_hash_table_resize (di_hash_table *hash_table); static di_hash_node **internal_di_hash_table_lookup_node (di_hash_table *hash_table, const void *key); static di_hash_node *internal_di_hash_node_new (di_hash_table *hash_table, void *key, void *value); static void internal_di_hash_node_destroy (di_hash_node *hash_node, di_destroy_notify key_destroy_func, di_destroy_notify value_destroy_func) __attribute__ ((unused)); static void internal_di_hash_nodes_destroy (di_hash_node *hash_node, di_destroy_notify key_destroy_func, di_destroy_notify value_destroy_func); /** @} */ static unsigned int internal_di_spaced_primes_closest (unsigned int num); di_hash_table *di_hash_table_new (di_hash_func hash_func, di_equal_func key_equal_func) { return di_hash_table_new_full (hash_func, key_equal_func, NULL, NULL); } di_hash_table *di_hash_table_new_full (di_hash_func hash_func, di_equal_func key_equal_func, di_destroy_notify key_destroy_func, di_destroy_notify value_destroy_func) { di_hash_table *hash_table; size_t i; hash_table = di_new (di_hash_table, 1); hash_table->size = HASH_TABLE_MIN_SIZE; hash_table->nnodes = 0; hash_table->mem_chunk = di_mem_chunk_new (sizeof (di_hash_node), 4096); hash_table->hash_func = hash_func; hash_table->key_equal_func = key_equal_func; hash_table->key_destroy_func = key_destroy_func; hash_table->value_destroy_func = value_destroy_func; hash_table->nodes = di_new (di_hash_node*, hash_table->size); for (i = 0; i < hash_table->size; i++) hash_table->nodes[i] = NULL; return hash_table; } void di_hash_table_destroy (di_hash_table *hash_table) { size_t i; for (i = 0; i < hash_table->size; i++) internal_di_hash_nodes_destroy (hash_table->nodes[i], hash_table->key_destroy_func, hash_table->value_destroy_func); di_mem_chunk_destroy (hash_table->mem_chunk); di_free (hash_table->nodes); di_free (hash_table); } static inline di_hash_node** internal_di_hash_table_lookup_node (di_hash_table *hash_table, const void *key) { di_hash_node **node; node = &hash_table->nodes [hash_table->hash_func (key) % hash_table->size]; /* Hash table lookup needs to be fast. * We therefore remove the extra conditional of testing * whether to call the key_equal_func or not from * the inner loop. */ if (hash_table->key_equal_func) while (*node && !(*hash_table->key_equal_func) ((*node)->key, key)) node = &(*node)->next; else while (*node && (*node)->key != key) node = &(*node)->next; return node; } void *di_hash_table_lookup (di_hash_table *hash_table, const void *key) { di_hash_node *node; node = *internal_di_hash_table_lookup_node (hash_table, key); return node ? node->value : NULL; } void di_hash_table_insert (di_hash_table *hash_table, void *key, void *value) { di_hash_node **node; node = internal_di_hash_table_lookup_node (hash_table, key); if (*node) { if (hash_table->key_destroy_func) hash_table->key_destroy_func (key); if (hash_table->value_destroy_func) hash_table->value_destroy_func ((*node)->value); (*node)->value = value; } else { *node = internal_di_hash_node_new (hash_table, key, value); hash_table->nnodes++; HASH_TABLE_RESIZE (hash_table); } } static di_hash_node* internal_di_hash_node_new (di_hash_table *hash_table, void *key, void *value) { di_hash_node *hash_node; hash_node = di_mem_chunk_alloc (hash_table->mem_chunk); hash_node->key = key; hash_node->value = value; hash_node->next = NULL; return hash_node; } static void internal_di_hash_node_destroy (di_hash_node *hash_node, di_destroy_notify key_destroy_func, di_destroy_notify value_destroy_func) { if (key_destroy_func) key_destroy_func (hash_node->key); if (value_destroy_func) value_destroy_func (hash_node->value); } static void internal_di_hash_nodes_destroy (di_hash_node *hash_node, di_destroy_notify key_destroy_func, di_destroy_notify value_destroy_func) { if (hash_node) { di_hash_node *node = hash_node; while (node->next) { if (key_destroy_func) key_destroy_func (node->key); if (value_destroy_func) value_destroy_func (node->value); node = node->next; } if (key_destroy_func) key_destroy_func (node->key); if (value_destroy_func) value_destroy_func (node->value); } } void di_hash_table_foreach (di_hash_table *hash_table, di_hfunc *func, void *user_data) { di_hash_node *node; size_t i; for (i = 0; i < hash_table->size; i++) for (node = hash_table->nodes[i]; node; node = node->next) func (node->key, node->value, user_data); } di_ksize_t di_hash_table_size (di_hash_table *hash_table) { return hash_table->nnodes; } static void internal_di_hash_table_resize (di_hash_table *hash_table) { di_hash_node **new_nodes; di_hash_node *node; di_hash_node *next; uint32_t hash_val; size_t new_size; size_t i; new_size = internal_di_spaced_primes_closest (hash_table->nnodes); new_size = CLAMP (new_size, HASH_TABLE_MIN_SIZE, HASH_TABLE_MAX_SIZE); new_nodes = di_new0 (di_hash_node*, new_size); for (i = 0; i < hash_table->size; i++) for (node = hash_table->nodes[i]; node; node = next) { next = node->next; hash_val = (* hash_table->hash_func) (node->key) % new_size; node->next = new_nodes[hash_val]; new_nodes[hash_val] = node; } di_free (hash_table->nodes); hash_table->nodes = new_nodes; hash_table->size = new_size; } static const unsigned int internal_di_primes[] = { 11, 19, 37, 73, 109, 163, 251, 367, 557, 823, 1237, 1861, 2777, 4177, 6247, 9371, 14057, 21089, 31627, 47431, 71143, 106721, 160073, 240101, 360163, 540217, 810343, 1215497, 1823231, 2734867, 4102283, 6153409, 9230113, 13845163, }; static const unsigned int internal_di_nprimes = sizeof (internal_di_primes) / sizeof (internal_di_primes[0]); static unsigned int internal_di_spaced_primes_closest (unsigned int num) { unsigned int i; for (i = 0; i < internal_di_nprimes; i++) if (internal_di_primes[i] > num) return internal_di_primes[i]; return internal_di_primes[internal_di_nprimes - 1]; }