mirror of
git://sourceware.org/git/valgrind.git
synced 2026-01-12 00:19:31 +08:00
- Update COPYING and VEX/LICENSE.GPL to version 3. - Update README, NEWS, docs/manual license and contributing text. - Update file headers to say either version 3 of the License, or (at your option) any later version. - Leave tests and perf file headers as is, unless the code is derived from Valgrind/VEX. - Leave valgrind.h, cachegrind.h, callgrind.h, drd.h, helgrind.h, memcheck.h and dhat.h Hybrid-BSD licensed.
435 lines
14 KiB
C
435 lines
14 KiB
C
|
|
/*--------------------------------------------------------------------*/
|
|
/*--- A separately-chained hash table. m_hashtable.c ---*/
|
|
/*--------------------------------------------------------------------*/
|
|
|
|
/*
|
|
This file is part of Valgrind, a dynamic binary instrumentation
|
|
framework.
|
|
|
|
Copyright (C) 2005-2017 Nicholas Nethercote
|
|
njn@valgrind.org
|
|
|
|
This program is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU General Public License as
|
|
published by the Free Software Foundation; either version 3 of the
|
|
License, or (at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful, but
|
|
WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, see <http://www.gnu.org/licenses/>.
|
|
|
|
The GNU General Public License is contained in the file COPYING.
|
|
*/
|
|
|
|
#include "pub_core_basics.h"
|
|
#include "pub_core_debuglog.h"
|
|
#include "pub_core_hashtable.h"
|
|
#include "pub_core_libcassert.h"
|
|
#include "pub_core_libcbase.h"
|
|
#include "pub_core_libcprint.h"
|
|
#include "pub_core_mallocfree.h"
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/*--- Declarations ---*/
|
|
/*--------------------------------------------------------------------*/
|
|
|
|
#define CHAIN_NO(key,tbl) (((UWord)(key)) % tbl->n_chains)
|
|
|
|
struct _VgHashTable {
|
|
UInt n_chains; // should be prime
|
|
UInt n_elements;
|
|
VgHashNode* iterNode; // current iterator node
|
|
UInt iterChain; // next chain to be traversed by the iterator
|
|
Bool iterOK; // table safe to iterate over?
|
|
VgHashNode** chains; // expanding array of hash chains
|
|
const HChar* name; // name of table (for debugging only)
|
|
};
|
|
|
|
#define N_HASH_PRIMES 20
|
|
|
|
static const SizeT primes[N_HASH_PRIMES] = {
|
|
769UL, 1543UL, 3079UL, 6151UL,
|
|
12289UL, 24593UL, 49157UL, 98317UL,
|
|
196613UL, 393241UL, 786433UL, 1572869UL,
|
|
3145739UL, 6291469UL, 12582917UL, 25165843UL,
|
|
50331653UL, 100663319UL, 201326611UL, 402653189UL
|
|
};
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/*--- Functions ---*/
|
|
/*--------------------------------------------------------------------*/
|
|
|
|
VgHashTable *VG_(HT_construct) ( const HChar* name )
|
|
{
|
|
/* Initialises to zero, ie. all entries NULL */
|
|
SizeT n_chains = primes[0];
|
|
SizeT sz = n_chains * sizeof(VgHashNode*);
|
|
VgHashTable *table = VG_(calloc)("hashtable.Hc.1",
|
|
1, sizeof(struct _VgHashTable));
|
|
table->chains = VG_(calloc)("hashtable.Hc.2", 1, sz);
|
|
table->n_chains = n_chains;
|
|
table->n_elements = 0;
|
|
table->iterOK = True;
|
|
table->name = name;
|
|
vg_assert(name);
|
|
return table;
|
|
}
|
|
|
|
UInt VG_(HT_count_nodes) ( const VgHashTable *table )
|
|
{
|
|
return table->n_elements;
|
|
}
|
|
|
|
static void resize ( VgHashTable *table )
|
|
{
|
|
Int i;
|
|
SizeT sz;
|
|
SizeT old_chains = table->n_chains;
|
|
SizeT new_chains = old_chains + 1;
|
|
VgHashNode** chains;
|
|
VgHashNode * node;
|
|
|
|
/* If we've run out of primes, do nothing. */
|
|
if (old_chains == primes[N_HASH_PRIMES-1])
|
|
return;
|
|
|
|
vg_assert(old_chains >= primes[0]
|
|
&& old_chains < primes[N_HASH_PRIMES-1]);
|
|
|
|
for (i = 0; i < N_HASH_PRIMES; i++) {
|
|
if (primes[i] > new_chains) {
|
|
new_chains = primes[i];
|
|
break;
|
|
}
|
|
}
|
|
|
|
vg_assert(new_chains > old_chains);
|
|
vg_assert(new_chains > primes[0]
|
|
&& new_chains <= primes[N_HASH_PRIMES-1]);
|
|
|
|
VG_(debugLog)(
|
|
1, "hashtable",
|
|
"resizing table `%s' from %lu to %lu (total elems %lu)\n",
|
|
table->name, (UWord)old_chains, (UWord)new_chains,
|
|
(UWord)table->n_elements );
|
|
|
|
table->n_chains = new_chains;
|
|
sz = new_chains * sizeof(VgHashNode*);
|
|
chains = VG_(calloc)("hashtable.resize.1", 1, sz);
|
|
|
|
for (i = 0; i < old_chains; i++) {
|
|
node = table->chains[i];
|
|
while (node != NULL) {
|
|
VgHashNode* next = node->next;
|
|
UWord chain = CHAIN_NO(node->key, table);
|
|
node->next = chains[chain];
|
|
chains[chain] = node;
|
|
node = next;
|
|
}
|
|
}
|
|
|
|
VG_(free)(table->chains);
|
|
table->chains = chains;
|
|
}
|
|
|
|
/* Puts a new, heap allocated VgHashNode, into the VgHashTable. Prepends
|
|
the node to the appropriate chain. No duplicate key detection is done. */
|
|
void VG_(HT_add_node) ( VgHashTable *table, void* vnode )
|
|
{
|
|
VgHashNode* node = (VgHashNode*)vnode;
|
|
UWord chain = CHAIN_NO(node->key, table);
|
|
node->next = table->chains[chain];
|
|
table->chains[chain] = node;
|
|
table->n_elements++;
|
|
if ( (1 * (ULong)table->n_elements) > (1 * (ULong)table->n_chains) ) {
|
|
resize(table);
|
|
}
|
|
|
|
/* Table has been modified; hence HT_Next should assert. */
|
|
table->iterOK = False;
|
|
}
|
|
|
|
/* Looks up a VgHashNode by key in the table. Returns NULL if not found. */
|
|
void* VG_(HT_lookup) ( const VgHashTable *table, UWord key )
|
|
{
|
|
VgHashNode* curr = table->chains[ CHAIN_NO(key, table) ];
|
|
|
|
while (curr) {
|
|
if (key == curr->key) {
|
|
return curr;
|
|
}
|
|
curr = curr->next;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/* Looks up a VgHashNode by node in the table. Returns NULL if not found.
|
|
GEN!!! marks the lines that differs from VG_(HT_lookup). */
|
|
void* VG_(HT_gen_lookup) ( const VgHashTable *table, const void* node,
|
|
HT_Cmp_t cmp )
|
|
{
|
|
const VgHashNode* hnode = node; // GEN!!!
|
|
VgHashNode* curr = table->chains[ CHAIN_NO(hnode->key, table) ]; // GEN!!!
|
|
|
|
while (curr) {
|
|
if (hnode->key == curr->key && cmp (hnode, curr) == 0) { // GEN!!!
|
|
return curr;
|
|
}
|
|
curr = curr->next;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/* Removes a VgHashNode from the table. Returns NULL if not found. */
|
|
void* VG_(HT_remove) ( VgHashTable *table, UWord key )
|
|
{
|
|
UWord chain = CHAIN_NO(key, table);
|
|
VgHashNode* curr = table->chains[chain];
|
|
VgHashNode** prev_next_ptr = &(table->chains[chain]);
|
|
|
|
/* Table has been modified; hence HT_Next should assert. */
|
|
table->iterOK = False;
|
|
|
|
while (curr) {
|
|
if (key == curr->key) {
|
|
*prev_next_ptr = curr->next;
|
|
table->n_elements--;
|
|
return curr;
|
|
}
|
|
prev_next_ptr = &(curr->next);
|
|
curr = curr->next;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/* Removes a VgHashNode by node from the table. Returns NULL if not found.
|
|
GEN!!! marks the lines that differs from VG_(HT_remove). */
|
|
void* VG_(HT_gen_remove) ( VgHashTable *table, const void* node, HT_Cmp_t cmp )
|
|
{
|
|
const VgHashNode* hnode = node; // GEN!!!
|
|
UWord chain = CHAIN_NO(hnode->key, table); // GEN!!!
|
|
VgHashNode* curr = table->chains[chain];
|
|
VgHashNode** prev_next_ptr = &(table->chains[chain]);
|
|
|
|
/* Table has been modified; hence HT_Next should assert. */
|
|
table->iterOK = False;
|
|
|
|
while (curr) {
|
|
if (hnode->key == curr->key && cmp(hnode, curr) == 0) { // GEN!!!
|
|
*prev_next_ptr = curr->next;
|
|
table->n_elements--;
|
|
return curr;
|
|
}
|
|
prev_next_ptr = &(curr->next);
|
|
curr = curr->next;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
void VG_(HT_print_stats) ( const VgHashTable *table, HT_Cmp_t cmp )
|
|
{
|
|
#define MAXOCCUR 20
|
|
UInt elt_occurrences[MAXOCCUR+1];
|
|
UInt key_occurrences[MAXOCCUR+1];
|
|
UInt cno_occurrences[MAXOCCUR+1];
|
|
/* Key occurrence : how many ht elements have the same key.
|
|
elt_occurrences : how many elements are inserted multiple time.
|
|
cno_occurrences : how many chains have that length.
|
|
The last entry in these arrays collects all occurrences >= MAXOCCUR. */
|
|
#define INCOCCUR(occur,n) (n >= MAXOCCUR ? occur[MAXOCCUR]++ : occur[n]++)
|
|
UInt i;
|
|
UInt nkey, nelt, ncno;
|
|
VgHashNode *cnode, *node;
|
|
|
|
VG_(memset)(key_occurrences, 0, sizeof(key_occurrences));
|
|
VG_(memset)(elt_occurrences, 0, sizeof(elt_occurrences));
|
|
VG_(memset)(cno_occurrences, 0, sizeof(cno_occurrences));
|
|
|
|
// Note that the below algorithm is quadractic in nr of elements in a chain
|
|
// but if that happens, the hash table/function is really bad and that
|
|
// should be fixed.
|
|
for (i = 0; i < table->n_chains; i++) {
|
|
ncno = 0;
|
|
for (cnode = table->chains[i]; cnode != NULL; cnode = cnode->next) {
|
|
ncno++;
|
|
|
|
nkey = 0;
|
|
// Is the same cnode->key existing before cnode ?
|
|
for (node = table->chains[i]; node != cnode; node = node->next) {
|
|
if (node->key == cnode->key)
|
|
nkey++;
|
|
}
|
|
// If cnode->key not in a previous node, count occurrences of key.
|
|
if (nkey == 0) {
|
|
for (node = cnode; node != NULL; node = node->next) {
|
|
if (node->key == cnode->key)
|
|
nkey++;
|
|
}
|
|
INCOCCUR(key_occurrences, nkey);
|
|
}
|
|
|
|
nelt = 0;
|
|
// Is the same cnode element existing before cnode ?
|
|
for (node = table->chains[i]; node != cnode; node = node->next) {
|
|
if (node->key == cnode->key
|
|
&& (cmp == NULL || cmp (node, cnode) == 0)) {
|
|
nelt++;
|
|
}
|
|
}
|
|
// If cnode element not in a previous node, count occurrences of elt.
|
|
if (nelt == 0) {
|
|
for (node = cnode; node != NULL; node = node->next) {
|
|
if (node->key == cnode->key
|
|
&& (cmp == NULL || cmp (node, cnode) == 0)) {
|
|
nelt++;
|
|
}
|
|
}
|
|
INCOCCUR(elt_occurrences, nelt);
|
|
}
|
|
}
|
|
INCOCCUR(cno_occurrences, ncno);
|
|
}
|
|
|
|
VG_(message)(Vg_DebugMsg,
|
|
"nr occurrences of"
|
|
" chains of len N,"
|
|
" N-plicated keys,"
|
|
" N-plicated elts\n");
|
|
nkey = nelt = ncno = 0;
|
|
for (i = 0; i <= MAXOCCUR; i++) {
|
|
if (elt_occurrences[i] > 0
|
|
|| key_occurrences[i] > 0
|
|
|| cno_occurrences[i] > 0)
|
|
VG_(message)(Vg_DebugMsg,
|
|
"%s=%2u : nr chain %6u, nr keys %6u, nr elts %6u\n",
|
|
i == MAXOCCUR ? ">" : "N", i,
|
|
cno_occurrences[i], key_occurrences[i], elt_occurrences[i]);
|
|
nkey += key_occurrences[i];
|
|
nelt += elt_occurrences[i];
|
|
ncno += cno_occurrences[i];
|
|
}
|
|
VG_(message)(Vg_DebugMsg,
|
|
"total nr of unique slots: %6u, keys %6u, elts %6u."
|
|
" Avg chain len %3.1f\n",
|
|
ncno, nkey, nelt,
|
|
(Double)nelt/(Double)(ncno == cno_occurrences[0] ?
|
|
1 : ncno - cno_occurrences[0]));
|
|
}
|
|
|
|
|
|
/* Allocates a suitably-sized array, copies pointers to all the hashtable
|
|
elements into it, then returns both the array and the size of it. The
|
|
array must be freed with VG_(free).
|
|
*/
|
|
VgHashNode** VG_(HT_to_array) (const VgHashTable *table, /*OUT*/ UInt* n_elems)
|
|
{
|
|
UInt i, j;
|
|
VgHashNode** arr;
|
|
VgHashNode* node;
|
|
|
|
*n_elems = table->n_elements;
|
|
if (*n_elems == 0)
|
|
return NULL;
|
|
|
|
arr = VG_(malloc)( "hashtable.Hta.1", *n_elems * sizeof(VgHashNode*) );
|
|
|
|
j = 0;
|
|
for (i = 0; i < table->n_chains; i++) {
|
|
for (node = table->chains[i]; node != NULL; node = node->next) {
|
|
arr[j++] = node;
|
|
}
|
|
}
|
|
vg_assert(j == *n_elems);
|
|
|
|
return arr;
|
|
}
|
|
|
|
void VG_(HT_ResetIter)(VgHashTable *table)
|
|
{
|
|
vg_assert(table);
|
|
table->iterNode = NULL;
|
|
table->iterChain = 0;
|
|
table->iterOK = True;
|
|
}
|
|
|
|
void* VG_(HT_Next)(VgHashTable *table)
|
|
{
|
|
Int i;
|
|
vg_assert(table);
|
|
/* See long comment on HT_Next prototype in pub_tool_hashtable.h.
|
|
In short if this fails, it means the caller tried to modify the
|
|
table whilst iterating over it, which is a bug.
|
|
One exception: HT_remove_at_Iter can remove the current entry and
|
|
leave the iterator in a valid state for HT_Next. */
|
|
vg_assert(table->iterOK);
|
|
|
|
if (table->iterNode && table->iterNode->next) {
|
|
table->iterNode = table->iterNode->next;
|
|
return table->iterNode;
|
|
}
|
|
|
|
for (i = table->iterChain; i < table->n_chains; i++) {
|
|
if (table->chains[i]) {
|
|
table->iterNode = table->chains[i];
|
|
table->iterChain = i + 1; // Next chain to be traversed
|
|
return table->iterNode;
|
|
}
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
void VG_(HT_remove_at_Iter)(VgHashTable *table)
|
|
{
|
|
vg_assert(table);
|
|
vg_assert(table->iterOK);
|
|
vg_assert(table->iterNode);
|
|
|
|
const UInt curChain = table->iterChain - 1; // chain of iterNode.
|
|
|
|
|
|
if (table->chains[curChain] == table->iterNode) {
|
|
/* iterNode is the first of its chain -> remove it from the chain. */
|
|
table->chains[curChain] = table->iterNode->next;
|
|
/* Setup the iterator to visit first node of curChain: */
|
|
table->iterNode = NULL;
|
|
table->iterChain = curChain;
|
|
} else {
|
|
/* iterNode is somewhere inside curChain chain */
|
|
VgHashNode* prev = table->chains[curChain];
|
|
|
|
while (prev->next != table->iterNode)
|
|
prev = prev->next;
|
|
/* Remove iterNode from the chain. */
|
|
prev->next = table->iterNode->next;
|
|
/* Setup the iterator to visit prev->next, which is the node
|
|
that was after the deleted node. */
|
|
table->iterNode = prev;
|
|
}
|
|
|
|
table->n_elements--;
|
|
}
|
|
|
|
void VG_(HT_destruct)(VgHashTable *table, void(*freenode_fn)(void*))
|
|
{
|
|
UInt i;
|
|
VgHashNode *node, *node_next;
|
|
|
|
for (i = 0; i < table->n_chains; i++) {
|
|
for (node = table->chains[i]; node != NULL; node = node_next) {
|
|
node_next = node->next;
|
|
freenode_fn(node);
|
|
}
|
|
}
|
|
VG_(free)(table->chains);
|
|
VG_(free)(table);
|
|
}
|
|
|
|
/*--------------------------------------------------------------------*/
|
|
/*--- end ---*/
|
|
/*--------------------------------------------------------------------*/
|