/* * Hash Array Mapped Trie (HAMT) implementation * * Copyright (C) 2001-2007 Peter Johnson * * Based on the paper "Ideal Hash Tries" by Phil Bagwell [2000]. * One algorithmic change from that described in the paper: we use the LSB's * of the key to index the root table and move upward in the key rather than * use the MSBs as described in the paper. The LSBs have more entropy. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND OTHER CONTRIBUTORS ``AS IS'' * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR OTHER CONTRIBUTORS BE * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE * POSSIBILITY OF SUCH DAMAGE. */ #include "util.h" /*@unused@*/ RCSID("$Id: hamt.c 1907 2007-08-05 16:44:07Z peter $"); #include #include "libyasm-stdint.h" #include "coretype.h" #include "hamt.h" struct HAMTEntry { STAILQ_ENTRY(HAMTEntry) next; /* next hash table entry */ /*@dependent@*/ const char *str; /* string being hashed */ /*@owned@*/ void *data; /* data pointer being stored */ }; typedef struct HAMTNode { unsigned long BitMapKey; /* 32 bits, bitmap or hash key */ uintptr_t BaseValue; /* Base of HAMTNode list or value */ } HAMTNode; struct HAMT { STAILQ_HEAD(HAMTEntryHead, HAMTEntry) entries; HAMTNode *root; /*@exits@*/ void (*error_func) (const char *file, unsigned int line, const char *message); unsigned long (*HashKey) (const char *key); unsigned long (*ReHashKey) (const char *key, int Level); int (*CmpKey) (const char *s1, const char *s2); }; /* XXX make a portable version of this. This depends on the pointer being * 4 or 2-byte aligned (as it uses the LSB of the pointer variable to store * the subtrie flag! */ #define IsSubTrie(n) ((n)->BaseValue & 1) #define SetSubTrie(h, n, v) do { \ if ((uintptr_t)(v) & 1) \ h->error_func(__FILE__, __LINE__, \ N_("Subtrie is seen as subtrie before flag is set (misaligned?)")); \ (n)->BaseValue = (uintptr_t)(v) | 1; \ } while (0) #define SetValue(h, n, v) do { \ if ((uintptr_t)(v) & 1) \ h->error_func(__FILE__, __LINE__, \ N_("Value is seen as subtrie (misaligned?)")); \ (n)->BaseValue = (uintptr_t)(v); \ } while (0) #define GetSubTrie(n) (HAMTNode *)(((n)->BaseValue | 1) ^ 1) static unsigned long HashKey(const char *key) { unsigned long a=31415, b=27183, vHash; for (vHash=0; *key; key++, a*=b) vHash = a*vHash + *key; return vHash; } static unsigned long ReHashKey(const char *key, int Level) { unsigned long a=31415, b=27183, vHash; for (vHash=0; *key; key++, a*=b) vHash = a*vHash*(unsigned long)Level + *key; return vHash; } static unsigned long HashKey_nocase(const char *key) { unsigned long a=31415, b=27183, vHash; for (vHash=0; *key; key++, a*=b) vHash = a*vHash + tolower(*key); return vHash; } static unsigned long ReHashKey_nocase(const char *key, int Level) { unsigned long a=31415, b=27183, vHash; for (vHash=0; *key; key++, a*=b) vHash = a*vHash*(unsigned long)Level + tolower(*key); return vHash; } HAMT * HAMT_create(int nocase, /*@exits@*/ void (*error_func) (const char *file, unsigned int line, const char *message)) { /*@out@*/ HAMT *hamt = yasm_xmalloc(sizeof(HAMT)); int i; STAILQ_INIT(&hamt->entries); hamt->root = yasm_xmalloc(32*sizeof(HAMTNode)); for (i=0; i<32; i++) { hamt->root[i].BitMapKey = 0; hamt->root[i].BaseValue = 0; } hamt->error_func = error_func; if (nocase) { hamt->HashKey = HashKey_nocase; hamt->ReHashKey = ReHashKey_nocase; hamt->CmpKey = yasm__strcasecmp; } else { hamt->HashKey = HashKey; hamt->ReHashKey = ReHashKey; hamt->CmpKey = strcmp; } return hamt; } static void HAMT_delete_trie(HAMTNode *node) { if (IsSubTrie(node)) { unsigned long i, Size; /* Count total number of bits in bitmap to determine size */ BitCount(Size, node->BitMapKey); Size &= 0x1F; if (Size == 0) Size = 32; for (i=0; ientries)) { HAMTEntry *entry; entry = STAILQ_FIRST(&hamt->entries); STAILQ_REMOVE_HEAD(&hamt->entries, next); deletefunc(entry->data); yasm_xfree(entry); } /* delete trie */ for (i=0; i<32; i++) HAMT_delete_trie(&hamt->root[i]); yasm_xfree(hamt->root); yasm_xfree(hamt); } int HAMT_traverse(HAMT *hamt, void *d, int (*func) (/*@dependent@*/ /*@null@*/ void *node, /*@null@*/ void *d)) { HAMTEntry *entry; STAILQ_FOREACH(entry, &hamt->entries, next) { int retval = func(entry->data, d); if (retval != 0) return retval; } return 0; } const HAMTEntry * HAMT_first(const HAMT *hamt) { return STAILQ_FIRST(&hamt->entries); } const HAMTEntry * HAMT_next(const HAMTEntry *prev) { return STAILQ_NEXT(prev, next); } void * HAMTEntry_get_data(const HAMTEntry *entry) { return entry->data; } /*@-temptrans -kepttrans -mustfree@*/ void * HAMT_insert(HAMT *hamt, const char *str, void *data, int *replace, void (*deletefunc) (/*@only@*/ void *data)) { HAMTNode *node, *newnodes; HAMTEntry *entry; unsigned long key, keypart, Map; int keypartbits = 0; int level = 0; key = hamt->HashKey(str); keypart = key & 0x1F; node = &hamt->root[keypart]; if (!node->BaseValue) { node->BitMapKey = key; entry = yasm_xmalloc(sizeof(HAMTEntry)); entry->str = str; entry->data = data; STAILQ_INSERT_TAIL(&hamt->entries, entry, next); SetValue(hamt, node, entry); if (IsSubTrie(node)) hamt->error_func(__FILE__, __LINE__, N_("Data is seen as subtrie (misaligned?)")); *replace = 1; return data; } for (;;) { if (!(IsSubTrie(node))) { if (node->BitMapKey == key && hamt->CmpKey(((HAMTEntry *)(node->BaseValue))->str, str) == 0) { /*@-branchstate@*/ if (*replace) { deletefunc(((HAMTEntry *)(node->BaseValue))->data); ((HAMTEntry *)(node->BaseValue))->str = str; ((HAMTEntry *)(node->BaseValue))->data = data; } else deletefunc(data); /*@=branchstate@*/ return ((HAMTEntry *)(node->BaseValue))->data; } else { unsigned long key2 = node->BitMapKey; /* build tree downward until keys differ */ for (;;) { unsigned long keypart2; /* replace node with subtrie */ keypartbits += 5; if (keypartbits > 30) { /* Exceeded 32 bits: rehash */ key = hamt->ReHashKey(str, level); key2 = hamt->ReHashKey( ((HAMTEntry *)(node->BaseValue))->str, level); keypartbits = 0; } keypart = (key >> keypartbits) & 0x1F; keypart2 = (key2 >> keypartbits) & 0x1F; if (keypart == keypart2) { /* Still equal, build one-node subtrie and continue * downward. */ newnodes = yasm_xmalloc(sizeof(HAMTNode)); newnodes[0].BitMapKey = key2; newnodes[0].BaseValue = node->BaseValue; node->BitMapKey = 1<str = str; entry->data = data; STAILQ_INSERT_TAIL(&hamt->entries, entry, next); /* Copy nodes into subtrie based on order */ if (keypart2 < keypart) { newnodes[0].BitMapKey = key2; newnodes[0].BaseValue = node->BaseValue; newnodes[1].BitMapKey = key; SetValue(hamt, &newnodes[1], entry); } else { newnodes[0].BitMapKey = key; SetValue(hamt, &newnodes[0], entry); newnodes[1].BitMapKey = key2; newnodes[1].BaseValue = node->BaseValue; } /* Set bits in bitmap corresponding to keys */ node->BitMapKey = (1UL< 30) { /* Exceeded 32 bits of current key: rehash */ key = hamt->ReHashKey(str, level); keypartbits = 0; } keypart = (key >> keypartbits) & 0x1F; if (!(node->BitMapKey & (1< add node to table */ unsigned long Size; /* set bit to 1 */ node->BitMapKey |= 1<BitMapKey); Size &= 0x1F; if (Size == 0) Size = 32; newnodes = yasm_xmalloc(Size*sizeof(HAMTNode)); /* Count bits below to find where to insert new node at */ BitCount(Map, node->BitMapKey & ~((~0UL)<str = str; entry->data = data; STAILQ_INSERT_TAIL(&hamt->entries, entry, next); SetValue(hamt, &newnodes[Map], entry); SetSubTrie(hamt, node, newnodes); *replace = 1; return data; } /* Count bits below */ BitCount(Map, node->BitMapKey & ~((~0UL)<HashKey(str); keypart = key & 0x1F; node = &hamt->root[keypart]; if (!node->BaseValue) return NULL; for (;;) { if (!(IsSubTrie(node))) { if (node->BitMapKey == key && hamt->CmpKey(((HAMTEntry *)(node->BaseValue))->str, str) == 0) return ((HAMTEntry *)(node->BaseValue))->data; else return NULL; } /* Subtree: look up in bitmap */ keypartbits += 5; if (keypartbits > 30) { /* Exceeded 32 bits of current key: rehash */ key = hamt->ReHashKey(str, level); keypartbits = 0; } keypart = (key >> keypartbits) & 0x1F; if (!(node->BitMapKey & (1< no match */ /* Count bits below */ BitCount(Map, node->BitMapKey & ~((~0UL)<