/* hash.c -- gas hash table code Copyright 1987, 1990, 1991, 1992, 1993, 1994, 1995, 1996, 1998, 1999, 2000, 2001, 2002, 2003, 2005, 2007, 2008, 2009 Free Software Foundation, Inc. This file is part of GAS, the GNU Assembler. GAS is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3, or (at your option) any later version. GAS is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with GAS; see the file COPYING. If not, write to the Free Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA 02110-1301, USA. */ /* This version of the hash table code is a wholescale replacement of the old hash table code, which was fairly bad. This is based on the hash table code in BFD, but optimized slightly for the assembler. The assembler does not need to derive structures that are stored in the hash table. Instead, it always stores a pointer. The assembler uses the hash table mostly to store symbols, and we don't need to confuse the symbol structure with a hash table structure. */ #include "as.h" #include "safe-ctype.h" #include "obstack.h" /* An entry in a hash table. */ struct hash_entry { /* Next entry for this hash code. */ struct hash_entry *next; /* String being hashed. */ const char *string; /* Hash code. This is the full hash code, not the index into the table. */ unsigned long hash; /* Pointer being stored in the hash table. */ void *data; }; /* A hash table. */ struct hash_control { /* The hash array. */ struct hash_entry **table; /* The number of slots in the hash table. */ unsigned int size; /* An obstack for this hash table. */ struct obstack memory; #ifdef HASH_STATISTICS /* Statistics. */ unsigned long lookups; unsigned long hash_compares; unsigned long string_compares; unsigned long insertions; unsigned long replacements; unsigned long deletions; #endif /* HASH_STATISTICS */ }; /* The default number of entries to use when creating a hash table. Note this value can be reduced to 4051 by using the command line switch --reduce-memory-overheads, or set to other values by using the --hash-size=<NUMBER> switch. */ static unsigned long gas_hash_table_size = 65537; void set_gas_hash_table_size (unsigned long size) { gas_hash_table_size = size; } /* FIXME: This function should be amalgmated with bfd/hash.c:bfd_hash_set_default_size(). */ static unsigned long get_gas_hash_table_size (void) { /* Extend this prime list if you want more granularity of hash table size. */ static const unsigned long hash_size_primes[] = { 1021, 4051, 8599, 16699, 65537 }; unsigned int hindex; /* Work out the best prime number near the hash_size. FIXME: This could be a more sophisticated algorithm, but is it really worth implementing it ? */ for (hindex = 0; hindex < ARRAY_SIZE (hash_size_primes) - 1; ++ hindex) if (gas_hash_table_size <= hash_size_primes[hindex]) break; return hash_size_primes[hindex]; } /* Create a hash table. This return a control block. */ struct hash_control * hash_new (void) { unsigned long size; unsigned long alloc; struct hash_control *ret; size = get_gas_hash_table_size (); ret = (struct hash_control *) xmalloc (sizeof *ret); obstack_begin (&ret->memory, chunksize); alloc = size * sizeof (struct hash_entry *); ret->table = (struct hash_entry **) obstack_alloc (&ret->memory, alloc); memset (ret->table, 0, alloc); ret->size = size; #ifdef HASH_STATISTICS ret->lookups = 0; ret->hash_compares = 0; ret->string_compares = 0; ret->insertions = 0; ret->replacements = 0; ret->deletions = 0; #endif return ret; } /* Delete a hash table, freeing all allocated memory. */ void hash_die (struct hash_control *table) { obstack_free (&table->memory, 0); free (table); } /* Look up a string in a hash table. This returns a pointer to the hash_entry, or NULL if the string is not in the table. If PLIST is not NULL, this sets *PLIST to point to the start of the list which would hold this hash entry. If PHASH is not NULL, this sets *PHASH to the hash code for KEY. Each time we look up a string, we move it to the start of the list for its hash code, to take advantage of referential locality. */ static struct hash_entry * hash_lookup (struct hash_control *table, const char *key, size_t len, struct hash_entry ***plist, unsigned long *phash) { unsigned long hash; size_t n; unsigned int c; unsigned int hindex; struct hash_entry **list; struct hash_entry *p; struct hash_entry *prev; #ifdef HASH_STATISTICS ++table->lookups; #endif hash = 0; for (n = 0; n < len; n++) { c = key[n]; hash += c + (c << 17); hash ^= hash >> 2; } hash += len + (len << 17); hash ^= hash >> 2; if (phash != NULL) *phash = hash; hindex = hash % table->size; list = table->table + hindex; if (plist != NULL) *plist = list; prev = NULL; for (p = *list; p != NULL; p = p->next) { #ifdef HASH_STATISTICS ++table->hash_compares; #endif if (p->hash == hash) { #ifdef HASH_STATISTICS ++table->string_compares; #endif if (strncmp (p->string, key, len) == 0 && p->string[len] == '\0') { if (prev != NULL) { prev->next = p->next; p->next = *list; *list = p; } return p; } } prev = p; } return NULL; } /* Insert an entry into a hash table. This returns NULL on success. On error, it returns a printable string indicating the error. It is considered to be an error if the entry already exists in the hash table. */ const char * hash_insert (struct hash_control *table, const char *key, void *val) { struct hash_entry *p; struct hash_entry **list; unsigned long hash; p = hash_lookup (table, key, strlen (key), &list, &hash); if (p != NULL) return "exists"; #ifdef HASH_STATISTICS ++table->insertions; #endif p = (struct hash_entry *) obstack_alloc (&table->memory, sizeof (*p)); p->string = key; p->hash = hash; p->data = val; p->next = *list; *list = p; return NULL; } /* Insert or replace an entry in a hash table. This returns NULL on success. On error, it returns a printable string indicating the error. If an entry already exists, its value is replaced. */ const char * hash_jam (struct hash_control *table, const char *key, void *val) { struct hash_entry *p; struct hash_entry **list; unsigned long hash; p = hash_lookup (table, key, strlen (key), &list, &hash); if (p != NULL) { #ifdef HASH_STATISTICS ++table->replacements; #endif p->data = val; } else { #ifdef HASH_STATISTICS ++table->insertions; #endif p = (struct hash_entry *) obstack_alloc (&table->memory, sizeof (*p)); p->string = key; p->hash = hash; p->data = val; p->next = *list; *list = p; } return NULL; } /* Replace an existing entry in a hash table. This returns the old value stored for the entry. If the entry is not found in the hash table, this does nothing and returns NULL. */ void * hash_replace (struct hash_control *table, const char *key, void *value) { struct hash_entry *p; void *ret; p = hash_lookup (table, key, strlen (key), NULL, NULL); if (p == NULL) return NULL; #ifdef HASH_STATISTICS ++table->replacements; #endif ret = p->data; p->data = value; return ret; } /* Find an entry in a hash table, returning its value. Returns NULL if the entry is not found. */ void * hash_find (struct hash_control *table, const char *key) { struct hash_entry *p; p = hash_lookup (table, key, strlen (key), NULL, NULL); if (p == NULL) return NULL; return p->data; } /* As hash_find, but KEY is of length LEN and is not guaranteed to be NUL-terminated. */ void * hash_find_n (struct hash_control *table, const char *key, size_t len) { struct hash_entry *p; p = hash_lookup (table, key, len, NULL, NULL); if (p == NULL) return NULL; return p->data; } /* Delete an entry from a hash table. This returns the value stored for that entry, or NULL if there is no such entry. */ void * hash_delete (struct hash_control *table, const char *key, int freeme) { struct hash_entry *p; struct hash_entry **list; p = hash_lookup (table, key, strlen (key), &list, NULL); if (p == NULL) return NULL; if (p != *list) abort (); #ifdef HASH_STATISTICS ++table->deletions; #endif *list = p->next; if (freeme) obstack_free (&table->memory, p); return p->data; } /* Traverse a hash table. Call the function on every entry in the hash table. */ void hash_traverse (struct hash_control *table, void (*pfn) (const char *key, void *value)) { unsigned int i; for (i = 0; i < table->size; ++i) { struct hash_entry *p; for (p = table->table[i]; p != NULL; p = p->next) (*pfn) (p->string, p->data); } } /* Print hash table statistics on the specified file. NAME is the name of the hash table, used for printing a header. */ void hash_print_statistics (FILE *f ATTRIBUTE_UNUSED, const char *name ATTRIBUTE_UNUSED, struct hash_control *table ATTRIBUTE_UNUSED) { #ifdef HASH_STATISTICS unsigned int i; unsigned long total; unsigned long empty; fprintf (f, "%s hash statistics:\n", name); fprintf (f, "\t%lu lookups\n", table->lookups); fprintf (f, "\t%lu hash comparisons\n", table->hash_compares); fprintf (f, "\t%lu string comparisons\n", table->string_compares); fprintf (f, "\t%lu insertions\n", table->insertions); fprintf (f, "\t%lu replacements\n", table->replacements); fprintf (f, "\t%lu deletions\n", table->deletions); total = 0; empty = 0; for (i = 0; i < table->size; ++i) { struct hash_entry *p; if (table->table[i] == NULL) ++empty; else { for (p = table->table[i]; p != NULL; p = p->next) ++total; } } fprintf (f, "\t%g average chain length\n", (double) total / table->size); fprintf (f, "\t%lu empty slots\n", empty); #endif } #ifdef TEST /* This test program is left over from the old hash table code. */ /* Number of hash tables to maintain (at once) in any testing. */ #define TABLES (6) /* We can have 12 statistics. */ #define STATBUFSIZE (12) /* Display statistics here. */ int statbuf[STATBUFSIZE]; /* Human farts here. */ char answer[100]; /* We test many hash tables at once. */ char *hashtable[TABLES]; /* Points to current hash_control. */ char *h; char **pp; char *p; char *name; char *value; int size; int used; char command; /* Number 0:TABLES-1 of current hashed symbol table. */ int number; int main () { void applicatee (); void destroy (); char *what (); int *ip; number = 0; h = 0; printf ("type h <RETURN> for help\n"); for (;;) { printf ("hash_test command: "); gets (answer); command = answer[0]; command = TOLOWER (command); /* Ecch! */ switch (command) { case '#': printf ("old hash table #=%d.\n", number); whattable (); break; case '?': for (pp = hashtable; pp < hashtable + TABLES; pp++) { printf ("address of hash table #%d control block is %xx\n", pp - hashtable, *pp); } break; case 'a': hash_traverse (h, applicatee); break; case 'd': hash_traverse (h, destroy); hash_die (h); break; case 'f': p = hash_find (h, name = what ("symbol")); printf ("value of \"%s\" is \"%s\"\n", name, p ? p : "NOT-PRESENT"); break; case 'h': printf ("# show old, select new default hash table number\n"); printf ("? display all hashtable control block addresses\n"); printf ("a apply a simple display-er to each symbol in table\n"); printf ("d die: destroy hashtable\n"); printf ("f find value of nominated symbol\n"); printf ("h this help\n"); printf ("i insert value into symbol\n"); printf ("j jam value into symbol\n"); printf ("n new hashtable\n"); printf ("r replace a value with another\n"); printf ("s say what %% of table is used\n"); printf ("q exit this program\n"); printf ("x delete a symbol from table, report its value\n"); break; case 'i': p = hash_insert (h, name = what ("symbol"), value = what ("value")); if (p) { printf ("symbol=\"%s\" value=\"%s\" error=%s\n", name, value, p); } break; case 'j': p = hash_jam (h, name = what ("symbol"), value = what ("value")); if (p) { printf ("symbol=\"%s\" value=\"%s\" error=%s\n", name, value, p); } break; case 'n': h = hashtable[number] = (char *) hash_new (); break; case 'q': exit (EXIT_SUCCESS); case 'r': p = hash_replace (h, name = what ("symbol"), value = what ("value")); printf ("old value was \"%s\"\n", p ? p : "{}"); break; case 's': hash_say (h, statbuf, STATBUFSIZE); for (ip = statbuf; ip < statbuf + STATBUFSIZE; ip++) { printf ("%d ", *ip); } printf ("\n"); break; case 'x': p = hash_delete (h, name = what ("symbol")); printf ("old value was \"%s\"\n", p ? p : "{}"); break; default: printf ("I can't understand command \"%c\"\n", command); break; } } } char * what (description) char *description; { printf (" %s : ", description); gets (answer); return xstrdup (answer); } void destroy (string, value) char *string; char *value; { free (string); free (value); } void applicatee (string, value) char *string; char *value; { printf ("%.20s-%.20s\n", string, value); } /* Determine number: what hash table to use. Also determine h: points to hash_control. */ void whattable () { for (;;) { printf (" what hash table (%d:%d) ? ", 0, TABLES - 1); gets (answer); sscanf (answer, "%d", &number); if (number >= 0 && number < TABLES) { h = hashtable[number]; if (!h) { printf ("warning: current hash-table-#%d. has no hash-control\n", number); } return; } else { printf ("invalid hash table number: %d\n", number); } } } #endif /* TEST */