1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright 2007 The Android Open Source Project
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * General purpose hash table, used for finding classes, methods, etc.
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * When the number of elements reaches 3/4 of the table's capacity, the
7*4882a593Smuzhiyun * table will be resized.
8*4882a593Smuzhiyun */
9*4882a593Smuzhiyun #ifndef _MINZIP_HASH
10*4882a593Smuzhiyun #define _MINZIP_HASH
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun
13*4882a593Smuzhiyun #include <stdlib.h>
14*4882a593Smuzhiyun #include <stdbool.h>
15*4882a593Smuzhiyun #include <assert.h>
16*4882a593Smuzhiyun #define INLINE static inline
17*4882a593Smuzhiyun /* compute the hash of an item with a specific type */
18*4882a593Smuzhiyun typedef unsigned int (*HashCompute)(const void* item);
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun /*
21*4882a593Smuzhiyun * Compare a hash entry with a "loose" item after their hash values match.
22*4882a593Smuzhiyun * Returns { <0, 0, >0 } depending on ordering of items (same semantics
23*4882a593Smuzhiyun * as strcmp()).
24*4882a593Smuzhiyun */
25*4882a593Smuzhiyun typedef int (*HashCompareFunc)(const void* tableItem, const void* looseItem);
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun /*
28*4882a593Smuzhiyun * This function will be used to free entries in the table. This can be
29*4882a593Smuzhiyun * NULL if no free is required, free(), or a custom function.
30*4882a593Smuzhiyun */
31*4882a593Smuzhiyun typedef void (*HashFreeFunc)(void* ptr);
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun /*
34*4882a593Smuzhiyun * Used by mzHashForeach().
35*4882a593Smuzhiyun */
36*4882a593Smuzhiyun typedef int (*HashForeachFunc)(void* data, void* arg);
37*4882a593Smuzhiyun
38*4882a593Smuzhiyun /*
39*4882a593Smuzhiyun * One entry in the hash table. "data" values are expected to be (or have
40*4882a593Smuzhiyun * the same characteristics as) valid pointers. In particular, a NULL
41*4882a593Smuzhiyun * value for "data" indicates an empty slot, and HASH_TOMBSTONE indicates
42*4882a593Smuzhiyun * a no-longer-used slot that must be stepped over during probing.
43*4882a593Smuzhiyun *
44*4882a593Smuzhiyun * Attempting to add a NULL or tombstone value is an error.
45*4882a593Smuzhiyun *
46*4882a593Smuzhiyun * When an entry is released, we will call (HashFreeFunc)(entry->data).
47*4882a593Smuzhiyun */
48*4882a593Smuzhiyun typedef struct HashEntry {
49*4882a593Smuzhiyun unsigned int hashValue;
50*4882a593Smuzhiyun void* data;
51*4882a593Smuzhiyun } HashEntry;
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun #define HASH_TOMBSTONE ((void*) 0xcbcacccd) // invalid ptr value
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun /*
56*4882a593Smuzhiyun * Expandable hash table.
57*4882a593Smuzhiyun *
58*4882a593Smuzhiyun * This structure should be considered opaque.
59*4882a593Smuzhiyun */
60*4882a593Smuzhiyun typedef struct HashTable {
61*4882a593Smuzhiyun int tableSize; /* must be power of 2 */
62*4882a593Smuzhiyun int numEntries; /* current #of "live" entries */
63*4882a593Smuzhiyun int numDeadEntries; /* current #of tombstone entries */
64*4882a593Smuzhiyun HashEntry* pEntries; /* array on heap */
65*4882a593Smuzhiyun HashFreeFunc freeFunc;
66*4882a593Smuzhiyun } HashTable;
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun /*
69*4882a593Smuzhiyun * Create and initialize a HashTable structure, using "initialSize" as
70*4882a593Smuzhiyun * a basis for the initial capacity of the table. (The actual initial
71*4882a593Smuzhiyun * table size may be adjusted upward.) If you know exactly how many
72*4882a593Smuzhiyun * elements the table will hold, pass the result from mzHashSize() in.)
73*4882a593Smuzhiyun *
74*4882a593Smuzhiyun * Returns "false" if unable to allocate the table.
75*4882a593Smuzhiyun */
76*4882a593Smuzhiyun HashTable* mzHashTableCreate(size_t initialSize, HashFreeFunc freeFunc);
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun /*
79*4882a593Smuzhiyun * Compute the capacity needed for a table to hold "size" elements. Use
80*4882a593Smuzhiyun * this when you know ahead of time how many elements the table will hold.
81*4882a593Smuzhiyun * Pass this value into mzHashTableCreate() to ensure that you can add
82*4882a593Smuzhiyun * all elements without needing to reallocate the table.
83*4882a593Smuzhiyun */
84*4882a593Smuzhiyun size_t mzHashSize(size_t size);
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun /*
87*4882a593Smuzhiyun * Clear out a hash table, freeing the contents of any used entries.
88*4882a593Smuzhiyun */
89*4882a593Smuzhiyun void mzHashTableClear(HashTable* pHashTable);
90*4882a593Smuzhiyun
91*4882a593Smuzhiyun /*
92*4882a593Smuzhiyun * Free a hash table.
93*4882a593Smuzhiyun */
94*4882a593Smuzhiyun void mzHashTableFree(HashTable* pHashTable);
95*4882a593Smuzhiyun
96*4882a593Smuzhiyun /*
97*4882a593Smuzhiyun * Get #of entries in hash table.
98*4882a593Smuzhiyun */
mzHashTableNumEntries(HashTable * pHashTable)99*4882a593Smuzhiyun INLINE int mzHashTableNumEntries(HashTable* pHashTable)
100*4882a593Smuzhiyun {
101*4882a593Smuzhiyun return pHashTable->numEntries;
102*4882a593Smuzhiyun }
103*4882a593Smuzhiyun
104*4882a593Smuzhiyun /*
105*4882a593Smuzhiyun * Get total size of hash table (for memory usage calculations).
106*4882a593Smuzhiyun */
mzHashTableMemUsage(HashTable * pHashTable)107*4882a593Smuzhiyun INLINE int mzHashTableMemUsage(HashTable* pHashTable)
108*4882a593Smuzhiyun {
109*4882a593Smuzhiyun return sizeof(HashTable) + pHashTable->tableSize * sizeof(HashEntry);
110*4882a593Smuzhiyun }
111*4882a593Smuzhiyun
112*4882a593Smuzhiyun /*
113*4882a593Smuzhiyun * Look up an entry in the table, possibly adding it if it's not there.
114*4882a593Smuzhiyun *
115*4882a593Smuzhiyun * If "item" is not found, and "doAdd" is false, NULL is returned.
116*4882a593Smuzhiyun * Otherwise, a pointer to the found or added item is returned. (You can
117*4882a593Smuzhiyun * tell the difference by seeing if return value == item.)
118*4882a593Smuzhiyun *
119*4882a593Smuzhiyun * An "add" operation may cause the entire table to be reallocated.
120*4882a593Smuzhiyun */
121*4882a593Smuzhiyun void* mzHashTableLookup(HashTable* pHashTable, unsigned int itemHash, void* item,
122*4882a593Smuzhiyun HashCompareFunc cmpFunc, bool doAdd);
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun /*
125*4882a593Smuzhiyun * Remove an item from the hash table, given its "data" pointer. Does not
126*4882a593Smuzhiyun * invoke the "free" function; just detaches it from the table.
127*4882a593Smuzhiyun */
128*4882a593Smuzhiyun bool mzHashTableRemove(HashTable* pHashTable, unsigned int hash, void* item);
129*4882a593Smuzhiyun
130*4882a593Smuzhiyun /*
131*4882a593Smuzhiyun * Execute "func" on every entry in the hash table.
132*4882a593Smuzhiyun *
133*4882a593Smuzhiyun * If "func" returns a nonzero value, terminate early and return the value.
134*4882a593Smuzhiyun */
135*4882a593Smuzhiyun int mzHashForeach(HashTable* pHashTable, HashForeachFunc func, void* arg);
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun /*
138*4882a593Smuzhiyun * An alternative to mzHashForeach(), using an iterator.
139*4882a593Smuzhiyun *
140*4882a593Smuzhiyun * Use like this:
141*4882a593Smuzhiyun * HashIter iter;
142*4882a593Smuzhiyun * for (mzHashIterBegin(hashTable, &iter); !mzHashIterDone(&iter);
143*4882a593Smuzhiyun * mzHashIterNext(&iter))
144*4882a593Smuzhiyun * {
145*4882a593Smuzhiyun * MyData* data = (MyData*)mzHashIterData(&iter);
146*4882a593Smuzhiyun * }
147*4882a593Smuzhiyun */
148*4882a593Smuzhiyun typedef struct HashIter {
149*4882a593Smuzhiyun void* data;
150*4882a593Smuzhiyun HashTable* pHashTable;
151*4882a593Smuzhiyun int idx;
152*4882a593Smuzhiyun } HashIter;
mzHashIterNext(HashIter * pIter)153*4882a593Smuzhiyun INLINE void mzHashIterNext(HashIter* pIter)
154*4882a593Smuzhiyun {
155*4882a593Smuzhiyun int i = pIter->idx + 1;
156*4882a593Smuzhiyun int lim = pIter->pHashTable->tableSize;
157*4882a593Smuzhiyun for ( ; i < lim; i++) {
158*4882a593Smuzhiyun void* data = pIter->pHashTable->pEntries[i].data;
159*4882a593Smuzhiyun if (data != NULL && data != HASH_TOMBSTONE)
160*4882a593Smuzhiyun break;
161*4882a593Smuzhiyun }
162*4882a593Smuzhiyun pIter->idx = i;
163*4882a593Smuzhiyun }
mzHashIterBegin(HashTable * pHashTable,HashIter * pIter)164*4882a593Smuzhiyun INLINE void mzHashIterBegin(HashTable* pHashTable, HashIter* pIter)
165*4882a593Smuzhiyun {
166*4882a593Smuzhiyun pIter->pHashTable = pHashTable;
167*4882a593Smuzhiyun pIter->idx = -1;
168*4882a593Smuzhiyun mzHashIterNext(pIter);
169*4882a593Smuzhiyun }
mzHashIterDone(HashIter * pIter)170*4882a593Smuzhiyun INLINE bool mzHashIterDone(HashIter* pIter)
171*4882a593Smuzhiyun {
172*4882a593Smuzhiyun return (pIter->idx >= pIter->pHashTable->tableSize);
173*4882a593Smuzhiyun }
mzHashIterData(HashIter * pIter)174*4882a593Smuzhiyun INLINE void* mzHashIterData(HashIter* pIter)
175*4882a593Smuzhiyun {
176*4882a593Smuzhiyun assert(pIter->idx >= 0 && pIter->idx < pIter->pHashTable->tableSize);
177*4882a593Smuzhiyun return pIter->pHashTable->pEntries[pIter->idx].data;
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun
181*4882a593Smuzhiyun /*
182*4882a593Smuzhiyun * Evaluate hash table performance by examining the number of times we
183*4882a593Smuzhiyun * have to probe for an entry.
184*4882a593Smuzhiyun *
185*4882a593Smuzhiyun * The caller should lock the table beforehand.
186*4882a593Smuzhiyun */
187*4882a593Smuzhiyun typedef unsigned int (*HashCalcFunc)(const void* item);
188*4882a593Smuzhiyun void mzHashTableProbeCount(HashTable* pHashTable, HashCalcFunc calcFunc,
189*4882a593Smuzhiyun HashCompareFunc cmpFunc);
190*4882a593Smuzhiyun
191*4882a593Smuzhiyun #endif /*_MINZIP_HASH*/
192