1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright 2007 The Android Open Source Project
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * General purpose hash table, used for finding classes, methods, etc.
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * When the number of elements reaches 3/4 of the table's capacity, the
7*4882a593Smuzhiyun * table will be resized.
8*4882a593Smuzhiyun */
9*4882a593Smuzhiyun #ifndef _MINZIP_HASH
10*4882a593Smuzhiyun #define _MINZIP_HASH
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun #include "inline_magic.h"
13*4882a593Smuzhiyun
14*4882a593Smuzhiyun #include <stdlib.h>
15*4882a593Smuzhiyun #include <stdbool.h>
16*4882a593Smuzhiyun #include <assert.h>
17*4882a593Smuzhiyun #define INLINE static inline
18*4882a593Smuzhiyun /* compute the hash of an item with a specific type */
19*4882a593Smuzhiyun typedef unsigned int (*HashCompute)(const void* item);
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun /*
22*4882a593Smuzhiyun * Compare a hash entry with a "loose" item after their hash values match.
23*4882a593Smuzhiyun * Returns { <0, 0, >0 } depending on ordering of items (same semantics
24*4882a593Smuzhiyun * as strcmp()).
25*4882a593Smuzhiyun */
26*4882a593Smuzhiyun typedef int (*HashCompareFunc)(const void* tableItem, const void* looseItem);
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun /*
29*4882a593Smuzhiyun * This function will be used to free entries in the table. This can be
30*4882a593Smuzhiyun * NULL if no free is required, free(), or a custom function.
31*4882a593Smuzhiyun */
32*4882a593Smuzhiyun typedef void (*HashFreeFunc)(void* ptr);
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun /*
35*4882a593Smuzhiyun * Used by mzHashForeach().
36*4882a593Smuzhiyun */
37*4882a593Smuzhiyun typedef int (*HashForeachFunc)(void* data, void* arg);
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun /*
40*4882a593Smuzhiyun * One entry in the hash table. "data" values are expected to be (or have
41*4882a593Smuzhiyun * the same characteristics as) valid pointers. In particular, a NULL
42*4882a593Smuzhiyun * value for "data" indicates an empty slot, and HASH_TOMBSTONE indicates
43*4882a593Smuzhiyun * a no-longer-used slot that must be stepped over during probing.
44*4882a593Smuzhiyun *
45*4882a593Smuzhiyun * Attempting to add a NULL or tombstone value is an error.
46*4882a593Smuzhiyun *
47*4882a593Smuzhiyun * When an entry is released, we will call (HashFreeFunc)(entry->data).
48*4882a593Smuzhiyun */
49*4882a593Smuzhiyun typedef struct HashEntry {
50*4882a593Smuzhiyun unsigned int hashValue;
51*4882a593Smuzhiyun void* data;
52*4882a593Smuzhiyun } HashEntry;
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun #define HASH_TOMBSTONE ((void*) 0xcbcacccd) // invalid ptr value
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun /*
57*4882a593Smuzhiyun * Expandable hash table.
58*4882a593Smuzhiyun *
59*4882a593Smuzhiyun * This structure should be considered opaque.
60*4882a593Smuzhiyun */
61*4882a593Smuzhiyun typedef struct HashTable {
62*4882a593Smuzhiyun int tableSize; /* must be power of 2 */
63*4882a593Smuzhiyun int numEntries; /* current #of "live" entries */
64*4882a593Smuzhiyun int numDeadEntries; /* current #of tombstone entries */
65*4882a593Smuzhiyun HashEntry* pEntries; /* array on heap */
66*4882a593Smuzhiyun HashFreeFunc freeFunc;
67*4882a593Smuzhiyun } HashTable;
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun /*
70*4882a593Smuzhiyun * Create and initialize a HashTable structure, using "initialSize" as
71*4882a593Smuzhiyun * a basis for the initial capacity of the table. (The actual initial
72*4882a593Smuzhiyun * table size may be adjusted upward.) If you know exactly how many
73*4882a593Smuzhiyun * elements the table will hold, pass the result from mzHashSize() in.)
74*4882a593Smuzhiyun *
75*4882a593Smuzhiyun * Returns "false" if unable to allocate the table.
76*4882a593Smuzhiyun */
77*4882a593Smuzhiyun HashTable* mzHashTableCreate(size_t initialSize, HashFreeFunc freeFunc);
78*4882a593Smuzhiyun
79*4882a593Smuzhiyun /*
80*4882a593Smuzhiyun * Compute the capacity needed for a table to hold "size" elements. Use
81*4882a593Smuzhiyun * this when you know ahead of time how many elements the table will hold.
82*4882a593Smuzhiyun * Pass this value into mzHashTableCreate() to ensure that you can add
83*4882a593Smuzhiyun * all elements without needing to reallocate the table.
84*4882a593Smuzhiyun */
85*4882a593Smuzhiyun size_t mzHashSize(size_t size);
86*4882a593Smuzhiyun
87*4882a593Smuzhiyun /*
88*4882a593Smuzhiyun * Clear out a hash table, freeing the contents of any used entries.
89*4882a593Smuzhiyun */
90*4882a593Smuzhiyun void mzHashTableClear(HashTable* pHashTable);
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun /*
93*4882a593Smuzhiyun * Free a hash table.
94*4882a593Smuzhiyun */
95*4882a593Smuzhiyun void mzHashTableFree(HashTable* pHashTable);
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun /*
98*4882a593Smuzhiyun * Get #of entries in hash table.
99*4882a593Smuzhiyun */
mzHashTableNumEntries(HashTable * pHashTable)100*4882a593Smuzhiyun INLINE int mzHashTableNumEntries(HashTable* pHashTable) {
101*4882a593Smuzhiyun return pHashTable->numEntries;
102*4882a593Smuzhiyun }
103*4882a593Smuzhiyun
104*4882a593Smuzhiyun /*
105*4882a593Smuzhiyun * Get total size of hash table (for memory usage calculations).
106*4882a593Smuzhiyun */
mzHashTableMemUsage(HashTable * pHashTable)107*4882a593Smuzhiyun INLINE int mzHashTableMemUsage(HashTable* pHashTable) {
108*4882a593Smuzhiyun return sizeof(HashTable) + pHashTable->tableSize * sizeof(HashEntry);
109*4882a593Smuzhiyun }
110*4882a593Smuzhiyun
111*4882a593Smuzhiyun /*
112*4882a593Smuzhiyun * Look up an entry in the table, possibly adding it if it's not there.
113*4882a593Smuzhiyun *
114*4882a593Smuzhiyun * If "item" is not found, and "doAdd" is false, NULL is returned.
115*4882a593Smuzhiyun * Otherwise, a pointer to the found or added item is returned. (You can
116*4882a593Smuzhiyun * tell the difference by seeing if return value == item.)
117*4882a593Smuzhiyun *
118*4882a593Smuzhiyun * An "add" operation may cause the entire table to be reallocated.
119*4882a593Smuzhiyun */
120*4882a593Smuzhiyun void* mzHashTableLookup(HashTable* pHashTable, unsigned int itemHash, void* item,
121*4882a593Smuzhiyun HashCompareFunc cmpFunc, bool doAdd);
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun /*
124*4882a593Smuzhiyun * Remove an item from the hash table, given its "data" pointer. Does not
125*4882a593Smuzhiyun * invoke the "free" function; just detaches it from the table.
126*4882a593Smuzhiyun */
127*4882a593Smuzhiyun bool mzHashTableRemove(HashTable* pHashTable, unsigned int hash, void* item);
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /*
130*4882a593Smuzhiyun * Execute "func" on every entry in the hash table.
131*4882a593Smuzhiyun *
132*4882a593Smuzhiyun * If "func" returns a nonzero value, terminate early and return the value.
133*4882a593Smuzhiyun */
134*4882a593Smuzhiyun int mzHashForeach(HashTable* pHashTable, HashForeachFunc func, void* arg);
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun /*
137*4882a593Smuzhiyun * An alternative to mzHashForeach(), using an iterator.
138*4882a593Smuzhiyun *
139*4882a593Smuzhiyun * Use like this:
140*4882a593Smuzhiyun * HashIter iter;
141*4882a593Smuzhiyun * for (mzHashIterBegin(hashTable, &iter); !mzHashIterDone(&iter);
142*4882a593Smuzhiyun * mzHashIterNext(&iter))
143*4882a593Smuzhiyun * {
144*4882a593Smuzhiyun * MyData* data = (MyData*)mzHashIterData(&iter);
145*4882a593Smuzhiyun * }
146*4882a593Smuzhiyun */
147*4882a593Smuzhiyun typedef struct HashIter {
148*4882a593Smuzhiyun void* data;
149*4882a593Smuzhiyun HashTable* pHashTable;
150*4882a593Smuzhiyun int idx;
151*4882a593Smuzhiyun } HashIter;
mzHashIterNext(HashIter * pIter)152*4882a593Smuzhiyun INLINE void mzHashIterNext(HashIter* pIter) {
153*4882a593Smuzhiyun int i = pIter->idx +1;
154*4882a593Smuzhiyun int lim = pIter->pHashTable->tableSize;
155*4882a593Smuzhiyun for ( ; i < lim; i++) {
156*4882a593Smuzhiyun void* data = pIter->pHashTable->pEntries[i].data;
157*4882a593Smuzhiyun if (data != NULL && data != HASH_TOMBSTONE)
158*4882a593Smuzhiyun break;
159*4882a593Smuzhiyun }
160*4882a593Smuzhiyun pIter->idx = i;
161*4882a593Smuzhiyun }
mzHashIterBegin(HashTable * pHashTable,HashIter * pIter)162*4882a593Smuzhiyun INLINE void mzHashIterBegin(HashTable* pHashTable, HashIter* pIter) {
163*4882a593Smuzhiyun pIter->pHashTable = pHashTable;
164*4882a593Smuzhiyun pIter->idx = -1;
165*4882a593Smuzhiyun mzHashIterNext(pIter);
166*4882a593Smuzhiyun }
mzHashIterDone(HashIter * pIter)167*4882a593Smuzhiyun INLINE bool mzHashIterDone(HashIter* pIter) {
168*4882a593Smuzhiyun return (pIter->idx >= pIter->pHashTable->tableSize);
169*4882a593Smuzhiyun }
mzHashIterData(HashIter * pIter)170*4882a593Smuzhiyun INLINE void* mzHashIterData(HashIter* pIter) {
171*4882a593Smuzhiyun assert(pIter->idx >= 0 && pIter->idx < pIter->pHashTable->tableSize);
172*4882a593Smuzhiyun return pIter->pHashTable->pEntries[pIter->idx].data;
173*4882a593Smuzhiyun }
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun
176*4882a593Smuzhiyun /*
177*4882a593Smuzhiyun * Evaluate hash table performance by examining the number of times we
178*4882a593Smuzhiyun * have to probe for an entry.
179*4882a593Smuzhiyun *
180*4882a593Smuzhiyun * The caller should lock the table beforehand.
181*4882a593Smuzhiyun */
182*4882a593Smuzhiyun typedef unsigned int (*HashCalcFunc)(const void* item);
183*4882a593Smuzhiyun void mzHashTableProbeCount(HashTable* pHashTable, HashCalcFunc calcFunc,
184*4882a593Smuzhiyun HashCompareFunc cmpFunc);
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun #endif /*_MINZIP_HASH*/
187