blob: 2937ad4fe7e2c01a4de5bd2101d5e3e30a3dd9cb [file] [log] [blame]
drhbeae3192001-09-22 18:12:08 +00001/*
2** 2001 September 22
3**
4** The author disclaims copyright to this source code. In place of
5** a legal notice, here is a blessing:
6**
7** May you do good and not evil.
8** May you find forgiveness for yourself and forgive others.
9** May you share freely, never taking more than you give.
10**
11*************************************************************************
12** This is the implementation of generic hash-tables
13** used in SQLite.
14**
danielk19774adee202004-05-08 08:23:19 +000015** $Id: hash.c,v 1.12 2004/05/08 08:23:25 danielk1977 Exp $
drhbeae3192001-09-22 18:12:08 +000016*/
17#include "sqliteInt.h"
18#include <assert.h>
19
20/* Turn bulk memory into a hash table object by initializing the
21** fields of the Hash structure.
drhaacc5432002-01-06 17:07:40 +000022**
23** "new" is a pointer to the hash table that is to be initialized.
24** keyClass is one of the constants SQLITE_HASH_INT, SQLITE_HASH_POINTER,
25** SQLITE_HASH_BINARY, or SQLITE_HASH_STRING. The value of keyClass
26** determines what kind of key the hash table will use. "copyKey" is
27** true if the hash table should make its own private copy of keys and
28** false if it should just use the supplied pointer. CopyKey only makes
29** sense for SQLITE_HASH_STRING and SQLITE_HASH_BINARY and is ignored
30** for other key classes.
drhbeae3192001-09-22 18:12:08 +000031*/
danielk19774adee202004-05-08 08:23:19 +000032void sqlite3HashInit(Hash *new, int keyClass, int copyKey){
drhbeae3192001-09-22 18:12:08 +000033 assert( new!=0 );
34 assert( keyClass>=SQLITE_HASH_INT && keyClass<=SQLITE_HASH_BINARY );
35 new->keyClass = keyClass;
36 new->copyKey = copyKey &&
37 (keyClass==SQLITE_HASH_STRING || keyClass==SQLITE_HASH_BINARY);
38 new->first = 0;
39 new->count = 0;
40 new->htsize = 0;
41 new->ht = 0;
42}
43
44/* Remove all entries from a hash table. Reclaim all memory.
drhaacc5432002-01-06 17:07:40 +000045** Call this routine to delete a hash table or to reset a hash table
46** to the empty state.
drhbeae3192001-09-22 18:12:08 +000047*/
danielk19774adee202004-05-08 08:23:19 +000048void sqlite3HashClear(Hash *pH){
drhbeae3192001-09-22 18:12:08 +000049 HashElem *elem; /* For looping over all elements of the table */
50
51 assert( pH!=0 );
52 elem = pH->first;
53 pH->first = 0;
54 if( pH->ht ) sqliteFree(pH->ht);
55 pH->ht = 0;
56 pH->htsize = 0;
57 while( elem ){
58 HashElem *next_elem = elem->next;
59 if( pH->copyKey && elem->pKey ){
60 sqliteFree(elem->pKey);
61 }
62 sqliteFree(elem);
63 elem = next_elem;
64 }
65 pH->count = 0;
66}
67
68/*
69** Hash and comparison functions when the mode is SQLITE_HASH_INT
70*/
71static int intHash(const void *pKey, int nKey){
72 return nKey ^ (nKey<<8) ^ (nKey>>8);
73}
74static int intCompare(const void *pKey1, int n1, const void *pKey2, int n2){
75 return n2 - n1;
76}
77
drhba212562004-01-08 02:17:31 +000078#if 0 /* NOT USED */
drhbeae3192001-09-22 18:12:08 +000079/*
80** Hash and comparison functions when the mode is SQLITE_HASH_POINTER
81*/
82static int ptrHash(const void *pKey, int nKey){
drh5a2c2c22001-11-21 02:21:11 +000083 uptr x = Addr(pKey);
84 return x ^ (x<<8) ^ (x>>8);
drhbeae3192001-09-22 18:12:08 +000085}
86static int ptrCompare(const void *pKey1, int n1, const void *pKey2, int n2){
drh5a2c2c22001-11-21 02:21:11 +000087 if( pKey1==pKey2 ) return 0;
88 if( pKey1<pKey2 ) return -1;
89 return 1;
drhbeae3192001-09-22 18:12:08 +000090}
drhba212562004-01-08 02:17:31 +000091#endif
drhbeae3192001-09-22 18:12:08 +000092
93/*
94** Hash and comparison functions when the mode is SQLITE_HASH_STRING
95*/
96static int strHash(const void *pKey, int nKey){
danielk19774adee202004-05-08 08:23:19 +000097 return sqlite3HashNoCase((const char*)pKey, nKey);
drhbeae3192001-09-22 18:12:08 +000098}
99static int strCompare(const void *pKey1, int n1, const void *pKey2, int n2){
100 if( n1!=n2 ) return n2-n1;
danielk19774adee202004-05-08 08:23:19 +0000101 return sqlite3StrNICmp((const char*)pKey1,(const char*)pKey2,n1);
drhbeae3192001-09-22 18:12:08 +0000102}
103
104/*
105** Hash and comparison functions when the mode is SQLITE_HASH_BINARY
106*/
107static int binHash(const void *pKey, int nKey){
108 int h = 0;
109 const char *z = (const char *)pKey;
110 while( nKey-- > 0 ){
111 h = (h<<3) ^ h ^ *(z++);
112 }
drh5364f602003-05-12 23:06:52 +0000113 return h & 0x7fffffff;
drhbeae3192001-09-22 18:12:08 +0000114}
115static int binCompare(const void *pKey1, int n1, const void *pKey2, int n2){
116 if( n1!=n2 ) return n2-n1;
117 return memcmp(pKey1,pKey2,n1);
118}
119
120/*
121** Return a pointer to the appropriate hash function given the key class.
drhaacc5432002-01-06 17:07:40 +0000122**
123** The C syntax in this function definition may be unfamilar to some
124** programmers, so we provide the following additional explanation:
125**
126** The name of the function is "hashFunction". The function takes a
127** single parameter "keyClass". The return value of hashFunction()
128** is a pointer to another function. Specifically, the return value
129** of hashFunction() is a pointer to a function that takes two parameters
130** with types "const void*" and "int" and returns an "int".
drhbeae3192001-09-22 18:12:08 +0000131*/
132static int (*hashFunction(int keyClass))(const void*,int){
133 switch( keyClass ){
drh1ab43002002-01-14 09:28:19 +0000134 case SQLITE_HASH_INT: return &intHash;
drhba212562004-01-08 02:17:31 +0000135 /* case SQLITE_HASH_POINTER: return &ptrHash; // NOT USED */
drh1ab43002002-01-14 09:28:19 +0000136 case SQLITE_HASH_STRING: return &strHash;
137 case SQLITE_HASH_BINARY: return &binHash;;
drhbeae3192001-09-22 18:12:08 +0000138 default: break;
139 }
140 return 0;
141}
142
143/*
144** Return a pointer to the appropriate hash function given the key class.
drhaacc5432002-01-06 17:07:40 +0000145**
146** For help in interpreted the obscure C code in the function definition,
147** see the header comment on the previous function.
drhbeae3192001-09-22 18:12:08 +0000148*/
149static int (*compareFunction(int keyClass))(const void*,int,const void*,int){
150 switch( keyClass ){
drh1ab43002002-01-14 09:28:19 +0000151 case SQLITE_HASH_INT: return &intCompare;
drhba212562004-01-08 02:17:31 +0000152 /* case SQLITE_HASH_POINTER: return &ptrCompare; // NOT USED */
drh1ab43002002-01-14 09:28:19 +0000153 case SQLITE_HASH_STRING: return &strCompare;
154 case SQLITE_HASH_BINARY: return &binCompare;
drhbeae3192001-09-22 18:12:08 +0000155 default: break;
156 }
157 return 0;
158}
159
160
drhaacc5432002-01-06 17:07:40 +0000161/* Resize the hash table so that it cantains "new_size" buckets.
162** "new_size" must be a power of 2. The hash table might fail
163** to resize if sqliteMalloc() fails.
drhbeae3192001-09-22 18:12:08 +0000164*/
165static void rehash(Hash *pH, int new_size){
166 struct _ht *new_ht; /* The new hash table */
167 HashElem *elem, *next_elem; /* For looping over existing elements */
168 HashElem *x; /* Element being copied to new hash table */
169 int (*xHash)(const void*,int); /* The hash function */
170
171 assert( (new_size & (new_size-1))==0 );
172 new_ht = (struct _ht *)sqliteMalloc( new_size*sizeof(struct _ht) );
173 if( new_ht==0 ) return;
174 if( pH->ht ) sqliteFree(pH->ht);
175 pH->ht = new_ht;
176 pH->htsize = new_size;
177 xHash = hashFunction(pH->keyClass);
178 for(elem=pH->first, pH->first=0; elem; elem = next_elem){
179 int h = (*xHash)(elem->pKey, elem->nKey) & (new_size-1);
180 next_elem = elem->next;
181 x = new_ht[h].chain;
182 if( x ){
183 elem->next = x;
184 elem->prev = x->prev;
185 if( x->prev ) x->prev->next = elem;
186 else pH->first = elem;
187 x->prev = elem;
188 }else{
189 elem->next = pH->first;
190 if( pH->first ) pH->first->prev = elem;
191 elem->prev = 0;
192 pH->first = elem;
193 }
194 new_ht[h].chain = elem;
195 new_ht[h].count++;
196 }
197}
198
199/* This function (for internal use only) locates an element in an
drhaacc5432002-01-06 17:07:40 +0000200** hash table that matches the given key. The hash for this key has
201** already been computed and is passed as the 4th parameter.
drhbeae3192001-09-22 18:12:08 +0000202*/
203static HashElem *findElementGivenHash(
204 const Hash *pH, /* The pH to be searched */
205 const void *pKey, /* The key we are searching for */
206 int nKey,
207 int h /* The hash for this key. */
208){
209 HashElem *elem; /* Used to loop thru the element list */
210 int count; /* Number of elements left to test */
211 int (*xCompare)(const void*,int,const void*,int); /* comparison function */
212
213 if( pH->ht ){
214 elem = pH->ht[h].chain;
215 count = pH->ht[h].count;
216 xCompare = compareFunction(pH->keyClass);
217 while( count-- && elem ){
218 if( (*xCompare)(elem->pKey,elem->nKey,pKey,nKey)==0 ){
219 return elem;
220 }
221 elem = elem->next;
222 }
223 }
224 return 0;
225}
226
drh81a20f22001-10-12 17:30:04 +0000227/* Remove a single entry from the hash table given a pointer to that
drhbeae3192001-09-22 18:12:08 +0000228** element and a hash on the element's key.
229*/
230static void removeElementGivenHash(
231 Hash *pH, /* The pH containing "elem" */
232 HashElem* elem, /* The element to be removed from the pH */
drhaacc5432002-01-06 17:07:40 +0000233 int h /* Hash value for the element */
drhbeae3192001-09-22 18:12:08 +0000234){
235 if( elem->prev ){
236 elem->prev->next = elem->next;
237 }else{
238 pH->first = elem->next;
239 }
240 if( elem->next ){
241 elem->next->prev = elem->prev;
242 }
243 if( pH->ht[h].chain==elem ){
244 pH->ht[h].chain = elem->next;
245 }
246 pH->ht[h].count--;
247 if( pH->ht[h].count<=0 ){
248 pH->ht[h].chain = 0;
249 }
250 if( pH->copyKey && elem->pKey ){
251 sqliteFree(elem->pKey);
252 }
253 sqliteFree( elem );
254 pH->count--;
255}
256
drhaacc5432002-01-06 17:07:40 +0000257/* Attempt to locate an element of the hash table pH with a key
drh81a20f22001-10-12 17:30:04 +0000258** that matches pKey,nKey. Return the data for this element if it is
drhaacc5432002-01-06 17:07:40 +0000259** found, or NULL if there is no match.
drhbeae3192001-09-22 18:12:08 +0000260*/
danielk19774adee202004-05-08 08:23:19 +0000261void *sqlite3HashFind(const Hash *pH, const void *pKey, int nKey){
drhbeae3192001-09-22 18:12:08 +0000262 int h; /* A hash on key */
263 HashElem *elem; /* The element that matches key */
264 int (*xHash)(const void*,int); /* The hash function */
265
266 if( pH==0 || pH->ht==0 ) return 0;
267 xHash = hashFunction(pH->keyClass);
268 assert( xHash!=0 );
269 h = (*xHash)(pKey,nKey);
270 assert( (pH->htsize & (pH->htsize-1))==0 );
271 elem = findElementGivenHash(pH,pKey,nKey, h & (pH->htsize-1));
272 return elem ? elem->data : 0;
273}
274
drh81a20f22001-10-12 17:30:04 +0000275/* Insert an element into the hash table pH. The key is pKey,nKey
276** and the data is "data".
drhbeae3192001-09-22 18:12:08 +0000277**
drh81a20f22001-10-12 17:30:04 +0000278** If no element exists with a matching key, then a new
279** element is created. A copy of the key is made if the copyKey
280** flag is set. NULL is returned.
drhbeae3192001-09-22 18:12:08 +0000281**
282** If another element already exists with the same key, then the
283** new data replaces the old data and the old data is returned.
drh6d4abfb2001-10-22 02:58:08 +0000284** The key is not copied in this instance. If a malloc fails, then
drhaacc5432002-01-06 17:07:40 +0000285** the new data is returned and the hash table is unchanged.
drhbeae3192001-09-22 18:12:08 +0000286**
287** If the "data" parameter to this function is NULL, then the
drh81a20f22001-10-12 17:30:04 +0000288** element corresponding to "key" is removed from the hash table.
drhbeae3192001-09-22 18:12:08 +0000289*/
danielk19774adee202004-05-08 08:23:19 +0000290void *sqlite3HashInsert(Hash *pH, const void *pKey, int nKey, void *data){
drhbeae3192001-09-22 18:12:08 +0000291 int hraw; /* Raw hash value of the key */
292 int h; /* the hash of the key modulo hash table size */
293 HashElem *elem; /* Used to loop thru the element list */
294 HashElem *new_elem; /* New element added to the pH */
295 int (*xHash)(const void*,int); /* The hash function */
296
297 assert( pH!=0 );
298 xHash = hashFunction(pH->keyClass);
299 assert( xHash!=0 );
300 hraw = (*xHash)(pKey, nKey);
301 assert( (pH->htsize & (pH->htsize-1))==0 );
302 h = hraw & (pH->htsize-1);
303 elem = findElementGivenHash(pH,pKey,nKey,h);
304 if( elem ){
305 void *old_data = elem->data;
306 if( data==0 ){
307 removeElementGivenHash(pH,elem,h);
308 }else{
309 elem->data = data;
310 }
311 return old_data;
312 }
313 if( data==0 ) return 0;
314 new_elem = (HashElem*)sqliteMalloc( sizeof(HashElem) );
drh6d4abfb2001-10-22 02:58:08 +0000315 if( new_elem==0 ) return data;
drhbeae3192001-09-22 18:12:08 +0000316 if( pH->copyKey && pKey!=0 ){
drh8c1238a2003-01-02 14:43:55 +0000317 new_elem->pKey = sqliteMallocRaw( nKey );
drhbeae3192001-09-22 18:12:08 +0000318 if( new_elem->pKey==0 ){
319 sqliteFree(new_elem);
drh6d4abfb2001-10-22 02:58:08 +0000320 return data;
drhbeae3192001-09-22 18:12:08 +0000321 }
322 memcpy((void*)new_elem->pKey, pKey, nKey);
323 }else{
drh2ce1a6e2002-05-21 23:44:30 +0000324 new_elem->pKey = (void*)pKey;
drhbeae3192001-09-22 18:12:08 +0000325 }
326 new_elem->nKey = nKey;
327 pH->count++;
328 if( pH->htsize==0 ) rehash(pH,8);
329 if( pH->htsize==0 ){
330 pH->count = 0;
331 sqliteFree(new_elem);
drh6d4abfb2001-10-22 02:58:08 +0000332 return data;
drhbeae3192001-09-22 18:12:08 +0000333 }
334 if( pH->count > pH->htsize ){
335 rehash(pH,pH->htsize*2);
336 }
337 assert( (pH->htsize & (pH->htsize-1))==0 );
338 h = hraw & (pH->htsize-1);
339 elem = pH->ht[h].chain;
340 if( elem ){
341 new_elem->next = elem;
342 new_elem->prev = elem->prev;
343 if( elem->prev ){ elem->prev->next = new_elem; }
344 else { pH->first = new_elem; }
345 elem->prev = new_elem;
346 }else{
347 new_elem->next = pH->first;
348 new_elem->prev = 0;
349 if( pH->first ){ pH->first->prev = new_elem; }
350 pH->first = new_elem;
351 }
352 pH->ht[h].count++;
353 pH->ht[h].chain = new_elem;
354 new_elem->data = data;
355 return 0;
356}
danielk19774adee202004-05-08 08:23:19 +0000357
358
359