Line data Source code
1 : /**********************************************************************
2 : *
3 : * Name: tif_hash_set.c
4 : * Purpose: Hash set functions.
5 : * Author: Even Rouault, <even dot rouault at spatialys.com>
6 : *
7 : **********************************************************************
8 : * Copyright (c) 2008-2009, Even Rouault <even dot rouault at spatialys.com>
9 : *
10 : * Permission is hereby granted, free of charge, to any person obtaining a
11 : * copy of this software and associated documentation files (the "Software"),
12 : * to deal in the Software without restriction, including without limitation
13 : * the rights to use, copy, modify, merge, publish, distribute, sublicense,
14 : * and/or sell copies of the Software, and to permit persons to whom the
15 : * Software is furnished to do so, subject to the following conditions:
16 : *
17 : * The above copyright notice and this permission notice shall be included
18 : * in all copies or substantial portions of the Software.
19 : *
20 : * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
21 : * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
22 : * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
23 : * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
24 : * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
25 : * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
26 : * DEALINGS IN THE SOFTWARE.
27 : ****************************************************************************/
28 :
29 : #include "tif_config.h"
30 :
31 : #include "tif_hash_set.h"
32 :
33 : #include <assert.h>
34 : #include <stdbool.h>
35 : #include <stdint.h>
36 : #include <stdio.h>
37 : #include <stdlib.h>
38 :
39 : /** List element structure. */
40 : typedef struct _TIFFList TIFFList;
41 :
42 : /** List element structure. */
43 : struct _TIFFList
44 : {
45 : /*! Pointer to the data object. Should be allocated and freed by the
46 : * caller.
47 : * */
48 : void *pData;
49 : /*! Pointer to the next element in list. NULL, if current element is the
50 : * last one.
51 : */
52 : struct _TIFFList *psNext;
53 : };
54 :
55 : struct _TIFFHashSet
56 : {
57 : TIFFHashSetHashFunc fnHashFunc;
58 : TIFFHashSetEqualFunc fnEqualFunc;
59 : TIFFHashSetFreeEltFunc fnFreeEltFunc;
60 : TIFFList **tabList;
61 : int nSize;
62 : int nIndiceAllocatedSize;
63 : int nAllocatedSize;
64 : TIFFList *psRecyclingList;
65 : int nRecyclingListSize;
66 : bool bRehash;
67 : #ifdef HASH_DEBUG
68 : int nCollisions;
69 : #endif
70 : };
71 :
72 : static const int anPrimes[] = {
73 : 53, 97, 193, 389, 769, 1543, 3079,
74 : 6151, 12289, 24593, 49157, 98317, 196613, 393241,
75 : 786433, 1572869, 3145739, 6291469, 12582917, 25165843, 50331653,
76 : 100663319, 201326611, 402653189, 805306457, 1610612741};
77 :
78 : /************************************************************************/
79 : /* TIFFHashSetHashPointer() */
80 : /************************************************************************/
81 :
82 : /**
83 : * Hash function for an arbitrary pointer
84 : *
85 : * @param elt the arbitrary pointer to hash
86 : *
87 : * @return the hash value of the pointer
88 : */
89 :
90 0 : static unsigned long TIFFHashSetHashPointer(const void *elt)
91 : {
92 0 : return (unsigned long)(uintptr_t)((void *)(elt));
93 : }
94 :
95 : /************************************************************************/
96 : /* TIFFHashSetEqualPointer() */
97 : /************************************************************************/
98 :
99 : /**
100 : * Equality function for arbitrary pointers
101 : *
102 : * @param elt1 the first arbitrary pointer to compare
103 : * @param elt2 the second arbitrary pointer to compare
104 : *
105 : * @return true if the pointers are equal
106 : */
107 :
108 0 : static bool TIFFHashSetEqualPointer(const void *elt1, const void *elt2)
109 : {
110 0 : return elt1 == elt2;
111 : }
112 :
113 : /************************************************************************/
114 : /* TIFFHashSetNew() */
115 : /************************************************************************/
116 :
117 : /**
118 : * Creates a new hash set
119 : *
120 : * The hash function must return a hash value for the elements to insert.
121 : * If fnHashFunc is NULL, TIFFHashSetHashPointer will be used.
122 : *
123 : * The equal function must return if two elements are equal.
124 : * If fnEqualFunc is NULL, TIFFHashSetEqualPointer will be used.
125 : *
126 : * The free function is used to free elements inserted in the hash set,
127 : * when the hash set is destroyed, when elements are removed or replaced.
128 : * If fnFreeEltFunc is NULL, elements inserted into the hash set will not be
129 : * freed.
130 : *
131 : * @param fnHashFunc hash function. May be NULL.
132 : * @param fnEqualFunc equal function. May be NULL.
133 : * @param fnFreeEltFunc element free function. May be NULL.
134 : *
135 : * @return a new hash set
136 : */
137 :
138 125137 : TIFFHashSet *TIFFHashSetNew(TIFFHashSetHashFunc fnHashFunc,
139 : TIFFHashSetEqualFunc fnEqualFunc,
140 : TIFFHashSetFreeEltFunc fnFreeEltFunc)
141 : {
142 125137 : TIFFHashSet *set = (TIFFHashSet *)malloc(sizeof(TIFFHashSet));
143 125137 : if (set == NULL)
144 0 : return NULL;
145 125137 : set->fnHashFunc = fnHashFunc ? fnHashFunc : TIFFHashSetHashPointer;
146 125137 : set->fnEqualFunc = fnEqualFunc ? fnEqualFunc : TIFFHashSetEqualPointer;
147 125137 : set->fnFreeEltFunc = fnFreeEltFunc;
148 125137 : set->nSize = 0;
149 125137 : set->tabList = (TIFFList **)(calloc(53, sizeof(TIFFList *)));
150 125137 : if (set->tabList == NULL)
151 : {
152 0 : free(set);
153 0 : return NULL;
154 : }
155 125137 : set->nIndiceAllocatedSize = 0;
156 125137 : set->nAllocatedSize = 53;
157 125137 : set->psRecyclingList = NULL;
158 125137 : set->nRecyclingListSize = 0;
159 125137 : set->bRehash = false;
160 : #ifdef HASH_DEBUG
161 : set->nCollisions = 0;
162 : #endif
163 125137 : return set;
164 : }
165 :
166 : /************************************************************************/
167 : /* TIFFHashSetSize() */
168 : /************************************************************************/
169 :
170 : /**
171 : * Returns the number of elements inserted in the hash set
172 : *
173 : * Note: this is not the internal size of the hash set
174 : *
175 : * @param set the hash set
176 : *
177 : * @return the number of elements in the hash set
178 : */
179 :
180 69672 : int TIFFHashSetSize(const TIFFHashSet *set)
181 : {
182 69672 : assert(set != NULL);
183 69672 : return set->nSize;
184 : }
185 :
186 : /************************************************************************/
187 : /* TIFFHashSetGetNewListElt() */
188 : /************************************************************************/
189 :
190 139431 : static TIFFList *TIFFHashSetGetNewListElt(TIFFHashSet *set)
191 : {
192 139431 : if (set->psRecyclingList)
193 : {
194 2770 : TIFFList *psRet = set->psRecyclingList;
195 2770 : psRet->pData = NULL;
196 2770 : set->nRecyclingListSize--;
197 2770 : set->psRecyclingList = psRet->psNext;
198 2770 : return psRet;
199 : }
200 :
201 136661 : return (TIFFList *)malloc(sizeof(TIFFList));
202 : }
203 :
204 : /************************************************************************/
205 : /* TIFFHashSetReturnListElt() */
206 : /************************************************************************/
207 :
208 2792 : static void TIFFHashSetReturnListElt(TIFFHashSet *set, TIFFList *psList)
209 : {
210 2792 : if (set->nRecyclingListSize < 128)
211 : {
212 2792 : psList->psNext = set->psRecyclingList;
213 2792 : set->psRecyclingList = psList;
214 2792 : set->nRecyclingListSize++;
215 : }
216 : else
217 : {
218 0 : free(psList);
219 : }
220 2792 : }
221 :
222 : /************************************************************************/
223 : /* TIFFHashSetClearInternal() */
224 : /************************************************************************/
225 :
226 125202 : static void TIFFHashSetClearInternal(TIFFHashSet *set, bool bFinalize)
227 : {
228 125202 : assert(set != NULL);
229 6758650 : for (int i = 0; i < set->nAllocatedSize; i++)
230 : {
231 6633450 : TIFFList *cur = set->tabList[i];
232 6770200 : while (cur)
233 : {
234 136754 : if (set->fnFreeEltFunc)
235 68377 : set->fnFreeEltFunc(cur->pData);
236 136749 : TIFFList *psNext = cur->psNext;
237 136749 : if (bFinalize)
238 136749 : free(cur);
239 : else
240 0 : TIFFHashSetReturnListElt(set, cur);
241 136750 : cur = psNext;
242 : }
243 6633450 : set->tabList[i] = NULL;
244 : }
245 125198 : set->bRehash = false;
246 125198 : }
247 :
248 : /************************************************************************/
249 : /* TIFFListDestroy() */
250 : /************************************************************************/
251 :
252 : /**
253 : * Destroy a list. Caller responsible for freeing data objects contained in
254 : * list elements.
255 : *
256 : * @param psList pointer to list head.
257 : *
258 : */
259 :
260 125184 : static void TIFFListDestroy(TIFFList *psList)
261 : {
262 125184 : TIFFList *psCurrent = psList;
263 :
264 125206 : while (psCurrent)
265 : {
266 22 : TIFFList *const psNext = psCurrent->psNext;
267 22 : free(psCurrent);
268 22 : psCurrent = psNext;
269 : }
270 125184 : }
271 :
272 : /************************************************************************/
273 : /* TIFFHashSetDestroy() */
274 : /************************************************************************/
275 :
276 : /**
277 : * Destroys an allocated hash set.
278 : *
279 : * This function also frees the elements if a free function was
280 : * provided at the creation of the hash set.
281 : *
282 : * @param set the hash set
283 : */
284 :
285 125205 : void TIFFHashSetDestroy(TIFFHashSet *set)
286 : {
287 125205 : if (set)
288 : {
289 125206 : TIFFHashSetClearInternal(set, true);
290 125212 : free(set->tabList);
291 125212 : TIFFListDestroy(set->psRecyclingList);
292 125211 : free(set);
293 : }
294 125210 : }
295 :
296 : #ifdef notused
297 : /************************************************************************/
298 : /* TIFFHashSetClear() */
299 : /************************************************************************/
300 :
301 : /**
302 : * Clear all elements from a hash set.
303 : *
304 : * This function also frees the elements if a free function was
305 : * provided at the creation of the hash set.
306 : *
307 : * @param set the hash set
308 : */
309 :
310 : void TIFFHashSetClear(TIFFHashSet *set)
311 : {
312 : TIFFHashSetClearInternal(set, false);
313 : set->nIndiceAllocatedSize = 0;
314 : set->nAllocatedSize = 53;
315 : #ifdef HASH_DEBUG
316 : set->nCollisions = 0;
317 : #endif
318 : set->nSize = 0;
319 : }
320 :
321 : /************************************************************************/
322 : /* TIFFHashSetForeach() */
323 : /************************************************************************/
324 :
325 : /**
326 : * Walk through the hash set and runs the provided function on all the
327 : * elements
328 : *
329 : * This function is provided the user_data argument of TIFFHashSetForeach.
330 : * It must return true to go on the walk through the hash set, or FALSE to
331 : * make it stop.
332 : *
333 : * Note : the structure of the hash set must *NOT* be modified during the
334 : * walk.
335 : *
336 : * @param set the hash set.
337 : * @param fnIterFunc the function called on each element.
338 : * @param user_data the user data provided to the function.
339 : */
340 :
341 : void TIFFHashSetForeach(TIFFHashSet *set, TIFFHashSetIterEltFunc fnIterFunc,
342 : void *user_data)
343 : {
344 : assert(set != NULL);
345 : if (!fnIterFunc)
346 : return;
347 :
348 : for (int i = 0; i < set->nAllocatedSize; i++)
349 : {
350 : TIFFList *cur = set->tabList[i];
351 : while (cur)
352 : {
353 : if (!fnIterFunc(cur->pData, user_data))
354 : return;
355 :
356 : cur = cur->psNext;
357 : }
358 : }
359 : }
360 : #endif
361 :
362 : /************************************************************************/
363 : /* TIFFHashSetRehash() */
364 : /************************************************************************/
365 :
366 0 : static bool TIFFHashSetRehash(TIFFHashSet *set)
367 : {
368 0 : int nNewAllocatedSize = anPrimes[set->nIndiceAllocatedSize];
369 : TIFFList **newTabList =
370 0 : (TIFFList **)(calloc(nNewAllocatedSize, sizeof(TIFFList *)));
371 0 : if (newTabList == NULL)
372 0 : return false;
373 : #ifdef HASH_DEBUG
374 : TIFFDebug("TIFFHASH",
375 : "hashSet=%p, nSize=%d, nCollisions=%d, "
376 : "fCollisionRate=%.02f",
377 : set, set->nSize, set->nCollisions,
378 : set->nCollisions * 100.0 / set->nSize);
379 : set->nCollisions = 0;
380 : #endif
381 0 : for (int i = 0; i < set->nAllocatedSize; i++)
382 : {
383 0 : TIFFList *cur = set->tabList[i];
384 0 : while (cur)
385 : {
386 0 : const unsigned long nNewHashVal =
387 0 : set->fnHashFunc(cur->pData) % nNewAllocatedSize;
388 : #ifdef HASH_DEBUG
389 : if (newTabList[nNewHashVal])
390 : set->nCollisions++;
391 : #endif
392 0 : TIFFList *psNext = cur->psNext;
393 0 : cur->psNext = newTabList[nNewHashVal];
394 0 : newTabList[nNewHashVal] = cur;
395 0 : cur = psNext;
396 : }
397 : }
398 0 : free(set->tabList);
399 0 : set->tabList = newTabList;
400 0 : set->nAllocatedSize = nNewAllocatedSize;
401 0 : set->bRehash = false;
402 0 : return true;
403 : }
404 :
405 : /************************************************************************/
406 : /* TIFFHashSetFindPtr() */
407 : /************************************************************************/
408 :
409 332620 : static void **TIFFHashSetFindPtr(TIFFHashSet *set, const void *elt)
410 : {
411 332620 : const unsigned long nHashVal = set->fnHashFunc(elt) % set->nAllocatedSize;
412 332569 : TIFFList *cur = set->tabList[nHashVal];
413 333197 : while (cur)
414 : {
415 52752 : if (set->fnEqualFunc(cur->pData, elt))
416 52124 : return &cur->pData;
417 628 : cur = cur->psNext;
418 : }
419 280445 : return NULL;
420 : }
421 :
422 : /************************************************************************/
423 : /* TIFFHashSetInsert() */
424 : /************************************************************************/
425 :
426 : /**
427 : * Inserts an element into a hash set.
428 : *
429 : * If the element was already inserted in the hash set, the previous
430 : * element is replaced by the new element. If a free function was provided,
431 : * it is used to free the previously inserted element
432 : *
433 : * @param set the hash set
434 : * @param elt the new element to insert in the hash set
435 : *
436 : * @return true if success. If false is returned, elt has not been inserted,
437 : * but TIFFHashSetInsert() will have run the free function if provided.
438 : */
439 :
440 139385 : bool TIFFHashSetInsert(TIFFHashSet *set, void *elt)
441 : {
442 139385 : assert(set != NULL);
443 139385 : void **pElt = TIFFHashSetFindPtr(set, elt);
444 139390 : if (pElt)
445 : {
446 0 : if (set->fnFreeEltFunc)
447 0 : set->fnFreeEltFunc(*pElt);
448 :
449 0 : *pElt = elt;
450 0 : return true;
451 : }
452 :
453 139390 : if (set->nSize >= 2 * set->nAllocatedSize / 3 ||
454 139437 : (set->bRehash && set->nIndiceAllocatedSize > 0 &&
455 0 : set->nSize <= set->nAllocatedSize / 2))
456 : {
457 0 : set->nIndiceAllocatedSize++;
458 0 : if (!TIFFHashSetRehash(set))
459 : {
460 0 : set->nIndiceAllocatedSize--;
461 0 : if (set->fnFreeEltFunc)
462 0 : set->fnFreeEltFunc(elt);
463 0 : return false;
464 : }
465 : }
466 :
467 139437 : const unsigned long nHashVal = set->fnHashFunc(elt) % set->nAllocatedSize;
468 : #ifdef HASH_DEBUG
469 : if (set->tabList[nHashVal])
470 : set->nCollisions++;
471 : #endif
472 :
473 139471 : TIFFList *new_elt = TIFFHashSetGetNewListElt(set);
474 139453 : if (new_elt == NULL)
475 : {
476 0 : if (set->fnFreeEltFunc)
477 0 : set->fnFreeEltFunc(elt);
478 0 : return false;
479 : }
480 139453 : new_elt->pData = elt;
481 139453 : new_elt->psNext = set->tabList[nHashVal];
482 139453 : set->tabList[nHashVal] = new_elt;
483 139453 : set->nSize++;
484 :
485 139453 : return true;
486 : }
487 :
488 : /************************************************************************/
489 : /* TIFFHashSetLookup() */
490 : /************************************************************************/
491 :
492 : /**
493 : * Returns the element found in the hash set corresponding to the element to
494 : * look up The element must not be modified.
495 : *
496 : * @param set the hash set
497 : * @param elt the element to look up in the hash set
498 : *
499 : * @return the element found in the hash set or NULL
500 : */
501 :
502 193251 : void *TIFFHashSetLookup(TIFFHashSet *set, const void *elt)
503 : {
504 193251 : assert(set != NULL);
505 193251 : void **pElt = TIFFHashSetFindPtr(set, elt);
506 193195 : if (pElt)
507 52124 : return *pElt;
508 :
509 141071 : return NULL;
510 : }
511 :
512 : /************************************************************************/
513 : /* TIFFHashSetRemoveInternal() */
514 : /************************************************************************/
515 :
516 2792 : static bool TIFFHashSetRemoveInternal(TIFFHashSet *set, const void *elt,
517 : bool bDeferRehash)
518 : {
519 2792 : assert(set != NULL);
520 2792 : if (set->nIndiceAllocatedSize > 0 && set->nSize <= set->nAllocatedSize / 2)
521 : {
522 0 : set->nIndiceAllocatedSize--;
523 0 : if (bDeferRehash)
524 0 : set->bRehash = true;
525 : else
526 : {
527 0 : if (!TIFFHashSetRehash(set))
528 : {
529 0 : set->nIndiceAllocatedSize++;
530 0 : return false;
531 : }
532 : }
533 : }
534 :
535 2792 : int nHashVal = (int)(set->fnHashFunc(elt) % set->nAllocatedSize);
536 2792 : TIFFList *cur = set->tabList[nHashVal];
537 2792 : TIFFList *prev = NULL;
538 2792 : while (cur)
539 : {
540 2792 : if (set->fnEqualFunc(cur->pData, elt))
541 : {
542 2792 : if (prev)
543 0 : prev->psNext = cur->psNext;
544 : else
545 2792 : set->tabList[nHashVal] = cur->psNext;
546 :
547 2792 : if (set->fnFreeEltFunc)
548 1396 : set->fnFreeEltFunc(cur->pData);
549 :
550 2792 : TIFFHashSetReturnListElt(set, cur);
551 : #ifdef HASH_DEBUG
552 : if (set->tabList[nHashVal])
553 : set->nCollisions--;
554 : #endif
555 2792 : set->nSize--;
556 2792 : return true;
557 : }
558 0 : prev = cur;
559 0 : cur = cur->psNext;
560 : }
561 0 : return false;
562 : }
563 :
564 : /************************************************************************/
565 : /* TIFFHashSetRemove() */
566 : /************************************************************************/
567 :
568 : /**
569 : * Removes an element from a hash set
570 : *
571 : * @param set the hash set
572 : * @param elt the new element to remove from the hash set
573 : *
574 : * @return true if the element was in the hash set
575 : */
576 :
577 2792 : bool TIFFHashSetRemove(TIFFHashSet *set, const void *elt)
578 : {
579 2792 : return TIFFHashSetRemoveInternal(set, elt, false);
580 : }
581 :
582 : #ifdef notused
583 : /************************************************************************/
584 : /* TIFFHashSetRemoveDeferRehash() */
585 : /************************************************************************/
586 :
587 : /**
588 : * Removes an element from a hash set.
589 : *
590 : * This will defer potential rehashing of the set to later calls to
591 : * TIFFHashSetInsert() or TIFFHashSetRemove().
592 : *
593 : * @param set the hash set
594 : * @param elt the new element to remove from the hash set
595 : *
596 : * @return true if the element was in the hash set
597 : */
598 :
599 : bool TIFFHashSetRemoveDeferRehash(TIFFHashSet *set, const void *elt)
600 : {
601 : return TIFFHashSetRemoveInternal(set, elt, true);
602 : }
603 : #endif
|