]>
git.ipfire.org Git - thirdparty/squid.git/blob - lib/hash.cc
5 * DEBUG: section 00 Hash Tables
6 * AUTHOR: Harvest Derived
8 * SQUID Web Proxy Cache http://www.squid-cache.org/
9 * ----------------------------------------------------------
11 * Squid is the result of efforts by numerous individuals from
12 * the Internet community; see the CONTRIBUTORS file for full
13 * details. Many organizations have provided support for Squid's
14 * development; see the SPONSORS file for full details. Squid is
15 * Copyrighted (C) 2001 by the Regents of the University of
16 * California; see the COPYRIGHT file for full details. Squid
17 * incorporates software developed and/or copyrighted by other
18 * sources; see the CREDITS file for full details.
20 * This program is free software; you can redistribute it and/or modify
21 * it under the terms of the GNU General Public License as published by
22 * the Free Software Foundation; either version 2 of the License, or
23 * (at your option) any later version.
25 * This program is distributed in the hope that it will be useful,
26 * but WITHOUT ANY WARRANTY; without even the implied warranty of
27 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
28 * GNU General Public License for more details.
30 * You should have received a copy of the GNU General Public License
31 * along with this program; if not, write to the Free Software
32 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
38 #include "profiler/Profiler.h"
53 #include <gnumalloc.h>
64 static void hash_next_bucket(hash_table
* hid
);
67 hash_string(const void *data
, unsigned int size
)
69 const unsigned char *s
= static_cast<const unsigned char *>(data
);
82 /* the following function(s) were adapted from
83 * usr/src/lib/libc/db/hash_func.c, 4.4 BSD lite */
85 /* Hash function from Chris Torek. */
87 hash4(const void *data
, unsigned int size
)
89 const char *key
= static_cast<const char *>(data
);
94 #define HASH4a h = (h << 5) - h + *key++;
95 #define HASH4b h = (h << 5) + h + *key++;
101 switch (len
& (8 - 1)) {
140 * hash_create - creates a new hash table, uses the cmp_func
141 * to compare keys. Returns the identification for the hash table;
142 * otherwise returns a negative number on error.
145 hash_create(HASHCMP
* cmp_func
, int hash_sz
, HASHHASH
* hash_func
)
147 hash_table
*hid
= (hash_table
*)xcalloc(1, sizeof(hash_table
));
149 hid
->size
= (unsigned int) DEFAULT_HASH_SIZE
;
151 hid
->size
= (unsigned int) hash_sz
;
152 /* allocate and null the buckets */
153 hid
->buckets
= (hash_link
**)xcalloc(hid
->size
, sizeof(hash_link
*));
155 hid
->hash
= hash_func
;
157 hid
->current_slot
= 0;
162 * hash_join - joins a hash_link under its key lnk->key
163 * into the hash table 'hid'.
165 * It does not copy any data into the hash table, only links pointers.
168 hash_join(hash_table
* hid
, hash_link
* lnk
)
171 i
= hid
->hash(lnk
->key
, hid
->size
);
172 lnk
->next
= hid
->buckets
[i
];
173 hid
->buckets
[i
] = lnk
;
178 * hash_lookup - locates the item under the key 'k' in the hash table
179 * 'hid'. Returns a pointer to the hash bucket on success; otherwise
183 hash_lookup(hash_table
* hid
, const void *k
)
186 PROF_start(hash_lookup
);
188 b
= hid
->hash(k
, hid
->size
);
189 for (hash_link
*walker
= hid
->buckets
[b
]; walker
!= NULL
; walker
= walker
->next
) {
190 if ((hid
->cmp
) (k
, walker
->key
) == 0) {
191 PROF_stop(hash_lookup
);
194 assert(walker
!= walker
->next
);
196 PROF_stop(hash_lookup
);
201 hash_next_bucket(hash_table
* hid
)
203 while (hid
->next
== NULL
&& ++hid
->current_slot
< hid
->size
)
204 hid
->next
= hid
->buckets
[hid
->current_slot
];
208 * hash_first - initializes the hash table for the hash_next()
212 hash_first(hash_table
* hid
)
214 assert(NULL
== hid
->next
);
215 hid
->current_slot
= 0;
216 hid
->next
= hid
->buckets
[hid
->current_slot
];
217 if (NULL
== hid
->next
)
218 hash_next_bucket(hid
);
222 * hash_next - returns the next item in the hash table 'hid'.
223 * Otherwise, returns NULL on error or end of list.
225 * MUST call hash_first() before hash_next().
228 hash_next(hash_table
* hid
)
230 hash_link
*p
= hid
->next
;
234 if (NULL
== hid
->next
)
235 hash_next_bucket(hid
);
240 * hash_last - resets hash traversal state to NULL
244 hash_last(hash_table
* hid
)
248 hid
->current_slot
= 0;
252 * hash_remove_link - deletes the given hash_link node from the
253 * hash table 'hid'. Does not free the item, only removes it
256 * An assertion is triggered if the hash_link is not found in the
260 hash_remove_link(hash_table
* hid
, hash_link
* hl
)
263 int i
= hid
->hash(hl
->key
, hid
->size
);
264 for (hash_link
**P
= &hid
->buckets
[i
]; *P
; P
= &(*P
)->next
) {
268 if (hid
->next
== hl
) {
269 hid
->next
= hl
->next
;
270 if (NULL
== hid
->next
)
271 hash_next_bucket(hid
);
280 * hash_get_bucket - returns the head item of the bucket
281 * in the hash table 'hid'. Otherwise, returns NULL on error.
284 hash_get_bucket(hash_table
* hid
, unsigned int bucket
)
286 if (bucket
>= hid
->size
)
288 return (hid
->buckets
[bucket
]);
292 hashFreeItems(hash_table
* hid
, HASHFREE
* free_func
)
296 hash_link
**list
= (hash_link
**)xcalloc(hid
->count
, sizeof(hash_link
*));
298 while ((l
= hash_next(hid
)) && i
< hid
->count
) {
302 for (int j
= 0; j
< i
; ++j
)
303 free_func(*(list
+ j
));
308 hashFreeMemory(hash_table
* hid
)
317 static int hash_primes
[] = {
335 int I
= sizeof(hash_primes
) / sizeof(int);
336 int best_prime
= hash_primes
[0];
337 double min
= fabs(log((double) n
) - log((double) hash_primes
[0]));
339 for (int i
= 0; i
< I
; ++i
) {
340 d
= fabs(log((double) n
) - log((double) hash_primes
[i
]));
344 best_prime
= hash_primes
[i
];
350 * return the key of a hash_link as a const string
353 hashKeyStr(hash_link
* hl
)
355 return (const char *) hl
->key
;
360 * hash-driver - Run with a big file as stdin to insert each line into the
361 * hash table, then prints the whole hash table, then deletes a random item,
362 * and prints the table again...
368 LOCAL_ARRAY(char, buf
, BUFSIZ
);
369 LOCAL_ARRAY(char, todelete
, BUFSIZ
);
370 hash_link
*walker
= NULL
;
375 printf("creating hash table\n");
376 if ((hid
= hash_create((HASHCMP
*) strcmp
, 229, hash4
)) < 0) {
377 printf("hash_create error.\n");
380 printf("done creating hash table: %d\n", hid
);
382 while (fgets(buf
, BUFSIZ
, stdin
)) {
383 buf
[strlen(buf
) - 1] = '\0';
384 printf("Inserting '%s' for item %p to hash table: %d\n",
386 hash_insert(hid
, xstrdup(buf
), (void *) 0x12345678);
387 if (random() % 17 == 0)
388 strcpy(todelete
, buf
);
391 printf("walking hash table...\n");
392 for (int i
= 0, walker
= hash_first(hid
); walker
; walker
= hash_next(hid
)) {
393 printf("item %5d: key: '%s' item: %p\n", i
++, walker
->key
,
396 printf("done walking hash table...\n");
399 printf("deleting %s from %d\n", todelete
, hid
);
400 if (hash_delete(hid
, todelete
))
401 printf("hash_delete error\n");
403 printf("walking hash table...\n");
404 for (int i
= 0, walker
= hash_first(hid
); walker
; walker
= hash_next(hid
)) {
405 printf("item %5d: key: '%s' item: %p\n", i
++, walker
->key
,
408 printf("done walking hash table...\n");
410 printf("driver finished.\n");