/* Generic open-addressing hash table: ready-made hash/compare helpers and the HASH_DECL generator macro. */
#ifndef _HASH_GENERIC
|
|
#define _HASH_GENERIC
|
|
|
|
#include <string.h>
|
|
#include <stdlib.h>
|
|
|
|
|
|
#define HASH_MAXSIZE 4096
|
|
// for fibonacci hashing, 2^{32,64}/<golden ratio>
|
|
#define HASH_RATIO32 (unsigned int)2654435769u
|
|
#define HASH_RATIO64 (unsigned long long int)11400714819322457583u
|
|
// salt for string hashing
|
|
#define HASH_STRSALT 0xbabb0cac
|
|
|
|
|
|
/* Ready-made compares */
|
|
/* Equality predicate for unsigned int codes: returns 1 when a equals b, 0 otherwise. */
static inline int hash_cmp_u32(unsigned int a, unsigned int b)
{
	return !(a != b);
}
|
|
/* Equality predicate for unsigned long long codes: returns 1 when a equals b, 0 otherwise. */
static inline int hash_cmp_u64(unsigned long long int a, unsigned long long int b)
{
	return !(a != b);
}
|
|
/*
 * Equality predicate for NUL-terminated string codes: returns 1 when
 * strcmp() reports the two strings equal, 0 otherwise.
 * Both pointers are passed straight to strcmp(), so neither may be NULL.
 */
static inline int hash_cmp_str(const char *a, const char *b)
{
	const int order = strcmp(a, b);

	return order == 0;
}
|
|
|
|
|
|
/* Ready-made hashes */
|
|
static inline unsigned int hash_u64(unsigned long long int c)
|
|
{
|
|
return (unsigned long long int)((unsigned long long int)(c*HASH_RATIO64)>>32);
|
|
}
|
|
static inline unsigned int hash_u32(unsigned int c)
|
|
{
|
|
return (unsigned int)((unsigned long long int)(c*HASH_RATIO32)>>32);
|
|
}
|
|
static inline unsigned int hash_str(const char *s)
|
|
{
|
|
unsigned int h = HASH_STRSALT;
|
|
const unsigned char *v = (const unsigned char *)(s);
|
|
for (int x = *s; x; x--) {
|
|
h += v[x-1];
|
|
h += h << 10;
|
|
h ^= h >> 6;
|
|
}
|
|
h += h << 3;
|
|
h ^= h >> 11;
|
|
h += h << 15;
|
|
return h;
|
|
}
|
|
|
|
|
|
/*
 * HASH_DECL(hashname, codetype, datatype, hashfn, cmpfn)
 *
 * Generates an open-addressing hash table specialised for one key/value
 * type pair. The expansion defines:
 *
 *   struct hashname_entry   { codetype code; datatype data; }
 *   struct hashname_ref     table header followed by the bucket array
 *   hashname_create(size)   allocate a zeroed table; size is rounded up to
 *                           a power of two; NULL if size is 0, larger than
 *                           HASH_MAXSIZE, or allocation fails
 *   hashname_destroy(ht)    free the table (NULL is accepted)
 *   hashname_search(ht, c)  pointer to the live entry with code c, or NULL
 *   hashname_insert(ht, e)  copy *e into the table, overwriting an entry
 *                           with the same code; returns the stored slot, or
 *                           NULL if ht/e is NULL, the code is reserved, or
 *                           the table is full
 *   hashname_remove(ht, c)  remove the entry with code c; returns the
 *                           number of entries removed (0 or 1), -1 if ht
 *                           is NULL
 *   hashnamelookup(ht, c)   (static, internal) probe for c
 *
 * Parameters:
 *   codetype  scalar key type; it is tested with `!`, compared with `==`
 *             and cast from -1, so integer and pointer types work.
 *   hashfn    unsigned int hashfn(codetype)
 *   cmpfn     int cmpfn(codetype, codetype), non-zero when equal
 *
 * Reserved code values: 0 marks a never-used slot and (codetype)(-1) marks
 * a removed slot (tombstone). Neither can be stored or looked up; they are
 * rejected instead of silently corrupting the item count.
 * NOTE: for pointer code types the (codetype)(-1) cast is
 * implementation-defined.
 *
 * Probing uses triangular increments (h, h+1, h+3, h+6, ...) masked to the
 * table size; with a power-of-two size this visits every slot within
 * `size` probes, which bounds the lookup loop. Removed slots are kept as
 * tombstones so that probe chains passing through them stay intact, and
 * are reused by later insertions.
 *
 * The public functions have external linkage, so a given hashname should
 * be instantiated in exactly one translation unit. Requires <stdlib.h>.
 */
#define HASH_DECL(hashname, codetype, datatype, hashfn, cmpfn) \
struct hashname##_entry { \
	codetype code; \
	datatype data; \
}; \
\
struct hashname##_ref { \
	unsigned int items, size; \
	struct hashname##_entry bucket[]; \
}; \
\
struct hashname##_ref * hashname##_create(unsigned int size) \
{ \
	if (!size || size > HASH_MAXSIZE) \
		return NULL; \
	/* Round up to the next power of two. The doubling cannot wrap */ \
	/* while HASH_MAXSIZE is at most 2^31 (size <= HASH_MAXSIZE). */ \
	unsigned int cap = 1; \
	while (cap < size) \
		cap <<= 1; \
	/* Refuse sizes whose byte count would overflow size_t. */ \
	if (cap > ((size_t)-1 - sizeof(struct hashname##_ref)) / sizeof(struct hashname##_entry)) \
		return NULL; \
	/* calloc zeroes the buckets, i.e. marks every slot as never used. */ \
	struct hashname##_ref *ht = calloc(1, sizeof(struct hashname##_ref) + sizeof(struct hashname##_entry) * cap); \
	if (ht) { \
		ht->items = 0; \
		ht->size = cap; \
	} \
	return ht; \
} \
\
void hashname##_destroy(struct hashname##_ref *ht) \
{ \
	/* free(NULL) is a no-op, no guard needed. */ \
	free(ht); \
} \
\
/* Probe for code. Returns the live entry holding code if present; */ \
/* otherwise the slot an insertion should use (first tombstone met, */ \
/* else the terminating empty slot); NULL if ht is NULL, code is a */ \
/* reserved value, or the table has no free slot. */ \
static struct hashname##_entry * hashname##lookup(struct hashname##_ref *ht, codetype code) \
{ \
	if (!ht) \
		return NULL; \
	if (!code || code == (codetype)(-1)) \
		return NULL; \
	/* fast modulo operation for power-of-2 size */ \
	const unsigned int mask = ht->size - 1; \
	struct hashname##_entry *reuse = NULL; \
	unsigned int i = hashfn(code); \
	/* At most `size` probes: enough to visit every slot once. */ \
	for (unsigned int j = 1; j <= ht->size; i += j++) { \
		struct hashname##_entry *e = &ht->bucket[i & mask]; \
		if (!e->code) \
			return reuse ? reuse : e; \
		if (e->code == (codetype)(-1)) { \
			/* Tombstone: remember it, never hand it to cmpfn. */ \
			if (!reuse) \
				reuse = e; \
			continue; \
		} \
		if (cmpfn(e->code, code)) \
			return e; \
	} \
	return reuse; \
} \
\
/* Find and return the element by code */ \
struct hashname##_entry * hashname##_search(struct hashname##_ref *ht, codetype code) \
{ \
	struct hashname##_entry *r = hashname##lookup(ht, code); \
	/* A live slot returned by the lookup is always a match. */ \
	if (r && r->code && r->code != (codetype)(-1)) \
		return r; \
	return NULL; \
} \
\
/* Insert a copy of *entry; an existing entry with the same code is */ \
/* overwritten. */ \
struct hashname##_entry * hashname##_insert(struct hashname##_ref *ht, struct hashname##_entry *entry) \
{ \
	if (!ht || !entry) \
		return NULL; \
	struct hashname##_entry *r = hashname##lookup(ht, entry->code); \
	if (r) { \
		/* Only a previously free slot adds to the item count. */ \
		if (!r->code || r->code == (codetype)(-1)) \
			ht->items++; \
		*r = *entry; \
	} \
	return r; \
} \
\
/* returns the number of removed items */ \
int hashname##_remove(struct hashname##_ref *ht, codetype code) \
{ \
	if (!ht) \
		return -1; \
	struct hashname##_entry *r = hashname##lookup(ht, code); \
	if (!r || !r->code || r->code == (codetype)(-1)) \
		return 0; \
	/* Clear the payload but leave a tombstone so that entries further */ \
	/* along the same probe chain remain reachable. */ \
	*r = (struct hashname##_entry){0}; \
	r->code = (codetype)(-1); \
	ht->items--; \
	return 1; \
}
|
|
|
|
#endif
|
|
|