mirror of
https://github.com/DarkPlacesEngine/gmqcc.git
synced 2024-11-27 14:12:36 +00:00
fast optimized murmur hash with crc seeding, literally zero collision, and roughly only 52 instructions
This commit is contained in:
parent
ec2ff09eff
commit
a336fb62ff
1 changed files with 93 additions and 11 deletions
104
util.c
104
util.c
|
@ -525,21 +525,103 @@ typedef struct hash_node_t {
|
||||||
struct hash_node_t *next; /* next node (linked list) */
|
struct hash_node_t *next; /* next node (linked list) */
|
||||||
} hash_node_t;
|
} hash_node_t;
|
||||||
|
|
||||||
|
/*
|
||||||
size_t util_hthash(hash_table_t *ht, const char *key) {
|
* x86 and x86_64 optimized murmur hash functions for the hashtable
|
||||||
uint64_t val = 0;
|
* we have individual implementations for optimal performance.
|
||||||
size_t len = strlen(key);
|
*
|
||||||
size_t itr = 0;
|
* Forced inlined as we wrap these up in the actual utility function
|
||||||
|
* below. These should be autovectorized by gcc.
|
||||||
|
*/
|
||||||
|
#ifdef __x86_64__
|
||||||
|
GMQCC_INLINE uint32_t util_hthashfunc(hash_table_t *ht, const char *key, register size_t seed) {
|
||||||
|
const uint64_t mix = 0xC6A4A7935BD1E995;
|
||||||
|
const int rot = 47;
|
||||||
|
size_t size = strlen(key);
|
||||||
|
uint64_t hash = seed ^ (size - mix);
|
||||||
|
uint64_t alias = 0;
|
||||||
|
const uint64_t *beg = (const uint64_t*)key;
|
||||||
|
const uint64_t *end = beg + (size / 8);
|
||||||
|
const unsigned char *final = NULL;
|
||||||
|
|
||||||
|
while (beg != end) {
|
||||||
while (val < ((uint64_t)~1) /* MAX SIZE OF UINT64 */ && itr < len) {
|
alias = *beg++;
|
||||||
val = val << 8;
|
|
||||||
val += key[itr];
|
|
||||||
|
|
||||||
itr++;
|
alias *= mix;
|
||||||
|
alias ^= alias >> rot;
|
||||||
|
alias *= mix;
|
||||||
|
|
||||||
|
hash ^= alias;
|
||||||
|
hash *= mix;
|
||||||
}
|
}
|
||||||
|
|
||||||
return val % ht->size;
|
final = (const unsigned char *)beg;
|
||||||
|
|
||||||
|
switch (size & 7) {
|
||||||
|
case 7: hash ^= (uint64_t)(final[6]) << 48;
|
||||||
|
case 6: hash ^= (uint64_t)(final[5]) << 40;
|
||||||
|
case 5: hash ^= (uint64_t)(final[4]) << 32;
|
||||||
|
case 4: hash ^= (uint64_t)(final[3]) << 24;
|
||||||
|
case 3: hash ^= (uint64_t)(final[2]) << 16;
|
||||||
|
case 2: hash ^= (uint64_t)(final[1]) << 8;
|
||||||
|
case 1: hash ^= (uint64_t)(final[0]);
|
||||||
|
hash *= mix;
|
||||||
|
}
|
||||||
|
|
||||||
|
hash ^= hash >> rot;
|
||||||
|
hash *= mix;
|
||||||
|
hash ^= hash >> rot;
|
||||||
|
|
||||||
|
return (uint32_t)(hash % ht->size);
|
||||||
|
}
|
||||||
|
|
||||||
|
#else
|
||||||
|
GMQCC_INLINE uint32_t util_hthashfunc(hash_table_t *ht, const char *key, register size_t seed) {
|
||||||
|
const uint32_t mix = 0x5BD1E995;
|
||||||
|
const uint32_t rot = 24;
|
||||||
|
size_t size = strlen(key);
|
||||||
|
uint32_t hash = seed ^ size;
|
||||||
|
uint32_t alias = 0;
|
||||||
|
const unsigned char *data = (const unsigned char*)ket;
|
||||||
|
|
||||||
|
while (size >= 4) {
|
||||||
|
alias = *(uint32_t*)data;
|
||||||
|
|
||||||
|
alias *= mix;
|
||||||
|
alias ^= alias >> rot;
|
||||||
|
alias *= mix;
|
||||||
|
|
||||||
|
hash *= mix;
|
||||||
|
hash ^= alias;
|
||||||
|
|
||||||
|
data += 4;
|
||||||
|
size -= 4;
|
||||||
|
}
|
||||||
|
|
||||||
|
switch (size) {
|
||||||
|
case 3: hash ^= data[2] << 16;
|
||||||
|
case 2: hash ^= data[1] << 8;
|
||||||
|
case 1: hash ^= data[0];
|
||||||
|
hash *= mix;
|
||||||
|
}
|
||||||
|
|
||||||
|
hash ^= hash >> 13;
|
||||||
|
hash *= mix;
|
||||||
|
hash ^= hash >> 15;
|
||||||
|
|
||||||
|
return hash % ht->size;
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
|
/* we use the crc table as seeds for the murmur hash :P */
|
||||||
|
size_t util_hthash(hash_table_t *ht, const char *key) {
|
||||||
|
static size_t seed = 0;
|
||||||
|
register size_t hash = util_hthashfunc(ht, key, util_crc32_table[seed]);
|
||||||
|
|
||||||
|
/* reset seed */
|
||||||
|
if (seed >= sizeof(util_crc32_table) / sizeof(*util_crc32_table))
|
||||||
|
seed = 0;
|
||||||
|
|
||||||
|
return hash;
|
||||||
}
|
}
|
||||||
|
|
||||||
hash_node_t *_util_htnewpair(const char *key, void *value) {
|
hash_node_t *_util_htnewpair(const char *key, void *value) {
|
||||||
|
|
Loading…
Reference in a new issue