-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathchibihash64.h
82 lines (71 loc) · 2.41 KB
/
chibihash64.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
#ifndef CHIBIHASH64__HGUARD
#define CHIBIHASH64__HGUARD
// small, fast 64 bit hash function (version 2).
//
// https://github.com/N-R-K/ChibiHash
//
// This is free and unencumbered software released into the public domain.
// For more information, please refer to <https://unlicense.org/>
#include <stdint.h>
#include <stddef.h>
static inline uint64_t chibihash64__load32le(const uint8_t *p)
{
return (uint64_t)p[0] << 0 | (uint64_t)p[1] << 8 |
(uint64_t)p[2] << 16 | (uint64_t)p[3] << 24;
}
static inline uint64_t chibihash64__load64le(const uint8_t *p)
{
return chibihash64__load32le(p) | (chibihash64__load32le(p+4) << 32);
}
static inline uint64_t chibihash64__rotl(uint64_t x, int n)
{
return (x << n) | (x >> (-n & 63));
}
static inline uint64_t
chibihash64(const void *keyIn, ptrdiff_t len, uint64_t seed)
{
const uint8_t *p = (const uint8_t *)keyIn;
ptrdiff_t l = len;
const uint64_t K = UINT64_C(0x2B7E151628AED2A7); // digits of e
uint64_t seed2 = chibihash64__rotl(seed-K, 15) + chibihash64__rotl(seed-K, 47);
uint64_t h[4] = { seed, seed+K, seed2, seed2+(K*K^K) };
// depending on your system unrolling might (or might not) make things
// a tad bit faster on large strings. on my system, it actually makes
// things slower.
// generally speaking, the cost of bigger code size is usually not
// worth the trade-off since larger code-size will hinder inlinability
// but depending on your needs, you may want to uncomment the pragma
// below to unroll the loop.
//#pragma GCC unroll 2
for (; l >= 32; l -= 32) {
for (int i = 0; i < 4; ++i, p += 8) {
uint64_t stripe = chibihash64__load64le(p);
h[i] = (stripe + h[i]) * K;
h[(i+1)&3] += chibihash64__rotl(stripe, 27);
}
}
for (; l >= 8; l -= 8, p += 8) {
h[0] ^= chibihash64__load32le(p+0); h[0] *= K;
h[1] ^= chibihash64__load32le(p+4); h[1] *= K;
}
if (l >= 4) {
h[2] ^= chibihash64__load32le(p);
h[3] ^= chibihash64__load32le(p + l - 4);
} else if (l > 0) {
h[2] ^= p[0];
h[3] ^= p[l/2] | ((uint64_t)p[l-1] << 8);
}
h[0] += chibihash64__rotl(h[2] * K, 31) ^ (h[2] >> 31);
h[1] += chibihash64__rotl(h[3] * K, 31) ^ (h[3] >> 31);
h[0] *= K; h[0] ^= h[0] >> 31;
h[1] += h[0];
uint64_t x = (uint64_t)len * K;
x ^= chibihash64__rotl(x, 29);
x += seed;
x ^= h[1];
x ^= chibihash64__rotl(x, 15) ^ chibihash64__rotl(x, 42);
x *= K;
x ^= chibihash64__rotl(x, 13) ^ chibihash64__rotl(x, 31);
return x;
}
#endif // CHIBIHASH64__HGUARD