/*
 * Copyright 2012-2015 Samy Al Bahra
 * Copyright 2011-2014 AppNexus, Inc.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
261fb62fb0SOlivier Houchard
271fb62fb0SOlivier Houchard #ifndef CK_HT_HASH_H
281fb62fb0SOlivier Houchard #define CK_HT_HASH_H
291fb62fb0SOlivier Houchard
/*
 * This is the Murmur hash written by Austin Appleby.
 */
331fb62fb0SOlivier Houchard
341fb62fb0SOlivier Houchard #include <ck_stdint.h>
351fb62fb0SOlivier Houchard #include <ck_string.h>
361fb62fb0SOlivier Houchard
//-----------------------------------------------------------------------------
// MurmurHash3 was written by Austin Appleby, and is placed in the public
// domain. The author hereby disclaims copyright to this source code.

// Note - The x86 and x64 versions do _not_ produce the same results, as the
// algorithms are optimized for their respective platforms. You can still
// compile and run any of them on any platform, but your performance with the
// non-native version will be less than optimal.

//-----------------------------------------------------------------------------
// Platform-specific functions and macros

// Microsoft Visual Studio
501fb62fb0SOlivier Houchard
#if defined(_MSC_VER)

#define FORCE_INLINE	__forceinline

#include <stdlib.h>

/* On MSVC the rotate macros map straight onto _rotl / _rotl64. */
#define ROTL32(x,y)	_rotl(x,y)
#define ROTL64(x,y)	_rotl64(x,y)

#define BIG_CONSTANT(x) (x)

// Other compilers

#else	// defined(_MSC_VER)

#define FORCE_INLINE inline __attribute__((always_inline))

/*
 * Rotate the 32-bit value x left by r bit positions.
 *
 * The count is reduced modulo 32 before shifting, so r == 0 (and any
 * count outside 1..31, including negative ones) no longer produces a
 * shift by the full type width, which is undefined behaviour in C.
 * Counts in 1..31 yield exactly the same result as before.
 */
static inline uint32_t rotl32 ( uint32_t x, int8_t r )
{
	const unsigned int s = (unsigned int)r & 31u;

	return (x << s) | (x >> ((32u - s) & 31u));
}

/*
 * Rotate the 64-bit value x left by r bit positions.
 *
 * The count is reduced modulo 64 for the same reason as in rotl32().
 */
static inline uint64_t rotl64 ( uint64_t x, int8_t r )
{
	const unsigned int s = (unsigned int)r & 63u;

	return (x << s) | (x >> ((64u - s) & 63u));
}

#define ROTL32(x,y)	rotl32(x,y)
#define ROTL64(x,y)	rotl64(x,y)

/* Append the unsigned long long suffix to a 64-bit literal. */
#define BIG_CONSTANT(x) (x##LLU)

#endif // !defined(_MSC_VER)
841fb62fb0SOlivier Houchard
//-----------------------------------------------------------------------------
// Block read - if your platform needs to do endian-swapping or can only
// handle aligned reads, do the conversion here
881fb62fb0SOlivier Houchard
getblock(const uint32_t * p,int i)891fb62fb0SOlivier Houchard FORCE_INLINE static uint32_t getblock ( const uint32_t * p, int i )
901fb62fb0SOlivier Houchard {
91*271ce402SOlivier Houchard #ifdef __s390x__
92*271ce402SOlivier Houchard uint32_t res;
93*271ce402SOlivier Houchard
94*271ce402SOlivier Houchard __asm__ (" lrv %0,%1\n"
95*271ce402SOlivier Houchard : "=r" (res) : "Q" (p[i]) : "cc", "mem");
96*271ce402SOlivier Houchard return res;
97*271ce402SOlivier Houchard #else
981fb62fb0SOlivier Houchard return p[i];
99*271ce402SOlivier Houchard #endif /* !__s390x__ */
1001fb62fb0SOlivier Houchard }
1011fb62fb0SOlivier Houchard
//-----------------------------------------------------------------------------
// Finalization mix - force all bits of a hash block to avalanche
1041fb62fb0SOlivier Houchard
fmix(uint32_t h)1051fb62fb0SOlivier Houchard FORCE_INLINE static uint32_t fmix ( uint32_t h )
1061fb62fb0SOlivier Houchard {
1071fb62fb0SOlivier Houchard h ^= h >> 16;
1081fb62fb0SOlivier Houchard h *= 0x85ebca6b;
1091fb62fb0SOlivier Houchard h ^= h >> 13;
1101fb62fb0SOlivier Houchard h *= 0xc2b2ae35;
1111fb62fb0SOlivier Houchard h ^= h >> 16;
1121fb62fb0SOlivier Houchard
1131fb62fb0SOlivier Houchard return h;
1141fb62fb0SOlivier Houchard }
1151fb62fb0SOlivier Houchard
//-----------------------------------------------------------------------------
1171fb62fb0SOlivier Houchard
/*
 * Compute the 32-bit MurmurHash3 (x86 variant) of the len bytes at key,
 * starting from seed, and store the result in *out.
 *
 * The input is consumed as len / 4 whole 32-bit blocks (read through
 * getblock()), followed by a tail of len & 3 bytes. The length is then
 * folded in and the state is passed through fmix().
 */
static inline void MurmurHash3_x86_32 ( const void * key, int len,
                                        uint32_t seed, uint32_t * out )
{
	const uint32_t c1 = 0xcc9e2d51;
	const uint32_t c2 = 0x1b873593;
	const uint8_t *bytes = (const uint8_t *)key;
	const int nblocks = len / 4;
	const int rem = len & 3;
	/* The tail starts right after the last whole block ... */
	const uint8_t *tail = bytes + nblocks * 4;
	/* ... and the blocks are addressed backwards from that same point. */
	const uint32_t *blocks = (const uint32_t *)(const void *)tail;
	uint32_t hash = seed;
	uint32_t k;
	int i;

	//----------
	// body: i runs from -nblocks up to (but not including) 0

	i = -nblocks;
	while (i != 0) {
		k = getblock(blocks, i);

		k *= c1;
		k = ROTL32(k, 15);
		k *= c2;

		hash ^= k;
		hash = ROTL32(hash, 13);
		hash = hash * 5 + 0xe6546b64;

		i++;
	}

	//----------
	// tail: fold the remaining 1..3 bytes, lowest address in the low byte

	if (rem != 0) {
		k = 0;
		if (rem == 3)
			k ^= tail[2] << 16;
		if (rem >= 2)
			k ^= tail[1] << 8;
		k ^= tail[0];

		k *= c1;
		k = ROTL32(k, 15);
		k *= c2;
		hash ^= k;
	}

	//----------
	// finalization

	hash ^= len;

	*out = fmix(hash);
}
1741fb62fb0SOlivier Houchard
/*
 * Compute a 64-bit Murmur hash (the "64A" variant) of the len bytes at
 * key, starting from seed, and return it.
 *
 * The input is consumed as len / 8 whole 64-bit words followed by a
 * tail of len & 7 bytes. A word is read directly when its address is
 * 8-byte aligned and through memcpy() otherwise.
 */
static inline uint64_t MurmurHash64A ( const void * key, int len, uint64_t seed )
{
	const uint64_t m = BIG_CONSTANT(0xc6a4a7935bd1e995);
	const int r = 47;
	const int rem = len & 7;
	const uint64_t *cursor = (const uint64_t *)key;
	const uint64_t *const stop = cursor + (len / 8);
	const unsigned char *tail;
	uint64_t hash = seed ^ (len * m);
	int idx;

	for (; cursor != stop; cursor++) {
		uint64_t k;

		if (((uintptr_t)cursor & 0x7) != 0)
			memcpy(&k, cursor, sizeof(k));
		else
			k = *cursor;

		k *= m;
		k ^= k >> r;
		k *= m;

		hash ^= k;
		hash *= m;
	}

	/* Whatever follows the last whole word is the tail. */
	tail = (const unsigned char *)cursor;

	if (rem != 0) {
		/* Byte idx of the tail lands in bits [8*idx, 8*idx + 7]. */
		for (idx = rem - 1; idx >= 0; idx--)
			hash ^= (uint64_t)(tail[idx]) << (8 * idx);
		hash *= m;
	}

	hash ^= hash >> r;
	hash *= m;
	hash ^= hash >> r;

	return hash;
}
2301fb62fb0SOlivier Houchard
2311fb62fb0SOlivier Houchard
// 64-bit hash for 32-bit platforms
2331fb62fb0SOlivier Houchard
/*
 * Compute a 64-bit Murmur hash (the "64B" variant, built from two 32-bit
 * lanes) of the len bytes at key, starting from seed, and return it.
 *
 * The low half of seed initialises lane h1 (xored with len) and the high
 * half initialises lane h2. Input is consumed 8 bytes at a time (one
 * 32-bit word per lane), then an optional 4-byte word into h1, then a
 * tail of up to 3 bytes into h2. The result is h1 in the upper 32 bits
 * and h2 in the lower 32 bits.
 *
 * Words are loaded with memcpy() rather than through a uint32_t pointer
 * cast of key: key carries no alignment guarantee, and a misaligned
 * 32-bit load is undefined behaviour that faults on strict-alignment
 * CPUs. MurmurHash64A in this file already guards its loads the same
 * way. The hash values produced are unchanged.
 */
static inline uint64_t MurmurHash64B ( const void * key, int len, uint64_t seed )
{
	const uint32_t m = 0x5bd1e995;
	const int r = 24;
	const unsigned char *data = (const unsigned char *)key;
	uint32_t h1 = (uint32_t)(seed) ^ len;
	uint32_t h2 = (uint32_t)(seed >> 32);
	uint32_t k1, k2;

	while (len >= 8) {
		memcpy(&k1, data, sizeof(k1));
		data += sizeof(k1);
		k1 *= m; k1 ^= k1 >> r; k1 *= m;
		h1 *= m; h1 ^= k1;
		len -= 4;

		memcpy(&k2, data, sizeof(k2));
		data += sizeof(k2);
		k2 *= m; k2 ^= k2 >> r; k2 *= m;
		h2 *= m; h2 ^= k2;
		len -= 4;
	}

	if (len >= 4) {
		memcpy(&k1, data, sizeof(k1));
		data += sizeof(k1);
		k1 *= m; k1 ^= k1 >> r; k1 *= m;
		h1 *= m; h1 ^= k1;
		len -= 4;
	}

	/* At most 3 bytes remain; they are folded into the h2 lane. */
	switch (len) {
	case 3:
		h2 ^= data[2] << 16;
		/* fall through */
	case 2:
		h2 ^= data[1] << 8;
		/* fall through */
	case 1:
		h2 ^= data[0];
		h2 *= m;
		break;
	default:
		break;
	}

	/* Cross-mix the two lanes. */
	h1 ^= h2 >> 18; h1 *= m;
	h2 ^= h1 >> 22; h2 *= m;
	h1 ^= h2 >> 17; h1 *= m;
	h2 ^= h1 >> 19; h2 *= m;

	return ((uint64_t)h1 << 32) | h2;
}
2861fb62fb0SOlivier Houchard
2871fb62fb0SOlivier Houchard #endif /* CK_HT_HASH_H */
288