xref: /freebsd-src/sys/contrib/ck/src/ck_ht_hash.h (revision 271ce40239ec643af1264c36b73ea1563f4263ba)
11fb62fb0SOlivier Houchard /*
21fb62fb0SOlivier Houchard  * Copyright 2012-2015 Samy Al Bahra
31fb62fb0SOlivier Houchard  * Copyright 2011-2014 AppNexus, Inc.
41fb62fb0SOlivier Houchard  *
51fb62fb0SOlivier Houchard  * Redistribution and use in source and binary forms, with or without
61fb62fb0SOlivier Houchard  * modification, are permitted provided that the following conditions
71fb62fb0SOlivier Houchard  * are met:
81fb62fb0SOlivier Houchard  * 1. Redistributions of source code must retain the above copyright
91fb62fb0SOlivier Houchard  *    notice, this list of conditions and the following disclaimer.
101fb62fb0SOlivier Houchard  * 2. Redistributions in binary form must reproduce the above copyright
111fb62fb0SOlivier Houchard  *    notice, this list of conditions and the following disclaimer in the
121fb62fb0SOlivier Houchard  *    documentation and/or other materials provided with the distribution.
131fb62fb0SOlivier Houchard  *
141fb62fb0SOlivier Houchard  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
151fb62fb0SOlivier Houchard  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
161fb62fb0SOlivier Houchard  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
171fb62fb0SOlivier Houchard  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
181fb62fb0SOlivier Houchard  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
191fb62fb0SOlivier Houchard  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
201fb62fb0SOlivier Houchard  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
211fb62fb0SOlivier Houchard  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
221fb62fb0SOlivier Houchard  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
231fb62fb0SOlivier Houchard  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
241fb62fb0SOlivier Houchard  * SUCH DAMAGE.
251fb62fb0SOlivier Houchard  */
261fb62fb0SOlivier Houchard 
271fb62fb0SOlivier Houchard #ifndef CK_HT_HASH_H
281fb62fb0SOlivier Houchard #define CK_HT_HASH_H
291fb62fb0SOlivier Houchard 
301fb62fb0SOlivier Houchard /*
311fb62fb0SOlivier Houchard  * This is the Murmur hash written by Austin Appleby.
321fb62fb0SOlivier Houchard  */
331fb62fb0SOlivier Houchard 
341fb62fb0SOlivier Houchard #include <ck_stdint.h>
351fb62fb0SOlivier Houchard #include <ck_string.h>
361fb62fb0SOlivier Houchard 
//-----------------------------------------------------------------------------
// MurmurHash3 was written by Austin Appleby, and is placed in the public
// domain. The author hereby disclaims copyright to this source code.

// Note - The x86 and x64 versions do _not_ produce the same results, as the
// algorithms are optimized for their respective platforms. You can still
// compile and run any of them on any platform, but your performance with the
// non-native version will be less than optimal.
451fb62fb0SOlivier Houchard 
461fb62fb0SOlivier Houchard //-----------------------------------------------------------------------------
471fb62fb0SOlivier Houchard // Platform-specific functions and macros
481fb62fb0SOlivier Houchard 
491fb62fb0SOlivier Houchard // Microsoft Visual Studio
501fb62fb0SOlivier Houchard 
511fb62fb0SOlivier Houchard #if defined(_MSC_VER)
521fb62fb0SOlivier Houchard 
531fb62fb0SOlivier Houchard #define FORCE_INLINE    __forceinline
541fb62fb0SOlivier Houchard 
551fb62fb0SOlivier Houchard #include <stdlib.h>
561fb62fb0SOlivier Houchard 
571fb62fb0SOlivier Houchard #define ROTL32(x,y)     _rotl(x,y)
581fb62fb0SOlivier Houchard #define ROTL64(x,y)     _rotl64(x,y)
591fb62fb0SOlivier Houchard 
601fb62fb0SOlivier Houchard #define BIG_CONSTANT(x) (x)
611fb62fb0SOlivier Houchard 
621fb62fb0SOlivier Houchard // Other compilers
631fb62fb0SOlivier Houchard 
641fb62fb0SOlivier Houchard #else   // defined(_MSC_VER)
651fb62fb0SOlivier Houchard 
661fb62fb0SOlivier Houchard #define FORCE_INLINE inline __attribute__((always_inline))
671fb62fb0SOlivier Houchard 
/*
 * Rotate the 32-bit value x left by r bit positions.
 *
 * The rotate count is reduced modulo 32 before shifting. Without that, a
 * count of 0 would evaluate x >> 32, and shifting by the full width of the
 * type is undefined behaviour in C. Counts in the range 1..31 produce
 * exactly the same result as the unmasked expression.
 */
static inline uint32_t rotl32 ( uint32_t x, int8_t r )
{
  const unsigned int left = (unsigned int)r & 31u;
  const unsigned int right = (32u - left) & 31u;

  return (x << left) | (x >> right);
}
721fb62fb0SOlivier Houchard 
/*
 * Rotate the 64-bit value x left by r bit positions.
 *
 * The rotate count is reduced modulo 64 before shifting. Without that, a
 * count of 0 would evaluate x >> 64, and shifting by the full width of the
 * type is undefined behaviour in C. Counts in the range 1..63 produce
 * exactly the same result as the unmasked expression.
 */
static inline uint64_t rotl64 ( uint64_t x, int8_t r )
{
  const unsigned int left = (unsigned int)r & 63u;
  const unsigned int right = (64u - left) & 63u;

  return (x << left) | (x >> right);
}
771fb62fb0SOlivier Houchard 
781fb62fb0SOlivier Houchard #define ROTL32(x,y)     rotl32(x,y)
791fb62fb0SOlivier Houchard #define ROTL64(x,y)     rotl64(x,y)
801fb62fb0SOlivier Houchard 
811fb62fb0SOlivier Houchard #define BIG_CONSTANT(x) (x##LLU)
821fb62fb0SOlivier Houchard 
831fb62fb0SOlivier Houchard #endif // !defined(_MSC_VER)
841fb62fb0SOlivier Houchard 
//-----------------------------------------------------------------------------
// Block read - if your platform needs to do endian-swapping or can only
// handle aligned reads, do the conversion here.
881fb62fb0SOlivier Houchard 
getblock(const uint32_t * p,int i)891fb62fb0SOlivier Houchard FORCE_INLINE static uint32_t getblock ( const uint32_t * p, int i )
901fb62fb0SOlivier Houchard {
91*271ce402SOlivier Houchard #ifdef __s390x__
92*271ce402SOlivier Houchard   uint32_t res;
93*271ce402SOlivier Houchard 
94*271ce402SOlivier Houchard   __asm__ ("	lrv	%0,%1\n"
95*271ce402SOlivier Houchard 	   : "=r" (res) : "Q" (p[i]) : "cc", "mem");
96*271ce402SOlivier Houchard   return res;
97*271ce402SOlivier Houchard #else
981fb62fb0SOlivier Houchard   return p[i];
99*271ce402SOlivier Houchard #endif /* !__s390x__ */
1001fb62fb0SOlivier Houchard }
1011fb62fb0SOlivier Houchard 
//-----------------------------------------------------------------------------
// Finalization mix - force all bits of a hash block to avalanche.
1041fb62fb0SOlivier Houchard 
fmix(uint32_t h)1051fb62fb0SOlivier Houchard FORCE_INLINE static uint32_t fmix ( uint32_t h )
1061fb62fb0SOlivier Houchard {
1071fb62fb0SOlivier Houchard   h ^= h >> 16;
1081fb62fb0SOlivier Houchard   h *= 0x85ebca6b;
1091fb62fb0SOlivier Houchard   h ^= h >> 13;
1101fb62fb0SOlivier Houchard   h *= 0xc2b2ae35;
1111fb62fb0SOlivier Houchard   h ^= h >> 16;
1121fb62fb0SOlivier Houchard 
1131fb62fb0SOlivier Houchard   return h;
1141fb62fb0SOlivier Houchard }
1151fb62fb0SOlivier Houchard 
1161fb62fb0SOlivier Houchard //-----------------------------------------------------------------------------
1171fb62fb0SOlivier Houchard 
/*
 * MurmurHash3, 32-bit variant.
 *
 * key:  start of the bytes to hash
 * len:  number of bytes at key
 * seed: initial hash state
 * out:  receives the 32-bit result
 *
 * The input is consumed as len / 4 whole 32-bit blocks (read through
 * getblock()), followed by up to three trailing bytes. The length is then
 * folded in and the state is passed through fmix().
 */
static inline void MurmurHash3_x86_32 ( const void * key, int len,
                          uint32_t seed, uint32_t * out )
{
  const uint8_t * bytes = (const uint8_t *)key;
  const int nblocks = len / 4;
  const int ntail = len & 3;
  const uint32_t c1 = 0xcc9e2d51;
  const uint32_t c2 = 0x1b873593;
  const uint32_t * blocks = (const uint32_t *)(const void *)bytes;
  const uint8_t * tail = bytes + nblocks * 4;
  uint32_t hash = seed;
  uint32_t k;
  int i;

  /* Body: mix in every whole 4-byte block, first to last. */
  for (i = 0; i < nblocks; i++) {
    k = getblock(blocks, i);

    k *= c1;
    k = ROTL32(k, 15);
    k *= c2;

    hash ^= k;
    hash = ROTL32(hash, 13);
    hash = hash * 5 + 0xe6546b64;
  }

  /*
   * Tail: gather the 1-3 leftover bytes, with byte n placed at bit
   * position 8 * n, and mix them in once. Nothing happens when the
   * length is a multiple of four.
   */
  k = 0;
  for (i = ntail; i > 0; i--)
    k ^= (uint32_t)tail[i - 1] << (8 * (i - 1));

  if (ntail != 0) {
    k *= c1;
    k = ROTL32(k, 15);
    k *= c2;
    hash ^= k;
  }

  /* Finalization: fold in the length, then avalanche. */
  hash ^= (uint32_t)len;

  *out = fmix(hash);
}
1741fb62fb0SOlivier Houchard 
/*
 * MurmurHash2, 64-bit variant (MurmurHash64A).
 *
 * key:  start of the bytes to hash
 * len:  number of bytes at key
 * seed: initial hash state
 *
 * Returns the 64-bit hash. The input is consumed as len / 8 whole 64-bit
 * words followed by up to seven trailing bytes.
 */
static inline uint64_t MurmurHash64A ( const void * key, int len, uint64_t seed )
{
  const uint64_t mult = BIG_CONSTANT(0xc6a4a7935bd1e995);
  const int shift = 47;
  const int ntail = len & 7;
  const uint64_t * word = (const uint64_t *)key;
  const uint64_t * const limit = word + (len/8);
  const unsigned char * rest;
  uint64_t hash = seed ^ (len * mult);
  int i;

  for (; word != limit; word++) {
    uint64_t k;

    /* Load directly when 8-byte aligned, otherwise copy the bytes out. */
    if (((uintptr_t)word & 0x7) == 0)
      k = *word;
    else
      memcpy(&k, word, sizeof(k));

    k *= mult;
    k ^= k >> shift;
    k *= mult;

    hash = (hash ^ k) * mult;
  }

  /*
   * Tail: xor in the 1-7 leftover bytes, with byte n placed at bit
   * position 8 * n, then multiply once. Nothing happens when the length
   * is a multiple of eight.
   */
  rest = (const unsigned char *)word;
  for (i = ntail; i > 0; i--)
    hash ^= (uint64_t)rest[i - 1] << (8 * (i - 1));

  if (ntail != 0)
    hash *= mult;

  hash ^= hash >> shift;
  hash *= mult;
  hash ^= hash >> shift;

  return hash;
}
2301fb62fb0SOlivier Houchard 
2311fb62fb0SOlivier Houchard 
2321fb62fb0SOlivier Houchard // 64-bit hash for 32-bit platforms
2331fb62fb0SOlivier Houchard 
/*
 * MurmurHash2 producing a 64-bit result from two 32-bit lanes
 * (MurmurHash64B).
 *
 * key:  start of the bytes to hash
 * len:  number of bytes at key
 * seed: initial state; the low 32 bits seed the first lane and the high
 *       32 bits seed the second
 *
 * Returns the first lane in the upper 32 bits and the second lane in the
 * lower 32 bits.
 *
 * The 32-bit words are copied out of the key with memcpy() rather than
 * read through a uint32_t pointer. The key may start at any byte address,
 * and a direct load from a misaligned address is undefined behaviour.
 * For aligned keys the result is unchanged.
 */
static inline uint64_t MurmurHash64B ( const void * key, int len, uint64_t seed )
{
  const uint32_t m = 0x5bd1e995;
  const int r = 24;
  const unsigned char * data = (const unsigned char *)key;
  uint32_t h1 = (uint32_t)(seed) ^ len;
  uint32_t h2 = (uint32_t)(seed >> 32);
  uint32_t k1, k2;
  uint64_t h;

  /* Consume eight bytes per round: one word for each lane. */
  while(len >= 8)
  {
    memcpy(&k1, data, sizeof(k1));
    memcpy(&k2, data + sizeof(k1), sizeof(k2));
    data += sizeof(k1) + sizeof(k2);
    len -= 8;

    k1 *= m; k1 ^= k1 >> r; k1 *= m;
    h1 *= m; h1 ^= k1;

    k2 *= m; k2 ^= k2 >> r; k2 *= m;
    h2 *= m; h2 ^= k2;
  }

  /* One remaining whole word goes to the first lane. */
  if(len >= 4)
  {
    memcpy(&k1, data, sizeof(k1));
    data += sizeof(k1);
    len -= 4;

    k1 *= m; k1 ^= k1 >> r; k1 *= m;
    h1 *= m; h1 ^= k1;
  }

  /* The last 1-3 bytes are folded into the second lane. */
  switch(len)
  {
  case 3: h2 ^= data[2] << 16;
  /* fall through */
  case 2: h2 ^= data[1] << 8;
  /* fall through */
  case 1: h2 ^= data[0];
      h2 *= m;
  }

  /* Cross-mix the two lanes. */
  h1 ^= h2 >> 18; h1 *= m;
  h2 ^= h1 >> 22; h2 *= m;
  h1 ^= h2 >> 17; h1 *= m;
  h2 ^= h1 >> 19; h2 *= m;

  h = h1;
  h = (h << 32) | h2;

  return h;
}
2861fb62fb0SOlivier Houchard 
2871fb62fb0SOlivier Houchard #endif /* CK_HT_HASH_H */
288