// Minimally modified from Austin Appleby's code:
//  * Removed MurmurHash3_x86_32 and MurmurHash3_x86_128
//  * Changed input seed in MurmurHash3_x64_128 to uint64_t
//  * Define and use HashState reference to return result
//  * Made entire hash function defined inline
//-----------------------------------------------------------------------------
// MurmurHash3 was written by Austin Appleby, and is placed in the public
// domain. The author hereby disclaims copyright to this source code.

// Note - The x86 and x64 versions do _not_ produce the same results, as the
// algorithms are optimized for their respective platforms. You can still
// compile and run any of them on any platform, but your performance with the
// non-native version will be less than optimal.

#ifndef _MURMURHASH3_H_
#define _MURMURHASH3_H_

//-----------------------------------------------------------------------------
// Platform-specific functions and macros

// Microsoft Visual Studio

#if defined(_MSC_VER) && (_MSC_VER < 1600)

typedef unsigned char uint8_t;
typedef unsigned int uint32_t;
typedef unsigned __int64 uint64_t;

#define FORCE_INLINE __forceinline

#include <stdlib.h>

#define ROTL32(x,y) _rotl(x,y)
#define ROTL64(x,y) _rotl64(x,y)

#define BIG_CONSTANT(x) (x)

// Other compilers

#else // defined(_MSC_VER)

#include <stdint.h>

#define FORCE_INLINE inline __attribute__((always_inline))

// Rotates the 32-bit value x left by r bit positions.
// The count is reduced modulo 32 so that r == 0 (or any out-of-range count)
// never produces a shift by the full width of the type, which is undefined.
inline uint32_t rotl32 ( uint32_t x, int8_t r )
{
  const unsigned s = (unsigned)r & 31u;
  return (x << s) | (x >> ((32u - s) & 31u));
}

// Rotates the 64-bit value x left by r bit positions.
// The count is reduced modulo 64 for the same reason as in rotl32.
inline uint64_t rotl64 ( uint64_t x, int8_t r )
{
  const unsigned s = (unsigned)r & 63u;
  return (x << s) | (x >> ((64u - s) & 63u));
}

#define ROTL32(x,y) rotl32(x,y)
#define ROTL64(x,y) rotl64(x,y)

#define BIG_CONSTANT(x) (x##LLU)

#endif // !defined(_MSC_VER)

//-----------------------------------------------------------------------------

//-----------------------------------------------------------------------------
// Return type - Using C++ reference for return type which should allow better
// compiler optimization than a void* pointer
typedef struct {
  uint64_t h1;
  uint64_t h2;
} HashState;

//-----------------------------------------------------------------------------
// Block read - if your platform needs to do endian-swapping or can only
// handle aligned reads, do the conversion here
//
// Returns the i-th 64-bit word starting at p, loaded in native byte order.
// NOTE(review): p is derived from an arbitrary byte pointer, so this load may
// be unaligned; confirm that is acceptable on every target platform.
FORCE_INLINE uint64_t getblock64 ( const uint64_t * p, int i )
{
  return p[i];
}

//-----------------------------------------------------------------------------
// Finalization mix - force all bits of a hash block to avalanche
FORCE_INLINE uint64_t fmix64 ( uint64_t k )
{
  k ^= k >> 33;
  k *= BIG_CONSTANT(0xff51afd7ed558ccd);
  k ^= k >> 33;
  k *= BIG_CONSTANT(0xc4ceb9fe1a85ec53);
  k ^= k >> 33;

  return k;
}

//-----------------------------------------------------------------------------
// Computes the 128-bit MurmurHash3 (x64 variant) of a byte sequence.
//
//   key      - pointer to the first byte to hash; only read, never written
//   lenBytes - number of bytes to hash; expected to be non-negative
//   seed     - initial value for both 64-bit halves of the hash state
//   out      - receives the result: out.h1 and out.h2 together form the
//              128-bit hash; any previous contents are overwritten
//
// Exactly lenBytes bytes starting at key are consumed: whole 16-byte blocks
// first, then a tail of up to 15 remaining bytes.
FORCE_INLINE void MurmurHash3_x64_128(const void* key, int lenBytes, uint64_t seed, HashState& out) {
  static const uint64_t c1 = BIG_CONSTANT(0x87c37b91114253d5);
  static const uint64_t c2 = BIG_CONSTANT(0x4cf5ad432745937f);

  const uint8_t* data = (const uint8_t*)key;

  out.h1 = seed;
  out.h2 = seed;

  // Number of full 128-bit blocks of 16 bytes.
  // Possible exclusion of a remainder of up to 15 bytes.
  const int nblocks = lenBytes >> 4; // bytes / 16

  // Process the 128-bit blocks (the body) into the hash.
  // The block pointer stays fixed and each block is addressed by index.
  // Advancing the pointer as well as indexing by i would step 32 bytes per
  // iteration, skipping every other block and reading past the input.
  const uint64_t* blocks = (const uint64_t*)(data);
  for (int i = 0; i < nblocks; ++i) { // 16 bytes per block
    uint64_t k1 = getblock64(blocks, i * 2 + 0);
    uint64_t k2 = getblock64(blocks, i * 2 + 1);

    k1 *= c1; k1 = ROTL64(k1,31); k1 *= c2; out.h1 ^= k1;
    out.h1 = ROTL64(out.h1,27);
    out.h1 += out.h2;
    out.h1 = out.h1*5+0x52dce729;

    k2 *= c2; k2 = ROTL64(k2,33); k2 *= c1; out.h2 ^= k2;
    out.h2 = ROTL64(out.h2,31);
    out.h2 += out.h1;
    out.h2 = out.h2*5+0x38495ab5;
  }

  // tail: the (lenBytes % 16) bytes that follow the last full block
  const uint8_t * tail = (const uint8_t*)(data + (nblocks << 4));

  uint64_t k1 = 0;
  uint64_t k2 = 0;

  // Every case deliberately falls through to the next one so that all
  // remaining tail bytes are folded into k2 (bytes 8..14) and k1 (bytes 0..7).
  switch(lenBytes & 15)
  {
    case 15: k2 ^= ((uint64_t)tail[14]) << 48; // fall through
    case 14: k2 ^= ((uint64_t)tail[13]) << 40; // fall through
    case 13: k2 ^= ((uint64_t)tail[12]) << 32; // fall through
    case 12: k2 ^= ((uint64_t)tail[11]) << 24; // fall through
    case 11: k2 ^= ((uint64_t)tail[10]) << 16; // fall through
    case 10: k2 ^= ((uint64_t)tail[ 9]) << 8;  // fall through
    case  9: k2 ^= ((uint64_t)tail[ 8]) << 0;
             k2 *= c2; k2 = ROTL64(k2,33); k2 *= c1; out.h2 ^= k2;
             // fall through
    case  8: k1 ^= ((uint64_t)tail[ 7]) << 56; // fall through
    case  7: k1 ^= ((uint64_t)tail[ 6]) << 48; // fall through
    case  6: k1 ^= ((uint64_t)tail[ 5]) << 40; // fall through
    case  5: k1 ^= ((uint64_t)tail[ 4]) << 32; // fall through
    case  4: k1 ^= ((uint64_t)tail[ 3]) << 24; // fall through
    case  3: k1 ^= ((uint64_t)tail[ 2]) << 16; // fall through
    case  2: k1 ^= ((uint64_t)tail[ 1]) << 8;  // fall through
    case  1: k1 ^= ((uint64_t)tail[ 0]) << 0;
             k1 *= c1; k1 = ROTL64(k1,31); k1 *= c2; out.h1 ^= k1;
  }

  //----------
  // finalization: mix in the length, then avalanche both halves

  out.h1 ^= lenBytes;
  out.h2 ^= lenBytes;

  out.h1 += out.h2;
  out.h2 += out.h1;

  out.h1 = fmix64(out.h1);
  out.h2 = fmix64(out.h2);

  out.h1 += out.h2;
  out.h2 += out.h1;
}

//-----------------------------------------------------------------------------

#endif // _MURMURHASH3_H_