123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203 |
- package murmur3
- import (
- //"encoding/binary"
- "hash"
- "unsafe"
- )
// c1_128 is the first multiplicative constant used to scramble the 64-bit
// lanes of each 16-byte block and of the trailing partial block.
const c1_128 = 0x87c37b91114253d5

// c2_128 is the second multiplicative constant; it is applied in the opposite
// order to c1_128 on the second lane.
const c2_128 = 0x4cf5ad432745937f
- // Make sure interfaces are correctly implemented.
- var (
- _ hash.Hash = new(digest128)
- _ Hash128 = new(digest128)
- _ bmixer = new(digest128)
- )
// Hash128 is the interface of a 128-bit hasher. It extends hash.Hash with
// direct access to the digest as two 64-bit words, because the standard
// library does not define a 128-bit hash interface of its own.
type Hash128 interface {
	// Sum128 returns the 128-bit digest as two uint64 halves.
	Sum128() (h1, h2 uint64)

	hash.Hash
}
- // digest128 represents a partial evaluation of a 128 bites hash.
- type digest128 struct {
- digest
- h1 uint64 // Unfinalized running hash part 1.
- h2 uint64 // Unfinalized running hash part 2.
- }
- // New128 returns a 128-bit hasher
- func New128() Hash128 { return New128WithSeed(0) }
- // New128WithSeed returns a 128-bit hasher set with explicit seed value
- func New128WithSeed(seed uint32) Hash128 {
- d := new(digest128)
- d.seed = seed
- d.bmixer = d
- d.Reset()
- return d
- }
- func (d *digest128) Size() int { return 16 }
- func (d *digest128) reset() { d.h1, d.h2 = uint64(d.seed), uint64(d.seed) }
- func (d *digest128) Sum(b []byte) []byte {
- h1, h2 := d.Sum128()
- return append(b,
- byte(h1>>56), byte(h1>>48), byte(h1>>40), byte(h1>>32),
- byte(h1>>24), byte(h1>>16), byte(h1>>8), byte(h1),
- byte(h2>>56), byte(h2>>48), byte(h2>>40), byte(h2>>32),
- byte(h2>>24), byte(h2>>16), byte(h2>>8), byte(h2),
- )
- }
- func (d *digest128) bmix(p []byte) (tail []byte) {
- h1, h2 := d.h1, d.h2
- nblocks := len(p) / 16
- for i := 0; i < nblocks; i++ {
- t := (*[2]uint64)(unsafe.Pointer(&p[i*16]))
- k1, k2 := t[0], t[1]
- k1 *= c1_128
- k1 = (k1 << 31) | (k1 >> 33) // rotl64(k1, 31)
- k1 *= c2_128
- h1 ^= k1
- h1 = (h1 << 27) | (h1 >> 37) // rotl64(h1, 27)
- h1 += h2
- h1 = h1*5 + 0x52dce729
- k2 *= c2_128
- k2 = (k2 << 33) | (k2 >> 31) // rotl64(k2, 33)
- k2 *= c1_128
- h2 ^= k2
- h2 = (h2 << 31) | (h2 >> 33) // rotl64(h2, 31)
- h2 += h1
- h2 = h2*5 + 0x38495ab5
- }
- d.h1, d.h2 = h1, h2
- return p[nblocks*d.Size():]
- }
- func (d *digest128) Sum128() (h1, h2 uint64) {
- h1, h2 = d.h1, d.h2
- var k1, k2 uint64
- switch len(d.tail) & 15 {
- case 15:
- k2 ^= uint64(d.tail[14]) << 48
- fallthrough
- case 14:
- k2 ^= uint64(d.tail[13]) << 40
- fallthrough
- case 13:
- k2 ^= uint64(d.tail[12]) << 32
- fallthrough
- case 12:
- k2 ^= uint64(d.tail[11]) << 24
- fallthrough
- case 11:
- k2 ^= uint64(d.tail[10]) << 16
- fallthrough
- case 10:
- k2 ^= uint64(d.tail[9]) << 8
- fallthrough
- case 9:
- k2 ^= uint64(d.tail[8]) << 0
- k2 *= c2_128
- k2 = (k2 << 33) | (k2 >> 31) // rotl64(k2, 33)
- k2 *= c1_128
- h2 ^= k2
- fallthrough
- case 8:
- k1 ^= uint64(d.tail[7]) << 56
- fallthrough
- case 7:
- k1 ^= uint64(d.tail[6]) << 48
- fallthrough
- case 6:
- k1 ^= uint64(d.tail[5]) << 40
- fallthrough
- case 5:
- k1 ^= uint64(d.tail[4]) << 32
- fallthrough
- case 4:
- k1 ^= uint64(d.tail[3]) << 24
- fallthrough
- case 3:
- k1 ^= uint64(d.tail[2]) << 16
- fallthrough
- case 2:
- k1 ^= uint64(d.tail[1]) << 8
- fallthrough
- case 1:
- k1 ^= uint64(d.tail[0]) << 0
- k1 *= c1_128
- k1 = (k1 << 31) | (k1 >> 33) // rotl64(k1, 31)
- k1 *= c2_128
- h1 ^= k1
- }
- h1 ^= uint64(d.clen)
- h2 ^= uint64(d.clen)
- h1 += h2
- h2 += h1
- h1 = fmix64(h1)
- h2 = fmix64(h2)
- h1 += h2
- h2 += h1
- return h1, h2
- }
// fmix64 is the 64-bit finalization mix: three xor-shifts by 33 bits
// interleaved with two multiplications by fixed odd constants. It maps 0 to 0.
func fmix64(k uint64) uint64 {
	const (
		mul1 = 0xff51afd7ed558ccd
		mul2 = 0xc4ceb9fe1a85ec53
	)

	k = (k ^ k>>33) * mul1
	k = (k ^ k>>33) * mul2
	return k ^ k>>33
}
- /*
- func rotl64(x uint64, r byte) uint64 {
- return (x << r) | (x >> (64 - r))
- }
- */
- // Sum128 returns the MurmurHash3 sum of data. It is equivalent to the
- // following sequence (without the extra burden and the extra allocation):
- // hasher := New128()
- // hasher.Write(data)
- // return hasher.Sum128()
- func Sum128(data []byte) (h1 uint64, h2 uint64) { return Sum128WithSeed(data, 0) }
- // Sum128WithSeed returns the MurmurHash3 sum of data. It is equivalent to the
- // following sequence (without the extra burden and the extra allocation):
- // hasher := New128WithSeed(seed)
- // hasher.Write(data)
- // return hasher.Sum128()
- func Sum128WithSeed(data []byte, seed uint32) (h1 uint64, h2 uint64) {
- d := &digest128{h1: uint64(seed), h2: uint64(seed)}
- d.seed = seed
- d.tail = d.bmix(data)
- d.clen = len(data)
- return d.Sum128()
- }
|