-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathhasher.go
65 lines (58 loc) · 1.89 KB
/
hasher.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
// Copyright 2014 Spencer Kimball.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
// implied. See the License for the specific language governing
// permissions and limitations under the License. See the AUTHORS file
// for names of contributors.
//
// Author: Spencer Kimball ([email protected])
package cbfilter
import (
"fmt"
"hash"
"io"
"github.com/spaolacci/murmur3"
)
// hasher uses a 64 bit variant of MurmurHash3 to derive a family of
// 32-bit hash values from a single digest, following the Kirsch and
// Mitzenmacher method of combining two base hashes:
//
//	H[i](x) = h1 + i*h2
//
// where h1 and h2 are the low and high 32 bits of the 64-bit digest.
//
// http://www.eecs.harvard.edu/~kirsch/pubs/bbbf/rsa.pdf
type hasher struct {
	// mmh3 is the underlying 64-bit hash state.
	mmh3 hash.Hash64
	// hashed is true once a key has been hashed.
	hashed bool
	// h1 and h2 hold the two 32-bit halves of the most recent key's
	// digest.
	h1, h2 uint32
}
// newHasher allocates and returns a new hasher whose hash state is
// created by murmur3.New64. No key has been hashed yet, so hashKey
// must be called before getHash.
func newHasher() *hasher {
	h := new(hasher)
	h.mmh3 = murmur3.New64()
	return h
}
// hashKey hashes the given key string and caches the two 32-bit halves
// of the resulting 64-bit digest for later use by getHash. Any
// previously hashed key is discarded. It panics if the key cannot be
// written to the underlying hash.
func (h *hasher) hashKey(key string) {
	// Reset first so the previous key does not contribute to this digest.
	h.mmh3.Reset()
	_, err := io.WriteString(h.mmh3, key)
	if err != nil {
		panic(fmt.Sprintf("unable to write string to hasher: %s", key))
	}
	h.hashed = true

	// Converting to uint32 truncates to the low 32 bits, so no explicit
	// masking is required.
	digest := h.mmh3.Sum64()
	h.h1, h.h2 = uint32(digest), uint32(digest>>32)
}
// getHash returns the i-th derived hash value for the most recently
// hashed key, computed as h1 + i*h2 with uint32 wraparound. It panics
// if hashKey has not been called yet.
func (h *hasher) getHash(i uint32) uint32 {
	if h.hashed {
		return h.h1 + h.h2*i
	}
	panic("hasher must be initialized first with a call to hashKey(key)")
}