-
Notifications
You must be signed in to change notification settings - Fork 35
/
cm4.go
93 lines (78 loc) · 2.14 KB
/
cm4.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
package tinylfu
// cm4 is a small count-min sketch implementation with 4-bit counters.
//
// NOTE(review): this was previously described as "conservative-update", but add increments the counter in
// every row unconditionally (saturating at 15) rather than only the minimal ones. Confirm which is intended.
type cm4 struct {
// s holds one nybble vector per row of the sketch; all rows are allocated with the same width in newCM4.
s [depth]nvec
// mask is the row width minus one (see newCM4); counterOffset ANDs it with the hash to pick a counter index.
mask uint32
}
// depth is the number of rows in the sketch; it sizes the cm4.s array.
const depth = 4
// newCM4 allocates a sketch sized for w items.
//
// Each row gets 4 counters per item (rounded by nextPowerOfTwo so that mask can be used as a bit mask), for a
// total of 16 counters or 8 bytes per item, matching the TinyLFU paper.
//
// It panics with "cm4: bad width" if w is smaller than 1 or too large for the row width to be represented.
func newCM4(w int) *cm4 {
	// The row width is computed in uint32 as w*4 and then rounded to a power of two. The largest power of two
	// a uint32 can hold is 1<<31, so anything above 1<<29 items would either wrap in the multiplication or have
	// no representable rounded width, silently producing a bogus mask and table size.
	const maxWidth = 1 << 29
	if w < 1 || w > maxWidth {
		panic("cm4: bad width")
	}

	w32 := nextPowerOfTwo(uint32(w) * 4)
	c := cm4{
		mask: w32 - 1,
	}
	for i := 0; i < depth; i++ {
		c.s[i] = newNvec(int(w32))
	}
	return &c
}
// add records one occurrence of the key hash keyh by incrementing its counter in rows 3 down to 0.
func (c *cm4) add(keyh uint64) {
	// Written out row by row on purpose: per the original author's note, the unrolled form keeps this function
	// from being inlined but still gives a slight overall speedup compared to a loop.
	off3 := c.counterOffset(keyh, 3)
	off2 := c.counterOffset(keyh, 2)
	off1 := c.counterOffset(keyh, 1)
	off0 := c.counterOffset(keyh, 0)

	c.s[3].inc(off3)
	c.s[2].inc(off2)
	c.s[1].inc(off1)
	c.s[0].inc(off0)
}
// counterOffset returns the counter index for keyh in the given row (level).
//
// The 64-bit hash is split into its low and high 32-bit halves and combined as low + level*high (wrapping in
// uint32), then reduced with c.mask. Row 0 therefore depends on the low half only.
func (c *cm4) counterOffset(keyh uint64, level int) uint32 {
	// Per the original author's note, this function gets inlined and the compiler removes the repeated
	// splitting of the hash, so there is no benefit to having callers pass the two halves in.
	lo := uint32(keyh)
	hi := uint32(keyh >> 32)
	idx := lo + hi*uint32(level)
	return idx & c.mask
}
// estimate returns the smallest of the counters that keyh maps to across rows 3 down to 0.
func (c *cm4) estimate(keyh uint64) byte {
	// Start from the largest byte value so that any counter read below can only lower the result.
	var lowest byte = 255

	if v := c.s[3].get(c.counterOffset(keyh, 3)); v < lowest {
		lowest = v
	}
	if v := c.s[2].get(c.counterOffset(keyh, 2)); v < lowest {
		lowest = v
	}
	if v := c.s[1].get(c.counterOffset(keyh, 1)); v < lowest {
		lowest = v
	}
	if v := c.s[0].get(c.counterOffset(keyh, 0)); v < lowest {
		lowest = v
	}
	return lowest
}
// reset calls nvec.reset on every row of the sketch, which halves all of its counters.
func (c *cm4) reset() {
	// A plain loop is enough here: each row's reset walks its whole vector, so that O(n) work dominates and
	// unrolling would gain nothing.
	for row := range c.s {
		c.s[row].reset()
	}
}
// nvec is a nybble vector: a packed array of 4-bit counters stored two per byte.
// Counter i lives in byte i/2; even indices use the low nybble and odd indices the high nybble.
type nvec []byte

// newNvec allocates a zeroed vector with room for w counters.
// An odd w is rounded up to a whole byte so that the last counter (index w-1) is addressable.
func newNvec(w int) nvec {
	return make(nvec, (w+1)/2)
}

// get returns the value (0-15) of counter i. It panics if i is beyond the end of the vector.
func (n nvec) get(i uint32) byte {
	// Ugly, but as a single expression so the compiler will inline it :/
	return byte(n[i/2]>>((i&1)*4)) & 0x0f
}

// inc adds one to counter i, saturating at 15 so that the carry never spills into the neighbouring nybble.
// It panics if i is beyond the end of the vector.
func (n nvec) inc(i uint32) {
	idx := i / 2
	shift := (i & 1) * 4 // 0 for the low nybble, 4 for the high nybble
	v := (n[idx] >> shift) & 0x0f
	if v < 15 {
		n[idx] += 1 << shift
	}
}

// reset halves every counter in place (rounding down).
func (n nvec) reset() {
	for i := range n {
		// Shift both nybbles right at once, then mask with 0x77 to drop the bit that leaked from the high
		// nybble into the top of the low one (and the top bit of the high nybble, which the shift has cleared).
		n[i] = (n[i] >> 1) & 0x77
	}
}