forked from ot/succinct
-
Notifications
You must be signed in to change notification settings - Fork 0
/
gamma_vector.hpp
119 lines (97 loc) · 3.28 KB
/
gamma_vector.hpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
#pragma once
#include "broadword.hpp"
#include "forward_enumerator.hpp"
#include "darray64.hpp"
namespace succinct {
// Compressed random-access vector to store unsigned integers
// using gamma codes.
struct gamma_vector
{
typedef uint64_t value_type;
gamma_vector() {}
template <typename Range>
gamma_vector(Range const& ints)
{
darray64::builder high_bits;
bit_vector_builder low_bits;
high_bits.append1();
typedef typename boost::range_const_iterator<Range>::type iterator_t;
for (iterator_t iter = boost::begin(ints);
iter != boost::end(ints);
++iter) {
const value_type val = *iter + 1;
uint8_t l = broadword::msb(val);
low_bits.append_bits(val ^ (uint64_t(1) << l), l);
high_bits.append1(l);
}
darray64(&high_bits).swap(m_high_bits);
bit_vector(&low_bits).swap(m_low_bits);
}
value_type operator[](size_t idx) const
{
size_t pos = m_high_bits.select(idx);
size_t l; // ignored
return retrieve_value(idx, pos, l);
}
size_t size() const
{
return m_high_bits.num_ones() - 1;
}
void swap(gamma_vector& other)
{
m_high_bits.swap(other.m_high_bits);
m_low_bits.swap(other.m_low_bits);
}
template <typename Visitor>
void map(Visitor& visit) {
visit
(m_high_bits, "m_high_bits")
(m_low_bits, "m_low_bits")
;
}
private:
value_type retrieve_value(size_t idx, size_t pos, size_t& l) const
{
assert(m_high_bits.bits()[pos] == 1);
l = broadword::lsb(m_high_bits.bits().get_word(pos + 1));
return ((uint64_t(1) << l) | m_low_bits.get_bits(pos - idx, l)) - 1;
}
friend struct forward_enumerator<gamma_vector>;
darray64 m_high_bits;
bit_vector m_low_bits;
};
template <>
struct forward_enumerator<gamma_vector>
{
typedef gamma_vector::value_type value_type;
forward_enumerator(gamma_vector const& c, size_t idx = 0)
: m_c(&c)
, m_idx(idx)
, m_pos(0)
{
if (idx < m_c->size()) {
m_pos = m_c->m_high_bits.select(idx);
m_high_bits_enumerator =
bit_vector::unary_enumerator(m_c->m_high_bits.bits(), m_pos + 1);
m_low_bits_enumerator = bit_vector::enumerator(m_c->m_low_bits, m_pos - m_idx);
}
}
value_type next()
{
assert(m_idx <= m_c->size());
size_t next_pos = m_high_bits_enumerator.next();
size_t l = next_pos - m_pos - 1;
m_pos = next_pos;
uint64_t chunk = m_low_bits_enumerator.take(l);
uint64_t val = (chunk | (uint64_t(1) << (l))) - 1;
m_idx += 1;
return val;
}
private:
gamma_vector const* m_c;
size_t m_idx;
size_t m_pos;
bit_vector::unary_enumerator m_high_bits_enumerator;
bit_vector::enumerator m_low_bits_enumerator;
};
}