blob: 07e6b271358aa9c18c0a8f6a509db4bdeb59ca6c [file] [log] [blame]
David Srbecky052f8ca2018-04-26 15:42:54 +01001/*
2 * Copyright (C) 2018 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#ifndef ART_LIBARTBASE_BASE_BIT_TABLE_H_
18#define ART_LIBARTBASE_BASE_BIT_TABLE_H_
19
David Srbeckydd966bc2018-05-24 13:55:52 +010020#include <array>
David Srbeckyf325e282018-06-13 15:02:32 +010021#include <initializer_list>
David Srbeckydd966bc2018-05-24 13:55:52 +010022#include <numeric>
23#include <string.h>
24#include <type_traits>
25#include <unordered_map>
David Srbecky052f8ca2018-04-26 15:42:54 +010026
27#include "base/bit_memory_region.h"
David Srbeckydd966bc2018-05-24 13:55:52 +010028#include "base/casts.h"
David Srbecky93bd3612018-07-02 19:30:18 +010029#include "base/iteration_range.h"
David Srbecky052f8ca2018-04-26 15:42:54 +010030#include "base/memory_region.h"
David Srbeckydd966bc2018-05-24 13:55:52 +010031#include "base/scoped_arena_containers.h"
32#include "base/stl_util.h"
David Srbecky052f8ca2018-04-26 15:42:54 +010033
34namespace art {
35
David Srbeckycf7833e2018-06-14 16:45:22 +010036// Generic purpose table of uint32_t values, which are tightly packed at bit level.
37// It has its own header with the number of rows and the bit-widths of all columns.
38// The values are accessible by (row, column). The value -1 is stored efficiently.
David Srbecky052f8ca2018-04-26 15:42:54 +010039template<uint32_t kNumColumns>
David Srbeckycf7833e2018-06-14 16:45:22 +010040class BitTableBase {
David Srbecky052f8ca2018-04-26 15:42:54 +010041 public:
David Srbeckycf7833e2018-06-14 16:45:22 +010042 static constexpr uint32_t kNoValue = std::numeric_limits<uint32_t>::max(); // == -1.
43 static constexpr uint32_t kValueBias = kNoValue; // Bias so that -1 is encoded as 0.
David Srbecky052f8ca2018-04-26 15:42:54 +010044
David Srbeckycf7833e2018-06-14 16:45:22 +010045 BitTableBase() {}
David Srbecky078d7ba2018-06-21 15:36:48 +010046 explicit BitTableBase(BitMemoryReader& reader) {
47 Decode(reader);
David Srbecky052f8ca2018-04-26 15:42:54 +010048 }
49
David Srbecky078d7ba2018-06-21 15:36:48 +010050 ALWAYS_INLINE void Decode(BitMemoryReader& reader) {
David Srbecky052f8ca2018-04-26 15:42:54 +010051 // Decode row count and column sizes from the table header.
David Srbecky6c4ec5c2019-06-20 07:23:19 +000052 std::array<uint32_t, 1+kNumColumns> header = reader.ReadInterleavedVarints<1+kNumColumns>();
David Srbecky697c47a2019-06-16 21:53:07 +010053 num_rows_ = header[0];
54 column_offset_[0] = 0;
55 for (uint32_t i = 0; i < kNumColumns; i++) {
56 size_t column_end = column_offset_[i] + header[i + 1];
57 column_offset_[i + 1] = dchecked_integral_cast<uint16_t>(column_end);
David Srbecky052f8ca2018-04-26 15:42:54 +010058 }
59
60 // Record the region which contains the table data and skip past it.
David Srbeckyd1606412018-07-31 15:05:14 +010061 table_data_ = reader.ReadRegion(num_rows_ * NumRowBits());
David Srbecky052f8ca2018-04-26 15:42:54 +010062 }
63
64 ALWAYS_INLINE uint32_t Get(uint32_t row, uint32_t column = 0) const {
David Srbecky42deda82018-08-10 11:23:27 +010065 DCHECK(table_data_.IsValid()) << "Table has not been loaded";
David Srbecky052f8ca2018-04-26 15:42:54 +010066 DCHECK_LT(row, num_rows_);
67 DCHECK_LT(column, kNumColumns);
68 size_t offset = row * NumRowBits() + column_offset_[column];
69 return table_data_.LoadBits(offset, NumColumnBits(column)) + kValueBias;
70 }
71
David Srbecky5513c2b2018-05-24 15:03:20 +010072 ALWAYS_INLINE BitMemoryRegion GetBitMemoryRegion(uint32_t row, uint32_t column = 0) const {
David Srbecky42deda82018-08-10 11:23:27 +010073 DCHECK(table_data_.IsValid()) << "Table has not been loaded";
David Srbecky5513c2b2018-05-24 15:03:20 +010074 DCHECK_LT(row, num_rows_);
75 DCHECK_LT(column, kNumColumns);
76 size_t offset = row * NumRowBits() + column_offset_[column];
77 return table_data_.Subregion(offset, NumColumnBits(column));
78 }
79
Vladimir Marko394a0822021-10-25 10:31:15 +010080 uint32_t NumRows() const { return num_rows_; }
David Srbecky052f8ca2018-04-26 15:42:54 +010081
82 uint32_t NumRowBits() const { return column_offset_[kNumColumns]; }
83
Vladimir Marko394a0822021-10-25 10:31:15 +010084 constexpr uint32_t NumColumns() const { return kNumColumns; }
David Srbecky052f8ca2018-04-26 15:42:54 +010085
86 uint32_t NumColumnBits(uint32_t column) const {
87 return column_offset_[column + 1] - column_offset_[column];
88 }
89
David Srbecky42deda82018-08-10 11:23:27 +010090 size_t DataBitSize() const { return table_data_.size_in_bits(); }
David Srbecky052f8ca2018-04-26 15:42:54 +010091
David Srbeckyd1606412018-07-31 15:05:14 +010092 bool Equals(const BitTableBase& other) const {
93 return num_rows_ == other.num_rows_ &&
94 std::equal(column_offset_, column_offset_ + kNumColumns, other.column_offset_) &&
Roland Levillain8c7f6492022-03-14 12:14:36 +000095 BitMemoryRegion::Compare(table_data_, other.table_data_) == 0;
David Srbeckyd1606412018-07-31 15:05:14 +010096 }
97
David Srbecky052f8ca2018-04-26 15:42:54 +010098 protected:
99 BitMemoryRegion table_data_;
Vladimir Marko394a0822021-10-25 10:31:15 +0100100 uint32_t num_rows_ = 0;
David Srbecky052f8ca2018-04-26 15:42:54 +0100101 uint16_t column_offset_[kNumColumns + 1] = {};
102};
103
David Srbeckycf7833e2018-06-14 16:45:22 +0100104// Helper class which can be used to create BitTable accessors with named getters.
105template<uint32_t NumColumns>
106class BitTableAccessor {
107 public:
108 static constexpr uint32_t kNumColumns = NumColumns;
109 static constexpr uint32_t kNoValue = BitTableBase<kNumColumns>::kNoValue;
110
David Srbecky145a18a2019-06-03 14:35:22 +0100111 BitTableAccessor() = default;
David Srbeckycf7833e2018-06-14 16:45:22 +0100112 BitTableAccessor(const BitTableBase<kNumColumns>* table, uint32_t row)
113 : table_(table), row_(row) {
David Srbeckya45a85c2018-06-21 16:03:12 +0100114 DCHECK(table_ != nullptr);
David Srbeckycf7833e2018-06-14 16:45:22 +0100115 }
116
117 ALWAYS_INLINE uint32_t Row() const { return row_; }
118
David Srbeckya45a85c2018-06-21 16:03:12 +0100119 ALWAYS_INLINE bool IsValid() const { return row_ < table_->NumRows(); }
David Srbeckycf7833e2018-06-14 16:45:22 +0100120
121 ALWAYS_INLINE bool Equals(const BitTableAccessor& other) {
122 return this->table_ == other.table_ && this->row_ == other.row_;
123 }
124
125// Helper macro to create constructors and per-table utilities in derived class.
David Srbecky42deda82018-08-10 11:23:27 +0100126#define BIT_TABLE_HEADER(NAME) \
David Srbeckycf7833e2018-06-14 16:45:22 +0100127 using BitTableAccessor<kNumColumns>::BitTableAccessor; /* inherit constructors */ \
128 template<int COLUMN, int UNUSED /*needed to compile*/> struct ColumnName; \
David Srbecky42deda82018-08-10 11:23:27 +0100129 static constexpr const char* kTableName = #NAME; \
David Srbeckycf7833e2018-06-14 16:45:22 +0100130
131// Helper macro to create named column accessors in derived class.
132#define BIT_TABLE_COLUMN(COLUMN, NAME) \
133 static constexpr uint32_t k##NAME = COLUMN; \
134 ALWAYS_INLINE uint32_t Get##NAME() const { return table_->Get(row_, COLUMN); } \
135 ALWAYS_INLINE bool Has##NAME() const { return Get##NAME() != kNoValue; } \
136 template<int UNUSED> struct ColumnName<COLUMN, UNUSED> { \
137 static constexpr const char* Value = #NAME; \
138 }; \
139
140 protected:
141 const BitTableBase<kNumColumns>* table_ = nullptr;
142 uint32_t row_ = -1;
143};
144
David Srbeckyd97e0822018-06-03 12:00:24 +0100145// Template meta-programming helper.
146template<typename Accessor, size_t... Columns>
David Srbecky86decb62018-06-05 06:41:10 +0100147static const char* const* GetBitTableColumnNamesImpl(std::index_sequence<Columns...>) {
David Srbeckyd97e0822018-06-03 12:00:24 +0100148 static const char* names[] = { Accessor::template ColumnName<Columns, 0>::Value... };
149 return names;
150}
David Srbecky052f8ca2018-04-26 15:42:54 +0100151
David Srbeckycf7833e2018-06-14 16:45:22 +0100152// Wrapper which makes it easier to use named accessors for the individual rows.
153template<typename Accessor>
154class BitTable : public BitTableBase<Accessor::kNumColumns> {
155 public:
David Srbecky0b4e5a32018-06-11 16:25:29 +0100156 class const_iterator : public std::iterator<std::random_access_iterator_tag,
157 /* value_type */ Accessor,
158 /* difference_type */ int32_t,
159 /* pointer */ void,
160 /* reference */ void> {
161 public:
162 using difference_type = int32_t;
163 const_iterator() {}
164 const_iterator(const BitTable* table, uint32_t row) : table_(table), row_(row) {}
165 const_iterator operator+(difference_type n) { return const_iterator(table_, row_ + n); }
166 const_iterator operator-(difference_type n) { return const_iterator(table_, row_ - n); }
167 difference_type operator-(const const_iterator& other) { return row_ - other.row_; }
168 void operator+=(difference_type rows) { row_ += rows; }
169 void operator-=(difference_type rows) { row_ -= rows; }
170 const_iterator operator++() { return const_iterator(table_, ++row_); }
171 const_iterator operator--() { return const_iterator(table_, --row_); }
172 const_iterator operator++(int) { return const_iterator(table_, row_++); }
173 const_iterator operator--(int) { return const_iterator(table_, row_--); }
174 bool operator==(const_iterator i) const { DCHECK(table_ == i.table_); return row_ == i.row_; }
175 bool operator!=(const_iterator i) const { DCHECK(table_ == i.table_); return row_ != i.row_; }
176 bool operator<=(const_iterator i) const { DCHECK(table_ == i.table_); return row_ <= i.row_; }
177 bool operator>=(const_iterator i) const { DCHECK(table_ == i.table_); return row_ >= i.row_; }
178 bool operator<(const_iterator i) const { DCHECK(table_ == i.table_); return row_ < i.row_; }
179 bool operator>(const_iterator i) const { DCHECK(table_ == i.table_); return row_ > i.row_; }
David Srbecky93bd3612018-07-02 19:30:18 +0100180 Accessor operator*() {
181 DCHECK_LT(row_, table_->NumRows());
182 return Accessor(table_, row_);
183 }
184 Accessor operator->() {
185 DCHECK_LT(row_, table_->NumRows());
186 return Accessor(table_, row_);
187 }
188 Accessor operator[](size_t index) {
189 DCHECK_LT(row_ + index, table_->NumRows());
190 return Accessor(table_, row_ + index);
191 }
David Srbecky0b4e5a32018-06-11 16:25:29 +0100192 private:
193 const BitTable* table_ = nullptr;
194 uint32_t row_ = 0;
195 };
196
David Srbeckycf7833e2018-06-14 16:45:22 +0100197 using BitTableBase<Accessor::kNumColumns>::BitTableBase; // Constructors.
198
David Srbecky0b4e5a32018-06-11 16:25:29 +0100199 ALWAYS_INLINE const_iterator begin() const { return const_iterator(this, 0); }
200 ALWAYS_INLINE const_iterator end() const { return const_iterator(this, this->NumRows()); }
201
David Srbeckycf7833e2018-06-14 16:45:22 +0100202 ALWAYS_INLINE Accessor GetRow(uint32_t row) const {
203 return Accessor(this, row);
204 }
David Srbeckya45a85c2018-06-21 16:03:12 +0100205
206 ALWAYS_INLINE Accessor GetInvalidRow() const {
207 return Accessor(this, static_cast<uint32_t>(-1));
208 }
David Srbecky42deda82018-08-10 11:23:27 +0100209
210 const char* GetName() const {
211 return Accessor::kTableName;
212 }
213
214 const char* const* GetColumnNames() const {
215 return GetBitTableColumnNamesImpl<Accessor>(std::make_index_sequence<Accessor::kNumColumns>());
216 }
David Srbeckycf7833e2018-06-14 16:45:22 +0100217};
218
David Srbecky0b4e5a32018-06-11 16:25:29 +0100219template<typename Accessor>
220typename BitTable<Accessor>::const_iterator operator+(
221 typename BitTable<Accessor>::const_iterator::difference_type n,
222 typename BitTable<Accessor>::const_iterator a) {
223 return a + n;
224}
225
David Srbecky93bd3612018-07-02 19:30:18 +0100226template<typename Accessor>
227class BitTableRange : public IterationRange<typename BitTable<Accessor>::const_iterator> {
228 public:
Vladimir Marko4f990712021-07-14 12:45:13 +0100229 using const_iterator = typename BitTable<Accessor>::const_iterator;
David Srbecky93bd3612018-07-02 19:30:18 +0100230
231 using IterationRange<const_iterator>::IterationRange;
232 BitTableRange() : IterationRange<const_iterator>(const_iterator(), const_iterator()) { }
233
234 bool empty() const { return this->begin() == this->end(); }
235 size_t size() const { return this->end() - this->begin(); }
236
237 Accessor operator[](size_t index) const {
238 const_iterator it = this->begin() + index;
239 DCHECK(it < this->end());
240 return *it;
241 }
242
243 Accessor back() const {
244 DCHECK(!empty());
245 return *(this->end() - 1);
246 }
247
248 void pop_back() {
249 DCHECK(!empty());
250 --this->last_;
251 }
252};
253
David Srbeckydd966bc2018-05-24 13:55:52 +0100254// Helper class for encoding BitTable. It can optionally de-duplicate the inputs.
David Srbeckyf325e282018-06-13 15:02:32 +0100255template<uint32_t kNumColumns>
David Srbeckycf7833e2018-06-14 16:45:22 +0100256class BitTableBuilderBase {
David Srbecky052f8ca2018-04-26 15:42:54 +0100257 public:
David Srbeckycf7833e2018-06-14 16:45:22 +0100258 static constexpr uint32_t kNoValue = BitTableBase<kNumColumns>::kNoValue;
259 static constexpr uint32_t kValueBias = BitTableBase<kNumColumns>::kValueBias;
260
David Srbeckyf325e282018-06-13 15:02:32 +0100261 class Entry {
262 public:
263 Entry() {
Orion Hodson2dd16812018-07-03 14:16:05 +0100264 // The definition of kNoValue here is for host and target debug builds which complain about
265 // missing a symbol definition for BitTableBase<N>::kNovValue when optimization is off.
266 static constexpr uint32_t kNoValue = BitTableBase<kNumColumns>::kNoValue;
David Srbeckycf7833e2018-06-14 16:45:22 +0100267 std::fill_n(data_, kNumColumns, kNoValue);
David Srbeckyf325e282018-06-13 15:02:32 +0100268 }
269
270 Entry(std::initializer_list<uint32_t> values) {
271 DCHECK_EQ(values.size(), kNumColumns);
272 std::copy(values.begin(), values.end(), data_);
273 }
274
275 uint32_t& operator[](size_t column) {
276 DCHECK_LT(column, kNumColumns);
277 return data_[column];
278 }
279
280 uint32_t operator[](size_t column) const {
281 DCHECK_LT(column, kNumColumns);
282 return data_[column];
283 }
284
285 private:
286 uint32_t data_[kNumColumns];
287 };
David Srbecky052f8ca2018-04-26 15:42:54 +0100288
David Srbeckycf7833e2018-06-14 16:45:22 +0100289 explicit BitTableBuilderBase(ScopedArenaAllocator* allocator)
David Srbecky159c9dd2018-05-24 14:56:51 +0100290 : rows_(allocator->Adapter(kArenaAllocBitTableBuilder)),
291 dedup_(8, allocator->Adapter(kArenaAllocBitTableBuilder)) {
David Srbeckydd966bc2018-05-24 13:55:52 +0100292 }
293
David Srbeckyf325e282018-06-13 15:02:32 +0100294 Entry& operator[](size_t row) { return rows_[row]; }
295 const Entry& operator[](size_t row) const { return rows_[row]; }
David Srbecky0b4e5a32018-06-11 16:25:29 +0100296 const Entry& back() const { return rows_.back(); }
David Srbeckydd966bc2018-05-24 13:55:52 +0100297 size_t size() const { return rows_.size(); }
298
David Srbecky159c9dd2018-05-24 14:56:51 +0100299 // Append given value to the vector without de-duplication.
300 // This will not add the element to the dedup map to avoid its associated costs.
David Srbeckyf325e282018-06-13 15:02:32 +0100301 void Add(Entry value) {
David Srbeckydd966bc2018-05-24 13:55:52 +0100302 rows_.push_back(value);
David Srbecky052f8ca2018-04-26 15:42:54 +0100303 }
304
David Srbecky159c9dd2018-05-24 14:56:51 +0100305 // Append given list of values and return the index of the first value.
306 // If the exact same set of values was already added, return the old index.
David Srbeckyf325e282018-06-13 15:02:32 +0100307 uint32_t Dedup(Entry* values, size_t count = 1) {
David Srbecky159c9dd2018-05-24 14:56:51 +0100308 FNVHash<MemoryRegion> hasher;
David Srbeckyf325e282018-06-13 15:02:32 +0100309 uint32_t hash = hasher(MemoryRegion(values, sizeof(Entry) * count));
David Srbecky159c9dd2018-05-24 14:56:51 +0100310
311 // Check if we have already added identical set of values.
312 auto range = dedup_.equal_range(hash);
313 for (auto it = range.first; it != range.second; ++it) {
314 uint32_t index = it->second;
315 if (count <= size() - index &&
316 std::equal(values,
317 values + count,
David Srbecky5f937102018-06-02 10:24:25 +0100318 rows_.begin() + index,
David Srbeckyf325e282018-06-13 15:02:32 +0100319 [](const Entry& lhs, const Entry& rhs) {
320 return memcmp(&lhs, &rhs, sizeof(Entry)) == 0;
David Srbecky159c9dd2018-05-24 14:56:51 +0100321 })) {
322 return index;
323 }
324 }
325
326 // Add the set of values and add the index to the dedup map.
327 uint32_t index = size();
328 rows_.insert(rows_.end(), values, values + count);
329 dedup_.emplace(hash, index);
330 return index;
331 }
332
David Srbeckyf325e282018-06-13 15:02:32 +0100333 uint32_t Dedup(Entry value) {
334 return Dedup(&value, /* count */ 1);
David Srbecky052f8ca2018-04-26 15:42:54 +0100335 }
336
David Srbeckydd966bc2018-05-24 13:55:52 +0100337 // Calculate the column bit widths based on the current data.
David Srbecky6c4ec5c2019-06-20 07:23:19 +0000338 void Measure(/*out*/ uint32_t* column_bits) const {
David Srbeckydd966bc2018-05-24 13:55:52 +0100339 uint32_t max_column_value[kNumColumns];
340 std::fill_n(max_column_value, kNumColumns, 0);
341 for (uint32_t r = 0; r < size(); r++) {
342 for (uint32_t c = 0; c < kNumColumns; c++) {
David Srbeckycf7833e2018-06-14 16:45:22 +0100343 max_column_value[c] |= rows_[r][c] - kValueBias;
David Srbeckydd966bc2018-05-24 13:55:52 +0100344 }
345 }
346 for (uint32_t c = 0; c < kNumColumns; c++) {
David Srbecky6c4ec5c2019-06-20 07:23:19 +0000347 column_bits[c] = MinimumBitsToStore(max_column_value[c]);
David Srbeckydd966bc2018-05-24 13:55:52 +0100348 }
349 }
350
351 // Encode the stored data into a BitTable.
David Srbecky052f8ca2018-04-26 15:42:54 +0100352 template<typename Vector>
David Srbecky078d7ba2018-06-21 15:36:48 +0100353 void Encode(BitMemoryWriter<Vector>& out) const {
David Srbeckyd1606412018-07-31 15:05:14 +0100354 size_t initial_bit_offset = out.NumberOfWrittenBits();
David Srbeckydd966bc2018-05-24 13:55:52 +0100355
David Srbecky697c47a2019-06-16 21:53:07 +0100356 // Write table header.
David Srbecky6c4ec5c2019-06-20 07:23:19 +0000357 std::array<uint32_t, 1 + kNumColumns> header;
358 header[0] = size();
359 uint32_t* column_bits = header.data() + 1;
360 Measure(column_bits);
361 out.WriteInterleavedVarints(header);
David Srbecky697c47a2019-06-16 21:53:07 +0100362
363 // Write table data.
364 for (uint32_t r = 0; r < size(); r++) {
365 for (uint32_t c = 0; c < kNumColumns; c++) {
366 out.WriteBits(rows_[r][c] - kValueBias, column_bits[c]);
David Srbecky052f8ca2018-04-26 15:42:54 +0100367 }
368 }
David Srbeckydd966bc2018-05-24 13:55:52 +0100369
David Srbecky052f8ca2018-04-26 15:42:54 +0100370 // Verify the written data.
371 if (kIsDebugBuild) {
David Srbeckycf7833e2018-06-14 16:45:22 +0100372 BitTableBase<kNumColumns> table;
David Srbeckyd1606412018-07-31 15:05:14 +0100373 BitMemoryReader reader(out.GetWrittenRegion().Subregion(initial_bit_offset));
David Srbecky078d7ba2018-06-21 15:36:48 +0100374 table.Decode(reader);
David Srbeckydd966bc2018-05-24 13:55:52 +0100375 DCHECK_EQ(size(), table.NumRows());
David Srbecky052f8ca2018-04-26 15:42:54 +0100376 for (uint32_t c = 0; c < kNumColumns; c++) {
377 DCHECK_EQ(column_bits[c], table.NumColumnBits(c));
378 }
David Srbeckydd966bc2018-05-24 13:55:52 +0100379 for (uint32_t r = 0; r < size(); r++) {
David Srbecky052f8ca2018-04-26 15:42:54 +0100380 for (uint32_t c = 0; c < kNumColumns; c++) {
David Srbeckyf325e282018-06-13 15:02:32 +0100381 DCHECK_EQ(rows_[r][c], table.Get(r, c)) << " (" << r << ", " << c << ")";
David Srbecky052f8ca2018-04-26 15:42:54 +0100382 }
383 }
384 }
385 }
386
387 protected:
David Srbeckyf325e282018-06-13 15:02:32 +0100388 ScopedArenaDeque<Entry> rows_;
David Srbecky159c9dd2018-05-24 14:56:51 +0100389 ScopedArenaUnorderedMultimap<uint32_t, uint32_t> dedup_; // Hash -> row index.
David Srbecky052f8ca2018-04-26 15:42:54 +0100390};
391
David Srbeckycf7833e2018-06-14 16:45:22 +0100392template<typename Accessor>
393class BitTableBuilder : public BitTableBuilderBase<Accessor::kNumColumns> {
394 public:
395 using BitTableBuilderBase<Accessor::kNumColumns>::BitTableBuilderBase; // Constructors.
396};
397
David Srbecky5513c2b2018-05-24 15:03:20 +0100398// Helper class for encoding single-column BitTable of bitmaps (allows more than 32 bits).
399class BitmapTableBuilder {
400 public:
401 explicit BitmapTableBuilder(ScopedArenaAllocator* const allocator)
402 : allocator_(allocator),
403 rows_(allocator->Adapter(kArenaAllocBitTableBuilder)),
404 dedup_(8, allocator_->Adapter(kArenaAllocBitTableBuilder)) {
405 }
406
407 MemoryRegion operator[](size_t row) { return rows_[row]; }
408 const MemoryRegion operator[](size_t row) const { return rows_[row]; }
409 size_t size() const { return rows_.size(); }
410
411 // Add the given bitmap to the table and return its index.
412 // If the bitmap was already added it will be deduplicated.
413 // The last bit must be set and any padding bits in the last byte must be zero.
414 uint32_t Dedup(const void* bitmap, size_t num_bits) {
415 MemoryRegion region(const_cast<void*>(bitmap), BitsToBytesRoundUp(num_bits));
416 DCHECK(num_bits == 0 || BitMemoryRegion(region).LoadBit(num_bits - 1) == 1);
417 DCHECK_EQ(BitMemoryRegion(region).LoadBits(num_bits, region.size_in_bits() - num_bits), 0u);
418 FNVHash<MemoryRegion> hasher;
419 uint32_t hash = hasher(region);
420
421 // Check if we have already added identical bitmap.
422 auto range = dedup_.equal_range(hash);
423 for (auto it = range.first; it != range.second; ++it) {
424 if (MemoryRegion::ContentEquals()(region, rows_[it->second])) {
425 return it->second;
426 }
427 }
428
429 // Add the bitmap and add the index to the dedup map.
430 uint32_t index = size();
431 void* copy = allocator_->Alloc(region.size(), kArenaAllocBitTableBuilder);
432 memcpy(copy, region.pointer(), region.size());
433 rows_.push_back(MemoryRegion(copy, region.size()));
434 dedup_.emplace(hash, index);
435 max_num_bits_ = std::max(max_num_bits_, num_bits);
436 return index;
437 }
438
439 // Encode the stored data into a BitTable.
440 template<typename Vector>
David Srbecky078d7ba2018-06-21 15:36:48 +0100441 void Encode(BitMemoryWriter<Vector>& out) const {
David Srbeckyd1606412018-07-31 15:05:14 +0100442 size_t initial_bit_offset = out.NumberOfWrittenBits();
David Srbecky5513c2b2018-05-24 15:03:20 +0100443
David Srbecky697c47a2019-06-16 21:53:07 +0100444 // Write table header.
David Srbecky6c4ec5c2019-06-20 07:23:19 +0000445 out.WriteInterleavedVarints(std::array<uint32_t, 2>{
446 dchecked_integral_cast<uint32_t>(size()),
447 dchecked_integral_cast<uint32_t>(max_num_bits_),
448 });
David Srbecky5513c2b2018-05-24 15:03:20 +0100449
David Srbecky697c47a2019-06-16 21:53:07 +0100450 // Write table data.
451 for (MemoryRegion row : rows_) {
Roland Levillain8c7f6492022-03-14 12:14:36 +0000452 BitMemoryRegion src(row);
David Srbecky697c47a2019-06-16 21:53:07 +0100453 BitMemoryRegion dst = out.Allocate(max_num_bits_);
Roland Levillain8c7f6492022-03-14 12:14:36 +0000454 dst.StoreBits(/* bit_offset */ 0, src, std::min(max_num_bits_, src.size_in_bits()));
David Srbecky5513c2b2018-05-24 15:03:20 +0100455 }
456
457 // Verify the written data.
458 if (kIsDebugBuild) {
David Srbeckycf7833e2018-06-14 16:45:22 +0100459 BitTableBase<1> table;
David Srbeckyd1606412018-07-31 15:05:14 +0100460 BitMemoryReader reader(out.GetWrittenRegion().Subregion(initial_bit_offset));
David Srbecky078d7ba2018-06-21 15:36:48 +0100461 table.Decode(reader);
David Srbecky5513c2b2018-05-24 15:03:20 +0100462 DCHECK_EQ(size(), table.NumRows());
463 DCHECK_EQ(max_num_bits_, table.NumColumnBits(0));
464 for (uint32_t r = 0; r < size(); r++) {
465 BitMemoryRegion expected(rows_[r]);
466 BitMemoryRegion seen = table.GetBitMemoryRegion(r);
467 size_t num_bits = std::max(expected.size_in_bits(), seen.size_in_bits());
468 for (size_t b = 0; b < num_bits; b++) {
469 bool e = b < expected.size_in_bits() && expected.LoadBit(b);
470 bool s = b < seen.size_in_bits() && seen.LoadBit(b);
471 DCHECK_EQ(e, s) << " (" << r << ")[" << b << "]";
472 }
473 }
474 }
475 }
476
477 private:
478 ScopedArenaAllocator* const allocator_;
479 ScopedArenaDeque<MemoryRegion> rows_;
480 ScopedArenaUnorderedMultimap<uint32_t, uint32_t> dedup_; // Hash -> row index.
481 size_t max_num_bits_ = 0u;
482};
483
David Srbecky052f8ca2018-04-26 15:42:54 +0100484} // namespace art
485
486#endif // ART_LIBARTBASE_BASE_BIT_TABLE_H_