Make the block size of vector<bool> consistent

This commit is contained in:
Patrick Niklaus 2018-03-23 12:02:20 +00:00
parent c0dd5d7c76
commit c322d93435
6 changed files with 49 additions and 39 deletions

View File

@ -94,7 +94,7 @@ class ContiguousInternalMemoryAlgorithmDataFacade<CH> : public datafacade::Algor
auto filter_block_id = static_cast<storage::DataLayout::BlockID>( auto filter_block_id = static_cast<storage::DataLayout::BlockID>(
storage::DataLayout::CH_EDGE_FILTER_0 + exclude_index); storage::DataLayout::CH_EDGE_FILTER_0 + exclude_index);
auto edge_filter_ptr = data_layout.GetBlockPtr<unsigned>(memory_block, filter_block_id); auto edge_filter_ptr = data_layout.GetBlockPtr<util::vector_view<bool>::Word>(memory_block, filter_block_id);
util::vector_view<GraphNode> node_list( util::vector_view<GraphNode> node_list(
graph_nodes_ptr, data_layout.GetBlockEntries(storage::DataLayout::CH_GRAPH_NODE_LIST)); graph_nodes_ptr, data_layout.GetBlockEntries(storage::DataLayout::CH_GRAPH_NODE_LIST));

View File

@ -129,21 +129,21 @@ void write(tar::FileWriter &writer, const std::string &name, const util::vector_
namespace detail namespace detail
{ {
template <typename T> template <typename T, typename BlockT = unsigned char>
inline unsigned char packBits(const T &data, std::size_t index, std::size_t count) inline BlockT packBits(const T &data, std::size_t index, std::size_t count)
{ {
static_assert(std::is_same<typename T::value_type, bool>::value, "value_type is not bool"); static_assert(std::is_same<typename T::value_type, bool>::value, "value_type is not bool");
unsigned char value = 0; BlockT value = 0;
for (std::size_t bit = 0; bit < count; ++bit, ++index) for (std::size_t bit = 0; bit < count; ++bit, ++index)
value = (value << 1) | data[index]; value = (value << 1) | data[index];
return value; return value;
} }
template <typename T> template <typename T, typename BlockT = unsigned char>
inline void unpackBits(T &data, std::size_t index, std::size_t count, unsigned char value) inline void unpackBits(T &data, std::size_t index, std::size_t count, BlockT value)
{ {
static_assert(std::is_same<typename T::value_type, bool>::value, "value_type is not bool"); static_assert(std::is_same<typename T::value_type, bool>::value, "value_type is not bool");
const unsigned char mask = 1 << (count - 1); const BlockT mask = BlockT {1} << (count - 1);
for (std::size_t bit = 0; bit < count; value <<= 1, ++bit, ++index) for (std::size_t bit = 0; bit < count; value <<= 1, ++bit, ++index)
data[index] = value & mask; data[index] = value & mask;
} }
@ -155,13 +155,15 @@ void readBoolVector(tar::FileReader &reader, const std::string &name, VectorT &d
data.resize(count); data.resize(count);
std::uint64_t index = 0; std::uint64_t index = 0;
const auto decode = [&](const unsigned char block) { constexpr std::uint64_t WORD_BITS = CHAR_BIT * sizeof(std::uint64_t);
auto read_size = std::min<std::size_t>(count - index, CHAR_BIT);
unpackBits(data, index, read_size, block); const auto decode = [&](const std::uint64_t block) {
index += CHAR_BIT; auto read_size = std::min<std::size_t>(count - index, WORD_BITS);
unpackBits<VectorT,std::uint64_t>(data, index, read_size, block);
index += WORD_BITS;
}; };
reader.ReadStreaming<unsigned char>(name, boost::make_function_output_iterator(decode)); reader.ReadStreaming<std::uint64_t>(name, boost::make_function_output_iterator(decode));
} }
template <typename VectorT> template <typename VectorT>
@ -171,17 +173,19 @@ void writeBoolVector(tar::FileWriter &writer, const std::string &name, const Vec
writer.WriteElementCount64(name, count); writer.WriteElementCount64(name, count);
std::uint64_t index = 0; std::uint64_t index = 0;
constexpr std::uint64_t WORD_BITS = CHAR_BIT * sizeof(std::uint64_t);
// FIXME on old boost version the function_input_iterator does not work with lambdas // FIXME on old boost version the function_input_iterator does not work with lambdas
// so we need to wrap it in a function here. // so we need to wrap it in a function here.
const std::function<char()> encode_function = [&]() -> char { const std::function<std::uint64_t()> encode_function = [&]() -> std::uint64_t {
auto write_size = std::min<std::size_t>(count - index, CHAR_BIT); auto write_size = std::min<std::size_t>(count - index, WORD_BITS);
auto packed = packBits(data, index, write_size); auto packed = packBits<VectorT, std::uint64_t>(data, index, write_size);
index += CHAR_BIT; index += WORD_BITS;
return packed; return packed;
}; };
std::uint64_t number_of_blocks = std::ceil((double)count / CHAR_BIT); std::uint64_t number_of_blocks = (count + WORD_BITS - 1) / WORD_BITS;
writer.WriteStreaming<unsigned char>( writer.WriteStreaming<std::uint64_t>(
name, name,
boost::make_function_input_iterator(encode_function, boost::infinite()), boost::make_function_input_iterator(encode_function, boost::infinite()),
number_of_blocks); number_of_blocks);

View File

@ -436,7 +436,7 @@ template <typename T, std::size_t Bits, storage::Ownership Ownership> class Pack
void resize(std::size_t elements) void resize(std::size_t elements)
{ {
num_elements = elements; num_elements = elements;
auto num_blocks = std::ceil(static_cast<double>(elements) / BLOCK_ELEMENTS); auto num_blocks = (elements + BLOCK_ELEMENTS - 1) / BLOCK_ELEMENTS;
vec.resize(num_blocks * BLOCK_WORDS + 1); vec.resize(num_blocks * BLOCK_WORDS + 1);
} }
@ -445,7 +445,7 @@ template <typename T, std::size_t Bits, storage::Ownership Ownership> class Pack
template <bool enabled = (Ownership == storage::Ownership::View)> template <bool enabled = (Ownership == storage::Ownership::View)>
void reserve(typename std::enable_if<!enabled, std::size_t>::type capacity) void reserve(typename std::enable_if<!enabled, std::size_t>::type capacity)
{ {
auto num_blocks = std::ceil(static_cast<double>(capacity) / BLOCK_ELEMENTS); auto num_blocks = (capacity + BLOCK_ELEMENTS - 1) / BLOCK_ELEMENTS;
vec.reserve(num_blocks * BLOCK_WORDS + 1); vec.reserve(num_blocks * BLOCK_WORDS + 1);
} }

View File

@ -150,11 +150,14 @@ template <typename DataT> class vector_view
template <> class vector_view<bool> template <> class vector_view<bool>
{ {
private: public:
unsigned *m_ptr; using Word = std::uint64_t;
std::size_t m_size;
static constexpr std::size_t UNSIGNED_BITS = CHAR_BIT * sizeof(unsigned); private:
static constexpr std::size_t WORD_BITS = CHAR_BIT * sizeof(Word);
Word *m_ptr;
std::size_t m_size;
public: public:
using value_type = bool; using value_type = bool;
@ -178,23 +181,23 @@ template <> class vector_view<bool>
return os << static_cast<bool>(rhs); return os << static_cast<bool>(rhs);
} }
unsigned *m_ptr; Word *m_ptr;
const unsigned mask; const Word mask;
}; };
vector_view() : m_ptr(nullptr), m_size(0) {} vector_view() : m_ptr(nullptr), m_size(0) {}
vector_view(unsigned *ptr, std::size_t size) : m_ptr(ptr), m_size(size) {} vector_view(Word *ptr, std::size_t size) : m_ptr(ptr), m_size(size) {}
bool at(const std::size_t index) const bool at(const std::size_t index) const
{ {
BOOST_ASSERT_MSG(index < m_size, "invalid size"); BOOST_ASSERT_MSG(index < m_size, "invalid size");
const std::size_t bucket = index / UNSIGNED_BITS; const std::size_t bucket = index / WORD_BITS;
const unsigned offset = index % UNSIGNED_BITS; const auto offset = index % WORD_BITS;
return m_ptr[bucket] & (1u << offset); return m_ptr[bucket] & (static_cast<Word>(1) << offset);
} }
void reset(unsigned *ptr, std::size_t size) void reset(std::uint64_t *ptr, std::size_t size)
{ {
m_ptr = ptr; m_ptr = ptr;
m_size = size; m_size = size;
@ -213,14 +216,14 @@ template <> class vector_view<bool>
bool empty() const { return 0 == size(); } bool empty() const { return 0 == size(); }
bool operator[](const unsigned index) const { return at(index); } bool operator[](const std::size_t index) const { return at(index); }
reference operator[](const unsigned index) reference operator[](const std::size_t index)
{ {
BOOST_ASSERT(index < m_size); BOOST_ASSERT(index < m_size);
const std::size_t bucket = index / UNSIGNED_BITS; const auto bucket = index / WORD_BITS;
const unsigned offset = index % UNSIGNED_BITS; const auto offset = index % WORD_BITS;
return reference{m_ptr + bucket, 1u << offset}; return reference{m_ptr + bucket, static_cast<Word>(1) << offset};
} }
template <typename T> friend void swap(vector_view<T> &, vector_view<T> &) noexcept; template <typename T> friend void swap(vector_view<T> &, vector_view<T> &) noexcept;

View File

@ -712,7 +712,7 @@ void Storage::PopulateData(const DataLayout &layout, char *memory_ptr)
{ {
auto block_id = auto block_id =
static_cast<DataLayout::BlockID>(storage::DataLayout::CH_EDGE_FILTER_0 + index); static_cast<DataLayout::BlockID>(storage::DataLayout::CH_EDGE_FILTER_0 + index);
auto data_ptr = layout.GetBlockPtr<unsigned, true>(memory_ptr, block_id); auto data_ptr = layout.GetBlockPtr<util::vector_view<bool>::Word, true>(memory_ptr, block_id);
auto num_entries = layout.GetBlockEntries(block_id); auto num_entries = layout.GetBlockEntries(block_id);
edge_filter.emplace_back(data_ptr, num_entries); edge_filter.emplace_back(data_ptr, num_entries);
} }

View File

@ -43,8 +43,11 @@ BOOST_AUTO_TEST_CASE(rw_short)
BOOST_AUTO_TEST_CASE(rw_bool) BOOST_AUTO_TEST_CASE(rw_bool)
{ {
std::size_t num_elements = 1000; std::size_t num_elements = 1000;
std::unique_ptr<char[]> data = std::make_unique<char[]>(num_elements / sizeof(std::uint32_t)); auto data = std::make_unique<typename vector_view<bool>::Word[]>(
util::vector_view<bool> view(reinterpret_cast<std::uint32_t *>(data.get()), num_elements); (num_elements + sizeof(typename vector_view<bool>::Word) - 1) /
sizeof(typename vector_view<bool>::Word));
util::vector_view<bool> view(reinterpret_cast<typename vector_view<bool>::Word *>(data.get()),
num_elements);
std::vector<bool> reference; std::vector<bool> reference;
std::mt19937 rng; std::mt19937 rng;