me-main #1

Merged
Nate Rupsis merged 123 commits from me-main into main 2023-02-13 18:39:11 +01:00
Showing only changes of commit f0669ff8ba - Show all commits

View File

@ -16,13 +16,13 @@
* *
* The compact nature of storing bools in individual bits has some downsides that have to be kept * The compact nature of storing bools in individual bits has some downsides that have to be kept
* in mind: * in mind:
* - Writing to separate bits in the same byte is not thread-safe. Therefore, an existing vector of * - Writing to separate bits in the same int is not thread-safe. Therefore, an existing vector of
* bool can't easily be replaced with a bit vector, if it is written to from multiple threads. * bool can't easily be replaced with a bit vector, if it is written to from multiple threads.
* Read-only access from multiple threads is fine though. * Read-only access from multiple threads is fine though.
* - Writing individual elements is more expensive when the array is in cache already. That is * - Writing individual elements is more expensive when the array is in cache already. That is
* because changing a bit is always a read-modify-write operation on the byte the bit resides in. * because changing a bit is always a read-modify-write operation on the int the bit resides in.
* - Reading individual elements is more expensive when the array is in cache already. That is * - Reading individual elements is more expensive when the array is in cache already. That is
* because additional bit-wise operations have to be applied after the corresponding byte is * because additional bit-wise operations have to be applied after the corresponding int is
* read. * read.
* *
* Comparison to `std::vector<bool>`: * Comparison to `std::vector<bool>`:
@ -42,18 +42,27 @@
#include "BLI_memory_utils.hh" #include "BLI_memory_utils.hh"
#include "BLI_span.hh" #include "BLI_span.hh"
namespace blender { namespace blender::bits {
/** /**
* This is a read-only pointer to a specific bit. The value of the bit can be retrieved, but not * Using a large integer type is better because then it's easier to process many bits at once.
* changed. */
using IntType = uint64_t;
static constexpr int64_t BitsPerInt = int64_t(sizeof(IntType) * 8);
static constexpr int64_t BitToIntIndexShift = 3 + (sizeof(IntType) >= 2) + (sizeof(IntType) >= 4) +
(sizeof(IntType) >= 8);
static constexpr IntType BitIndexMask = (IntType(1) << BitToIntIndexShift) - 1;
/**
* This is a read-only pointer to a specific bit. The value of the bit can be retrieved, but
* not changed.
*/ */
class BitRef { class BitRef {
private: private:
/** Points to the exact byte that the bit is in. */ /** Points to the integer that the bit is in. */
const uint8_t *byte_ptr_; const IntType *ptr_;
/** All zeros except for a single one at the bit that is referenced. */ /** All zeros except for a single one at the bit that is referenced. */
uint8_t mask_; IntType mask_;
friend class MutableBitRef; friend class MutableBitRef;
@ -61,13 +70,13 @@ class BitRef {
BitRef() = default; BitRef() = default;
/** /**
* Reference a specific bit in a byte array. Note that #byte_ptr does *not* have to point to the * Reference a specific bit in an array. Note that #ptr does *not* have to point to the
* exact byte the bit is in. * exact integer the bit is in.
*/ */
BitRef(const uint8_t *byte_ptr, const int64_t bit_index) BitRef(const IntType *ptr, const int64_t bit_index)
{ {
byte_ptr_ = byte_ptr + (bit_index >> 3); ptr_ = ptr + (bit_index >> BitToIntIndexShift);
mask_ = 1 << (bit_index & 7); mask_ = IntType(1) << (bit_index & BitIndexMask);
} }
/** /**
@ -75,9 +84,9 @@ class BitRef {
*/ */
bool test() const bool test() const
{ {
const uint8_t byte = *byte_ptr_; const IntType value = *ptr_;
const uint8_t masked_byte = byte & mask_; const IntType masked_value = value & mask_;
return masked_byte != 0; return masked_value != 0;
} }
operator bool() const operator bool() const
@ -91,22 +100,22 @@ class BitRef {
*/ */
class MutableBitRef { class MutableBitRef {
private: private:
/** Points to the exact byte that the bit is in. */ /** Points to the integer that the bit is in. */
uint8_t *byte_ptr_; IntType *ptr_;
/** All zeros except for a single one at the bit that is referenced. */ /** All zeros except for a single one at the bit that is referenced. */
uint8_t mask_; IntType mask_;
public: public:
MutableBitRef() = default; MutableBitRef() = default;
/** /**
* Reference a specific bit in a byte array. Note that #byte_ptr does *not* have to point to the * Reference a specific bit in an array. Note that #ptr does *not* have to point to the
* exact byte the bit is in. * exact int the bit is in.
*/ */
MutableBitRef(uint8_t *byte_ptr, const int64_t bit_index) MutableBitRef(IntType *ptr, const int64_t bit_index)
{ {
byte_ptr_ = byte_ptr + (bit_index >> 3); ptr_ = ptr + (bit_index >> BitToIntIndexShift);
mask_ = 1 << uint8_t(bit_index & 7); mask_ = IntType(1) << IntType(bit_index & BitIndexMask);
} }
/** /**
@ -115,7 +124,7 @@ class MutableBitRef {
operator BitRef() const operator BitRef() const
{ {
BitRef bit_ref; BitRef bit_ref;
bit_ref.byte_ptr_ = byte_ptr_; bit_ref.ptr_ = ptr_;
bit_ref.mask_ = mask_; bit_ref.mask_ = mask_;
return bit_ref; return bit_ref;
} }
@ -125,9 +134,9 @@ class MutableBitRef {
*/ */
bool test() const bool test() const
{ {
const uint8_t byte = *byte_ptr_; const IntType value = *ptr_;
const uint8_t masked_byte = byte & mask_; const IntType masked_value = value & mask_;
return masked_byte != 0; return masked_value != 0;
} }
operator bool() const operator bool() const
@ -140,7 +149,7 @@ class MutableBitRef {
*/ */
void set() void set()
{ {
*byte_ptr_ |= mask_; *ptr_ |= mask_;
} }
/** /**
@ -148,7 +157,7 @@ class MutableBitRef {
*/ */
void reset() void reset()
{ {
*byte_ptr_ &= ~mask_; *ptr_ &= ~mask_;
} }
/** /**
@ -177,21 +186,20 @@ template<
typename Allocator = GuardedAllocator> typename Allocator = GuardedAllocator>
class BitVector { class BitVector {
private: private:
static constexpr int64_t required_bytes_for_bits(const int64_t number_of_bits) static constexpr int64_t required_ints_for_bits(const int64_t number_of_bits)
{ {
return (number_of_bits + BitsPerByte - 1) / BitsPerByte; return (number_of_bits + BitsPerInt - 1) / BitsPerInt;
} }
static constexpr int64_t BitsPerByte = 8; static constexpr int64_t IntsInInlineBuffer = required_ints_for_bits(InlineBufferCapacity);
static constexpr int64_t BytesInInlineBuffer = required_bytes_for_bits(InlineBufferCapacity); static constexpr int64_t BitsInInlineBuffer = IntsInInlineBuffer * BitsPerInt;
static constexpr int64_t BitsInInlineBuffer = BytesInInlineBuffer * BitsPerByte; static constexpr int64_t AllocationAlignment = alignof(IntType);
static constexpr int64_t AllocationAlignment = 8;
/** /**
* Points to the first byte used by the vector. It might point to the memory in the inline * Points to the first integer used by the vector. It might point to the memory in the inline
* buffer. * buffer.
*/ */
uint8_t *data_; IntType *data_;
/** Current size of the vector in bits. */ /** Current size of the vector in bits. */
int64_t size_in_bits_; int64_t size_in_bits_;
@ -203,7 +211,7 @@ class BitVector {
BLI_NO_UNIQUE_ADDRESS Allocator allocator_; BLI_NO_UNIQUE_ADDRESS Allocator allocator_;
/** Contains the bits as long as the vector is small enough. */ /** Contains the bits as long as the vector is small enough. */
BLI_NO_UNIQUE_ADDRESS TypedBuffer<uint8_t, BytesInInlineBuffer> inline_buffer_; BLI_NO_UNIQUE_ADDRESS TypedBuffer<IntType, IntsInInlineBuffer> inline_buffer_;
public: public:
BitVector(Allocator allocator = {}) noexcept : allocator_(allocator) BitVector(Allocator allocator = {}) noexcept : allocator_(allocator)
@ -211,7 +219,7 @@ class BitVector {
data_ = inline_buffer_; data_ = inline_buffer_;
size_in_bits_ = 0; size_in_bits_ = 0;
capacity_in_bits_ = BitsInInlineBuffer; capacity_in_bits_ = BitsInInlineBuffer;
uninitialized_fill_n(data_, BytesInInlineBuffer, uint8_t(0)); uninitialized_fill_n(data_, IntsInInlineBuffer, IntType(0));
} }
BitVector(NoExceptConstructor, Allocator allocator = {}) noexcept : BitVector(allocator) BitVector(NoExceptConstructor, Allocator allocator = {}) noexcept : BitVector(allocator)
@ -220,29 +228,29 @@ class BitVector {
BitVector(const BitVector &other) : BitVector(NoExceptConstructor(), other.allocator_) BitVector(const BitVector &other) : BitVector(NoExceptConstructor(), other.allocator_)
{ {
const int64_t bytes_to_copy = other.used_bytes_amount(); const int64_t ints_to_copy = other.used_ints_amount();
if (other.size_in_bits_ <= BitsInInlineBuffer) { if (other.size_in_bits_ <= BitsInInlineBuffer) {
/* The data is copied into the owned inline buffer. */ /* The data is copied into the owned inline buffer. */
data_ = inline_buffer_; data_ = inline_buffer_;
capacity_in_bits_ = BitsInInlineBuffer; capacity_in_bits_ = BitsInInlineBuffer;
} }
else { else {
/* Allocate a new byte array because the inline buffer is too small. */ /* Allocate a new array because the inline buffer is too small. */
data_ = static_cast<uint8_t *>( data_ = static_cast<IntType *>(
allocator_.allocate(bytes_to_copy, AllocationAlignment, __func__)); allocator_.allocate(ints_to_copy * sizeof(IntType), AllocationAlignment, __func__));
capacity_in_bits_ = bytes_to_copy * BitsPerByte; capacity_in_bits_ = ints_to_copy * BitsPerInt;
} }
size_in_bits_ = other.size_in_bits_; size_in_bits_ = other.size_in_bits_;
uninitialized_copy_n(other.data_, bytes_to_copy, data_); uninitialized_copy_n(other.data_, ints_to_copy, data_);
} }
BitVector(BitVector &&other) noexcept : BitVector(NoExceptConstructor(), other.allocator_) BitVector(BitVector &&other) noexcept : BitVector(NoExceptConstructor(), other.allocator_)
{ {
if (other.is_inline()) { if (other.is_inline()) {
/* Copy the data into the inline buffer. */ /* Copy the data into the inline buffer. */
const int64_t bytes_to_copy = other.used_bytes_amount(); const int64_t ints_to_copy = other.used_ints_amount();
data_ = inline_buffer_; data_ = inline_buffer_;
uninitialized_copy_n(other.data_, bytes_to_copy, data_); uninitialized_copy_n(other.data_, ints_to_copy, data_);
} }
else { else {
/* Steal the pointer. */ /* Steal the pointer. */
@ -305,7 +313,7 @@ class BitVector {
bool is_empty() const bool is_empty() const
{ {
return this->size() == 0; return size_in_bits_ == 0;
} }
/** /**
@ -442,20 +450,20 @@ class BitVector {
*/ */
void fill_range(const IndexRange range, const bool value) void fill_range(const IndexRange range, const bool value)
{ {
const AlignedIndexRanges aligned_ranges = split_index_range_by_alignment(range, BitsPerByte); const AlignedIndexRanges aligned_ranges = split_index_range_by_alignment(range, BitsPerInt);
/* Fill first few bits. */ /* Fill first few bits. */
for (const int64_t i : aligned_ranges.prefix) { for (const int64_t i : aligned_ranges.prefix) {
(*this)[i].set(value); (*this)[i].set(value);
} }
/* Fill entire bytes at once. */ /* Fill entire ints at once. */
const int64_t start_fill_byte_index = aligned_ranges.aligned.start() / BitsPerByte; const int64_t start_fill_int_index = aligned_ranges.aligned.start() / BitsPerInt;
const int64_t bytes_to_fill = aligned_ranges.aligned.size() / BitsPerByte; const int64_t ints_to_fill = aligned_ranges.aligned.size() / BitsPerInt;
const uint8_t fill_value = value ? uint8_t(0xff) : uint8_t(0x00); const IntType fill_value = value ? IntType(-1) : IntType(0);
initialized_fill_n(data_ + start_fill_byte_index, bytes_to_fill, fill_value); initialized_fill_n(data_ + start_fill_int_index, ints_to_fill, fill_value);
/* Fill bits in the end that don't cover a full byte. */ /* Fill bits in the end that don't cover a full int. */
for (const int64_t i : aligned_ranges.suffix) { for (const int64_t i : aligned_ranges.suffix) {
(*this)[i].set(value); (*this)[i].set(value);
} }
@ -509,37 +517,35 @@ class BitVector {
} }
BLI_NOINLINE void realloc_to_at_least(const int64_t min_capacity_in_bits, BLI_NOINLINE void realloc_to_at_least(const int64_t min_capacity_in_bits,
const uint8_t initial_value_for_new_bytes = 0x00) const IntType initial_value_for_new_ints = 0x00)
{ {
if (capacity_in_bits_ >= min_capacity_in_bits) { if (capacity_in_bits_ >= min_capacity_in_bits) {
return; return;
} }
const int64_t min_capacity_in_bytes = this->required_bytes_for_bits(min_capacity_in_bits); const int64_t min_capacity_in_ints = this->required_ints_for_bits(min_capacity_in_bits);
/* At least double the size of the previous allocation. */ /* At least double the size of the previous allocation. */
const int64_t min_new_capacity_in_bytes = capacity_in_bits_ * 2; const int64_t min_new_capacity_in_ints = 2 * this->required_ints_for_bits(capacity_in_bits_);
const int64_t new_capacity_in_bytes = std::max(min_capacity_in_bytes, const int64_t new_capacity_in_ints = std::max(min_capacity_in_ints, min_new_capacity_in_ints);
min_new_capacity_in_bytes); const int64_t ints_to_copy = this->used_ints_amount();
const int64_t bytes_to_copy = this->used_bytes_amount();
uint8_t *new_data = static_cast<uint8_t *>( IntType *new_data = static_cast<IntType *>(allocator_.allocate(
allocator_.allocate(new_capacity_in_bytes, AllocationAlignment, __func__)); new_capacity_in_ints * sizeof(IntType), AllocationAlignment, __func__));
uninitialized_copy_n(data_, bytes_to_copy, new_data); uninitialized_copy_n(data_, ints_to_copy, new_data);
/* Always initialize new capacity even if it isn't used yet. That's necessary to avoid warnings /* Always initialize new capacity even if it isn't used yet. That's necessary to avoid warnings
* caused by using uninitialized memory. This happens when e.g. setting a clearing a bit in an * caused by using uninitialized memory. This happens when e.g. setting a clearing a bit in an
* uninitialized byte. */ * uninitialized int. */
uninitialized_fill_n(new_data + bytes_to_copy, uninitialized_fill_n(
new_capacity_in_bytes - bytes_to_copy, new_data + ints_to_copy, new_capacity_in_ints - ints_to_copy, initial_value_for_new_ints);
uint8_t(initial_value_for_new_bytes));
if (!this->is_inline()) { if (!this->is_inline()) {
allocator_.deallocate(data_); allocator_.deallocate(data_);
} }
data_ = new_data; data_ = new_data;
capacity_in_bits_ = new_capacity_in_bytes * BitsPerByte; capacity_in_bits_ = new_capacity_in_ints * BitsPerInt;
} }
bool is_inline() const bool is_inline() const
@ -547,10 +553,16 @@ class BitVector {
return data_ == inline_buffer_; return data_ == inline_buffer_;
} }
int64_t used_bytes_amount() const int64_t used_ints_amount() const
{ {
return this->required_bytes_for_bits(size_in_bits_); return this->required_ints_for_bits(size_in_bits_);
} }
}; };
} // namespace blender::bits
namespace blender {
using bits::BitRef;
using bits::BitVector;
using bits::MutableBitRef;
} // namespace blender } // namespace blender