apache · mapleFU · May 16, 2024 · May 17, 2024 · May 20, 2024 · May 21, 2024
diff --git a/cpp/src/arrow/util/bit_util.h b/cpp/src/arrow/util/bit_util.h
@@ -281,10 +281,22 @@ static inline int Log2(uint64_t x) {
 //
 
 // Bitmask selecting the k-th bit in a byte
-static constexpr uint8_t kBitmask[] = {1, 2, 4, 8, 16, 32, 64, 128};
+// Computed with a shift; replaces the former kBitmask[] lookup table.
+template <typename T>
+static constexpr uint8_t GetBitMask(T index) {
+  // Precondition (unchecked): 0 <= index <= 7.
+  ARROW_COMPILER_ASSUME(index >= 0);
+  return static_cast<uint8_t>(1u << index);  // shift result is wider; narrow explicitly
+}
 
 // the bitwise complement version of kBitmask
-static constexpr uint8_t kFlippedBitmask[] = {254, 253, 251, 247, 239, 223, 191, 127};
+// Computed with a shift; replaces the former kFlippedBitmask[] lookup table.
+template <typename T>
+static constexpr uint8_t GetFlippedBitMask(T index) {
+  // Precondition (unchecked): 0 <= index <= 7.
+  ARROW_COMPILER_ASSUME(index >= 0);
+  return static_cast<uint8_t>(~(1u << index));  // keep only the low byte of the complement
+}
 
 // Bitmask selecting the (k - 1) preceding bits in a byte
 static constexpr uint8_t kPrecedingBitmask[] = {0, 1, 3, 7, 15, 31, 63, 127};
@@ -299,22 +311,27 @@ static constexpr bool GetBit(const uint8_t* bits, uint64_t i) {
 
 // Gets the i-th bit from a byte. Should only be used with i <= 7.
 static constexpr bool GetBitFromByte(uint8_t byte, uint8_t i) {
-  return byte & kBitmask[i];
+  return byte & GetBitMask(i);  // nonzero (true) iff bit i of byte is set
 }
 
 static inline void ClearBit(uint8_t* bits, int64_t i) {
-  bits[i / 8] &= kFlippedBitmask[i % 8];
+  ARROW_COMPILER_ASSUME(i >= 0);  // precondition: bit index is non-negative
+  bits[i / 8] &= GetFlippedBitMask(i % 8);  // clear bit (i % 8) of byte (i / 8)
 }
 
-static inline void SetBit(uint8_t* bits, int64_t i) { bits[i / 8] |= kBitmask[i % 8]; }
+static inline void SetBit(uint8_t* bits, int64_t i) {
+  ARROW_COMPILER_ASSUME(i >= 0);  // precondition: bit index is non-negative
+  bits[i / 8] |= GetBitMask(i % 8);  // set bit (i % 8) of byte (i / 8)
+}
 
 static inline void SetBitTo(uint8_t* bits, int64_t i, bool bit_is_set) {
+  ARROW_COMPILER_ASSUME(i >= 0);  // precondition: bit index is non-negative
   // https://graphics.stanford.edu/~seander/bithacks.html
   // "Conditionally set or clear bits without branching"
   // NOTE: this seems to confuse Valgrind as it reads from potentially
   // uninitialized memory
   bits[i / 8] ^= static_cast<uint8_t>(-static_cast<uint8_t>(bit_is_set) ^ bits[i / 8]) &
-                 kBitmask[i % 8];
+                 GetBitMask(i % 8);  // restricts the update to bit (i % 8)
 }
 
 /// \brief set or clear a range of bits quickly

diff --git a/cpp/src/arrow/util/bitmap_generate.h b/cpp/src/arrow/util/bitmap_generate.h
@@ -39,7 +39,7 @@ void GenerateBits(uint8_t* bitmap, int64_t start_offset, int64_t length, Generat
     return;
   }
   uint8_t* cur = bitmap + start_offset / 8;
-  uint8_t bit_mask = bit_util::kBitmask[start_offset % 8];
+  uint8_t bit_mask = bit_util::GetBitMask(start_offset % 8);
   uint8_t current_byte = *cur & bit_util::kPrecedingBitmask[start_offset % 8];
 
   for (int64_t index = 0; index < length; ++index) {
@@ -71,7 +71,7 @@ void GenerateBitsUnrolled(uint8_t* bitmap, int64_t start_offset, int64_t length,
   uint8_t current_byte;
   uint8_t* cur = bitmap + start_offset / 8;
   const uint64_t start_bit_offset = start_offset % 8;
-  uint8_t bit_mask = bit_util::kBitmask[start_bit_offset];
+  uint8_t bit_mask = bit_util::GetBitMask(start_bit_offset);
   int64_t remaining = length;
 
   if (bit_mask != 0x01) {

diff --git a/cpp/src/arrow/util/bitmap_writer.h b/cpp/src/arrow/util/bitmap_writer.h
@@ -34,7 +34,7 @@ class BitmapWriter {
   BitmapWriter(uint8_t* bitmap, int64_t start_offset, int64_t length)
       : bitmap_(bitmap), position_(0), length_(length) {
     byte_offset_ = start_offset / 8;
-    bit_mask_ = bit_util::kBitmask[start_offset % 8];
+    bit_mask_ = bit_util::GetBitMask(start_offset % 8);
     if (length > 0) {
       current_byte_ = bitmap[byte_offset_];
     } else {
@@ -88,7 +88,7 @@ class FirstTimeBitmapWriter {
       : bitmap_(bitmap), position_(0), length_(length) {
     current_byte_ = 0;
     byte_offset_ = start_offset / 8;
-    bit_mask_ = bit_util::kBitmask[start_offset % 8];
+    bit_mask_ = bit_util::GetBitMask(start_offset % 8);
     if (length > 0) {
       current_byte_ =
           bitmap[byte_offset_] & bit_util::kPrecedingBitmask[start_offset % 8];
@@ -113,7 +113,7 @@ class FirstTimeBitmapWriter {
     // Update state variables except for current_byte_ here.
     position_ += number_of_bits;
     int64_t bit_offset = bit_util::CountTrailingZeros(static_cast<uint32_t>(bit_mask_));
-    bit_mask_ = bit_util::kBitmask[(bit_offset + number_of_bits) % 8];
+    bit_mask_ = bit_util::GetBitMask((bit_offset + number_of_bits) % 8);
     byte_offset_ += (bit_offset + number_of_bits) / 8;
 
     if (bit_offset != 0) {