github.com/Schaudge/grailbase@v0.0.0-20240223061707-44c758a471c0/bitset/bitset.go (about) 1 // Copyright 2022 GRAIL, Inc. All rights reserved. 2 // Use of this source code is governed by the Apache-2.0 3 // license that can be found in the LICENSE file. 4 5 // This is similar to github.com/willf/bitset , but with some extraneous 6 // abstraction removed. See also simd/count_amd64.go. 7 // 8 // ([]byte <-> []uintptr adapters will be added when needed.) 9 10 package bitset 11 12 import ( 13 "math/bits" 14 ) 15 16 // BitsPerWord is the number of bits in a machine word. 17 const BitsPerWord = 64 18 19 // Log2BitsPerWord is log_2(BitsPerWord). 20 const Log2BitsPerWord = uint(6) 21 22 // Set sets the given bit in a []uintptr bitset. 23 func Set(data []uintptr, bitIdx int) { 24 // Unsigned division by a power-of-2 constant compiles to a right-shift, 25 // while signed does not due to negative nastiness. 26 data[uint(bitIdx)/BitsPerWord] |= 1 << (uint(bitIdx) % BitsPerWord) 27 } 28 29 // Clear clears the given bit in a []uintptr bitset. 30 func Clear(data []uintptr, bitIdx int) { 31 wordIdx := uint(bitIdx) / BitsPerWord 32 data[wordIdx] = data[wordIdx] &^ (1 << (uint(bitIdx) % BitsPerWord)) 33 } 34 35 // Test returns true iff the given bit is set. 36 func Test(data []uintptr, bitIdx int) bool { 37 return (data[uint(bitIdx)/BitsPerWord] & (1 << (uint(bitIdx) % BitsPerWord))) != 0 38 } 39 40 // SetInterval sets the bits at all positions in [startIdx, limitIdx) in a 41 // []uintptr bitset. 42 func SetInterval(data []uintptr, startIdx, limitIdx int) { 43 if startIdx >= limitIdx { 44 return 45 } 46 startWordIdx := startIdx >> Log2BitsPerWord 47 startBit := uintptr(1) << uint32(startIdx&(BitsPerWord-1)) 48 limitWordIdx := limitIdx >> Log2BitsPerWord 49 limitBit := uintptr(1) << uint32(limitIdx&(BitsPerWord-1)) 50 if startWordIdx == limitWordIdx { 51 // We can't fill all bits from startBit on in the first word, since the 52 // limit is also within this word. 53 data[startWordIdx] |= limitBit - startBit 54 return 55 } 56 // Fill all bits from startBit on in the first word. 57 data[startWordIdx] |= -startBit 58 // Fill all bits in intermediate words. 59 // (todo: ensure compiler doesn't insert pointless slice bounds-checks on 60 // every iteration) 61 for wordIdx := startWordIdx + 1; wordIdx < limitWordIdx; wordIdx++ { 62 data[wordIdx] = ^uintptr(0) 63 } 64 // Fill just the bottom bits in the last word, if necessary. 65 if limitBit != 1 { 66 data[limitWordIdx] |= limitBit - 1 67 } 68 } 69 70 // ClearInterval clears the bits at all positions in [startIdx, limitIdx) in a 71 // []uintptr bitset. 72 func ClearInterval(data []uintptr, startIdx, limitIdx int) { 73 if startIdx >= limitIdx { 74 return 75 } 76 startWordIdx := startIdx >> Log2BitsPerWord 77 startBit := uintptr(1) << uint32(startIdx&(BitsPerWord-1)) 78 limitWordIdx := limitIdx >> Log2BitsPerWord 79 limitBit := uintptr(1) << uint32(limitIdx&(BitsPerWord-1)) 80 if startWordIdx == limitWordIdx { 81 // We can't clear all bits from startBit on in the first word, since the 82 // limit is also within this word. 83 data[startWordIdx] &= ^(limitBit - startBit) 84 return 85 } 86 // Clear all bits from startBit on in the first word. 87 data[startWordIdx] &= startBit - 1 88 // Clear all bits in intermediate words. 89 for wordIdx := startWordIdx + 1; wordIdx < limitWordIdx; wordIdx++ { 90 data[wordIdx] = 0 91 } 92 // Clear just the bottom bits in the last word, if necessary. 93 if limitBit != 1 { 94 data[limitWordIdx] &= -limitBit 95 } 96 } 97 98 // NewClearBits creates a []uintptr bitset with capacity for at least nBit 99 // bits, and all bits clear. 100 func NewClearBits(nBit int) []uintptr { 101 nWord := (nBit + BitsPerWord - 1) / BitsPerWord 102 return make([]uintptr, nWord) 103 } 104 105 // NewSetBits creates a []uintptr bitset with capacity for at least nBit bits, 106 // and all bits at positions [0, nBit) set. 107 func NewSetBits(nBit int) []uintptr { 108 data := NewClearBits(nBit) 109 SetInterval(data, 0, nBit) 110 return data 111 } 112 113 // NonzeroWordScanner iterates over and clears the set bits in a bitset, with 114 // the somewhat unusual precondition that the number of nonzero words is known 115 // in advance. The 'BitsetScanner' name is being reserved for a scanner which 116 // expects the number of set bits to be known instead. 117 // 118 // Note that, when many bits are set, a more complicated double-loop based 119 // around a function like willf/bitset.NextSetMany() has ~40% less overhead (at 120 // least with Go 1.10 on a Mac), and you can do even better with manual 121 // inlining of the iteration logic. As a consequence, it shouldn't be used 122 // when the bit iteration/clearing process is actually the dominant 123 // computational cost (and neither should NextSetMany(), manual inlining is 124 // 2-6x better without much more code, see bitsetManualInlineSubtask() in 125 // bitset_test.go for an example). However, it's a good choice everywhere 126 // else, outperforming the other scanners I'm aware of with similar ease of 127 // use, and maybe a future Go version will inline it properly. 128 type NonzeroWordScanner struct { 129 // data is the original bitset. 130 data []uintptr 131 // bitIdxOffset is BitsPerWord times the current data[] array index. 132 bitIdxOffset int 133 // bitWord is bits[bitIdxOffset / BitsPerWord], with already-iterated-over 134 // bits cleared. 135 bitWord uintptr 136 // nNonzeroWord is the number of nonzero words remaining in data[]. 137 nNonzeroWord int 138 } 139 140 // NewNonzeroWordScanner returns a NonzeroWordScanner for the given bitset, 141 // along with the position of the first bit. (This interface has been chosen 142 // to make for loops with properly-scoped variables easy to write.) 143 // 144 // The bitset is expected to be nonempty; otherwise this will crash the program 145 // with an out-of-bounds slice access. Similarly, if nNonzeroWord is larger 146 // than the actual number of nonzero words, or initially <= 0, the standard for 147 // loop will crash the program. (If nNonzeroWord is smaller but >0, the last 148 // nonzero words will be ignored.) 149 func NewNonzeroWordScanner(data []uintptr, nNonzeroWord int) (NonzeroWordScanner, int) { 150 for wordIdx := 0; ; wordIdx++ { 151 bitWord := data[wordIdx] 152 if bitWord != 0 { 153 bitIdxOffset := wordIdx * BitsPerWord 154 return NonzeroWordScanner{ 155 data: data, 156 bitIdxOffset: bitIdxOffset, 157 bitWord: bitWord & (bitWord - 1), 158 nNonzeroWord: nNonzeroWord, 159 }, bits.TrailingZeros64(uint64(bitWord)) + bitIdxOffset 160 } 161 } 162 } 163 164 // Next returns the position of the next set bit, or -1 if there aren't any. 165 func (s *NonzeroWordScanner) Next() int { 166 bitWord := s.bitWord 167 if bitWord == 0 { 168 wordIdx := int(uint(s.bitIdxOffset) / BitsPerWord) 169 s.data[wordIdx] = 0 170 s.nNonzeroWord-- 171 if s.nNonzeroWord == 0 { 172 // All words with set bits are accounted for, we can exit early. 173 // This is deliberately == 0 instead of <= 0 since it'll only be less 174 // than zero if there's a bug in the caller. We want to crash with an 175 // out-of-bounds access in that case. 176 return -1 177 } 178 for { 179 wordIdx++ 180 bitWord = s.data[wordIdx] 181 if bitWord != 0 { 182 break 183 } 184 } 185 s.bitIdxOffset = wordIdx * BitsPerWord 186 } 187 s.bitWord = bitWord & (bitWord - 1) 188 return bits.TrailingZeros64(uint64(bitWord)) + s.bitIdxOffset 189 }