Skip to content

Commit

Permalink
Merge pull request #154 from bits-and-blooms/rankselect
Browse files Browse the repository at this point in the history
Adds support for rank/select queries
  • Loading branch information
lemire authored Dec 25, 2023
2 parents 4c5f79a + d601532 commit f70586a
Show file tree
Hide file tree
Showing 3 changed files with 119 additions and 3 deletions.
40 changes: 37 additions & 3 deletions bitset.go
Original file line number Diff line number Diff line change
Expand Up @@ -94,17 +94,17 @@ func (b *BitSet) SetBitsetFrom(buf []uint64) {
b.set = buf
}

// From is a constructor used to create a BitSet from an array of integers
// From is a constructor used to create a BitSet from an array of words
func From(buf []uint64) *BitSet {
return FromWithLength(uint(len(buf))*64, buf)
}

// FromWithLength constructs from an array of integers and length.
// FromWithLength constructs from an array of words and length.
func FromWithLength(len uint, set []uint64) *BitSet {
return &BitSet{len, set}
}

// Bytes returns the bitset as array of integers
// Bytes returns the bitset as array of words
func (b *BitSet) Bytes() []uint64 {
return b.set
}
Expand Down Expand Up @@ -1147,3 +1147,37 @@ func (b *BitSet) UnmarshalJSON(data []byte) error {
_, err = b.ReadFrom(bytes.NewReader(buf))
return err
}

// Rank returns the nunber of set bits up to and including the index
// that are set in the bitset.
// See https://en.wikipedia.org/wiki/Ranking#Ranking_in_statistics
func (b *BitSet) Rank(index uint) uint {
if index >= b.length {
return b.Count()
}
leftover := (index + 1) & 63
answer := uint(popcntSlice(b.set[:(index+1)>>6]))
if leftover != 0 {
answer += uint(popcount(b.set[(index+1)>>6] << (64 - leftover)))
}
return answer
}

// Select returns the index of the jth set bit, where j is the argument.
// The caller is responsible to ensure that 0 <= j < Count(): when j is
// out of range, the function returns the length of the bitset (b.length).
//
// Note that this function differs in convention from the Rank function which
// returns 1 when ranking the smallest value. We follow the conventional
// textbook definition of Select and Rank.
func (b *BitSet) Select(index uint) uint {
leftover := index
for idx, word := range b.set {
w := uint(popcount(word))
if w > leftover {
return uint(idx)*64 + select64(word, leftover)
}
leftover -= w
}
return b.length
}
37 changes: 37 additions & 0 deletions bitset_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -1497,6 +1497,43 @@ func TestClearAll(t *testing.T) {
}
}

func TestRankSelect(t *testing.T) {
u := []uint{2, 3, 5, 7, 11, 700, 1500}
b := BitSet{}
for _, v := range u {
b.Set(v)
}

if b.Rank(5) != 3 {
t.Error("Unexpected rank")
return
}
if b.Rank(6) != 3 {
t.Error("Unexpected rank")
return
}
if b.Rank(1500) != 7 {
t.Error("Unexpected rank")
return
}
if b.Select(0) != 2 {
t.Error("Unexpected select")
return
}
if b.Select(1) != 3 {
t.Error("Unexpected select")
return
}
if b.Select(2) != 5 {
t.Error("Unexpected select")
return
}

if b.Select(5) != 700 {
t.Error("Unexpected select")
return
}
}
func TestFlip(t *testing.T) {
b := new(BitSet)
c := b.Flip(11)
Expand Down
45 changes: 45 additions & 0 deletions select.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,45 @@
package bitset

func select64(w uint64, j uint) uint {
seen := 0
// Divide 64bit
part := w & 0xFFFFFFFF
n := uint(popcount(part))
if n <= j {
part = w >> 32
seen += 32
j -= n
}
ww := part

// Divide 32bit
part = ww & 0xFFFF

n = uint(popcount(part))
if n <= j {
part = ww >> 16
seen += 16
j -= n
}
ww = part

// Divide 16bit
part = ww & 0xFF
n = uint(popcount(part))
if n <= j {
part = ww >> 8
seen += 8
j -= n
}
ww = part

// Lookup in final byte
counter := 0
for ; counter < 8; counter++ {
j -= uint((ww >> counter) & 1)
if j+1 == 0 {
break
}
}
return uint(seen + counter)
}

0 comments on commit f70586a

Please sign in to comment.