From 0bbc63af13c37d306bcf7397989e35c5046730a2 Mon Sep 17 00:00:00 2001 From: Andrzej Liszka Date: Thu, 5 Dec 2024 12:16:04 +0100 Subject: [PATCH] feature: native prefill method --- benchmark_opt_test.go | 27 ++++++++++++++ bitmap_opt.go | 84 +++++++++++++++++++++++++++++++++++++++++++ bitmap_opt_test.go | 22 ++++++++++++ 3 files changed, 133 insertions(+) diff --git a/benchmark_opt_test.go b/benchmark_opt_test.go index 49db81a..9135b57 100644 --- a/benchmark_opt_test.go +++ b/benchmark_opt_test.go @@ -5,6 +5,33 @@ import ( "testing" ) +// go test -v -bench BenchmarkPrefillNative -benchmem -run ^$ github.com/weaviate/sroar -cpuprofile cpu.prof +func BenchmarkPrefillNative(b *testing.B) { + for i := 0; i < b.N; i++ { + Prefill(200_000_000) + } +} + +// go test -v -bench BenchmarkPrefillFromSortedList -benchmem -run ^$ github.com/weaviate/sroar -cpuprofile cpu.prof +func BenchmarkPrefillFromSortedList(b *testing.B) { + prefillBufferSize := 65_536 + maxVal := uint64(200_000_000) + inc := uint64(prefillBufferSize) + buf := make([]uint64, prefillBufferSize) + + for i := 0; i < b.N; i++ { + finalBM := NewBitmap() + + for i := uint64(0); i <= maxVal; i += inc { + j := uint64(0) + for ; j < inc && i+j <= maxVal; j++ { + buf[j] = i + j + } + finalBM.Or(FromSortedList(buf[:j])) + } + } +} + // ================================================================================ // // BENCHMARKS comparing performance of different merge implementations diff --git a/bitmap_opt.go b/bitmap_opt.go index 8351c31..f00f343 100644 --- a/bitmap_opt.go +++ b/bitmap_opt.go @@ -1,6 +1,7 @@ package sroar import ( + "math" "sync" ) @@ -647,3 +648,86 @@ func andNotSelectedContainers(a, b *Bitmap, ai, an, bi, bn int, containerBuf []u } } } + +func Prefill(maxX uint64) *Bitmap { + maxCard64 := uint64(maxCardinality) + + // maxX should be included, therefore +1 + n := maxX / maxCard64 + rem := maxX % maxCard64 + if rem == maxCard64-1 { + n++ + } + rem = (rem + 1) % maxCard64 + + // create additional container for remaining values (or empty if there are not) + // +1 additional key to avoid keys expanding (there should always be 1 spare) + bm := newBitmapWithSize(int(n)+1+1, maxContainerSize, int(n)*maxContainerSize) + + var refContainer []uint16 + var remOffset = bm.keys.val(0) + + if n > 0 { + refContainer = bm.getContainer(remOffset) + refContainer[indexSize] = maxContainerSize + refContainer[indexType] = typeBitmap + setCardinality(refContainer, maxCardinality) + + // fill entire bitmap container with ones + refContainer64 := uint16To64SliceUnsafe(refContainer[startIdx:]) + for i := range refContainer64 { + refContainer64[i] = math.MaxUint64 + } + + // fill remaining containers by copying reference one + for i := uint64(1); i < n; i++ { + key := (i * maxCard64) & mask + offset := bm.newContainerNoClr(maxContainerSize) + bm.setKey(key, offset) + + copy(bm.data[offset:], refContainer) + } + + // create container for remaining values + key := (n * maxCard64) & mask + remOffset = bm.newContainer(maxContainerSize) + bm.setKey(key, remOffset) + } + + container := bm.getContainer(remOffset) + container[indexSize] = maxContainerSize + container[indexType] = typeBitmap + setCardinality(container, int(rem)) + + if rem > 0 { + n16 := uint16(rem) / 16 + rem16 := uint16(rem) % 16 + + if refContainer != nil { + // refContainer available (maxX >= math.MaxUint16-1), + // fill remaining values container by copying biggest possible slice of refContainer (batches of 16s) + copy(bm.data[remOffset+uint64(startIdx):], refContainer[startIdx:startIdx+n16]) + // set remaining bits + for i := uint16(0); i < rem16; i++ { + container[startIdx+n16] |= bitmapMask[i] + } + } else { + // refContainer not available (maxX < math.MaxUint16-1), + // set bits by copying MaxUint64 first, then MaxUint16, then single bits + n64 := uint16(rem) / 64 + + container64 := uint16To64SliceUnsafe(container[startIdx:]) + for i := uint16(0); i < n64; i++ { + container64[i] = math.MaxUint64 + } + for i := uint16(n64 * 4); i < n16; i++ { + container[startIdx+i] = math.MaxUint16 + } + for i := uint16(0); i < rem16; i++ { + container[startIdx+n16] |= bitmapMask[i] + } + } + } + + return bm +} diff --git a/bitmap_opt_test.go b/bitmap_opt_test.go index 7e45eeb..518b267 100644 --- a/bitmap_opt_test.go +++ b/bitmap_opt_test.go @@ -871,6 +871,28 @@ func TestIssue_Or_NotMergeContainers(t *testing.T) { }) } +func TestPrefill(t *testing.T) { + for _, maxX := range []int{ + 0, 1, + math.MaxInt16, + math.MaxUint16 - 1, math.MaxUint16, math.MaxUint16 + 1, + math.MaxUint16*3 - 1, math.MaxUint16 * 3, math.MaxUint16*3 + 1, + 234_567, + } { + t.Run(fmt.Sprintf("value %d", maxX), func(t *testing.T) { + bm := Prefill(uint64(maxX)) + require.Equal(t, maxX+1, bm.GetCardinality()) + + arr := bm.ToArray() + require.Len(t, arr, maxX+1) + + for i, x := range arr { + require.Equal(t, uint64(i), x) + } + }) + } +} + func TestMergeToSuperset(t *testing.T) { run := func(t *testing.T, bufs [][]uint16) { containerThreshold := uint64(math.MaxUint16 + 1)