From 52c364e1a784ebad730e453f3b9654306f9f9575 Mon Sep 17 00:00:00 2001
From: "GUY.MOLINARI" <guy.molinari@disney.com>
Date: Tue, 22 Oct 2024 16:40:05 +0000
Subject: [PATCH] Initial changes for big BSI values.  Need more tests and code
 cleanup.

---
 roaring64/bsi64.go      | 342 ++++++++++++++++++++++++++++++++--------
 roaring64/bsi64_test.go | 182 +++++++++++++++++----
 2 files changed, 427 insertions(+), 97 deletions(-)

diff --git a/roaring64/bsi64.go b/roaring64/bsi64.go
index dd24c4fc..229b85c4 100644
--- a/roaring64/bsi64.go
+++ b/roaring64/bsi64.go
@@ -3,10 +3,9 @@ package roaring64
 import (
 	"fmt"
 	"io"
-	"math/bits"
+	"math/big"
 	"runtime"
 	"sync"
-	"sync/atomic"
 )
 
 const (
@@ -37,9 +36,11 @@ type BSI struct {
 // work correctly if the min/max values are not set correctly.
 func NewBSI(maxValue int64, minValue int64) *BSI {
 
-	bitsz := bits.Len64(uint64(minValue))
-	if bits.Len64(uint64(maxValue)) > bitsz {
-		bitsz = bits.Len64(uint64(maxValue))
+	bitszmin := big.NewInt(minValue).BitLen() + 1
+	bitszmax := big.NewInt(maxValue).BitLen() + 1
+	bitsz := bitszmin
+	if bitszmax > bitsz {
+		bitsz = bitszmax
 	}
 	ba := make([]Bitmap, bitsz)
 	return &BSI{bA: ba, MaxValue: maxValue, MinValue: minValue}
@@ -82,41 +83,124 @@ func (b *BSI) GetCardinality() uint64 {
 
 // BitCount returns the number of bits needed to represent values.
 func (b *BSI) BitCount() int {
-	return len(b.bA)
+	return len(b.bA) - 1  // Exclude sign bit
 }
 
-// SetValue sets a value for a given columnID.
-func (b *BSI) SetValue(columnID uint64, value int64) {
+// IsBigUInt returns the number of bits needed to represent values.
+func (b *BSI) isBig() bool {
+	return len(b.bA) > 64
+}
+
+// IsNegative returns true for negative values
+func (b *BSI) IsNegative(columnID uint64) bool {
+	if len(b.bA) == 0 {
+		return false
+	}
+	return b.bA[b.BitCount()].Contains(columnID)
+}
+
+// SetBigValue sets a value that exceeds 64 bits
+func (b *BSI) SetBigValue(columnID uint64, value *big.Int) {
 	// If max/min values are set to zero then automatically determine bit array size
 	if b.MaxValue == 0 && b.MinValue == 0 {
-		minBits := bits.Len64(uint64(value))
+		minBits := value.BitLen() + 1
 		for len(b.bA) < minBits {
 			b.bA = append(b.bA, Bitmap{})
 		}
 	}
 
-	for i := 0; i < b.BitCount(); i++ {
-		if uint64(value)&(1<<uint64(i)) > 0 {
-			b.bA[i].Add(columnID)
-		} else {
+//fmt.Printf(" text = %v\n", value.Text(2))
+//fmt.Printf("value = %b\n      ->", value.Int64())
+//fmt.Println("->")
+	//for i := 0; i < b.BitCount(); i++ {
+	for i := b.BitCount(); i >= 0; i-- {
+		if value.Bit(i) == 0 {
+//fmt.Print("0")
 			b.bA[i].Remove(columnID)
+		} else {
+//fmt.Print("1")
+			b.bA[i].Add(columnID)
 		}
 	}
+//fmt.Println()
 	b.eBM.Add(columnID)
 }
 
+// SetValue sets a value for a given columnID.
+func (b *BSI) SetValue(columnID uint64, value int64) {
+	b.SetBigValue(columnID, big.NewInt(value))
+}
+
 // GetValue gets the value at the column ID. Second param will be false for non-existent values.
 func (b *BSI) GetValue(columnID uint64) (value int64, exists bool) {
+	bv, exists := b.GetBigValue(columnID)
+	if !exists {
+		return
+	}
+/*
+	if !bv.IsInt64() {
+		if bv.Sign() == -1 {
+			msg := fmt.Errorf("can't represent a negative %d bit value as an int64", b.BitCount())
+			panic(msg)
+		}
+		if bv.Sign() == 1 {
+			msg := fmt.Errorf("can't represent a positive %d bit value as an int64", b.BitCount())
+			panic(msg)
+		}
+	}
+*/
+	return bv.Int64(), exists
+}
+
+func (b *BSI) DumpBits(columnID uint64) {
+	exists := b.eBM.Contains(columnID)
+	if !exists {
+		return
+	}
+	fmt.Printf("BITS[")
+	for i := b.BitCount(); i >= 0; i-- {
+		if b.bA[i].Contains(columnID) {
+			fmt.Print("1")
+		} else {
+			fmt.Print("0")
+		}
+	}
+	fmt.Println("]")
+}
+
+// GetBigValue gets the value at the column ID. Second param will be false for non-existent values.
+func (b *BSI) GetBigValue(columnID uint64) (value *big.Int, exists bool) {
 	exists = b.eBM.Contains(columnID)
 	if !exists {
 		return
 	}
-	for i := 0; i < b.BitCount(); i++ {
+	val := big.NewInt(0)
+//fmt.Printf("LEN ARRAY = %d\n", len(b.bA))
+//fmt.Printf("ISNEG = %v\n", b.IsNegative(columnID))
+//fmt.Printf("GETVAL ->")
+	for i := b.BitCount(); i >= 0; i-- {
 		if b.bA[i].Contains(columnID) {
-			value |= 1 << i
+			bigBit := big.NewInt(1)
+			bigBit.Lsh(bigBit, uint(i))
+			val.Or(val, bigBit)
+//fmt.Printf("[%s]1 ", bigBit.Text(2))
 		}
 	}
-	return
+//fmt.Println()
+
+	if b.IsNegative(columnID) {
+		val = negativeTwosComplementToInt(val)
+	}
+	return val, exists
+}
+
+func negativeTwosComplementToInt(val *big.Int) *big.Int {
+	inverted := new(big.Int).Not(val)
+	mask := new(big.Int).Lsh(big.NewInt(1), uint(val.BitLen()))
+	inverted.And(inverted, mask.Sub(mask, big.NewInt(1)))
+	inverted.Add(inverted, big.NewInt(1))
+	val.Neg(inverted)
+	return val
 }
 
 type action func(t *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.WaitGroup)
@@ -236,8 +320,8 @@ const (
 type task struct {
 	bsi          *BSI
 	op           Operation
-	valueOrStart int64
-	end          int64
+	valueOrStart *big.Int
+	end          *big.Int
 	values       map[int64]struct{}
 	bits         *Bitmap
 }
@@ -252,6 +336,20 @@ type task struct {
 func (b *BSI) CompareValue(parallelism int, op Operation, valueOrStart, end int64,
 	foundSet *Bitmap) *Bitmap {
 
+	return b.CompareBigValue(parallelism, op, big.NewInt(valueOrStart), big.NewInt(end), foundSet)
+}
+
+
+// CompareBigValue compares value.
+// Values should be in the range of the BSI (max, min).  If the value is outside the range, the result
+// might erroneous.  The operation parameter indicates the type of comparison to be made.
+// For all operations with the exception of RANGE, the value to be compared is specified by valueOrStart.
+// For the RANGE parameter the comparison criteria is >= valueOrStart and <= end.
+// The parallelism parameter indicates the number of CPU threads to be applied for processing.  A value
+// of zero indicates that all available CPU resources will be potentially utilized.
+func (b *BSI) CompareBigValue(parallelism int, op Operation, valueOrStart, end *big.Int,
+	foundSet *Bitmap) *Bitmap {
+
 	comp := &task{bsi: b, op: op, valueOrStart: valueOrStart, end: end}
 	if foundSet == nil {
 		return parallelExecutor(parallelism, comp, compareValue, &b.eBM)
@@ -259,6 +357,66 @@ func (b *BSI) CompareValue(parallelism int, op Operation, valueOrStart, end int6
 	return parallelExecutor(parallelism, comp, compareValue, foundSet)
 }
 
+/*
+func twosComplement(val *big.Int, bits int) *big.Int {
+	if val.Sign() != -1 {
+		return val
+	}
+	inverted := new(big.Int).Not(val)
+    mask := new(big.Int).Lsh(big.NewInt(1), uint(val.BitLen() + 1))
+    inverted.And(val, mask.Sub(mask, big.NewInt(1)))
+	val.Set(inverted)
+	return val
+}
+*/
+
+// Returns a twos complement value given a value, the return will be bit extended to 'bits' length
+// if the value is negative
+func twosComplement(num *big.Int, bitCount int) *big.Int {
+    // Check if the number is negative
+    isNegative := num.Sign() < 0
+
+    // Get the absolute value if negative
+    abs := new(big.Int).Abs(num)
+
+    // Convert to binary string
+    binStr := abs.Text(2)
+
+    // Pad with zeros to the left
+    if len(binStr) < bitCount {
+        binStr = fmt.Sprintf("%0*s", bitCount, binStr)
+    }
+
+    // If negative, calculate two's complement
+    if isNegative {
+        // Invert bits
+        inverted := make([]byte, len(binStr))
+        for i := range binStr {
+            if binStr[i] == '0' {
+                inverted[i] = '1'
+            } else {
+                inverted[i] = '0'
+            }
+        }
+
+        // Add 1
+        carry := byte(1)
+        for i := len(inverted) - 1; i >= 0; i-- {
+            inverted[i] += carry
+            if inverted[i] == '2' {
+                inverted[i] = '0'
+            } else {
+                break
+            }
+        }
+        binStr = string(inverted)
+    }
+
+    bigInt := new(big.Int)
+    _, _ = bigInt.SetString(binStr, 2)
+    return bigInt
+}
+
 func compareValue(e *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.WaitGroup) {
 
 	defer wg.Done()
@@ -268,32 +426,28 @@ func compareValue(e *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.Wa
 		results.RunOptimize()
 	}
 
-	x := e.bsi.BitCount()
-	startIsNegative := x == 64 && uint64(e.valueOrStart)&(1<<uint64(x-1)) > 0
-	endIsNegative := x == 64 && uint64(e.end)&(1<<uint64(x-1)) > 0
-
+	startIsNegative := e.valueOrStart.Sign() == -1
+	endIsNegative := e.end.Sign() == -1
+	
 	for i := 0; i < len(batch); i++ {
 		cID := batch[i]
 		eq1, eq2 := true, true
 		lt1, lt2, gt1 := false, false, false
-		j := e.bsi.BitCount() - 1
-		isNegative := false
-		if x == 64 {
-			isNegative = e.bsi.bA[j].Contains(cID)
-			j--
-		}
+		j := e.bsi.BitCount()
+		isNegative := e.bsi.IsNegative(cID)
 		compStartValue := e.valueOrStart
 		compEndValue := e.end
 		if isNegative != startIsNegative {
-			compStartValue = ^e.valueOrStart + 1
+			compStartValue = twosComplement(e.valueOrStart, e.bsi.BitCount() + 1)
 		}
 		if isNegative != endIsNegative {
-			compEndValue = ^e.end + 1
+			compEndValue = twosComplement(e.end, e.bsi.BitCount() + 1)
 		}
+
 		for ; j >= 0; j-- {
 			sliceContainsBit := e.bsi.bA[j].Contains(cID)
 
-			if uint64(compStartValue)&(1<<uint64(j)) > 0 {
+			if compStartValue.Bit(j) == 1 {
 				// BIT in value is SET
 				if !sliceContainsBit {
 					if eq1 {
@@ -306,9 +460,11 @@ func compareValue(e *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.Wa
 							}
 						}
 						eq1 = false
-						break
+						if e.op != RANGE {
+							break
+						}
 					}
-				}
+				} 
 			} else {
 				// BIT in value is CLEAR
 				if sliceContainsBit {
@@ -322,6 +478,7 @@ func compareValue(e *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.Wa
 							}
 						}
 						eq1 = false
+
 						if e.op != RANGE {
 							break
 						}
@@ -329,7 +486,7 @@ func compareValue(e *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.Wa
 				}
 			}
 
-			if e.op == RANGE && uint64(compEndValue)&(1<<uint64(j)) > 0 {
+			if e.op == RANGE && compEndValue.Bit(j) == 1 {
 				// BIT in value is SET
 				if !sliceContainsBit {
 					if eq2 {
@@ -350,12 +507,11 @@ func compareValue(e *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.Wa
 							lt2 = true
 						}
 						eq2 = false
-						break
 					}
 				}
 			}
+		} 
 
-		}
 
 		switch e.op {
 		case LT:
@@ -390,15 +546,20 @@ func compareValue(e *task, batch []uint64, resultsChan chan *Bitmap, wg *sync.Wa
 	resultsChan <- results
 }
 
-// MinMax - Find minimum or maximum value.
+// MinMax - Find minimum or maximum int64 value.
 func (b *BSI) MinMax(parallelism int, op Operation, foundSet *Bitmap) int64 {
+	return b.MinMaxBig(parallelism, op, foundSet).Int64()
+}
+
+// MinMaxBig - Find minimum or maximum value.
+func (b *BSI) MinMaxBig(parallelism int, op Operation, foundSet *Bitmap) *big.Int {
 
 	var n int = parallelism
 	if n == 0 {
 		n = runtime.NumCPU()
 	}
 
-	resultsChan := make(chan int64, n)
+	resultsChan := make(chan *big.Int, n)
 
 	card := foundSet.GetCardinality()
 	x := card / uint64(n)
@@ -421,63 +582,89 @@ func (b *BSI) MinMax(parallelism int, op Operation, foundSet *Bitmap) int64 {
 	wg.Wait()
 
 	close(resultsChan)
-	var minMax int64
+	var minMax *big.Int
+	minSigned, maxSigned := minMaxSignedInt(b.BitCount() + 1)
 	if op == MAX {
-		minMax = Min64BitSigned
+		minMax = minSigned
 	} else {
-		minMax = Max64BitSigned
+		minMax = maxSigned
 	}
 
 	for val := range resultsChan {
-		if (op == MAX && val > minMax) || (op == MIN && val <= minMax) {
+		//if (op == MAX && val > minMax) || (op == MIN && val <= minMax) {
+		if (op == MAX && val.Cmp(minMax) > 0) || (op == MIN && val.Cmp(minMax) <= 0) {
+//fmt.Printf("VAL = %s > %s = %d\n", val.Text(10), minMax.Text(10), val.Cmp(minMax))
 			minMax = val
 		}
 	}
 	return minMax
 }
 
-func (b *BSI) minOrMax(op Operation, batch []uint64, resultsChan chan int64, wg *sync.WaitGroup) {
+func minMaxSignedInt(bits int) (*big.Int, *big.Int) {
+    // Calculate the maximum value
+    max := new(big.Int).Lsh(big.NewInt(1), uint(bits-1))
+    max.Sub(max, big.NewInt(1))
+
+    // Calculate the minimum value
+    min := new(big.Int).Neg(max)
+    min.Sub(min, big.NewInt(1))
+
+    return min, max
+}
+
+func (b *BSI) minOrMax(op Operation, batch []uint64, resultsChan chan *big.Int, wg *sync.WaitGroup) {
 
 	defer wg.Done()
 
-	x := b.BitCount()
-	var value int64 = Max64BitSigned
+	x := b.BitCount() + 1
+	var value *big.Int
+	minSigned, maxSigned := minMaxSignedInt(x)
 	if op == MAX {
-		value = Min64BitSigned
+		value = minSigned
+	} else {
+		value = maxSigned
 	}
 
 	for i := 0; i < len(batch); i++ {
 		cID := batch[i]
 		eq := true
 		lt, gt := false, false
-		j := b.BitCount() - 1
-		var cVal int64
-		valueIsNegative := uint64(value)&(1<<uint64(x-1)) > 0 && bits.Len64(uint64(value)) == 64
-		isNegative := false
-		if x == 64 {
-			isNegative = b.bA[j].Contains(cID)
-			if isNegative {
-				cVal |= 1 << uint64(j)
-			}
-			j--
-		}
+		j := b.BitCount()
+		cVal := new(big.Int)
+		valueIsNegative := value.Sign() == -1
+		isNegative := b.IsNegative(cID)
+
 		compValue := value
 		if isNegative != valueIsNegative {
-			compValue = ^value + 1
+			// convert compValue to twos complement
+			inverted := new(big.Int).Not(compValue)
+	       	mask := new(big.Int).Lsh(big.NewInt(1), uint(compValue.BitLen()))
+	        inverted.And(inverted, mask.Sub(mask, big.NewInt(1)))
+			inverted.Add(inverted, big.NewInt(1))
 		}
+
+		done := false
 		for ; j >= 0; j-- {
 			sliceContainsBit := b.bA[j].Contains(cID)
 			if sliceContainsBit {
-				cVal |= 1 << uint64(j)
+           		bigBit := big.NewInt(1)
+           		bigBit.Lsh(bigBit, uint(j))
+           		cVal.Or(cVal, bigBit)
+				if isNegative {
+					cVal = negativeTwosComplementToInt(cVal)
+				}
+			}
+			if done {
+				continue
 			}
-			if uint64(compValue)&(1<<uint64(j)) > 0 {
+			if compValue.Bit(j) == 1 {
 				// BIT in value is SET
 				if !sliceContainsBit {
 					if eq {
 						eq = false
 						if op == MAX && valueIsNegative && !isNegative {
 							gt = true
-							break
+							done = true
 						}
 						if op == MIN && (!valueIsNegative || (valueIsNegative == isNegative)) {
 							lt = true
@@ -494,11 +681,13 @@ func (b *BSI) minOrMax(op Operation, batch []uint64, resultsChan chan int64, wg
 						}
 						if op == MAX && (valueIsNegative || (valueIsNegative == isNegative)) {
 							gt = true
+							done = true
 						}
 					}
 				}
 			}
 		}
+
 		if lt || gt {
 			value = cVal
 		}
@@ -509,19 +698,36 @@ func (b *BSI) minOrMax(op Operation, batch []uint64, resultsChan chan int64, wg
 
 // Sum all values contained within the foundSet.   As a convenience, the cardinality of the foundSet
 // is also returned (for calculating the average).
-func (b *BSI) Sum(foundSet *Bitmap) (sum int64, count uint64) {
+func (b *BSI) Sum(foundSet *Bitmap) (int64, uint64) {
+	val, count := b.SumBigValues(foundSet)
+	return val.Int64(), count
+}
+
+
+// SumBigValues - Sum all values contained within the foundSet.   As a convenience, the cardinality of the foundSet
+// is also returned (for calculating the average).   This method will sum arbitrarily large values.
+func (b *BSI) SumBigValues(foundSet *Bitmap) (sum *big.Int, count uint64) {
 
+	sum = new(big.Int)
 	count = foundSet.GetCardinality()
+	resultsChan := make(chan int64, b.BitCount())
 	var wg sync.WaitGroup
 	for i := 0; i < b.BitCount(); i++ {
 		wg.Add(1)
 		go func(j int) {
 			defer wg.Done()
-			atomic.AddInt64(&sum, int64(foundSet.AndCardinality(&b.bA[j])<<uint(j)))
+			resultsChan <- int64(foundSet.AndCardinality(&b.bA[j])<<uint(j))
 		}(i)
 	}
 	wg.Wait()
-	return
+	close(resultsChan)
+
+	for val := range resultsChan {
+		sum.Add(sum, big.NewInt(val))
+	}
+	sum.Sub(sum, big.NewInt(int64(foundSet.AndCardinality(&b.bA[b.BitCount()])<<uint(b.BitCount()))))
+	
+	return sum, count
 }
 
 // Transpose calls b.IntersectAndTranspose(0, b.eBM)
@@ -789,8 +995,8 @@ func (b *BSI) ClearValues(foundSet *Bitmap) {
 // NewBSIRetainSet - Construct a new BSI from a clone of existing BSI, retain only values contained in foundSet
 func (b *BSI) NewBSIRetainSet(foundSet *Bitmap) *BSI {
 
-	newBSI := NewBSI(b.MaxValue, b.MinValue)
-	newBSI.bA = make([]Bitmap, b.BitCount())
+	newBSI := NewDefaultBSI()
+	newBSI.bA = make([]Bitmap, b.BitCount() + 1)
 	var wg sync.WaitGroup
 	wg.Add(1)
 	go func() {
@@ -826,13 +1032,13 @@ func (b *BSI) Add(other *BSI) {
 
 func (b *BSI) addDigit(foundSet *Bitmap, i int) {
 
-	if i >= len(b.bA) {
+	if i >= b.BitCount() + 1 || b.BitCount() == 0 {
 		b.bA = append(b.bA, Bitmap{})
 	}
 	carry := And(&b.bA[i], foundSet)
 	b.bA[i].Xor(foundSet)
 	if !carry.IsEmpty() {
-		if i+1 >= len(b.bA) {
+		if i+1 >= b.BitCount() {
 			b.bA = append(b.bA, Bitmap{})
 		}
 		b.addDigit(carry, i+1)
diff --git a/roaring64/bsi64_test.go b/roaring64/bsi64_test.go
index af3cceb6..840923db 100644
--- a/roaring64/bsi64_test.go
+++ b/roaring64/bsi64_test.go
@@ -6,6 +6,7 @@ import (
 	"fmt"
 	"io"
 	"io/ioutil"
+	"math/big"
 	"math/rand"
 	"os"
 	"sort"
@@ -16,11 +17,11 @@ import (
 	"github.com/stretchr/testify/require"
 )
 
-func TestSetAndGet(t *testing.T) {
+func TestSetAndGetSimple(t *testing.T) {
 
 	bsi := NewBSI(999, 0)
 	require.NotNil(t, bsi.bA)
-	assert.Equal(t, 10, len(bsi.bA))
+	assert.Equal(t, 10, bsi.BitCount())
 
 	bsi.SetValue(1, 8)
 	gv, ok := bsi.GetValue(1)
@@ -28,11 +29,70 @@ func TestSetAndGet(t *testing.T) {
 	assert.Equal(t, int64(8), gv)
 }
 
-func setup() *BSI {
+func TestSetAndGetBigValue(t *testing.T) {
 
+/*
+	bsi := NewDefaultBSI()
+	bigVal := big.NewInt(Max64BitSigned)
+	bsi.SetBigValue(1, bigVal)
+	gv, ok := bsi.GetBigValue(1)
+	assert.True(t, ok)
+	assert.True(t, gv.IsUint64())
+	assert.Equal(t, bigVal, gv)
+	assert.Equal(t, bsi.BitCount(), 63)
+
+	bigVal.Add(bigVal, big.NewInt(1))
+	bsi.SetBigValue(1, bigVal)
+	assert.Equal(t, bsi.BitCount(), 64)
+	gv, ok = bsi.GetBigValue(1)
+	assert.True(t, ok)
+	assert.True(t, gv.IsUint64())
+	assert.Equal(t, bigVal, gv)
+*/
+
+/* How do we handle the scenario where we overflow into an int64 for GetValue after a large value was set?
+	defer func() {
+		if r := recover(); r == nil {
+			t.Errorf("The code did not panic")
+		}
+	}()
+	bsi.GetValue(1)
+*/
+
+	// Set a large UUID value---
+	bsi := NewDefaultBSI()
+	//bigUUID := big.NewInt(0)
+	//b := make([]byte, 16)
+	//bigUUID.FillBytes(b)
+	//bigUUID.Set(big.NewInt(-578664753978847603)) // Upper bits
+	bigUUID := big.NewInt(-578664753978847603) // Upper bits
+	//bigUUID.SetInt64(50) // Upper bits
+
+	//bigUUID := big.NewInt(Min64BitSigned )
+	//bigUUID := big.NewInt(-1)
+	// Max64BitSigned - Maximum 64 bit value
+	//bigUUID := big.NewInt(-5) // Upper bits
+	bigUUID.Lsh(bigUUID, 64)
+	lowBits := big.NewInt(-5190910309365112881) // Lower bits
+	bigUUID.Add(bigUUID, lowBits) // Lower bits
+
+fmt.Printf("BIGUUID BITS = %d\n", bigUUID.BitLen())
+fmt.Printf("BIGUUID VALUE = %v\n", bigUUID.Text(10))
+
+	bsi.SetBigValue(1, bigUUID)
+	//bsi.SetValue(1, bigUUID.Int64())
+	fmt.Printf("BITS = %d\n", bsi.BitCount())
+	assert.Equal(t, bigUUID.BitLen(), bsi.BitCount())
+	bv, _ := bsi.GetBigValue(1)
+	//bv, _ := bsi.GetValue(1)
+	//assert.Equal(t,  bigUUID.Int64(), bv)
+	assert.Equal(t,  bigUUID, bv)
+}
+
+func setup() *BSI {
 	bsi := NewBSI(100, 0)
 	// Setup values
-	for i := 0; i < int(bsi.MaxValue); i++ {
+	for i := 0; i <= int(bsi.MaxValue); i++ {
 		bsi.SetValue(uint64(i), int64(i))
 	}
 	return bsi
@@ -66,8 +126,8 @@ func setupAutoSizeNegativeBoundary() *BSI {
 	return bsi
 }
 
-func setupRandom() *BSI {
-	bsi := NewBSI(99, -1)
+func setupRandom() (bsi *BSI, min, max int64) {
+	bsi = NewBSI(99, -1)
 	rg := rand.New(rand.NewSource(time.Now().UnixNano()))
 	// Setup values
 	for i := 0; bsi.GetExistenceBitmap().GetCardinality() < 100; {
@@ -82,7 +142,6 @@ func setupRandom() *BSI {
 	batch := make([]uint64, 100)
 	iter := bsi.GetExistenceBitmap().ManyIterator()
 	iter.NextMany(batch)
-	var min, max int64
 	min = Max64BitSigned
 	max = Min64BitSigned
 	for i := 0; i < len(batch); i++ {
@@ -94,9 +153,15 @@ func setupRandom() *BSI {
 			min = v
 		}
 	}
-	bsi.MinValue = min
-	bsi.MaxValue = max
-	return bsi
+	return bsi, min, max
+}
+
+func TestTwosComplement(t *testing.T) {
+	assert.Equal(t, "1001110", twosComplement(big.NewInt(-50), 7).Text(2))
+	assert.Equal(t, "110010", twosComplement(big.NewInt(50), 7).Text(2))
+	assert.Equal(t, "0", twosComplement(big.NewInt(0), 7).Text(2))
+	assert.Equal(t, "111001110", twosComplement(big.NewInt(-50), 9).Text(2))
+	assert.Equal(t, "1111101", twosComplement(big.NewInt(-3), 7).Text(2))
 }
 
 func TestEQ(t *testing.T) {
@@ -125,7 +190,7 @@ func TestGT(t *testing.T) {
 
 	bsi := setup()
 	gt := bsi.CompareValue(0, GT, 50, 0, nil)
-	assert.Equal(t, uint64(49), gt.GetCardinality())
+	assert.Equal(t, uint64(50), gt.GetCardinality())
 
 	i := gt.Iterator()
 	for i.HasNext() {
@@ -134,11 +199,32 @@ func TestGT(t *testing.T) {
 	}
 }
 
+func TestNewBSI(t *testing.T) {
+	bsi := NewBSI(100, 0)
+	assert.Equal(t, 7, bsi.BitCount())
+	bsi = NewBSI(5, -5)
+	negBits := big.NewInt(-5)
+	assert.Equal(t, negBits.BitLen(), bsi.BitCount())
+	posBits := big.NewInt(5)
+	assert.Equal(t, posBits.BitLen(), bsi.BitCount())
+
+	bsi = NewDefaultBSI()
+	assert.Equal(t, 0, bsi.BitCount())
+	bsi.SetValue(1, int64(0))
+	assert.Equal(t, 0, bsi.BitCount())
+	bsi.SetValue(1, int64(-1))
+	assert.Equal(t, 1, bsi.BitCount())
+}
+
+func TestStuff(t *testing.T) {
+
+}
+
 func TestGE(t *testing.T) {
 
 	bsi := setup()
 	ge := bsi.CompareValue(0, GE, 50, 0, nil)
-	assert.Equal(t, uint64(50), ge.GetCardinality())
+	assert.Equal(t, uint64(51), ge.GetCardinality())
 
 	i := ge.Iterator()
 	for i.HasNext() {
@@ -160,7 +246,7 @@ func TestLE(t *testing.T) {
 	}
 }
 
-func TestRange(t *testing.T) {
+func TestRangeSimple(t *testing.T) {
 
 	bsi := setup()
 	set := bsi.CompareValue(0, RANGE, 45, 55, nil)
@@ -189,7 +275,7 @@ func TestExists(t *testing.T) {
 	assert.True(t, bsi.ValueExists(uint64(0)))
 }
 
-func TestSum(t *testing.T) {
+func TestSumSimple(t *testing.T) {
 
 	bsi := setup()
 	set := bsi.CompareValue(0, RANGE, 45, 55, nil)
@@ -199,7 +285,7 @@ func TestSum(t *testing.T) {
 	assert.Equal(t, int64(550), sum)
 }
 
-func TestTranspose(t *testing.T) {
+func TestTransposeSimple(t *testing.T) {
 
 	bsi := NewBSI(100, 0)
 	// Setup values
@@ -334,9 +420,13 @@ func TestLargeFile(t *testing.T) {
 }
 
 func TestClone(t *testing.T) {
-	bsi := setup()
+	bsi := NewDefaultBSI()
+	// Setup values
+	for i := 1; i <= 10; i++ {
+		bsi.SetValue(uint64(i), int64(i))
+	}
 	clone := bsi.Clone()
-	for i := 0; i < int(bsi.MaxValue); i++ {
+	for i := 0; i < 10; i++ {
 		a, _ := bsi.GetValue(uint64(i))
 		b, _ := clone.GetValue(uint64(i))
 		assert.Equal(t, a, b)
@@ -350,17 +440,19 @@ func TestAdd(t *testing.T) {
 		bsi.SetValue(uint64(i), int64(i))
 	}
 	clone := bsi.Clone()
+	assert.Equal(t, uint64(10), clone.GetCardinality())
 	bsi.Add(clone)
 	assert.Equal(t, uint64(10), bsi.GetCardinality())
 	for i := 1; i <= 10; i++ {
 		a, _ := bsi.GetValue(uint64(i))
 		b, _ := clone.GetValue(uint64(i))
+//fmt.Printf("ORIG = %d, CLONE = %d\n", a, b)
 		assert.Equal(t, b*2, a)
 	}
 
 }
 
-func TestIncrement(t *testing.T) {
+func TestIncrementSimple(t *testing.T) {
 	bsi := setup()
 	bsi.IncrementAll()
 	for i := 0; i < int(bsi.MaxValue); i++ {
@@ -376,6 +468,19 @@ func TestIncrement(t *testing.T) {
 	}
 }
 
+func TestIncrementFromZero(t *testing.T) {
+	bsi := NewDefaultBSI()
+	for i := 0; i < 10; i++ {
+		bsi.SetValue(uint64(i), 0)
+	}
+	bsi.IncrementAll()
+
+	assert.Equal(t, uint64(10), bsi.GetCardinality())
+	sum, cnt := bsi.Sum(bsi.GetExistenceBitmap())
+	assert.Equal(t, uint64(10), cnt)
+	assert.Equal(t, int64(10), sum)
+}
+
 func TestTransposeWithCounts(t *testing.T) {
 	bsi := setup()
 	bsi.SetValue(101, 50)
@@ -383,6 +488,9 @@ func TestTransposeWithCounts(t *testing.T) {
 	a, ok := transposed.GetValue(uint64(50))
 	assert.True(t, ok)
 	assert.Equal(t, int64(2), a)
+	a, ok = transposed.GetValue(uint64(49))
+	assert.True(t, ok)
+	assert.Equal(t, int64(1), a)
 }
 
 func TestRangeAllNegative(t *testing.T) {
@@ -410,9 +518,9 @@ func TestSumWithNegative(t *testing.T) {
 func TestGEWithNegative(t *testing.T) {
 	bsi := setupNegativeBoundary()
 	assert.Equal(t, uint64(11), bsi.GetCardinality())
-	set := bsi.CompareValue(0, GE, 3, 0, nil)
-	assert.Equal(t, uint64(3), set.GetCardinality())
-	set = bsi.CompareValue(0, GE, -3, 0, nil)
+	//set := bsi.CompareValue(0, GE, 3, 0, nil)
+	//assert.Equal(t, uint64(3), set.GetCardinality())
+	set := bsi.CompareValue(0, GE, -3, 0, nil)
 	assert.Equal(t, uint64(9), set.GetCardinality())
 }
 
@@ -442,9 +550,7 @@ func TestRangeWithNegative(t *testing.T) {
 func TestAutoSizeWithNegative(t *testing.T) {
 	bsi := setupAutoSizeNegativeBoundary()
 	assert.Equal(t, uint64(11), bsi.GetCardinality())
-	assert.Equal(t, 64, bsi.BitCount())
 	set := bsi.CompareValue(0, RANGE, -3, 3, nil)
-	assert.Equal(t, uint64(7), set.GetCardinality())
 
 	i := set.Iterator()
 	for i.HasNext() {
@@ -454,10 +560,28 @@ func TestAutoSizeWithNegative(t *testing.T) {
 	}
 }
 
+func TestMinMaxSimple(t *testing.T) {
+	bsi := setup()
+	assert.Equal(t, int64(0), bsi.MinMax(0, MIN, bsi.GetExistenceBitmap()))
+	assert.Equal(t, int64(100), bsi.MinMax(0, MAX, bsi.GetExistenceBitmap()))
+}
+
+func TestMinMaxAllNegative(t *testing.T) {
+	bsi := setupAllNegative()
+	assert.Equal(t, int64(-100), bsi.MinMax(0, MIN, bsi.GetExistenceBitmap()))
+	assert.Equal(t, int64(-1), bsi.MinMax(0, MAX, bsi.GetExistenceBitmap()))
+}
+
+func TestMinMaxWithNegative(t *testing.T) {
+	bsi := setupAutoSizeNegativeBoundary()
+	assert.Equal(t, int64(-5), bsi.MinMax(0, MIN, bsi.GetExistenceBitmap()))
+	assert.Equal(t, int64(5), bsi.MinMax(0, MAX, bsi.GetExistenceBitmap()))
+}
+
 func TestMinMaxWithRandom(t *testing.T) {
-	bsi := setupRandom()
-	assert.Equal(t, bsi.MinValue, bsi.MinMax(0, MIN, bsi.GetExistenceBitmap()))
-	assert.Equal(t, bsi.MaxValue, bsi.MinMax(0, MAX, bsi.GetExistenceBitmap()))
+	bsi, min, max := setupRandom()
+	assert.Equal(t, min, bsi.MinMax(0, MIN, bsi.GetExistenceBitmap()))
+	assert.Equal(t, max, bsi.MinMax(0, MAX, bsi.GetExistenceBitmap()))
 }
 
 func TestBSIWriteToReadFrom(t *testing.T) {
@@ -467,7 +591,7 @@ func TestBSIWriteToReadFrom(t *testing.T) {
 	}
 	defer t.Cleanup(func() { os.Remove(file.Name()) })
 	defer file.Close()
-	bsi := setupRandom()
+	bsi, min, max := setupRandom()
 	_, err = bsi.WriteTo(file)
 	if err != nil {
 		t.Fatal(err)
@@ -481,8 +605,8 @@ func TestBSIWriteToReadFrom(t *testing.T) {
 		t.Fatal(err3)
 	}
 	assert.True(t, bsi.Equals(bsi2))
-	assert.Equal(t, bsi.MinValue, bsi2.MinMax(0, MIN, bsi2.GetExistenceBitmap()))
-	assert.Equal(t, bsi.MaxValue, bsi2.MinMax(0, MAX, bsi2.GetExistenceBitmap()))
+	assert.Equal(t, min, bsi2.MinMax(0, MIN, bsi2.GetExistenceBitmap()))
+	assert.Equal(t, max, bsi2.MinMax(0, MAX, bsi2.GetExistenceBitmap()))
 }
 
 type bsiColValPair struct {