2021-08-20 08:12:52 +00:00
|
|
|
package bptree
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
// ItemKey is the key type stored in a BpNode. Within this file keys are
// ordered and matched through their Less and Equals methods.
type ItemKey Hashable
|
2021-08-21 22:52:17 +00:00
|
|
|
// ItemValue is the value type stored next to each key in a leaf BpNode.
type ItemValue Equatable
|
2021-08-23 01:19:26 +00:00
|
|
|
// PersistFunc is the signature of a callback that receives a node and reports
// an error.
// NOTE(review): presumably called when a node has to be saved; the call site
// is not visible in this part of the file -- confirm.
type PersistFunc func(node *BpNode) error
|
|
|
|
// DestroyFunc is the signature of a callback that receives a node and reports
// an error.
// NOTE(review): presumably called when a node is discarded; the call site is
// not visible in this part of the file -- confirm.
type DestroyFunc func(node *BpNode) error
|
|
|
|
|
|
|
|
var (
|
|
|
|
PersistFn PersistFunc
|
|
|
|
DestroyFn DestroyFunc
|
|
|
|
)
|
2021-08-21 22:52:17 +00:00
|
|
|
|
2021-08-20 08:12:52 +00:00
|
|
|
type BpNode struct {
|
2021-08-23 01:19:26 +00:00
|
|
|
keys []ItemKey
|
|
|
|
values []ItemValue
|
|
|
|
pointers []*BpNode
|
|
|
|
next *BpNode
|
|
|
|
prev *BpNode
|
|
|
|
protoNodeId int64
|
|
|
|
protoNode *ProtoNode
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func NewInternal(size int) *BpNode {
|
|
|
|
if size < 0 {
|
|
|
|
panic(NegativeSize())
|
|
|
|
}
|
|
|
|
return &BpNode{
|
2021-08-23 01:19:26 +00:00
|
|
|
keys: make([]ItemKey, 0, size),
|
|
|
|
pointers: make([]*BpNode, 0, size),
|
|
|
|
protoNodeId: GetProtoNodeId(),
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-09-18 08:29:47 +00:00
|
|
|
func NewLeaf(size int) *BpNode {
|
2021-08-20 08:12:52 +00:00
|
|
|
if size < 0 {
|
|
|
|
panic(NegativeSize())
|
|
|
|
}
|
|
|
|
return &BpNode{
|
2021-08-23 01:19:26 +00:00
|
|
|
keys: make([]ItemKey, 0, size),
|
|
|
|
values: make([]ItemValue, 0, size),
|
|
|
|
protoNodeId: GetProtoNodeId(),
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) Full() bool {
|
|
|
|
return len(self.keys) == cap(self.keys)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) Pure() bool {
|
|
|
|
if len(self.keys) == 0 {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
k0 := self.keys[0]
|
|
|
|
for _, k := range self.keys {
|
|
|
|
if !k0.Equals(k) {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) Internal() bool {
|
|
|
|
return cap(self.pointers) > 0
|
|
|
|
}
|
|
|
|
|
2021-09-18 08:29:47 +00:00
|
|
|
func (self *BpNode) Len() int {
|
|
|
|
return len(self.keys)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) Capacity() int {
|
2021-08-20 08:12:52 +00:00
|
|
|
return cap(self.keys)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) Height() int {
|
|
|
|
if !self.Internal() {
|
|
|
|
return 1
|
|
|
|
} else if len(self.pointers) == 0 {
|
|
|
|
panic(BpTreeError("Internal node has no pointers but asked for height"))
|
|
|
|
}
|
|
|
|
return self.pointers[0].Height() + 1
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) has(key ItemKey) bool {
|
2021-08-20 08:12:52 +00:00
|
|
|
_, has := self.find(key)
|
|
|
|
return has
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) left_most_leaf() *BpNode {
|
|
|
|
if self.Internal() {
|
|
|
|
return self.pointers[0].left_most_leaf()
|
|
|
|
}
|
|
|
|
return self
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) right_most_leaf() *BpNode {
|
|
|
|
if self.Internal() {
|
|
|
|
return self.pointers[len(self.pointers)-1].right_most_leaf()
|
|
|
|
}
|
|
|
|
return self
|
|
|
|
}
|
|
|
|
|
|
|
|
/* returns the index and leaf-block of the first key greater than or equal to
|
|
|
|
* the search key. (unless the search key is greater than all the keys in the
|
|
|
|
* tree, in that case it will be the last key in the tree)
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) get_start(key ItemKey) (i int, leaf *BpNode) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Internal() {
|
|
|
|
return self.internal_get_start(key)
|
|
|
|
} else {
|
|
|
|
return self.leaf_get_start(key)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func next_location(i int, leaf *BpNode) (int, *BpNode, bool) {
|
|
|
|
j := i + 1
|
2021-08-21 01:50:16 +00:00
|
|
|
for j >= len(leaf.keys) && leaf.getNext() != nil {
|
2021-08-20 08:12:52 +00:00
|
|
|
j = 0
|
2021-08-21 01:50:16 +00:00
|
|
|
leaf = leaf.getNext()
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
if j >= len(leaf.keys) {
|
|
|
|
return -1, nil, true
|
|
|
|
}
|
|
|
|
return j, leaf, false
|
|
|
|
}
|
|
|
|
|
|
|
|
func prev_location(i int, leaf *BpNode) (int, *BpNode, bool) {
|
|
|
|
j := i - 1
|
2021-08-21 01:50:16 +00:00
|
|
|
for j < 0 && leaf.getPrev() != nil {
|
|
|
|
leaf = leaf.getPrev()
|
2021-08-20 08:12:52 +00:00
|
|
|
j = len(leaf.keys) - 1
|
|
|
|
}
|
|
|
|
if j < 0 {
|
|
|
|
return -1, nil, true
|
|
|
|
}
|
|
|
|
return j, leaf, false
|
|
|
|
}
|
|
|
|
|
|
|
|
/* returns the index and leaf-block of the last key equal to the search key or
|
|
|
|
* the first key greater than the search key. (unless the search key is greater
|
|
|
|
* than all the keys in the tree, in that case it will be the last key in the
|
|
|
|
* tree)
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) get_end(key ItemKey) (i int, leaf *BpNode) {
|
2021-08-20 08:12:52 +00:00
|
|
|
end := false
|
|
|
|
i, leaf = self.get_start(key)
|
|
|
|
pi, pleaf := i, leaf
|
|
|
|
for !end && leaf.keys[i].Equals(key) {
|
|
|
|
pi, pleaf = i, leaf
|
|
|
|
i, leaf, end = next_location(i, leaf)
|
|
|
|
}
|
|
|
|
return pi, pleaf
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) internal_get_start(key ItemKey) (i int, leaf *BpNode) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if !self.Internal() {
|
|
|
|
panic(BpTreeError("Expected a internal node"))
|
|
|
|
}
|
|
|
|
i, has := self.find(key)
|
|
|
|
if !has && i > 0 {
|
|
|
|
// if it doesn't have it and the index > 0 then we have the next block
|
|
|
|
// so we have to subtract one from the index.
|
|
|
|
i--
|
|
|
|
}
|
|
|
|
child := self.pointers[i]
|
|
|
|
return child.get_start(key)
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) leaf_get_start(key ItemKey) (i int, leaf *BpNode) {
|
2021-08-20 08:12:52 +00:00
|
|
|
i, has := self.find(key)
|
|
|
|
if i >= len(self.keys) && i > 0 {
|
|
|
|
i = len(self.keys) - 1
|
|
|
|
}
|
2021-08-21 01:50:16 +00:00
|
|
|
if !has && (len(self.keys) == 0 || self.keys[i].Less(key)) && self.getNext() != nil {
|
|
|
|
return self.getNext().leaf_get_start(key)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
return i, self
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This puts the k/v pair into the B+Tree rooted at this node and returns the
|
|
|
|
* (possibly) new root of the tree.
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) put(key ItemKey, value ItemValue) (root *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
a, b, err := self.insert(key, value)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
} else if b == nil {
|
|
|
|
return a, nil
|
|
|
|
}
|
|
|
|
// else we have root split
|
2021-09-18 08:29:47 +00:00
|
|
|
root = NewInternal(self.Capacity())
|
2021-08-20 08:12:52 +00:00
|
|
|
root.put_kp(a.keys[0], a)
|
|
|
|
root.put_kp(b.keys[0], b)
|
2021-08-23 01:19:26 +00:00
|
|
|
return root, root.persist()
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// right is only set on split
|
|
|
|
// left is always set. When split is false left is the pointer to block
|
|
|
|
// When split is true left is the pointer to the new left
|
|
|
|
// block
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) insert(key ItemKey, value ItemValue) (a, b *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Internal() {
|
|
|
|
return self.internal_insert(key, value)
|
|
|
|
} else { // leaf node
|
|
|
|
return self.leaf_insert(key, value)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* - first find the child to insert into
|
|
|
|
* - do the child insert
|
|
|
|
* - if there was a split:
|
|
|
|
* - if the block is full, split this block
|
|
|
|
* - else insert the new key/pointer into this block
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) internal_insert(key ItemKey, value ItemValue) (a, b *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if !self.Internal() {
|
|
|
|
return nil, nil, BpTreeError("Expected a internal node")
|
|
|
|
}
|
|
|
|
i, has := self.find(key)
|
|
|
|
if !has && i > 0 {
|
|
|
|
// if it doesn't have it and the index > 0 then we have the next block
|
|
|
|
// so we have to subtract one from the index.
|
|
|
|
i--
|
|
|
|
}
|
|
|
|
child := self.pointers[i]
|
|
|
|
p, q, err := child.insert(key, value)
|
|
|
|
if err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
self.keys[i] = p.keys[0]
|
|
|
|
self.pointers[i] = p
|
|
|
|
if q != nil {
|
|
|
|
// we had a split
|
|
|
|
if self.Full() {
|
|
|
|
return self.internal_split(q.keys[0], q)
|
|
|
|
} else {
|
|
|
|
if err := self.put_kp(q.keys[0], q); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return self, nil, self.persist()
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return self, nil, self.maybePersist(child != p)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* On split
|
|
|
|
* - first assert that the key to be inserted is not already in the block.
|
|
|
|
* - Make a new block
|
|
|
|
* - balance the two blocks.
|
|
|
|
* - insert the new key/pointer combo into the correct block
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) internal_split(key ItemKey, ptr *BpNode) (a, b *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if !self.Internal() {
|
|
|
|
return nil, nil, BpTreeError("Expected a internal node")
|
|
|
|
}
|
|
|
|
if self.has(key) {
|
|
|
|
return nil, nil, BpTreeError("Tried to split an internal block on duplicate key")
|
|
|
|
}
|
|
|
|
a = self
|
2021-09-18 08:29:47 +00:00
|
|
|
b = NewInternal(self.Capacity())
|
|
|
|
balance_nodes(a, b, key)
|
|
|
|
if b.Len() > 0 && key.Less(b.keys[0]) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if err := a.put_kp(key, ptr); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if err := b.put_kp(key, ptr); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return a, b, persist(a, b)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* if the leaf is full then it will defer to a leaf_split
|
|
|
|
* (but in one case that will not actually split in the case of a insert into
|
|
|
|
* a pure block with a matching key)
|
|
|
|
* else this leaf will get a new entry.
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) leaf_insert(key ItemKey, value ItemValue) (a, b *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Internal() {
|
|
|
|
return nil, nil, BpTreeError("Expected a leaf node")
|
|
|
|
}
|
2021-09-18 08:29:47 +00:00
|
|
|
if true { // no_dup = true
|
2021-08-21 22:13:13 +00:00
|
|
|
i, has := self.find(key)
|
|
|
|
if has {
|
|
|
|
self.values[i] = value
|
2021-08-23 01:19:26 +00:00
|
|
|
return self, nil, self.persist()
|
2021-08-21 22:13:13 +00:00
|
|
|
}
|
|
|
|
}
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Full() {
|
|
|
|
return self.leaf_split(key, value)
|
|
|
|
} else {
|
|
|
|
if err := self.put_kv(key, value); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return self, nil, self.persist()
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* on leaf split if the block is pure then it will defer to pure_leaf_split
|
|
|
|
* else
|
|
|
|
* - a new block will be made and inserted after this one
|
|
|
|
* - the two blocks will be balanced with balanced_nodes
|
|
|
|
* - if the key is less than b.keys[0] it will go in a else b
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) leaf_split(key ItemKey, value ItemValue) (a, b *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Internal() {
|
|
|
|
return nil, nil, BpTreeError("Expected a leaf node")
|
|
|
|
}
|
|
|
|
if self.Pure() {
|
|
|
|
return self.pure_leaf_split(key, value)
|
|
|
|
}
|
|
|
|
a = self
|
2021-09-18 08:29:47 +00:00
|
|
|
b = NewLeaf(self.Capacity())
|
2021-08-21 01:50:16 +00:00
|
|
|
insert_linked_list_node(b, a, a.getNext())
|
2021-09-18 08:29:47 +00:00
|
|
|
balance_nodes(a, b, key)
|
|
|
|
if b.Len() > 0 && key.Less(b.keys[0]) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if err := a.put_kv(key, value); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if err := b.put_kv(key, value); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return a, b, persist(a, b)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* a pure leaf split has two cases:
|
|
|
|
* 1) the inserted key is less than the current pure block.
|
|
|
|
* - a new block should be created before the current block
|
|
|
|
* - the key should be put in it
|
|
|
|
* 2) the inserted key is greater than or equal to the pure block.
|
|
|
|
* - the end of run of pure blocks should be found
|
|
|
|
* - if the key is equal to pure block and the last block is not full insert
|
|
|
|
* the new kv
|
|
|
|
* - else split by making a new block after the last block in the run
|
|
|
|
* and putting the new key there.
|
|
|
|
* - always return the current block as "a" and the new block as "b"
|
|
|
|
*/
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) pure_leaf_split(key ItemKey, value ItemValue) (a, b *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Internal() || !self.Pure() {
|
|
|
|
return nil, nil, BpTreeError("Expected a pure leaf node")
|
|
|
|
}
|
|
|
|
if key.Less(self.keys[0]) {
|
2021-09-18 08:29:47 +00:00
|
|
|
a = NewLeaf(self.Capacity())
|
2021-08-20 08:12:52 +00:00
|
|
|
b = self
|
|
|
|
if err := a.put_kv(key, value); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
2021-08-21 01:50:16 +00:00
|
|
|
insert_linked_list_node(a, b.getPrev(), b)
|
2021-08-23 01:19:26 +00:00
|
|
|
return a, b, persist(a, b)
|
2021-08-20 08:12:52 +00:00
|
|
|
} else {
|
|
|
|
a = self
|
|
|
|
e := self.find_end_of_pure_run()
|
|
|
|
if e.keys[0].Equals(key) && !e.Full() {
|
|
|
|
if err := e.put_kv(key, value); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return a, nil, a.persist()
|
2021-08-20 08:12:52 +00:00
|
|
|
} else {
|
2021-09-18 08:29:47 +00:00
|
|
|
b = NewLeaf(self.Capacity())
|
2021-08-20 08:12:52 +00:00
|
|
|
if err := b.put_kv(key, value); err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
2021-08-21 01:50:16 +00:00
|
|
|
insert_linked_list_node(b, e, e.getNext())
|
2021-08-20 08:12:52 +00:00
|
|
|
if e.keys[0].Equals(key) {
|
|
|
|
return a, nil, nil
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return a, b, persist(a, b)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) put_kp(key ItemKey, ptr *BpNode) error {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Full() {
|
|
|
|
return BpTreeError("Block is full.")
|
|
|
|
}
|
|
|
|
if !self.Internal() {
|
|
|
|
return BpTreeError("Expected a internal node")
|
|
|
|
}
|
|
|
|
i, has := self.find(key)
|
|
|
|
if has {
|
|
|
|
return BpTreeError("Tried to insert a duplicate key into an internal node")
|
|
|
|
} else if i < 0 {
|
|
|
|
panic(BpTreeError("find returned a negative int"))
|
|
|
|
} else if i >= cap(self.keys) {
|
|
|
|
panic(BpTreeError("find returned a int > than cap(keys)"))
|
|
|
|
}
|
|
|
|
if err := self.put_key_at(i, key); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err := self.put_pointer_at(i, ptr); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) put_kv(key ItemKey, value ItemValue) error {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Full() {
|
|
|
|
return BpTreeError("Block is full.")
|
|
|
|
}
|
|
|
|
if self.Internal() {
|
|
|
|
return BpTreeError("Expected a leaf node")
|
|
|
|
}
|
|
|
|
i, _ := self.find(key)
|
|
|
|
if i < 0 {
|
|
|
|
panic(BpTreeError("find returned a negative int"))
|
|
|
|
} else if i >= cap(self.keys) {
|
|
|
|
panic(BpTreeError("find returned a int > than cap(keys)"))
|
|
|
|
}
|
|
|
|
if err := self.put_key_at(i, key); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if err := self.put_value_at(i, value); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) put_key_at(i int, key ItemKey) error {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Full() {
|
|
|
|
return BpTreeError("Block is full.")
|
|
|
|
}
|
|
|
|
self.keys = self.keys[:len(self.keys)+1]
|
|
|
|
for j := len(self.keys) - 1; j > i; j-- {
|
|
|
|
self.keys[j] = self.keys[j-1]
|
|
|
|
}
|
|
|
|
self.keys[i] = key
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:52:17 +00:00
|
|
|
func (self *BpNode) put_value_at(i int, value ItemValue) error {
|
2021-08-20 08:12:52 +00:00
|
|
|
if len(self.values) == cap(self.values) {
|
|
|
|
return BpTreeError("Block is full.")
|
|
|
|
}
|
|
|
|
if self.Internal() {
|
|
|
|
return BpTreeError("Expected a leaf node")
|
|
|
|
}
|
|
|
|
self.values = self.values[:len(self.values)+1]
|
|
|
|
for j := len(self.values) - 1; j > i; j-- {
|
|
|
|
self.values[j] = self.values[j-1]
|
|
|
|
}
|
|
|
|
self.values[i] = value
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) put_pointer_at(i int, pointer *BpNode) error {
|
|
|
|
if len(self.pointers) == cap(self.pointers) {
|
|
|
|
return BpTreeError("Block is full.")
|
|
|
|
}
|
|
|
|
if !self.Internal() {
|
|
|
|
return BpTreeError("Expected a internal node")
|
|
|
|
}
|
|
|
|
self.pointers = self.pointers[:len(self.pointers)+1]
|
|
|
|
for j := len(self.pointers) - 1; j > i; j-- {
|
|
|
|
self.pointers[j] = self.pointers[j-1]
|
|
|
|
}
|
|
|
|
self.pointers[i] = pointer
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) remove(key ItemKey, where WhereFunc) (a *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Internal() {
|
|
|
|
return self.internal_remove(key, nil, where)
|
|
|
|
} else {
|
|
|
|
return self.leaf_remove(key, self.keys[len(self.keys)-1], where)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) internal_remove(key ItemKey, sibling *BpNode, where WhereFunc) (a *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if !self.Internal() {
|
|
|
|
panic(BpTreeError("Expected a internal node"))
|
|
|
|
}
|
|
|
|
i, has := self.find(key)
|
|
|
|
if !has && i > 0 {
|
|
|
|
// if it doesn't have it and the index > 0 then we have the next block
|
|
|
|
// so we have to subtract one from the index.
|
|
|
|
i--
|
|
|
|
}
|
|
|
|
if i+1 < len(self.keys) {
|
|
|
|
sibling = self.pointers[i+1]
|
|
|
|
} else if sibling != nil {
|
|
|
|
sibling = sibling.left_most_leaf()
|
|
|
|
}
|
|
|
|
child := self.pointers[i]
|
2021-08-23 01:19:26 +00:00
|
|
|
oldChild := child
|
2021-08-20 08:12:52 +00:00
|
|
|
if child.Internal() {
|
|
|
|
child, err = child.internal_remove(key, sibling, where)
|
|
|
|
} else {
|
|
|
|
if sibling == nil {
|
|
|
|
child, err = child.leaf_remove(key, nil, where)
|
|
|
|
} else {
|
|
|
|
child, err = child.leaf_remove(key, sibling.keys[0], where)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if child == nil {
|
|
|
|
if err := self.remove_key_at(i); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if err := self.remove_ptr_at(i); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
self.keys[i] = child.keys[0]
|
|
|
|
self.pointers[i] = child
|
|
|
|
}
|
|
|
|
if len(self.keys) == 0 {
|
2021-08-23 01:19:26 +00:00
|
|
|
return nil, self.destroy()
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
return self, self.maybePersist(oldChild != child)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) leaf_remove(key, stop ItemKey, where WhereFunc) (a *BpNode, err error) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if self.Internal() {
|
|
|
|
return nil, BpTreeError("Expected a leaf node")
|
|
|
|
}
|
|
|
|
a = self
|
2021-08-23 01:19:26 +00:00
|
|
|
hasChange := false
|
2021-08-20 08:12:52 +00:00
|
|
|
for j, l, next := self.forward(key, key)(); next != nil; j, l, next = next() {
|
|
|
|
if where(l.values[j]) {
|
2021-08-23 01:19:26 +00:00
|
|
|
hasChange = true
|
2021-08-20 08:12:52 +00:00
|
|
|
if err := l.remove_key_at(j); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if err := l.remove_value_at(j); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(l.keys) == 0 {
|
|
|
|
remove_linked_list_node(l)
|
2021-08-21 01:50:16 +00:00
|
|
|
if l.getNext() == nil {
|
2021-08-20 08:12:52 +00:00
|
|
|
a = nil
|
|
|
|
} else if stop == nil {
|
|
|
|
a = nil
|
2021-08-21 01:50:16 +00:00
|
|
|
} else if !l.getNext().keys[0].Equals(stop) {
|
|
|
|
a = l.getNext()
|
2021-08-20 08:12:52 +00:00
|
|
|
} else {
|
|
|
|
a = nil
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
if err := l.destroy(); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
2021-08-23 01:19:26 +00:00
|
|
|
if a != nil {
|
|
|
|
return a, a.maybePersist(hasChange)
|
|
|
|
}
|
2021-08-20 08:12:52 +00:00
|
|
|
return a, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) remove_key_at(i int) error {
|
|
|
|
if i >= len(self.keys) || i < 0 {
|
|
|
|
return BpTreeError("i, %v, is out of bounds, %v, %v %v.", i, len(self.keys), len(self.values), self)
|
|
|
|
}
|
|
|
|
for j := i; j < len(self.keys)-1; j++ {
|
|
|
|
self.keys[j] = self.keys[j+1]
|
|
|
|
}
|
|
|
|
self.keys = self.keys[:len(self.keys)-1]
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) remove_value_at(i int) error {
|
|
|
|
if i >= len(self.values) || i < 0 {
|
|
|
|
return BpTreeError("i, %v, is out of bounds, %v.", i, len(self.values))
|
|
|
|
}
|
|
|
|
for j := i; j < len(self.values)-1; j++ {
|
|
|
|
self.values[j] = self.values[j+1]
|
|
|
|
}
|
|
|
|
self.values = self.values[:len(self.values)-1]
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) remove_ptr_at(i int) error {
|
|
|
|
if i >= len(self.pointers) || i < 0 {
|
|
|
|
return BpTreeError("i, %v, is out of bounds, %v.", i, len(self.pointers))
|
|
|
|
}
|
|
|
|
for j := i; j < len(self.pointers)-1; j++ {
|
|
|
|
self.pointers[j] = self.pointers[j+1]
|
|
|
|
}
|
|
|
|
self.pointers = self.pointers[:len(self.pointers)-1]
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) find(key ItemKey) (int, bool) {
|
2021-08-21 22:52:17 +00:00
|
|
|
var l = 0
|
|
|
|
var r = len(self.keys) - 1
|
2021-08-20 08:12:52 +00:00
|
|
|
var m int
|
|
|
|
for l <= r {
|
|
|
|
m = ((r - l) >> 1) + l
|
|
|
|
if key.Less(self.keys[m]) {
|
|
|
|
r = m - 1
|
|
|
|
} else if key.Equals(self.keys[m]) {
|
2021-09-18 08:29:47 +00:00
|
|
|
return m, true
|
2021-08-20 08:12:52 +00:00
|
|
|
} else {
|
|
|
|
l = m + 1
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return l, false
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) find_end_of_pure_run() *BpNode {
|
|
|
|
k := self.keys[0]
|
|
|
|
p := self
|
2021-08-21 01:50:16 +00:00
|
|
|
n := self.getNext()
|
2021-08-20 08:12:52 +00:00
|
|
|
for n != nil && n.Pure() && k.Equals(n.keys[0]) {
|
|
|
|
p = n
|
2021-08-21 01:50:16 +00:00
|
|
|
n = n.getNext()
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
return p
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) all() (li loc_iterator) {
|
|
|
|
j := -1
|
|
|
|
l := self.left_most_leaf()
|
|
|
|
end := false
|
|
|
|
j, l, end = next_location(j, l)
|
|
|
|
li = func() (i int, leaf *BpNode, next loc_iterator) {
|
|
|
|
if end {
|
|
|
|
return -1, nil, nil
|
|
|
|
}
|
|
|
|
i = j
|
|
|
|
leaf = l
|
|
|
|
j, l, end = next_location(j, l)
|
|
|
|
return i, leaf, li
|
|
|
|
}
|
|
|
|
return li
|
|
|
|
}
|
|
|
|
|
|
|
|
func (self *BpNode) all_backward() (li loc_iterator) {
|
|
|
|
l := self.right_most_leaf()
|
|
|
|
j := len(l.keys)
|
|
|
|
end := false
|
|
|
|
j, l, end = prev_location(j, l)
|
|
|
|
li = func() (i int, leaf *BpNode, next loc_iterator) {
|
|
|
|
if end {
|
|
|
|
return -1, nil, nil
|
|
|
|
}
|
|
|
|
i = j
|
|
|
|
leaf = l
|
|
|
|
j, l, end = prev_location(j, l)
|
|
|
|
return i, leaf, li
|
|
|
|
}
|
|
|
|
return li
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) forward(from, to ItemKey) (li loc_iterator) {
|
2021-08-20 08:12:52 +00:00
|
|
|
j, l := self.get_start(from)
|
|
|
|
end := false
|
|
|
|
j--
|
|
|
|
li = func() (i int, leaf *BpNode, next loc_iterator) {
|
|
|
|
j, l, end = next_location(j, l)
|
|
|
|
if end || to.Less(l.keys[j]) {
|
|
|
|
return -1, nil, nil
|
|
|
|
}
|
|
|
|
return j, l, li
|
|
|
|
}
|
|
|
|
return li
|
|
|
|
}
|
|
|
|
|
2021-08-21 22:54:42 +00:00
|
|
|
func (self *BpNode) backward(from, to ItemKey) (li loc_iterator) {
|
2021-08-20 08:12:52 +00:00
|
|
|
j, l := self.get_end(from)
|
|
|
|
end := false
|
|
|
|
li = func() (i int, leaf *BpNode, next loc_iterator) {
|
|
|
|
if end || l.keys[j].Less(to) {
|
|
|
|
return -1, nil, nil
|
|
|
|
}
|
|
|
|
i = j
|
|
|
|
leaf = l
|
|
|
|
j, l, end = prev_location(i, l)
|
|
|
|
return i, leaf, li
|
|
|
|
}
|
|
|
|
return li
|
|
|
|
}
|
|
|
|
|
|
|
|
func insert_linked_list_node(n, prev, next *BpNode) {
|
2021-08-21 01:50:16 +00:00
|
|
|
if (prev != nil && prev.getNext() != next) || (next != nil && next.getPrev() != prev) {
|
2021-08-20 08:12:52 +00:00
|
|
|
panic(BpTreeError("prev and next not hooked up"))
|
|
|
|
}
|
2021-08-21 01:50:16 +00:00
|
|
|
n.setPrev(prev)
|
|
|
|
n.setNext(next)
|
2021-08-20 08:12:52 +00:00
|
|
|
if prev != nil {
|
2021-08-21 01:50:16 +00:00
|
|
|
prev.setNext(n)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
if next != nil {
|
2021-08-21 01:50:16 +00:00
|
|
|
next.setPrev(n)
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func remove_linked_list_node(n *BpNode) {
|
2021-08-21 01:50:16 +00:00
|
|
|
if n.getPrev() != nil {
|
|
|
|
n.getPrev().setNext(n.getNext())
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
2021-08-21 01:50:16 +00:00
|
|
|
if n.getNext() != nil {
|
|
|
|
n.getNext().setPrev(n.getPrev())
|
2021-08-20 08:12:52 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-09-18 08:29:47 +00:00
|
|
|
/**
|
|
|
|
* a must be full and b must be empty else there will be a panic
|
|
|
|
*
|
|
|
|
* Different from common btree implementation, this splits the nodes by the inserted key.
|
|
|
|
* Items less than the splitKey stays in a, or moved to b if otherwise.
|
|
|
|
* This should help for monotonically increasing inserts.
|
|
|
|
*
|
2021-08-20 08:12:52 +00:00
|
|
|
*/
|
2021-09-18 08:29:47 +00:00
|
|
|
func balance_nodes(a, b *BpNode, splitKey ItemKey) {
|
2021-08-20 08:12:52 +00:00
|
|
|
if len(b.keys) != 0 {
|
|
|
|
panic(BpTreeError("b was not empty"))
|
|
|
|
}
|
|
|
|
if !a.Full() {
|
|
|
|
panic(BpTreeError("a was not full", a))
|
|
|
|
}
|
|
|
|
if cap(a.keys) != cap(b.keys) {
|
|
|
|
panic(BpTreeError("cap(a.keys) != cap(b.keys)"))
|
|
|
|
}
|
|
|
|
if cap(a.values) != cap(b.values) {
|
|
|
|
panic(BpTreeError("cap(a.values) != cap(b.values)"))
|
|
|
|
}
|
|
|
|
if cap(a.pointers) != cap(b.pointers) {
|
|
|
|
panic(BpTreeError("cap(a.pointers) != cap(b.pointers)"))
|
|
|
|
}
|
2021-09-18 08:29:47 +00:00
|
|
|
|
|
|
|
m := find_split_index(a, b, splitKey)
|
2021-08-21 22:52:17 +00:00
|
|
|
var lim = len(a.keys) - m
|
2021-08-20 08:12:52 +00:00
|
|
|
b.keys = b.keys[:lim]
|
|
|
|
if cap(a.values) > 0 {
|
|
|
|
if cap(a.values) != cap(a.keys) {
|
|
|
|
panic(BpTreeError("cap(a.values) != cap(a.keys)"))
|
|
|
|
}
|
|
|
|
b.values = b.values[:lim]
|
|
|
|
}
|
|
|
|
if cap(a.pointers) > 0 {
|
|
|
|
if cap(a.pointers) != cap(a.keys) {
|
|
|
|
panic(BpTreeError("cap(a.pointers) != cap(a.keys)"))
|
|
|
|
}
|
|
|
|
b.pointers = b.pointers[:lim]
|
|
|
|
}
|
|
|
|
for i := 0; i < lim; i++ {
|
|
|
|
j := m + i
|
|
|
|
b.keys[i] = a.keys[j]
|
|
|
|
if cap(a.values) > 0 {
|
|
|
|
b.values[i] = a.values[j]
|
|
|
|
}
|
|
|
|
if cap(a.pointers) > 0 {
|
|
|
|
b.pointers[i] = a.pointers[j]
|
|
|
|
}
|
|
|
|
}
|
|
|
|
a.keys = a.keys[:m]
|
|
|
|
if cap(a.values) > 0 {
|
|
|
|
a.values = a.values[:m]
|
|
|
|
}
|
|
|
|
if cap(a.pointers) > 0 {
|
|
|
|
a.pointers = a.pointers[:m]
|
|
|
|
}
|
|
|
|
}
|
2021-09-18 08:29:47 +00:00
|
|
|
|
|
|
|
func find_split_index(a, b *BpNode, splitKey ItemKey) int {
|
|
|
|
m := len(a.keys)
|
|
|
|
for m > 0 && !a.keys[m-1].Less(splitKey) {
|
|
|
|
m--
|
|
|
|
}
|
|
|
|
return m
|
|
|
|
}
|