ref: e0fffa8ae9627363f518cc7077e5e8e204135db5
parent: 3f842a00016a70d021ddf27a901d564a8e97ab61
author: Ori Bernstein <ori@eigenstate.org>
date: Mon Feb 1 22:40:41 EST 2021
tree: shrink buffer when flushing deletions.
--- a/blk.c
+++ b/blk.c
@@ -43,6 +43,20 @@
return siphash(b->data, Blksz);
}
+ushort
+blkfill(Blk *b)
+{
+ switch(b->type){
+ case Pivot:
+ return 2*b->nmsg + b->bufsz + 2*b->nent + b->valsz;
+ case Leaf:
+ return 2*b->nent + b->valsz;
+ default:
+ abort();
+ return 0; // shut up kencc
+ }
+}
+
int
putblk(Blk *b)
{
--- a/check.c
+++ b/check.c
@@ -41,6 +41,10 @@
}
if(b->type == Pivot){
c = getblk(x.bp, x.bh);
+ if(blkfill(c) != x.fill){
+ fprint(2, "mismatched block fill");
+ fail++;
+ }
if(invalidblk(c, h + 1, &x, &y))
fail++;
}
--- a/dat.h
+++ b/dat.h
@@ -19,7 +19,7 @@
Leafspc = Blkspc,
Keymax = 16,
Inlmax = 64,
- Ptrsz = 16,
+ Ptrsz = 18,
Kvmax = Keymax + Inlmax, /* Key and value */
Kpmax = Keymax + Ptrsz, /* Key and pointer */
Msgmax = 1 + (Kvmax > Kpmax ? Kvmax : Kpmax)
@@ -92,6 +92,7 @@
struct {
uvlong bp;
uvlong bh;
+ ushort fill;
};
/* inline values */
struct {
@@ -123,7 +124,17 @@
Blk *l; /* left of split */
Blk *r; /* right of split */
Blk *n; /* shadowed node */
- int split; /* did we split? */
+ /*
+ * If we merged or rotated, at least
+ * one of these nodes is not nil,
+ * and midx points at the left of
+ * the two nodes.
+ */
+ Blk *ml; /* merged/rotated left */
+ Blk *mr; /* merged/rotated right */
+ int midx; /* merged index */
+ char split; /* did we split? */
+ char merge; /* did we merge? */
};
struct Blk {
--- a/fns.h
+++ b/fns.h
@@ -14,6 +14,7 @@
int putblk(Blk*);
Blk* getblk(uvlong bp, uvlong bh);
void freeblk(Blk *b);
+ushort blkfill(Blk*);
uvlong blkhash(Blk*);
uvlong siphash(void*, usize);
--- a/main.c
+++ b/main.c
@@ -41,7 +41,8 @@
if(kv->type == Vinl)
return fmtprint(fmt, "Kvp(%.*s,%.*s)", kv->nk, kv->k, kv->nv, kv->v);
else
- return fmtprint(fmt, "Kvp(%.*s,(%llx,%llx))", kv->nk, kv->k, kv->bp, kv->bh);
+ return fmtprint(fmt, "Kvp(%.*s,(%llux,%llux,%ud))",
+ kv->nk, kv->k, kv->bp, kv->bh, kv->fill);
}
static int
--- a/tree.c
+++ b/tree.c
@@ -62,6 +62,7 @@
kv->k = b->data + o + 2;
kv->bp = GBIT64(kv->k + kv->nk + 0);
kv->bh = GBIT64(kv->k + kv->nk + 8);
+ kv->fill = GBIT16(kv->k + kv->nk + 16);
}else{
kv->type = Vinl;
kv->nk = GBIT16(b->data + o);
@@ -120,6 +121,7 @@
memcpy(p + 2, kv->k, kv->nk);
PBIT64(p + kv->nk + 2, kv->bp);
PBIT64(p + kv->nk + 10, kv->bh);
+ PBIT16(p + kv->nk + 18, kv->fill);
} else {
assert(kv->type == Vinl);
PBIT16(b->data + 2*i, o);
@@ -305,6 +307,7 @@
*idx = lo;
return 0;
}
+
int
filledbuf(Blk *b, int needed)
{
@@ -343,6 +346,7 @@
kv.type = Vref;
kv.bp = (uintptr)pp->l;
kv.bh = blkhash(pp->l);
+ kv.fill = blkfill(pp->l);
setval(n, i++, &kv, 0);
if(nbytes != nil)
*nbytes += 2 + valsz(&kv);
@@ -351,6 +355,7 @@
kv.type = Vref;
kv.bp = (uintptr)pp->r;
kv.bh = blkhash(pp->r);
+ kv.fill = blkfill(pp->r);
setval(n, i++, &kv, 0);
if(nbytes != nil)
*nbytes += 2 + valsz(&kv);
@@ -359,6 +364,7 @@
kv.type = Vref;
kv.bp = (uintptr)pp->n;
kv.bh = blkhash(pp->n);
+ kv.fill = blkfill(pp->n);
setval(n, i++, &kv, 1);
if(nbytes != nil)
*nbytes += 2 + valsz(&kv);
@@ -374,22 +380,33 @@
*
* When pidx != -1,
*/
-Blk*
-update(Blk *b, Path *p, Path *pp)
+int
+update(Path *p, Path *pp)
{
- int i, j, lo, hi, pidx;
- Blk *n;
+ int i, j, lo, hi, pidx, midx;
+ Blk *b, *n;
Msg m;
j = 0;
+ b = p->b;
lo = (p != nil) ? p->lo : -1;
hi = (p != nil) ? p->hi : -1;
pidx = (p != nil) ? p->idx : -1;
- n = newblk(b->type);
+ midx = (p != nil && p->merge) ? p->midx : -1;
+ if((n = newblk(b->type)) == nil)
+ return -1;
for(i = 0; i < b->nent; i++){
if(i == pidx){
j = copyup(n, j, pp, nil);
continue;
+ }else if(i == midx){
+ getval(p->ml, 0, &m);
+ setval(n, j++, &m, 0);
+ if(p->mr){
+ getval(p->mr, 0, &m);
+ setval(n, j++, &m, 0);
+ }
+ continue;
}
getval(b, i, &m);
setval(n, j++, &m, 0);
@@ -407,7 +424,8 @@
}
b->nmsg = j;
}
- return n;
+ p->n = n;
+ return 0;
}
@@ -432,8 +450,11 @@
*/
l = newblk(b->type);
r = newblk(b->type);
- if(l == nil || r == nil)
- goto error;
+ if(l == nil || r == nil){
+ freeblk(l);
+ freeblk(r);
+ return -1;
+ }
lo = (p != nil) ? p->lo : -1;
hi = (p != nil) ? p->hi : -1;
@@ -486,10 +507,6 @@
p->l = l;
p->r = r;
return 0;
-error:
- if(l != nil) freeblk(l);
- if(r != nil) freeblk(r);
- return -1;
}
int
@@ -514,6 +531,215 @@
return -1;
}
+int
+merge(Path *p, int idx, Blk *a, Blk *b)
+{
+ int i, o;
+ Msg m;
+ Blk *d;
+
+ USED(p);
+ if((d = newblk(a->type)) == nil)
+ return -1;
+ o = 0;
+ for(i = 0; i < a->nent; i++){
+ getval(a, i, &m);
+ setval(d, o++, &m, 0);
+ }
+ for(i = 0; i < b->nent; i++){
+ getval(b, i, &m);
+ setval(d, o++, &m, 0);
+ }
+ if(a->type == Pivot){
+ for(i = 0; i < a->nmsg; i++){
+ getmsg(a, i, &m);
+ setmsg(d, o++, &m);
+ }
+ for(i = 0; i < b->nmsg; i++){
+ getmsg(b, i, &m);
+ setmsg(d, o++, &m);
+ }
+ }
+ p->merge = 1;
+ p->midx = idx;
+ p->ml = d;
+ p->mr = nil;
+ return 0;
+}
+
+/*
+ * Returns whether the keys in b between
+ * idx and m would spill out of the buffer
+ * of d.
+ */
+int
+spillsbuf(Blk *d, Blk *b, Msg *m, int *idx)
+{
+ int i, used;
+ Msg n;
+
+ if(b->type == Leaf)
+ return 0;
+ used = 2*d->nmsg + d->bufsz;
+ for(i = *idx; i < b->nmsg; i++){
+ getmsg(b, i, &n);
+ if(keycmp(&n, m) > 0)
+ break;
+ used += 2 + msgsz(&n);
+ if(used >= Bufspc)
+ return 1;
+ }
+ print("does not spill");
+ *idx = i;
+ return 0;
+}
+
+int
+rotate(Path *p, int idx, Blk *a, Blk *b, int halfbuf)
+{
+ int i, o, copied, split, ovfidx;
+ Blk *d, *l, *r;
+ Msg m;
+
+ l = newblk(a->type);
+ r = newblk(a->type);
+ if(l == nil || r == nil){
+ freeblk(l);
+ freeblk(r);
+ return -1;
+ }
+ o = 0;
+ d = l;
+ split = -1;
+ ovfidx = 0;
+ copied = 0;
+ for(i = 0; i < a->nent; i++){
+ getval(a, i, &m);
+ if(d == l && (copied >= halfbuf || spillsbuf(d, a, &m, &ovfidx))){
+ split = i;
+ o = 0;
+ d = r;
+ }
+ setval(d, o++, &m, 0);
+ copied += valsz(&m);
+ }
+ for(i = 0; i < b->nent; i++){
+ if(d == l && (copied >= halfbuf || spillsbuf(d, b, &m, &ovfidx))){
+ split = i;
+ o = 0;
+ d = r;
+ }
+ getval(b, i, &m);
+ setval(d, o++, &m, 0);
+ copied += valsz(&m);
+ }
+ if(a->type == Pivot){
+ d = l;
+ o = 0;
+ for(i = 0; i < a->nmsg; i++){
+ if(i == split){
+ d = r;
+ o = 0;
+ }
+ getmsg(a, i, &m);
+ setmsg(d, o++, &m);
+ }
+ for(i = 0; i < b->nmsg; i++){
+ if(i == split){
+ d = r;
+ o = 0;
+ }
+ getmsg(b, i, &m);
+ setmsg(d, o++, &m);
+ }
+ }
+ p->merge = 1;
+ p->midx = idx;
+ p->ml = l;
+ p->mr = r;
+ return 0;
+}
+
+int
+rotmerge(Path *p, int idx, Blk *a, Blk *b)
+{
+ int na, nb, ma, mb, imbalance;
+
+ assert(a->type == b->type);
+
+ na = 2*a->nent + a->valsz;
+ nb = 2*b->nent + b->valsz;
+ if(a->type == Leaf){
+ ma = 0;
+ mb = 0;
+ }else{
+ ma = 2*a->nmsg + a->bufsz;
+ mb = 2*b->nmsg + b->bufsz;
+ }
+ imbalance = na - nb;
+ if(imbalance < 0)
+ imbalance *= -1;
+ /* works for leaf, because 0 always < Bufspc */
+ if(na + nb < Pivspc && ma + mb < Bufspc)
+ return merge(p, idx, a, b);
+ else if(imbalance < 4*Msgmax)
+ return rotate(p, idx, a, b, (na + nb)/2);
+ else
+ return 0;
+}
+
+int
+trymerge(Path *p, Path *pp, int idx)
+{
+ Blk *l,*m, *r;
+ Kvp km, kl, kr;
+ int ret;
+
+ l = nil;
+ r = nil;
+ ret = -1;
+ if(p->idx == -1)
+ return 0;
+ if(pp != nil){
+ if((m = pp->n) == nil)
+ return 0;
+ }else{
+ if((m = getblk(km.bp, km.bh)) == nil)
+ return -1;
+ }
+ /* Try merging left */
+ getval(p->b, idx, &km);
+ if(idx > 0){
+ getval(p->b, idx-1, &kl);
+ if(kl.fill + km.fill >= Blkspc)
+ goto next;
+ if((l = getblk(kl.bp, kl.bh)) == nil)
+ goto out;
+ if(rotmerge(p, idx-1, l, m) == -1)
+ goto out;
+ goto done;
+ }
+next:
+ if(idx < p->b->nent){
+ getval(p->b, idx+1, &kr);
+ if(kr.fill + km.fill >= Blkspc)
+ goto done;
+ if((r = getblk(kr.bp, kr.bh)) == nil)
+ goto out;
+ if(rotmerge(p, idx, m, r) == -1)
+ goto out;
+ goto done;
+ }
+done:
+ ret = 0;
+out:
+ putblk(l);
+ putblk(r);
+ if(pp == nil)
+ putblk(m);
+ return ret;
+}
+
static int
flush(Path *path, int npath, Msg *ins, int *redo)
{
@@ -538,7 +764,8 @@
p = &path[npath - 1];
if(p->b->type == Leaf){
if(!filledleaf(p->b, p[-1].sz)){
- p->n = update(p->b, p, pp);
+ if(update(p, pp) == -1)
+ return -1;
for(i = p[-1].lo; i < p[-1].hi; i++){
getmsg(p[-1].b, i, &m);
if(filledleaf(p->n, msgsz(&m)))
@@ -560,12 +787,19 @@
}
}
assert(p->n || (p->l && p->r));
+ p->midx = -1;
pp = p;
p--;
}
for(; p > path; p--){
if(!filledpiv(p->b, 1)){
- p->n = update(p->b, p, pp);
+ if(trymerge(p, pp, p->idx) == -1)
+ goto error;
+ /* If we merged the root node, break out. */
+ if(p[-1].b == nil && p[0].merge && p[0].mr == nil && p[0].b->nent == 2)
+ break;
+ if(update(p, pp) == -1)
+ goto error;
for(i = p[-1].lo; i < p[-1].hi; i++){
getmsg(p[-1].b, i, &m);
if(filledbuf(p->n, msgsz(&m)))
@@ -682,6 +916,7 @@
path = emalloc((fs->height + 2)*sizeof(Path));
path[npath].b = nil;
path[npath].idx = -1;
+ path[npath].midx = -1;
npath++;
b = fs->root;
@@ -703,12 +938,16 @@
npath++;
if(flush(path, npath, m, &redo) == -1)
goto error;
- b = path[0].n;
- if(b != nil)
+ if(path[0].n != nil){
fs->height++;
- else
- b = path[1].n;
- fs->root = b;
+ fs->root = path[0].n;
+ }else if(path[1].n != nil){
+ fs->root = path[1].n;
+ }else if(npath >2 && path[2].n != nil){
+ fs->height--;
+ fs->root = path[2].n;
+ }else
+ abort();
free(path);
if(redo)
goto again;