Merge pull request #3851 from yichengq/storage-kv-data

storage: save the KeyValue instead of Event in backend
This commit is contained in:
Xiang Li 2015-11-19 10:24:50 -08:00
commit cf2d20c5c9
6 changed files with 267 additions and 222 deletions

View File

@ -28,7 +28,7 @@ type index interface {
Put(key []byte, rev revision) Put(key []byte, rev revision)
Restore(key []byte, created, modified revision, ver int64) Restore(key []byte, created, modified revision, ver int64)
Tombstone(key []byte, rev revision) error Tombstone(key []byte, rev revision) error
RangeEvents(key, end []byte, rev int64) []revision RangeSince(key, end []byte, rev int64) []revision
Compact(rev int64) map[revision]struct{} Compact(rev int64) map[revision]struct{}
Equal(b index) bool Equal(b index) bool
} }
@ -134,10 +134,10 @@ func (ti *treeIndex) Tombstone(key []byte, rev revision) error {
return ki.tombstone(rev.main, rev.sub) return ki.tombstone(rev.main, rev.sub)
} }
// RangeEvents returns all revisions from key(including) to end(excluding) // RangeSince returns all revisions from key(including) to end(excluding)
// at or after the given rev. The returned slice is sorted in the order // at or after the given rev. The returned slice is sorted in the order
// of revision. // of revision.
func (ti *treeIndex) RangeEvents(key, end []byte, rev int64) []revision { func (ti *treeIndex) RangeSince(key, end []byte, rev int64) []revision {
ti.RLock() ti.RLock()
defer ti.RUnlock() defer ti.RUnlock()

View File

@ -136,7 +136,7 @@ func TestIndexTombstone(t *testing.T) {
} }
} }
func TestIndexRangeEvents(t *testing.T) { func TestIndexRangeSince(t *testing.T) {
allKeys := [][]byte{[]byte("foo"), []byte("foo1"), []byte("foo2"), []byte("foo2"), []byte("foo1"), []byte("foo")} allKeys := [][]byte{[]byte("foo"), []byte("foo1"), []byte("foo2"), []byte("foo2"), []byte("foo1"), []byte("foo")}
allRevs := []revision{{main: 1}, {main: 2}, {main: 3}, {main: 4}, {main: 5}, {main: 6}} allRevs := []revision{{main: 1}, {main: 2}, {main: 3}, {main: 4}, {main: 5}, {main: 6}}
@ -184,7 +184,7 @@ func TestIndexRangeEvents(t *testing.T) {
}, },
} }
for i, tt := range tests { for i, tt := range tests {
revs := index.RangeEvents(tt.key, tt.end, atRev) revs := index.RangeSince(tt.key, tt.end, atRev)
if !reflect.DeepEqual(revs, tt.wrevs) { if !reflect.DeepEqual(revs, tt.wrevs) {
t.Errorf("#%d: revs = %+v, want %+v", i, revs, tt.wrevs) t.Errorf("#%d: revs = %+v, want %+v", i, revs, tt.wrevs)
} }

View File

@ -32,6 +32,13 @@ var (
keyBucketName = []byte("key") keyBucketName = []byte("key")
metaBucketName = []byte("meta") metaBucketName = []byte("meta")
// markedRevBytesLen is the byte length of marked revision.
// The first `revBytesLen` bytes represents a normal revision. The last
// one byte is the mark.
markedRevBytesLen = revBytesLen + 1
markBytePosition = markedRevBytesLen - 1
markTombstone byte = 't'
scheduledCompactKeyName = []byte("scheduledCompactRev") scheduledCompactKeyName = []byte("scheduledCompactRev")
finishedCompactKeyName = []byte("finishedCompactRev") finishedCompactKeyName = []byte("finishedCompactRev")
@ -193,7 +200,7 @@ func (s *store) TxnDeleteRange(txnID int64, key, end []byte) (n, rev int64, err
return n, rev, nil return n, rev, nil
} }
// RangeEvents gets the events from key to end starting from startRev. // RangeHistory ranges the history from key to end starting from startRev.
// If `end` is nil, the request only observes the events on key. // If `end` is nil, the request only observes the events on key.
// If `end` is not nil, it observes the events on key range [key, range_end). // If `end` is not nil, it observes the events on key range [key, range_end).
// Limit limits the number of events returned. // Limit limits the number of events returned.
@ -202,28 +209,29 @@ func (s *store) TxnDeleteRange(txnID int64, key, end []byte) (n, rev int64, err
// If the required start rev is compacted, ErrCompacted will be returned. // If the required start rev is compacted, ErrCompacted will be returned.
// If the required start rev has not happened, ErrFutureRev will be returned. // If the required start rev has not happened, ErrFutureRev will be returned.
// //
// RangeEvents returns events that satisfy the requirement (0 <= n <= limit). // RangeHistory returns revision bytes slice and key-values that satisfy the requirement (0 <= n <= limit).
// If events in the revision range have not all happened, it returns immeidately // If history in the revision range has not all happened, it returns immeidately
// what is available. // what is available.
// It also returns nextRev which indicates the start revision used for the following // It also returns nextRev which indicates the start revision used for the following
// RangeEvents call. The nextRev could be smaller than the given endRev if the store // RangeEvents call. The nextRev could be smaller than the given endRev if the store
// has not progressed so far or it hits the event limit. // has not progressed so far or it hits the event limit.
// //
// TODO: return byte slices instead of events to avoid meaningless encode and decode. // TODO: return byte slices instead of keyValues to avoid meaningless encode and decode.
func (s *store) RangeEvents(key, end []byte, limit, startRev int64) (evs []storagepb.Event, nextRev int64, err error) { // This also helps to return raw (key, val) pair directly to make API consistent.
func (s *store) RangeHistory(key, end []byte, limit, startRev int64) (revbs [][]byte, kvs []storagepb.KeyValue, nextRev int64, err error) {
s.mu.Lock() s.mu.Lock()
defer s.mu.Unlock() defer s.mu.Unlock()
if startRev > 0 && startRev <= s.compactMainRev { if startRev > 0 && startRev <= s.compactMainRev {
return nil, 0, ErrCompacted return nil, nil, 0, ErrCompacted
} }
if startRev > s.currentRev.main { if startRev > s.currentRev.main {
return nil, 0, ErrFutureRev return nil, nil, 0, ErrFutureRev
} }
revs := s.kvindex.RangeEvents(key, end, startRev) revs := s.kvindex.RangeSince(key, end, startRev)
if len(revs) == 0 { if len(revs) == 0 {
return nil, s.currentRev.main + 1, nil return nil, nil, s.currentRev.main + 1, nil
} }
tx := s.b.BatchTx() tx := s.b.BatchTx()
@ -231,24 +239,24 @@ func (s *store) RangeEvents(key, end []byte, limit, startRev int64) (evs []stora
defer tx.Unlock() defer tx.Unlock()
// fetch events from the backend using revisions // fetch events from the backend using revisions
for _, rev := range revs { for _, rev := range revs {
revbytes := newRevBytes() start, end := revBytesRange(rev)
revToBytes(rev, revbytes)
_, vs := tx.UnsafeRange(keyBucketName, revbytes, nil, 0) ks, vs := tx.UnsafeRange(keyBucketName, start, end, 0)
if len(vs) != 1 { if len(vs) != 1 {
log.Fatalf("storage: range cannot find rev (%d,%d)", rev.main, rev.sub) log.Fatalf("storage: range cannot find rev (%d,%d)", rev.main, rev.sub)
} }
e := storagepb.Event{} var kv storagepb.KeyValue
if err := e.Unmarshal(vs[0]); err != nil { if err := kv.Unmarshal(vs[0]); err != nil {
log.Fatalf("storage: cannot unmarshal event: %v", err) log.Fatalf("storage: cannot unmarshal event: %v", err)
} }
evs = append(evs, e) revbs = append(revbs, ks[0])
if limit > 0 && len(evs) >= int(limit) { kvs = append(kvs, kv)
return evs, rev.main + 1, nil if limit > 0 && len(kvs) >= int(limit) {
return revbs, kvs, rev.main + 1, nil
} }
} }
return evs, s.currentRev.main + 1, nil return revbs, kvs, s.currentRev.main + 1, nil
} }
func (s *store) Compact(rev int64) error { func (s *store) Compact(rev int64) error {
@ -316,21 +324,19 @@ func (s *store) Restore() error {
// TODO: limit N to reduce max memory usage // TODO: limit N to reduce max memory usage
keys, vals := tx.UnsafeRange(keyBucketName, min, max, 0) keys, vals := tx.UnsafeRange(keyBucketName, min, max, 0)
for i, key := range keys { for i, key := range keys {
e := &storagepb.Event{} var kv storagepb.KeyValue
if err := e.Unmarshal(vals[i]); err != nil { if err := kv.Unmarshal(vals[i]); err != nil {
log.Fatalf("storage: cannot unmarshal event: %v", err) log.Fatalf("storage: cannot unmarshal event: %v", err)
} }
rev := bytesToRev(key) rev := bytesToRev(key[:revBytesLen])
// restore index // restore index
switch e.Type { switch {
case storagepb.PUT: case isTombstone(key):
s.kvindex.Restore(e.Kv.Key, revision{e.Kv.CreateRevision, 0}, rev, e.Kv.Version) s.kvindex.Tombstone(kv.Key, rev)
case storagepb.DELETE:
s.kvindex.Tombstone(e.Kv.Key, rev)
default: default:
log.Panicf("storage: unexpected event type %s", e.Type) s.kvindex.Restore(kv.Key, revision{kv.CreateRevision, 0}, rev, kv.Version)
} }
// update revision // update revision
@ -392,19 +398,18 @@ func (s *store) rangeKeys(key, end []byte, limit, rangeRev int64) (kvs []storage
} }
for _, revpair := range revpairs { for _, revpair := range revpairs {
revbytes := newRevBytes() start, end := revBytesRange(revpair)
revToBytes(revpair, revbytes)
_, vs := s.tx.UnsafeRange(keyBucketName, revbytes, nil, 0) _, vs := s.tx.UnsafeRange(keyBucketName, start, end, 0)
if len(vs) != 1 { if len(vs) != 1 {
log.Fatalf("storage: range cannot find rev (%d,%d)", revpair.main, revpair.sub) log.Fatalf("storage: range cannot find rev (%d,%d)", revpair.main, revpair.sub)
} }
e := &storagepb.Event{} var kv storagepb.KeyValue
if err := e.Unmarshal(vs[0]); err != nil { if err := kv.Unmarshal(vs[0]); err != nil {
log.Fatalf("storage: cannot unmarshal event: %v", err) log.Fatalf("storage: cannot unmarshal event: %v", err)
} }
kvs = append(kvs, *e.Kv) kvs = append(kvs, kv)
if limit > 0 && len(kvs) >= int(limit) { if limit > 0 && len(kvs) >= int(limit) {
break break
} }
@ -426,18 +431,15 @@ func (s *store) put(key, value []byte) {
revToBytes(revision{main: rev, sub: s.currentRev.sub}, ibytes) revToBytes(revision{main: rev, sub: s.currentRev.sub}, ibytes)
ver = ver + 1 ver = ver + 1
event := storagepb.Event{ kv := storagepb.KeyValue{
Type: storagepb.PUT,
Kv: &storagepb.KeyValue{
Key: key, Key: key,
Value: value, Value: value,
CreateRevision: c, CreateRevision: c,
ModRevision: rev, ModRevision: rev,
Version: ver, Version: ver,
},
} }
d, err := event.Marshal() d, err := kv.Marshal()
if err != nil { if err != nil {
log.Fatalf("storage: cannot marshal event: %v", err) log.Fatalf("storage: cannot marshal event: %v", err)
} }
@ -469,15 +471,13 @@ func (s *store) delete(key []byte) {
ibytes := newRevBytes() ibytes := newRevBytes()
revToBytes(revision{main: mainrev, sub: s.currentRev.sub}, ibytes) revToBytes(revision{main: mainrev, sub: s.currentRev.sub}, ibytes)
ibytes = appendMarkTombstone(ibytes)
event := storagepb.Event{ kv := storagepb.KeyValue{
Type: storagepb.DELETE,
Kv: &storagepb.KeyValue{
Key: key, Key: key,
},
} }
d, err := event.Marshal() d, err := kv.Marshal()
if err != nil { if err != nil {
log.Fatalf("storage: cannot marshal event: %v", err) log.Fatalf("storage: cannot marshal event: %v", err)
} }
@ -489,3 +489,29 @@ func (s *store) delete(key []byte) {
} }
s.currentRev.sub += 1 s.currentRev.sub += 1
} }
// appendMarkTombstone appends tombstone mark to normal revision bytes.
func appendMarkTombstone(b []byte) []byte {
if len(b) != revBytesLen {
log.Panicf("cannot append mark to non normal revision bytes")
}
return append(b, markTombstone)
}
// isTombstone checks whether the revision bytes is a tombstone.
func isTombstone(b []byte) bool {
return len(b) == markedRevBytesLen && b[markBytePosition] == markTombstone
}
// revBytesRange returns the range of revision bytes at
// the given revision.
func revBytesRange(rev revision) (start, end []byte) {
start = newRevBytes()
revToBytes(rev, start)
end = newRevBytes()
endRev := revision{main: rev.main, sub: rev.sub + 1}
revToBytes(endRev, end)
return start, end
}

View File

@ -46,55 +46,50 @@ func TestStorePut(t *testing.T) {
r indexGetResp r indexGetResp
wrev revision wrev revision
wev storagepb.Event wkey []byte
wkv storagepb.KeyValue
wputrev revision wputrev revision
}{ }{
{ {
revision{1, 0}, revision{1, 0},
indexGetResp{revision{}, revision{}, 0, ErrRevisionNotFound}, indexGetResp{revision{}, revision{}, 0, ErrRevisionNotFound},
revision{1, 1}, revision{1, 1},
storagepb.Event{ newTestKeyBytes(revision{2, 0}, false),
Type: storagepb.PUT, storagepb.KeyValue{
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
Value: []byte("bar"), Value: []byte("bar"),
CreateRevision: 2, CreateRevision: 2,
ModRevision: 2, ModRevision: 2,
Version: 1, Version: 1,
}, },
},
revision{2, 0}, revision{2, 0},
}, },
{ {
revision{1, 1}, revision{1, 1},
indexGetResp{revision{2, 0}, revision{2, 0}, 1, nil}, indexGetResp{revision{2, 0}, revision{2, 0}, 1, nil},
revision{1, 2}, revision{1, 2},
storagepb.Event{ newTestKeyBytes(revision{2, 1}, false),
Type: storagepb.PUT, storagepb.KeyValue{
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
Value: []byte("bar"), Value: []byte("bar"),
CreateRevision: 2, CreateRevision: 2,
ModRevision: 2, ModRevision: 2,
Version: 2, Version: 2,
}, },
},
revision{2, 1}, revision{2, 1},
}, },
{ {
revision{2, 0}, revision{2, 0},
indexGetResp{revision{2, 1}, revision{2, 0}, 2, nil}, indexGetResp{revision{2, 1}, revision{2, 0}, 2, nil},
revision{2, 1}, revision{2, 1},
storagepb.Event{ newTestKeyBytes(revision{3, 0}, false),
Type: storagepb.PUT, storagepb.KeyValue{
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
Value: []byte("bar"), Value: []byte("bar"),
CreateRevision: 2, CreateRevision: 2,
ModRevision: 3, ModRevision: 3,
Version: 3, Version: 3,
}, },
},
revision{3, 0}, revision{3, 0},
}, },
} }
@ -106,12 +101,12 @@ func TestStorePut(t *testing.T) {
s.put([]byte("foo"), []byte("bar")) s.put([]byte("foo"), []byte("bar"))
data, err := tt.wev.Marshal() data, err := tt.wkv.Marshal()
if err != nil { if err != nil {
t.Errorf("#%d: marshal err = %v, want nil", i, err) t.Errorf("#%d: marshal err = %v, want nil", i, err)
} }
wact := []testutil.Action{ wact := []testutil.Action{
{"put", []interface{}{keyBucketName, newTestBytes(tt.wputrev), data}}, {"put", []interface{}{keyBucketName, tt.wkey, data}},
} }
if g := b.tx.Action(); !reflect.DeepEqual(g, wact) { if g := b.tx.Action(); !reflect.DeepEqual(g, wact) {
t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact) t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact)
@ -130,17 +125,15 @@ func TestStorePut(t *testing.T) {
} }
func TestStoreRange(t *testing.T) { func TestStoreRange(t *testing.T) {
ev := storagepb.Event{ key := newTestKeyBytes(revision{2, 0}, false)
Type: storagepb.PUT, kv := storagepb.KeyValue{
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
Value: []byte("bar"), Value: []byte("bar"),
CreateRevision: 1, CreateRevision: 1,
ModRevision: 2, ModRevision: 2,
Version: 1, Version: 1,
},
} }
evb, err := ev.Marshal() kvb, err := kv.Marshal()
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
@ -153,11 +146,11 @@ func TestStoreRange(t *testing.T) {
}{ }{
{ {
indexRangeResp{[][]byte{[]byte("foo")}, []revision{{2, 0}}}, indexRangeResp{[][]byte{[]byte("foo")}, []revision{{2, 0}}},
rangeResp{[][]byte{newTestBytes(revision{2, 0})}, [][]byte{evb}}, rangeResp{[][]byte{key}, [][]byte{kvb}},
}, },
{ {
indexRangeResp{[][]byte{[]byte("foo"), []byte("foo1")}, []revision{{2, 0}, {3, 0}}}, indexRangeResp{[][]byte{[]byte("foo"), []byte("foo1")}, []revision{{2, 0}, {3, 0}}},
rangeResp{[][]byte{newTestBytes(revision{2, 0})}, [][]byte{evb}}, rangeResp{[][]byte{key}, [][]byte{kvb}},
}, },
} }
for i, tt := range tests { for i, tt := range tests {
@ -171,15 +164,16 @@ func TestStoreRange(t *testing.T) {
if err != nil { if err != nil {
t.Errorf("#%d: err = %v, want nil", i, err) t.Errorf("#%d: err = %v, want nil", i, err)
} }
if w := []storagepb.KeyValue{*ev.Kv}; !reflect.DeepEqual(kvs, w) { if w := []storagepb.KeyValue{kv}; !reflect.DeepEqual(kvs, w) {
t.Errorf("#%d: kvs = %+v, want %+v", i, kvs, w) t.Errorf("#%d: kvs = %+v, want %+v", i, kvs, w)
} }
if rev != wrev { if rev != wrev {
t.Errorf("#%d: rev = %d, want %d", i, rev, wrev) t.Errorf("#%d: rev = %d, want %d", i, rev, wrev)
} }
wstart, wend := revBytesRange(tt.idxr.revs[0])
wact := []testutil.Action{ wact := []testutil.Action{
{"range", []interface{}{keyBucketName, newTestBytes(tt.idxr.revs[0]), []byte(nil), int64(0)}}, {"range", []interface{}{keyBucketName, wstart, wend, int64(0)}},
} }
if g := b.tx.Action(); !reflect.DeepEqual(g, wact) { if g := b.tx.Action(); !reflect.DeepEqual(g, wact) {
t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact) t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact)
@ -201,6 +195,7 @@ func TestStoreDeleteRange(t *testing.T) {
rev revision rev revision
r indexRangeResp r indexRangeResp
wkey []byte
wrev revision wrev revision
wrrev int64 wrrev int64
wdelrev revision wdelrev revision
@ -208,6 +203,7 @@ func TestStoreDeleteRange(t *testing.T) {
{ {
revision{2, 0}, revision{2, 0},
indexRangeResp{[][]byte{[]byte("foo")}, []revision{{2, 0}}}, indexRangeResp{[][]byte{[]byte("foo")}, []revision{{2, 0}}},
newTestKeyBytes(revision{3, 0}, true),
revision{2, 1}, revision{2, 1},
2, 2,
revision{3, 0}, revision{3, 0},
@ -215,6 +211,7 @@ func TestStoreDeleteRange(t *testing.T) {
{ {
revision{2, 1}, revision{2, 1},
indexRangeResp{[][]byte{[]byte("foo")}, []revision{{2, 0}}}, indexRangeResp{[][]byte{[]byte("foo")}, []revision{{2, 0}}},
newTestKeyBytes(revision{3, 1}, true),
revision{2, 2}, revision{2, 2},
3, 3,
revision{3, 1}, revision{3, 1},
@ -231,17 +228,14 @@ func TestStoreDeleteRange(t *testing.T) {
t.Errorf("#%d: n = %d, want 1", i, n) t.Errorf("#%d: n = %d, want 1", i, n)
} }
data, err := (&storagepb.Event{ data, err := (&storagepb.KeyValue{
Type: storagepb.DELETE,
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
},
}).Marshal() }).Marshal()
if err != nil { if err != nil {
t.Errorf("#%d: marshal err = %v, want nil", i, err) t.Errorf("#%d: marshal err = %v, want nil", i, err)
} }
wact := []testutil.Action{ wact := []testutil.Action{
{"put", []interface{}{keyBucketName, newTestBytes(tt.wdelrev), data}}, {"put", []interface{}{keyBucketName, tt.wkey, data}},
} }
if g := b.tx.Action(); !reflect.DeepEqual(g, wact) { if g := b.tx.Action(); !reflect.DeepEqual(g, wact) {
t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact) t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact)
@ -259,18 +253,16 @@ func TestStoreDeleteRange(t *testing.T) {
} }
} }
func TestStoreRangeEvents(t *testing.T) { func TestStoreRangeHistory(t *testing.T) {
ev := storagepb.Event{ key := newTestKeyBytes(revision{2, 0}, false)
Type: storagepb.PUT, kv := storagepb.KeyValue{
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
Value: []byte("bar"), Value: []byte("bar"),
CreateRevision: 1, CreateRevision: 1,
ModRevision: 2, ModRevision: 2,
Version: 1, Version: 1,
},
} }
evb, err := ev.Marshal() kvb, err := kv.Marshal()
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
@ -282,11 +274,11 @@ func TestStoreRangeEvents(t *testing.T) {
}{ }{
{ {
indexRangeEventsResp{[]revision{{2, 0}}}, indexRangeEventsResp{[]revision{{2, 0}}},
rangeResp{[][]byte{newTestBytes(revision{2, 0})}, [][]byte{evb}}, rangeResp{[][]byte{key}, [][]byte{kvb}},
}, },
{ {
indexRangeEventsResp{[]revision{{2, 0}, {3, 0}}}, indexRangeEventsResp{[]revision{{2, 0}, {3, 0}}},
rangeResp{[][]byte{newTestBytes(revision{2, 0})}, [][]byte{evb}}, rangeResp{[][]byte{key}, [][]byte{kvb}},
}, },
} }
for i, tt := range tests { for i, tt := range tests {
@ -295,12 +287,15 @@ func TestStoreRangeEvents(t *testing.T) {
index.indexRangeEventsRespc <- tt.idxr index.indexRangeEventsRespc <- tt.idxr
b.tx.rangeRespc <- tt.r b.tx.rangeRespc <- tt.r
evs, _, err := s.RangeEvents([]byte("foo"), []byte("goo"), 1, 1) keys, kvs, _, err := s.RangeHistory([]byte("foo"), []byte("goo"), 1, 1)
if err != nil { if err != nil {
t.Errorf("#%d: err = %v, want nil", i, err) t.Errorf("#%d: err = %v, want nil", i, err)
} }
if w := []storagepb.Event{ev}; !reflect.DeepEqual(evs, w) { if w := [][]byte{key}; !reflect.DeepEqual(keys, w) {
t.Errorf("#%d: evs = %+v, want %+v", i, evs, w) t.Errorf("#%d: keys = %+v, want %+v", i, keys, w)
}
if w := []storagepb.KeyValue{kv}; !reflect.DeepEqual(kvs, w) {
t.Errorf("#%d: kvs = %+v, want %+v", i, kvs, w)
} }
wact := []testutil.Action{ wact := []testutil.Action{
@ -309,8 +304,9 @@ func TestStoreRangeEvents(t *testing.T) {
if g := index.Action(); !reflect.DeepEqual(g, wact) { if g := index.Action(); !reflect.DeepEqual(g, wact) {
t.Errorf("#%d: index action = %+v, want %+v", i, g, wact) t.Errorf("#%d: index action = %+v, want %+v", i, g, wact)
} }
wstart, wend := revBytesRange(tt.idxr.revs[0])
wact = []testutil.Action{ wact = []testutil.Action{
{"range", []interface{}{keyBucketName, newTestBytes(tt.idxr.revs[0]), []byte(nil), int64(0)}}, {"range", []interface{}{keyBucketName, wstart, wend, int64(0)}},
} }
if g := b.tx.Action(); !reflect.DeepEqual(g, wact) { if g := b.tx.Action(); !reflect.DeepEqual(g, wact) {
t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact) t.Errorf("#%d: tx action = %+v, want %+v", i, g, wact)
@ -325,7 +321,9 @@ func TestStoreCompact(t *testing.T) {
s, b, index := newFakeStore() s, b, index := newFakeStore()
s.currentRev = revision{3, 0} s.currentRev = revision{3, 0}
index.indexCompactRespc <- map[revision]struct{}{revision{1, 0}: {}} index.indexCompactRespc <- map[revision]struct{}{revision{1, 0}: {}}
b.tx.rangeRespc <- rangeResp{[][]byte{newTestBytes(revision{1, 0}), newTestBytes(revision{2, 0})}, nil} key1 := newTestKeyBytes(revision{1, 0}, false)
key2 := newTestKeyBytes(revision{2, 0}, false)
b.tx.rangeRespc <- rangeResp{[][]byte{key1, key2}, nil}
s.Compact(3) s.Compact(3)
s.wg.Wait() s.wg.Wait()
@ -336,10 +334,10 @@ func TestStoreCompact(t *testing.T) {
end := make([]byte, 8) end := make([]byte, 8)
binary.BigEndian.PutUint64(end, uint64(4)) binary.BigEndian.PutUint64(end, uint64(4))
wact := []testutil.Action{ wact := []testutil.Action{
{"put", []interface{}{metaBucketName, scheduledCompactKeyName, newTestBytes(revision{3, 0})}}, {"put", []interface{}{metaBucketName, scheduledCompactKeyName, newTestRevBytes(revision{3, 0})}},
{"range", []interface{}{keyBucketName, make([]byte, 17), end, int64(10000)}}, {"range", []interface{}{keyBucketName, make([]byte, 17), end, int64(10000)}},
{"delete", []interface{}{keyBucketName, newTestBytes(revision{2, 0})}}, {"delete", []interface{}{keyBucketName, key2}},
{"put", []interface{}{metaBucketName, finishedCompactKeyName, newTestBytes(revision{3, 0})}}, {"put", []interface{}{metaBucketName, finishedCompactKeyName, newTestRevBytes(revision{3, 0})}},
} }
if g := b.tx.Action(); !reflect.DeepEqual(g, wact) { if g := b.tx.Action(); !reflect.DeepEqual(g, wact) {
t.Errorf("tx actions = %+v, want %+v", g, wact) t.Errorf("tx actions = %+v, want %+v", g, wact)
@ -355,33 +353,29 @@ func TestStoreCompact(t *testing.T) {
func TestStoreRestore(t *testing.T) { func TestStoreRestore(t *testing.T) {
s, b, index := newFakeStore() s, b, index := newFakeStore()
putev := storagepb.Event{ putkey := newTestKeyBytes(revision{3, 0}, false)
Type: storagepb.PUT, putkv := storagepb.KeyValue{
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
Value: []byte("bar"), Value: []byte("bar"),
CreateRevision: 3, CreateRevision: 3,
ModRevision: 3, ModRevision: 3,
Version: 1, Version: 1,
},
} }
putevb, err := putev.Marshal() putkvb, err := putkv.Marshal()
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
delev := storagepb.Event{ delkey := newTestKeyBytes(revision{4, 0}, true)
Type: storagepb.DELETE, delkv := storagepb.KeyValue{
Kv: &storagepb.KeyValue{
Key: []byte("foo"), Key: []byte("foo"),
},
} }
delevb, err := delev.Marshal() delkvb, err := delkv.Marshal()
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
b.tx.rangeRespc <- rangeResp{[][]byte{finishedCompactKeyName}, [][]byte{newTestBytes(revision{2, 0})}} b.tx.rangeRespc <- rangeResp{[][]byte{finishedCompactKeyName}, [][]byte{newTestRevBytes(revision{2, 0})}}
b.tx.rangeRespc <- rangeResp{[][]byte{newTestBytes(revision{3, 0}), newTestBytes(revision{4, 0})}, [][]byte{putevb, delevb}} b.tx.rangeRespc <- rangeResp{[][]byte{putkey, delkey}, [][]byte{putkvb, delkvb}}
b.tx.rangeRespc <- rangeResp{[][]byte{scheduledCompactKeyName}, [][]byte{newTestBytes(revision{2, 0})}} b.tx.rangeRespc <- rangeResp{[][]byte{scheduledCompactKeyName}, [][]byte{newTestRevBytes(revision{2, 0})}}
s.Restore() s.Restore()
@ -394,7 +388,7 @@ func TestStoreRestore(t *testing.T) {
} }
wact := []testutil.Action{ wact := []testutil.Action{
{"range", []interface{}{metaBucketName, finishedCompactKeyName, []byte(nil), int64(0)}}, {"range", []interface{}{metaBucketName, finishedCompactKeyName, []byte(nil), int64(0)}},
{"range", []interface{}{keyBucketName, newTestBytes(revision{}), newTestBytes(revision{math.MaxInt64, math.MaxInt64}), int64(0)}}, {"range", []interface{}{keyBucketName, newTestRevBytes(revision{}), newTestRevBytes(revision{math.MaxInt64, math.MaxInt64}), int64(0)}},
{"range", []interface{}{metaBucketName, scheduledCompactKeyName, []byte(nil), int64(0)}}, {"range", []interface{}{metaBucketName, scheduledCompactKeyName, []byte(nil), int64(0)}},
} }
if g := b.tx.Action(); !reflect.DeepEqual(g, wact) { if g := b.tx.Action(); !reflect.DeepEqual(g, wact) {
@ -410,79 +404,79 @@ func TestStoreRestore(t *testing.T) {
} }
// tests end parameter works well // tests end parameter works well
func TestStoreRangeEventsEnd(t *testing.T) { func TestStoreRangeHistoryEnd(t *testing.T) {
s := newStore(tmpPath) s := newStore(tmpPath)
defer cleanup(s, tmpPath) defer cleanup(s, tmpPath)
s.Put([]byte("foo"), []byte("bar")) s.Put([]byte("foo"), []byte("bar"))
s.Put([]byte("foo1"), []byte("bar1")) s.Put([]byte("foo1"), []byte("bar1"))
s.Put([]byte("foo2"), []byte("bar2")) s.Put([]byte("foo2"), []byte("bar2"))
evs := []storagepb.Event{ keys := [][]byte{
{ newTestKeyBytes(revision{1, 0}, false),
Type: storagepb.PUT, newTestKeyBytes(revision{2, 0}, false),
Kv: &storagepb.KeyValue{Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 1, ModRevision: 1, Version: 1}, newTestKeyBytes(revision{3, 0}, false),
}, }
{ kvs := []storagepb.KeyValue{
Type: storagepb.PUT, {Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 1, ModRevision: 1, Version: 1},
Kv: &storagepb.KeyValue{Key: []byte("foo1"), Value: []byte("bar1"), CreateRevision: 2, ModRevision: 2, Version: 1}, {Key: []byte("foo1"), Value: []byte("bar1"), CreateRevision: 2, ModRevision: 2, Version: 1},
}, {Key: []byte("foo2"), Value: []byte("bar2"), CreateRevision: 3, ModRevision: 3, Version: 1},
{
Type: storagepb.PUT,
Kv: &storagepb.KeyValue{Key: []byte("foo2"), Value: []byte("bar2"), CreateRevision: 3, ModRevision: 3, Version: 1},
},
} }
tests := []struct { tests := []struct {
key, end []byte key, end []byte
wevs []storagepb.Event wkeys [][]byte
wkvs []storagepb.KeyValue
}{ }{
// get no keys // get no keys
{ {
[]byte("doo"), []byte("foo"), []byte("doo"), []byte("foo"),
nil, nil, nil,
}, },
// get no keys when key == end // get no keys when key == end
{ {
[]byte("foo"), []byte("foo"), []byte("foo"), []byte("foo"),
nil, nil, nil,
}, },
// get no keys when ranging single key // get no keys when ranging single key
{ {
[]byte("doo"), nil, []byte("doo"), nil,
nil, nil, nil,
}, },
// get all keys // get all keys
{ {
[]byte("foo"), []byte("foo3"), []byte("foo"), []byte("foo3"),
evs, keys, kvs,
}, },
// get partial keys // get partial keys
{ {
[]byte("foo"), []byte("foo1"), []byte("foo"), []byte("foo1"),
evs[:1], keys[:1], kvs[:1],
}, },
// get single key // get single key
{ {
[]byte("foo"), nil, []byte("foo"), nil,
evs[:1], keys[:1], kvs[:1],
}, },
} }
for i, tt := range tests { for i, tt := range tests {
evs, rev, err := s.RangeEvents(tt.key, tt.end, 0, 1) keys, kvs, rev, err := s.RangeHistory(tt.key, tt.end, 0, 1)
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
if rev != 4 { if rev != 4 {
t.Errorf("#%d: rev = %d, want %d", i, rev, 4) t.Errorf("#%d: rev = %d, want %d", i, rev, 4)
} }
if !reflect.DeepEqual(evs, tt.wevs) { if !reflect.DeepEqual(keys, tt.wkeys) {
t.Errorf("#%d: evs = %+v, want %+v", i, evs, tt.wevs) t.Errorf("#%d: actions = %+v, want %+v", i, keys, tt.wkeys)
}
if !reflect.DeepEqual(kvs, tt.wkvs) {
t.Errorf("#%d: kvs = %+v, want %+v", i, kvs, tt.wkvs)
} }
} }
} }
func TestStoreRangeEventsRev(t *testing.T) { func TestStoreRangeHistoryRev(t *testing.T) {
s := newStore(tmpPath) s := newStore(tmpPath)
defer cleanup(s, tmpPath) defer cleanup(s, tmpPath)
@ -490,39 +484,39 @@ func TestStoreRangeEventsRev(t *testing.T) {
s.DeleteRange([]byte("foo"), nil) s.DeleteRange([]byte("foo"), nil)
s.Put([]byte("foo"), []byte("bar")) s.Put([]byte("foo"), []byte("bar"))
s.Put([]byte("unrelated"), []byte("unrelated")) s.Put([]byte("unrelated"), []byte("unrelated"))
evs := []storagepb.Event{ keys := [][]byte{
{ newTestKeyBytes(revision{1, 0}, false),
Type: storagepb.PUT, newTestKeyBytes(revision{2, 0}, true),
Kv: &storagepb.KeyValue{Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 1, ModRevision: 1, Version: 1}, newTestKeyBytes(revision{3, 0}, false),
}, }
{ kvs := []storagepb.KeyValue{
Type: storagepb.DELETE, {Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 1, ModRevision: 1, Version: 1},
Kv: &storagepb.KeyValue{Key: []byte("foo")}, {Key: []byte("foo")},
}, {Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 3, ModRevision: 3, Version: 1},
{
Type: storagepb.PUT,
Kv: &storagepb.KeyValue{Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 3, ModRevision: 3, Version: 1},
},
} }
tests := []struct { tests := []struct {
start int64 start int64
wevs []storagepb.Event wkeys [][]byte
wkvs []storagepb.KeyValue
wnext int64 wnext int64
}{ }{
{0, evs, 5}, {0, keys, kvs, 5},
{1, evs, 5}, {1, keys, kvs, 5},
{3, evs[2:], 5}, {3, keys[2:], kvs[2:], 5},
} }
for i, tt := range tests { for i, tt := range tests {
evs, next, err := s.RangeEvents([]byte("foo"), nil, 0, tt.start) keys, kvs, next, err := s.RangeHistory([]byte("foo"), nil, 0, tt.start)
if err != nil { if err != nil {
t.Fatal(err) t.Fatal(err)
} }
if !reflect.DeepEqual(evs, tt.wevs) { if !reflect.DeepEqual(keys, tt.wkeys) {
t.Errorf("#%d: evs = %+v, want %+v", i, evs, tt.wevs) t.Errorf("#%d: acts = %+v, want %+v", i, keys, tt.wkeys)
}
if !reflect.DeepEqual(kvs, tt.wkvs) {
t.Errorf("#%d: kvs = %+v, want %+v", i, kvs, tt.wkvs)
} }
if next != tt.wnext { if next != tt.wnext {
t.Errorf("#%d: next = %d, want %d", i, next, tt.wnext) t.Errorf("#%d: next = %d, want %d", i, next, tt.wnext)
@ -530,7 +524,7 @@ func TestStoreRangeEventsRev(t *testing.T) {
} }
} }
func TestStoreRangeEventsBad(t *testing.T) { func TestStoreRangeHistoryBad(t *testing.T) {
s := newStore(tmpPath) s := newStore(tmpPath)
defer cleanup(s, tmpPath) defer cleanup(s, tmpPath)
@ -552,55 +546,55 @@ func TestStoreRangeEventsBad(t *testing.T) {
{10, ErrFutureRev}, {10, ErrFutureRev},
} }
for i, tt := range tests { for i, tt := range tests {
_, _, err := s.RangeEvents([]byte("foo"), nil, 0, tt.rev) _, _, _, err := s.RangeHistory([]byte("foo"), nil, 0, tt.rev)
if err != tt.werr { if err != tt.werr {
t.Errorf("#%d: error = %v, want %v", i, err, tt.werr) t.Errorf("#%d: error = %v, want %v", i, err, tt.werr)
} }
} }
} }
func TestStoreRangeEventsLimit(t *testing.T) { func TestStoreRangeHistoryLimit(t *testing.T) {
s := newStore(tmpPath) s := newStore(tmpPath)
defer cleanup(s, tmpPath) defer cleanup(s, tmpPath)
s.Put([]byte("foo"), []byte("bar")) s.Put([]byte("foo"), []byte("bar"))
s.DeleteRange([]byte("foo"), nil) s.DeleteRange([]byte("foo"), nil)
s.Put([]byte("foo"), []byte("bar")) s.Put([]byte("foo"), []byte("bar"))
evs := []storagepb.Event{ keys := [][]byte{
{ newTestKeyBytes(revision{1, 0}, false),
Type: storagepb.PUT, newTestKeyBytes(revision{2, 0}, true),
Kv: &storagepb.KeyValue{Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 1, ModRevision: 1, Version: 1}, newTestKeyBytes(revision{3, 0}, false),
}, }
{ kvs := []storagepb.KeyValue{
Type: storagepb.DELETE, {Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 1, ModRevision: 1, Version: 1},
Kv: &storagepb.KeyValue{Key: []byte("foo")}, {Key: []byte("foo")},
}, {Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 3, ModRevision: 3, Version: 1},
{
Type: storagepb.PUT,
Kv: &storagepb.KeyValue{Key: []byte("foo"), Value: []byte("bar"), CreateRevision: 3, ModRevision: 3, Version: 1},
},
} }
tests := []struct { tests := []struct {
limit int64 limit int64
wevs []storagepb.Event wkeys [][]byte
wkvs []storagepb.KeyValue
}{ }{
// no limit // no limit
{-1, evs}, {-1, keys, kvs},
// no limit // no limit
{0, evs}, {0, keys, kvs},
{1, evs[:1]}, {1, keys[:1], kvs[:1]},
{2, evs[:2]}, {2, keys[:2], kvs[:2]},
{3, evs}, {3, keys, kvs},
{100, evs}, {100, keys, kvs},
} }
for i, tt := range tests { for i, tt := range tests {
evs, _, err := s.RangeEvents([]byte("foo"), nil, tt.limit, 1) keys, kvs, _, err := s.RangeHistory([]byte("foo"), nil, tt.limit, 1)
if err != nil { if err != nil {
t.Fatalf("#%d: range error (%v)", i, err) t.Fatalf("#%d: range error (%v)", i, err)
} }
if !reflect.DeepEqual(evs, tt.wevs) { if !reflect.DeepEqual(keys, tt.wkeys) {
t.Errorf("#%d: evs = %+v, want %+v", i, evs, tt.wevs) t.Errorf("#%d: acts = %+v, want %+v", i, keys, tt.wkeys)
}
if !reflect.DeepEqual(kvs, tt.wkvs) {
t.Errorf("#%d: kvs = %+v, want %+v", i, kvs, tt.wkvs)
} }
} }
} }
@ -688,12 +682,21 @@ func BenchmarkStorePut(b *testing.B) {
} }
} }
func newTestBytes(rev revision) []byte { func newTestRevBytes(rev revision) []byte {
bytes := newRevBytes() bytes := newRevBytes()
revToBytes(rev, bytes) revToBytes(rev, bytes)
return bytes return bytes
} }
func newTestKeyBytes(rev revision, tombstone bool) []byte {
bytes := newRevBytes()
revToBytes(rev, bytes)
if tombstone {
bytes = appendMarkTombstone(bytes)
}
return bytes
}
func newFakeStore() (*store, *fakeBackend, *fakeIndex) { func newFakeStore() (*store, *fakeBackend, *fakeIndex) {
b := &fakeBackend{&fakeBatchTx{rangeRespc: make(chan rangeResp, 5)}} b := &fakeBackend{&fakeBatchTx{rangeRespc: make(chan rangeResp, 5)}}
index := &fakeIndex{ index := &fakeIndex{
@ -792,7 +795,7 @@ func (i *fakeIndex) Tombstone(key []byte, rev revision) error {
i.Recorder.Record(testutil.Action{Name: "tombstone", Params: []interface{}{key, rev}}) i.Recorder.Record(testutil.Action{Name: "tombstone", Params: []interface{}{key, rev}})
return nil return nil
} }
func (i *fakeIndex) RangeEvents(key, end []byte, rev int64) []revision { func (i *fakeIndex) RangeSince(key, end []byte, rev int64) []revision {
i.Recorder.Record(testutil.Action{Name: "rangeEvents", Params: []interface{}{key, end, rev}}) i.Recorder.Record(testutil.Action{Name: "rangeEvents", Params: []interface{}{key, end, rev}})
r := <-i.indexRangeEventsRespc r := <-i.indexRangeEventsRespc
return r.revs return r.revs

View File

@ -16,6 +16,11 @@ package storage
import "encoding/binary" import "encoding/binary"
// revBytesLen is the byte length of a normal revision.
// First 8 bytes is the revision.main in big-endian format. The 9th byte
// is a '_'. The last 8 bytes is the revision.sub in big-endian format.
const revBytesLen = 8 + 1 + 8
type revision struct { type revision struct {
main int64 main int64
sub int64 sub int64
@ -32,7 +37,7 @@ func (a revision) GreaterThan(b revision) bool {
} }
func newRevBytes() []byte { func newRevBytes() []byte {
return make([]byte, 8+1+8) return make([]byte, revBytesLen, markedRevBytesLen)
} }
func revToBytes(rev revision, bytes []byte) { func revToBytes(rev revision, bytes []byte) {

View File

@ -247,7 +247,7 @@ func (s *watchableStore) syncWatchings() {
if limit == 0 { if limit == 0 {
continue continue
} }
evs, nextRev, err := s.store.RangeEvents(w.key, end, int64(limit), w.cur) revbs, kvs, nextRev, err := s.store.RangeHistory(w.key, end, int64(limit), w.cur)
if err != nil { if err != nil {
// TODO: send error event to watching // TODO: send error event to watching
delete(s.unsynced, w) delete(s.unsynced, w)
@ -255,8 +255,19 @@ func (s *watchableStore) syncWatchings() {
} }
// push events to the channel // push events to the channel
for _, ev := range evs { for i, kv := range kvs {
w.ch <- ev var evt storagepb.Event_EventType
switch {
case isTombstone(revbs[i]):
evt = storagepb.DELETE
default:
evt = storagepb.PUT
}
w.ch <- storagepb.Event{
Type: evt,
Kv: &kv,
}
pendingEventsGauge.Inc() pendingEventsGauge.Inc()
} }
// switch to tracking future events if needed // switch to tracking future events if needed