index.go 3.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155
  1. package storage
  2. import (
  3. "log"
  4. "sync"
  5. "github.com/coreos/etcd/Godeps/_workspace/src/github.com/google/btree"
  6. )
  7. type index interface {
  8. Get(key []byte, atRev int64) (rev, created reversion, ver int64, err error)
  9. Range(key, end []byte, atRev int64) ([][]byte, []reversion)
  10. Put(key []byte, rev reversion)
  11. Tombstone(key []byte, rev reversion) error
  12. Compact(rev int64) map[reversion]struct{}
  13. Equal(b index) bool
  14. }
  15. type treeIndex struct {
  16. sync.RWMutex
  17. tree *btree.BTree
  18. }
  19. func newTreeIndex() index {
  20. return &treeIndex{
  21. tree: btree.New(32),
  22. }
  23. }
  24. func (ti *treeIndex) Put(key []byte, rev reversion) {
  25. keyi := &keyIndex{key: key}
  26. ti.Lock()
  27. defer ti.Unlock()
  28. item := ti.tree.Get(keyi)
  29. if item == nil {
  30. keyi.put(rev.main, rev.sub)
  31. ti.tree.ReplaceOrInsert(keyi)
  32. return
  33. }
  34. okeyi := item.(*keyIndex)
  35. okeyi.put(rev.main, rev.sub)
  36. }
  37. func (ti *treeIndex) Get(key []byte, atRev int64) (modified, created reversion, ver int64, err error) {
  38. keyi := &keyIndex{key: key}
  39. ti.RLock()
  40. defer ti.RUnlock()
  41. item := ti.tree.Get(keyi)
  42. if item == nil {
  43. return reversion{}, reversion{}, 0, ErrReversionNotFound
  44. }
  45. keyi = item.(*keyIndex)
  46. return keyi.get(atRev)
  47. }
  48. func (ti *treeIndex) Range(key, end []byte, atRev int64) (keys [][]byte, revs []reversion) {
  49. if end == nil {
  50. rev, _, _, err := ti.Get(key, atRev)
  51. if err != nil {
  52. return nil, nil
  53. }
  54. return [][]byte{key}, []reversion{rev}
  55. }
  56. keyi := &keyIndex{key: key}
  57. endi := &keyIndex{key: end}
  58. ti.RLock()
  59. defer ti.RUnlock()
  60. ti.tree.AscendGreaterOrEqual(keyi, func(item btree.Item) bool {
  61. if !item.Less(endi) {
  62. return false
  63. }
  64. curKeyi := item.(*keyIndex)
  65. rev, _, _, err := curKeyi.get(atRev)
  66. if err != nil {
  67. return true
  68. }
  69. revs = append(revs, rev)
  70. keys = append(keys, curKeyi.key)
  71. return true
  72. })
  73. return keys, revs
  74. }
  75. func (ti *treeIndex) Tombstone(key []byte, rev reversion) error {
  76. keyi := &keyIndex{key: key}
  77. ti.Lock()
  78. defer ti.Unlock()
  79. item := ti.tree.Get(keyi)
  80. if item == nil {
  81. return ErrReversionNotFound
  82. }
  83. ki := item.(*keyIndex)
  84. ki.tombstone(rev.main, rev.sub)
  85. return nil
  86. }
  87. func (ti *treeIndex) Compact(rev int64) map[reversion]struct{} {
  88. available := make(map[reversion]struct{})
  89. emptyki := make([]*keyIndex, 0)
  90. log.Printf("store.index: compact %d", rev)
  91. // TODO: do not hold the lock for long time?
  92. // This is probably OK. Compacting 10M keys takes O(10ms).
  93. ti.Lock()
  94. defer ti.Unlock()
  95. ti.tree.Ascend(compactIndex(rev, available, &emptyki))
  96. for _, ki := range emptyki {
  97. item := ti.tree.Delete(ki)
  98. if item == nil {
  99. log.Panic("store.index: unexpected delete failure during compaction")
  100. }
  101. }
  102. return available
  103. }
  104. func compactIndex(rev int64, available map[reversion]struct{}, emptyki *[]*keyIndex) func(i btree.Item) bool {
  105. return func(i btree.Item) bool {
  106. keyi := i.(*keyIndex)
  107. keyi.compact(rev, available)
  108. if keyi.isEmpty() {
  109. *emptyki = append(*emptyki, keyi)
  110. }
  111. return true
  112. }
  113. }
  114. func (a *treeIndex) Equal(bi index) bool {
  115. b := bi.(*treeIndex)
  116. if a.tree.Len() != b.tree.Len() {
  117. return false
  118. }
  119. equal := true
  120. a.tree.Ascend(func(item btree.Item) bool {
  121. aki := item.(*keyIndex)
  122. bki := b.tree.Get(item).(*keyIndex)
  123. if !aki.equal(bki) {
  124. equal = false
  125. return false
  126. }
  127. return true
  128. })
  129. return equal
  130. }