batch_tx.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. // Copyright 2015 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package backend
  15. import (
  16. "bytes"
  17. "log"
  18. "sync"
  19. "sync/atomic"
  20. "time"
  21. "github.com/boltdb/bolt"
  22. )
  23. type BatchTx interface {
  24. Lock()
  25. Unlock()
  26. UnsafeCreateBucket(name []byte)
  27. UnsafePut(bucketName []byte, key []byte, value []byte)
  28. UnsafeSeqPut(bucketName []byte, key []byte, value []byte)
  29. UnsafeRange(bucketName []byte, key, endKey []byte, limit int64) (keys [][]byte, vals [][]byte)
  30. UnsafeDelete(bucketName []byte, key []byte)
  31. UnsafeForEach(bucketName []byte, visitor func(k, v []byte) error) error
  32. Commit()
  33. CommitAndStop()
  34. }
  35. type batchTx struct {
  36. sync.Mutex
  37. tx *bolt.Tx
  38. backend *backend
  39. pending int
  40. }
  41. func newBatchTx(backend *backend) *batchTx {
  42. tx := &batchTx{backend: backend}
  43. tx.Commit()
  44. return tx
  45. }
  46. func (t *batchTx) UnsafeCreateBucket(name []byte) {
  47. _, err := t.tx.CreateBucket(name)
  48. if err != nil && err != bolt.ErrBucketExists {
  49. log.Fatalf("mvcc: cannot create bucket %s (%v)", name, err)
  50. }
  51. t.pending++
  52. }
  53. // UnsafePut must be called holding the lock on the tx.
  54. func (t *batchTx) UnsafePut(bucketName []byte, key []byte, value []byte) {
  55. t.unsafePut(bucketName, key, value, false)
  56. }
  57. // UnsafeSeqPut must be called holding the lock on the tx.
  58. func (t *batchTx) UnsafeSeqPut(bucketName []byte, key []byte, value []byte) {
  59. t.unsafePut(bucketName, key, value, true)
  60. }
  61. func (t *batchTx) unsafePut(bucketName []byte, key []byte, value []byte, seq bool) {
  62. bucket := t.tx.Bucket(bucketName)
  63. if bucket == nil {
  64. log.Fatalf("mvcc: bucket %s does not exist", bucketName)
  65. }
  66. if seq {
  67. // it is useful to increase fill percent when the workloads are mostly append-only.
  68. // this can delay the page split and reduce space usage.
  69. bucket.FillPercent = 0.9
  70. }
  71. if err := bucket.Put(key, value); err != nil {
  72. log.Fatalf("mvcc: cannot put key into bucket (%v)", err)
  73. }
  74. t.pending++
  75. }
  76. // UnsafeRange must be called holding the lock on the tx.
  77. func (t *batchTx) UnsafeRange(bucketName []byte, key, endKey []byte, limit int64) (keys [][]byte, vs [][]byte) {
  78. bucket := t.tx.Bucket(bucketName)
  79. if bucket == nil {
  80. log.Fatalf("mvcc: bucket %s does not exist", bucketName)
  81. }
  82. if len(endKey) == 0 {
  83. if v := bucket.Get(key); v == nil {
  84. return keys, vs
  85. } else {
  86. return append(keys, key), append(vs, v)
  87. }
  88. }
  89. c := bucket.Cursor()
  90. for ck, cv := c.Seek(key); ck != nil && bytes.Compare(ck, endKey) < 0; ck, cv = c.Next() {
  91. vs = append(vs, cv)
  92. keys = append(keys, ck)
  93. if limit > 0 && limit == int64(len(keys)) {
  94. break
  95. }
  96. }
  97. return keys, vs
  98. }
  99. // UnsafeDelete must be called holding the lock on the tx.
  100. func (t *batchTx) UnsafeDelete(bucketName []byte, key []byte) {
  101. bucket := t.tx.Bucket(bucketName)
  102. if bucket == nil {
  103. log.Fatalf("mvcc: bucket %s does not exist", bucketName)
  104. }
  105. err := bucket.Delete(key)
  106. if err != nil {
  107. log.Fatalf("mvcc: cannot delete key from bucket (%v)", err)
  108. }
  109. t.pending++
  110. }
  111. // UnsafeForEach must be called holding the lock on the tx.
  112. func (t *batchTx) UnsafeForEach(bucketName []byte, visitor func(k, v []byte) error) error {
  113. b := t.tx.Bucket(bucketName)
  114. if b == nil {
  115. // bucket does not exist
  116. return nil
  117. }
  118. return b.ForEach(visitor)
  119. }
  120. // Commit commits a previous tx and begins a new writable one.
  121. func (t *batchTx) Commit() {
  122. t.Lock()
  123. defer t.Unlock()
  124. t.commit(false)
  125. }
  126. // CommitAndStop commits the previous tx and do not create a new one.
  127. func (t *batchTx) CommitAndStop() {
  128. t.Lock()
  129. defer t.Unlock()
  130. t.commit(true)
  131. }
  132. func (t *batchTx) Unlock() {
  133. if t.pending >= t.backend.batchLimit {
  134. t.commit(false)
  135. t.pending = 0
  136. }
  137. t.Mutex.Unlock()
  138. }
  139. func (t *batchTx) commit(stop bool) {
  140. var err error
  141. // commit the last tx
  142. if t.tx != nil {
  143. if t.pending == 0 && !stop {
  144. t.backend.mu.RLock()
  145. defer t.backend.mu.RUnlock()
  146. atomic.StoreInt64(&t.backend.size, t.tx.Size())
  147. return
  148. }
  149. start := time.Now()
  150. err = t.tx.Commit()
  151. commitDurations.Observe(time.Since(start).Seconds())
  152. atomic.AddInt64(&t.backend.commits, 1)
  153. t.pending = 0
  154. if err != nil {
  155. log.Fatalf("mvcc: cannot commit tx (%s)", err)
  156. }
  157. }
  158. if stop {
  159. return
  160. }
  161. t.backend.mu.RLock()
  162. defer t.backend.mu.RUnlock()
  163. // begin a new tx
  164. t.tx, err = t.backend.db.Begin(true)
  165. if err != nil {
  166. log.Fatalf("mvcc: cannot begin tx (%s)", err)
  167. }
  168. atomic.StoreInt64(&t.backend.size, t.tx.Size())
  169. }