v3demo_server.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530
// Copyright 2015 CoreOS, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
  14. package etcdserver
  15. import (
  16. "bytes"
  17. "fmt"
  18. "sort"
  19. "time"
  20. "github.com/coreos/etcd/Godeps/_workspace/src/github.com/gogo/protobuf/proto"
  21. "github.com/coreos/etcd/Godeps/_workspace/src/golang.org/x/net/context"
  22. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  23. "github.com/coreos/etcd/lease"
  24. dstorage "github.com/coreos/etcd/storage"
  25. "github.com/coreos/etcd/storage/storagepb"
  26. )
  27. type RaftKV interface {
  28. Range(ctx context.Context, r *pb.RangeRequest) (*pb.RangeResponse, error)
  29. Put(ctx context.Context, r *pb.PutRequest) (*pb.PutResponse, error)
  30. DeleteRange(ctx context.Context, r *pb.DeleteRangeRequest) (*pb.DeleteRangeResponse, error)
  31. Txn(ctx context.Context, r *pb.TxnRequest) (*pb.TxnResponse, error)
  32. Compact(ctx context.Context, r *pb.CompactionRequest) (*pb.CompactionResponse, error)
  33. }
  34. type Lessor interface {
  35. // LeaseCreate sends LeaseCreate request to raft and apply it after committed.
  36. LeaseCreate(ctx context.Context, r *pb.LeaseCreateRequest) (*pb.LeaseCreateResponse, error)
  37. // LeaseRevoke sends LeaseRevoke request to raft and apply it after committed.
  38. LeaseRevoke(ctx context.Context, r *pb.LeaseRevokeRequest) (*pb.LeaseRevokeResponse, error)
  39. // LeaseRenew renews the lease with given ID. The renewed TTL is returned. Or an error
  40. // is returned.
  41. LeaseRenew(id lease.LeaseID) (int64, error)
  42. }
  43. func (s *EtcdServer) Range(ctx context.Context, r *pb.RangeRequest) (*pb.RangeResponse, error) {
  44. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Range: r})
  45. if err != nil {
  46. return nil, err
  47. }
  48. return result.resp.(*pb.RangeResponse), result.err
  49. }
  50. func (s *EtcdServer) Put(ctx context.Context, r *pb.PutRequest) (*pb.PutResponse, error) {
  51. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Put: r})
  52. if err != nil {
  53. return nil, err
  54. }
  55. return result.resp.(*pb.PutResponse), result.err
  56. }
  57. func (s *EtcdServer) DeleteRange(ctx context.Context, r *pb.DeleteRangeRequest) (*pb.DeleteRangeResponse, error) {
  58. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{DeleteRange: r})
  59. if err != nil {
  60. return nil, err
  61. }
  62. return result.resp.(*pb.DeleteRangeResponse), result.err
  63. }
  64. func (s *EtcdServer) Txn(ctx context.Context, r *pb.TxnRequest) (*pb.TxnResponse, error) {
  65. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Txn: r})
  66. if err != nil {
  67. return nil, err
  68. }
  69. return result.resp.(*pb.TxnResponse), result.err
  70. }
  71. func (s *EtcdServer) Compact(ctx context.Context, r *pb.CompactionRequest) (*pb.CompactionResponse, error) {
  72. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Compaction: r})
  73. if err != nil {
  74. return nil, err
  75. }
  76. return result.resp.(*pb.CompactionResponse), result.err
  77. }
  78. func (s *EtcdServer) LeaseCreate(ctx context.Context, r *pb.LeaseCreateRequest) (*pb.LeaseCreateResponse, error) {
  79. // no id given? choose one
  80. for r.ID == int64(lease.NoLease) {
  81. // only use positive int64 id's
  82. r.ID = int64(s.reqIDGen.Next() & ((1 << 63) - 1))
  83. }
  84. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{LeaseCreate: r})
  85. if err != nil {
  86. return nil, err
  87. }
  88. resp := result.resp.(*pb.LeaseCreateResponse)
  89. if result.err != nil {
  90. resp.Error = result.err.Error()
  91. }
  92. return resp, nil
  93. }
  94. func (s *EtcdServer) LeaseRevoke(ctx context.Context, r *pb.LeaseRevokeRequest) (*pb.LeaseRevokeResponse, error) {
  95. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{LeaseRevoke: r})
  96. if err != nil {
  97. return nil, err
  98. }
  99. return result.resp.(*pb.LeaseRevokeResponse), result.err
  100. }
  101. func (s *EtcdServer) LeaseRenew(id lease.LeaseID) (int64, error) {
  102. ttl, err := s.lessor.Renew(id)
  103. if err == nil {
  104. return ttl, nil
  105. }
  106. if err != lease.ErrNotPrimary {
  107. return -1, err
  108. }
  109. // renewals don't go through raft; forward to leader manually
  110. leader := s.cluster.Member(s.Leader())
  111. for i := 0; i < 5 && leader == nil; i++ {
  112. // wait an election
  113. dur := time.Duration(s.cfg.ElectionTicks) * time.Duration(s.cfg.TickMs) * time.Millisecond
  114. select {
  115. case <-time.After(dur):
  116. leader = s.cluster.Member(s.Leader())
  117. case <-s.done:
  118. return -1, ErrStopped
  119. }
  120. }
  121. if leader == nil || len(leader.PeerURLs) == 0 {
  122. return -1, ErrNoLeader
  123. }
  124. for _, url := range leader.PeerURLs {
  125. lurl := url + "/leases"
  126. ttl, err = lease.RenewHTTP(id, lurl, s.cfg.PeerTLSInfo, s.cfg.peerDialTimeout())
  127. if err == nil {
  128. break
  129. }
  130. }
  131. return ttl, err
  132. }
  133. type applyResult struct {
  134. resp proto.Message
  135. err error
  136. }
  137. func (s *EtcdServer) processInternalRaftRequest(ctx context.Context, r pb.InternalRaftRequest) (*applyResult, error) {
  138. r.ID = s.reqIDGen.Next()
  139. data, err := r.Marshal()
  140. if err != nil {
  141. return nil, err
  142. }
  143. ch := s.w.Register(r.ID)
  144. s.r.Propose(ctx, data)
  145. select {
  146. case x := <-ch:
  147. return x.(*applyResult), nil
  148. case <-ctx.Done():
  149. s.w.Trigger(r.ID, nil) // GC wait
  150. return nil, ctx.Err()
  151. case <-s.done:
  152. return nil, ErrStopped
  153. }
  154. }
  155. // Watchable returns a watchable interface attached to the etcdserver.
  156. func (s *EtcdServer) Watchable() dstorage.Watchable {
  157. return s.getKV()
  158. }
  159. const (
  160. // noTxn is an invalid txn ID.
  161. // To apply with independent Range, Put, Delete, you can pass noTxn
  162. // to apply functions instead of a valid txn ID.
  163. noTxn = -1
  164. )
  165. func (s *EtcdServer) applyV3Request(r *pb.InternalRaftRequest) interface{} {
  166. kv := s.getKV()
  167. le := s.lessor
  168. ar := &applyResult{}
  169. switch {
  170. case r.Range != nil:
  171. ar.resp, ar.err = applyRange(noTxn, kv, r.Range)
  172. case r.Put != nil:
  173. ar.resp, ar.err = applyPut(noTxn, kv, r.Put)
  174. case r.DeleteRange != nil:
  175. ar.resp, ar.err = applyDeleteRange(noTxn, kv, r.DeleteRange)
  176. case r.Txn != nil:
  177. ar.resp, ar.err = applyTxn(kv, r.Txn)
  178. case r.Compaction != nil:
  179. ar.resp, ar.err = applyCompaction(kv, r.Compaction)
  180. case r.LeaseCreate != nil:
  181. ar.resp, ar.err = applyLeaseCreate(le, r.LeaseCreate)
  182. case r.LeaseRevoke != nil:
  183. ar.resp, ar.err = applyLeaseRevoke(le, r.LeaseRevoke)
  184. default:
  185. panic("not implemented")
  186. }
  187. return ar
  188. }
  189. func applyPut(txnID int64, kv dstorage.KV, p *pb.PutRequest) (*pb.PutResponse, error) {
  190. resp := &pb.PutResponse{}
  191. resp.Header = &pb.ResponseHeader{}
  192. var (
  193. rev int64
  194. err error
  195. )
  196. if txnID != noTxn {
  197. rev, err = kv.TxnPut(txnID, p.Key, p.Value, lease.LeaseID(p.Lease))
  198. if err != nil {
  199. return nil, err
  200. }
  201. } else {
  202. rev = kv.Put(p.Key, p.Value, lease.LeaseID(p.Lease))
  203. }
  204. resp.Header.Revision = rev
  205. return resp, nil
  206. }
  207. type kvSort struct{ kvs []storagepb.KeyValue }
  208. func (s *kvSort) Swap(i, j int) {
  209. t := s.kvs[i]
  210. s.kvs[i] = s.kvs[j]
  211. s.kvs[j] = t
  212. }
  213. func (s *kvSort) Len() int { return len(s.kvs) }
  214. type kvSortByKey struct{ *kvSort }
  215. func (s *kvSortByKey) Less(i, j int) bool {
  216. return bytes.Compare(s.kvs[i].Key, s.kvs[j].Key) < 0
  217. }
  218. type kvSortByVersion struct{ *kvSort }
  219. func (s *kvSortByVersion) Less(i, j int) bool {
  220. return (s.kvs[i].Version - s.kvs[j].Version) < 0
  221. }
  222. type kvSortByCreate struct{ *kvSort }
  223. func (s *kvSortByCreate) Less(i, j int) bool {
  224. return (s.kvs[i].CreateRevision - s.kvs[j].CreateRevision) < 0
  225. }
  226. type kvSortByMod struct{ *kvSort }
  227. func (s *kvSortByMod) Less(i, j int) bool {
  228. return (s.kvs[i].ModRevision - s.kvs[j].ModRevision) < 0
  229. }
  230. type kvSortByValue struct{ *kvSort }
  231. func (s *kvSortByValue) Less(i, j int) bool {
  232. return bytes.Compare(s.kvs[i].Value, s.kvs[j].Value) < 0
  233. }
  234. func applyRange(txnID int64, kv dstorage.KV, r *pb.RangeRequest) (*pb.RangeResponse, error) {
  235. resp := &pb.RangeResponse{}
  236. resp.Header = &pb.ResponseHeader{}
  237. var (
  238. kvs []storagepb.KeyValue
  239. rev int64
  240. err error
  241. )
  242. limit := r.Limit
  243. if r.SortOrder != pb.RangeRequest_NONE {
  244. // fetch everything; sort and truncate afterwards
  245. limit = 0
  246. }
  247. if limit > 0 {
  248. // fetch one extra for 'more' flag
  249. limit = limit + 1
  250. }
  251. if txnID != noTxn {
  252. kvs, rev, err = kv.TxnRange(txnID, r.Key, r.RangeEnd, limit, r.Revision)
  253. if err != nil {
  254. return nil, err
  255. }
  256. } else {
  257. kvs, rev, err = kv.Range(r.Key, r.RangeEnd, limit, r.Revision)
  258. if err != nil {
  259. return nil, err
  260. }
  261. }
  262. if r.SortOrder != pb.RangeRequest_NONE {
  263. var sorter sort.Interface
  264. switch {
  265. case r.SortTarget == pb.RangeRequest_KEY:
  266. sorter = &kvSortByKey{&kvSort{kvs}}
  267. case r.SortTarget == pb.RangeRequest_VERSION:
  268. sorter = &kvSortByVersion{&kvSort{kvs}}
  269. case r.SortTarget == pb.RangeRequest_CREATE:
  270. sorter = &kvSortByCreate{&kvSort{kvs}}
  271. case r.SortTarget == pb.RangeRequest_MOD:
  272. sorter = &kvSortByMod{&kvSort{kvs}}
  273. case r.SortTarget == pb.RangeRequest_VALUE:
  274. sorter = &kvSortByValue{&kvSort{kvs}}
  275. }
  276. switch {
  277. case r.SortOrder == pb.RangeRequest_ASCEND:
  278. sort.Sort(sorter)
  279. case r.SortOrder == pb.RangeRequest_DESCEND:
  280. sort.Sort(sort.Reverse(sorter))
  281. }
  282. }
  283. if r.Limit > 0 && len(kvs) > int(r.Limit) {
  284. kvs = kvs[:r.Limit]
  285. resp.More = true
  286. }
  287. resp.Header.Revision = rev
  288. for i := range kvs {
  289. resp.Kvs = append(resp.Kvs, &kvs[i])
  290. }
  291. return resp, nil
  292. }
  293. func applyDeleteRange(txnID int64, kv dstorage.KV, dr *pb.DeleteRangeRequest) (*pb.DeleteRangeResponse, error) {
  294. resp := &pb.DeleteRangeResponse{}
  295. resp.Header = &pb.ResponseHeader{}
  296. var (
  297. rev int64
  298. err error
  299. )
  300. if txnID != noTxn {
  301. _, rev, err = kv.TxnDeleteRange(txnID, dr.Key, dr.RangeEnd)
  302. if err != nil {
  303. return nil, err
  304. }
  305. } else {
  306. _, rev = kv.DeleteRange(dr.Key, dr.RangeEnd)
  307. }
  308. resp.Header.Revision = rev
  309. return resp, nil
  310. }
  311. func applyTxn(kv dstorage.KV, rt *pb.TxnRequest) (*pb.TxnResponse, error) {
  312. var revision int64
  313. txnID := kv.TxnBegin()
  314. defer func() {
  315. err := kv.TxnEnd(txnID)
  316. if err != nil {
  317. panic(fmt.Sprint("unexpected error when closing txn", txnID))
  318. }
  319. }()
  320. ok := true
  321. for _, c := range rt.Compare {
  322. if revision, ok = applyCompare(txnID, kv, c); !ok {
  323. break
  324. }
  325. }
  326. // TODO: check potential errors before actually applying anything
  327. var reqs []*pb.RequestUnion
  328. if ok {
  329. reqs = rt.Success
  330. } else {
  331. reqs = rt.Failure
  332. }
  333. resps := make([]*pb.ResponseUnion, len(reqs))
  334. for i := range reqs {
  335. resps[i] = applyUnion(txnID, kv, reqs[i])
  336. }
  337. if len(resps) != 0 {
  338. revision += 1
  339. }
  340. txnResp := &pb.TxnResponse{}
  341. txnResp.Header = &pb.ResponseHeader{}
  342. txnResp.Header.Revision = revision
  343. txnResp.Responses = resps
  344. txnResp.Succeeded = ok
  345. return txnResp, nil
  346. }
  347. func applyCompaction(kv dstorage.KV, compaction *pb.CompactionRequest) (*pb.CompactionResponse, error) {
  348. resp := &pb.CompactionResponse{}
  349. resp.Header = &pb.ResponseHeader{}
  350. err := kv.Compact(compaction.Revision)
  351. if err != nil {
  352. return nil, err
  353. }
  354. // get the current revision. which key to get is not important.
  355. _, resp.Header.Revision, _ = kv.Range([]byte("compaction"), nil, 1, 0)
  356. return resp, err
  357. }
  358. func applyUnion(txnID int64, kv dstorage.KV, union *pb.RequestUnion) *pb.ResponseUnion {
  359. switch {
  360. case union.RequestRange != nil:
  361. resp, err := applyRange(txnID, kv, union.RequestRange)
  362. if err != nil {
  363. panic("unexpected error during txn")
  364. }
  365. return &pb.ResponseUnion{ResponseRange: resp}
  366. case union.RequestPut != nil:
  367. resp, err := applyPut(txnID, kv, union.RequestPut)
  368. if err != nil {
  369. panic("unexpected error during txn")
  370. }
  371. return &pb.ResponseUnion{ResponsePut: resp}
  372. case union.RequestDeleteRange != nil:
  373. resp, err := applyDeleteRange(txnID, kv, union.RequestDeleteRange)
  374. if err != nil {
  375. panic("unexpected error during txn")
  376. }
  377. return &pb.ResponseUnion{ResponseDeleteRange: resp}
  378. default:
  379. // empty union
  380. return nil
  381. }
  382. }
  383. // applyCompare applies the compare request.
  384. // applyCompare should only be called within a txn request and an valid txn ID must
  385. // be presented. Or applyCompare panics.
  386. // It returns the revision at which the comparison happens. If the comparison
  387. // succeeds, the it returns true. Otherwise it returns false.
  388. func applyCompare(txnID int64, kv dstorage.KV, c *pb.Compare) (int64, bool) {
  389. if txnID == noTxn {
  390. panic("applyCompare called with noTxn")
  391. }
  392. ckvs, rev, err := kv.TxnRange(txnID, c.Key, nil, 1, 0)
  393. if err != nil {
  394. if err == dstorage.ErrTxnIDMismatch {
  395. panic("unexpected txn ID mismatch error")
  396. }
  397. return rev, false
  398. }
  399. var ckv storagepb.KeyValue
  400. if len(ckvs) != 0 {
  401. ckv = ckvs[0]
  402. } else {
  403. // Use the zero value of ckv normally. However...
  404. if c.Target == pb.Compare_VALUE {
  405. // Always fail if we're comparing a value on a key that doesn't exist.
  406. // We can treat non-existence as the empty set explicitly, such that
  407. // even a key with a value of length 0 bytes is still a real key
  408. // that was written that way
  409. return rev, false
  410. }
  411. }
  412. // -1 is less, 0 is equal, 1 is greater
  413. var result int
  414. switch c.Target {
  415. case pb.Compare_VALUE:
  416. result = bytes.Compare(ckv.Value, c.Value)
  417. case pb.Compare_CREATE:
  418. result = compareInt64(ckv.CreateRevision, c.CreateRevision)
  419. case pb.Compare_MOD:
  420. result = compareInt64(ckv.ModRevision, c.ModRevision)
  421. case pb.Compare_VERSION:
  422. result = compareInt64(ckv.Version, c.Version)
  423. }
  424. switch c.Result {
  425. case pb.Compare_EQUAL:
  426. if result != 0 {
  427. return rev, false
  428. }
  429. case pb.Compare_GREATER:
  430. if result != 1 {
  431. return rev, false
  432. }
  433. case pb.Compare_LESS:
  434. if result != -1 {
  435. return rev, false
  436. }
  437. }
  438. return rev, true
  439. }
  440. func applyLeaseCreate(le lease.Lessor, lc *pb.LeaseCreateRequest) (*pb.LeaseCreateResponse, error) {
  441. l, err := le.Grant(lease.LeaseID(lc.ID), lc.TTL)
  442. resp := &pb.LeaseCreateResponse{}
  443. if err == nil {
  444. resp.ID = int64(l.ID)
  445. resp.TTL = l.TTL
  446. }
  447. return resp, err
  448. }
  449. func applyLeaseRevoke(le lease.Lessor, lc *pb.LeaseRevokeRequest) (*pb.LeaseRevokeResponse, error) {
  450. err := le.Revoke(lease.LeaseID(lc.ID))
  451. return &pb.LeaseRevokeResponse{}, err
  452. }
  453. func compareInt64(a, b int64) int {
  454. switch {
  455. case a < b:
  456. return -1
  457. case a > b:
  458. return 1
  459. default:
  460. return 0
  461. }
  462. }