v3demo_server.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553
  1. // Copyright 2015 CoreOS, Inc.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package etcdserver
  15. import (
  16. "bytes"
  17. "fmt"
  18. "sort"
  19. "time"
  20. "github.com/coreos/etcd/Godeps/_workspace/src/github.com/gogo/protobuf/proto"
  21. "github.com/coreos/etcd/Godeps/_workspace/src/golang.org/x/net/context"
  22. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  23. "github.com/coreos/etcd/lease"
  24. dstorage "github.com/coreos/etcd/storage"
  25. "github.com/coreos/etcd/storage/storagepb"
  26. )
  27. type RaftKV interface {
  28. Range(ctx context.Context, r *pb.RangeRequest) (*pb.RangeResponse, error)
  29. Put(ctx context.Context, r *pb.PutRequest) (*pb.PutResponse, error)
  30. DeleteRange(ctx context.Context, r *pb.DeleteRangeRequest) (*pb.DeleteRangeResponse, error)
  31. Txn(ctx context.Context, r *pb.TxnRequest) (*pb.TxnResponse, error)
  32. Compact(ctx context.Context, r *pb.CompactionRequest) (*pb.CompactionResponse, error)
  33. }
  34. type Lessor interface {
  35. // LeaseCreate sends LeaseCreate request to raft and apply it after committed.
  36. LeaseCreate(ctx context.Context, r *pb.LeaseCreateRequest) (*pb.LeaseCreateResponse, error)
  37. // LeaseRevoke sends LeaseRevoke request to raft and apply it after committed.
  38. LeaseRevoke(ctx context.Context, r *pb.LeaseRevokeRequest) (*pb.LeaseRevokeResponse, error)
  39. // LeaseRenew renews the lease with given ID. The renewed TTL is returned. Or an error
  40. // is returned.
  41. LeaseRenew(id lease.LeaseID) (int64, error)
  42. }
  43. func (s *EtcdServer) Range(ctx context.Context, r *pb.RangeRequest) (*pb.RangeResponse, error) {
  44. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Range: r})
  45. if err != nil {
  46. return nil, err
  47. }
  48. return result.resp.(*pb.RangeResponse), result.err
  49. }
  50. func (s *EtcdServer) Put(ctx context.Context, r *pb.PutRequest) (*pb.PutResponse, error) {
  51. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Put: r})
  52. if err != nil {
  53. return nil, err
  54. }
  55. return result.resp.(*pb.PutResponse), result.err
  56. }
  57. func (s *EtcdServer) DeleteRange(ctx context.Context, r *pb.DeleteRangeRequest) (*pb.DeleteRangeResponse, error) {
  58. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{DeleteRange: r})
  59. if err != nil {
  60. return nil, err
  61. }
  62. return result.resp.(*pb.DeleteRangeResponse), result.err
  63. }
  64. func (s *EtcdServer) Txn(ctx context.Context, r *pb.TxnRequest) (*pb.TxnResponse, error) {
  65. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Txn: r})
  66. if err != nil {
  67. return nil, err
  68. }
  69. return result.resp.(*pb.TxnResponse), result.err
  70. }
  71. func (s *EtcdServer) Compact(ctx context.Context, r *pb.CompactionRequest) (*pb.CompactionResponse, error) {
  72. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{Compaction: r})
  73. if err != nil {
  74. return nil, err
  75. }
  76. return result.resp.(*pb.CompactionResponse), result.err
  77. }
  78. func (s *EtcdServer) LeaseCreate(ctx context.Context, r *pb.LeaseCreateRequest) (*pb.LeaseCreateResponse, error) {
  79. // no id given? choose one
  80. for r.ID == int64(lease.NoLease) {
  81. // only use positive int64 id's
  82. r.ID = int64(s.reqIDGen.Next() & ((1 << 63) - 1))
  83. }
  84. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{LeaseCreate: r})
  85. if err != nil {
  86. return nil, err
  87. }
  88. resp := result.resp.(*pb.LeaseCreateResponse)
  89. if result.err != nil {
  90. resp.Error = result.err.Error()
  91. }
  92. return resp, nil
  93. }
  94. func (s *EtcdServer) LeaseRevoke(ctx context.Context, r *pb.LeaseRevokeRequest) (*pb.LeaseRevokeResponse, error) {
  95. result, err := s.processInternalRaftRequest(ctx, pb.InternalRaftRequest{LeaseRevoke: r})
  96. if err != nil {
  97. return nil, err
  98. }
  99. return result.resp.(*pb.LeaseRevokeResponse), result.err
  100. }
  101. func (s *EtcdServer) LeaseRenew(id lease.LeaseID) (int64, error) {
  102. ttl, err := s.lessor.Renew(id)
  103. if err == nil {
  104. return ttl, nil
  105. }
  106. if err != lease.ErrNotPrimary {
  107. return -1, err
  108. }
  109. // renewals don't go through raft; forward to leader manually
  110. leader := s.cluster.Member(s.Leader())
  111. for i := 0; i < 5 && leader == nil; i++ {
  112. // wait an election
  113. dur := time.Duration(s.cfg.ElectionTicks) * time.Duration(s.cfg.TickMs) * time.Millisecond
  114. select {
  115. case <-time.After(dur):
  116. leader = s.cluster.Member(s.Leader())
  117. case <-s.done:
  118. return -1, ErrStopped
  119. }
  120. }
  121. if leader == nil || len(leader.PeerURLs) == 0 {
  122. return -1, ErrNoLeader
  123. }
  124. for _, url := range leader.PeerURLs {
  125. lurl := url + "/leases"
  126. ttl, err = lease.RenewHTTP(id, lurl, s.cfg.PeerTLSInfo, s.cfg.peerDialTimeout())
  127. if err == nil {
  128. break
  129. }
  130. }
  131. return ttl, err
  132. }
  133. type applyResult struct {
  134. resp proto.Message
  135. err error
  136. }
  137. func (s *EtcdServer) processInternalRaftRequest(ctx context.Context, r pb.InternalRaftRequest) (*applyResult, error) {
  138. r.ID = s.reqIDGen.Next()
  139. data, err := r.Marshal()
  140. if err != nil {
  141. return nil, err
  142. }
  143. ch := s.w.Register(r.ID)
  144. s.r.Propose(ctx, data)
  145. select {
  146. case x := <-ch:
  147. return x.(*applyResult), nil
  148. case <-ctx.Done():
  149. s.w.Trigger(r.ID, nil) // GC wait
  150. return nil, ctx.Err()
  151. case <-s.done:
  152. return nil, ErrStopped
  153. }
  154. }
  155. // Watchable returns a watchable interface attached to the etcdserver.
  156. func (s *EtcdServer) Watchable() dstorage.Watchable {
  157. return s.getKV()
  158. }
  159. const (
  160. // noTxn is an invalid txn ID.
  161. // To apply with independent Range, Put, Delete, you can pass noTxn
  162. // to apply functions instead of a valid txn ID.
  163. noTxn = -1
  164. )
  165. func (s *EtcdServer) applyV3Request(r *pb.InternalRaftRequest) interface{} {
  166. kv := s.getKV()
  167. le := s.lessor
  168. ar := &applyResult{}
  169. switch {
  170. case r.Range != nil:
  171. ar.resp, ar.err = applyRange(noTxn, kv, r.Range)
  172. case r.Put != nil:
  173. ar.resp, ar.err = applyPut(noTxn, kv, le, r.Put)
  174. case r.DeleteRange != nil:
  175. ar.resp, ar.err = applyDeleteRange(noTxn, kv, r.DeleteRange)
  176. case r.Txn != nil:
  177. ar.resp, ar.err = applyTxn(kv, le, r.Txn)
  178. case r.Compaction != nil:
  179. ar.resp, ar.err = applyCompaction(kv, r.Compaction)
  180. case r.LeaseCreate != nil:
  181. ar.resp, ar.err = applyLeaseCreate(le, r.LeaseCreate)
  182. case r.LeaseRevoke != nil:
  183. ar.resp, ar.err = applyLeaseRevoke(le, r.LeaseRevoke)
  184. default:
  185. panic("not implemented")
  186. }
  187. return ar
  188. }
  189. func applyPut(txnID int64, kv dstorage.KV, le lease.Lessor, p *pb.PutRequest) (*pb.PutResponse, error) {
  190. resp := &pb.PutResponse{}
  191. resp.Header = &pb.ResponseHeader{}
  192. var (
  193. rev int64
  194. err error
  195. )
  196. if txnID != noTxn {
  197. rev, err = kv.TxnPut(txnID, p.Key, p.Value, lease.LeaseID(p.Lease))
  198. if err != nil {
  199. return nil, err
  200. }
  201. } else {
  202. leaseID := lease.LeaseID(p.Lease)
  203. if leaseID != lease.NoLease {
  204. if l := le.Lookup(leaseID); l == nil {
  205. return nil, lease.ErrLeaseNotFound
  206. }
  207. }
  208. rev = kv.Put(p.Key, p.Value, leaseID)
  209. }
  210. resp.Header.Revision = rev
  211. return resp, nil
  212. }
  213. type kvSort struct{ kvs []storagepb.KeyValue }
  214. func (s *kvSort) Swap(i, j int) {
  215. t := s.kvs[i]
  216. s.kvs[i] = s.kvs[j]
  217. s.kvs[j] = t
  218. }
  219. func (s *kvSort) Len() int { return len(s.kvs) }
  220. type kvSortByKey struct{ *kvSort }
  221. func (s *kvSortByKey) Less(i, j int) bool {
  222. return bytes.Compare(s.kvs[i].Key, s.kvs[j].Key) < 0
  223. }
  224. type kvSortByVersion struct{ *kvSort }
  225. func (s *kvSortByVersion) Less(i, j int) bool {
  226. return (s.kvs[i].Version - s.kvs[j].Version) < 0
  227. }
  228. type kvSortByCreate struct{ *kvSort }
  229. func (s *kvSortByCreate) Less(i, j int) bool {
  230. return (s.kvs[i].CreateRevision - s.kvs[j].CreateRevision) < 0
  231. }
  232. type kvSortByMod struct{ *kvSort }
  233. func (s *kvSortByMod) Less(i, j int) bool {
  234. return (s.kvs[i].ModRevision - s.kvs[j].ModRevision) < 0
  235. }
  236. type kvSortByValue struct{ *kvSort }
  237. func (s *kvSortByValue) Less(i, j int) bool {
  238. return bytes.Compare(s.kvs[i].Value, s.kvs[j].Value) < 0
  239. }
  240. func applyRange(txnID int64, kv dstorage.KV, r *pb.RangeRequest) (*pb.RangeResponse, error) {
  241. resp := &pb.RangeResponse{}
  242. resp.Header = &pb.ResponseHeader{}
  243. var (
  244. kvs []storagepb.KeyValue
  245. rev int64
  246. err error
  247. )
  248. limit := r.Limit
  249. if r.SortOrder != pb.RangeRequest_NONE {
  250. // fetch everything; sort and truncate afterwards
  251. limit = 0
  252. }
  253. if limit > 0 {
  254. // fetch one extra for 'more' flag
  255. limit = limit + 1
  256. }
  257. if txnID != noTxn {
  258. kvs, rev, err = kv.TxnRange(txnID, r.Key, r.RangeEnd, limit, r.Revision)
  259. if err != nil {
  260. return nil, err
  261. }
  262. } else {
  263. kvs, rev, err = kv.Range(r.Key, r.RangeEnd, limit, r.Revision)
  264. if err != nil {
  265. return nil, err
  266. }
  267. }
  268. if r.SortOrder != pb.RangeRequest_NONE {
  269. var sorter sort.Interface
  270. switch {
  271. case r.SortTarget == pb.RangeRequest_KEY:
  272. sorter = &kvSortByKey{&kvSort{kvs}}
  273. case r.SortTarget == pb.RangeRequest_VERSION:
  274. sorter = &kvSortByVersion{&kvSort{kvs}}
  275. case r.SortTarget == pb.RangeRequest_CREATE:
  276. sorter = &kvSortByCreate{&kvSort{kvs}}
  277. case r.SortTarget == pb.RangeRequest_MOD:
  278. sorter = &kvSortByMod{&kvSort{kvs}}
  279. case r.SortTarget == pb.RangeRequest_VALUE:
  280. sorter = &kvSortByValue{&kvSort{kvs}}
  281. }
  282. switch {
  283. case r.SortOrder == pb.RangeRequest_ASCEND:
  284. sort.Sort(sorter)
  285. case r.SortOrder == pb.RangeRequest_DESCEND:
  286. sort.Sort(sort.Reverse(sorter))
  287. }
  288. }
  289. if r.Limit > 0 && len(kvs) > int(r.Limit) {
  290. kvs = kvs[:r.Limit]
  291. resp.More = true
  292. }
  293. resp.Header.Revision = rev
  294. for i := range kvs {
  295. resp.Kvs = append(resp.Kvs, &kvs[i])
  296. }
  297. return resp, nil
  298. }
  299. func applyDeleteRange(txnID int64, kv dstorage.KV, dr *pb.DeleteRangeRequest) (*pb.DeleteRangeResponse, error) {
  300. resp := &pb.DeleteRangeResponse{}
  301. resp.Header = &pb.ResponseHeader{}
  302. var (
  303. rev int64
  304. err error
  305. )
  306. if txnID != noTxn {
  307. _, rev, err = kv.TxnDeleteRange(txnID, dr.Key, dr.RangeEnd)
  308. if err != nil {
  309. return nil, err
  310. }
  311. } else {
  312. _, rev = kv.DeleteRange(dr.Key, dr.RangeEnd)
  313. }
  314. resp.Header.Revision = rev
  315. return resp, nil
  316. }
  317. func checkRequestLeases(le lease.Lessor, reqs []*pb.RequestUnion) error {
  318. for _, requ := range reqs {
  319. preq := requ.RequestPut
  320. if preq == nil || lease.LeaseID(preq.Lease) == lease.NoLease {
  321. continue
  322. }
  323. if l := le.Lookup(lease.LeaseID(preq.Lease)); l == nil {
  324. return lease.ErrLeaseNotFound
  325. }
  326. }
  327. return nil
  328. }
  329. func applyTxn(kv dstorage.KV, le lease.Lessor, rt *pb.TxnRequest) (*pb.TxnResponse, error) {
  330. var revision int64
  331. txnID := kv.TxnBegin()
  332. defer func() {
  333. err := kv.TxnEnd(txnID)
  334. if err != nil {
  335. panic(fmt.Sprint("unexpected error when closing txn", txnID))
  336. }
  337. }()
  338. ok := true
  339. for _, c := range rt.Compare {
  340. if revision, ok = applyCompare(txnID, kv, c); !ok {
  341. break
  342. }
  343. }
  344. // TODO: check potential errors before actually applying anything
  345. var reqs []*pb.RequestUnion
  346. if ok {
  347. reqs = rt.Success
  348. } else {
  349. reqs = rt.Failure
  350. }
  351. if err := checkRequestLeases(le, reqs); err != nil {
  352. return nil, err
  353. }
  354. resps := make([]*pb.ResponseUnion, len(reqs))
  355. for i := range reqs {
  356. resps[i] = applyUnion(txnID, kv, reqs[i])
  357. }
  358. if len(resps) != 0 {
  359. revision += 1
  360. }
  361. txnResp := &pb.TxnResponse{}
  362. txnResp.Header = &pb.ResponseHeader{}
  363. txnResp.Header.Revision = revision
  364. txnResp.Responses = resps
  365. txnResp.Succeeded = ok
  366. return txnResp, nil
  367. }
  368. func applyCompaction(kv dstorage.KV, compaction *pb.CompactionRequest) (*pb.CompactionResponse, error) {
  369. resp := &pb.CompactionResponse{}
  370. resp.Header = &pb.ResponseHeader{}
  371. err := kv.Compact(compaction.Revision)
  372. if err != nil {
  373. return nil, err
  374. }
  375. // get the current revision. which key to get is not important.
  376. _, resp.Header.Revision, _ = kv.Range([]byte("compaction"), nil, 1, 0)
  377. return resp, err
  378. }
  379. func applyUnion(txnID int64, kv dstorage.KV, union *pb.RequestUnion) *pb.ResponseUnion {
  380. switch {
  381. case union.RequestRange != nil:
  382. resp, err := applyRange(txnID, kv, union.RequestRange)
  383. if err != nil {
  384. panic("unexpected error during txn")
  385. }
  386. return &pb.ResponseUnion{ResponseRange: resp}
  387. case union.RequestPut != nil:
  388. resp, err := applyPut(txnID, kv, nil, union.RequestPut)
  389. if err != nil {
  390. panic("unexpected error during txn")
  391. }
  392. return &pb.ResponseUnion{ResponsePut: resp}
  393. case union.RequestDeleteRange != nil:
  394. resp, err := applyDeleteRange(txnID, kv, union.RequestDeleteRange)
  395. if err != nil {
  396. panic("unexpected error during txn")
  397. }
  398. return &pb.ResponseUnion{ResponseDeleteRange: resp}
  399. default:
  400. // empty union
  401. return nil
  402. }
  403. }
  404. // applyCompare applies the compare request.
  405. // applyCompare should only be called within a txn request and an valid txn ID must
  406. // be presented. Or applyCompare panics.
  407. // It returns the revision at which the comparison happens. If the comparison
  408. // succeeds, the it returns true. Otherwise it returns false.
  409. func applyCompare(txnID int64, kv dstorage.KV, c *pb.Compare) (int64, bool) {
  410. if txnID == noTxn {
  411. panic("applyCompare called with noTxn")
  412. }
  413. ckvs, rev, err := kv.TxnRange(txnID, c.Key, nil, 1, 0)
  414. if err != nil {
  415. if err == dstorage.ErrTxnIDMismatch {
  416. panic("unexpected txn ID mismatch error")
  417. }
  418. return rev, false
  419. }
  420. var ckv storagepb.KeyValue
  421. if len(ckvs) != 0 {
  422. ckv = ckvs[0]
  423. } else {
  424. // Use the zero value of ckv normally. However...
  425. if c.Target == pb.Compare_VALUE {
  426. // Always fail if we're comparing a value on a key that doesn't exist.
  427. // We can treat non-existence as the empty set explicitly, such that
  428. // even a key with a value of length 0 bytes is still a real key
  429. // that was written that way
  430. return rev, false
  431. }
  432. }
  433. // -1 is less, 0 is equal, 1 is greater
  434. var result int
  435. switch c.Target {
  436. case pb.Compare_VALUE:
  437. result = bytes.Compare(ckv.Value, c.Value)
  438. case pb.Compare_CREATE:
  439. result = compareInt64(ckv.CreateRevision, c.CreateRevision)
  440. case pb.Compare_MOD:
  441. result = compareInt64(ckv.ModRevision, c.ModRevision)
  442. case pb.Compare_VERSION:
  443. result = compareInt64(ckv.Version, c.Version)
  444. }
  445. switch c.Result {
  446. case pb.Compare_EQUAL:
  447. if result != 0 {
  448. return rev, false
  449. }
  450. case pb.Compare_GREATER:
  451. if result != 1 {
  452. return rev, false
  453. }
  454. case pb.Compare_LESS:
  455. if result != -1 {
  456. return rev, false
  457. }
  458. }
  459. return rev, true
  460. }
  461. func applyLeaseCreate(le lease.Lessor, lc *pb.LeaseCreateRequest) (*pb.LeaseCreateResponse, error) {
  462. l, err := le.Grant(lease.LeaseID(lc.ID), lc.TTL)
  463. resp := &pb.LeaseCreateResponse{}
  464. if err == nil {
  465. resp.ID = int64(l.ID)
  466. resp.TTL = l.TTL
  467. }
  468. return resp, err
  469. }
  470. func applyLeaseRevoke(le lease.Lessor, lc *pb.LeaseRevokeRequest) (*pb.LeaseRevokeResponse, error) {
  471. err := le.Revoke(lease.LeaseID(lc.ID))
  472. return &pb.LeaseRevokeResponse{}, err
  473. }
  474. func compareInt64(a, b int64) int {
  475. switch {
  476. case a < b:
  477. return -1
  478. case a > b:
  479. return 1
  480. default:
  481. return 0
  482. }
  483. }