lease_test.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632
// Copyright 2016 The etcd Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
  14. package integration
  15. import (
  16. "reflect"
  17. "sort"
  18. "sync"
  19. "testing"
  20. "time"
  21. "github.com/coreos/etcd/clientv3"
  22. "github.com/coreos/etcd/clientv3/concurrency"
  23. "github.com/coreos/etcd/etcdserver/api/v3rpc/rpctypes"
  24. "github.com/coreos/etcd/integration"
  25. "github.com/coreos/etcd/pkg/testutil"
  26. "golang.org/x/net/context"
  27. "google.golang.org/grpc"
  28. )
  29. func TestLeaseNotFoundError(t *testing.T) {
  30. defer testutil.AfterTest(t)
  31. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  32. defer clus.Terminate(t)
  33. lapi := clientv3.NewLease(clus.RandClient())
  34. defer lapi.Close()
  35. kv := clientv3.NewKV(clus.RandClient())
  36. _, err := kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(clientv3.LeaseID(500)))
  37. if err != rpctypes.ErrLeaseNotFound {
  38. t.Fatalf("expected %v, got %v", rpctypes.ErrLeaseNotFound, err)
  39. }
  40. }
  41. func TestLeaseGrant(t *testing.T) {
  42. defer testutil.AfterTest(t)
  43. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  44. defer clus.Terminate(t)
  45. lapi := clientv3.NewLease(clus.RandClient())
  46. defer lapi.Close()
  47. kv := clientv3.NewKV(clus.RandClient())
  48. resp, err := lapi.Grant(context.Background(), 10)
  49. if err != nil {
  50. t.Errorf("failed to create lease %v", err)
  51. }
  52. _, err = kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(resp.ID))
  53. if err != nil {
  54. t.Fatalf("failed to create key with lease %v", err)
  55. }
  56. }
  57. func TestLeaseRevoke(t *testing.T) {
  58. defer testutil.AfterTest(t)
  59. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  60. defer clus.Terminate(t)
  61. lapi := clientv3.NewLease(clus.RandClient())
  62. defer lapi.Close()
  63. kv := clientv3.NewKV(clus.RandClient())
  64. resp, err := lapi.Grant(context.Background(), 10)
  65. if err != nil {
  66. t.Errorf("failed to create lease %v", err)
  67. }
  68. _, err = lapi.Revoke(context.Background(), clientv3.LeaseID(resp.ID))
  69. if err != nil {
  70. t.Errorf("failed to revoke lease %v", err)
  71. }
  72. _, err = kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(resp.ID))
  73. if err != rpctypes.ErrLeaseNotFound {
  74. t.Fatalf("err = %v, want %v", err, rpctypes.ErrLeaseNotFound)
  75. }
  76. }
  77. func TestLeaseKeepAliveOnce(t *testing.T) {
  78. defer testutil.AfterTest(t)
  79. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  80. defer clus.Terminate(t)
  81. lapi := clientv3.NewLease(clus.RandClient())
  82. defer lapi.Close()
  83. resp, err := lapi.Grant(context.Background(), 10)
  84. if err != nil {
  85. t.Errorf("failed to create lease %v", err)
  86. }
  87. _, err = lapi.KeepAliveOnce(context.Background(), resp.ID)
  88. if err != nil {
  89. t.Errorf("failed to keepalive lease %v", err)
  90. }
  91. _, err = lapi.KeepAliveOnce(context.Background(), clientv3.LeaseID(0))
  92. if err != rpctypes.ErrLeaseNotFound {
  93. t.Errorf("expected %v, got %v", rpctypes.ErrLeaseNotFound, err)
  94. }
  95. }
  96. func TestLeaseKeepAlive(t *testing.T) {
  97. defer testutil.AfterTest(t)
  98. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  99. defer clus.Terminate(t)
  100. lapi := clientv3.NewLease(clus.RandClient())
  101. resp, err := lapi.Grant(context.Background(), 10)
  102. if err != nil {
  103. t.Errorf("failed to create lease %v", err)
  104. }
  105. rc, kerr := lapi.KeepAlive(context.Background(), resp.ID)
  106. if kerr != nil {
  107. t.Errorf("failed to keepalive lease %v", kerr)
  108. }
  109. kresp, ok := <-rc
  110. if !ok {
  111. t.Errorf("chan is closed, want not closed")
  112. }
  113. if kresp.ID != resp.ID {
  114. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  115. }
  116. lapi.Close()
  117. _, ok = <-rc
  118. if ok {
  119. t.Errorf("chan is not closed, want lease Close() closes chan")
  120. }
  121. }
  122. // TODO: add a client that can connect to all the members of cluster via unix sock.
  123. // TODO: test handle more complicated failures.
  124. func TestLeaseKeepAliveHandleFailure(t *testing.T) {
  125. t.Skip("test it when we have a cluster client")
  126. defer testutil.AfterTest(t)
  127. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  128. defer clus.Terminate(t)
  129. // TODO: change this line to get a cluster client
  130. lapi := clientv3.NewLease(clus.RandClient())
  131. resp, err := lapi.Grant(context.Background(), 10)
  132. if err != nil {
  133. t.Errorf("failed to create lease %v", err)
  134. }
  135. rc, kerr := lapi.KeepAlive(context.Background(), resp.ID)
  136. if kerr != nil {
  137. t.Errorf("failed to keepalive lease %v", kerr)
  138. }
  139. kresp := <-rc
  140. if kresp.ID != resp.ID {
  141. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  142. }
  143. // restart the connected member.
  144. clus.Members[0].Stop(t)
  145. select {
  146. case <-rc:
  147. t.Fatalf("unexpected keepalive")
  148. case <-time.After(10*time.Second/3 + 1):
  149. }
  150. // recover the member.
  151. clus.Members[0].Restart(t)
  152. kresp = <-rc
  153. if kresp.ID != resp.ID {
  154. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  155. }
  156. lapi.Close()
  157. _, ok := <-rc
  158. if ok {
  159. t.Errorf("chan is not closed, want lease Close() closes chan")
  160. }
  161. }
  162. type leaseCh struct {
  163. lid clientv3.LeaseID
  164. ch <-chan *clientv3.LeaseKeepAliveResponse
  165. }
  166. // TestLeaseKeepAliveNotFound ensures a revoked lease won't stop other keep alives
  167. func TestLeaseKeepAliveNotFound(t *testing.T) {
  168. defer testutil.AfterTest(t)
  169. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  170. defer clus.Terminate(t)
  171. cli := clus.RandClient()
  172. lchs := []leaseCh{}
  173. for i := 0; i < 3; i++ {
  174. resp, rerr := cli.Grant(context.TODO(), 5)
  175. if rerr != nil {
  176. t.Fatal(rerr)
  177. }
  178. kach, kaerr := cli.KeepAlive(context.Background(), resp.ID)
  179. if kaerr != nil {
  180. t.Fatal(kaerr)
  181. }
  182. lchs = append(lchs, leaseCh{resp.ID, kach})
  183. }
  184. if _, err := cli.Revoke(context.TODO(), lchs[1].lid); err != nil {
  185. t.Fatal(err)
  186. }
  187. <-lchs[0].ch
  188. if _, ok := <-lchs[0].ch; !ok {
  189. t.Fatalf("closed keepalive on wrong lease")
  190. }
  191. timec := time.After(5 * time.Second)
  192. for range lchs[1].ch {
  193. select {
  194. case <-timec:
  195. t.Fatalf("revoke did not close keep alive")
  196. default:
  197. }
  198. }
  199. }
  200. func TestLeaseGrantErrConnClosed(t *testing.T) {
  201. defer testutil.AfterTest(t)
  202. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  203. defer clus.Terminate(t)
  204. cli := clus.Client(0)
  205. le := clientv3.NewLease(cli)
  206. donec := make(chan struct{})
  207. go func() {
  208. defer close(donec)
  209. _, err := le.Grant(context.TODO(), 5)
  210. if err != nil && err != grpc.ErrClientConnClosing {
  211. t.Fatalf("expected %v, got %v", grpc.ErrClientConnClosing, err)
  212. }
  213. }()
  214. if err := cli.Close(); err != nil {
  215. t.Fatal(err)
  216. }
  217. clus.TakeClient(0)
  218. select {
  219. case <-time.After(3 * time.Second):
  220. t.Fatal("le.Grant took too long")
  221. case <-donec:
  222. }
  223. }
  224. func TestLeaseGrantNewAfterClose(t *testing.T) {
  225. defer testutil.AfterTest(t)
  226. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  227. defer clus.Terminate(t)
  228. cli := clus.Client(0)
  229. clus.TakeClient(0)
  230. if err := cli.Close(); err != nil {
  231. t.Fatal(err)
  232. }
  233. donec := make(chan struct{})
  234. go func() {
  235. le := clientv3.NewLease(cli)
  236. if _, err := le.Grant(context.TODO(), 5); err != grpc.ErrClientConnClosing {
  237. t.Fatalf("expected %v, got %v", grpc.ErrClientConnClosing, err)
  238. }
  239. close(donec)
  240. }()
  241. select {
  242. case <-time.After(3 * time.Second):
  243. t.Fatal("le.Grant took too long")
  244. case <-donec:
  245. }
  246. }
  247. func TestLeaseRevokeNewAfterClose(t *testing.T) {
  248. defer testutil.AfterTest(t)
  249. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  250. defer clus.Terminate(t)
  251. cli := clus.Client(0)
  252. le := clientv3.NewLease(cli)
  253. resp, err := le.Grant(context.TODO(), 5)
  254. if err != nil {
  255. t.Fatal(err)
  256. }
  257. leaseID := resp.ID
  258. clus.TakeClient(0)
  259. if err := cli.Close(); err != nil {
  260. t.Fatal(err)
  261. }
  262. donec := make(chan struct{})
  263. go func() {
  264. if _, err := le.Revoke(context.TODO(), leaseID); err != grpc.ErrClientConnClosing {
  265. t.Fatalf("expected %v, got %v", grpc.ErrClientConnClosing, err)
  266. }
  267. close(donec)
  268. }()
  269. select {
  270. case <-time.After(3 * time.Second):
  271. t.Fatal("le.Revoke took too long")
  272. case <-donec:
  273. }
  274. }
  275. // TestLeaseKeepAliveCloseAfterDisconnectExpire ensures the keep alive channel is closed
  276. // following a disconnection, lease revoke, then reconnect.
  277. func TestLeaseKeepAliveCloseAfterDisconnectRevoke(t *testing.T) {
  278. defer testutil.AfterTest(t)
  279. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  280. defer clus.Terminate(t)
  281. cli := clus.Client(0)
  282. // setup lease and do a keepalive
  283. resp, err := cli.Grant(context.Background(), 10)
  284. if err != nil {
  285. t.Fatal(err)
  286. }
  287. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  288. if kerr != nil {
  289. t.Fatal(kerr)
  290. }
  291. kresp := <-rc
  292. if kresp.ID != resp.ID {
  293. t.Fatalf("ID = %x, want %x", kresp.ID, resp.ID)
  294. }
  295. // keep client disconnected
  296. clus.Members[0].Stop(t)
  297. time.Sleep(time.Second)
  298. clus.WaitLeader(t)
  299. if _, err := clus.Client(1).Revoke(context.TODO(), resp.ID); err != nil {
  300. t.Fatal(err)
  301. }
  302. clus.Members[0].Restart(t)
  303. // some keep-alives may still be buffered; drain until close
  304. timer := time.After(time.Duration(kresp.TTL) * time.Second)
  305. for kresp != nil {
  306. select {
  307. case kresp = <-rc:
  308. case <-timer:
  309. t.Fatalf("keepalive channel did not close")
  310. }
  311. }
  312. }
  313. // TestLeaseKeepAliveInitTimeout ensures the keep alive channel closes if
  314. // the initial keep alive request never gets a response.
  315. func TestLeaseKeepAliveInitTimeout(t *testing.T) {
  316. defer testutil.AfterTest(t)
  317. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  318. defer clus.Terminate(t)
  319. cli := clus.Client(0)
  320. // setup lease and do a keepalive
  321. resp, err := cli.Grant(context.Background(), 5)
  322. if err != nil {
  323. t.Fatal(err)
  324. }
  325. // keep client disconnected
  326. clus.Members[0].Stop(t)
  327. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  328. if kerr != nil {
  329. t.Fatal(kerr)
  330. }
  331. select {
  332. case ka, ok := <-rc:
  333. if ok {
  334. t.Fatalf("unexpected keepalive %v, expected closed channel", ka)
  335. }
  336. case <-time.After(10 * time.Second):
  337. t.Fatalf("keepalive channel did not close")
  338. }
  339. clus.Members[0].Restart(t)
  340. }
  341. // TestLeaseKeepAliveInitTimeout ensures the keep alive channel closes if
  342. // a keep alive request after the first never gets a response.
  343. func TestLeaseKeepAliveTTLTimeout(t *testing.T) {
  344. defer testutil.AfterTest(t)
  345. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  346. defer clus.Terminate(t)
  347. cli := clus.Client(0)
  348. // setup lease and do a keepalive
  349. resp, err := cli.Grant(context.Background(), 5)
  350. if err != nil {
  351. t.Fatal(err)
  352. }
  353. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  354. if kerr != nil {
  355. t.Fatal(kerr)
  356. }
  357. if kresp := <-rc; kresp.ID != resp.ID {
  358. t.Fatalf("ID = %x, want %x", kresp.ID, resp.ID)
  359. }
  360. // keep client disconnected
  361. clus.Members[0].Stop(t)
  362. select {
  363. case ka, ok := <-rc:
  364. if ok {
  365. t.Fatalf("unexpected keepalive %v, expected closed channel", ka)
  366. }
  367. case <-time.After(10 * time.Second):
  368. t.Fatalf("keepalive channel did not close")
  369. }
  370. clus.Members[0].Restart(t)
  371. }
  372. func TestLeaseTimeToLive(t *testing.T) {
  373. defer testutil.AfterTest(t)
  374. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  375. defer clus.Terminate(t)
  376. lapi := clientv3.NewLease(clus.RandClient())
  377. defer lapi.Close()
  378. resp, err := lapi.Grant(context.Background(), 10)
  379. if err != nil {
  380. t.Errorf("failed to create lease %v", err)
  381. }
  382. kv := clientv3.NewKV(clus.RandClient())
  383. keys := []string{"foo1", "foo2"}
  384. for i := range keys {
  385. if _, err = kv.Put(context.TODO(), keys[i], "bar", clientv3.WithLease(resp.ID)); err != nil {
  386. t.Fatal(err)
  387. }
  388. }
  389. lresp, lerr := lapi.TimeToLive(context.Background(), resp.ID, clientv3.WithAttachedKeys())
  390. if lerr != nil {
  391. t.Fatal(lerr)
  392. }
  393. if lresp.ID != resp.ID {
  394. t.Fatalf("leaseID expected %d, got %d", resp.ID, lresp.ID)
  395. }
  396. if lresp.GrantedTTL != int64(10) {
  397. t.Fatalf("GrantedTTL expected %d, got %d", 10, lresp.GrantedTTL)
  398. }
  399. if lresp.TTL == 0 || lresp.TTL > lresp.GrantedTTL {
  400. t.Fatalf("unexpected TTL %d (granted %d)", lresp.TTL, lresp.GrantedTTL)
  401. }
  402. ks := make([]string, len(lresp.Keys))
  403. for i := range lresp.Keys {
  404. ks[i] = string(lresp.Keys[i])
  405. }
  406. sort.Strings(ks)
  407. if !reflect.DeepEqual(ks, keys) {
  408. t.Fatalf("keys expected %v, got %v", keys, ks)
  409. }
  410. lresp, lerr = lapi.TimeToLive(context.Background(), resp.ID)
  411. if lerr != nil {
  412. t.Fatal(lerr)
  413. }
  414. if len(lresp.Keys) != 0 {
  415. t.Fatalf("unexpected keys %+v", lresp.Keys)
  416. }
  417. }
  418. // TestLeaseRenewLostQuorum ensures keepalives work after losing quorum
  419. // for a while.
  420. func TestLeaseRenewLostQuorum(t *testing.T) {
  421. defer testutil.AfterTest(t)
  422. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  423. defer clus.Terminate(t)
  424. cli := clus.Client(0)
  425. r, err := cli.Grant(context.TODO(), 4)
  426. if err != nil {
  427. t.Fatal(err)
  428. }
  429. kctx, kcancel := context.WithCancel(context.Background())
  430. defer kcancel()
  431. ka, err := cli.KeepAlive(kctx, r.ID)
  432. if err != nil {
  433. t.Fatal(err)
  434. }
  435. // consume first keepalive so next message sends when cluster is down
  436. <-ka
  437. // force keepalive stream message to timeout
  438. clus.Members[1].Stop(t)
  439. clus.Members[2].Stop(t)
  440. // Use TTL-1 since the client closes the keepalive channel if no
  441. // keepalive arrives before the lease deadline.
  442. // The cluster has 1 second to recover and reply to the keepalive.
  443. time.Sleep(time.Duration(r.TTL-1) * time.Second)
  444. clus.Members[1].Restart(t)
  445. clus.Members[2].Restart(t)
  446. select {
  447. case _, ok := <-ka:
  448. if !ok {
  449. t.Fatalf("keepalive closed")
  450. }
  451. case <-time.After(time.Duration(r.TTL) * time.Second):
  452. t.Fatalf("timed out waiting for keepalive")
  453. }
  454. }
  455. func TestLeaseKeepAliveLoopExit(t *testing.T) {
  456. defer testutil.AfterTest(t)
  457. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  458. defer clus.Terminate(t)
  459. ctx := context.Background()
  460. cli := clus.Client(0)
  461. resp, err := cli.Grant(ctx, 5)
  462. if err != nil {
  463. t.Fatal(err)
  464. }
  465. cli.Lease.Close()
  466. _, err = cli.KeepAlive(ctx, resp.ID)
  467. if _, ok := err.(clientv3.ErrKeepAliveHalted); !ok {
  468. t.Fatalf("expected %T, got %v(%T)", clientv3.ErrKeepAliveHalted{}, err, err)
  469. }
  470. }
  471. // TestV3LeaseFailureOverlap issues Grant and Keepalive requests to a cluster
  472. // before, during, and after quorum loss to confirm Grant/Keepalive tolerates
  473. // transient cluster failure.
  474. func TestV3LeaseFailureOverlap(t *testing.T) {
  475. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 2})
  476. defer clus.Terminate(t)
  477. numReqs := 5
  478. cli := clus.Client(0)
  479. // bring up a session, tear it down
  480. updown := func(i int) error {
  481. sess, err := concurrency.NewSession(cli)
  482. if err != nil {
  483. return err
  484. }
  485. ch := make(chan struct{})
  486. go func() {
  487. defer close(ch)
  488. sess.Close()
  489. }()
  490. select {
  491. case <-ch:
  492. case <-time.After(time.Minute / 4):
  493. t.Fatalf("timeout %d", i)
  494. }
  495. return nil
  496. }
  497. var wg sync.WaitGroup
  498. mkReqs := func(n int) {
  499. wg.Add(numReqs)
  500. for i := 0; i < numReqs; i++ {
  501. go func() {
  502. defer wg.Done()
  503. err := updown(n)
  504. if err == nil || err == rpctypes.ErrTimeoutDueToConnectionLost {
  505. return
  506. }
  507. t.Fatal(err)
  508. }()
  509. }
  510. }
  511. mkReqs(1)
  512. clus.Members[1].Stop(t)
  513. mkReqs(2)
  514. time.Sleep(time.Second)
  515. mkReqs(3)
  516. clus.Members[1].Restart(t)
  517. mkReqs(4)
  518. wg.Wait()
  519. }