lease_test.go 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805
  1. // Copyright 2016 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package integration
  15. import (
  16. "context"
  17. "reflect"
  18. "sort"
  19. "sync"
  20. "testing"
  21. "time"
  22. "github.com/coreos/etcd/clientv3"
  23. "github.com/coreos/etcd/clientv3/concurrency"
  24. "github.com/coreos/etcd/etcdserver/api/v3rpc/rpctypes"
  25. "github.com/coreos/etcd/integration"
  26. "github.com/coreos/etcd/pkg/testutil"
  27. "google.golang.org/grpc"
  28. )
  29. func TestLeaseNotFoundError(t *testing.T) {
  30. defer testutil.AfterTest(t)
  31. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  32. defer clus.Terminate(t)
  33. kv := clus.RandClient()
  34. _, err := kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(clientv3.LeaseID(500)))
  35. if err != rpctypes.ErrLeaseNotFound {
  36. t.Fatalf("expected %v, got %v", rpctypes.ErrLeaseNotFound, err)
  37. }
  38. }
  39. func TestLeaseGrant(t *testing.T) {
  40. defer testutil.AfterTest(t)
  41. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  42. defer clus.Terminate(t)
  43. lapi := clus.RandClient()
  44. kv := clus.RandClient()
  45. _, merr := lapi.Grant(context.Background(), clientv3.MaxLeaseTTL+1)
  46. if merr != rpctypes.ErrLeaseTTLTooLarge {
  47. t.Fatalf("err = %v, want %v", merr, rpctypes.ErrLeaseTTLTooLarge)
  48. }
  49. resp, err := lapi.Grant(context.Background(), 10)
  50. if err != nil {
  51. t.Errorf("failed to create lease %v", err)
  52. }
  53. _, err = kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(resp.ID))
  54. if err != nil {
  55. t.Fatalf("failed to create key with lease %v", err)
  56. }
  57. }
  58. func TestLeaseRevoke(t *testing.T) {
  59. defer testutil.AfterTest(t)
  60. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  61. defer clus.Terminate(t)
  62. lapi := clus.RandClient()
  63. kv := clus.RandClient()
  64. resp, err := lapi.Grant(context.Background(), 10)
  65. if err != nil {
  66. t.Errorf("failed to create lease %v", err)
  67. }
  68. _, err = lapi.Revoke(context.Background(), clientv3.LeaseID(resp.ID))
  69. if err != nil {
  70. t.Errorf("failed to revoke lease %v", err)
  71. }
  72. _, err = kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(resp.ID))
  73. if err != rpctypes.ErrLeaseNotFound {
  74. t.Fatalf("err = %v, want %v", err, rpctypes.ErrLeaseNotFound)
  75. }
  76. }
  77. func TestLeaseKeepAliveOnce(t *testing.T) {
  78. defer testutil.AfterTest(t)
  79. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  80. defer clus.Terminate(t)
  81. lapi := clus.RandClient()
  82. resp, err := lapi.Grant(context.Background(), 10)
  83. if err != nil {
  84. t.Errorf("failed to create lease %v", err)
  85. }
  86. _, err = lapi.KeepAliveOnce(context.Background(), resp.ID)
  87. if err != nil {
  88. t.Errorf("failed to keepalive lease %v", err)
  89. }
  90. _, err = lapi.KeepAliveOnce(context.Background(), clientv3.LeaseID(0))
  91. if err != rpctypes.ErrLeaseNotFound {
  92. t.Errorf("expected %v, got %v", rpctypes.ErrLeaseNotFound, err)
  93. }
  94. }
  95. func TestLeaseKeepAlive(t *testing.T) {
  96. defer testutil.AfterTest(t)
  97. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  98. defer clus.Terminate(t)
  99. lapi := clus.Client(0)
  100. clus.TakeClient(0)
  101. resp, err := lapi.Grant(context.Background(), 10)
  102. if err != nil {
  103. t.Errorf("failed to create lease %v", err)
  104. }
  105. rc, kerr := lapi.KeepAlive(context.Background(), resp.ID)
  106. if kerr != nil {
  107. t.Errorf("failed to keepalive lease %v", kerr)
  108. }
  109. kresp, ok := <-rc
  110. if !ok {
  111. t.Errorf("chan is closed, want not closed")
  112. }
  113. if kresp == nil {
  114. t.Fatalf("unexpected null response")
  115. }
  116. if kresp.ID != resp.ID {
  117. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  118. }
  119. lapi.Close()
  120. _, ok = <-rc
  121. if ok {
  122. t.Errorf("chan is not closed, want lease Close() closes chan")
  123. }
  124. }
  125. func TestLeaseKeepAliveOneSecond(t *testing.T) {
  126. defer testutil.AfterTest(t)
  127. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  128. defer clus.Terminate(t)
  129. cli := clus.Client(0)
  130. resp, err := cli.Grant(context.Background(), 1)
  131. if err != nil {
  132. t.Errorf("failed to create lease %v", err)
  133. }
  134. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  135. if kerr != nil {
  136. t.Errorf("failed to keepalive lease %v", kerr)
  137. }
  138. for i := 0; i < 3; i++ {
  139. if _, ok := <-rc; !ok {
  140. t.Errorf("chan is closed, want not closed")
  141. }
  142. }
  143. }
  144. // TODO: add a client that can connect to all the members of cluster via unix sock.
  145. // TODO: test handle more complicated failures.
  146. func TestLeaseKeepAliveHandleFailure(t *testing.T) {
  147. t.Skip("test it when we have a cluster client")
  148. defer testutil.AfterTest(t)
  149. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  150. defer clus.Terminate(t)
  151. // TODO: change this line to get a cluster client
  152. lapi := clus.RandClient()
  153. resp, err := lapi.Grant(context.Background(), 10)
  154. if err != nil {
  155. t.Errorf("failed to create lease %v", err)
  156. }
  157. rc, kerr := lapi.KeepAlive(context.Background(), resp.ID)
  158. if kerr != nil {
  159. t.Errorf("failed to keepalive lease %v", kerr)
  160. }
  161. kresp := <-rc
  162. if kresp.ID != resp.ID {
  163. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  164. }
  165. // restart the connected member.
  166. clus.Members[0].Stop(t)
  167. select {
  168. case <-rc:
  169. t.Fatalf("unexpected keepalive")
  170. case <-time.After(10*time.Second/3 + 1):
  171. }
  172. // recover the member.
  173. clus.Members[0].Restart(t)
  174. kresp = <-rc
  175. if kresp.ID != resp.ID {
  176. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  177. }
  178. lapi.Close()
  179. _, ok := <-rc
  180. if ok {
  181. t.Errorf("chan is not closed, want lease Close() closes chan")
  182. }
  183. }
  184. type leaseCh struct {
  185. lid clientv3.LeaseID
  186. ch <-chan *clientv3.LeaseKeepAliveResponse
  187. }
  188. // TestLeaseKeepAliveNotFound ensures a revoked lease won't halt other leases.
  189. func TestLeaseKeepAliveNotFound(t *testing.T) {
  190. defer testutil.AfterTest(t)
  191. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  192. defer clus.Terminate(t)
  193. cli := clus.RandClient()
  194. lchs := []leaseCh{}
  195. for i := 0; i < 3; i++ {
  196. resp, rerr := cli.Grant(context.TODO(), 5)
  197. if rerr != nil {
  198. t.Fatal(rerr)
  199. }
  200. kach, kaerr := cli.KeepAlive(context.Background(), resp.ID)
  201. if kaerr != nil {
  202. t.Fatal(kaerr)
  203. }
  204. lchs = append(lchs, leaseCh{resp.ID, kach})
  205. }
  206. if _, err := cli.Revoke(context.TODO(), lchs[1].lid); err != nil {
  207. t.Fatal(err)
  208. }
  209. <-lchs[0].ch
  210. if _, ok := <-lchs[0].ch; !ok {
  211. t.Fatalf("closed keepalive on wrong lease")
  212. }
  213. timec := time.After(5 * time.Second)
  214. for range lchs[1].ch {
  215. select {
  216. case <-timec:
  217. t.Fatalf("revoke did not close keep alive")
  218. default:
  219. }
  220. }
  221. }
  222. func TestLeaseGrantErrConnClosed(t *testing.T) {
  223. defer testutil.AfterTest(t)
  224. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  225. defer clus.Terminate(t)
  226. cli := clus.Client(0)
  227. clus.TakeClient(0)
  228. donec := make(chan struct{})
  229. go func() {
  230. defer close(donec)
  231. _, err := cli.Grant(context.TODO(), 5)
  232. if !clientv3.IsConnCanceled(err) {
  233. // grpc.ErrClientConnClosing if grpc-go balancer calls 'Get' after client.Close.
  234. // context.Canceled if grpc-go balancer calls 'Get' with an inflight client.Close.
  235. t.Fatalf("expected %v, %v or server unavailable, got %v", err != context.Canceled, grpc.ErrClientConnClosing, err)
  236. }
  237. }()
  238. if err := cli.Close(); err != nil {
  239. t.Fatal(err)
  240. }
  241. select {
  242. case <-time.After(integration.RequestWaitTimeout):
  243. t.Fatal("le.Grant took too long")
  244. case <-donec:
  245. }
  246. }
  247. func TestLeaseGrantNewAfterClose(t *testing.T) {
  248. defer testutil.AfterTest(t)
  249. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  250. defer clus.Terminate(t)
  251. cli := clus.Client(0)
  252. clus.TakeClient(0)
  253. if err := cli.Close(); err != nil {
  254. t.Fatal(err)
  255. }
  256. donec := make(chan struct{})
  257. go func() {
  258. _, err := cli.Grant(context.TODO(), 5)
  259. if !clientv3.IsConnCanceled(err) {
  260. t.Fatalf("expected %v, %v or server unavailable, got %v", err != context.Canceled, grpc.ErrClientConnClosing, err)
  261. }
  262. close(donec)
  263. }()
  264. select {
  265. case <-time.After(integration.RequestWaitTimeout):
  266. t.Fatal("le.Grant took too long")
  267. case <-donec:
  268. }
  269. }
  270. func TestLeaseRevokeNewAfterClose(t *testing.T) {
  271. defer testutil.AfterTest(t)
  272. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  273. defer clus.Terminate(t)
  274. cli := clus.Client(0)
  275. resp, err := cli.Grant(context.TODO(), 5)
  276. if err != nil {
  277. t.Fatal(err)
  278. }
  279. leaseID := resp.ID
  280. clus.TakeClient(0)
  281. if err := cli.Close(); err != nil {
  282. t.Fatal(err)
  283. }
  284. donec := make(chan struct{})
  285. go func() {
  286. _, err := cli.Revoke(context.TODO(), leaseID)
  287. if !clientv3.IsConnCanceled(err) {
  288. t.Fatalf("expected %v, %v or server unavailable, got %v", err != context.Canceled, grpc.ErrClientConnClosing, err)
  289. }
  290. close(donec)
  291. }()
  292. select {
  293. case <-time.After(integration.RequestWaitTimeout):
  294. t.Fatal("le.Revoke took too long")
  295. case <-donec:
  296. }
  297. }
  298. // TestLeaseKeepAliveCloseAfterDisconnectRevoke ensures the keep alive channel is closed
  299. // following a disconnection, lease revoke, then reconnect.
  300. func TestLeaseKeepAliveCloseAfterDisconnectRevoke(t *testing.T) {
  301. defer testutil.AfterTest(t)
  302. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  303. defer clus.Terminate(t)
  304. cli := clus.Client(0)
  305. // setup lease and do a keepalive
  306. resp, err := cli.Grant(context.Background(), 10)
  307. if err != nil {
  308. t.Fatal(err)
  309. }
  310. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  311. if kerr != nil {
  312. t.Fatal(kerr)
  313. }
  314. kresp := <-rc
  315. if kresp.ID != resp.ID {
  316. t.Fatalf("ID = %x, want %x", kresp.ID, resp.ID)
  317. }
  318. // keep client disconnected
  319. clus.Members[0].Stop(t)
  320. time.Sleep(time.Second)
  321. clus.WaitLeader(t)
  322. if _, err := clus.Client(1).Revoke(context.TODO(), resp.ID); err != nil {
  323. t.Fatal(err)
  324. }
  325. clus.Members[0].Restart(t)
  326. // some responses may still be buffered; drain until close
  327. timer := time.After(time.Duration(kresp.TTL) * time.Second)
  328. for kresp != nil {
  329. select {
  330. case kresp = <-rc:
  331. case <-timer:
  332. t.Fatalf("keepalive channel did not close")
  333. }
  334. }
  335. }
  336. // TestLeaseKeepAliveInitTimeout ensures the keep alive channel closes if
  337. // the initial keep alive request never gets a response.
  338. func TestLeaseKeepAliveInitTimeout(t *testing.T) {
  339. defer testutil.AfterTest(t)
  340. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  341. defer clus.Terminate(t)
  342. cli := clus.Client(0)
  343. // setup lease and do a keepalive
  344. resp, err := cli.Grant(context.Background(), 5)
  345. if err != nil {
  346. t.Fatal(err)
  347. }
  348. // keep client disconnected
  349. clus.Members[0].Stop(t)
  350. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  351. if kerr != nil {
  352. t.Fatal(kerr)
  353. }
  354. select {
  355. case ka, ok := <-rc:
  356. if ok {
  357. t.Fatalf("unexpected keepalive %v, expected closed channel", ka)
  358. }
  359. case <-time.After(10 * time.Second):
  360. t.Fatalf("keepalive channel did not close")
  361. }
  362. clus.Members[0].Restart(t)
  363. }
  364. // TestLeaseKeepAliveInitTimeout ensures the keep alive channel closes if
  365. // a keep alive request after the first never gets a response.
  366. func TestLeaseKeepAliveTTLTimeout(t *testing.T) {
  367. defer testutil.AfterTest(t)
  368. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  369. defer clus.Terminate(t)
  370. cli := clus.Client(0)
  371. // setup lease and do a keepalive
  372. resp, err := cli.Grant(context.Background(), 5)
  373. if err != nil {
  374. t.Fatal(err)
  375. }
  376. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  377. if kerr != nil {
  378. t.Fatal(kerr)
  379. }
  380. if kresp := <-rc; kresp.ID != resp.ID {
  381. t.Fatalf("ID = %x, want %x", kresp.ID, resp.ID)
  382. }
  383. // keep client disconnected
  384. clus.Members[0].Stop(t)
  385. select {
  386. case ka, ok := <-rc:
  387. if ok {
  388. t.Fatalf("unexpected keepalive %v, expected closed channel", ka)
  389. }
  390. case <-time.After(10 * time.Second):
  391. t.Fatalf("keepalive channel did not close")
  392. }
  393. clus.Members[0].Restart(t)
  394. }
  395. func TestLeaseTimeToLive(t *testing.T) {
  396. defer testutil.AfterTest(t)
  397. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  398. defer clus.Terminate(t)
  399. c := clus.RandClient()
  400. lapi := c
  401. resp, err := lapi.Grant(context.Background(), 10)
  402. if err != nil {
  403. t.Errorf("failed to create lease %v", err)
  404. }
  405. kv := clus.RandClient()
  406. keys := []string{"foo1", "foo2"}
  407. for i := range keys {
  408. if _, err = kv.Put(context.TODO(), keys[i], "bar", clientv3.WithLease(resp.ID)); err != nil {
  409. t.Fatal(err)
  410. }
  411. }
  412. // linearized read to ensure Puts propagated to server backing lapi
  413. if _, err := c.Get(context.TODO(), "abc"); err != nil {
  414. t.Fatal(err)
  415. }
  416. lresp, lerr := lapi.TimeToLive(context.Background(), resp.ID, clientv3.WithAttachedKeys())
  417. if lerr != nil {
  418. t.Fatal(lerr)
  419. }
  420. if lresp.ID != resp.ID {
  421. t.Fatalf("leaseID expected %d, got %d", resp.ID, lresp.ID)
  422. }
  423. if lresp.GrantedTTL != int64(10) {
  424. t.Fatalf("GrantedTTL expected %d, got %d", 10, lresp.GrantedTTL)
  425. }
  426. if lresp.TTL == 0 || lresp.TTL > lresp.GrantedTTL {
  427. t.Fatalf("unexpected TTL %d (granted %d)", lresp.TTL, lresp.GrantedTTL)
  428. }
  429. ks := make([]string, len(lresp.Keys))
  430. for i := range lresp.Keys {
  431. ks[i] = string(lresp.Keys[i])
  432. }
  433. sort.Strings(ks)
  434. if !reflect.DeepEqual(ks, keys) {
  435. t.Fatalf("keys expected %v, got %v", keys, ks)
  436. }
  437. lresp, lerr = lapi.TimeToLive(context.Background(), resp.ID)
  438. if lerr != nil {
  439. t.Fatal(lerr)
  440. }
  441. if len(lresp.Keys) != 0 {
  442. t.Fatalf("unexpected keys %+v", lresp.Keys)
  443. }
  444. }
  445. func TestLeaseTimeToLiveLeaseNotFound(t *testing.T) {
  446. defer testutil.AfterTest(t)
  447. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  448. defer clus.Terminate(t)
  449. cli := clus.RandClient()
  450. resp, err := cli.Grant(context.Background(), 10)
  451. if err != nil {
  452. t.Errorf("failed to create lease %v", err)
  453. }
  454. _, err = cli.Revoke(context.Background(), resp.ID)
  455. if err != nil {
  456. t.Errorf("failed to Revoke lease %v", err)
  457. }
  458. lresp, err := cli.TimeToLive(context.Background(), resp.ID)
  459. // TimeToLive() should return a response with TTL=-1.
  460. if err != nil {
  461. t.Fatalf("expected err to be nil")
  462. }
  463. if lresp == nil {
  464. t.Fatalf("expected lresp not to be nil")
  465. }
  466. if lresp.ResponseHeader == nil {
  467. t.Fatalf("expected ResponseHeader not to be nil")
  468. }
  469. if lresp.ID != resp.ID {
  470. t.Fatalf("expected Lease ID %v, but got %v", resp.ID, lresp.ID)
  471. }
  472. if lresp.TTL != -1 {
  473. t.Fatalf("expected TTL %v, but got %v", lresp.TTL, lresp.TTL)
  474. }
  475. }
  476. func TestLeaseLeases(t *testing.T) {
  477. defer testutil.AfterTest(t)
  478. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  479. defer clus.Terminate(t)
  480. cli := clus.RandClient()
  481. ids := []clientv3.LeaseID{}
  482. for i := 0; i < 5; i++ {
  483. resp, err := cli.Grant(context.Background(), 10)
  484. if err != nil {
  485. t.Errorf("failed to create lease %v", err)
  486. }
  487. ids = append(ids, resp.ID)
  488. }
  489. resp, err := cli.Leases(context.Background())
  490. if err != nil {
  491. t.Fatal(err)
  492. }
  493. if len(resp.Leases) != 5 {
  494. t.Fatalf("len(resp.Leases) expected 5, got %d", len(resp.Leases))
  495. }
  496. for i := range resp.Leases {
  497. if ids[i] != resp.Leases[i].ID {
  498. t.Fatalf("#%d: lease ID expected %d, got %d", i, ids[i], resp.Leases[i].ID)
  499. }
  500. }
  501. }
  502. // TestLeaseRenewLostQuorum ensures keepalives work after losing quorum
  503. // for a while.
  504. func TestLeaseRenewLostQuorum(t *testing.T) {
  505. defer testutil.AfterTest(t)
  506. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  507. defer clus.Terminate(t)
  508. cli := clus.Client(0)
  509. r, err := cli.Grant(context.TODO(), 4)
  510. if err != nil {
  511. t.Fatal(err)
  512. }
  513. kctx, kcancel := context.WithCancel(context.Background())
  514. defer kcancel()
  515. ka, err := cli.KeepAlive(kctx, r.ID)
  516. if err != nil {
  517. t.Fatal(err)
  518. }
  519. // consume first keepalive so next message sends when cluster is down
  520. <-ka
  521. lastKa := time.Now()
  522. // force keepalive stream message to timeout
  523. clus.Members[1].Stop(t)
  524. clus.Members[2].Stop(t)
  525. // Use TTL-2 since the client closes the keepalive channel if no
  526. // keepalive arrives before the lease deadline; the client will
  527. // try to resend a keepalive after TTL/3 seconds, so for a TTL of 4,
  528. // sleeping for 2s should be sufficient time for issuing a retry.
  529. // The cluster has two seconds to recover and reply to the keepalive.
  530. time.Sleep(time.Duration(r.TTL-2) * time.Second)
  531. clus.Members[1].Restart(t)
  532. clus.Members[2].Restart(t)
  533. if time.Since(lastKa) > time.Duration(r.TTL)*time.Second {
  534. t.Skip("waited too long for server stop and restart")
  535. }
  536. select {
  537. case _, ok := <-ka:
  538. if !ok {
  539. t.Fatalf("keepalive closed")
  540. }
  541. case <-time.After(time.Duration(r.TTL) * time.Second):
  542. t.Fatalf("timed out waiting for keepalive")
  543. }
  544. }
  545. func TestLeaseKeepAliveLoopExit(t *testing.T) {
  546. defer testutil.AfterTest(t)
  547. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  548. defer clus.Terminate(t)
  549. ctx := context.Background()
  550. cli := clus.Client(0)
  551. clus.TakeClient(0)
  552. resp, err := cli.Grant(ctx, 5)
  553. if err != nil {
  554. t.Fatal(err)
  555. }
  556. cli.Close()
  557. _, err = cli.KeepAlive(ctx, resp.ID)
  558. if _, ok := err.(clientv3.ErrKeepAliveHalted); !ok {
  559. t.Fatalf("expected %T, got %v(%T)", clientv3.ErrKeepAliveHalted{}, err, err)
  560. }
  561. }
  562. // TestV3LeaseFailureOverlap issues Grant and KeepAlive requests to a cluster
  563. // before, during, and after quorum loss to confirm Grant/KeepAlive tolerates
  564. // transient cluster failure.
  565. func TestV3LeaseFailureOverlap(t *testing.T) {
  566. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 2})
  567. defer clus.Terminate(t)
  568. numReqs := 5
  569. cli := clus.Client(0)
  570. // bring up a session, tear it down
  571. updown := func(i int) error {
  572. sess, err := concurrency.NewSession(cli)
  573. if err != nil {
  574. return err
  575. }
  576. ch := make(chan struct{})
  577. go func() {
  578. defer close(ch)
  579. sess.Close()
  580. }()
  581. select {
  582. case <-ch:
  583. case <-time.After(time.Minute / 4):
  584. t.Fatalf("timeout %d", i)
  585. }
  586. return nil
  587. }
  588. var wg sync.WaitGroup
  589. mkReqs := func(n int) {
  590. wg.Add(numReqs)
  591. for i := 0; i < numReqs; i++ {
  592. go func() {
  593. defer wg.Done()
  594. err := updown(n)
  595. if err == nil || err == rpctypes.ErrTimeoutDueToConnectionLost {
  596. return
  597. }
  598. t.Fatal(err)
  599. }()
  600. }
  601. }
  602. mkReqs(1)
  603. clus.Members[1].Stop(t)
  604. mkReqs(2)
  605. time.Sleep(time.Second)
  606. mkReqs(3)
  607. clus.Members[1].Restart(t)
  608. mkReqs(4)
  609. wg.Wait()
  610. }
  611. // TestLeaseWithRequireLeader checks keep-alive channel close when no leader.
  612. func TestLeaseWithRequireLeader(t *testing.T) {
  613. defer testutil.AfterTest(t)
  614. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 2})
  615. defer clus.Terminate(t)
  616. c := clus.Client(0)
  617. lid1, err1 := c.Grant(context.TODO(), 60)
  618. if err1 != nil {
  619. t.Fatal(err1)
  620. }
  621. lid2, err2 := c.Grant(context.TODO(), 60)
  622. if err2 != nil {
  623. t.Fatal(err2)
  624. }
  625. // kaReqLeader close if the leader is lost
  626. kaReqLeader, kerr1 := c.KeepAlive(clientv3.WithRequireLeader(context.TODO()), lid1.ID)
  627. if kerr1 != nil {
  628. t.Fatal(kerr1)
  629. }
  630. // kaWait will wait even if the leader is lost
  631. kaWait, kerr2 := c.KeepAlive(context.TODO(), lid2.ID)
  632. if kerr2 != nil {
  633. t.Fatal(kerr2)
  634. }
  635. select {
  636. case <-kaReqLeader:
  637. case <-time.After(5 * time.Second):
  638. t.Fatalf("require leader first keep-alive timed out")
  639. }
  640. select {
  641. case <-kaWait:
  642. case <-time.After(5 * time.Second):
  643. t.Fatalf("leader not required first keep-alive timed out")
  644. }
  645. clus.Members[1].Stop(t)
  646. // kaReqLeader may issue multiple requests while waiting for the first
  647. // response from proxy server; drain any stray keepalive responses
  648. time.Sleep(100 * time.Millisecond)
  649. for len(kaReqLeader) > 0 {
  650. <-kaReqLeader
  651. }
  652. select {
  653. case resp, ok := <-kaReqLeader:
  654. if ok {
  655. t.Fatalf("expected closed require leader, got response %+v", resp)
  656. }
  657. case <-time.After(5 * time.Second):
  658. t.Fatal("keepalive with require leader took too long to close")
  659. }
  660. select {
  661. case _, ok := <-kaWait:
  662. if !ok {
  663. t.Fatalf("got closed channel with no require leader, expected non-closed")
  664. }
  665. case <-time.After(10 * time.Millisecond):
  666. // wait some to detect any closes happening soon after kaReqLeader closing
  667. }
  668. }