// lease_test.go
// Copyright 2016 The etcd Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
  14. package integration
  15. import (
  16. "reflect"
  17. "sort"
  18. "sync"
  19. "testing"
  20. "time"
  21. "github.com/coreos/etcd/clientv3"
  22. "github.com/coreos/etcd/clientv3/concurrency"
  23. "github.com/coreos/etcd/etcdserver/api/v3rpc/rpctypes"
  24. "github.com/coreos/etcd/integration"
  25. "github.com/coreos/etcd/pkg/testutil"
  26. "golang.org/x/net/context"
  27. "google.golang.org/grpc"
  28. )
  29. func TestLeaseNotFoundError(t *testing.T) {
  30. defer testutil.AfterTest(t)
  31. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  32. defer clus.Terminate(t)
  33. kv := clus.RandClient()
  34. _, err := kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(clientv3.LeaseID(500)))
  35. if err != rpctypes.ErrLeaseNotFound {
  36. t.Fatalf("expected %v, got %v", rpctypes.ErrLeaseNotFound, err)
  37. }
  38. }
  39. func TestLeaseGrant(t *testing.T) {
  40. defer testutil.AfterTest(t)
  41. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  42. defer clus.Terminate(t)
  43. lapi := clus.RandClient()
  44. kv := clus.RandClient()
  45. _, merr := lapi.Grant(context.Background(), clientv3.MaxLeaseTTL+1)
  46. if merr != rpctypes.ErrLeaseTTLTooLarge {
  47. t.Fatalf("err = %v, want %v", merr, rpctypes.ErrLeaseTTLTooLarge)
  48. }
  49. resp, err := lapi.Grant(context.Background(), 10)
  50. if err != nil {
  51. t.Errorf("failed to create lease %v", err)
  52. }
  53. _, err = kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(resp.ID))
  54. if err != nil {
  55. t.Fatalf("failed to create key with lease %v", err)
  56. }
  57. }
  58. func TestLeaseRevoke(t *testing.T) {
  59. defer testutil.AfterTest(t)
  60. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  61. defer clus.Terminate(t)
  62. lapi := clus.RandClient()
  63. kv := clus.RandClient()
  64. resp, err := lapi.Grant(context.Background(), 10)
  65. if err != nil {
  66. t.Errorf("failed to create lease %v", err)
  67. }
  68. _, err = lapi.Revoke(context.Background(), clientv3.LeaseID(resp.ID))
  69. if err != nil {
  70. t.Errorf("failed to revoke lease %v", err)
  71. }
  72. _, err = kv.Put(context.TODO(), "foo", "bar", clientv3.WithLease(resp.ID))
  73. if err != rpctypes.ErrLeaseNotFound {
  74. t.Fatalf("err = %v, want %v", err, rpctypes.ErrLeaseNotFound)
  75. }
  76. }
  77. func TestLeaseKeepAliveOnce(t *testing.T) {
  78. defer testutil.AfterTest(t)
  79. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  80. defer clus.Terminate(t)
  81. lapi := clus.RandClient()
  82. resp, err := lapi.Grant(context.Background(), 10)
  83. if err != nil {
  84. t.Errorf("failed to create lease %v", err)
  85. }
  86. _, err = lapi.KeepAliveOnce(context.Background(), resp.ID)
  87. if err != nil {
  88. t.Errorf("failed to keepalive lease %v", err)
  89. }
  90. _, err = lapi.KeepAliveOnce(context.Background(), clientv3.LeaseID(0))
  91. if err != rpctypes.ErrLeaseNotFound {
  92. t.Errorf("expected %v, got %v", rpctypes.ErrLeaseNotFound, err)
  93. }
  94. }
  95. func TestLeaseKeepAlive(t *testing.T) {
  96. defer testutil.AfterTest(t)
  97. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  98. defer clus.Terminate(t)
  99. lapi := clus.Client(0)
  100. clus.TakeClient(0)
  101. resp, err := lapi.Grant(context.Background(), 10)
  102. if err != nil {
  103. t.Errorf("failed to create lease %v", err)
  104. }
  105. rc, kerr := lapi.KeepAlive(context.Background(), resp.ID)
  106. if kerr != nil {
  107. t.Errorf("failed to keepalive lease %v", kerr)
  108. }
  109. kresp, ok := <-rc
  110. if !ok {
  111. t.Errorf("chan is closed, want not closed")
  112. }
  113. if kresp.ID != resp.ID {
  114. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  115. }
  116. lapi.Close()
  117. _, ok = <-rc
  118. if ok {
  119. t.Errorf("chan is not closed, want lease Close() closes chan")
  120. }
  121. }
  122. func TestLeaseKeepAliveOneSecond(t *testing.T) {
  123. defer testutil.AfterTest(t)
  124. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  125. defer clus.Terminate(t)
  126. cli := clus.Client(0)
  127. resp, err := cli.Grant(context.Background(), 1)
  128. if err != nil {
  129. t.Errorf("failed to create lease %v", err)
  130. }
  131. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  132. if kerr != nil {
  133. t.Errorf("failed to keepalive lease %v", kerr)
  134. }
  135. for i := 0; i < 3; i++ {
  136. if _, ok := <-rc; !ok {
  137. t.Errorf("chan is closed, want not closed")
  138. }
  139. }
  140. }
  141. // TODO: add a client that can connect to all the members of cluster via unix sock.
  142. // TODO: test handle more complicated failures.
  143. func TestLeaseKeepAliveHandleFailure(t *testing.T) {
  144. t.Skip("test it when we have a cluster client")
  145. defer testutil.AfterTest(t)
  146. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  147. defer clus.Terminate(t)
  148. // TODO: change this line to get a cluster client
  149. lapi := clus.RandClient()
  150. resp, err := lapi.Grant(context.Background(), 10)
  151. if err != nil {
  152. t.Errorf("failed to create lease %v", err)
  153. }
  154. rc, kerr := lapi.KeepAlive(context.Background(), resp.ID)
  155. if kerr != nil {
  156. t.Errorf("failed to keepalive lease %v", kerr)
  157. }
  158. kresp := <-rc
  159. if kresp.ID != resp.ID {
  160. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  161. }
  162. // restart the connected member.
  163. clus.Members[0].Stop(t)
  164. select {
  165. case <-rc:
  166. t.Fatalf("unexpected keepalive")
  167. case <-time.After(10*time.Second/3 + 1):
  168. }
  169. // recover the member.
  170. clus.Members[0].Restart(t)
  171. kresp = <-rc
  172. if kresp.ID != resp.ID {
  173. t.Errorf("ID = %x, want %x", kresp.ID, resp.ID)
  174. }
  175. lapi.Close()
  176. _, ok := <-rc
  177. if ok {
  178. t.Errorf("chan is not closed, want lease Close() closes chan")
  179. }
  180. }
  181. type leaseCh struct {
  182. lid clientv3.LeaseID
  183. ch <-chan *clientv3.LeaseKeepAliveResponse
  184. }
  185. // TestLeaseKeepAliveNotFound ensures a revoked lease won't halt other leases.
  186. func TestLeaseKeepAliveNotFound(t *testing.T) {
  187. defer testutil.AfterTest(t)
  188. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  189. defer clus.Terminate(t)
  190. cli := clus.RandClient()
  191. lchs := []leaseCh{}
  192. for i := 0; i < 3; i++ {
  193. resp, rerr := cli.Grant(context.TODO(), 5)
  194. if rerr != nil {
  195. t.Fatal(rerr)
  196. }
  197. kach, kaerr := cli.KeepAlive(context.Background(), resp.ID)
  198. if kaerr != nil {
  199. t.Fatal(kaerr)
  200. }
  201. lchs = append(lchs, leaseCh{resp.ID, kach})
  202. }
  203. if _, err := cli.Revoke(context.TODO(), lchs[1].lid); err != nil {
  204. t.Fatal(err)
  205. }
  206. <-lchs[0].ch
  207. if _, ok := <-lchs[0].ch; !ok {
  208. t.Fatalf("closed keepalive on wrong lease")
  209. }
  210. timec := time.After(5 * time.Second)
  211. for range lchs[1].ch {
  212. select {
  213. case <-timec:
  214. t.Fatalf("revoke did not close keep alive")
  215. default:
  216. }
  217. }
  218. }
  219. func TestLeaseGrantErrConnClosed(t *testing.T) {
  220. defer testutil.AfterTest(t)
  221. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  222. defer clus.Terminate(t)
  223. cli := clus.Client(0)
  224. clus.TakeClient(0)
  225. donec := make(chan struct{})
  226. go func() {
  227. defer close(donec)
  228. _, err := cli.Grant(context.TODO(), 5)
  229. if err != nil && err != grpc.ErrClientConnClosing && err != context.Canceled {
  230. // grpc.ErrClientConnClosing if grpc-go balancer calls 'Get' after client.Close.
  231. // context.Canceled if grpc-go balancer calls 'Get' with an inflight client.Close.
  232. t.Fatalf("expected %v or %v, got %v", grpc.ErrClientConnClosing, context.Canceled, err)
  233. }
  234. }()
  235. if err := cli.Close(); err != nil {
  236. t.Fatal(err)
  237. }
  238. select {
  239. case <-time.After(3 * time.Second):
  240. t.Fatal("le.Grant took too long")
  241. case <-donec:
  242. }
  243. }
  244. func TestLeaseGrantNewAfterClose(t *testing.T) {
  245. defer testutil.AfterTest(t)
  246. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  247. defer clus.Terminate(t)
  248. cli := clus.Client(0)
  249. clus.TakeClient(0)
  250. if err := cli.Close(); err != nil {
  251. t.Fatal(err)
  252. }
  253. donec := make(chan struct{})
  254. go func() {
  255. if _, err := cli.Grant(context.TODO(), 5); err != context.Canceled && err != grpc.ErrClientConnClosing {
  256. t.Fatalf("expected %v or %v, got %v", err != context.Canceled, grpc.ErrClientConnClosing, err)
  257. }
  258. close(donec)
  259. }()
  260. select {
  261. case <-time.After(3 * time.Second):
  262. t.Fatal("le.Grant took too long")
  263. case <-donec:
  264. }
  265. }
  266. func TestLeaseRevokeNewAfterClose(t *testing.T) {
  267. defer testutil.AfterTest(t)
  268. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  269. defer clus.Terminate(t)
  270. cli := clus.Client(0)
  271. resp, err := cli.Grant(context.TODO(), 5)
  272. if err != nil {
  273. t.Fatal(err)
  274. }
  275. leaseID := resp.ID
  276. clus.TakeClient(0)
  277. if err := cli.Close(); err != nil {
  278. t.Fatal(err)
  279. }
  280. donec := make(chan struct{})
  281. go func() {
  282. if _, err := cli.Revoke(context.TODO(), leaseID); err != context.Canceled && err != grpc.ErrClientConnClosing {
  283. t.Fatalf("expected %v or %v, got %v", err != context.Canceled, grpc.ErrClientConnClosing, err)
  284. }
  285. close(donec)
  286. }()
  287. select {
  288. case <-time.After(3 * time.Second):
  289. t.Fatal("le.Revoke took too long")
  290. case <-donec:
  291. }
  292. }
  293. // TestLeaseKeepAliveCloseAfterDisconnectRevoke ensures the keep alive channel is closed
  294. // following a disconnection, lease revoke, then reconnect.
  295. func TestLeaseKeepAliveCloseAfterDisconnectRevoke(t *testing.T) {
  296. defer testutil.AfterTest(t)
  297. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  298. defer clus.Terminate(t)
  299. cli := clus.Client(0)
  300. // setup lease and do a keepalive
  301. resp, err := cli.Grant(context.Background(), 10)
  302. if err != nil {
  303. t.Fatal(err)
  304. }
  305. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  306. if kerr != nil {
  307. t.Fatal(kerr)
  308. }
  309. kresp := <-rc
  310. if kresp.ID != resp.ID {
  311. t.Fatalf("ID = %x, want %x", kresp.ID, resp.ID)
  312. }
  313. // keep client disconnected
  314. clus.Members[0].Stop(t)
  315. time.Sleep(time.Second)
  316. clus.WaitLeader(t)
  317. if _, err := clus.Client(1).Revoke(context.TODO(), resp.ID); err != nil {
  318. t.Fatal(err)
  319. }
  320. clus.Members[0].Restart(t)
  321. // some responses may still be buffered; drain until close
  322. timer := time.After(time.Duration(kresp.TTL) * time.Second)
  323. for kresp != nil {
  324. select {
  325. case kresp = <-rc:
  326. case <-timer:
  327. t.Fatalf("keepalive channel did not close")
  328. }
  329. }
  330. }
  331. // TestLeaseKeepAliveInitTimeout ensures the keep alive channel closes if
  332. // the initial keep alive request never gets a response.
  333. func TestLeaseKeepAliveInitTimeout(t *testing.T) {
  334. defer testutil.AfterTest(t)
  335. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  336. defer clus.Terminate(t)
  337. cli := clus.Client(0)
  338. // setup lease and do a keepalive
  339. resp, err := cli.Grant(context.Background(), 5)
  340. if err != nil {
  341. t.Fatal(err)
  342. }
  343. // keep client disconnected
  344. clus.Members[0].Stop(t)
  345. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  346. if kerr != nil {
  347. t.Fatal(kerr)
  348. }
  349. select {
  350. case ka, ok := <-rc:
  351. if ok {
  352. t.Fatalf("unexpected keepalive %v, expected closed channel", ka)
  353. }
  354. case <-time.After(10 * time.Second):
  355. t.Fatalf("keepalive channel did not close")
  356. }
  357. clus.Members[0].Restart(t)
  358. }
  359. // TestLeaseKeepAliveInitTimeout ensures the keep alive channel closes if
  360. // a keep alive request after the first never gets a response.
  361. func TestLeaseKeepAliveTTLTimeout(t *testing.T) {
  362. defer testutil.AfterTest(t)
  363. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  364. defer clus.Terminate(t)
  365. cli := clus.Client(0)
  366. // setup lease and do a keepalive
  367. resp, err := cli.Grant(context.Background(), 5)
  368. if err != nil {
  369. t.Fatal(err)
  370. }
  371. rc, kerr := cli.KeepAlive(context.Background(), resp.ID)
  372. if kerr != nil {
  373. t.Fatal(kerr)
  374. }
  375. if kresp := <-rc; kresp.ID != resp.ID {
  376. t.Fatalf("ID = %x, want %x", kresp.ID, resp.ID)
  377. }
  378. // keep client disconnected
  379. clus.Members[0].Stop(t)
  380. select {
  381. case ka, ok := <-rc:
  382. if ok {
  383. t.Fatalf("unexpected keepalive %v, expected closed channel", ka)
  384. }
  385. case <-time.After(10 * time.Second):
  386. t.Fatalf("keepalive channel did not close")
  387. }
  388. clus.Members[0].Restart(t)
  389. }
  390. func TestLeaseTimeToLive(t *testing.T) {
  391. defer testutil.AfterTest(t)
  392. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  393. defer clus.Terminate(t)
  394. c := clus.RandClient()
  395. lapi := c
  396. resp, err := lapi.Grant(context.Background(), 10)
  397. if err != nil {
  398. t.Errorf("failed to create lease %v", err)
  399. }
  400. kv := clus.RandClient()
  401. keys := []string{"foo1", "foo2"}
  402. for i := range keys {
  403. if _, err = kv.Put(context.TODO(), keys[i], "bar", clientv3.WithLease(resp.ID)); err != nil {
  404. t.Fatal(err)
  405. }
  406. }
  407. // linearized read to ensure Puts propagated to server backing lapi
  408. if _, err := c.Get(context.TODO(), "abc"); err != nil {
  409. t.Fatal(err)
  410. }
  411. lresp, lerr := lapi.TimeToLive(context.Background(), resp.ID, clientv3.WithAttachedKeys())
  412. if lerr != nil {
  413. t.Fatal(lerr)
  414. }
  415. if lresp.ID != resp.ID {
  416. t.Fatalf("leaseID expected %d, got %d", resp.ID, lresp.ID)
  417. }
  418. if lresp.GrantedTTL != int64(10) {
  419. t.Fatalf("GrantedTTL expected %d, got %d", 10, lresp.GrantedTTL)
  420. }
  421. if lresp.TTL == 0 || lresp.TTL > lresp.GrantedTTL {
  422. t.Fatalf("unexpected TTL %d (granted %d)", lresp.TTL, lresp.GrantedTTL)
  423. }
  424. ks := make([]string, len(lresp.Keys))
  425. for i := range lresp.Keys {
  426. ks[i] = string(lresp.Keys[i])
  427. }
  428. sort.Strings(ks)
  429. if !reflect.DeepEqual(ks, keys) {
  430. t.Fatalf("keys expected %v, got %v", keys, ks)
  431. }
  432. lresp, lerr = lapi.TimeToLive(context.Background(), resp.ID)
  433. if lerr != nil {
  434. t.Fatal(lerr)
  435. }
  436. if len(lresp.Keys) != 0 {
  437. t.Fatalf("unexpected keys %+v", lresp.Keys)
  438. }
  439. }
  440. func TestLeaseTimeToLiveLeaseNotFound(t *testing.T) {
  441. defer testutil.AfterTest(t)
  442. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  443. defer clus.Terminate(t)
  444. cli := clus.RandClient()
  445. resp, err := cli.Grant(context.Background(), 10)
  446. if err != nil {
  447. t.Errorf("failed to create lease %v", err)
  448. }
  449. _, err = cli.Revoke(context.Background(), resp.ID)
  450. if err != nil {
  451. t.Errorf("failed to Revoke lease %v", err)
  452. }
  453. lresp, err := cli.TimeToLive(context.Background(), resp.ID)
  454. // TimeToLive() should return a response with TTL=-1.
  455. if err != nil {
  456. t.Fatalf("expected err to be nil")
  457. }
  458. if lresp == nil {
  459. t.Fatalf("expected lresp not to be nil")
  460. }
  461. if lresp.ResponseHeader == nil {
  462. t.Fatalf("expected ResponseHeader not to be nil")
  463. }
  464. if lresp.ID != resp.ID {
  465. t.Fatalf("expected Lease ID %v, but got %v", resp.ID, lresp.ID)
  466. }
  467. if lresp.TTL != -1 {
  468. t.Fatalf("expected TTL %v, but got %v", lresp.TTL, lresp.TTL)
  469. }
  470. }
  471. // TestLeaseRenewLostQuorum ensures keepalives work after losing quorum
  472. // for a while.
  473. func TestLeaseRenewLostQuorum(t *testing.T) {
  474. defer testutil.AfterTest(t)
  475. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  476. defer clus.Terminate(t)
  477. cli := clus.Client(0)
  478. r, err := cli.Grant(context.TODO(), 4)
  479. if err != nil {
  480. t.Fatal(err)
  481. }
  482. kctx, kcancel := context.WithCancel(context.Background())
  483. defer kcancel()
  484. ka, err := cli.KeepAlive(kctx, r.ID)
  485. if err != nil {
  486. t.Fatal(err)
  487. }
  488. // consume first keepalive so next message sends when cluster is down
  489. <-ka
  490. lastKa := time.Now()
  491. // force keepalive stream message to timeout
  492. clus.Members[1].Stop(t)
  493. clus.Members[2].Stop(t)
  494. // Use TTL-2 since the client closes the keepalive channel if no
  495. // keepalive arrives before the lease deadline; the client will
  496. // try to resend a keepalive after TTL/3 seconds, so for a TTL of 4,
  497. // sleeping for 2s should be sufficient time for issuing a retry.
  498. // The cluster has two seconds to recover and reply to the keepalive.
  499. time.Sleep(time.Duration(r.TTL-2) * time.Second)
  500. clus.Members[1].Restart(t)
  501. clus.Members[2].Restart(t)
  502. if time.Since(lastKa) > time.Duration(r.TTL)*time.Second {
  503. t.Skip("waited too long for server stop and restart")
  504. }
  505. select {
  506. case _, ok := <-ka:
  507. if !ok {
  508. t.Fatalf("keepalive closed")
  509. }
  510. case <-time.After(time.Duration(r.TTL) * time.Second):
  511. t.Fatalf("timed out waiting for keepalive")
  512. }
  513. }
  514. func TestLeaseKeepAliveLoopExit(t *testing.T) {
  515. defer testutil.AfterTest(t)
  516. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  517. defer clus.Terminate(t)
  518. ctx := context.Background()
  519. cli := clus.Client(0)
  520. clus.TakeClient(0)
  521. resp, err := cli.Grant(ctx, 5)
  522. if err != nil {
  523. t.Fatal(err)
  524. }
  525. cli.Close()
  526. _, err = cli.KeepAlive(ctx, resp.ID)
  527. if _, ok := err.(clientv3.ErrKeepAliveHalted); !ok {
  528. t.Fatalf("expected %T, got %v(%T)", clientv3.ErrKeepAliveHalted{}, err, err)
  529. }
  530. }
  531. // TestV3LeaseFailureOverlap issues Grant and KeepAlive requests to a cluster
  532. // before, during, and after quorum loss to confirm Grant/KeepAlive tolerates
  533. // transient cluster failure.
  534. func TestV3LeaseFailureOverlap(t *testing.T) {
  535. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 2})
  536. defer clus.Terminate(t)
  537. numReqs := 5
  538. cli := clus.Client(0)
  539. // bring up a session, tear it down
  540. updown := func(i int) error {
  541. sess, err := concurrency.NewSession(cli)
  542. if err != nil {
  543. return err
  544. }
  545. ch := make(chan struct{})
  546. go func() {
  547. defer close(ch)
  548. sess.Close()
  549. }()
  550. select {
  551. case <-ch:
  552. case <-time.After(time.Minute / 4):
  553. t.Fatalf("timeout %d", i)
  554. }
  555. return nil
  556. }
  557. var wg sync.WaitGroup
  558. mkReqs := func(n int) {
  559. wg.Add(numReqs)
  560. for i := 0; i < numReqs; i++ {
  561. go func() {
  562. defer wg.Done()
  563. err := updown(n)
  564. if err == nil || err == rpctypes.ErrTimeoutDueToConnectionLost {
  565. return
  566. }
  567. t.Fatal(err)
  568. }()
  569. }
  570. }
  571. mkReqs(1)
  572. clus.Members[1].Stop(t)
  573. mkReqs(2)
  574. time.Sleep(time.Second)
  575. mkReqs(3)
  576. clus.Members[1].Restart(t)
  577. mkReqs(4)
  578. wg.Wait()
  579. }
  580. // TestLeaseWithRequireLeader checks keep-alive channel close when no leader.
  581. func TestLeaseWithRequireLeader(t *testing.T) {
  582. defer testutil.AfterTest(t)
  583. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 2})
  584. defer clus.Terminate(t)
  585. c := clus.Client(0)
  586. lid1, err1 := c.Grant(context.TODO(), 60)
  587. if err1 != nil {
  588. t.Fatal(err1)
  589. }
  590. lid2, err2 := c.Grant(context.TODO(), 60)
  591. if err2 != nil {
  592. t.Fatal(err2)
  593. }
  594. // kaReqLeader close if the leader is lost
  595. kaReqLeader, kerr1 := c.KeepAlive(clientv3.WithRequireLeader(context.TODO()), lid1.ID)
  596. if kerr1 != nil {
  597. t.Fatal(kerr1)
  598. }
  599. // kaWait will wait even if the leader is lost
  600. kaWait, kerr2 := c.KeepAlive(context.TODO(), lid2.ID)
  601. if kerr2 != nil {
  602. t.Fatal(kerr2)
  603. }
  604. select {
  605. case <-kaReqLeader:
  606. case <-time.After(5 * time.Second):
  607. t.Fatalf("require leader first keep-alive timed out")
  608. }
  609. select {
  610. case <-kaWait:
  611. case <-time.After(5 * time.Second):
  612. t.Fatalf("leader not required first keep-alive timed out")
  613. }
  614. clus.Members[1].Stop(t)
  615. // kaReqLeader may issue multiple requests while waiting for the first
  616. // response from proxy server; drain any stray keepalive responses
  617. time.Sleep(100 * time.Millisecond)
  618. for len(kaReqLeader) > 0 {
  619. <-kaReqLeader
  620. }
  621. select {
  622. case resp, ok := <-kaReqLeader:
  623. if ok {
  624. t.Fatalf("expected closed require leader, got response %+v", resp)
  625. }
  626. case <-time.After(5 * time.Second):
  627. t.Fatal("keepalive with require leader took too long to close")
  628. }
  629. select {
  630. case _, ok := <-kaWait:
  631. if !ok {
  632. t.Fatalf("got closed channel with no require leader, expected non-closed")
  633. }
  634. case <-time.After(10 * time.Millisecond):
  635. // wait some to detect any closes happening soon after kaReqLeader closing
  636. }
  637. }