maintenance_test.go 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241
  1. // Copyright 2017 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package integration
  15. import (
  16. "bytes"
  17. "context"
  18. "fmt"
  19. "io"
  20. "io/ioutil"
  21. "path/filepath"
  22. "testing"
  23. "time"
  24. "go.uber.org/zap"
  25. "google.golang.org/grpc"
  26. "go.etcd.io/etcd/clientv3"
  27. "go.etcd.io/etcd/etcdserver/api/v3rpc/rpctypes"
  28. "go.etcd.io/etcd/integration"
  29. "go.etcd.io/etcd/lease"
  30. "go.etcd.io/etcd/mvcc"
  31. "go.etcd.io/etcd/mvcc/backend"
  32. "go.etcd.io/etcd/pkg/testutil"
  33. )
  34. func TestMaintenanceHashKV(t *testing.T) {
  35. defer testutil.AfterTest(t)
  36. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  37. defer clus.Terminate(t)
  38. for i := 0; i < 3; i++ {
  39. if _, err := clus.RandClient().Put(context.Background(), "foo", "bar"); err != nil {
  40. t.Fatal(err)
  41. }
  42. }
  43. var hv uint32
  44. for i := 0; i < 3; i++ {
  45. cli := clus.Client(i)
  46. // ensure writes are replicated
  47. if _, err := cli.Get(context.TODO(), "foo"); err != nil {
  48. t.Fatal(err)
  49. }
  50. hresp, err := cli.HashKV(context.Background(), clus.Members[i].GRPCAddr(), 0)
  51. if err != nil {
  52. t.Fatal(err)
  53. }
  54. if hv == 0 {
  55. hv = hresp.Hash
  56. continue
  57. }
  58. if hv != hresp.Hash {
  59. t.Fatalf("#%d: hash expected %d, got %d", i, hv, hresp.Hash)
  60. }
  61. }
  62. }
  63. func TestMaintenanceMoveLeader(t *testing.T) {
  64. defer testutil.AfterTest(t)
  65. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  66. defer clus.Terminate(t)
  67. oldLeadIdx := clus.WaitLeader(t)
  68. targetIdx := (oldLeadIdx + 1) % 3
  69. target := uint64(clus.Members[targetIdx].ID())
  70. cli := clus.Client(targetIdx)
  71. _, err := cli.MoveLeader(context.Background(), target)
  72. if err != rpctypes.ErrNotLeader {
  73. t.Fatalf("error expected %v, got %v", rpctypes.ErrNotLeader, err)
  74. }
  75. cli = clus.Client(oldLeadIdx)
  76. _, err = cli.MoveLeader(context.Background(), target)
  77. if err != nil {
  78. t.Fatal(err)
  79. }
  80. leadIdx := clus.WaitLeader(t)
  81. lead := uint64(clus.Members[leadIdx].ID())
  82. if target != lead {
  83. t.Fatalf("new leader expected %d, got %d", target, lead)
  84. }
  85. }
  86. // TestMaintenanceSnapshotError ensures that context cancel/timeout
  87. // before snapshot reading returns corresponding context errors.
  88. func TestMaintenanceSnapshotError(t *testing.T) {
  89. defer testutil.AfterTest(t)
  90. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  91. defer clus.Terminate(t)
  92. // reading snapshot with canceled context should error out
  93. ctx, cancel := context.WithCancel(context.Background())
  94. rc1, err := clus.RandClient().Snapshot(ctx)
  95. if err != nil {
  96. t.Fatal(err)
  97. }
  98. defer rc1.Close()
  99. cancel()
  100. _, err = io.Copy(ioutil.Discard, rc1)
  101. if err != context.Canceled {
  102. t.Errorf("expected %v, got %v", context.Canceled, err)
  103. }
  104. // reading snapshot with deadline exceeded should error out
  105. ctx, cancel = context.WithTimeout(context.Background(), time.Second)
  106. defer cancel()
  107. rc2, err := clus.RandClient().Snapshot(ctx)
  108. if err != nil {
  109. t.Fatal(err)
  110. }
  111. defer rc2.Close()
  112. time.Sleep(2 * time.Second)
  113. _, err = io.Copy(ioutil.Discard, rc2)
  114. if err != nil && !isClientTimeout(err) {
  115. t.Errorf("expected client timeout, got %v", err)
  116. }
  117. }
  118. // TestMaintenanceSnapshotErrorInflight ensures that inflight context cancel/timeout
  119. // fails snapshot reading with corresponding context errors.
  120. func TestMaintenanceSnapshotErrorInflight(t *testing.T) {
  121. defer testutil.AfterTest(t)
  122. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 1})
  123. defer clus.Terminate(t)
  124. // take about 1-second to read snapshot
  125. clus.Members[0].Stop(t)
  126. dpath := filepath.Join(clus.Members[0].DataDir, "member", "snap", "db")
  127. b := backend.NewDefaultBackend(dpath)
  128. s := mvcc.NewStore(zap.NewExample(), b, &lease.FakeLessor{}, nil)
  129. rev := 100000
  130. for i := 2; i <= rev; i++ {
  131. s.Put([]byte(fmt.Sprintf("%10d", i)), bytes.Repeat([]byte("a"), 1024), lease.NoLease)
  132. }
  133. s.Close()
  134. b.Close()
  135. clus.Members[0].Restart(t)
  136. cli := clus.RandClient()
  137. // reading snapshot with canceled context should error out
  138. ctx, cancel := context.WithCancel(context.Background())
  139. rc1, err := cli.Snapshot(ctx)
  140. if err != nil {
  141. t.Fatal(err)
  142. }
  143. defer rc1.Close()
  144. donec := make(chan struct{})
  145. go func() {
  146. time.Sleep(300 * time.Millisecond)
  147. cancel()
  148. close(donec)
  149. }()
  150. _, err = io.Copy(ioutil.Discard, rc1)
  151. if err != nil && err != context.Canceled {
  152. t.Errorf("expected %v, got %v", context.Canceled, err)
  153. }
  154. <-donec
  155. // reading snapshot with deadline exceeded should error out
  156. ctx, cancel = context.WithTimeout(context.Background(), time.Second)
  157. defer cancel()
  158. rc2, err := clus.RandClient().Snapshot(ctx)
  159. if err != nil {
  160. t.Fatal(err)
  161. }
  162. defer rc2.Close()
  163. // 300ms left and expect timeout while snapshot reading is in progress
  164. time.Sleep(700 * time.Millisecond)
  165. _, err = io.Copy(ioutil.Discard, rc2)
  166. if err != nil && !isClientTimeout(err) {
  167. t.Errorf("expected client timeout, got %v", err)
  168. }
  169. }
  170. func TestMaintenanceStatus(t *testing.T) {
  171. defer testutil.AfterTest(t)
  172. clus := integration.NewClusterV3(t, &integration.ClusterConfig{Size: 3})
  173. defer clus.Terminate(t)
  174. clus.WaitLeader(t)
  175. eps := make([]string, 3)
  176. for i := 0; i < 3; i++ {
  177. eps[i] = clus.Members[i].GRPCAddr()
  178. }
  179. cli, err := clientv3.New(clientv3.Config{Endpoints: eps, DialOptions: []grpc.DialOption{grpc.WithBlock()}})
  180. if err != nil {
  181. t.Fatal(err)
  182. }
  183. defer cli.Close()
  184. prevID, leaderFound := uint64(0), false
  185. for i := 0; i < 3; i++ {
  186. resp, err := cli.Status(context.TODO(), eps[i])
  187. if err != nil {
  188. t.Fatal(err)
  189. }
  190. if prevID == 0 {
  191. prevID, leaderFound = resp.Header.MemberId, resp.Header.MemberId == resp.Leader
  192. continue
  193. }
  194. if prevID == resp.Header.MemberId {
  195. t.Errorf("#%d: status returned duplicate member ID with %016x", i, prevID)
  196. }
  197. if leaderFound && resp.Header.MemberId == resp.Leader {
  198. t.Errorf("#%d: leader already found, but found another %016x", i, resp.Header.MemberId)
  199. }
  200. if !leaderFound {
  201. leaderFound = resp.Header.MemberId == resp.Leader
  202. }
  203. }
  204. if !leaderFound {
  205. t.Fatal("no leader found")
  206. }
  207. }