// Copyright 2018 The etcd Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
  14. package balancer
  15. import (
  16. "context"
  17. "fmt"
  18. "strings"
  19. "testing"
  20. "time"
  21. "github.com/coreos/etcd/clientv3/balancer/picker"
  22. "github.com/coreos/etcd/clientv3/balancer/resolver/endpoint"
  23. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  24. "github.com/coreos/etcd/pkg/mock/mockserver"
  25. "go.uber.org/zap"
  26. "google.golang.org/grpc"
  27. "google.golang.org/grpc/codes"
  28. "google.golang.org/grpc/peer"
  29. "google.golang.org/grpc/status"
  30. )
  31. // TestRoundRobinBalancedResolvableNoFailover ensures that
  32. // requests to a resolvable endpoint can be balanced between
  33. // multiple, if any, nodes. And there needs be no failover.
  34. func TestRoundRobinBalancedResolvableNoFailover(t *testing.T) {
  35. testCases := []struct {
  36. name string
  37. serverCount int
  38. reqN int
  39. network string
  40. }{
  41. {name: "rrBalanced_1", serverCount: 1, reqN: 5, network: "tcp"},
  42. {name: "rrBalanced_1_unix_sockets", serverCount: 1, reqN: 5, network: "unix"},
  43. {name: "rrBalanced_3", serverCount: 3, reqN: 7, network: "tcp"},
  44. {name: "rrBalanced_5", serverCount: 5, reqN: 10, network: "tcp"},
  45. }
  46. for _, tc := range testCases {
  47. t.Run(tc.name, func(t *testing.T) {
  48. ms, err := mockserver.StartMockServersOnNetwork(tc.serverCount, tc.network)
  49. if err != nil {
  50. t.Fatalf("failed to start mock servers: %v", err)
  51. }
  52. defer ms.Stop()
  53. var eps []string
  54. for _, svr := range ms.Servers {
  55. eps = append(eps, svr.ResolverAddress().Addr)
  56. }
  57. rsv, err := endpoint.NewResolverGroup("nofailover")
  58. if err != nil {
  59. t.Fatal(err)
  60. }
  61. defer rsv.Close()
  62. rsv.SetEndpoints(eps)
  63. name := genName()
  64. cfg := Config{
  65. Policy: picker.RoundrobinBalanced,
  66. Name: name,
  67. Logger: zap.NewExample(),
  68. }
  69. RegisterBuilder(cfg)
  70. conn, err := grpc.Dial(fmt.Sprintf("endpoint://nofailover/*"), grpc.WithInsecure(), grpc.WithBalancerName(name))
  71. if err != nil {
  72. t.Fatalf("failed to dial mock server: %v", err)
  73. }
  74. defer conn.Close()
  75. cli := pb.NewKVClient(conn)
  76. reqFunc := func(ctx context.Context) (picked string, err error) {
  77. var p peer.Peer
  78. _, err = cli.Range(ctx, &pb.RangeRequest{Key: []byte("/x")}, grpc.Peer(&p))
  79. if p.Addr != nil {
  80. picked = p.Addr.String()
  81. }
  82. return picked, err
  83. }
  84. prev, switches := "", 0
  85. for i := 0; i < tc.reqN; i++ {
  86. picked, err := reqFunc(context.Background())
  87. if err != nil {
  88. t.Fatalf("#%d: unexpected failure %v", i, err)
  89. }
  90. if prev == "" {
  91. prev = picked
  92. continue
  93. }
  94. if prev != picked {
  95. switches++
  96. }
  97. prev = picked
  98. }
  99. if tc.serverCount > 1 && switches < tc.reqN-3 { // -3 for initial resolutions
  100. t.Fatalf("expected balanced loads for %d requests, got switches %d", tc.reqN, switches)
  101. }
  102. })
  103. }
  104. }
  105. // TestRoundRobinBalancedResolvableFailoverFromServerFail ensures that
  106. // loads be rebalanced while one server goes down and comes back.
  107. func TestRoundRobinBalancedResolvableFailoverFromServerFail(t *testing.T) {
  108. serverCount := 5
  109. ms, err := mockserver.StartMockServers(serverCount)
  110. if err != nil {
  111. t.Fatalf("failed to start mock servers: %s", err)
  112. }
  113. defer ms.Stop()
  114. var eps []string
  115. for _, svr := range ms.Servers {
  116. eps = append(eps, svr.ResolverAddress().Addr)
  117. }
  118. rsv, err := endpoint.NewResolverGroup("serverfail")
  119. if err != nil {
  120. t.Fatal(err)
  121. }
  122. defer rsv.Close()
  123. rsv.SetEndpoints(eps)
  124. name := genName()
  125. cfg := Config{
  126. Policy: picker.RoundrobinBalanced,
  127. Name: name,
  128. Logger: zap.NewExample(),
  129. }
  130. RegisterBuilder(cfg)
  131. conn, err := grpc.Dial(fmt.Sprintf("endpoint://serverfail/mock.server"), grpc.WithInsecure(), grpc.WithBalancerName(name))
  132. if err != nil {
  133. t.Fatalf("failed to dial mock server: %s", err)
  134. }
  135. defer conn.Close()
  136. cli := pb.NewKVClient(conn)
  137. reqFunc := func(ctx context.Context) (picked string, err error) {
  138. var p peer.Peer
  139. _, err = cli.Range(ctx, &pb.RangeRequest{Key: []byte("/x")}, grpc.Peer(&p))
  140. if p.Addr != nil {
  141. picked = p.Addr.String()
  142. }
  143. return picked, err
  144. }
  145. // stop first server, loads should be redistributed
  146. // stopped server should never be picked
  147. ms.StopAt(0)
  148. available := make(map[string]struct{})
  149. for i := 1; i < serverCount; i++ {
  150. available[eps[i]] = struct{}{}
  151. }
  152. reqN := 10
  153. prev, switches := "", 0
  154. for i := 0; i < reqN; i++ {
  155. picked, err := reqFunc(context.Background())
  156. if err != nil && strings.Contains(err.Error(), "transport is closing") {
  157. continue
  158. }
  159. if prev == "" { // first failover
  160. if eps[0] == picked {
  161. t.Fatalf("expected failover from %q, picked %q", eps[0], picked)
  162. }
  163. prev = picked
  164. continue
  165. }
  166. if _, ok := available[picked]; !ok {
  167. t.Fatalf("picked unavailable address %q (available %v)", picked, available)
  168. }
  169. if prev != picked {
  170. switches++
  171. }
  172. prev = picked
  173. }
  174. if switches < reqN-3 { // -3 for initial resolutions + failover
  175. t.Fatalf("expected balanced loads for %d requests, got switches %d", reqN, switches)
  176. }
  177. // now failed server comes back
  178. ms.StartAt(0)
  179. // enough time for reconnecting to recovered server
  180. time.Sleep(time.Second)
  181. prev, switches = "", 0
  182. recoveredAddr, recovered := eps[0], 0
  183. available[recoveredAddr] = struct{}{}
  184. for i := 0; i < 2*reqN; i++ {
  185. picked, err := reqFunc(context.Background())
  186. if err != nil {
  187. t.Fatalf("#%d: unexpected failure %v", i, err)
  188. }
  189. if prev == "" {
  190. prev = picked
  191. continue
  192. }
  193. if _, ok := available[picked]; !ok {
  194. t.Fatalf("#%d: picked unavailable address %q (available %v)", i, picked, available)
  195. }
  196. if prev != picked {
  197. switches++
  198. }
  199. if picked == recoveredAddr {
  200. recovered++
  201. }
  202. prev = picked
  203. }
  204. if switches < reqN-3 { // -3 for initial resolutions
  205. t.Fatalf("expected balanced loads for %d requests, got switches %d", reqN, switches)
  206. }
  207. if recovered < reqN/serverCount {
  208. t.Fatalf("recovered server %q got only %d requests", recoveredAddr, recovered)
  209. }
  210. }
  211. // TestRoundRobinBalancedResolvableFailoverFromRequestFail ensures that
  212. // loads be rebalanced while some requests are failed.
  213. func TestRoundRobinBalancedResolvableFailoverFromRequestFail(t *testing.T) {
  214. serverCount := 5
  215. ms, err := mockserver.StartMockServers(serverCount)
  216. if err != nil {
  217. t.Fatalf("failed to start mock servers: %s", err)
  218. }
  219. defer ms.Stop()
  220. var eps []string
  221. available := make(map[string]struct{})
  222. for _, svr := range ms.Servers {
  223. eps = append(eps, svr.ResolverAddress().Addr)
  224. available[svr.Address] = struct{}{}
  225. }
  226. rsv, err := endpoint.NewResolverGroup("requestfail")
  227. if err != nil {
  228. t.Fatal(err)
  229. }
  230. defer rsv.Close()
  231. rsv.SetEndpoints(eps)
  232. name := genName()
  233. cfg := Config{
  234. Policy: picker.RoundrobinBalanced,
  235. Name: name,
  236. Logger: zap.NewExample(),
  237. }
  238. RegisterBuilder(cfg)
  239. conn, err := grpc.Dial(fmt.Sprintf("endpoint://requestfail/mock.server"), grpc.WithInsecure(), grpc.WithBalancerName(name))
  240. if err != nil {
  241. t.Fatalf("failed to dial mock server: %s", err)
  242. }
  243. defer conn.Close()
  244. cli := pb.NewKVClient(conn)
  245. reqFunc := func(ctx context.Context) (picked string, err error) {
  246. var p peer.Peer
  247. _, err = cli.Range(ctx, &pb.RangeRequest{Key: []byte("/x")}, grpc.Peer(&p))
  248. if p.Addr != nil {
  249. picked = p.Addr.String()
  250. }
  251. return picked, err
  252. }
  253. reqN := 20
  254. prev, switches := "", 0
  255. for i := 0; i < reqN; i++ {
  256. ctx, cancel := context.WithCancel(context.Background())
  257. defer cancel()
  258. if i%2 == 0 {
  259. cancel()
  260. }
  261. picked, err := reqFunc(ctx)
  262. if i%2 == 0 {
  263. if s, ok := status.FromError(err); ok && s.Code() != codes.Canceled || picked != "" {
  264. t.Fatalf("#%d: expected %v, got %v", i, context.Canceled, err)
  265. }
  266. continue
  267. }
  268. if prev == "" && picked != "" {
  269. prev = picked
  270. continue
  271. }
  272. if _, ok := available[picked]; !ok {
  273. t.Fatalf("#%d: picked unavailable address %q (available %v)", i, picked, available)
  274. }
  275. if prev != picked {
  276. switches++
  277. }
  278. prev = picked
  279. }
  280. if switches < reqN/2-3 { // -3 for initial resolutions + failover
  281. t.Fatalf("expected balanced loads for %d requests, got switches %d", reqN, switches)
  282. }
  283. }