main.go 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162
// Copyright 2015 The etcd Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
  14. package main
import (
	"flag"
	"fmt"
	"net/http"
	"os"
	"strconv"
	"strings"

	"github.com/coreos/pkg/capnslog"
	"github.com/prometheus/client_golang/prometheus"
)
  24. var plog = capnslog.NewPackageLogger("github.com/coreos/etcd", "etcd-tester")
  25. const (
  26. defaultClientPort = 2379
  27. defaultPeerPort = 2380
  28. defaultFailpointPort = 2381
  29. )
  30. func main() {
  31. endpointStr := flag.String("agent-endpoints", "localhost:9027", "HTTP RPC endpoints of agents. Do not specify the schema.")
  32. clientPorts := flag.String("client-ports", "", "etcd client port for each agent endpoint")
  33. peerPorts := flag.String("peer-ports", "", "etcd peer port for each agent endpoint")
  34. failpointPorts := flag.String("failpoint-ports", "", "etcd failpoint port for each agent endpoint")
  35. datadir := flag.String("data-dir", "agent.etcd", "etcd data directory location on agent machine.")
  36. stressKeyLargeSize := flag.Uint("stress-key-large-size", 32*1024+1, "the size of each large key written into etcd.")
  37. stressKeySize := flag.Uint("stress-key-size", 100, "the size of each small key written into etcd.")
  38. stressKeySuffixRange := flag.Uint("stress-key-count", 250000, "the count of key range written into etcd.")
  39. limit := flag.Int("limit", -1, "the limit of rounds to run failure set (-1 to run without limits).")
  40. stressQPS := flag.Int("stress-qps", 10000, "maximum number of stresser requests per second.")
  41. schedCases := flag.String("schedule-cases", "", "test case schedule")
  42. consistencyCheck := flag.Bool("consistency-check", true, "true to check consistency (revision, hash)")
  43. isV2Only := flag.Bool("v2-only", false, "'true' to run V2 only tester.")
  44. stresserType := flag.String("stresser", "default", "specify stresser (\"default\" or \"nop\").")
  45. flag.Parse()
  46. eps := strings.Split(*endpointStr, ",")
  47. cports := portsFromArg(*clientPorts, len(eps), defaultClientPort)
  48. pports := portsFromArg(*peerPorts, len(eps), defaultPeerPort)
  49. fports := portsFromArg(*failpointPorts, len(eps), defaultFailpointPort)
  50. agents := make([]agentConfig, len(eps))
  51. for i := range eps {
  52. agents[i].endpoint = eps[i]
  53. agents[i].clientPort = cports[i]
  54. agents[i].peerPort = pports[i]
  55. agents[i].failpointPort = fports[i]
  56. agents[i].datadir = *datadir
  57. }
  58. sConfig := &stressConfig{
  59. qps: *stressQPS,
  60. keyLargeSize: int(*stressKeyLargeSize),
  61. keySize: int(*stressKeySize),
  62. keySuffixRange: int(*stressKeySuffixRange),
  63. v2: *isV2Only,
  64. }
  65. c := &cluster{
  66. agents: agents,
  67. v2Only: *isV2Only,
  68. stressBuilder: newStressBuilder(*stresserType, sConfig),
  69. }
  70. if err := c.bootstrap(); err != nil {
  71. plog.Fatal(err)
  72. }
  73. defer c.Terminate()
  74. failures := []failure{
  75. newFailureKillAll(),
  76. newFailureKillMajority(),
  77. newFailureKillOne(),
  78. newFailureKillLeader(),
  79. newFailureKillOneForLongTime(),
  80. newFailureKillLeaderForLongTime(),
  81. newFailureIsolate(),
  82. newFailureIsolateAll(),
  83. newFailureSlowNetworkOneMember(),
  84. newFailureSlowNetworkLeader(),
  85. newFailureSlowNetworkAll(),
  86. }
  87. // ensure cluster is fully booted to know failpoints are available
  88. c.WaitHealth()
  89. fpFailures, fperr := failpointFailures(c)
  90. if len(fpFailures) == 0 {
  91. plog.Infof("no failpoints found (%v)", fperr)
  92. }
  93. failures = append(failures, fpFailures...)
  94. schedule := failures
  95. if schedCases != nil && *schedCases != "" {
  96. cases := strings.Split(*schedCases, " ")
  97. schedule = make([]failure, len(cases))
  98. for i := range cases {
  99. caseNum := 0
  100. n, err := fmt.Sscanf(cases[i], "%d", &caseNum)
  101. if n == 0 || err != nil {
  102. plog.Fatalf(`couldn't parse case "%s" (%v)`, cases[i], err)
  103. }
  104. schedule[i] = failures[caseNum]
  105. }
  106. }
  107. t := &tester{
  108. failures: schedule,
  109. cluster: c,
  110. limit: *limit,
  111. checker: newNoChecker(),
  112. }
  113. if *consistencyCheck && !c.v2Only {
  114. t.checker = newHashChecker(t)
  115. }
  116. sh := statusHandler{status: &t.status}
  117. http.Handle("/status", sh)
  118. http.Handle("/metrics", prometheus.Handler())
  119. go func() { plog.Fatal(http.ListenAndServe(":9028", nil)) }()
  120. t.runLoop()
  121. }
  122. // portsFromArg converts a comma separated list into a slice of ints
  123. func portsFromArg(arg string, n, defaultPort int) []int {
  124. ret := make([]int, n)
  125. if len(arg) == 0 {
  126. for i := range ret {
  127. ret[i] = defaultPort
  128. }
  129. return ret
  130. }
  131. s := strings.Split(arg, ",")
  132. if len(s) != n {
  133. fmt.Printf("expected %d ports, got %d (%s)\n", n, len(s), arg)
  134. os.Exit(1)
  135. }
  136. for i := range s {
  137. if _, err := fmt.Sscanf(s[i], "%d", &ret[i]); err != nil {
  138. fmt.Println(err)
  139. os.Exit(1)
  140. }
  141. }
  142. return ret
  143. }