etcd_functional_test.go 4.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226
  /*
  Copyright 2014 CoreOS Inc.
  Licensed under the Apache License, Version 2.0 (the "License");
  you may not use this file except in compliance with the License.
  You may obtain a copy of the License at
  http://www.apache.org/licenses/LICENSE-2.0
  Unless required by applicable law or agreed to in writing, software
  distributed under the License is distributed on an "AS IS" BASIS,
  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  See the License for the specific language governing permissions and
  limitations under the License.
  */
  13. package etcd
  14. import (
  15. "math/rand"
  16. "net/http/httptest"
  17. "testing"
  18. "time"
  19. "github.com/coreos/etcd/config"
  20. "github.com/coreos/etcd/store"
  21. )
  22. func TestKillLeader(t *testing.T) {
  23. tests := []int{3, 5, 9, 11}
  24. for i, tt := range tests {
  25. es, hs := buildCluster(tt, false)
  26. waitCluster(t, es)
  27. waitLeader(es)
  28. lead := es[0].p.node.Leader()
  29. es[lead].Stop()
  30. time.Sleep(es[0].tickDuration * defaultElection * 2)
  31. waitLeader(es)
  32. if es[1].p.node.Leader() == 0 {
  33. t.Errorf("#%d: lead = %d, want not 0", i, es[1].p.node.Leader())
  34. }
  35. destoryCluster(t, es, hs)
  36. }
  37. afterTest(t)
  38. }
  39. func TestRandomKill(t *testing.T) {
  40. tests := []int{3, 5, 9, 11}
  41. for _, tt := range tests {
  42. es, hs := buildCluster(tt, false)
  43. waitCluster(t, es)
  44. waitLeader(es)
  45. toKill := make(map[int64]struct{})
  46. for len(toKill) != tt/2-1 {
  47. toKill[rand.Int63n(int64(tt))] = struct{}{}
  48. }
  49. for k := range toKill {
  50. es[k].Stop()
  51. }
  52. time.Sleep(es[0].tickDuration * defaultElection * 2)
  53. waitLeader(es)
  54. destoryCluster(t, es, hs)
  55. }
  56. afterTest(t)
  57. }
  58. func TestJoinThroughFollower(t *testing.T) {
  59. tests := []int{3, 4, 5, 6}
  60. for _, tt := range tests {
  61. es := make([]*Server, tt)
  62. hs := make([]*httptest.Server, tt)
  63. for i := 0; i < tt; i++ {
  64. c := config.New()
  65. if i > 0 {
  66. c.Peers = []string{hs[i-1].URL}
  67. }
  68. es[i], hs[i] = initTestServer(c, int64(i), false)
  69. }
  70. go es[0].Run()
  71. for i := 1; i < tt; i++ {
  72. go es[i].Run()
  73. waitLeader(es[:i])
  74. }
  75. waitCluster(t, es)
  76. destoryCluster(t, es, hs)
  77. }
  78. afterTest(t)
  79. }
  80. func BenchmarkEndToEndSet(b *testing.B) {
  81. es, hs := buildCluster(3, false)
  82. waitLeader(es)
  83. b.ResetTimer()
  84. for n := 0; n < b.N; n++ {
  85. _, err := es[0].p.Set("foo", false, "bar", store.Permanent)
  86. if err != nil {
  87. panic("unexpect error")
  88. }
  89. }
  90. b.StopTimer()
  91. destoryCluster(nil, es, hs)
  92. }
  93. // TODO(yichengq): cannot handle previous msgDenial correctly now
  94. func TestModeSwitch(t *testing.T) {
  95. t.Skip("not passed")
  96. size := 5
  97. round := 3
  98. for i := 0; i < size; i++ {
  99. es, hs := buildCluster(size, false)
  100. waitCluster(t, es)
  101. config := config.NewClusterConfig()
  102. config.SyncInterval = 0
  103. id := int64(i)
  104. for j := 0; j < round; j++ {
  105. lead, _ := waitActiveLeader(es)
  106. // cluster only demotes follower
  107. if lead == id {
  108. continue
  109. }
  110. config.ActiveSize = size - 1
  111. if err := es[lead].p.setClusterConfig(config); err != nil {
  112. t.Fatalf("#%d: setClusterConfig err = %v", i, err)
  113. }
  114. if err := es[lead].p.remove(id); err != nil {
  115. t.Fatalf("#%d: remove err = %v", i, err)
  116. }
  117. waitMode(standbyMode, es[i])
  118. for k := 0; k < 4; k++ {
  119. if es[i].s.leader != noneId {
  120. break
  121. }
  122. time.Sleep(20 * time.Millisecond)
  123. }
  124. if g := es[i].s.leader; g != lead {
  125. t.Errorf("#%d: lead = %d, want %d", i, g, lead)
  126. }
  127. config.ActiveSize = size
  128. if err := es[lead].p.setClusterConfig(config); err != nil {
  129. t.Fatalf("#%d: setClusterConfig err = %v", i, err)
  130. }
  131. waitMode(participantMode, es[i])
  132. if err := checkParticipant(i, es); err != nil {
  133. t.Errorf("#%d: check alive err = %v", i, err)
  134. }
  135. }
  136. destoryCluster(t, es, hs)
  137. }
  138. afterTest(t)
  139. }
  // leadterm is the (leader, term) pair read from one server by getLead.
  // It contains only integer fields, so values can be compared with == and
  // used as map keys when checking whether servers agree.
  type leadterm struct {
  	// lead is the value returned by the server's node.Leader(). isSameLead
  	// rejects -1 here (presumably the "no leader yet" sentinel - confirm).
  	lead int64
  	// term is the value returned by the server's node.Term().
  	term int64
  }
  144. func waitActiveLeader(es []*Server) (lead, term int64) {
  145. for {
  146. if l, t := waitLeader(es); l >= 0 && es[l].mode.Get() == participantMode {
  147. return l, t
  148. }
  149. }
  150. }
  151. // waitLeader waits until all alive servers are checked to have the same leader.
  152. // WARNING: The lead returned is not guaranteed to be actual leader.
  153. func waitLeader(es []*Server) (lead, term int64) {
  154. for {
  155. ls := make([]leadterm, 0, len(es))
  156. for i := range es {
  157. switch es[i].mode.Get() {
  158. case participantMode:
  159. ls = append(ls, getLead(es[i]))
  160. case standbyMode:
  161. //TODO(xiangli) add standby support
  162. case stopMode:
  163. }
  164. }
  165. if isSameLead(ls) {
  166. return ls[0].lead, ls[0].term
  167. }
  168. time.Sleep(es[0].tickDuration * defaultElection)
  169. }
  170. }
  171. func getLead(s *Server) leadterm {
  172. return leadterm{s.p.node.Leader(), s.p.node.Term()}
  173. }
  174. func isSameLead(ls []leadterm) bool {
  175. m := make(map[leadterm]int)
  176. for i := range ls {
  177. m[ls[i]] = m[ls[i]] + 1
  178. }
  179. if len(m) == 1 {
  180. if ls[0].lead == -1 {
  181. return false
  182. }
  183. return true
  184. }
  185. // todo(xiangli): printout the current cluster status for debugging....
  186. return false
  187. }