etcd_test.go 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441
  1. /*
  2. Copyright 2014 CoreOS Inc.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package etcd
  14. import (
  15. "fmt"
  16. "io/ioutil"
  17. "math/rand"
  18. "net/http"
  19. "net/http/httptest"
  20. "net/url"
  21. "testing"
  22. "time"
  23. "github.com/coreos/etcd/config"
  24. "github.com/coreos/etcd/store"
  25. )
  26. func TestMultipleNodes(t *testing.T) {
  27. tests := []int{1, 3, 5, 9, 11}
  28. for _, tt := range tests {
  29. es, hs := buildCluster(tt, false)
  30. waitCluster(t, es)
  31. for i := range es {
  32. es[len(es)-i-1].Stop()
  33. }
  34. for i := range hs {
  35. hs[len(hs)-i-1].Close()
  36. }
  37. }
  38. afterTest(t)
  39. }
  40. func TestMultipleTLSNodes(t *testing.T) {
  41. tests := []int{1, 3, 5}
  42. for _, tt := range tests {
  43. es, hs := buildCluster(tt, true)
  44. waitCluster(t, es)
  45. for i := range es {
  46. es[len(es)-i-1].Stop()
  47. }
  48. for i := range hs {
  49. hs[len(hs)-i-1].Close()
  50. }
  51. }
  52. afterTest(t)
  53. }
  54. func TestV2Redirect(t *testing.T) {
  55. es, hs := buildCluster(3, false)
  56. waitCluster(t, es)
  57. u := hs[1].URL
  58. ru := fmt.Sprintf("%s%s", hs[0].URL, "/v2/keys/foo")
  59. tc := NewTestClient()
  60. v := url.Values{}
  61. v.Set("value", "XXX")
  62. resp, _ := tc.PutForm(fmt.Sprintf("%s%s", u, "/v2/keys/foo"), v)
  63. if resp.StatusCode != http.StatusTemporaryRedirect {
  64. t.Errorf("status = %d, want %d", resp.StatusCode, http.StatusTemporaryRedirect)
  65. }
  66. location, err := resp.Location()
  67. if err != nil {
  68. t.Errorf("want err = %, want nil", err)
  69. }
  70. if location.String() != ru {
  71. t.Errorf("location = %v, want %v", location.String(), ru)
  72. }
  73. resp.Body.Close()
  74. for i := range es {
  75. es[len(es)-i-1].Stop()
  76. }
  77. for i := range hs {
  78. hs[len(hs)-i-1].Close()
  79. }
  80. afterTest(t)
  81. }
  82. func TestAdd(t *testing.T) {
  83. tests := []int{3, 4, 5, 6}
  84. for _, tt := range tests {
  85. es := make([]*Server, tt)
  86. hs := make([]*httptest.Server, tt)
  87. for i := 0; i < tt; i++ {
  88. c := config.New()
  89. if i > 0 {
  90. c.Peers = []string{hs[0].URL}
  91. }
  92. es[i], hs[i] = initTestServer(c, int64(i), false)
  93. }
  94. go es[0].Run()
  95. waitMode(participantMode, es[0])
  96. for i := 1; i < tt; i++ {
  97. id := int64(i)
  98. for {
  99. lead := es[0].p.node.Leader()
  100. if lead == -1 {
  101. time.Sleep(defaultElection * es[0].tickDuration)
  102. continue
  103. }
  104. err := es[lead].p.add(id, es[id].raftPubAddr, es[id].pubAddr)
  105. if err == nil {
  106. break
  107. }
  108. switch err {
  109. case tmpErr:
  110. time.Sleep(defaultElection * es[0].tickDuration)
  111. case raftStopErr, stopErr:
  112. t.Fatalf("#%d on %d: unexpected stop", i, lead)
  113. default:
  114. t.Fatal(err)
  115. }
  116. }
  117. go es[i].Run()
  118. waitMode(participantMode, es[i])
  119. for j := 0; j <= i; j++ {
  120. p := fmt.Sprintf("%s/%d", v2machineKVPrefix, id)
  121. w, err := es[j].p.Watch(p, false, false, 1)
  122. if err != nil {
  123. t.Errorf("#%d on %d: %v", i, j, err)
  124. break
  125. }
  126. <-w.EventChan
  127. }
  128. }
  129. for i := range hs {
  130. es[len(hs)-i-1].Stop()
  131. }
  132. for i := range hs {
  133. hs[len(hs)-i-1].Close()
  134. }
  135. }
  136. afterTest(t)
  137. }
  138. func TestRemove(t *testing.T) {
  139. tests := []int{3, 4, 5, 6}
  140. for k, tt := range tests {
  141. es, hs := buildCluster(tt, false)
  142. waitCluster(t, es)
  143. lead, _ := waitLeader(es)
  144. config := config.NewClusterConfig()
  145. config.ActiveSize = 0
  146. if err := es[lead].p.setClusterConfig(config); err != nil {
  147. t.Fatalf("#%d: setClusterConfig err = %v", k, err)
  148. }
  149. // we don't remove the machine from 2-node cluster because it is
  150. // not 100 percent safe in our raft.
  151. // TODO(yichengq): improve it later.
  152. for i := 0; i < tt-2; i++ {
  153. id := int64(i)
  154. send := id
  155. for {
  156. send++
  157. if send > int64(tt-1) {
  158. send = id
  159. }
  160. lead := es[send].p.node.Leader()
  161. if lead == -1 {
  162. time.Sleep(defaultElection * 5 * time.Millisecond)
  163. continue
  164. }
  165. err := es[lead].p.remove(id)
  166. if err == nil {
  167. break
  168. }
  169. switch err {
  170. case tmpErr:
  171. time.Sleep(defaultElection * 5 * time.Millisecond)
  172. case raftStopErr, stopErr:
  173. if lead == id {
  174. break
  175. }
  176. default:
  177. t.Fatal(err)
  178. }
  179. }
  180. waitMode(standbyMode, es[i])
  181. }
  182. for i := range es {
  183. es[len(hs)-i-1].Stop()
  184. }
  185. for i := range hs {
  186. hs[len(hs)-i-1].Close()
  187. }
  188. }
  189. afterTest(t)
  190. // ensure that no goroutines are running
  191. TestGoroutinesRunning(t)
  192. }
  193. func TestBecomeStandby(t *testing.T) {
  194. size := 5
  195. round := 1
  196. for j := 0; j < round; j++ {
  197. es, hs := buildCluster(size, false)
  198. waitCluster(t, es)
  199. lead, _ := waitActiveLeader(es)
  200. i := rand.Intn(size)
  201. // cluster only demotes follower
  202. if int64(i) == lead {
  203. i = (i + 1) % size
  204. }
  205. id := int64(i)
  206. config := config.NewClusterConfig()
  207. config.SyncInterval = 1000
  208. config.ActiveSize = size - 1
  209. if err := es[lead].p.setClusterConfig(config); err != nil {
  210. t.Fatalf("#%d: setClusterConfig err = %v", i, err)
  211. }
  212. for {
  213. err := es[lead].p.remove(id)
  214. if err == nil {
  215. break
  216. }
  217. switch err {
  218. case tmpErr:
  219. time.Sleep(defaultElection * 5 * time.Millisecond)
  220. default:
  221. t.Fatalf("#%d: remove err = %v", i, err)
  222. }
  223. }
  224. waitMode(standbyMode, es[i])
  225. var leader int64
  226. for k := 0; k < 3; k++ {
  227. leader, _ = es[i].s.leaderInfo()
  228. if leader != noneId {
  229. break
  230. }
  231. time.Sleep(50 * time.Millisecond)
  232. }
  233. if g := leader; g != lead {
  234. t.Errorf("#%d: lead = %d, want %d", i, g, lead)
  235. }
  236. for i := range hs {
  237. es[len(hs)-i-1].Stop()
  238. }
  239. for i := range hs {
  240. hs[len(hs)-i-1].Close()
  241. }
  242. }
  243. afterTest(t)
  244. }
  245. func TestReleaseVersion(t *testing.T) {
  246. es, hs := buildCluster(1, false)
  247. resp, err := http.Get(hs[0].URL + "/version")
  248. if err != nil {
  249. t.Fatal(err)
  250. }
  251. defer resp.Body.Close()
  252. g, err := ioutil.ReadAll(resp.Body)
  253. if err != nil {
  254. t.Error(err)
  255. }
  256. gs := string(g)
  257. w := fmt.Sprintf("etcd %s", releaseVersion)
  258. if gs != w {
  259. t.Errorf("version = %v, want %v", gs, w)
  260. }
  261. for i := range hs {
  262. es[len(hs)-i-1].Stop()
  263. }
  264. for i := range hs {
  265. hs[len(hs)-i-1].Close()
  266. }
  267. }
  268. func TestVersionCheck(t *testing.T) {
  269. es, hs := buildCluster(1, false)
  270. u := hs[0].URL
  271. currentVersion := 2
  272. tests := []struct {
  273. version int
  274. wStatus int
  275. }{
  276. {currentVersion - 1, http.StatusForbidden},
  277. {currentVersion, http.StatusOK},
  278. {currentVersion + 1, http.StatusForbidden},
  279. }
  280. for i, tt := range tests {
  281. resp, err := http.Get(fmt.Sprintf("%s/raft/version/%d/check", u, tt.version))
  282. if err != nil {
  283. t.Fatal(err)
  284. }
  285. resp.Body.Close()
  286. if resp.StatusCode != tt.wStatus {
  287. t.Fatal("#%d: status = %d, want %d", i, resp.StatusCode, tt.wStatus)
  288. }
  289. }
  290. for i := range hs {
  291. es[len(hs)-i-1].Stop()
  292. }
  293. for i := range hs {
  294. hs[len(hs)-i-1].Close()
  295. }
  296. }
  297. func buildCluster(number int, tls bool) ([]*Server, []*httptest.Server) {
  298. bootstrapper := 0
  299. es := make([]*Server, number)
  300. hs := make([]*httptest.Server, number)
  301. var seed string
  302. for i := range es {
  303. c := config.New()
  304. if seed != "" {
  305. c.Peers = []string{seed}
  306. }
  307. es[i], hs[i] = initTestServer(c, int64(i), tls)
  308. if i == bootstrapper {
  309. seed = hs[i].URL
  310. } else {
  311. // wait for the previous configuration change to be committed
  312. // or this configuration request might be dropped
  313. w, err := es[0].p.Watch(v2machineKVPrefix, true, false, uint64(i))
  314. if err != nil {
  315. panic(err)
  316. }
  317. <-w.EventChan
  318. }
  319. go es[i].Run()
  320. waitMode(participantMode, es[i])
  321. }
  322. return es, hs
  323. }
  324. func initTestServer(c *config.Config, id int64, tls bool) (e *Server, h *httptest.Server) {
  325. e = New(c)
  326. e.setId(id)
  327. e.SetTick(time.Millisecond * 5)
  328. m := http.NewServeMux()
  329. m.Handle("/", e)
  330. m.Handle("/raft", e.RaftHandler())
  331. m.Handle("/raft/", e.RaftHandler())
  332. if tls {
  333. h = httptest.NewTLSServer(m)
  334. } else {
  335. h = httptest.NewServer(m)
  336. }
  337. e.raftPubAddr = h.URL
  338. e.pubAddr = h.URL
  339. return
  340. }
  341. func waitCluster(t *testing.T, es []*Server) {
  342. n := len(es)
  343. for _, e := range es {
  344. for k := 0; k < n; k++ {
  345. w, err := e.p.Watch(v2machineKVPrefix+fmt.Sprintf("/%d", es[k].id), true, false, 1)
  346. if err != nil {
  347. panic(err)
  348. }
  349. <-w.EventChan
  350. }
  351. }
  352. clusterId := es[0].p.node.ClusterId()
  353. for i, e := range es {
  354. if e.p.node.ClusterId() != clusterId {
  355. t.Errorf("#%d: clusterId = %x, want %x", i, e.p.node.ClusterId(), clusterId)
  356. }
  357. }
  358. }
  359. func waitMode(mode int64, e *Server) {
  360. for {
  361. if e.mode.Get() == mode {
  362. return
  363. }
  364. time.Sleep(10 * time.Millisecond)
  365. }
  366. }
  367. // checkParticipant checks the i-th server works well as participant.
  368. func checkParticipant(i int, es []*Server) error {
  369. lead, _ := waitActiveLeader(es)
  370. key := fmt.Sprintf("/%d", rand.Int31())
  371. ev, err := es[lead].p.Set(key, false, "bar", store.Permanent)
  372. if err != nil {
  373. return err
  374. }
  375. w, err := es[i].p.Watch(key, false, false, ev.Index())
  376. if err != nil {
  377. return err
  378. }
  379. select {
  380. case <-w.EventChan:
  381. case <-time.After(8 * defaultHeartbeat * es[i].tickDuration):
  382. return fmt.Errorf("watch timeout")
  383. }
  384. return nil
  385. }