etcd_test.go 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446
/*
Copyright 2014 CoreOS Inc.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
  13. package etcd
  14. import (
  15. "fmt"
  16. "io/ioutil"
  17. "math/rand"
  18. "net/http"
  19. "net/http/httptest"
  20. "net/url"
  21. "os"
  22. "testing"
  23. "time"
  24. "github.com/coreos/etcd/config"
  25. "github.com/coreos/etcd/store"
  26. )
  27. func TestMultipleNodes(t *testing.T) {
  28. tests := []int{1, 3, 5, 9, 11}
  29. for _, tt := range tests {
  30. es, hs := buildCluster(tt, false)
  31. waitCluster(t, es)
  32. destoryCluster(t, es, hs)
  33. }
  34. afterTest(t)
  35. }
  36. func TestMultipleTLSNodes(t *testing.T) {
  37. tests := []int{1, 3, 5}
  38. for _, tt := range tests {
  39. es, hs := buildCluster(tt, true)
  40. waitCluster(t, es)
  41. destoryCluster(t, es, hs)
  42. }
  43. afterTest(t)
  44. }
  45. func TestV2Redirect(t *testing.T) {
  46. es, hs := buildCluster(3, false)
  47. waitCluster(t, es)
  48. u := hs[1].URL
  49. ru := fmt.Sprintf("%s%s", hs[0].URL, "/v2/keys/foo")
  50. tc := NewTestClient()
  51. v := url.Values{}
  52. v.Set("value", "XXX")
  53. resp, _ := tc.PutForm(fmt.Sprintf("%s%s", u, "/v2/keys/foo"), v)
  54. if resp.StatusCode != http.StatusTemporaryRedirect {
  55. t.Errorf("status = %d, want %d", resp.StatusCode, http.StatusTemporaryRedirect)
  56. }
  57. location, err := resp.Location()
  58. if err != nil {
  59. t.Errorf("want err = %, want nil", err)
  60. }
  61. if location.String() != ru {
  62. t.Errorf("location = %v, want %v", location.String(), ru)
  63. }
  64. resp.Body.Close()
  65. destoryCluster(t, es, hs)
  66. afterTest(t)
  67. }
  68. func TestAdd(t *testing.T) {
  69. tests := []int{3, 4, 5, 6}
  70. for _, tt := range tests {
  71. es := make([]*Server, tt)
  72. hs := make([]*httptest.Server, tt)
  73. for i := 0; i < tt; i++ {
  74. c := config.New()
  75. if i > 0 {
  76. c.Peers = []string{hs[0].URL}
  77. }
  78. es[i], hs[i] = initTestServer(c, int64(i), false)
  79. }
  80. go es[0].Run()
  81. waitMode(participantMode, es[0])
  82. for i := 1; i < tt; i++ {
  83. id := int64(i)
  84. for {
  85. lead := es[0].p.node.Leader()
  86. if lead == -1 {
  87. time.Sleep(defaultElection * es[0].tickDuration)
  88. continue
  89. }
  90. err := es[lead].p.add(id, es[id].raftPubAddr, es[id].pubAddr)
  91. if err == nil {
  92. break
  93. }
  94. switch err {
  95. case tmpErr:
  96. time.Sleep(defaultElection * es[0].tickDuration)
  97. case raftStopErr, stopErr:
  98. t.Fatalf("#%d on %d: unexpected stop", i, lead)
  99. default:
  100. t.Fatal(err)
  101. }
  102. }
  103. go es[i].Run()
  104. waitMode(participantMode, es[i])
  105. for j := 0; j <= i; j++ {
  106. p := fmt.Sprintf("%s/%d", v2machineKVPrefix, id)
  107. w, err := es[j].p.Watch(p, false, false, 1)
  108. if err != nil {
  109. t.Errorf("#%d on %d: %v", i, j, err)
  110. break
  111. }
  112. <-w.EventChan
  113. }
  114. }
  115. destoryCluster(t, es, hs)
  116. }
  117. afterTest(t)
  118. }
  119. func TestRemove(t *testing.T) {
  120. tests := []int{3, 4, 5, 6}
  121. for k, tt := range tests {
  122. es, hs := buildCluster(tt, false)
  123. waitCluster(t, es)
  124. lead, _ := waitLeader(es)
  125. config := config.NewClusterConfig()
  126. config.ActiveSize = 0
  127. if err := es[lead].p.setClusterConfig(config); err != nil {
  128. t.Fatalf("#%d: setClusterConfig err = %v", k, err)
  129. }
  130. // we don't remove the machine from 2-node cluster because it is
  131. // not 100 percent safe in our raft.
  132. // TODO(yichengq): improve it later.
  133. for i := 0; i < tt-2; i++ {
  134. id := int64(i)
  135. send := id
  136. for {
  137. send++
  138. if send > int64(tt-1) {
  139. send = id
  140. }
  141. lead := es[send].p.node.Leader()
  142. if lead == -1 {
  143. time.Sleep(defaultElection * 5 * time.Millisecond)
  144. continue
  145. }
  146. err := es[lead].p.remove(id)
  147. if err == nil {
  148. break
  149. }
  150. switch err {
  151. case tmpErr:
  152. time.Sleep(defaultElection * 5 * time.Millisecond)
  153. case raftStopErr, stopErr:
  154. if lead == id {
  155. break
  156. }
  157. default:
  158. t.Fatal(err)
  159. }
  160. }
  161. waitMode(standbyMode, es[i])
  162. }
  163. destoryCluster(t, es, hs)
  164. }
  165. afterTest(t)
  166. // ensure that no goroutines are running
  167. TestGoroutinesRunning(t)
  168. }
  169. func TestBecomeStandby(t *testing.T) {
  170. size := 5
  171. round := 1
  172. for j := 0; j < round; j++ {
  173. es, hs := buildCluster(size, false)
  174. waitCluster(t, es)
  175. lead, _ := waitActiveLeader(es)
  176. i := rand.Intn(size)
  177. // cluster only demotes follower
  178. if int64(i) == lead {
  179. i = (i + 1) % size
  180. }
  181. id := int64(i)
  182. config := config.NewClusterConfig()
  183. config.SyncInterval = 1000
  184. config.ActiveSize = size - 1
  185. if err := es[lead].p.setClusterConfig(config); err != nil {
  186. t.Fatalf("#%d: setClusterConfig err = %v", i, err)
  187. }
  188. for {
  189. err := es[lead].p.remove(id)
  190. if err == nil {
  191. break
  192. }
  193. switch err {
  194. case tmpErr:
  195. time.Sleep(defaultElection * 5 * time.Millisecond)
  196. default:
  197. t.Fatalf("#%d: remove err = %v", i, err)
  198. }
  199. }
  200. waitMode(standbyMode, es[i])
  201. var leader int64
  202. for k := 0; k < 3; k++ {
  203. leader, _ = es[i].s.leaderInfo()
  204. if leader != noneId {
  205. break
  206. }
  207. time.Sleep(50 * time.Millisecond)
  208. }
  209. if g := leader; g != lead {
  210. t.Errorf("#%d: lead = %d, want %d", i, g, lead)
  211. }
  212. destoryCluster(t, es, hs)
  213. }
  214. afterTest(t)
  215. }
  216. func TestReleaseVersion(t *testing.T) {
  217. es, hs := buildCluster(1, false)
  218. resp, err := http.Get(hs[0].URL + "/version")
  219. if err != nil {
  220. t.Fatal(err)
  221. }
  222. defer resp.Body.Close()
  223. g, err := ioutil.ReadAll(resp.Body)
  224. if err != nil {
  225. t.Error(err)
  226. }
  227. gs := string(g)
  228. w := fmt.Sprintf("etcd %s", releaseVersion)
  229. if gs != w {
  230. t.Errorf("version = %v, want %v", gs, w)
  231. }
  232. for i := range hs {
  233. es[len(hs)-i-1].Stop()
  234. }
  235. for i := range hs {
  236. hs[len(hs)-i-1].Close()
  237. }
  238. }
  239. func TestVersionCheck(t *testing.T) {
  240. es, hs := buildCluster(1, false)
  241. u := hs[0].URL
  242. currentVersion := 2
  243. tests := []struct {
  244. version int
  245. wStatus int
  246. }{
  247. {currentVersion - 1, http.StatusForbidden},
  248. {currentVersion, http.StatusOK},
  249. {currentVersion + 1, http.StatusForbidden},
  250. }
  251. for i, tt := range tests {
  252. resp, err := http.Get(fmt.Sprintf("%s/raft/version/%d/check", u, tt.version))
  253. if err != nil {
  254. t.Fatal(err)
  255. }
  256. resp.Body.Close()
  257. if resp.StatusCode != tt.wStatus {
  258. t.Fatal("#%d: status = %d, want %d", i, resp.StatusCode, tt.wStatus)
  259. }
  260. }
  261. for i := range hs {
  262. es[len(hs)-i-1].Stop()
  263. }
  264. for i := range hs {
  265. hs[len(hs)-i-1].Close()
  266. }
  267. }
  268. func buildCluster(number int, tls bool) ([]*Server, []*httptest.Server) {
  269. bootstrapper := 0
  270. es := make([]*Server, number)
  271. hs := make([]*httptest.Server, number)
  272. var seed string
  273. for i := range es {
  274. c := config.New()
  275. if seed != "" {
  276. c.Peers = []string{seed}
  277. }
  278. es[i], hs[i] = initTestServer(c, int64(i), tls)
  279. if i == bootstrapper {
  280. seed = hs[i].URL
  281. } else {
  282. // wait for the previous configuration change to be committed
  283. // or this configuration request might be dropped
  284. w, err := es[0].p.Watch(v2machineKVPrefix, true, false, uint64(i))
  285. if err != nil {
  286. panic(err)
  287. }
  288. <-w.EventChan
  289. }
  290. go es[i].Run()
  291. waitMode(participantMode, es[i])
  292. }
  293. return es, hs
  294. }
  295. func initTestServer(c *config.Config, id int64, tls bool) (e *Server, h *httptest.Server) {
  296. n, err := ioutil.TempDir(os.TempDir(), "etcd")
  297. if err != nil {
  298. panic(err)
  299. }
  300. c.DataDir = n
  301. e, err = New(c)
  302. if err != nil {
  303. panic(err)
  304. }
  305. e.setId(id)
  306. e.SetTick(time.Millisecond * 5)
  307. m := http.NewServeMux()
  308. m.Handle("/", e)
  309. m.Handle("/raft", e.RaftHandler())
  310. m.Handle("/raft/", e.RaftHandler())
  311. if tls {
  312. h = httptest.NewTLSServer(m)
  313. } else {
  314. h = httptest.NewServer(m)
  315. }
  316. e.raftPubAddr = h.URL
  317. e.pubAddr = h.URL
  318. return
  319. }
  320. func destoryCluster(t *testing.T, es []*Server, hs []*httptest.Server) {
  321. for i := range es {
  322. e := es[len(es)-i-1]
  323. e.Stop()
  324. err := os.RemoveAll(e.config.DataDir)
  325. if err != nil {
  326. panic(err)
  327. t.Fatal(err)
  328. }
  329. }
  330. for i := range hs {
  331. hs[len(hs)-i-1].Close()
  332. }
  333. }
  334. func destroyServer(t *testing.T, e *Server, h *httptest.Server) {
  335. e.Stop()
  336. h.Close()
  337. err := os.RemoveAll(e.config.DataDir)
  338. if err != nil {
  339. panic(err)
  340. t.Fatal(err)
  341. }
  342. }
  343. func waitCluster(t *testing.T, es []*Server) {
  344. n := len(es)
  345. for _, e := range es {
  346. for k := 0; k < n; k++ {
  347. w, err := e.p.Watch(v2machineKVPrefix+fmt.Sprintf("/%d", es[k].id), true, false, 1)
  348. if err != nil {
  349. panic(err)
  350. }
  351. <-w.EventChan
  352. }
  353. }
  354. clusterId := es[0].p.node.ClusterId()
  355. for i, e := range es {
  356. if e.p.node.ClusterId() != clusterId {
  357. t.Errorf("#%d: clusterId = %x, want %x", i, e.p.node.ClusterId(), clusterId)
  358. }
  359. }
  360. }
  361. func waitMode(mode int64, e *Server) {
  362. for {
  363. if e.mode.Get() == mode {
  364. return
  365. }
  366. time.Sleep(10 * time.Millisecond)
  367. }
  368. }
  369. // checkParticipant checks the i-th server works well as participant.
  370. func checkParticipant(i int, es []*Server) error {
  371. lead, _ := waitActiveLeader(es)
  372. key := fmt.Sprintf("/%d", rand.Int31())
  373. ev, err := es[lead].p.Set(key, false, "bar", store.Permanent)
  374. if err != nil {
  375. return err
  376. }
  377. w, err := es[i].p.Watch(key, false, false, ev.Index())
  378. if err != nil {
  379. return err
  380. }
  381. select {
  382. case <-w.EventChan:
  383. case <-time.After(8 * defaultHeartbeat * es[i].tickDuration):
  384. return fmt.Errorf("watch timeout")
  385. }
  386. return nil
  387. }