etcd_test.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604
  1. package main
  2. import (
  3. "fmt"
  4. "math/rand"
  5. "net/http"
  6. "net/http/httptest"
  7. "net/url"
  8. "os"
  9. "strconv"
  10. "strings"
  11. "testing"
  12. "time"
  13. "github.com/coreos/etcd/server"
  14. "github.com/coreos/etcd/test"
  15. "github.com/coreos/go-etcd/etcd"
  16. )
  17. // Create a single node and try to set value
  18. func TestSingleNode(t *testing.T) {
  19. procAttr := new(os.ProcAttr)
  20. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  21. args := []string{"etcd", "-vv", "-n=node1", "-f", "-d=/tmp/node1"}
  22. process, err := os.StartProcess("etcd", args, procAttr)
  23. if err != nil {
  24. t.Fatal("start process failed:" + err.Error())
  25. return
  26. }
  27. defer process.Kill()
  28. time.Sleep(time.Second)
  29. c := etcd.NewClient()
  30. c.SyncCluster()
  31. // Test Set
  32. result, err := c.Set("foo", "bar", 100)
  33. if err != nil || result.Key != "/foo" || result.Value != "bar" || result.TTL < 95 {
  34. if err != nil {
  35. t.Fatal("Set 1: ", err)
  36. }
  37. t.Fatalf("Set 1 failed with %s %s %v", result.Key, result.Value, result.TTL)
  38. }
  39. time.Sleep(time.Second)
  40. result, err = c.Set("foo", "bar", 100)
  41. if err != nil || result.Key != "/foo" || result.Value != "bar" || result.PrevValue != "bar" || result.TTL != 100 {
  42. if err != nil {
  43. t.Fatal("Set 2: ", err)
  44. }
  45. t.Fatalf("Set 2 failed with %s %s %v", result.Key, result.Value, result.TTL)
  46. }
  47. // Add a test-and-set test
  48. // First, we'll test we can change the value if we get it write
  49. result, match, err := c.TestAndSet("foo", "bar", "foobar", 100)
  50. if err != nil || result.Key != "/foo" || result.Value != "foobar" || result.PrevValue != "bar" || result.TTL != 100 || !match {
  51. if err != nil {
  52. t.Fatal(err)
  53. }
  54. t.Fatalf("Set 3 failed with %s %s %v", result.Key, result.Value, result.TTL)
  55. }
  56. // Next, we'll make sure we can't set it without the correct prior value
  57. _, _, err = c.TestAndSet("foo", "bar", "foofoo", 100)
  58. if err == nil {
  59. t.Fatalf("Set 4 expecting error when setting key with incorrect previous value")
  60. }
  61. // Finally, we'll make sure a blank previous value still counts as a test-and-set and still has to match
  62. _, _, err = c.TestAndSet("foo", "", "barbar", 100)
  63. if err == nil {
  64. t.Fatalf("Set 5 expecting error when setting key with blank (incorrect) previous value")
  65. }
  66. }
  // TestInternalVersionFail ensures that etcd does not come up if the internal
  // raft versions do not match. It points a fresh etcd process (via -C) at a
  // fake peer whose /version endpoint answers with garbage, then verifies that
  // the version endpoint was queried, that /join was never attempted, and that
  // nothing is serving on 127.0.0.1:4001 afterwards.
  func TestInternalVersionFail(t *testing.T) {
  	// The handlers below run on the HTTP server's goroutines, not on the
  	// test goroutine. They therefore signal through a buffered channel
  	// instead of a shared bool, and report failures with t.Error because
  	// t.Fatal may only be called from the goroutine running the test.
  	versionChecked := make(chan struct{}, 1)

  	testMux := http.NewServeMux()

  	testMux.HandleFunc("/version", func(w http.ResponseWriter, r *http.Request) {
  		fmt.Fprintln(w, "This is not a version number")
  		select {
  		case versionChecked <- struct{}{}:
  		default:
  			// A previous request already recorded the check.
  		}
  	})

  	testMux.HandleFunc("/join", func(w http.ResponseWriter, r *http.Request) {
  		t.Error("should not attempt to join!")
  	})

  	ts := httptest.NewServer(testMux)
  	defer ts.Close()

  	fakeURL, err := url.Parse(ts.URL)
  	if err != nil {
  		t.Fatal("cannot parse test server URL: " + err.Error())
  	}

  	procAttr := new(os.ProcAttr)
  	procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  	args := []string{"etcd", "-n=node1", "-f", "-d=/tmp/node1", "-vv", "-C=" + fakeURL.Host}

  	process, err := os.StartProcess("etcd", args, procAttr)
  	if err != nil {
  		t.Fatal("start process failed:" + err.Error())
  	}
  	defer process.Kill()

  	time.Sleep(time.Second)

  	resp, err := http.Get("http://127.0.0.1:4001")
  	if err == nil {
  		resp.Body.Close()
  		t.Fatal("etcd node should not be up")
  	}

  	select {
  	case <-versionChecked:
  	default:
  		t.Fatal("etcd did not check the version")
  	}
  }
  102. // This test creates a single node and then set a value to it.
  103. // Then this test kills the node and restart it and tries to get the value again.
  104. func TestSingleNodeRecovery(t *testing.T) {
  105. procAttr := new(os.ProcAttr)
  106. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  107. args := []string{"etcd", "-n=node1", "-d=/tmp/node1"}
  108. process, err := os.StartProcess("etcd", append(args, "-f"), procAttr)
  109. if err != nil {
  110. t.Fatal("start process failed:" + err.Error())
  111. return
  112. }
  113. time.Sleep(time.Second)
  114. c := etcd.NewClient()
  115. c.SyncCluster()
  116. // Test Set
  117. result, err := c.Set("foo", "bar", 100)
  118. if err != nil || result.Key != "/foo" || result.Value != "bar" || result.TTL < 95 {
  119. if err != nil {
  120. t.Fatal(err)
  121. }
  122. t.Fatalf("Set 1 failed with %s %s %v", result.Key, result.Value, result.TTL)
  123. }
  124. time.Sleep(time.Second)
  125. process.Kill()
  126. process, err = os.StartProcess("etcd", args, procAttr)
  127. defer process.Kill()
  128. if err != nil {
  129. t.Fatal("start process failed:" + err.Error())
  130. return
  131. }
  132. time.Sleep(time.Second)
  133. results, err := c.Get("foo")
  134. if err != nil {
  135. t.Fatal("get fail: " + err.Error())
  136. return
  137. }
  138. result = results[0]
  139. if err != nil || result.Key != "/foo" || result.Value != "bar" || result.TTL > 99 {
  140. if err != nil {
  141. t.Fatal(err)
  142. }
  143. t.Fatalf("Recovery Get failed with %s %s %v", result.Key, result.Value, result.TTL)
  144. }
  145. }
  146. // Create a three nodes and try to set value
  147. func templateTestSimpleMultiNode(t *testing.T, tls bool) {
  148. procAttr := new(os.ProcAttr)
  149. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  150. clusterSize := 3
  151. _, etcds, err := test.CreateCluster(clusterSize, procAttr, tls)
  152. if err != nil {
  153. t.Fatal("cannot create cluster")
  154. }
  155. defer test.DestroyCluster(etcds)
  156. time.Sleep(time.Second)
  157. c := etcd.NewClient()
  158. c.SyncCluster()
  159. // Test Set
  160. result, err := c.Set("foo", "bar", 100)
  161. if err != nil || result.Key != "/foo" || result.Value != "bar" || result.TTL < 95 {
  162. if err != nil {
  163. t.Fatal(err)
  164. }
  165. t.Fatalf("Set 1 failed with %s %s %v", result.Key, result.Value, result.TTL)
  166. }
  167. time.Sleep(time.Second)
  168. result, err = c.Set("foo", "bar", 100)
  169. if err != nil || result.Key != "/foo" || result.Value != "bar" || result.PrevValue != "bar" || result.TTL != 100 {
  170. if err != nil {
  171. t.Fatal(err)
  172. }
  173. t.Fatalf("Set 2 failed with %s %s %v", result.Key, result.Value, result.TTL)
  174. }
  175. }
  176. func TestSimpleMultiNode(t *testing.T) {
  177. templateTestSimpleMultiNode(t, false)
  178. }
  179. func TestSimpleMultiNodeTls(t *testing.T) {
  180. templateTestSimpleMultiNode(t, true)
  181. }
  182. // Create a five nodes
  183. // Kill all the nodes and restart
  184. func TestMultiNodeKillAllAndRecovery(t *testing.T) {
  185. procAttr := new(os.ProcAttr)
  186. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  187. clusterSize := 5
  188. argGroup, etcds, err := test.CreateCluster(clusterSize, procAttr, false)
  189. if err != nil {
  190. t.Fatal("cannot create cluster")
  191. }
  192. c := etcd.NewClient()
  193. c.SyncCluster()
  194. time.Sleep(time.Second)
  195. // send 10 commands
  196. for i := 0; i < 10; i++ {
  197. // Test Set
  198. _, err := c.Set("foo", "bar", 0)
  199. if err != nil {
  200. panic(err)
  201. }
  202. }
  203. time.Sleep(time.Second)
  204. // kill all
  205. test.DestroyCluster(etcds)
  206. time.Sleep(time.Second)
  207. stop := make(chan bool)
  208. leaderChan := make(chan string, 1)
  209. all := make(chan bool, 1)
  210. time.Sleep(time.Second)
  211. for i := 0; i < clusterSize; i++ {
  212. etcds[i], err = os.StartProcess("etcd", argGroup[i], procAttr)
  213. }
  214. go test.Monitor(clusterSize, 1, leaderChan, all, stop)
  215. <-all
  216. <-leaderChan
  217. result, err := c.Set("foo", "bar", 0)
  218. if err != nil {
  219. t.Fatalf("Recovery error: %s", err)
  220. }
  221. if result.Index != 18 {
  222. t.Fatalf("recovery failed! [%d/18]", result.Index)
  223. }
  224. // kill all
  225. test.DestroyCluster(etcds)
  226. }
  227. // Create a five nodes
  228. // Randomly kill one of the node and keep on sending set command to the cluster
  229. func TestMultiNodeKillOne(t *testing.T) {
  230. procAttr := new(os.ProcAttr)
  231. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  232. clusterSize := 5
  233. argGroup, etcds, err := test.CreateCluster(clusterSize, procAttr, false)
  234. if err != nil {
  235. t.Fatal("cannot create cluster")
  236. }
  237. defer test.DestroyCluster(etcds)
  238. time.Sleep(2 * time.Second)
  239. c := etcd.NewClient()
  240. c.SyncCluster()
  241. stop := make(chan bool)
  242. // Test Set
  243. go test.Set(stop)
  244. for i := 0; i < 10; i++ {
  245. num := rand.Int() % clusterSize
  246. fmt.Println("kill node", num+1)
  247. // kill
  248. etcds[num].Kill()
  249. etcds[num].Release()
  250. time.Sleep(time.Second)
  251. // restart
  252. etcds[num], err = os.StartProcess("etcd", argGroup[num], procAttr)
  253. if err != nil {
  254. panic(err)
  255. }
  256. time.Sleep(time.Second)
  257. }
  258. fmt.Println("stop")
  259. stop <- true
  260. <-stop
  261. }
  262. // This test will kill the current leader and wait for the etcd cluster to elect a new leader for 200 times.
  263. // It will print out the election time and the average election time.
  264. func TestKillLeader(t *testing.T) {
  265. procAttr := new(os.ProcAttr)
  266. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  267. clusterSize := 5
  268. argGroup, etcds, err := test.CreateCluster(clusterSize, procAttr, false)
  269. if err != nil {
  270. t.Fatal("cannot create cluster")
  271. }
  272. defer test.DestroyCluster(etcds)
  273. stop := make(chan bool)
  274. leaderChan := make(chan string, 1)
  275. all := make(chan bool, 1)
  276. time.Sleep(time.Second)
  277. go test.Monitor(clusterSize, 1, leaderChan, all, stop)
  278. var totalTime time.Duration
  279. leader := "http://127.0.0.1:7001"
  280. for i := 0; i < clusterSize; i++ {
  281. fmt.Println("leader is ", leader)
  282. port, _ := strconv.Atoi(strings.Split(leader, ":")[2])
  283. num := port - 7001
  284. fmt.Println("kill server ", num)
  285. etcds[num].Kill()
  286. etcds[num].Release()
  287. start := time.Now()
  288. for {
  289. newLeader := <-leaderChan
  290. if newLeader != leader {
  291. leader = newLeader
  292. break
  293. }
  294. }
  295. take := time.Now().Sub(start)
  296. totalTime += take
  297. avgTime := totalTime / (time.Duration)(i+1)
  298. fmt.Println("Leader election time is ", take, "with election timeout", server.ElectionTimeout)
  299. fmt.Println("Leader election time average is", avgTime, "with election timeout", server.ElectionTimeout)
  300. etcds[num], err = os.StartProcess("etcd", argGroup[num], procAttr)
  301. }
  302. stop <- true
  303. }
  304. // TestKillRandom kills random machines in the cluster and
  305. // restart them after all other machines agree on the same leader
  306. func TestKillRandom(t *testing.T) {
  307. procAttr := new(os.ProcAttr)
  308. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  309. clusterSize := 9
  310. argGroup, etcds, err := test.CreateCluster(clusterSize, procAttr, false)
  311. if err != nil {
  312. t.Fatal("cannot create cluster")
  313. }
  314. defer test.DestroyCluster(etcds)
  315. stop := make(chan bool)
  316. leaderChan := make(chan string, 1)
  317. all := make(chan bool, 1)
  318. time.Sleep(3 * time.Second)
  319. go test.Monitor(clusterSize, 4, leaderChan, all, stop)
  320. toKill := make(map[int]bool)
  321. for i := 0; i < 20; i++ {
  322. fmt.Printf("TestKillRandom Round[%d/20]\n", i)
  323. j := 0
  324. for {
  325. r := rand.Int31n(9)
  326. if _, ok := toKill[int(r)]; !ok {
  327. j++
  328. toKill[int(r)] = true
  329. }
  330. if j > 3 {
  331. break
  332. }
  333. }
  334. for num, _ := range toKill {
  335. err := etcds[num].Kill()
  336. if err != nil {
  337. panic(err)
  338. }
  339. etcds[num].Wait()
  340. }
  341. time.Sleep(server.ElectionTimeout)
  342. <-leaderChan
  343. for num, _ := range toKill {
  344. etcds[num], err = os.StartProcess("etcd", argGroup[num], procAttr)
  345. }
  346. toKill = make(map[int]bool)
  347. <-all
  348. }
  349. stop <- true
  350. }
  351. // remove the node and node rejoin with previous log
  352. func TestRemoveNode(t *testing.T) {
  353. procAttr := new(os.ProcAttr)
  354. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  355. clusterSize := 3
  356. argGroup, etcds, _ := test.CreateCluster(clusterSize, procAttr, false)
  357. time.Sleep(time.Second)
  358. c := etcd.NewClient()
  359. c.SyncCluster()
  360. rmReq, _ := http.NewRequest("DELETE", "http://127.0.0.1:7001/remove/node3", nil)
  361. client := &http.Client{}
  362. for i := 0; i < 2; i++ {
  363. for i := 0; i < 2; i++ {
  364. client.Do(rmReq)
  365. etcds[2].Wait()
  366. resp, err := c.Get("_etcd/machines")
  367. if err != nil {
  368. panic(err)
  369. }
  370. if len(resp) != 2 {
  371. t.Fatal("cannot remove machine")
  372. }
  373. if i == 1 {
  374. // rejoin with log
  375. etcds[2], err = os.StartProcess("etcd", argGroup[2], procAttr)
  376. } else {
  377. // rejoin without log
  378. etcds[2], err = os.StartProcess("etcd", append(argGroup[2], "-f"), procAttr)
  379. }
  380. if err != nil {
  381. panic(err)
  382. }
  383. time.Sleep(time.Second)
  384. resp, err = c.Get("_etcd/machines")
  385. if err != nil {
  386. panic(err)
  387. }
  388. if len(resp) != 3 {
  389. t.Fatal("add machine fails")
  390. }
  391. }
  392. // first kill the node, then remove it, then add it back
  393. for i := 0; i < 2; i++ {
  394. etcds[2].Kill()
  395. etcds[2].Wait()
  396. client.Do(rmReq)
  397. resp, err := c.Get("_etcd/machines")
  398. if err != nil {
  399. panic(err)
  400. }
  401. if len(resp) != 2 {
  402. t.Fatal("cannot remove machine")
  403. }
  404. if i == 1 {
  405. // rejoin with log
  406. etcds[2], err = os.StartProcess("etcd", append(argGroup[2]), procAttr)
  407. } else {
  408. // rejoin without log
  409. etcds[2], err = os.StartProcess("etcd", append(argGroup[2], "-f"), procAttr)
  410. }
  411. if err != nil {
  412. panic(err)
  413. }
  414. time.Sleep(time.Second)
  415. resp, err = c.Get("_etcd/machines")
  416. if err != nil {
  417. panic(err)
  418. }
  419. if len(resp) != 3 {
  420. t.Fatal("add machine fails")
  421. }
  422. }
  423. }
  424. test.DestroyCluster(etcds)
  425. }
  426. func templateBenchmarkEtcdDirectCall(b *testing.B, tls bool) {
  427. procAttr := new(os.ProcAttr)
  428. procAttr.Files = []*os.File{nil, os.Stdout, os.Stderr}
  429. clusterSize := 3
  430. _, etcds, _ := test.CreateCluster(clusterSize, procAttr, tls)
  431. defer test.DestroyCluster(etcds)
  432. time.Sleep(time.Second)
  433. b.ResetTimer()
  434. for i := 0; i < b.N; i++ {
  435. resp, _ := http.Get("http://127.0.0.1:4001/test/speed")
  436. resp.Body.Close()
  437. }
  438. }
  439. func BenchmarkEtcdDirectCall(b *testing.B) {
  440. templateBenchmarkEtcdDirectCall(b, false)
  441. }
  442. func BenchmarkEtcdDirectCallTls(b *testing.B) {
  443. templateBenchmarkEtcdDirectCall(b, true)
  444. }