cluster_test.go 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623
  1. /*
  2. Copyright 2014 CoreOS, Inc.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package integration
  14. import (
  15. "fmt"
  16. "io/ioutil"
  17. "log"
  18. "math/rand"
  19. "net"
  20. "net/http"
  21. "net/http/httptest"
  22. "os"
  23. "reflect"
  24. "sort"
  25. "strconv"
  26. "strings"
  27. "testing"
  28. "time"
  29. "github.com/coreos/etcd/client"
  30. "github.com/coreos/etcd/etcdserver"
  31. "github.com/coreos/etcd/etcdserver/etcdhttp"
  32. "github.com/coreos/etcd/etcdserver/etcdhttp/httptypes"
  33. "github.com/coreos/etcd/pkg/testutil"
  34. "github.com/coreos/etcd/pkg/transport"
  35. "github.com/coreos/etcd/pkg/types"
  36. "github.com/coreos/etcd/rafthttp"
  37. "github.com/coreos/etcd/Godeps/_workspace/src/golang.org/x/net/context"
  38. )
  39. const (
  40. tickDuration = 10 * time.Millisecond
  41. clusterName = "etcd"
  42. requestTimeout = 2 * time.Second
  43. )
  44. var (
  45. electionTicks = 10
  46. )
  47. func init() {
  48. // open microsecond-level time log for integration test debugging
  49. log.SetFlags(log.Ltime | log.Lmicroseconds | log.Lshortfile)
  50. if t := os.Getenv("ETCD_ELECTION_TIMEOUT_TICKS"); t != "" {
  51. if i, err := strconv.ParseInt(t, 10, 64); err == nil {
  52. electionTicks = int(i)
  53. }
  54. }
  55. }
  56. func TestClusterOf1(t *testing.T) { testCluster(t, 1) }
  57. func TestClusterOf3(t *testing.T) { testCluster(t, 3) }
  58. func testCluster(t *testing.T, size int) {
  59. defer afterTest(t)
  60. c := NewCluster(t, size)
  61. c.Launch(t)
  62. defer c.Terminate(t)
  63. clusterMustProgress(t, c.Members)
  64. }
  65. func TestClusterOf1UsingDiscovery(t *testing.T) { testClusterUsingDiscovery(t, 1) }
  66. func TestClusterOf3UsingDiscovery(t *testing.T) { testClusterUsingDiscovery(t, 3) }
  67. func testClusterUsingDiscovery(t *testing.T, size int) {
  68. defer afterTest(t)
  69. dc := NewCluster(t, 1)
  70. dc.Launch(t)
  71. defer dc.Terminate(t)
  72. // init discovery token space
  73. dcc := mustNewHTTPClient(t, dc.URLs())
  74. dkapi := client.NewKeysAPI(dcc)
  75. ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
  76. if _, err := dkapi.Create(ctx, "/_config/size", fmt.Sprintf("%d", size), -1); err != nil {
  77. t.Fatal(err)
  78. }
  79. cancel()
  80. c := NewClusterByDiscovery(t, size, dc.URL(0)+"/v2/keys")
  81. c.Launch(t)
  82. defer c.Terminate(t)
  83. clusterMustProgress(t, c.Members)
  84. }
  85. func TestDoubleClusterSizeOf1(t *testing.T) { testDoubleClusterSize(t, 1) }
  86. func TestDoubleClusterSizeOf3(t *testing.T) { testDoubleClusterSize(t, 3) }
  87. func testDoubleClusterSize(t *testing.T, size int) {
  88. defer afterTest(t)
  89. c := NewCluster(t, size)
  90. c.Launch(t)
  91. defer c.Terminate(t)
  92. for i := 0; i < size; i++ {
  93. c.AddMember(t)
  94. }
  95. clusterMustProgress(t, c.Members)
  96. }
  97. func TestDecreaseClusterSizeOf3(t *testing.T) { testDecreaseClusterSize(t, 3) }
  98. func TestDecreaseClusterSizeOf5(t *testing.T) { testDecreaseClusterSize(t, 5) }
  99. func testDecreaseClusterSize(t *testing.T, size int) {
  100. defer afterTest(t)
  101. c := NewCluster(t, size)
  102. c.Launch(t)
  103. defer c.Terminate(t)
  104. // TODO: remove the last but one member
  105. for i := 0; i < size-1; i++ {
  106. id := c.Members[len(c.Members)-1].s.ID()
  107. c.RemoveMember(t, uint64(id))
  108. c.waitLeader(t, c.Members)
  109. }
  110. clusterMustProgress(t, c.Members)
  111. }
  112. func TestForceNewCluster(t *testing.T) {
  113. c := NewCluster(t, 3)
  114. c.Launch(t)
  115. cc := mustNewHTTPClient(t, []string{c.Members[0].URL()})
  116. kapi := client.NewKeysAPI(cc)
  117. ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
  118. resp, err := kapi.Create(ctx, "/foo", "bar", -1)
  119. if err != nil {
  120. t.Fatalf("unexpected create error: %v", err)
  121. }
  122. cancel()
  123. // ensure create has been applied in this machine
  124. ctx, cancel = context.WithTimeout(context.Background(), requestTimeout)
  125. if _, err := kapi.Watch("/foo", resp.Node.ModifiedIndex).Next(ctx); err != nil {
  126. t.Fatalf("unexpected watch error: %v", err)
  127. }
  128. cancel()
  129. c.Members[0].Stop(t)
  130. c.Members[1].Terminate(t)
  131. c.Members[2].Terminate(t)
  132. c.Members[0].ForceNewCluster = true
  133. err = c.Members[0].Restart(t)
  134. if err != nil {
  135. t.Fatalf("unexpected ForceRestart error: %v", err)
  136. }
  137. defer c.Members[0].Terminate(t)
  138. c.waitLeader(t, c.Members[:1])
  139. // use new http client to init new connection
  140. cc = mustNewHTTPClient(t, []string{c.Members[0].URL()})
  141. kapi = client.NewKeysAPI(cc)
  142. // ensure force restart keep the old data, and new cluster can make progress
  143. ctx, cancel = context.WithTimeout(context.Background(), requestTimeout)
  144. if _, err := kapi.Watch("/foo", resp.Node.ModifiedIndex).Next(ctx); err != nil {
  145. t.Fatalf("unexpected watch error: %v", err)
  146. }
  147. cancel()
  148. clusterMustProgress(t, c.Members[:1])
  149. }
  150. // clusterMustProgress ensures that cluster can make progress. It creates
  151. // a random key first, and check the new key could be got from all client urls
  152. // of the cluster.
  153. func clusterMustProgress(t *testing.T, membs []*member) {
  154. cc := mustNewHTTPClient(t, []string{membs[0].URL()})
  155. kapi := client.NewKeysAPI(cc)
  156. ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
  157. key := fmt.Sprintf("foo%d", rand.Int())
  158. resp, err := kapi.Create(ctx, "/"+key, "bar", -1)
  159. if err != nil {
  160. t.Fatalf("create on %s error: %v", membs[0].URL(), err)
  161. }
  162. cancel()
  163. for i, m := range membs {
  164. u := m.URL()
  165. cc := mustNewHTTPClient(t, []string{u})
  166. kapi := client.NewKeysAPI(cc)
  167. ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
  168. if _, err := kapi.Watch(key, resp.Node.ModifiedIndex).Next(ctx); err != nil {
  169. t.Fatalf("#%d: watch on %s error: %v", i, u, err)
  170. }
  171. cancel()
  172. }
  173. }
  174. // TODO: support TLS
  175. type cluster struct {
  176. Members []*member
  177. }
  178. func fillClusterForMembers(ms []*member, cName string) error {
  179. addrs := make([]string, 0)
  180. for _, m := range ms {
  181. for _, l := range m.PeerListeners {
  182. addrs = append(addrs, fmt.Sprintf("%s=%s", m.Name, "http://"+l.Addr().String()))
  183. }
  184. }
  185. clusterStr := strings.Join(addrs, ",")
  186. var err error
  187. for _, m := range ms {
  188. m.Cluster, err = etcdserver.NewClusterFromString(cName, clusterStr)
  189. if err != nil {
  190. return err
  191. }
  192. }
  193. return nil
  194. }
  195. // NewCluster returns an unlaunched cluster of the given size which has been
  196. // set to use static bootstrap.
  197. func NewCluster(t *testing.T, size int) *cluster {
  198. c := &cluster{}
  199. ms := make([]*member, size)
  200. for i := 0; i < size; i++ {
  201. ms[i] = mustNewMember(t, c.name(i))
  202. }
  203. c.Members = ms
  204. if err := fillClusterForMembers(c.Members, clusterName); err != nil {
  205. t.Fatal(err)
  206. }
  207. return c
  208. }
  209. // NewClusterUsingDiscovery returns an unlaunched cluster of the given size
  210. // which has been set to use the given url as discovery service to bootstrap.
  211. func NewClusterByDiscovery(t *testing.T, size int, url string) *cluster {
  212. c := &cluster{}
  213. ms := make([]*member, size)
  214. for i := 0; i < size; i++ {
  215. ms[i] = mustNewMember(t, c.name(i))
  216. ms[i].DiscoveryURL = url
  217. }
  218. c.Members = ms
  219. return c
  220. }
  221. func (c *cluster) Launch(t *testing.T) {
  222. errc := make(chan error)
  223. for _, m := range c.Members {
  224. // Members are launched in separate goroutines because if they boot
  225. // using discovery url, they have to wait for others to register to continue.
  226. go func(m *member) {
  227. errc <- m.Launch()
  228. }(m)
  229. }
  230. for _ = range c.Members {
  231. if err := <-errc; err != nil {
  232. t.Fatalf("error setting up member: %v", err)
  233. }
  234. }
  235. // wait cluster to be stable to receive future client requests
  236. c.waitMembersMatch(t, c.HTTPMembers())
  237. }
  238. func (c *cluster) URL(i int) string {
  239. return c.Members[i].ClientURLs[0].String()
  240. }
  241. func (c *cluster) URLs() []string {
  242. urls := make([]string, 0)
  243. for _, m := range c.Members {
  244. for _, u := range m.ClientURLs {
  245. urls = append(urls, u.String())
  246. }
  247. }
  248. return urls
  249. }
  250. func (c *cluster) HTTPMembers() []httptypes.Member {
  251. ms := make([]httptypes.Member, len(c.Members))
  252. for i, m := range c.Members {
  253. ms[i].Name = m.Name
  254. for _, ln := range m.PeerListeners {
  255. ms[i].PeerURLs = append(ms[i].PeerURLs, "http://"+ln.Addr().String())
  256. }
  257. for _, ln := range m.ClientListeners {
  258. ms[i].ClientURLs = append(ms[i].ClientURLs, "http://"+ln.Addr().String())
  259. }
  260. }
  261. return ms
  262. }
  263. func (c *cluster) AddMember(t *testing.T) {
  264. clusterStr := c.Members[0].Cluster.String()
  265. idx := len(c.Members)
  266. m := mustNewMember(t, c.name(idx))
  267. // send add request to the cluster
  268. cc := mustNewHTTPClient(t, []string{c.URL(0)})
  269. ma := client.NewMembersAPI(cc)
  270. ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
  271. peerURL := "http://" + m.PeerListeners[0].Addr().String()
  272. if _, err := ma.Add(ctx, peerURL); err != nil {
  273. t.Fatalf("add member on %s error: %v", c.URL(0), err)
  274. }
  275. cancel()
  276. // wait for the add node entry applied in the cluster
  277. members := append(c.HTTPMembers(), httptypes.Member{PeerURLs: []string{peerURL}, ClientURLs: []string{}})
  278. c.waitMembersMatch(t, members)
  279. for _, ln := range m.PeerListeners {
  280. clusterStr += fmt.Sprintf(",%s=http://%s", m.Name, ln.Addr().String())
  281. }
  282. var err error
  283. m.Cluster, err = etcdserver.NewClusterFromString(clusterName, clusterStr)
  284. if err != nil {
  285. t.Fatal(err)
  286. }
  287. m.NewCluster = false
  288. if err := m.Launch(); err != nil {
  289. t.Fatal(err)
  290. }
  291. c.Members = append(c.Members, m)
  292. // wait cluster to be stable to receive future client requests
  293. c.waitMembersMatch(t, c.HTTPMembers())
  294. }
  295. func (c *cluster) RemoveMember(t *testing.T, id uint64) {
  296. // send remove request to the cluster
  297. cc := mustNewHTTPClient(t, []string{c.URL(0)})
  298. ma := client.NewMembersAPI(cc)
  299. ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
  300. if err := ma.Remove(ctx, types.ID(id).String()); err != nil {
  301. t.Fatalf("unexpected remove error %v", err)
  302. }
  303. cancel()
  304. newMembers := make([]*member, 0)
  305. for _, m := range c.Members {
  306. if uint64(m.s.ID()) != id {
  307. newMembers = append(newMembers, m)
  308. } else {
  309. select {
  310. case <-m.s.StopNotify():
  311. m.Terminate(t)
  312. // stop delay / election timeout + 1s disk and network delay
  313. case <-time.After(time.Duration(electionTicks)*tickDuration + time.Second):
  314. t.Fatalf("failed to remove member %s in time", m.s.ID())
  315. }
  316. }
  317. }
  318. c.Members = newMembers
  319. c.waitMembersMatch(t, c.HTTPMembers())
  320. }
  321. func (c *cluster) Terminate(t *testing.T) {
  322. for _, m := range c.Members {
  323. m.Terminate(t)
  324. }
  325. }
  326. func (c *cluster) waitMembersMatch(t *testing.T, membs []httptypes.Member) {
  327. for _, u := range c.URLs() {
  328. cc := mustNewHTTPClient(t, []string{u})
  329. ma := client.NewMembersAPI(cc)
  330. for {
  331. ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
  332. ms, err := ma.List(ctx)
  333. cancel()
  334. if err == nil && isMembersEqual(ms, membs) {
  335. break
  336. }
  337. time.Sleep(tickDuration)
  338. }
  339. }
  340. return
  341. }
  342. func (c *cluster) waitLeader(t *testing.T, membs []*member) {
  343. possibleLead := make(map[uint64]bool)
  344. var lead uint64
  345. for _, m := range membs {
  346. possibleLead[uint64(m.s.ID())] = true
  347. }
  348. for lead == 0 || !possibleLead[lead] {
  349. lead = 0
  350. for _, m := range membs {
  351. if lead != 0 && lead != m.s.Lead() {
  352. lead = 0
  353. break
  354. }
  355. lead = m.s.Lead()
  356. }
  357. time.Sleep(10 * tickDuration)
  358. }
  359. }
  360. func (c *cluster) name(i int) string {
  361. return fmt.Sprint("node", i)
  362. }
  363. // isMembersEqual checks whether two members equal except ID field.
  364. // The given wmembs should always set ID field to empty string.
  365. func isMembersEqual(membs []httptypes.Member, wmembs []httptypes.Member) bool {
  366. sort.Sort(SortableMemberSliceByPeerURLs(membs))
  367. sort.Sort(SortableMemberSliceByPeerURLs(wmembs))
  368. for i := range membs {
  369. membs[i].ID = ""
  370. }
  371. return reflect.DeepEqual(membs, wmembs)
  372. }
  373. func newLocalListener(t *testing.T) net.Listener {
  374. l, err := net.Listen("tcp", "127.0.0.1:0")
  375. if err != nil {
  376. t.Fatal(err)
  377. }
  378. return l
  379. }
  380. func newListenerWithAddr(t *testing.T, addr string) net.Listener {
  381. var err error
  382. var l net.Listener
  383. // TODO: we want to reuse a previous closed port immediately.
  384. // a better way is to set SO_REUSExx instead of doing retry.
  385. for i := 0; i < 5; i++ {
  386. l, err = net.Listen("tcp", addr)
  387. if err == nil {
  388. break
  389. }
  390. time.Sleep(500 * time.Millisecond)
  391. }
  392. if err != nil {
  393. t.Fatal(err)
  394. }
  395. return l
  396. }
  397. type member struct {
  398. etcdserver.ServerConfig
  399. PeerListeners, ClientListeners []net.Listener
  400. raftHandler *testutil.PauseableHandler
  401. s *etcdserver.EtcdServer
  402. hss []*httptest.Server
  403. }
  404. func mustNewMember(t *testing.T, name string) *member {
  405. var err error
  406. m := &member{}
  407. pln := newLocalListener(t)
  408. m.PeerListeners = []net.Listener{pln}
  409. m.PeerURLs, err = types.NewURLs([]string{"http://" + pln.Addr().String()})
  410. if err != nil {
  411. t.Fatal(err)
  412. }
  413. cln := newLocalListener(t)
  414. m.ClientListeners = []net.Listener{cln}
  415. m.ClientURLs, err = types.NewURLs([]string{"http://" + cln.Addr().String()})
  416. if err != nil {
  417. t.Fatal(err)
  418. }
  419. m.Name = name
  420. m.DataDir, err = ioutil.TempDir(os.TempDir(), "etcd")
  421. if err != nil {
  422. t.Fatal(err)
  423. }
  424. clusterStr := fmt.Sprintf("%s=http://%s", name, pln.Addr().String())
  425. m.Cluster, err = etcdserver.NewClusterFromString(clusterName, clusterStr)
  426. if err != nil {
  427. t.Fatal(err)
  428. }
  429. m.NewCluster = true
  430. m.Transport = mustNewTransport(t)
  431. m.ElectionTimeoutTicks = electionTicks
  432. return m
  433. }
  434. // Clone returns a member with the same server configuration. The returned
  435. // member will not set PeerListeners and ClientListeners.
  436. func (m *member) Clone(t *testing.T) *member {
  437. mm := &member{}
  438. mm.ServerConfig = m.ServerConfig
  439. var err error
  440. clientURLStrs := m.ClientURLs.StringSlice()
  441. mm.ClientURLs, err = types.NewURLs(clientURLStrs)
  442. if err != nil {
  443. // this should never fail
  444. panic(err)
  445. }
  446. peerURLStrs := m.PeerURLs.StringSlice()
  447. mm.PeerURLs, err = types.NewURLs(peerURLStrs)
  448. if err != nil {
  449. // this should never fail
  450. panic(err)
  451. }
  452. clusterStr := m.Cluster.String()
  453. mm.Cluster, err = etcdserver.NewClusterFromString(clusterName, clusterStr)
  454. if err != nil {
  455. // this should never fail
  456. panic(err)
  457. }
  458. mm.Transport = mustNewTransport(t)
  459. mm.ElectionTimeoutTicks = m.ElectionTimeoutTicks
  460. return mm
  461. }
  462. // Launch starts a member based on ServerConfig, PeerListeners
  463. // and ClientListeners.
  464. func (m *member) Launch() error {
  465. var err error
  466. if m.s, err = etcdserver.NewServer(&m.ServerConfig); err != nil {
  467. return fmt.Errorf("failed to initialize the etcd server: %v", err)
  468. }
  469. m.s.Ticker = time.Tick(tickDuration)
  470. m.s.SyncTicker = time.Tick(500 * time.Millisecond)
  471. m.s.Start()
  472. m.raftHandler = &testutil.PauseableHandler{Next: etcdhttp.NewPeerHandler(m.s.Cluster, m.s.RaftHandler())}
  473. for _, ln := range m.PeerListeners {
  474. hs := &httptest.Server{
  475. Listener: ln,
  476. Config: &http.Server{Handler: m.raftHandler},
  477. }
  478. hs.Start()
  479. m.hss = append(m.hss, hs)
  480. }
  481. for _, ln := range m.ClientListeners {
  482. hs := &httptest.Server{
  483. Listener: ln,
  484. Config: &http.Server{Handler: etcdhttp.NewClientHandler(m.s)},
  485. }
  486. hs.Start()
  487. m.hss = append(m.hss, hs)
  488. }
  489. return nil
  490. }
  491. func (m *member) URL() string { return m.ClientURLs[0].String() }
  492. func (m *member) Pause() {
  493. m.raftHandler.Pause()
  494. m.s.PauseSending()
  495. }
  496. func (m *member) Resume() {
  497. m.raftHandler.Resume()
  498. m.s.ResumeSending()
  499. }
  500. // Stop stops the member, but the data dir of the member is preserved.
  501. func (m *member) Stop(t *testing.T) {
  502. m.s.Stop()
  503. for _, hs := range m.hss {
  504. hs.CloseClientConnections()
  505. hs.Close()
  506. }
  507. m.hss = nil
  508. }
  509. // Start starts the member using the preserved data dir.
  510. func (m *member) Restart(t *testing.T) error {
  511. newPeerListeners := make([]net.Listener, 0)
  512. for _, ln := range m.PeerListeners {
  513. newPeerListeners = append(newPeerListeners, newListenerWithAddr(t, ln.Addr().String()))
  514. }
  515. m.PeerListeners = newPeerListeners
  516. newClientListeners := make([]net.Listener, 0)
  517. for _, ln := range m.ClientListeners {
  518. newClientListeners = append(newClientListeners, newListenerWithAddr(t, ln.Addr().String()))
  519. }
  520. m.ClientListeners = newClientListeners
  521. return m.Launch()
  522. }
  523. // Terminate stops the member and removes the data dir.
  524. func (m *member) Terminate(t *testing.T) {
  525. m.s.Stop()
  526. for _, hs := range m.hss {
  527. hs.CloseClientConnections()
  528. hs.Close()
  529. }
  530. if err := os.RemoveAll(m.ServerConfig.DataDir); err != nil {
  531. t.Fatal(err)
  532. }
  533. }
  534. func mustNewHTTPClient(t *testing.T, eps []string) client.HTTPClient {
  535. cc, err := client.NewHTTPClient(mustNewTransport(t), eps)
  536. if err != nil {
  537. t.Fatal(err)
  538. }
  539. return cc
  540. }
  541. func mustNewTransport(t *testing.T) *http.Transport {
  542. tr, err := transport.NewTimeoutTransport(transport.TLSInfo{}, rafthttp.ConnReadTimeout, rafthttp.ConnWriteTimeout)
  543. if err != nil {
  544. t.Fatal(err)
  545. }
  546. return tr
  547. }
  548. type SortableMemberSliceByPeerURLs []httptypes.Member
  549. func (p SortableMemberSliceByPeerURLs) Len() int { return len(p) }
  550. func (p SortableMemberSliceByPeerURLs) Less(i, j int) bool {
  551. return p[i].PeerURLs[0] < p[j].PeerURLs[0]
  552. }
  553. func (p SortableMemberSliceByPeerURLs) Swap(i, j int) { p[i], p[j] = p[j], p[i] }