| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639 |
- // Copyright 2015 CoreOS, Inc.
- //
- // Licensed under the Apache License, Version 2.0 (the "License");
- // you may not use this file except in compliance with the License.
- // You may obtain a copy of the License at
- //
- // http://www.apache.org/licenses/LICENSE-2.0
- //
- // Unless required by applicable law or agreed to in writing, software
- // distributed under the License is distributed on an "AS IS" BASIS,
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- // See the License for the specific language governing permissions and
- // limitations under the License.
- package integration
- import (
- "fmt"
- "io/ioutil"
- "log"
- "math/rand"
- "net"
- "net/http"
- "net/http/httptest"
- "os"
- "reflect"
- "sort"
- "strconv"
- "strings"
- "testing"
- "time"
- "github.com/coreos/etcd/client"
- "github.com/coreos/etcd/etcdserver"
- "github.com/coreos/etcd/etcdserver/etcdhttp"
- "github.com/coreos/etcd/pkg/testutil"
- "github.com/coreos/etcd/pkg/transport"
- "github.com/coreos/etcd/pkg/types"
- "github.com/coreos/etcd/rafthttp"
- "github.com/coreos/etcd/Godeps/_workspace/src/golang.org/x/net/context"
- )
// Naming and timing parameters shared by the cluster helpers in this file.
const (
	// clusterName is the cluster name handed to etcdserver.NewClusterFromString.
	clusterName = "etcd"
	// tickDuration is the length of one tick configured on every member; the
	// polling helpers also use it as their sleep interval.
	tickDuration = 10 * time.Millisecond
	// requestTimeout bounds each individual client request issued by the helpers.
	requestTimeout = 2 * time.Second
)

// electionTicks is the ElectionTicks value given to new members. init
// replaces it when ETCD_ELECTION_TIMEOUT_TICKS holds a parsable integer.
var electionTicks = 10
- func init() {
- // open microsecond-level time log for integration test debugging
- log.SetFlags(log.Ltime | log.Lmicroseconds | log.Lshortfile)
- if t := os.Getenv("ETCD_ELECTION_TIMEOUT_TICKS"); t != "" {
- if i, err := strconv.ParseInt(t, 10, 64); err == nil {
- electionTicks = int(i)
- }
- }
- }
- func TestClusterOf1(t *testing.T) { testCluster(t, 1) }
- func TestClusterOf3(t *testing.T) { testCluster(t, 3) }
- func testCluster(t *testing.T, size int) {
- defer afterTest(t)
- c := NewCluster(t, size)
- c.Launch(t)
- defer c.Terminate(t)
- clusterMustProgress(t, c.Members)
- }
- func TestClusterOf1UsingDiscovery(t *testing.T) { testClusterUsingDiscovery(t, 1) }
- func TestClusterOf3UsingDiscovery(t *testing.T) { testClusterUsingDiscovery(t, 3) }
- func testClusterUsingDiscovery(t *testing.T, size int) {
- defer afterTest(t)
- dc := NewCluster(t, 1)
- dc.Launch(t)
- defer dc.Terminate(t)
- // init discovery token space
- dcc := mustNewHTTPClient(t, dc.URLs())
- dkapi := client.NewKeysAPI(dcc)
- ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
- if _, err := dkapi.Create(ctx, "/_config/size", fmt.Sprintf("%d", size)); err != nil {
- t.Fatal(err)
- }
- cancel()
- c := NewClusterByDiscovery(t, size, dc.URL(0)+"/v2/keys")
- c.Launch(t)
- defer c.Terminate(t)
- clusterMustProgress(t, c.Members)
- }
- func TestDoubleClusterSizeOf1(t *testing.T) { testDoubleClusterSize(t, 1) }
- func TestDoubleClusterSizeOf3(t *testing.T) { testDoubleClusterSize(t, 3) }
- func testDoubleClusterSize(t *testing.T, size int) {
- defer afterTest(t)
- c := NewCluster(t, size)
- c.Launch(t)
- defer c.Terminate(t)
- for i := 0; i < size; i++ {
- c.AddMember(t)
- }
- clusterMustProgress(t, c.Members)
- }
- func TestDecreaseClusterSizeOf3(t *testing.T) { testDecreaseClusterSize(t, 3) }
- func TestDecreaseClusterSizeOf5(t *testing.T) { testDecreaseClusterSize(t, 5) }
- func testDecreaseClusterSize(t *testing.T, size int) {
- defer afterTest(t)
- c := NewCluster(t, size)
- c.Launch(t)
- defer c.Terminate(t)
- // TODO: remove the last but one member
- for i := 0; i < size-1; i++ {
- id := c.Members[len(c.Members)-1].s.ID()
- c.RemoveMember(t, uint64(id))
- c.waitLeader(t, c.Members)
- }
- clusterMustProgress(t, c.Members)
- }
- func TestForceNewCluster(t *testing.T) {
- c := NewCluster(t, 3)
- c.Launch(t)
- cc := mustNewHTTPClient(t, []string{c.Members[0].URL()})
- kapi := client.NewKeysAPI(cc)
- ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
- resp, err := kapi.Create(ctx, "/foo", "bar")
- if err != nil {
- t.Fatalf("unexpected create error: %v", err)
- }
- cancel()
- // ensure create has been applied in this machine
- ctx, cancel = context.WithTimeout(context.Background(), requestTimeout)
- if _, err := kapi.Watcher("/foo", &client.WatcherOptions{AfterIndex: resp.Node.ModifiedIndex - 1}).Next(ctx); err != nil {
- t.Fatalf("unexpected watch error: %v", err)
- }
- cancel()
- c.Members[0].Stop(t)
- c.Members[1].Terminate(t)
- c.Members[2].Terminate(t)
- c.Members[0].ForceNewCluster = true
- err = c.Members[0].Restart(t)
- if err != nil {
- t.Fatalf("unexpected ForceRestart error: %v", err)
- }
- defer c.Members[0].Terminate(t)
- c.waitLeader(t, c.Members[:1])
- // use new http client to init new connection
- cc = mustNewHTTPClient(t, []string{c.Members[0].URL()})
- kapi = client.NewKeysAPI(cc)
- // ensure force restart keep the old data, and new cluster can make progress
- ctx, cancel = context.WithTimeout(context.Background(), requestTimeout)
- if _, err := kapi.Watcher("/foo", &client.WatcherOptions{AfterIndex: resp.Node.ModifiedIndex - 1}).Next(ctx); err != nil {
- t.Fatalf("unexpected watch error: %v", err)
- }
- cancel()
- clusterMustProgress(t, c.Members[:1])
- }
- // clusterMustProgress ensures that cluster can make progress. It creates
- // a random key first, and check the new key could be got from all client urls
- // of the cluster.
- func clusterMustProgress(t *testing.T, membs []*member) {
- cc := mustNewHTTPClient(t, []string{membs[0].URL()})
- kapi := client.NewKeysAPI(cc)
- ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
- key := fmt.Sprintf("foo%d", rand.Int())
- resp, err := kapi.Create(ctx, "/"+key, "bar")
- if err != nil {
- t.Fatalf("create on %s error: %v", membs[0].URL(), err)
- }
- cancel()
- for i, m := range membs {
- u := m.URL()
- mcc := mustNewHTTPClient(t, []string{u})
- mkapi := client.NewKeysAPI(mcc)
- mctx, mcancel := context.WithTimeout(context.Background(), requestTimeout)
- if _, err := mkapi.Watcher(key, &client.WatcherOptions{AfterIndex: resp.Node.ModifiedIndex - 1}).Next(mctx); err != nil {
- t.Fatalf("#%d: watch on %s error: %v", i, u, err)
- }
- mcancel()
- }
- }
- // TODO: support TLS
- type cluster struct {
- Members []*member
- }
- func fillClusterForMembers(ms []*member, cName string) error {
- addrs := make([]string, 0)
- for _, m := range ms {
- for _, l := range m.PeerListeners {
- addrs = append(addrs, fmt.Sprintf("%s=%s", m.Name, "http://"+l.Addr().String()))
- }
- }
- clusterStr := strings.Join(addrs, ",")
- var err error
- for _, m := range ms {
- m.Cluster, err = etcdserver.NewClusterFromString(cName, clusterStr)
- if err != nil {
- return err
- }
- }
- return nil
- }
- // NewCluster returns an unlaunched cluster of the given size which has been
- // set to use static bootstrap.
- func NewCluster(t *testing.T, size int) *cluster {
- c := &cluster{}
- ms := make([]*member, size)
- for i := 0; i < size; i++ {
- ms[i] = mustNewMember(t, c.name(i))
- }
- c.Members = ms
- if err := fillClusterForMembers(c.Members, clusterName); err != nil {
- t.Fatal(err)
- }
- return c
- }
- // NewClusterUsingDiscovery returns an unlaunched cluster of the given size
- // which has been set to use the given url as discovery service to bootstrap.
- func NewClusterByDiscovery(t *testing.T, size int, url string) *cluster {
- c := &cluster{}
- ms := make([]*member, size)
- for i := 0; i < size; i++ {
- ms[i] = mustNewMember(t, c.name(i))
- ms[i].DiscoveryURL = url
- }
- c.Members = ms
- return c
- }
- func (c *cluster) Launch(t *testing.T) {
- errc := make(chan error)
- for _, m := range c.Members {
- // Members are launched in separate goroutines because if they boot
- // using discovery url, they have to wait for others to register to continue.
- go func(m *member) {
- errc <- m.Launch()
- }(m)
- }
- for _ = range c.Members {
- if err := <-errc; err != nil {
- t.Fatalf("error setting up member: %v", err)
- }
- }
- // wait cluster to be stable to receive future client requests
- c.waitMembersMatch(t, c.HTTPMembers())
- }
- func (c *cluster) URL(i int) string {
- return c.Members[i].ClientURLs[0].String()
- }
- func (c *cluster) URLs() []string {
- urls := make([]string, 0)
- for _, m := range c.Members {
- for _, u := range m.ClientURLs {
- urls = append(urls, u.String())
- }
- }
- return urls
- }
- func (c *cluster) HTTPMembers() []client.Member {
- ms := make([]client.Member, len(c.Members))
- for i, m := range c.Members {
- ms[i].Name = m.Name
- for _, ln := range m.PeerListeners {
- ms[i].PeerURLs = append(ms[i].PeerURLs, "http://"+ln.Addr().String())
- }
- for _, ln := range m.ClientListeners {
- ms[i].ClientURLs = append(ms[i].ClientURLs, "http://"+ln.Addr().String())
- }
- }
- return ms
- }
- func (c *cluster) AddMember(t *testing.T) {
- clusterStr := c.Members[0].Cluster.String()
- idx := len(c.Members)
- m := mustNewMember(t, c.name(idx))
- // send add request to the cluster
- cc := mustNewHTTPClient(t, []string{c.URL(0)})
- ma := client.NewMembersAPI(cc)
- ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
- peerURL := "http://" + m.PeerListeners[0].Addr().String()
- if _, err := ma.Add(ctx, peerURL); err != nil {
- t.Fatalf("add member on %s error: %v", c.URL(0), err)
- }
- cancel()
- // wait for the add node entry applied in the cluster
- members := append(c.HTTPMembers(), client.Member{PeerURLs: []string{peerURL}, ClientURLs: []string{}})
- c.waitMembersMatch(t, members)
- for _, ln := range m.PeerListeners {
- clusterStr += fmt.Sprintf(",%s=http://%s", m.Name, ln.Addr().String())
- }
- var err error
- m.Cluster, err = etcdserver.NewClusterFromString(clusterName, clusterStr)
- if err != nil {
- t.Fatal(err)
- }
- m.NewCluster = false
- if err := m.Launch(); err != nil {
- t.Fatal(err)
- }
- c.Members = append(c.Members, m)
- // wait cluster to be stable to receive future client requests
- c.waitMembersMatch(t, c.HTTPMembers())
- }
- func (c *cluster) RemoveMember(t *testing.T, id uint64) {
- // send remove request to the cluster
- cc := mustNewHTTPClient(t, []string{c.URL(0)})
- ma := client.NewMembersAPI(cc)
- ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
- if err := ma.Remove(ctx, types.ID(id).String()); err != nil {
- t.Fatalf("unexpected remove error %v", err)
- }
- cancel()
- newMembers := make([]*member, 0)
- for _, m := range c.Members {
- if uint64(m.s.ID()) != id {
- newMembers = append(newMembers, m)
- } else {
- select {
- case <-m.s.StopNotify():
- m.Terminate(t)
- // stop delay / election timeout + 1s disk and network delay
- case <-time.After(time.Duration(electionTicks)*tickDuration + time.Second):
- t.Fatalf("failed to remove member %s in time", m.s.ID())
- }
- }
- }
- c.Members = newMembers
- c.waitMembersMatch(t, c.HTTPMembers())
- }
- func (c *cluster) Terminate(t *testing.T) {
- for _, m := range c.Members {
- m.Terminate(t)
- }
- }
- func (c *cluster) waitMembersMatch(t *testing.T, membs []client.Member) {
- for _, u := range c.URLs() {
- cc := mustNewHTTPClient(t, []string{u})
- ma := client.NewMembersAPI(cc)
- for {
- ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
- ms, err := ma.List(ctx)
- cancel()
- if err == nil && isMembersEqual(ms, membs) {
- break
- }
- time.Sleep(tickDuration)
- }
- }
- return
- }
- func (c *cluster) waitLeader(t *testing.T, membs []*member) {
- possibleLead := make(map[uint64]bool)
- var lead uint64
- for _, m := range membs {
- possibleLead[uint64(m.s.ID())] = true
- }
- for lead == 0 || !possibleLead[lead] {
- lead = 0
- for _, m := range membs {
- if lead != 0 && lead != m.s.Lead() {
- lead = 0
- break
- }
- lead = m.s.Lead()
- }
- time.Sleep(10 * tickDuration)
- }
- }
- func (c *cluster) name(i int) string {
- return fmt.Sprint("node", i)
- }
- // isMembersEqual checks whether two members equal except ID field.
- // The given wmembs should always set ID field to empty string.
- func isMembersEqual(membs []client.Member, wmembs []client.Member) bool {
- sort.Sort(SortableMemberSliceByPeerURLs(membs))
- sort.Sort(SortableMemberSliceByPeerURLs(wmembs))
- for i := range membs {
- membs[i].ID = ""
- }
- return reflect.DeepEqual(membs, wmembs)
- }
// newLocalListener opens a TCP listener on 127.0.0.1 with a system-chosen
// port and fails the test if listening is not possible.
func newLocalListener(t *testing.T) net.Listener {
	ln, err := net.Listen("tcp", "127.0.0.1:0")
	if err == nil {
		return ln
	}
	t.Fatal(err)
	return ln
}
// newListenerWithAddr opens a TCP listener on addr. It makes up to five
// attempts, sleeping 500ms after each failure, and fails the test with the
// last error if none of them succeeds.
func newListenerWithAddr(t *testing.T, addr string) net.Listener {
	const (
		attempts = 5
		backoff  = 500 * time.Millisecond
	)
	var (
		ln  net.Listener
		err error
	)
	// TODO: we want to reuse a previous closed port immediately.
	// a better way is to set SO_REUSExx instead of doing retry.
	for try := 0; try < attempts; try++ {
		if ln, err = net.Listen("tcp", addr); err == nil {
			return ln
		}
		time.Sleep(backoff)
	}
	t.Fatal(err)
	return ln
}
- type member struct {
- etcdserver.ServerConfig
- PeerListeners, ClientListeners []net.Listener
- raftHandler *testutil.PauseableHandler
- s *etcdserver.EtcdServer
- hss []*httptest.Server
- }
- func mustNewMember(t *testing.T, name string) *member {
- var err error
- m := &member{}
- pln := newLocalListener(t)
- m.PeerListeners = []net.Listener{pln}
- m.PeerURLs, err = types.NewURLs([]string{"http://" + pln.Addr().String()})
- if err != nil {
- t.Fatal(err)
- }
- cln := newLocalListener(t)
- m.ClientListeners = []net.Listener{cln}
- m.ClientURLs, err = types.NewURLs([]string{"http://" + cln.Addr().String()})
- if err != nil {
- t.Fatal(err)
- }
- m.Name = name
- m.DataDir, err = ioutil.TempDir(os.TempDir(), "etcd")
- if err != nil {
- t.Fatal(err)
- }
- clusterStr := fmt.Sprintf("%s=http://%s", name, pln.Addr().String())
- m.Cluster, err = etcdserver.NewClusterFromString(clusterName, clusterStr)
- if err != nil {
- t.Fatal(err)
- }
- m.NewCluster = true
- m.Transport = mustNewTransport(t)
- m.ElectionTicks = electionTicks
- m.TickMs = uint(tickDuration / time.Millisecond)
- return m
- }
- // Clone returns a member with the same server configuration. The returned
- // member will not set PeerListeners and ClientListeners.
- func (m *member) Clone(t *testing.T) *member {
- mm := &member{}
- mm.ServerConfig = m.ServerConfig
- var err error
- clientURLStrs := m.ClientURLs.StringSlice()
- mm.ClientURLs, err = types.NewURLs(clientURLStrs)
- if err != nil {
- // this should never fail
- panic(err)
- }
- peerURLStrs := m.PeerURLs.StringSlice()
- mm.PeerURLs, err = types.NewURLs(peerURLStrs)
- if err != nil {
- // this should never fail
- panic(err)
- }
- clusterStr := m.Cluster.String()
- mm.Cluster, err = etcdserver.NewClusterFromString(clusterName, clusterStr)
- if err != nil {
- // this should never fail
- panic(err)
- }
- mm.Transport = mustNewTransport(t)
- mm.ElectionTicks = m.ElectionTicks
- return mm
- }
- // Launch starts a member based on ServerConfig, PeerListeners
- // and ClientListeners.
- func (m *member) Launch() error {
- var err error
- if m.s, err = etcdserver.NewServer(&m.ServerConfig); err != nil {
- return fmt.Errorf("failed to initialize the etcd server: %v", err)
- }
- m.s.SyncTicker = time.Tick(500 * time.Millisecond)
- m.s.Start()
- m.raftHandler = &testutil.PauseableHandler{Next: etcdhttp.NewPeerHandler(m.s.Cluster, m.s, m.s.RaftHandler())}
- for _, ln := range m.PeerListeners {
- hs := &httptest.Server{
- Listener: ln,
- Config: &http.Server{Handler: m.raftHandler},
- }
- hs.Start()
- m.hss = append(m.hss, hs)
- }
- for _, ln := range m.ClientListeners {
- hs := &httptest.Server{
- Listener: ln,
- Config: &http.Server{Handler: etcdhttp.NewClientHandler(m.s)},
- }
- hs.Start()
- m.hss = append(m.hss, hs)
- }
- return nil
- }
- func (m *member) WaitOK(t *testing.T) {
- cc := mustNewHTTPClient(t, []string{m.URL()})
- kapi := client.NewKeysAPI(cc)
- for {
- ctx, cancel := context.WithTimeout(context.Background(), requestTimeout)
- _, err := kapi.Get(ctx, "/", nil)
- if err != nil {
- time.Sleep(tickDuration)
- continue
- }
- cancel()
- break
- }
- for m.s.Leader() == 0 {
- time.Sleep(tickDuration)
- }
- }
- func (m *member) URL() string { return m.ClientURLs[0].String() }
- func (m *member) Pause() {
- m.raftHandler.Pause()
- m.s.PauseSending()
- }
- func (m *member) Resume() {
- m.raftHandler.Resume()
- m.s.ResumeSending()
- }
- // Stop stops the member, but the data dir of the member is preserved.
- func (m *member) Stop(t *testing.T) {
- m.s.Stop()
- for _, hs := range m.hss {
- hs.CloseClientConnections()
- hs.Close()
- }
- m.hss = nil
- }
- // Start starts the member using the preserved data dir.
- func (m *member) Restart(t *testing.T) error {
- newPeerListeners := make([]net.Listener, 0)
- for _, ln := range m.PeerListeners {
- newPeerListeners = append(newPeerListeners, newListenerWithAddr(t, ln.Addr().String()))
- }
- m.PeerListeners = newPeerListeners
- newClientListeners := make([]net.Listener, 0)
- for _, ln := range m.ClientListeners {
- newClientListeners = append(newClientListeners, newListenerWithAddr(t, ln.Addr().String()))
- }
- m.ClientListeners = newClientListeners
- return m.Launch()
- }
- // Terminate stops the member and removes the data dir.
- func (m *member) Terminate(t *testing.T) {
- m.s.Stop()
- for _, hs := range m.hss {
- hs.CloseClientConnections()
- hs.Close()
- }
- if err := os.RemoveAll(m.ServerConfig.DataDir); err != nil {
- t.Fatal(err)
- }
- }
- func mustNewHTTPClient(t *testing.T, eps []string) client.Client {
- cfg := client.Config{Transport: mustNewTransport(t), Endpoints: eps}
- c, err := client.New(cfg)
- if err != nil {
- t.Fatal(err)
- }
- return c
- }
- func mustNewTransport(t *testing.T) *http.Transport {
- tr, err := transport.NewTimeoutTransport(transport.TLSInfo{}, rafthttp.ConnReadTimeout, rafthttp.ConnWriteTimeout)
- if err != nil {
- t.Fatal(err)
- }
- return tr
- }
- type SortableMemberSliceByPeerURLs []client.Member
- func (p SortableMemberSliceByPeerURLs) Len() int { return len(p) }
- func (p SortableMemberSliceByPeerURLs) Less(i, j int) bool {
- return p[i].PeerURLs[0] < p[j].PeerURLs[0]
- }
- func (p SortableMemberSliceByPeerURLs) Swap(i, j int) { p[i], p[j] = p[j], p[i] }
|