etcd.go 7.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242
  1. /*
  2. Copyright 2013 CoreOS Inc.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package etcd
  14. import (
  15. "net"
  16. "net/http"
  17. "os"
  18. "path/filepath"
  19. "runtime"
  20. "strings"
  21. "time"
  22. goetcd "github.com/coreos/etcd/third_party/github.com/coreos/go-etcd/etcd"
  23. golog "github.com/coreos/etcd/third_party/github.com/coreos/go-log/log"
  24. "github.com/coreos/etcd/third_party/github.com/goraft/raft"
  25. "github.com/coreos/etcd/config"
  26. ehttp "github.com/coreos/etcd/http"
  27. "github.com/coreos/etcd/log"
  28. "github.com/coreos/etcd/metrics"
  29. "github.com/coreos/etcd/server"
  30. "github.com/coreos/etcd/store"
  31. )
  32. type Etcd struct {
  33. Config *config.Config // etcd config
  34. Store store.Store // data store
  35. Registry *server.Registry // stores URL information for nodes
  36. Server *server.Server // http server, runs on 4001 by default
  37. PeerServer *server.PeerServer // peer server, runs on 7001 by default
  38. listener net.Listener // Listener for Server
  39. peerListener net.Listener // Listener for PeerServer
  40. readyC chan bool // To signal when server is ready to accept connections
  41. }
  42. // New returns a new Etcd instance.
  43. func New(c *config.Config) *Etcd {
  44. if c == nil {
  45. c = config.New()
  46. }
  47. return &Etcd{
  48. Config: c,
  49. readyC: make(chan bool),
  50. }
  51. }
  52. // Run the etcd instance.
  53. func (e *Etcd) Run() {
  54. // Enable options.
  55. if e.Config.VeryVeryVerbose {
  56. log.Verbose = true
  57. raft.SetLogLevel(raft.Trace)
  58. goetcd.SetLogger(
  59. golog.New(
  60. "go-etcd",
  61. false,
  62. golog.CombinedSink(
  63. os.Stdout,
  64. "[%s] %s %-9s | %s\n",
  65. []string{"prefix", "time", "priority", "message"},
  66. ),
  67. ),
  68. )
  69. } else if e.Config.VeryVerbose {
  70. log.Verbose = true
  71. raft.SetLogLevel(raft.Debug)
  72. } else if e.Config.Verbose {
  73. log.Verbose = true
  74. }
  75. if e.Config.CPUProfileFile != "" {
  76. profile(e.Config.CPUProfileFile)
  77. }
  78. if e.Config.DataDir == "" {
  79. log.Fatal("The data dir was not set and could not be guessed from machine name")
  80. }
  81. // Create data directory if it doesn't already exist.
  82. if err := os.MkdirAll(e.Config.DataDir, 0744); err != nil {
  83. log.Fatalf("Unable to create path: %s", err)
  84. }
  85. // Warn people if they have an info file
  86. info := filepath.Join(e.Config.DataDir, "info")
  87. if _, err := os.Stat(info); err == nil {
  88. log.Warnf("All cached configuration is now ignored. The file %s can be removed.", info)
  89. }
  90. var mbName string
  91. if e.Config.Trace() {
  92. mbName = e.Config.MetricsBucketName()
  93. runtime.SetBlockProfileRate(1)
  94. }
  95. mb := metrics.NewBucket(mbName)
  96. if e.Config.GraphiteHost != "" {
  97. err := mb.Publish(e.Config.GraphiteHost)
  98. if err != nil {
  99. panic(err)
  100. }
  101. }
  102. // Retrieve CORS configuration
  103. corsInfo, err := ehttp.NewCORSInfo(e.Config.CorsOrigins)
  104. if err != nil {
  105. log.Fatal("CORS:", err)
  106. }
  107. // Create etcd key-value store and registry.
  108. e.Store = store.New()
  109. e.Registry = server.NewRegistry(e.Store)
  110. // Create stats objects
  111. followersStats := server.NewRaftFollowersStats(e.Config.Name)
  112. serverStats := server.NewRaftServerStats(e.Config.Name)
  113. // Calculate all of our timeouts
  114. heartbeatInterval := time.Duration(e.Config.Peer.HeartbeatInterval) * time.Millisecond
  115. electionTimeout := time.Duration(e.Config.Peer.ElectionTimeout) * time.Millisecond
  116. // TODO(yichengq): constant 1000 is a hack here. The reason to use this
  117. // is to ensure etcd instances could start successfully at the same time.
  118. // Current problem for the failure comes from the lag between join command
  119. // execution and join success.
  120. // Fix it later. It should be removed when proper method is found and
  121. // enough tests are provided.
  122. dialTimeout := (3 * heartbeatInterval) + electionTimeout + 1000
  123. responseHeaderTimeout := (3 * heartbeatInterval) + electionTimeout + 1000
  124. // Create peer server
  125. psConfig := server.PeerServerConfig{
  126. Name: e.Config.Name,
  127. Scheme: e.Config.PeerTLSInfo().Scheme(),
  128. URL: e.Config.Peer.Addr,
  129. SnapshotCount: e.Config.SnapshotCount,
  130. RetryTimes: e.Config.MaxRetryAttempts,
  131. RetryInterval: e.Config.RetryInterval,
  132. }
  133. e.PeerServer = server.NewPeerServer(psConfig, e.Registry, e.Store, &mb, followersStats, serverStats)
  134. // Create raft transporter and server
  135. raftTransporter := server.NewTransporter(followersStats, serverStats, e.Registry, heartbeatInterval, dialTimeout, responseHeaderTimeout)
  136. if psConfig.Scheme == "https" {
  137. raftClientTLSConfig, err := e.Config.PeerTLSInfo().ClientConfig()
  138. if err != nil {
  139. log.Fatal("raft client TLS error: ", err)
  140. }
  141. raftTransporter.SetTLSConfig(*raftClientTLSConfig)
  142. }
  143. raftServer, err := raft.NewServer(e.Config.Name, e.Config.DataDir, raftTransporter, e.Store, e.PeerServer, "")
  144. if err != nil {
  145. log.Fatal(err)
  146. }
  147. raftServer.SetElectionTimeout(electionTimeout)
  148. raftServer.SetHeartbeatInterval(heartbeatInterval)
  149. e.PeerServer.SetRaftServer(raftServer)
  150. // Create etcd server
  151. e.Server = server.New(e.Config.Name, e.Config.Addr, e.PeerServer, e.Registry, e.Store, &mb)
  152. if e.Config.Trace() {
  153. e.Server.EnableTracing()
  154. }
  155. e.PeerServer.SetServer(e.Server)
  156. // Generating config could be slow.
  157. // Put it here to make listen happen immediately after peer-server starting.
  158. peerTLSConfig := server.TLSServerConfig(e.Config.PeerTLSInfo())
  159. etcdTLSConfig := server.TLSServerConfig(e.Config.EtcdTLSInfo())
  160. log.Infof("etcd server [name %s, listen on %s, advertised url %s]", e.Server.Name, e.Config.BindAddr, e.Server.URL())
  161. e.listener = server.NewListener(e.Config.EtcdTLSInfo().Scheme(), e.Config.BindAddr, etcdTLSConfig)
  162. // An error string equivalent to net.errClosing for using with
  163. // http.Serve() during server shutdown. Need to re-declare
  164. // here because it is not exported by "net" package.
  165. const errClosing = "use of closed network connection"
  166. peerServerClosed := make(chan bool)
  167. go func() {
  168. // Starting peer server should be followed close by listening on its port
  169. // If not, it may leave many requests unaccepted, or cannot receive heartbeat from the cluster.
  170. // One severe problem caused if failing receiving heartbeats is when the second node joins one-node cluster,
  171. // the cluster could be out of work as long as the two nodes cannot transfer messages.
  172. e.PeerServer.Start(e.Config.Snapshot, e.Config.Discovery, e.Config.Peers)
  173. log.Infof("peer server [name %s, listen on %s, advertised url %s]", e.PeerServer.Config.Name, e.Config.Peer.BindAddr, e.PeerServer.Config.URL)
  174. e.peerListener = server.NewListener(psConfig.Scheme, e.Config.Peer.BindAddr, peerTLSConfig)
  175. close(e.readyC) // etcd server is ready to accept connections, notify waiters.
  176. sHTTP := &ehttp.CORSHandler{e.PeerServer.HTTPHandler(), corsInfo}
  177. if err := http.Serve(e.peerListener, sHTTP); err != nil {
  178. if !strings.Contains(err.Error(), errClosing) {
  179. log.Fatal(err)
  180. }
  181. }
  182. close(peerServerClosed)
  183. }()
  184. sHTTP := &ehttp.CORSHandler{e.Server.HTTPHandler(), corsInfo}
  185. if err := http.Serve(e.listener, sHTTP); err != nil {
  186. if !strings.Contains(err.Error(), errClosing) {
  187. log.Fatal(err)
  188. }
  189. }
  190. <-peerServerClosed
  191. log.Infof("etcd instance is stopped [name %s]", e.Config.Name)
  192. }
  193. // Stop the etcd instance.
  194. //
  195. // TODO Shutdown gracefully.
  196. func (e *Etcd) Stop() {
  197. e.PeerServer.Stop()
  198. e.peerListener.Close()
  199. e.listener.Close()
  200. }
  201. // ReadyNotify returns a channel that is going to be closed
  202. // when the etcd instance is ready to accept connections.
  203. func (e *Etcd) ReadyNotify() <-chan bool {
  204. return e.readyC
  205. }