etcd.go 8.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252
  1. /*
  2. Copyright 2013 CoreOS Inc.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package etcd
  14. import (
  15. "net"
  16. "net/http"
  17. "os"
  18. "path/filepath"
  19. "runtime"
  20. "strings"
  21. "time"
  22. goetcd "github.com/coreos/etcd/third_party/github.com/coreos/go-etcd/etcd"
  23. golog "github.com/coreos/etcd/third_party/github.com/coreos/go-log/log"
  24. "github.com/coreos/etcd/third_party/github.com/goraft/raft"
  25. "github.com/coreos/etcd/config"
  26. ehttp "github.com/coreos/etcd/http"
  27. "github.com/coreos/etcd/log"
  28. "github.com/coreos/etcd/metrics"
  29. "github.com/coreos/etcd/server"
  30. "github.com/coreos/etcd/store"
  31. )
  32. type Etcd struct {
  33. Config *config.Config // etcd config
  34. Store store.Store // data store
  35. Registry *server.Registry // stores URL information for nodes
  36. Server *server.Server // http server, runs on 4001 by default
  37. PeerServer *server.PeerServer // peer server, runs on 7001 by default
  38. listener net.Listener // Listener for Server
  39. peerListener net.Listener // Listener for PeerServer
  40. readyC chan bool // To signal when server is ready to accept connections
  41. }
  42. // New returns a new Etcd instance.
  43. func New(c *config.Config) *Etcd {
  44. if c == nil {
  45. c = config.New()
  46. }
  47. return &Etcd{
  48. Config: c,
  49. readyC: make(chan bool),
  50. }
  51. }
  52. // Run the etcd instance.
  53. func (e *Etcd) Run() {
  54. // Sanitize all the input fields.
  55. if err := e.Config.Sanitize(); err != nil {
  56. log.Fatalf("failed sanitizing configuration: %v", err)
  57. }
  58. // Force remove server configuration if specified.
  59. if e.Config.Force {
  60. e.Config.Reset()
  61. }
  62. // Enable options.
  63. if e.Config.VeryVeryVerbose {
  64. log.Verbose = true
  65. raft.SetLogLevel(raft.Trace)
  66. goetcd.SetLogger(
  67. golog.New(
  68. "go-etcd",
  69. false,
  70. golog.CombinedSink(
  71. os.Stdout,
  72. "[%s] %s %-9s | %s\n",
  73. []string{"prefix", "time", "priority", "message"},
  74. ),
  75. ),
  76. )
  77. } else if e.Config.VeryVerbose {
  78. log.Verbose = true
  79. raft.SetLogLevel(raft.Debug)
  80. } else if e.Config.Verbose {
  81. log.Verbose = true
  82. }
  83. if e.Config.CPUProfileFile != "" {
  84. profile(e.Config.CPUProfileFile)
  85. }
  86. if e.Config.DataDir == "" {
  87. log.Fatal("The data dir was not set and could not be guessed from machine name")
  88. }
  89. // Create data directory if it doesn't already exist.
  90. if err := os.MkdirAll(e.Config.DataDir, 0744); err != nil {
  91. log.Fatalf("Unable to create path: %s", err)
  92. }
  93. // Warn people if they have an info file
  94. info := filepath.Join(e.Config.DataDir, "info")
  95. if _, err := os.Stat(info); err == nil {
  96. log.Warnf("All cached configuration is now ignored. The file %s can be removed.", info)
  97. }
  98. var mbName string
  99. if e.Config.Trace() {
  100. mbName = e.Config.MetricsBucketName()
  101. runtime.SetBlockProfileRate(1)
  102. }
  103. mb := metrics.NewBucket(mbName)
  104. if e.Config.GraphiteHost != "" {
  105. err := mb.Publish(e.Config.GraphiteHost)
  106. if err != nil {
  107. panic(err)
  108. }
  109. }
  110. // Retrieve CORS configuration
  111. corsInfo, err := ehttp.NewCORSInfo(e.Config.CorsOrigins)
  112. if err != nil {
  113. log.Fatal("CORS:", err)
  114. }
  115. // Create etcd key-value store and registry.
  116. e.Store = store.New()
  117. e.Registry = server.NewRegistry(e.Store)
  118. // Create stats objects
  119. followersStats := server.NewRaftFollowersStats(e.Config.Name)
  120. serverStats := server.NewRaftServerStats(e.Config.Name)
  121. // Calculate all of our timeouts
  122. heartbeatInterval := time.Duration(e.Config.Peer.HeartbeatInterval) * time.Millisecond
  123. electionTimeout := time.Duration(e.Config.Peer.ElectionTimeout) * time.Millisecond
  124. // TODO(yichengq): constant 1000 is a hack here. The reason to use this
  125. // is to ensure etcd instances could start successfully at the same time.
  126. // Current problem for the failure comes from the lag between join command
  127. // execution and join success.
  128. // Fix it later. It should be removed when proper method is found and
  129. // enough tests are provided.
  130. dialTimeout := (3 * heartbeatInterval) + electionTimeout + 1000
  131. responseHeaderTimeout := (3 * heartbeatInterval) + electionTimeout + 1000
  132. // Create peer server
  133. psConfig := server.PeerServerConfig{
  134. Name: e.Config.Name,
  135. Scheme: e.Config.PeerTLSInfo().Scheme(),
  136. URL: e.Config.Peer.Addr,
  137. SnapshotCount: e.Config.SnapshotCount,
  138. RetryTimes: e.Config.MaxRetryAttempts,
  139. RetryInterval: e.Config.RetryInterval,
  140. }
  141. e.PeerServer = server.NewPeerServer(psConfig, e.Registry, e.Store, &mb, followersStats, serverStats)
  142. // Create raft transporter and server
  143. raftTransporter := server.NewTransporter(followersStats, serverStats, e.Registry, heartbeatInterval, dialTimeout, responseHeaderTimeout)
  144. if psConfig.Scheme == "https" {
  145. raftClientTLSConfig, err := e.Config.PeerTLSInfo().ClientConfig()
  146. if err != nil {
  147. log.Fatal("raft client TLS error: ", err)
  148. }
  149. raftTransporter.SetTLSConfig(*raftClientTLSConfig)
  150. }
  151. raftServer, err := raft.NewServer(e.Config.Name, e.Config.DataDir, raftTransporter, e.Store, e.PeerServer, "")
  152. if err != nil {
  153. log.Fatal(err)
  154. }
  155. raftServer.SetElectionTimeout(electionTimeout)
  156. raftServer.SetHeartbeatInterval(heartbeatInterval)
  157. e.PeerServer.SetRaftServer(raftServer)
  158. // Create etcd server
  159. e.Server = server.New(e.Config.Name, e.Config.Addr, e.PeerServer, e.Registry, e.Store, &mb)
  160. if e.Config.Trace() {
  161. e.Server.EnableTracing()
  162. }
  163. e.PeerServer.SetServer(e.Server)
  164. // Generating config could be slow.
  165. // Put it here to make listen happen immediately after peer-server starting.
  166. peerTLSConfig := server.TLSServerConfig(e.Config.PeerTLSInfo())
  167. etcdTLSConfig := server.TLSServerConfig(e.Config.EtcdTLSInfo())
  168. log.Infof("etcd server [name %s, listen on %s, advertised url %s]", e.Server.Name, e.Config.BindAddr, e.Server.URL())
  169. e.listener = server.NewListener(e.Config.EtcdTLSInfo().Scheme(), e.Config.BindAddr, etcdTLSConfig)
  170. // An error string equivalent to net.errClosing for using with
  171. // http.Serve() during server shutdown. Need to re-declare
  172. // here because it is not exported by "net" package.
  173. const errClosing = "use of closed network connection"
  174. peerServerClosed := make(chan bool)
  175. go func() {
  176. // Starting peer server should be followed close by listening on its port
  177. // If not, it may leave many requests unaccepted, or cannot receive heartbeat from the cluster.
  178. // One severe problem caused if failing receiving heartbeats is when the second node joins one-node cluster,
  179. // the cluster could be out of work as long as the two nodes cannot transfer messages.
  180. e.PeerServer.Start(e.Config.Snapshot, e.Config.Discovery, e.Config.Peers)
  181. log.Infof("peer server [name %s, listen on %s, advertised url %s]", e.PeerServer.Config.Name, e.Config.Peer.BindAddr, e.PeerServer.Config.URL)
  182. e.peerListener = server.NewListener(psConfig.Scheme, e.Config.Peer.BindAddr, peerTLSConfig)
  183. close(e.readyC) // etcd server is ready to accept connections, notify waiters.
  184. sHTTP := &ehttp.CORSHandler{e.PeerServer.HTTPHandler(), corsInfo}
  185. if err := http.Serve(e.peerListener, sHTTP); err != nil {
  186. if !strings.Contains(err.Error(), errClosing) {
  187. log.Fatal(err)
  188. }
  189. }
  190. close(peerServerClosed)
  191. }()
  192. sHTTP := &ehttp.CORSHandler{e.Server.HTTPHandler(), corsInfo}
  193. if err := http.Serve(e.listener, sHTTP); err != nil {
  194. if !strings.Contains(err.Error(), errClosing) {
  195. log.Fatal(err)
  196. }
  197. }
  198. <-peerServerClosed
  199. log.Infof("etcd instance is stopped [name %s]", e.Config.Name)
  200. }
  201. // Stop the etcd instance.
  202. //
  203. // TODO Shutdown gracefully.
  204. func (e *Etcd) Stop() {
  205. e.PeerServer.Stop()
  206. e.peerListener.Close()
  207. e.listener.Close()
  208. }
  209. // ReadyNotify returns a channel that is going to be closed
  210. // when the etcd instance is ready to accept connections.
  211. func (e *Etcd) ReadyNotify() <-chan bool {
  212. return e.readyC
  213. }