config.go 10 KB

  1. // Copyright 2015 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. //     http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package etcdserver
  15. import (
  16. "context"
  17. "fmt"
  18. "path/filepath"
  19. "sort"
  20. "strings"
  21. "time"
  22. ""
  23. ""
  24. ""
  25. bolt ""
  26. ""
  27. ""
  28. )
  29. // ServerConfig holds the configuration of etcd as taken from the command line or discovery.
  30. type ServerConfig struct {
  31. Name string // key of the local member in InitialPeerURLsMap (see hasLocalMember)
  32. DiscoveryURL string // a non-empty value enables discovery (see ShouldDiscover)
  33. DiscoveryProxy string
  34. ClientURLs types.URLs
  35. PeerURLs types.URLs // compared against InitialPeerURLsMap[Name] by advertiseMatchesCluster
  36. DataDir string // parent of the "member" directory (see MemberDir)
  37. // DedicatedWALDir, when non-empty, makes etcd write the WAL to this directory
  38. // rather than to dataDir/member/wal.
  39. DedicatedWALDir string
  40. SnapshotCount uint64
  41. // SnapshotCatchUpEntries is the number of entries kept for a slow follower
  42. // to catch up after the raft storage entries are compacted.
  43. // We expect the follower to have millisecond-level latency with the leader.
  44. // The max throughput is around 10K. Keeping 5K entries is enough to help
  45. // a follower catch up.
  46. // WARNING: only change this for tests. Always use "DefaultSnapshotCatchUpEntries".
  47. SnapshotCatchUpEntries uint64
  48. MaxSnapFiles uint
  49. MaxWALFiles uint
  50. // BackendBatchInterval is the maximum time before committing the backend transaction.
  51. BackendBatchInterval time.Duration
  52. // BackendBatchLimit is the maximum number of operations before committing the backend transaction.
  53. BackendBatchLimit int
  54. // BackendFreelistType is the type of the backend boltdb freelist.
  55. BackendFreelistType bolt.FreelistType
  56. InitialPeerURLsMap types.URLsMap // reported as --initial-cluster in validation errors
  57. InitialClusterToken string
  58. NewCluster bool
  59. PeerTLSInfo transport.TLSInfo
  60. CORS map[string]struct{}
  61. // HostWhitelist lists acceptable hostnames from client requests.
  62. // If the server is insecure (no TLS), it only accepts requests
  63. // whose Host header value exists in this whitelist.
  64. HostWhitelist map[string]struct{}
  65. TickMs uint // milliseconds per tick; election timeout is ElectionTicks*TickMs ms (see electionTimeout)
  66. ElectionTicks int // number of ticks that make up one election timeout (see electionTimeout)
  67. // If InitialElectionTickAdvance is true, the local member fast-forwards
  68. // election ticks to speed up the "initial" leader election trigger. This
  69. // benefits the case of larger election ticks. For instance, a cross
  70. // datacenter deployment may require a longer election timeout of 10 seconds.
  71. // If true, the local node does not need to wait up to 10 seconds. Instead, it
  72. // forwards its election ticks to 8 seconds, leaving only 2 seconds
  73. // before leader election.
  74. //
  75. // Major assumptions are that:
  76. // - the cluster has no active leader, thus advancing ticks enables faster
  77. // leader election, or
  78. // - the cluster already has an established leader, and a rejoining follower
  79. // is likely to receive heartbeats from the leader after the tick advance
  80. // and before the election timeout.
  81. //
  82. // However, when the network from the leader to a rejoining follower is congested,
  83. // and the follower does not receive a leader heartbeat within the remaining election
  84. // ticks, a disruptive election has to happen, thus affecting cluster
  85. // availability.
  86. //
  87. // Disabling this would slow down the initial bootstrap process for cross
  88. // datacenter deployments. Make your own tradeoffs by configuring
  89. // --initial-election-tick-advance at the cost of slow initial bootstrap.
  90. //
  91. // If single-node, it advances ticks regardless.
  92. //
  93. // See for more detail. NOTE(review): the link target is missing from this comment; restore the reference.
  94. InitialElectionTickAdvance bool
  95. BootstrapTimeout time.Duration // zero selects a one-second default (see bootstrapTimeout)
  96. AutoCompactionRetention time.Duration
  97. AutoCompactionMode string
  98. CompactionBatchLimit int
  99. QuotaBackendBytes int64
  100. MaxTxnOps uint
  101. // MaxRequestBytes is the maximum request size to send over raft.
  102. MaxRequestBytes uint
  103. StrictReconfigCheck bool
  104. // ClientCertAuthEnabled is true when the cert has been signed by the client CA.
  105. ClientCertAuthEnabled bool
  106. AuthToken string
  107. BcryptCost uint
  108. // InitialCorruptCheck is true to check for data corruption on boot
  109. // before serving any peer/client traffic.
  110. InitialCorruptCheck bool
  111. CorruptCheckTime time.Duration
  112. // PreVote is true to enable Raft Pre-Vote.
  113. PreVote bool
  114. // Logger logs server-side operations.
  115. // If not nil, it disables "capnslog" and uses the given logger.
  116. Logger *zap.Logger
  117. // LoggerConfig is the server logger configuration for the Raft logger.
  118. // Must be either: "LoggerConfig != nil" or "LoggerCore != nil && LoggerWriteSyncer != nil".
  119. LoggerConfig *zap.Config
  120. // LoggerCore is the "zapcore.Core" for the raft logger.
  121. // Must be either: "LoggerConfig != nil" or "LoggerCore != nil && LoggerWriteSyncer != nil".
  122. LoggerCore zapcore.Core
  123. LoggerWriteSyncer zapcore.WriteSyncer
  124. Debug bool
  125. ForceNewCluster bool
  126. // EnableLeaseCheckpoint enables the primary lessor to persist lease remainingTTL to prevent indefinite auto-renewal of long-lived leases.
  127. EnableLeaseCheckpoint bool
  128. // LeaseCheckpointInterval is the wait duration between lease checkpoints.
  129. LeaseCheckpointInterval time.Duration
  130. EnableGRPCGateway bool
  131. }
  132. // VerifyBootstrap sanity-checks the initial config for bootstrap case
  133. // and returns an error for things that should never happen.
  134. func (c *ServerConfig) VerifyBootstrap() error {
  135. if err := c.hasLocalMember(); err != nil {
  136. return err
  137. }
  138. if err := c.advertiseMatchesCluster(); err != nil {
  139. return err
  140. }
  141. if checkDuplicateURL(c.InitialPeerURLsMap) {
  142. return fmt.Errorf("initial cluster %s has duplicate url", c.InitialPeerURLsMap)
  143. }
  144. if c.InitialPeerURLsMap.String() == "" && c.DiscoveryURL == "" {
  145. return fmt.Errorf("initial cluster unset and no discovery URL found")
  146. }
  147. return nil
  148. }
  149. // VerifyJoinExisting sanity-checks the initial config for join existing cluster
  150. // case and returns an error for things that should never happen.
  151. func (c *ServerConfig) VerifyJoinExisting() error {
  152. // The member has announced its peer urls to the cluster before starting; no need to
  153. // set the configuration again.
  154. if err := c.hasLocalMember(); err != nil {
  155. return err
  156. }
  157. if checkDuplicateURL(c.InitialPeerURLsMap) {
  158. return fmt.Errorf("initial cluster %s has duplicate url", c.InitialPeerURLsMap)
  159. }
  160. if c.DiscoveryURL != "" {
  161. return fmt.Errorf("discovery URL should not be set when joining existing initial cluster")
  162. }
  163. return nil
  164. }
  165. // hasLocalMember checks that the cluster at least contains the local server.
  166. func (c *ServerConfig) hasLocalMember() error {
  167. if urls := c.InitialPeerURLsMap[c.Name]; urls == nil {
  168. return fmt.Errorf("couldn't find local name %q in the initial cluster configuration", c.Name)
  169. }
  170. return nil
  171. }
  172. // advertiseMatchesCluster confirms peer URLs match those in the cluster peer list.
  173. func (c *ServerConfig) advertiseMatchesCluster() error {
  174. urls, apurls := c.InitialPeerURLsMap[c.Name], c.PeerURLs.StringSlice()
  175. urls.Sort()
  176. sort.Strings(apurls)
  177. ctx, cancel := context.WithTimeout(context.TODO(), 30*time.Second)
  178. defer cancel()
  179. ok, err := netutil.URLStringsEqual(ctx, c.Logger, apurls, urls.StringSlice())
  180. if ok {
  181. return nil
  182. }
  183. initMap, apMap := make(map[string]struct{}), make(map[string]struct{})
  184. for _, url := range c.PeerURLs {
  185. apMap[url.String()] = struct{}{}
  186. }
  187. for _, url := range c.InitialPeerURLsMap[c.Name] {
  188. initMap[url.String()] = struct{}{}
  189. }
  190. missing := []string{}
  191. for url := range initMap {
  192. if _, ok := apMap[url]; !ok {
  193. missing = append(missing, url)
  194. }
  195. }
  196. if len(missing) > 0 {
  197. for i := range missing {
  198. missing[i] = c.Name + "=" + missing[i]
  199. }
  200. mstr := strings.Join(missing, ",")
  201. apStr := strings.Join(apurls, ",")
  202. return fmt.Errorf("--initial-cluster has %s but missing from --initial-advertise-peer-urls=%s (%v)", mstr, apStr, err)
  203. }
  204. for url := range apMap {
  205. if _, ok := initMap[url]; !ok {
  206. missing = append(missing, url)
  207. }
  208. }
  209. if len(missing) > 0 {
  210. mstr := strings.Join(missing, ",")
  211. umap := types.URLsMap(map[string]types.URLs{c.Name: c.PeerURLs})
  212. return fmt.Errorf("--initial-advertise-peer-urls has %s but missing from --initial-cluster=%s", mstr, umap.String())
  213. }
  214. // resolved URLs from "--initial-advertise-peer-urls" and "--initial-cluster" did not match or failed
  215. apStr := strings.Join(apurls, ",")
  216. umap := types.URLsMap(map[string]types.URLs{c.Name: c.PeerURLs})
  217. return fmt.Errorf("failed to resolve %s to match --initial-cluster=%s (%v)", apStr, umap.String(), err)
  218. }
  219. func (c *ServerConfig) MemberDir() string { return filepath.Join(c.DataDir, "member") }
  220. func (c *ServerConfig) WALDir() string {
  221. if c.DedicatedWALDir != "" {
  222. return c.DedicatedWALDir
  223. }
  224. return filepath.Join(c.MemberDir(), "wal")
  225. }
  226. func (c *ServerConfig) SnapDir() string { return filepath.Join(c.MemberDir(), "snap") }
  227. func (c *ServerConfig) ShouldDiscover() bool { return c.DiscoveryURL != "" }
  228. // ReqTimeout returns timeout for request to finish.
  229. func (c *ServerConfig) ReqTimeout() time.Duration {
  230. // 5s for queue waiting, computation and disk IO delay
  231. // + 2 * election timeout for possible leader election
  232. return 5*time.Second + 2*time.Duration(c.ElectionTicks*int(c.TickMs))*time.Millisecond
  233. }
  234. func (c *ServerConfig) electionTimeout() time.Duration {
  235. return time.Duration(c.ElectionTicks*int(c.TickMs)) * time.Millisecond
  236. }
  237. func (c *ServerConfig) peerDialTimeout() time.Duration {
  238. // 1s for queue wait and election timeout
  239. return time.Second + time.Duration(c.ElectionTicks*int(c.TickMs))*time.Millisecond
  240. }
  241. func checkDuplicateURL(urlsmap types.URLsMap) bool {
  242. um := make(map[string]bool)
  243. for _, urls := range urlsmap {
  244. for _, url := range urls {
  245. u := url.String()
  246. if um[u] {
  247. return true
  248. }
  249. um[u] = true
  250. }
  251. }
  252. return false
  253. }
  254. func (c *ServerConfig) bootstrapTimeout() time.Duration {
  255. if c.BootstrapTimeout != 0 {
  256. return c.BootstrapTimeout
  257. }
  258. return time.Second
  259. }
  260. func (c *ServerConfig) backendPath() string { return filepath.Join(c.SnapDir(), "db") }