cluster_util.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357
  1. // Copyright 2015 The etcd Authors
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package etcdserver
  15. import (
  16. "encoding/json"
  17. "fmt"
  18. "io/ioutil"
  19. "net/http"
  20. "sort"
  21. "time"
  22. "github.com/coreos/etcd/etcdserver/membership"
  23. "github.com/coreos/etcd/pkg/types"
  24. "github.com/coreos/etcd/version"
  25. "github.com/coreos/go-semver/semver"
  26. "go.uber.org/zap"
  27. )
  28. // isMemberBootstrapped tries to check if the given member has been bootstrapped
  29. // in the given cluster.
  30. func isMemberBootstrapped(lg *zap.Logger, cl *membership.RaftCluster, member string, rt http.RoundTripper, timeout time.Duration) bool {
  31. rcl, err := getClusterFromRemotePeers(lg, getRemotePeerURLs(cl, member), timeout, false, rt)
  32. if err != nil {
  33. return false
  34. }
  35. id := cl.MemberByName(member).ID
  36. m := rcl.Member(id)
  37. if m == nil {
  38. return false
  39. }
  40. if len(m.ClientURLs) > 0 {
  41. return true
  42. }
  43. return false
  44. }
  45. // GetClusterFromRemotePeers takes a set of URLs representing etcd peers, and
  46. // attempts to construct a Cluster by accessing the members endpoint on one of
  47. // these URLs. The first URL to provide a response is used. If no URLs provide
  48. // a response, or a Cluster cannot be successfully created from a received
  49. // response, an error is returned.
  50. // Each request has a 10-second timeout. Because the upper limit of TTL is 5s,
  51. // 10 second is enough for building connection and finishing request.
  52. func GetClusterFromRemotePeers(lg *zap.Logger, urls []string, rt http.RoundTripper) (*membership.RaftCluster, error) {
  53. return getClusterFromRemotePeers(lg, urls, 10*time.Second, true, rt)
  54. }
  55. // If logerr is true, it prints out more error messages.
  56. func getClusterFromRemotePeers(lg *zap.Logger, urls []string, timeout time.Duration, logerr bool, rt http.RoundTripper) (*membership.RaftCluster, error) {
  57. cc := &http.Client{
  58. Transport: rt,
  59. Timeout: timeout,
  60. }
  61. for _, u := range urls {
  62. addr := u + "/members"
  63. resp, err := cc.Get(addr)
  64. if err != nil {
  65. if logerr {
  66. if lg != nil {
  67. lg.Warn("failed to get cluster response", zap.String("address", addr), zap.Error(err))
  68. } else {
  69. plog.Warningf("could not get cluster response from %s: %v", u, err)
  70. }
  71. }
  72. continue
  73. }
  74. b, err := ioutil.ReadAll(resp.Body)
  75. resp.Body.Close()
  76. if err != nil {
  77. if logerr {
  78. if lg != nil {
  79. lg.Warn("failed to read body of cluster response", zap.String("address", addr), zap.Error(err))
  80. } else {
  81. plog.Warningf("could not read the body of cluster response: %v", err)
  82. }
  83. }
  84. continue
  85. }
  86. var membs []*membership.Member
  87. if err = json.Unmarshal(b, &membs); err != nil {
  88. if logerr {
  89. if lg != nil {
  90. lg.Warn("failed to unmarshal cluster response", zap.String("address", addr), zap.Error(err))
  91. } else {
  92. plog.Warningf("could not unmarshal cluster response: %v", err)
  93. }
  94. }
  95. continue
  96. }
  97. id, err := types.IDFromString(resp.Header.Get("X-Etcd-Cluster-ID"))
  98. if err != nil {
  99. if logerr {
  100. if lg != nil {
  101. lg.Warn(
  102. "failed to parse cluster ID",
  103. zap.String("address", addr),
  104. zap.String("header", resp.Header.Get("X-Etcd-Cluster-ID")),
  105. zap.Error(err),
  106. )
  107. } else {
  108. plog.Warningf("could not parse the cluster ID from cluster res: %v", err)
  109. }
  110. }
  111. continue
  112. }
  113. // check the length of membership members
  114. // if the membership members are present then prepare and return raft cluster
  115. // if membership members are not present then the raft cluster formed will be
  116. // an invalid empty cluster hence return failed to get raft cluster member(s) from the given urls error
  117. if len(membs) > 0 {
  118. return membership.NewClusterFromMembers(lg, "", id, membs), nil
  119. }
  120. return nil, fmt.Errorf("failed to get raft cluster member(s) from the given URLs")
  121. }
  122. return nil, fmt.Errorf("could not retrieve cluster information from the given URLs")
  123. }
  124. // getRemotePeerURLs returns peer urls of remote members in the cluster. The
  125. // returned list is sorted in ascending lexicographical order.
  126. func getRemotePeerURLs(cl *membership.RaftCluster, local string) []string {
  127. us := make([]string, 0)
  128. for _, m := range cl.Members() {
  129. if m.Name == local {
  130. continue
  131. }
  132. us = append(us, m.PeerURLs...)
  133. }
  134. sort.Strings(us)
  135. return us
  136. }
  137. // getVersions returns the versions of the members in the given cluster.
  138. // The key of the returned map is the member's ID. The value of the returned map
  139. // is the semver versions string, including server and cluster.
  140. // If it fails to get the version of a member, the key will be nil.
  141. func getVersions(lg *zap.Logger, cl *membership.RaftCluster, local types.ID, rt http.RoundTripper) map[string]*version.Versions {
  142. members := cl.Members()
  143. vers := make(map[string]*version.Versions)
  144. for _, m := range members {
  145. if m.ID == local {
  146. cv := "not_decided"
  147. if cl.Version() != nil {
  148. cv = cl.Version().String()
  149. }
  150. vers[m.ID.String()] = &version.Versions{Server: version.Version, Cluster: cv}
  151. continue
  152. }
  153. ver, err := getVersion(lg, m, rt)
  154. if err != nil {
  155. if lg != nil {
  156. lg.Warn("failed to get version", zap.String("remote-member-id", m.ID.String()), zap.Error(err))
  157. } else {
  158. plog.Warningf("cannot get the version of member %s (%v)", m.ID, err)
  159. }
  160. vers[m.ID.String()] = nil
  161. } else {
  162. vers[m.ID.String()] = ver
  163. }
  164. }
  165. return vers
  166. }
  167. // decideClusterVersion decides the cluster version based on the versions map.
  168. // The returned version is the min server version in the map, or nil if the min
  169. // version in unknown.
  170. func decideClusterVersion(lg *zap.Logger, vers map[string]*version.Versions) *semver.Version {
  171. var cv *semver.Version
  172. lv := semver.Must(semver.NewVersion(version.Version))
  173. for mid, ver := range vers {
  174. if ver == nil {
  175. return nil
  176. }
  177. v, err := semver.NewVersion(ver.Server)
  178. if err != nil {
  179. if lg != nil {
  180. lg.Warn(
  181. "failed to parse server version of remote member",
  182. zap.String("remote-member-id", mid),
  183. zap.String("remote-member-version", ver.Server),
  184. zap.Error(err),
  185. )
  186. } else {
  187. plog.Errorf("cannot understand the version of member %s (%v)", mid, err)
  188. }
  189. return nil
  190. }
  191. if lv.LessThan(*v) {
  192. if lg != nil {
  193. lg.Warn(
  194. "local etcd version is not up-to-date",
  195. zap.String("local-member-version", lv.String()),
  196. zap.String("remote-member-id", mid),
  197. zap.String("remote-member-version", ver.Server),
  198. )
  199. } else {
  200. plog.Warningf("the local etcd version %s is not up-to-date", lv.String())
  201. plog.Warningf("member %s has a higher version %s", mid, ver.Server)
  202. }
  203. }
  204. if cv == nil {
  205. cv = v
  206. } else if v.LessThan(*cv) {
  207. cv = v
  208. }
  209. }
  210. return cv
  211. }
  212. // isCompatibleWithCluster return true if the local member has a compatible version with
  213. // the current running cluster.
  214. // The version is considered as compatible when at least one of the other members in the cluster has a
  215. // cluster version in the range of [MinClusterVersion, Version] and no known members has a cluster version
  216. // out of the range.
  217. // We set this rule since when the local member joins, another member might be offline.
  218. func isCompatibleWithCluster(lg *zap.Logger, cl *membership.RaftCluster, local types.ID, rt http.RoundTripper) bool {
  219. vers := getVersions(lg, cl, local, rt)
  220. minV := semver.Must(semver.NewVersion(version.MinClusterVersion))
  221. maxV := semver.Must(semver.NewVersion(version.Version))
  222. maxV = &semver.Version{
  223. Major: maxV.Major,
  224. Minor: maxV.Minor,
  225. }
  226. return isCompatibleWithVers(lg, vers, local, minV, maxV)
  227. }
  228. func isCompatibleWithVers(lg *zap.Logger, vers map[string]*version.Versions, local types.ID, minV, maxV *semver.Version) bool {
  229. var ok bool
  230. for id, v := range vers {
  231. // ignore comparison with local version
  232. if id == local.String() {
  233. continue
  234. }
  235. if v == nil {
  236. continue
  237. }
  238. clusterv, err := semver.NewVersion(v.Cluster)
  239. if err != nil {
  240. if lg != nil {
  241. lg.Warn(
  242. "failed to parse cluster version of remote member",
  243. zap.String("remote-member-id", id),
  244. zap.String("remote-member-cluster-version", v.Cluster),
  245. zap.Error(err),
  246. )
  247. } else {
  248. plog.Errorf("cannot understand the cluster version of member %s (%v)", id, err)
  249. }
  250. continue
  251. }
  252. if clusterv.LessThan(*minV) {
  253. if lg != nil {
  254. lg.Warn(
  255. "cluster version of remote member is not compatible; too low",
  256. zap.String("remote-member-id", id),
  257. zap.String("remote-member-cluster-version", clusterv.String()),
  258. zap.String("minimum-cluster-version-supported", minV.String()),
  259. )
  260. } else {
  261. plog.Warningf("the running cluster version(%v) is lower than the minimal cluster version(%v) supported", clusterv.String(), minV.String())
  262. }
  263. return false
  264. }
  265. if maxV.LessThan(*clusterv) {
  266. if lg != nil {
  267. lg.Warn(
  268. "cluster version of remote member is not compatible; too high",
  269. zap.String("remote-member-id", id),
  270. zap.String("remote-member-cluster-version", clusterv.String()),
  271. zap.String("minimum-cluster-version-supported", minV.String()),
  272. )
  273. } else {
  274. plog.Warningf("the running cluster version(%v) is higher than the maximum cluster version(%v) supported", clusterv.String(), maxV.String())
  275. }
  276. return false
  277. }
  278. ok = true
  279. }
  280. return ok
  281. }
  282. // getVersion returns the Versions of the given member via its
  283. // peerURLs. Returns the last error if it fails to get the version.
  284. func getVersion(lg *zap.Logger, m *membership.Member, rt http.RoundTripper) (*version.Versions, error) {
  285. cc := &http.Client{
  286. Transport: rt,
  287. }
  288. var (
  289. err error
  290. resp *http.Response
  291. )
  292. for _, u := range m.PeerURLs {
  293. addr := u + "/version"
  294. resp, err = cc.Get(addr)
  295. if err != nil {
  296. if lg != nil {
  297. lg.Warn(
  298. "failed to reach the peer URL",
  299. zap.String("address", addr),
  300. zap.String("remote-member-id", m.ID.String()),
  301. zap.Error(err),
  302. )
  303. } else {
  304. plog.Warningf("failed to reach the peerURL(%s) of member %s (%v)", u, m.ID, err)
  305. }
  306. continue
  307. }
  308. var b []byte
  309. b, err = ioutil.ReadAll(resp.Body)
  310. resp.Body.Close()
  311. if err != nil {
  312. if lg != nil {
  313. lg.Warn(
  314. "failed to read body of response",
  315. zap.String("address", addr),
  316. zap.String("remote-member-id", m.ID.String()),
  317. zap.Error(err),
  318. )
  319. } else {
  320. plog.Warningf("failed to read out the response body from the peerURL(%s) of member %s (%v)", u, m.ID, err)
  321. }
  322. continue
  323. }
  324. var vers version.Versions
  325. if err = json.Unmarshal(b, &vers); err != nil {
  326. if lg != nil {
  327. lg.Warn(
  328. "failed to unmarshal response",
  329. zap.String("address", addr),
  330. zap.String("remote-member-id", m.ID.String()),
  331. zap.Error(err),
  332. )
  333. } else {
  334. plog.Warningf("failed to unmarshal the response body got from the peerURL(%s) of member %s (%v)", u, m.ID, err)
  335. }
  336. continue
  337. }
  338. return &vers, nil
  339. }
  340. return nil, err
  341. }