cluster.go 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406
  1. /*
  2. Copyright 2014 CoreOS, Inc.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package etcdserver
  14. import (
  15. "crypto/sha1"
  16. "encoding/binary"
  17. "encoding/json"
  18. "fmt"
  19. "log"
  20. "net/url"
  21. "path"
  22. "reflect"
  23. "sort"
  24. "strings"
  25. "sync"
  26. "github.com/coreos/etcd/pkg/flags"
  27. "github.com/coreos/etcd/pkg/types"
  28. "github.com/coreos/etcd/raft/raftpb"
  29. "github.com/coreos/etcd/store"
  30. )
  // Names of the nodes kept underneath a member's key in the store.
  const (
  	// attributesSuffix is not referenced in the visible part of this file;
  	// presumably it names the node holding a member's Attributes (confirm
  	// against the rest of the package).
  	attributesSuffix = "attributes"

  	// raftAttributesSuffix is joined onto a member's store key to form the
  	// path where that member's JSON-encoded RaftAttributes are saved.
  	raftAttributesSuffix = "raftAttributes"
  )
  35. type ClusterInfo interface {
  36. // ID returns the cluster ID
  37. ID() types.ID
  38. // ClientURLs returns an aggregate set of all URLs on which this
  39. // cluster is listening for client requests
  40. ClientURLs() []string
  41. // Members returns a slice of members sorted by their ID
  42. Members() []*Member
  43. // Member retrieves a particular member based on ID, or nil if the
  44. // member does not exist in the cluster
  45. Member(id types.ID) *Member
  46. // IsIDRemoved checks whether the given ID has been removed from this
  47. // cluster at some point in the past
  48. IsIDRemoved(id types.ID) bool
  49. }
  // Cluster is a list of Members that belong to the same raft cluster.
  type Cluster struct {
  	// id is the cluster ID. It is either derived from the member IDs by
  	// genID or assigned through SetID / NewClusterFromMembers.
  	id types.ID

  	// token is passed to NewMember when members are built from a cluster
  	// string.
  	token string

  	// members maps a member ID to that member.
  	members map[types.ID]*Member

  	// removed contains the IDs of members that have been removed from the
  	// cluster. A removed ID cannot be reused.
  	removed map[types.ID]bool

  	// store is the backing store: members and removed IDs are loaded from
  	// it, and membership changes are written to it.
  	store store.Store

  	// Mutex is locked by the accessors and mutators that touch members and
  	// removed.
  	sync.Mutex
  }
  61. // NewClusterFromString returns a Cluster instantiated from the given cluster token
  62. // and cluster string, by parsing members from a set of discovery-formatted
  63. // names-to-IPs, like:
  64. // mach0=http://1.1.1.1,mach0=http://2.2.2.2,mach1=http://3.3.3.3,mach2=http://4.4.4.4
  65. func NewClusterFromString(token string, cluster string) (*Cluster, error) {
  66. c := newCluster(token)
  67. v, err := url.ParseQuery(strings.Replace(cluster, ",", "&", -1))
  68. if err != nil {
  69. return nil, err
  70. }
  71. for name, urls := range v {
  72. if len(urls) == 0 || urls[0] == "" {
  73. return nil, fmt.Errorf("Empty URL given for %q", name)
  74. }
  75. purls := &flags.URLsValue{}
  76. if err := purls.Set(strings.Join(urls, ",")); err != nil {
  77. return nil, err
  78. }
  79. m := NewMember(name, types.URLs(*purls), c.token, nil)
  80. if _, ok := c.members[m.ID]; ok {
  81. return nil, fmt.Errorf("Member exists with identical ID %v", m)
  82. }
  83. c.members[m.ID] = m
  84. }
  85. c.genID()
  86. return c, nil
  87. }
  88. func NewClusterFromStore(token string, st store.Store) *Cluster {
  89. c := newCluster(token)
  90. c.store = st
  91. c.members, c.removed = membersFromStore(c.store)
  92. return c
  93. }
  94. func NewClusterFromMembers(token string, id types.ID, membs []*Member) *Cluster {
  95. c := newCluster(token)
  96. c.id = id
  97. for _, m := range membs {
  98. c.members[m.ID] = m
  99. }
  100. return c
  101. }
  102. func newCluster(token string) *Cluster {
  103. return &Cluster{
  104. token: token,
  105. members: make(map[types.ID]*Member),
  106. removed: make(map[types.ID]bool),
  107. }
  108. }
  109. func (c *Cluster) ID() types.ID { return c.id }
  110. func (c *Cluster) Members() []*Member {
  111. c.Lock()
  112. defer c.Unlock()
  113. var sms SortableMemberSlice
  114. for _, m := range c.members {
  115. sms = append(sms, m.Clone())
  116. }
  117. sort.Sort(sms)
  118. return []*Member(sms)
  119. }
  120. func (c *Cluster) Member(id types.ID) *Member {
  121. c.Lock()
  122. defer c.Unlock()
  123. return c.members[id].Clone()
  124. }
  125. // MemberByName returns a Member with the given name if exists.
  126. // If more than one member has the given name, it will panic.
  127. func (c *Cluster) MemberByName(name string) *Member {
  128. c.Lock()
  129. defer c.Unlock()
  130. var memb *Member
  131. for _, m := range c.members {
  132. if m.Name == name {
  133. if memb != nil {
  134. log.Panicf("two members with the given name %q exist", name)
  135. }
  136. memb = m
  137. }
  138. }
  139. return memb.Clone()
  140. }
  141. func (c *Cluster) MemberIDs() []types.ID {
  142. c.Lock()
  143. defer c.Unlock()
  144. var ids []types.ID
  145. for _, m := range c.members {
  146. ids = append(ids, m.ID)
  147. }
  148. sort.Sort(types.IDSlice(ids))
  149. return ids
  150. }
  151. func (c *Cluster) IsIDRemoved(id types.ID) bool {
  152. c.Lock()
  153. defer c.Unlock()
  154. return c.removed[id]
  155. }
  156. // PeerURLs returns a list of all peer addresses.
  157. // The returned list is sorted in ascending lexicographical order.
  158. func (c *Cluster) PeerURLs() []string {
  159. c.Lock()
  160. defer c.Unlock()
  161. urls := make([]string, 0)
  162. for _, p := range c.members {
  163. for _, addr := range p.PeerURLs {
  164. urls = append(urls, addr)
  165. }
  166. }
  167. sort.Strings(urls)
  168. return urls
  169. }
  170. // ClientURLs returns a list of all client addresses.
  171. // The returned list is sorted in ascending lexicographical order.
  172. func (c *Cluster) ClientURLs() []string {
  173. c.Lock()
  174. defer c.Unlock()
  175. urls := make([]string, 0)
  176. for _, p := range c.members {
  177. for _, url := range p.ClientURLs {
  178. urls = append(urls, url)
  179. }
  180. }
  181. sort.Strings(urls)
  182. return urls
  183. }
  184. func (c *Cluster) String() string {
  185. c.Lock()
  186. defer c.Unlock()
  187. sl := []string{}
  188. for _, m := range c.members {
  189. for _, u := range m.PeerURLs {
  190. sl = append(sl, fmt.Sprintf("%s=%s", m.Name, u))
  191. }
  192. }
  193. sort.Strings(sl)
  194. return strings.Join(sl, ",")
  195. }
  196. func (c *Cluster) genID() {
  197. mIDs := c.MemberIDs()
  198. b := make([]byte, 8*len(mIDs))
  199. for i, id := range mIDs {
  200. binary.BigEndian.PutUint64(b[8*i:], uint64(id))
  201. }
  202. hash := sha1.Sum(b)
  203. c.id = types.ID(binary.BigEndian.Uint64(hash[:8]))
  204. }
  205. func (c *Cluster) SetID(id types.ID) { c.id = id }
  206. func (c *Cluster) SetStore(st store.Store) { c.store = st }
  207. func (c *Cluster) Recover() {
  208. c.members, c.removed = membersFromStore(c.store)
  209. }
  210. // ValidateConfigurationChange takes a proposed ConfChange and
  211. // ensures that it is still valid.
  212. func (c *Cluster) ValidateConfigurationChange(cc raftpb.ConfChange) error {
  213. members, removed := membersFromStore(c.store)
  214. id := types.ID(cc.NodeID)
  215. if removed[id] {
  216. return ErrIDRemoved
  217. }
  218. switch cc.Type {
  219. case raftpb.ConfChangeAddNode:
  220. if members[id] != nil {
  221. return ErrIDExists
  222. }
  223. urls := make(map[string]bool)
  224. for _, m := range members {
  225. for _, u := range m.PeerURLs {
  226. urls[u] = true
  227. }
  228. }
  229. m := new(Member)
  230. if err := json.Unmarshal(cc.Context, m); err != nil {
  231. log.Panicf("unmarshal member should never fail: %v", err)
  232. }
  233. for _, u := range m.PeerURLs {
  234. if urls[u] {
  235. return ErrPeerURLexists
  236. }
  237. }
  238. case raftpb.ConfChangeRemoveNode:
  239. if members[id] == nil {
  240. return ErrIDNotFound
  241. }
  242. case raftpb.ConfChangeUpdateNode:
  243. if members[id] == nil {
  244. return ErrIDNotFound
  245. }
  246. urls := make(map[string]bool)
  247. for _, m := range members {
  248. if m.ID == id {
  249. continue
  250. }
  251. for _, u := range m.PeerURLs {
  252. urls[u] = true
  253. }
  254. }
  255. m := new(Member)
  256. if err := json.Unmarshal(cc.Context, m); err != nil {
  257. log.Panicf("unmarshal member should never fail: %v", err)
  258. }
  259. for _, u := range m.PeerURLs {
  260. if urls[u] {
  261. return ErrPeerURLexists
  262. }
  263. }
  264. default:
  265. log.Panicf("ConfChange type should be either AddNode, RemoveNode or UpdateNode")
  266. }
  267. return nil
  268. }
  269. // AddMember adds a new Member into the cluster, and saves the given member's
  270. // raftAttributes into the store. The given member should have empty attributes.
  271. // A Member with a matching id must not exist.
  272. func (c *Cluster) AddMember(m *Member) {
  273. c.Lock()
  274. defer c.Unlock()
  275. b, err := json.Marshal(m.RaftAttributes)
  276. if err != nil {
  277. log.Panicf("marshal raftAttributes should never fail: %v", err)
  278. }
  279. p := path.Join(memberStoreKey(m.ID), raftAttributesSuffix)
  280. if _, err := c.store.Create(p, false, string(b), false, store.Permanent); err != nil {
  281. log.Panicf("create raftAttributes should never fail: %v", err)
  282. }
  283. c.members[m.ID] = m
  284. }
  285. // RemoveMember removes a member from the store.
  286. // The given id MUST exist, or the function panics.
  287. func (c *Cluster) RemoveMember(id types.ID) {
  288. c.Lock()
  289. defer c.Unlock()
  290. if _, err := c.store.Delete(memberStoreKey(id), true, true); err != nil {
  291. log.Panicf("delete member should never fail: %v", err)
  292. }
  293. delete(c.members, id)
  294. if _, err := c.store.Create(removedMemberStoreKey(id), false, "", false, store.Permanent); err != nil {
  295. log.Panicf("create removedMember should never fail: %v", err)
  296. }
  297. c.removed[id] = true
  298. }
  299. func (c *Cluster) UpdateAttributes(id types.ID, attr Attributes) {
  300. c.Lock()
  301. defer c.Unlock()
  302. c.members[id].Attributes = attr
  303. // TODO: update store in this function
  304. }
  305. func (c *Cluster) UpdateRaftAttributes(id types.ID, raftAttr RaftAttributes) {
  306. c.Lock()
  307. defer c.Unlock()
  308. b, err := json.Marshal(raftAttr)
  309. if err != nil {
  310. log.Panicf("marshal raftAttributes should never fail: %v", err)
  311. }
  312. p := path.Join(memberStoreKey(id), raftAttributesSuffix)
  313. if _, err := c.store.Update(p, string(b), store.Permanent); err != nil {
  314. log.Panicf("update raftAttributes should never fail: %v", err)
  315. }
  316. c.members[id].RaftAttributes = raftAttr
  317. }
  318. func membersFromStore(st store.Store) (map[types.ID]*Member, map[types.ID]bool) {
  319. members := make(map[types.ID]*Member)
  320. removed := make(map[types.ID]bool)
  321. e, err := st.Get(storeMembersPrefix, true, true)
  322. if err != nil {
  323. if isKeyNotFound(err) {
  324. return members, removed
  325. }
  326. log.Panicf("get storeMembers should never fail: %v", err)
  327. }
  328. for _, n := range e.Node.Nodes {
  329. m, err := nodeToMember(n)
  330. if err != nil {
  331. log.Panicf("nodeToMember should never fail: %v", err)
  332. }
  333. members[m.ID] = m
  334. }
  335. e, err = st.Get(storeRemovedMembersPrefix, true, true)
  336. if err != nil {
  337. if isKeyNotFound(err) {
  338. return members, removed
  339. }
  340. log.Panicf("get storeRemovedMembers should never fail: %v", err)
  341. }
  342. for _, n := range e.Node.Nodes {
  343. removed[mustParseMemberIDFromKey(n.Key)] = true
  344. }
  345. return members, removed
  346. }
  347. // ValidateClusterAndAssignIDs validates the local cluster by matching the PeerURLs
  348. // with the existing cluster. If the validation succeeds, it assigns the IDs
  349. // from the existing cluster to the local cluster.
  350. // If the validation fails, an error will be returned.
  351. func ValidateClusterAndAssignIDs(local *Cluster, existing *Cluster) error {
  352. ems := existing.Members()
  353. lms := local.Members()
  354. if len(ems) != len(lms) {
  355. return fmt.Errorf("member count is unequal")
  356. }
  357. sort.Sort(SortableMemberSliceByPeerURLs(ems))
  358. sort.Sort(SortableMemberSliceByPeerURLs(lms))
  359. for i := range ems {
  360. if !reflect.DeepEqual(ems[i].PeerURLs, lms[i].PeerURLs) {
  361. return fmt.Errorf("unmatched member while checking PeerURLs")
  362. }
  363. lms[i].ID = ems[i].ID
  364. }
  365. local.members = make(map[types.ID]*Member)
  366. for _, m := range lms {
  367. local.members[m.ID] = m
  368. }
  369. return nil
  370. }