cluster.go 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370
  1. /*
  2. Copyright 2014 CoreOS, Inc.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package etcdserver
  14. import (
  15. "crypto/sha1"
  16. "encoding/binary"
  17. "encoding/json"
  18. "fmt"
  19. "log"
  20. "net/url"
  21. "path"
  22. "reflect"
  23. "sort"
  24. "strings"
  25. etcdErr "github.com/coreos/etcd/error"
  26. "github.com/coreos/etcd/pkg/flags"
  27. "github.com/coreos/etcd/pkg/types"
  28. "github.com/coreos/etcd/raft/raftpb"
  29. "github.com/coreos/etcd/store"
  30. )
  // Key suffixes under a member's store key. Each member is persisted as two
  // child nodes, one per suffix (see AddMember and nodeToMember).
  const (
  	// raftAttributesSuffix names the node holding the JSON-encoded
  	// RaftAttributes of a member.
  	raftAttributesSuffix = "raftAttributes"

  	// attributesSuffix names the node holding the JSON-encoded Attributes
  	// of a member.
  	attributesSuffix = "attributes"
  )
  35. type ClusterInfo interface {
  36. ID() types.ID
  37. ClientURLs() []string
  38. // Members returns a slice of members sorted by their ID
  39. Members() []*Member
  40. Member(id types.ID) *Member
  41. IsIDRemoved(id types.ID) bool
  42. }
  43. // Cluster is a list of Members that belong to the same raft cluster
  44. type Cluster struct {
  45. id types.ID
  46. token string
  47. members map[types.ID]*Member
  48. // removed contains the ids of removed members in the cluster.
  49. // removed id cannot be reused.
  50. removed map[types.ID]bool
  51. store store.Store
  52. }
  53. // NewClusterFromString returns Cluster through given cluster token and parsing
  54. // members from a sets of names to IPs discovery formatted like:
  55. // mach0=http://1.1.1.1,mach0=http://2.2.2.2,mach1=http://3.3.3.3,mach2=http://4.4.4.4
  56. func NewClusterFromString(token string, cluster string) (*Cluster, error) {
  57. c := newCluster(token)
  58. v, err := url.ParseQuery(strings.Replace(cluster, ",", "&", -1))
  59. if err != nil {
  60. return nil, err
  61. }
  62. for name, urls := range v {
  63. if len(urls) == 0 || urls[0] == "" {
  64. return nil, fmt.Errorf("Empty URL given for %q", name)
  65. }
  66. purls := &flags.URLsValue{}
  67. if err := purls.Set(strings.Join(urls, ",")); err != nil {
  68. return nil, err
  69. }
  70. m := NewMember(name, types.URLs(*purls), c.token, nil)
  71. if _, ok := c.members[m.ID]; ok {
  72. return nil, fmt.Errorf("Member exists with identical ID %v", m)
  73. }
  74. c.members[m.ID] = m
  75. }
  76. c.genID()
  77. return c, nil
  78. }
  79. func NewClusterFromStore(token string, st store.Store) *Cluster {
  80. c := newCluster(token)
  81. c.store = st
  82. c.members, c.removed = membersFromStore(c.store)
  83. return c
  84. }
  85. func NewClusterFromMembers(token string, id types.ID, membs []*Member) *Cluster {
  86. c := newCluster(token)
  87. c.id = id
  88. for _, m := range membs {
  89. c.members[m.ID] = m
  90. }
  91. return c
  92. }
  93. func newCluster(token string) *Cluster {
  94. return &Cluster{
  95. token: token,
  96. members: make(map[types.ID]*Member),
  97. removed: make(map[types.ID]bool),
  98. }
  99. }
  100. func (c Cluster) ID() types.ID { return c.id }
  101. func (c Cluster) Members() []*Member {
  102. var sms SortableMemberSlice
  103. for _, m := range c.members {
  104. sms = append(sms, m)
  105. }
  106. sort.Sort(sms)
  107. return []*Member(sms)
  108. }
  109. type SortableMemberSlice []*Member
  110. func (s SortableMemberSlice) Len() int { return len(s) }
  111. func (s SortableMemberSlice) Less(i, j int) bool { return s[i].ID < s[j].ID }
  112. func (s SortableMemberSlice) Swap(i, j int) { s[i], s[j] = s[j], s[i] }
  113. func (c *Cluster) Member(id types.ID) *Member {
  114. return c.members[id]
  115. }
  116. // MemberByName returns a Member with the given name if exists.
  117. // If more than one member has the given name, it will panic.
  118. func (c *Cluster) MemberByName(name string) *Member {
  119. var memb *Member
  120. for _, m := range c.members {
  121. if m.Name == name {
  122. if memb != nil {
  123. log.Panicf("two members with the given name %q exist", name)
  124. }
  125. memb = m
  126. }
  127. }
  128. return memb
  129. }
  130. func (c Cluster) MemberIDs() []types.ID {
  131. var ids []types.ID
  132. for _, m := range c.members {
  133. ids = append(ids, m.ID)
  134. }
  135. sort.Sort(types.IDSlice(ids))
  136. return ids
  137. }
  138. func (c *Cluster) IsIDRemoved(id types.ID) bool {
  139. return c.removed[id]
  140. }
  141. // PeerURLs returns a list of all peer addresses. Each address is prefixed
  142. // with the scheme (currently "http://"). The returned list is sorted in
  143. // ascending lexicographical order.
  144. func (c Cluster) PeerURLs() []string {
  145. endpoints := make([]string, 0)
  146. for _, p := range c.members {
  147. for _, addr := range p.PeerURLs {
  148. endpoints = append(endpoints, addr)
  149. }
  150. }
  151. sort.Strings(endpoints)
  152. return endpoints
  153. }
  154. // ClientURLs returns a list of all client addresses. Each address is prefixed
  155. // with the scheme (currently "http://"). The returned list is sorted in
  156. // ascending lexicographical order.
  157. func (c Cluster) ClientURLs() []string {
  158. urls := make([]string, 0)
  159. for _, p := range c.members {
  160. for _, url := range p.ClientURLs {
  161. urls = append(urls, url)
  162. }
  163. }
  164. sort.Strings(urls)
  165. return urls
  166. }
  167. func (c Cluster) String() string {
  168. sl := []string{}
  169. for _, m := range c.members {
  170. for _, u := range m.PeerURLs {
  171. sl = append(sl, fmt.Sprintf("%s=%s", m.Name, u))
  172. }
  173. }
  174. sort.Strings(sl)
  175. return strings.Join(sl, ",")
  176. }
  177. // ValidateAndAssignIDs validates the given members by matching their PeerURLs
  178. // with the existing members in the cluster. If the validation succeeds, it
  179. // assigns the IDs from the given members to the existing members in the
  180. // cluster. If the validation fails, an error will be returned.
  181. func (c *Cluster) ValidateAndAssignIDs(membs []*Member) error {
  182. if len(c.members) != len(membs) {
  183. return fmt.Errorf("member count is unequal")
  184. }
  185. omembs := make([]*Member, 0)
  186. for _, m := range c.members {
  187. omembs = append(omembs, m)
  188. }
  189. sort.Sort(SortableMemberSliceByPeerURLs(omembs))
  190. sort.Sort(SortableMemberSliceByPeerURLs(membs))
  191. for i := range omembs {
  192. if !reflect.DeepEqual(omembs[i].PeerURLs, membs[i].PeerURLs) {
  193. return fmt.Errorf("unmatched member while checking PeerURLs")
  194. }
  195. omembs[i].ID = membs[i].ID
  196. }
  197. c.members = make(map[types.ID]*Member)
  198. for _, m := range omembs {
  199. c.members[m.ID] = m
  200. }
  201. return nil
  202. }
  203. func (c *Cluster) genID() {
  204. mIDs := c.MemberIDs()
  205. b := make([]byte, 8*len(mIDs))
  206. for i, id := range mIDs {
  207. binary.BigEndian.PutUint64(b[8*i:], uint64(id))
  208. }
  209. hash := sha1.Sum(b)
  210. c.id = types.ID(binary.BigEndian.Uint64(hash[:8]))
  211. }
  212. func (c *Cluster) SetID(id types.ID) { c.id = id }
  213. func (c *Cluster) SetStore(st store.Store) { c.store = st }
  214. func (c *Cluster) ValidateConfigurationChange(cc raftpb.ConfChange) error {
  215. appliedMembers, appliedRemoved := membersFromStore(c.store)
  216. if appliedRemoved[types.ID(cc.NodeID)] {
  217. return ErrIDRemoved
  218. }
  219. switch cc.Type {
  220. case raftpb.ConfChangeAddNode:
  221. if appliedMembers[types.ID(cc.NodeID)] != nil {
  222. return ErrIDExists
  223. }
  224. urls := make(map[string]bool)
  225. for _, m := range appliedMembers {
  226. for _, u := range m.PeerURLs {
  227. urls[u] = true
  228. }
  229. }
  230. m := new(Member)
  231. if err := json.Unmarshal(cc.Context, m); err != nil {
  232. log.Panicf("unmarshal member should never fail: %v", err)
  233. }
  234. for _, u := range m.PeerURLs {
  235. if urls[u] {
  236. return ErrPeerURLexists
  237. }
  238. }
  239. case raftpb.ConfChangeRemoveNode:
  240. if appliedMembers[types.ID(cc.NodeID)] == nil {
  241. return ErrIDNotFound
  242. }
  243. default:
  244. log.Panicf("ConfChange type should be either AddNode or RemoveNode")
  245. }
  246. return nil
  247. }
  248. // AddMember puts a new Member into the store.
  249. // A Member with a matching id must not exist.
  250. func (c *Cluster) AddMember(m *Member) {
  251. b, err := json.Marshal(m.RaftAttributes)
  252. if err != nil {
  253. log.Panicf("marshal raftAttributes should never fail: %v", err)
  254. }
  255. p := path.Join(memberStoreKey(m.ID), raftAttributesSuffix)
  256. if _, err := c.store.Create(p, false, string(b), false, store.Permanent); err != nil {
  257. log.Panicf("create raftAttributes should never fail: %v", err)
  258. }
  259. b, err = json.Marshal(m.Attributes)
  260. if err != nil {
  261. log.Panicf("marshal attributes should never fail: %v", err)
  262. }
  263. p = path.Join(memberStoreKey(m.ID), attributesSuffix)
  264. if _, err := c.store.Create(p, false, string(b), false, store.Permanent); err != nil {
  265. log.Panicf("create attributes should never fail: %v", err)
  266. }
  267. c.members[m.ID] = m
  268. }
  269. // RemoveMember removes a member from the store.
  270. // The given id MUST exist, or the function panics.
  271. func (c *Cluster) RemoveMember(id types.ID) {
  272. if _, err := c.store.Delete(memberStoreKey(id), true, true); err != nil {
  273. log.Panicf("delete member should never fail: %v", err)
  274. }
  275. delete(c.members, id)
  276. if _, err := c.store.Create(removedMemberStoreKey(id), false, "", false, store.Permanent); err != nil {
  277. log.Panicf("create removedMember should never fail: %v", err)
  278. }
  279. c.removed[id] = true
  280. }
  281. // nodeToMember builds member through a store node.
  282. // the child nodes of the given node should be sorted by key.
  283. func nodeToMember(n *store.NodeExtern) (*Member, error) {
  284. m := &Member{ID: mustParseMemberIDFromKey(n.Key)}
  285. if len(n.Nodes) != 2 {
  286. return m, fmt.Errorf("len(nodes) = %d, want 2", len(n.Nodes))
  287. }
  288. if w := path.Join(n.Key, attributesSuffix); n.Nodes[0].Key != w {
  289. return m, fmt.Errorf("key = %v, want %v", n.Nodes[0].Key, w)
  290. }
  291. if err := json.Unmarshal([]byte(*n.Nodes[0].Value), &m.Attributes); err != nil {
  292. return m, fmt.Errorf("unmarshal attributes error: %v", err)
  293. }
  294. if w := path.Join(n.Key, raftAttributesSuffix); n.Nodes[1].Key != w {
  295. return m, fmt.Errorf("key = %v, want %v", n.Nodes[1].Key, w)
  296. }
  297. if err := json.Unmarshal([]byte(*n.Nodes[1].Value), &m.RaftAttributes); err != nil {
  298. return m, fmt.Errorf("unmarshal raftAttributes error: %v", err)
  299. }
  300. return m, nil
  301. }
  302. func membersFromStore(st store.Store) (map[types.ID]*Member, map[types.ID]bool) {
  303. members := make(map[types.ID]*Member)
  304. removed := make(map[types.ID]bool)
  305. e, err := st.Get(storeMembersPrefix, true, true)
  306. if err != nil {
  307. if isKeyNotFound(err) {
  308. return members, removed
  309. }
  310. log.Panicf("get storeMembers should never fail: %v", err)
  311. }
  312. for _, n := range e.Node.Nodes {
  313. m, err := nodeToMember(n)
  314. if err != nil {
  315. log.Panicf("nodeToMember should never fail: %v", err)
  316. }
  317. members[m.ID] = m
  318. }
  319. e, err = st.Get(storeRemovedMembersPrefix, true, true)
  320. if err != nil {
  321. if isKeyNotFound(err) {
  322. return members, removed
  323. }
  324. log.Panicf("get storeRemovedMembers should never fail: %v", err)
  325. }
  326. for _, n := range e.Node.Nodes {
  327. removed[mustParseMemberIDFromKey(n.Key)] = true
  328. }
  329. return members, removed
  330. }
  331. func isKeyNotFound(err error) bool {
  332. e, ok := err.(*etcdErr.Error)
  333. return ok && e.ErrorCode == etcdErr.EcodeKeyNotFound
  334. }