raft_server.go 4.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219
  1. package main
  2. import (
  3. "bytes"
  4. "crypto/tls"
  5. "encoding/json"
  6. "fmt"
  7. etcdErr "github.com/coreos/etcd/error"
  8. "github.com/coreos/go-raft"
  9. "net/http"
  10. "net/url"
  11. "time"
  12. )
  13. type raftServer struct {
  14. *raft.Server
  15. name string
  16. url string
  17. tlsConf *TLSConfig
  18. tlsInfo *TLSInfo
  19. }
  20. var r *raftServer
  21. func newRaftServer(name string, url string, tlsConf *TLSConfig, tlsInfo *TLSInfo) *raftServer {
  22. // Create transporter for raft
  23. raftTransporter := newTransporter(tlsConf.Scheme, tlsConf.Client)
  24. // Create raft server
  25. server, err := raft.NewServer(name, dirPath, raftTransporter, etcdStore, nil)
  26. check(err)
  27. return &raftServer{
  28. Server: server,
  29. name: name,
  30. url: url,
  31. tlsConf: tlsConf,
  32. tlsInfo: tlsInfo,
  33. }
  34. }
  35. // Start the raft server
  36. func (r *raftServer) ListenAndServe() {
  37. // Setup commands.
  38. registerCommands()
  39. // LoadSnapshot
  40. if snapshot {
  41. err := r.LoadSnapshot()
  42. if err == nil {
  43. debugf("%s finished load snapshot", r.name)
  44. } else {
  45. debug(err)
  46. }
  47. }
  48. r.SetElectionTimeout(ElectionTimeout)
  49. r.SetHeartbeatTimeout(HeartbeatTimeout)
  50. r.Start()
  51. if r.IsLogEmpty() {
  52. // start as a leader in a new cluster
  53. if len(cluster) == 0 {
  54. startAsLeader()
  55. } else {
  56. startAsFollower()
  57. }
  58. } else {
  59. // rejoin the previous cluster
  60. debugf("%s restart as a follower", r.name)
  61. }
  62. // open the snapshot
  63. if snapshot {
  64. go monitorSnapshot()
  65. }
  66. // start to response to raft requests
  67. go r.startTransport(r.tlsConf.Scheme, r.tlsConf.Server)
  68. }
  69. func startAsLeader() {
  70. // leader need to join self as a peer
  71. for {
  72. _, err := r.Do(newJoinCommand())
  73. if err == nil {
  74. break
  75. }
  76. }
  77. debugf("%s start as a leader", r.name)
  78. }
  79. func startAsFollower() {
  80. // start as a follower in a existing cluster
  81. for i := 0; i < retryTimes; i++ {
  82. for _, machine := range cluster {
  83. if len(machine) == 0 {
  84. continue
  85. }
  86. err := joinCluster(r.Server, machine, r.tlsConf.Scheme)
  87. if err == nil {
  88. debugf("%s success join to the cluster via machine %s", r.name, machine)
  89. return
  90. } else {
  91. if _, ok := err.(etcdErr.Error); ok {
  92. fatal(err)
  93. }
  94. debugf("cannot join to cluster via machine %s %s", machine, err)
  95. }
  96. }
  97. warnf("cannot join to cluster via given machines, retry in %d seconds", RetryInterval)
  98. time.Sleep(time.Second * RetryInterval)
  99. }
  100. fatalf("Cannot join the cluster via given machines after %x retries", retryTimes)
  101. }
  102. // Start to listen and response raft command
  103. func (r *raftServer) startTransport(scheme string, tlsConf tls.Config) {
  104. u, _ := url.Parse(r.url)
  105. infof("raft server [%s:%s]", r.name, u)
  106. raftMux := http.NewServeMux()
  107. server := &http.Server{
  108. Handler: raftMux,
  109. TLSConfig: &tlsConf,
  110. Addr: u.Host,
  111. }
  112. // internal commands
  113. raftMux.HandleFunc("/name", NameHttpHandler)
  114. raftMux.Handle("/join", errorHandler(JoinHttpHandler))
  115. raftMux.HandleFunc("/vote", VoteHttpHandler)
  116. raftMux.HandleFunc("/log", GetLogHttpHandler)
  117. raftMux.HandleFunc("/log/append", AppendEntriesHttpHandler)
  118. raftMux.HandleFunc("/snapshot", SnapshotHttpHandler)
  119. raftMux.HandleFunc("/snapshotRecovery", SnapshotRecoveryHttpHandler)
  120. raftMux.HandleFunc("/etcdURL", EtcdURLHttpHandler)
  121. if scheme == "http" {
  122. fatal(server.ListenAndServe())
  123. } else {
  124. fatal(server.ListenAndServeTLS(r.tlsInfo.CertFile, r.tlsInfo.KeyFile))
  125. }
  126. }
  127. // Send join requests to the leader.
  128. func joinCluster(s *raft.Server, raftURL string, scheme string) error {
  129. var b bytes.Buffer
  130. json.NewEncoder(&b).Encode(newJoinCommand())
  131. // t must be ok
  132. t, _ := r.Transporter().(transporter)
  133. joinURL := url.URL{Host: raftURL, Scheme: scheme, Path: "/join"}
  134. debugf("Send Join Request to %s", raftURL)
  135. resp, err := t.Post(joinURL.String(), &b)
  136. for {
  137. if err != nil {
  138. return fmt.Errorf("Unable to join: %v", err)
  139. }
  140. if resp != nil {
  141. defer resp.Body.Close()
  142. if resp.StatusCode == http.StatusOK {
  143. return nil
  144. }
  145. if resp.StatusCode == http.StatusTemporaryRedirect {
  146. address := resp.Header.Get("Location")
  147. debugf("Send Join Request to %s", address)
  148. json.NewEncoder(&b).Encode(newJoinCommand())
  149. resp, err = t.Post(address, &b)
  150. } else if resp.StatusCode == http.StatusBadRequest {
  151. debug("Reach max number machines in the cluster")
  152. decoder := json.NewDecoder(resp.Body)
  153. err := &etcdErr.Error{}
  154. decoder.Decode(err)
  155. return *err
  156. } else {
  157. return fmt.Errorf("Unable to join")
  158. }
  159. }
  160. }
  161. return fmt.Errorf("Unable to join: %v", err)
  162. }
  163. // Register commands to raft server
  164. func registerCommands() {
  165. raft.RegisterCommand(&JoinCommand{})
  166. raft.RegisterCommand(&SetCommand{})
  167. raft.RegisterCommand(&GetCommand{})
  168. raft.RegisterCommand(&DeleteCommand{})
  169. raft.RegisterCommand(&WatchCommand{})
  170. raft.RegisterCommand(&TestAndSetCommand{})
  171. }