raft_server.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223
  1. package main
  2. import (
  3. "bytes"
  4. "crypto/tls"
  5. "encoding/json"
  6. "fmt"
  7. etcdErr "github.com/coreos/etcd/error"
  8. "github.com/coreos/go-raft"
  9. "net/http"
  10. "net/url"
  11. "time"
  12. )
  13. type raftServer struct {
  14. *raft.Server
  15. name string
  16. url string
  17. tlsConf *TLSConfig
  18. tlsInfo *TLSInfo
  19. }
  20. var r *raftServer
  21. func newRaftServer(name string, url string, tlsConf *TLSConfig, tlsInfo *TLSInfo) *raftServer {
  22. // Create transporter for raft
  23. raftTransporter := newTransporter(tlsConf.Scheme, tlsConf.Client)
  24. // Create raft server
  25. server, err := raft.NewServer(name, dirPath, raftTransporter, etcdStore, nil)
  26. check(err)
  27. return &raftServer{
  28. Server: server,
  29. name: name,
  30. url: url,
  31. tlsConf: tlsConf,
  32. tlsInfo: tlsInfo,
  33. }
  34. }
  35. // Start the raft server
  36. func (r *raftServer) ListenAndServe() {
  37. // Setup commands.
  38. registerCommands()
  39. // LoadSnapshot
  40. if snapshot {
  41. err := r.LoadSnapshot()
  42. if err == nil {
  43. debugf("%s finished load snapshot", r.name)
  44. } else {
  45. debug(err)
  46. }
  47. }
  48. r.SetElectionTimeout(ElectionTimeout)
  49. r.SetHeartbeatTimeout(HeartbeatTimeout)
  50. r.Start()
  51. if r.IsLogEmpty() {
  52. // start as a leader in a new cluster
  53. if len(cluster) == 0 {
  54. time.Sleep(time.Millisecond * 20)
  55. // leader need to join self as a peer
  56. for {
  57. _, err := r.Do(newJoinCommand())
  58. if err == nil {
  59. break
  60. }
  61. }
  62. debugf("%s start as a leader", r.name)
  63. // start as a follower in a existing cluster
  64. } else {
  65. time.Sleep(time.Millisecond * 20)
  66. var err error
  67. for i := 0; i < retryTimes; i++ {
  68. success := false
  69. for _, machine := range cluster {
  70. if len(machine) == 0 {
  71. continue
  72. }
  73. err = joinCluster(r.Server, machine, r.tlsConf.Scheme)
  74. if err != nil {
  75. if _, ok := err.(etcdErr.Error); ok {
  76. fatal(err)
  77. }
  78. debugf("cannot join to cluster via machine %s %s", machine, err)
  79. } else {
  80. success = true
  81. break
  82. }
  83. }
  84. if success {
  85. break
  86. }
  87. warnf("cannot join to cluster via given machines, retry in %d seconds", RetryInterval)
  88. time.Sleep(time.Second * RetryInterval)
  89. }
  90. if err != nil {
  91. fatalf("Cannot join the cluster via given machines after %x retries", retryTimes)
  92. }
  93. debugf("%s success join to the cluster", r.name)
  94. }
  95. } else {
  96. // rejoin the previous cluster
  97. debugf("%s restart as a follower", r.name)
  98. }
  99. // open the snapshot
  100. if snapshot {
  101. go monitorSnapshot()
  102. }
  103. // start to response to raft requests
  104. go r.startTransport(r.tlsConf.Scheme, r.tlsConf.Server)
  105. }
  106. // Start to listen and response raft command
  107. func (r *raftServer) startTransport(scheme string, tlsConf tls.Config) {
  108. u, _ := url.Parse(r.url)
  109. infof("raft server [%s:%s]", r.name, u)
  110. raftMux := http.NewServeMux()
  111. server := &http.Server{
  112. Handler: raftMux,
  113. TLSConfig: &tlsConf,
  114. Addr: u.Host,
  115. }
  116. // internal commands
  117. raftMux.HandleFunc("/name", NameHttpHandler)
  118. raftMux.Handle("/join", errorHandler(JoinHttpHandler))
  119. raftMux.HandleFunc("/vote", VoteHttpHandler)
  120. raftMux.HandleFunc("/log", GetLogHttpHandler)
  121. raftMux.HandleFunc("/log/append", AppendEntriesHttpHandler)
  122. raftMux.HandleFunc("/snapshot", SnapshotHttpHandler)
  123. raftMux.HandleFunc("/snapshotRecovery", SnapshotRecoveryHttpHandler)
  124. raftMux.HandleFunc("/etcdURL", EtcdURLHttpHandler)
  125. if scheme == "http" {
  126. fatal(server.ListenAndServe())
  127. } else {
  128. fatal(server.ListenAndServeTLS(r.tlsInfo.CertFile, r.tlsInfo.KeyFile))
  129. }
  130. }
  131. // Send join requests to the leader.
  132. func joinCluster(s *raft.Server, raftURL string, scheme string) error {
  133. var b bytes.Buffer
  134. json.NewEncoder(&b).Encode(newJoinCommand())
  135. // t must be ok
  136. t, _ := r.Transporter().(transporter)
  137. joinURL := url.URL{Host: raftURL, Scheme: scheme, Path: "/join"}
  138. debugf("Send Join Request to %s", raftURL)
  139. resp, err := t.Post(joinURL.String(), &b)
  140. for {
  141. if err != nil {
  142. return fmt.Errorf("Unable to join: %v", err)
  143. }
  144. if resp != nil {
  145. defer resp.Body.Close()
  146. if resp.StatusCode == http.StatusOK {
  147. return nil
  148. }
  149. if resp.StatusCode == http.StatusTemporaryRedirect {
  150. address := resp.Header.Get("Location")
  151. debugf("Send Join Request to %s", address)
  152. json.NewEncoder(&b).Encode(newJoinCommand())
  153. resp, err = t.Post(address, &b)
  154. } else if resp.StatusCode == http.StatusBadRequest {
  155. debug("Reach max number machines in the cluster")
  156. decoder := json.NewDecoder(resp.Body)
  157. err := &etcdErr.Error{}
  158. decoder.Decode(err)
  159. return *err
  160. } else {
  161. return fmt.Errorf("Unable to join")
  162. }
  163. }
  164. }
  165. return fmt.Errorf("Unable to join: %v", err)
  166. }
  167. // Register commands to raft server
  168. func registerCommands() {
  169. raft.RegisterCommand(&JoinCommand{})
  170. raft.RegisterCommand(&SetCommand{})
  171. raft.RegisterCommand(&GetCommand{})
  172. raft.RegisterCommand(&DeleteCommand{})
  173. raft.RegisterCommand(&WatchCommand{})
  174. raft.RegisterCommand(&TestAndSetCommand{})
  175. }