raft_test.go 26 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013
  1. package raft
  2. import (
  3. "bytes"
  4. "fmt"
  5. "math/rand"
  6. "reflect"
  7. "sort"
  8. "testing"
  9. pb "github.com/coreos/etcd/raft/raftpb"
  10. )
  11. // nextEnts returns the appliable entries and updates the applied index
  12. func nextEnts(r *raft) (ents []pb.Entry) {
  13. ents = r.raftLog.nextEnts()
  14. r.raftLog.resetNextEnts()
  15. return ents
  16. }
  17. type Interface interface {
  18. Step(m pb.Message) error
  19. ReadMessages() []pb.Message
  20. }
  21. func TestLeaderElection(t *testing.T) {
  22. tests := []struct {
  23. *network
  24. state stateType
  25. }{
  26. {newNetwork(nil, nil, nil), stateLeader},
  27. {newNetwork(nil, nil, nopStepper), stateLeader},
  28. {newNetwork(nil, nopStepper, nopStepper), stateCandidate},
  29. {newNetwork(nil, nopStepper, nopStepper, nil), stateCandidate},
  30. {newNetwork(nil, nopStepper, nopStepper, nil, nil), stateLeader},
  31. // three logs further along than 0
  32. {newNetwork(nil, ents(1), ents(2), ents(1, 3), nil), stateFollower},
  33. // logs converge
  34. {newNetwork(ents(1), nil, ents(2), ents(1), nil), stateLeader},
  35. }
  36. for i, tt := range tests {
  37. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  38. sm := tt.network.peers[1].(*raft)
  39. if sm.state != tt.state {
  40. t.Errorf("#%d: state = %s, want %s", i, sm.state, tt.state)
  41. }
  42. if g := sm.Term; g != 1 {
  43. t.Errorf("#%d: term = %d, want %d", i, g, 1)
  44. }
  45. }
  46. }
  47. func TestLogReplication(t *testing.T) {
  48. tests := []struct {
  49. *network
  50. msgs []pb.Message
  51. wcommitted int64
  52. }{
  53. {
  54. newNetwork(nil, nil, nil),
  55. []pb.Message{
  56. {From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}},
  57. },
  58. 2,
  59. },
  60. {
  61. newNetwork(nil, nil, nil),
  62. []pb.Message{
  63. {From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}},
  64. {From: 1, To: 2, Type: msgHup},
  65. {From: 1, To: 2, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}},
  66. },
  67. 4,
  68. },
  69. }
  70. for i, tt := range tests {
  71. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  72. for _, m := range tt.msgs {
  73. tt.send(m)
  74. }
  75. for j, x := range tt.network.peers {
  76. sm := x.(*raft)
  77. if sm.raftLog.committed != tt.wcommitted {
  78. t.Errorf("#%d.%d: committed = %d, want %d", i, j, sm.raftLog.committed, tt.wcommitted)
  79. }
  80. ents := make([]pb.Entry, 0)
  81. for _, e := range nextEnts(sm) {
  82. if e.Data != nil {
  83. ents = append(ents, e)
  84. }
  85. }
  86. props := make([]pb.Message, 0)
  87. for _, m := range tt.msgs {
  88. if m.Type == msgProp {
  89. props = append(props, m)
  90. }
  91. }
  92. for k, m := range props {
  93. if !bytes.Equal(ents[k].Data, m.Entries[0].Data) {
  94. t.Errorf("#%d.%d: data = %d, want %d", i, j, ents[k].Data, m.Entries[0].Data)
  95. }
  96. }
  97. }
  98. }
  99. }
  100. func TestSingleNodeCommit(t *testing.T) {
  101. tt := newNetwork(nil)
  102. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  103. tt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  104. tt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  105. sm := tt.peers[1].(*raft)
  106. if sm.raftLog.committed != 3 {
  107. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 3)
  108. }
  109. }
  110. // TestCannotCommitWithoutNewTermEntry tests the entries cannot be committed
  111. // when leader changes, no new proposal comes in and ChangeTerm proposal is
  112. // filtered.
  113. func TestCannotCommitWithoutNewTermEntry(t *testing.T) {
  114. tt := newNetwork(nil, nil, nil, nil, nil)
  115. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  116. // 0 cannot reach 2,3,4
  117. tt.cut(1, 3)
  118. tt.cut(1, 4)
  119. tt.cut(1, 5)
  120. tt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  121. tt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  122. sm := tt.peers[1].(*raft)
  123. if sm.raftLog.committed != 1 {
  124. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 1)
  125. }
  126. // network recovery
  127. tt.recover()
  128. // avoid committing ChangeTerm proposal
  129. tt.ignore(msgApp)
  130. // elect 1 as the new leader with term 2
  131. tt.send(pb.Message{From: 2, To: 2, Type: msgHup})
  132. // no log entries from previous term should be committed
  133. sm = tt.peers[2].(*raft)
  134. if sm.raftLog.committed != 1 {
  135. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 1)
  136. }
  137. tt.recover()
  138. // send out a heartbeat
  139. // after append a ChangeTerm entry from the current term, all entries
  140. // should be committed
  141. tt.send(pb.Message{From: 2, To: 2, Type: msgBeat})
  142. if sm.raftLog.committed != 4 {
  143. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 4)
  144. }
  145. // still be able to append a entry
  146. tt.send(pb.Message{From: 2, To: 2, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  147. if sm.raftLog.committed != 5 {
  148. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 5)
  149. }
  150. }
  151. // TestCommitWithoutNewTermEntry tests the entries could be committed
  152. // when leader changes, no new proposal comes in.
  153. func TestCommitWithoutNewTermEntry(t *testing.T) {
  154. tt := newNetwork(nil, nil, nil, nil, nil)
  155. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  156. // 0 cannot reach 2,3,4
  157. tt.cut(1, 3)
  158. tt.cut(1, 4)
  159. tt.cut(1, 5)
  160. tt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  161. tt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  162. sm := tt.peers[1].(*raft)
  163. if sm.raftLog.committed != 1 {
  164. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 1)
  165. }
  166. // network recovery
  167. tt.recover()
  168. // elect 1 as the new leader with term 2
  169. // after append a ChangeTerm entry from the current term, all entries
  170. // should be committed
  171. tt.send(pb.Message{From: 2, To: 2, Type: msgHup})
  172. if sm.raftLog.committed != 4 {
  173. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 4)
  174. }
  175. }
  176. func TestDuelingCandidates(t *testing.T) {
  177. a := newRaft(-1, nil, 0, 0) // k, id are set later
  178. b := newRaft(-1, nil, 0, 0)
  179. c := newRaft(-1, nil, 0, 0)
  180. nt := newNetwork(a, b, c)
  181. nt.cut(1, 3)
  182. nt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  183. nt.send(pb.Message{From: 3, To: 3, Type: msgHup})
  184. nt.recover()
  185. nt.send(pb.Message{From: 3, To: 3, Type: msgHup})
  186. wlog := &raftLog{ents: []pb.Entry{{}, pb.Entry{Data: nil, Term: 1, Index: 1}}, committed: 1}
  187. tests := []struct {
  188. sm *raft
  189. state stateType
  190. term int64
  191. raftLog *raftLog
  192. }{
  193. {a, stateFollower, 2, wlog},
  194. {b, stateFollower, 2, wlog},
  195. {c, stateFollower, 2, newLog()},
  196. }
  197. for i, tt := range tests {
  198. if g := tt.sm.state; g != tt.state {
  199. t.Errorf("#%d: state = %s, want %s", i, g, tt.state)
  200. }
  201. if g := tt.sm.Term; g != tt.term {
  202. t.Errorf("#%d: term = %d, want %d", i, g, tt.term)
  203. }
  204. base := ltoa(tt.raftLog)
  205. if sm, ok := nt.peers[1+int64(i)].(*raft); ok {
  206. l := ltoa(sm.raftLog)
  207. if g := diffu(base, l); g != "" {
  208. t.Errorf("#%d: diff:\n%s", i, g)
  209. }
  210. } else {
  211. t.Logf("#%d: empty log", i)
  212. }
  213. }
  214. }
  215. func TestCandidateConcede(t *testing.T) {
  216. tt := newNetwork(nil, nil, nil)
  217. tt.isolate(1)
  218. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  219. tt.send(pb.Message{From: 3, To: 3, Type: msgHup})
  220. // heal the partition
  221. tt.recover()
  222. data := []byte("force follower")
  223. // send a proposal to 2 to flush out a msgApp to 0
  224. tt.send(pb.Message{From: 3, To: 3, Type: msgProp, Entries: []pb.Entry{{Data: data}}})
  225. a := tt.peers[1].(*raft)
  226. if g := a.state; g != stateFollower {
  227. t.Errorf("state = %s, want %s", g, stateFollower)
  228. }
  229. if g := a.Term; g != 1 {
  230. t.Errorf("term = %d, want %d", g, 1)
  231. }
  232. wantLog := ltoa(&raftLog{ents: []pb.Entry{{}, {Data: nil, Term: 1, Index: 1}, {Term: 1, Index: 2, Data: data}}, committed: 2})
  233. for i, p := range tt.peers {
  234. if sm, ok := p.(*raft); ok {
  235. l := ltoa(sm.raftLog)
  236. if g := diffu(wantLog, l); g != "" {
  237. t.Errorf("#%d: diff:\n%s", i, g)
  238. }
  239. } else {
  240. t.Logf("#%d: empty log", i)
  241. }
  242. }
  243. }
  244. func TestSingleNodeCandidate(t *testing.T) {
  245. tt := newNetwork(nil)
  246. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  247. sm := tt.peers[1].(*raft)
  248. if sm.state != stateLeader {
  249. t.Errorf("state = %d, want %d", sm.state, stateLeader)
  250. }
  251. }
  252. func TestOldMessages(t *testing.T) {
  253. tt := newNetwork(nil, nil, nil)
  254. // make 0 leader @ term 3
  255. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  256. tt.send(pb.Message{From: 2, To: 2, Type: msgHup})
  257. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  258. // pretend we're an old leader trying to make progress
  259. tt.send(pb.Message{From: 1, To: 1, Type: msgApp, Term: 1, Entries: []pb.Entry{{Term: 1}}})
  260. l := &raftLog{
  261. ents: []pb.Entry{
  262. {}, {Data: nil, Term: 1, Index: 1},
  263. {Data: nil, Term: 2, Index: 2}, {Data: nil, Term: 3, Index: 3},
  264. },
  265. committed: 3,
  266. }
  267. base := ltoa(l)
  268. for i, p := range tt.peers {
  269. if sm, ok := p.(*raft); ok {
  270. l := ltoa(sm.raftLog)
  271. if g := diffu(base, l); g != "" {
  272. t.Errorf("#%d: diff:\n%s", i, g)
  273. }
  274. } else {
  275. t.Logf("#%d: empty log", i)
  276. }
  277. }
  278. }
  279. // TestOldMessagesReply - optimization - reply with new term.
  280. func TestProposal(t *testing.T) {
  281. tests := []struct {
  282. *network
  283. success bool
  284. }{
  285. {newNetwork(nil, nil, nil), true},
  286. {newNetwork(nil, nil, nopStepper), true},
  287. {newNetwork(nil, nopStepper, nopStepper), false},
  288. {newNetwork(nil, nopStepper, nopStepper, nil), false},
  289. {newNetwork(nil, nopStepper, nopStepper, nil, nil), true},
  290. }
  291. for i, tt := range tests {
  292. send := func(m pb.Message) {
  293. defer func() {
  294. // only recover is we expect it to panic so
  295. // panics we don't expect go up.
  296. if !tt.success {
  297. e := recover()
  298. if e != nil {
  299. t.Logf("#%d: err: %s", i, e)
  300. }
  301. }
  302. }()
  303. tt.send(m)
  304. }
  305. data := []byte("somedata")
  306. // promote 0 the leader
  307. send(pb.Message{From: 1, To: 1, Type: msgHup})
  308. send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{Data: data}}})
  309. wantLog := newLog()
  310. if tt.success {
  311. wantLog = &raftLog{ents: []pb.Entry{{}, {Data: nil, Term: 1, Index: 1}, {Term: 1, Index: 2, Data: data}}, committed: 2}
  312. }
  313. base := ltoa(wantLog)
  314. for i, p := range tt.peers {
  315. if sm, ok := p.(*raft); ok {
  316. l := ltoa(sm.raftLog)
  317. if g := diffu(base, l); g != "" {
  318. t.Errorf("#%d: diff:\n%s", i, g)
  319. }
  320. } else {
  321. t.Logf("#%d: empty log", i)
  322. }
  323. }
  324. sm := tt.network.peers[1].(*raft)
  325. if g := sm.Term; g != 1 {
  326. t.Errorf("#%d: term = %d, want %d", i, g, 1)
  327. }
  328. }
  329. }
  330. func TestProposalByProxy(t *testing.T) {
  331. data := []byte("somedata")
  332. tests := []*network{
  333. newNetwork(nil, nil, nil),
  334. newNetwork(nil, nil, nopStepper),
  335. }
  336. for i, tt := range tests {
  337. // promote 0 the leader
  338. tt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  339. // propose via follower
  340. tt.send(pb.Message{From: 2, To: 2, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}})
  341. wantLog := &raftLog{ents: []pb.Entry{{}, {Data: nil, Term: 1, Index: 1}, {Term: 1, Data: data, Index: 2}}, committed: 2}
  342. base := ltoa(wantLog)
  343. for i, p := range tt.peers {
  344. if sm, ok := p.(*raft); ok {
  345. l := ltoa(sm.raftLog)
  346. if g := diffu(base, l); g != "" {
  347. t.Errorf("#%d: diff:\n%s", i, g)
  348. }
  349. } else {
  350. t.Logf("#%d: empty log", i)
  351. }
  352. }
  353. sm := tt.peers[1].(*raft)
  354. if g := sm.Term; g != 1 {
  355. t.Errorf("#%d: term = %d, want %d", i, g, 1)
  356. }
  357. }
  358. }
  359. func TestCommit(t *testing.T) {
  360. tests := []struct {
  361. matches []int64
  362. logs []pb.Entry
  363. smTerm int64
  364. w int64
  365. }{
  366. // single
  367. {[]int64{1}, []pb.Entry{{}, {Term: 1}}, 1, 1},
  368. {[]int64{1}, []pb.Entry{{}, {Term: 1}}, 2, 0},
  369. {[]int64{2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 2, 2},
  370. {[]int64{1}, []pb.Entry{{}, {Term: 2}}, 2, 1},
  371. // odd
  372. {[]int64{2, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 1, 1},
  373. {[]int64{2, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  374. {[]int64{2, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 2, 2},
  375. {[]int64{2, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  376. // even
  377. {[]int64{2, 1, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 1, 1},
  378. {[]int64{2, 1, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  379. {[]int64{2, 1, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 1, 1},
  380. {[]int64{2, 1, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  381. {[]int64{2, 1, 2, 2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 2, 2},
  382. {[]int64{2, 1, 2, 2}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  383. }
  384. for i, tt := range tests {
  385. prs := make(map[int64]*progress)
  386. for j := 0; j < len(tt.matches); j++ {
  387. prs[int64(j)] = &progress{tt.matches[j], tt.matches[j] + 1}
  388. }
  389. sm := &raft{raftLog: &raftLog{ents: tt.logs}, prs: prs, State: pb.State{Term: tt.smTerm}}
  390. sm.maybeCommit()
  391. if g := sm.raftLog.committed; g != tt.w {
  392. t.Errorf("#%d: committed = %d, want %d", i, g, tt.w)
  393. }
  394. }
  395. }
  396. // ensure that the Step function ignores the message from old term and does not pass it to the
  397. // acutal stepX function.
  398. func TestStepIgnoreOldTermMsg(t *testing.T) {
  399. called := false
  400. fakeStep := func(r *raft, m pb.Message) {
  401. called = true
  402. }
  403. sm := newRaft(1, []int64{1}, 0, 0)
  404. sm.step = fakeStep
  405. sm.Term = 2
  406. sm.Step(pb.Message{Type: msgApp, Term: sm.Term - 1})
  407. if called == true {
  408. t.Errorf("stepFunc called = %v , want %v", called, false)
  409. }
  410. }
  411. // TestHandleMsgApp ensures:
  412. // 1. Reply false if log doesn’t contain an entry at prevLogIndex whose term matches prevLogTerm.
  413. // 2. If an existing entry conflicts with a new one (same index but different terms),
  414. // delete the existing entry and all that follow it; append any new entries not already in the log.
  415. // 3. If leaderCommit > commitIndex, set commitIndex = min(leaderCommit, index of last new entry).
  416. func TestHandleMsgApp(t *testing.T) {
  417. tests := []struct {
  418. m pb.Message
  419. wIndex int64
  420. wCommit int64
  421. wAccept bool
  422. }{
  423. // Ensure 1
  424. {pb.Message{Type: msgApp, Term: 2, LogTerm: 3, Index: 2, Commit: 3}, 2, 0, false}, // previous log mismatch
  425. {pb.Message{Type: msgApp, Term: 2, LogTerm: 3, Index: 3, Commit: 3}, 2, 0, false}, // previous log non-exist
  426. // Ensure 2
  427. {pb.Message{Type: msgApp, Term: 2, LogTerm: 1, Index: 1, Commit: 1}, 2, 1, true},
  428. {pb.Message{Type: msgApp, Term: 2, LogTerm: 0, Index: 0, Commit: 1, Entries: []pb.Entry{{Term: 2}}}, 1, 1, true},
  429. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 3, Entries: []pb.Entry{{Term: 2}, {Term: 2}}}, 4, 3, true},
  430. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 4, Entries: []pb.Entry{{Term: 2}}}, 3, 3, true},
  431. {pb.Message{Type: msgApp, Term: 2, LogTerm: 1, Index: 1, Commit: 4, Entries: []pb.Entry{{Term: 2}}}, 2, 2, true},
  432. // Ensure 3
  433. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 2}, 2, 2, true},
  434. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 4}, 2, 2, true}, // commit upto min(commit, last)
  435. }
  436. for i, tt := range tests {
  437. sm := &raft{
  438. state: stateFollower,
  439. State: pb.State{Term: 2},
  440. raftLog: &raftLog{committed: 0, ents: []pb.Entry{{}, {Term: 1}, {Term: 2}}},
  441. }
  442. sm.handleAppendEntries(tt.m)
  443. if sm.raftLog.lastIndex() != tt.wIndex {
  444. t.Errorf("#%d: lastIndex = %d, want %d", i, sm.raftLog.lastIndex(), tt.wIndex)
  445. }
  446. if sm.raftLog.committed != tt.wCommit {
  447. t.Errorf("#%d: committed = %d, want %d", i, sm.raftLog.committed, tt.wCommit)
  448. }
  449. m := sm.ReadMessages()
  450. if len(m) != 1 {
  451. t.Errorf("#%d: msg = nil, want 1", i)
  452. }
  453. gaccept := true
  454. if m[0].Index == -1 {
  455. gaccept = false
  456. }
  457. if gaccept != tt.wAccept {
  458. t.Errorf("#%d: accept = %v, want %v", i, gaccept, tt.wAccept)
  459. }
  460. }
  461. }
  462. func TestRecvMsgVote(t *testing.T) {
  463. tests := []struct {
  464. state stateType
  465. i, term int64
  466. voteFor int64
  467. w int64
  468. }{
  469. {stateFollower, 0, 0, none, -1},
  470. {stateFollower, 0, 1, none, -1},
  471. {stateFollower, 0, 2, none, -1},
  472. {stateFollower, 0, 3, none, 2},
  473. {stateFollower, 1, 0, none, -1},
  474. {stateFollower, 1, 1, none, -1},
  475. {stateFollower, 1, 2, none, -1},
  476. {stateFollower, 1, 3, none, 2},
  477. {stateFollower, 2, 0, none, -1},
  478. {stateFollower, 2, 1, none, -1},
  479. {stateFollower, 2, 2, none, 2},
  480. {stateFollower, 2, 3, none, 2},
  481. {stateFollower, 3, 0, none, -1},
  482. {stateFollower, 3, 1, none, -1},
  483. {stateFollower, 3, 2, none, 2},
  484. {stateFollower, 3, 3, none, 2},
  485. {stateFollower, 3, 2, 2, 2},
  486. {stateFollower, 3, 2, 1, -1},
  487. {stateLeader, 3, 3, 1, -1},
  488. {stateCandidate, 3, 3, 1, -1},
  489. }
  490. for i, tt := range tests {
  491. sm := newRaft(1, []int64{1}, 0, 0)
  492. sm.state = tt.state
  493. switch tt.state {
  494. case stateFollower:
  495. sm.step = stepFollower
  496. case stateCandidate:
  497. sm.step = stepCandidate
  498. case stateLeader:
  499. sm.step = stepLeader
  500. }
  501. sm.State = pb.State{Vote: tt.voteFor}
  502. sm.raftLog = &raftLog{ents: []pb.Entry{{}, {Term: 2}, {Term: 2}}}
  503. sm.Step(pb.Message{Type: msgVote, From: 2, Index: tt.i, LogTerm: tt.term})
  504. msgs := sm.ReadMessages()
  505. if g := len(msgs); g != 1 {
  506. t.Errorf("#%d: len(msgs) = %d, want 1", i, g)
  507. continue
  508. }
  509. if g := msgs[0].Index; g != tt.w {
  510. t.Errorf("#%d, m.Index = %d, want %d", i, g, tt.w)
  511. }
  512. }
  513. }
  514. func TestStateTransition(t *testing.T) {
  515. tests := []struct {
  516. from stateType
  517. to stateType
  518. wallow bool
  519. wterm int64
  520. wlead int64
  521. }{
  522. {stateFollower, stateFollower, true, 1, none},
  523. {stateFollower, stateCandidate, true, 1, none},
  524. {stateFollower, stateLeader, false, -1, none},
  525. {stateCandidate, stateFollower, true, 0, none},
  526. {stateCandidate, stateCandidate, true, 1, none},
  527. {stateCandidate, stateLeader, true, 0, 1},
  528. {stateLeader, stateFollower, true, 1, none},
  529. {stateLeader, stateCandidate, false, 1, none},
  530. {stateLeader, stateLeader, true, 0, 1},
  531. }
  532. for i, tt := range tests {
  533. func() {
  534. defer func() {
  535. if r := recover(); r != nil {
  536. if tt.wallow == true {
  537. t.Errorf("%d: allow = %v, want %v", i, false, true)
  538. }
  539. }
  540. }()
  541. sm := newRaft(1, []int64{1}, 0, 0)
  542. sm.state = tt.from
  543. switch tt.to {
  544. case stateFollower:
  545. sm.becomeFollower(tt.wterm, tt.wlead)
  546. case stateCandidate:
  547. sm.becomeCandidate()
  548. case stateLeader:
  549. sm.becomeLeader()
  550. }
  551. if sm.Term != tt.wterm {
  552. t.Errorf("%d: term = %d, want %d", i, sm.Term, tt.wterm)
  553. }
  554. if sm.lead != tt.wlead {
  555. t.Errorf("%d: lead = %d, want %d", i, sm.lead, tt.wlead)
  556. }
  557. }()
  558. }
  559. }
  560. func TestAllServerStepdown(t *testing.T) {
  561. tests := []struct {
  562. state stateType
  563. wstate stateType
  564. wterm int64
  565. windex int64
  566. }{
  567. {stateFollower, stateFollower, 3, 1},
  568. {stateCandidate, stateFollower, 3, 1},
  569. {stateLeader, stateFollower, 3, 2},
  570. }
  571. tmsgTypes := [...]int64{msgVote, msgApp}
  572. tterm := int64(3)
  573. for i, tt := range tests {
  574. sm := newRaft(1, []int64{1, 2, 3}, 0, 0)
  575. switch tt.state {
  576. case stateFollower:
  577. sm.becomeFollower(1, none)
  578. case stateCandidate:
  579. sm.becomeCandidate()
  580. case stateLeader:
  581. sm.becomeCandidate()
  582. sm.becomeLeader()
  583. }
  584. for j, msgType := range tmsgTypes {
  585. sm.Step(pb.Message{From: 2, Type: msgType, Term: tterm, LogTerm: tterm})
  586. if sm.state != tt.wstate {
  587. t.Errorf("#%d.%d state = %v , want %v", i, j, sm.state, tt.wstate)
  588. }
  589. if sm.Term != tt.wterm {
  590. t.Errorf("#%d.%d term = %v , want %v", i, j, sm.Term, tt.wterm)
  591. }
  592. if int64(len(sm.raftLog.ents)) != tt.windex {
  593. t.Errorf("#%d.%d index = %v , want %v", i, j, len(sm.raftLog.ents), tt.windex)
  594. }
  595. wlead := int64(2)
  596. if msgType == msgVote {
  597. wlead = none
  598. }
  599. if sm.lead != wlead {
  600. t.Errorf("#%d, sm.lead = %d, want %d", i, sm.lead, none)
  601. }
  602. }
  603. }
  604. }
  605. func TestLeaderAppResp(t *testing.T) {
  606. tests := []struct {
  607. index int64
  608. wmsgNum int
  609. windex int64
  610. wcommitted int64
  611. }{
  612. {-1, 1, 1, 0}, // bad resp; leader does not commit; reply with log entries
  613. {2, 2, 2, 2}, // good resp; leader commits; broadcast with commit index
  614. }
  615. for i, tt := range tests {
  616. // sm term is 1 after it becomes the leader.
  617. // thus the last log term must be 1 to be committed.
  618. sm := newRaft(1, []int64{1, 2, 3}, 0, 0)
  619. sm.raftLog = &raftLog{ents: []pb.Entry{{}, {Term: 0}, {Term: 1}}}
  620. sm.becomeCandidate()
  621. sm.becomeLeader()
  622. sm.ReadMessages()
  623. sm.Step(pb.Message{From: 2, Type: msgAppResp, Index: tt.index, Term: sm.Term})
  624. msgs := sm.ReadMessages()
  625. if len(msgs) != tt.wmsgNum {
  626. t.Errorf("#%d msgNum = %d, want %d", i, len(msgs), tt.wmsgNum)
  627. }
  628. for j, msg := range msgs {
  629. if msg.Index != tt.windex {
  630. t.Errorf("#%d.%d index = %d, want %d", i, j, msg.Index, tt.windex)
  631. }
  632. if msg.Commit != tt.wcommitted {
  633. t.Errorf("#%d.%d commit = %d, want %d", i, j, msg.Commit, tt.wcommitted)
  634. }
  635. }
  636. }
  637. }
  638. // tests the output of the statemachine when receiving msgBeat
  639. func TestRecvMsgBeat(t *testing.T) {
  640. tests := []struct {
  641. state stateType
  642. wMsg int
  643. }{
  644. {stateLeader, 2},
  645. // candidate and follower should ignore msgBeat
  646. {stateCandidate, 0},
  647. {stateFollower, 0},
  648. }
  649. for i, tt := range tests {
  650. sm := newRaft(1, []int64{1, 2, 3}, 0, 0)
  651. sm.raftLog = &raftLog{ents: []pb.Entry{{}, {Term: 0}, {Term: 1}}}
  652. sm.Term = 1
  653. sm.state = tt.state
  654. switch tt.state {
  655. case stateFollower:
  656. sm.step = stepFollower
  657. case stateCandidate:
  658. sm.step = stepCandidate
  659. case stateLeader:
  660. sm.step = stepLeader
  661. }
  662. sm.Step(pb.Message{From: 1, To: 1, Type: msgBeat})
  663. msgs := sm.ReadMessages()
  664. if len(msgs) != tt.wMsg {
  665. t.Errorf("%d: len(msgs) = %d, want %d", i, len(msgs), tt.wMsg)
  666. }
  667. for _, m := range msgs {
  668. if m.Type != msgApp {
  669. t.Errorf("%d: msg.type = %v, want %v", i, m.Type, msgApp)
  670. }
  671. }
  672. }
  673. }
  674. func TestRestore(t *testing.T) {
  675. s := pb.Snapshot{
  676. Index: defaultCompactThreshold + 1,
  677. Term: defaultCompactThreshold + 1,
  678. Nodes: []int64{1, 2, 3},
  679. }
  680. sm := newRaft(1, []int64{1, 2}, 0, 0)
  681. if ok := sm.restore(s); !ok {
  682. t.Fatal("restore fail, want succeed")
  683. }
  684. if sm.raftLog.lastIndex() != s.Index {
  685. t.Errorf("log.lastIndex = %d, want %d", sm.raftLog.lastIndex(), s.Index)
  686. }
  687. if sm.raftLog.term(s.Index) != s.Term {
  688. t.Errorf("log.lastTerm = %d, want %d", sm.raftLog.term(s.Index), s.Term)
  689. }
  690. sg := int64Slice(sm.nodes())
  691. sw := int64Slice(s.Nodes)
  692. sort.Sort(sg)
  693. sort.Sort(sw)
  694. if !reflect.DeepEqual(sg, sw) {
  695. t.Errorf("sm.Nodes = %+v, want %+v", sg, sw)
  696. }
  697. if !reflect.DeepEqual(sm.raftLog.snapshot, s) {
  698. t.Errorf("snapshot = %+v, want %+v", sm.raftLog.snapshot, s)
  699. }
  700. if ok := sm.restore(s); ok {
  701. t.Fatal("restore succeed, want fail")
  702. }
  703. }
  704. func TestProvideSnap(t *testing.T) {
  705. s := pb.Snapshot{
  706. Index: defaultCompactThreshold + 1,
  707. Term: defaultCompactThreshold + 1,
  708. Nodes: []int64{1, 2},
  709. }
  710. sm := newRaft(1, []int64{1}, 0, 0)
  711. // restore the statemachin from a snapshot
  712. // so it has a compacted log and a snapshot
  713. sm.restore(s)
  714. sm.becomeCandidate()
  715. sm.becomeLeader()
  716. sm.Step(pb.Message{From: 1, To: 1, Type: msgBeat})
  717. msgs := sm.ReadMessages()
  718. if len(msgs) != 1 {
  719. t.Errorf("len(msgs) = %d, want 1", len(msgs))
  720. }
  721. m := msgs[0]
  722. if m.Type != msgApp {
  723. t.Errorf("m.Type = %v, want %v", m.Type, msgApp)
  724. }
  725. // force set the next of node 1, so that
  726. // node 1 needs a snapshot
  727. sm.prs[2].next = sm.raftLog.offset
  728. sm.Step(pb.Message{From: 2, To: 1, Type: msgAppResp, Index: -1})
  729. msgs = sm.ReadMessages()
  730. if len(msgs) != 1 {
  731. t.Errorf("len(msgs) = %d, want 1", len(msgs))
  732. }
  733. m = msgs[0]
  734. if m.Type != msgSnap {
  735. t.Errorf("m.Type = %v, want %v", m.Type, msgSnap)
  736. }
  737. }
  738. func TestRestoreFromSnapMsg(t *testing.T) {
  739. s := pb.Snapshot{
  740. Index: defaultCompactThreshold + 1,
  741. Term: defaultCompactThreshold + 1,
  742. Nodes: []int64{1, 2},
  743. }
  744. m := pb.Message{Type: msgSnap, From: 1, Term: 2, Snapshot: s}
  745. sm := newRaft(2, []int64{1, 2}, 0, 0)
  746. sm.Step(m)
  747. if !reflect.DeepEqual(sm.raftLog.snapshot, s) {
  748. t.Errorf("snapshot = %+v, want %+v", sm.raftLog.snapshot, s)
  749. }
  750. }
  751. func TestSlowNodeRestore(t *testing.T) {
  752. nt := newNetwork(nil, nil, nil)
  753. nt.send(pb.Message{From: 1, To: 1, Type: msgHup})
  754. nt.isolate(3)
  755. for j := 0; j < defaultCompactThreshold+1; j++ {
  756. nt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{}}})
  757. }
  758. lead := nt.peers[1].(*raft)
  759. nextEnts(lead)
  760. lead.compact(nil)
  761. nt.recover()
  762. nt.send(pb.Message{From: 1, To: 1, Type: msgBeat})
  763. follower := nt.peers[3].(*raft)
  764. if !reflect.DeepEqual(follower.raftLog.snapshot, lead.raftLog.snapshot) {
  765. t.Errorf("follower.snap = %+v, want %+v", follower.raftLog.snapshot, lead.raftLog.snapshot)
  766. }
  767. committed := follower.raftLog.lastIndex()
  768. nt.send(pb.Message{From: 1, To: 1, Type: msgProp, Entries: []pb.Entry{{}}})
  769. if follower.raftLog.committed != committed+1 {
  770. t.Errorf("follower.comitted = %d, want %d", follower.raftLog.committed, committed+1)
  771. }
  772. }
  773. func ents(terms ...int64) *raft {
  774. ents := []pb.Entry{{}}
  775. for _, term := range terms {
  776. ents = append(ents, pb.Entry{Term: term})
  777. }
  778. sm := &raft{raftLog: &raftLog{ents: ents}}
  779. sm.reset(0)
  780. return sm
  781. }
  782. type network struct {
  783. peers map[int64]Interface
  784. dropm map[connem]float64
  785. ignorem map[int64]bool
  786. }
  787. // newNetwork initializes a network from peers.
  788. // A nil node will be replaced with a new *stateMachine.
  789. // A *stateMachine will get its k, id.
  790. // When using stateMachine, the address list is always [0, n).
  791. func newNetwork(peers ...Interface) *network {
  792. size := len(peers)
  793. peerAddrs := make([]int64, size)
  794. for i := 0; i < size; i++ {
  795. peerAddrs[i] = 1 + int64(i)
  796. }
  797. npeers := make(map[int64]Interface, size)
  798. for i, p := range peers {
  799. id := peerAddrs[i]
  800. switch v := p.(type) {
  801. case nil:
  802. sm := newRaft(id, peerAddrs, 0, 0)
  803. npeers[id] = sm
  804. case *raft:
  805. v.id = id
  806. v.prs = make(map[int64]*progress)
  807. for i := 0; i < size; i++ {
  808. v.prs[peerAddrs[i]] = &progress{}
  809. }
  810. v.reset(0)
  811. npeers[id] = v
  812. case *blackHole:
  813. npeers[id] = v
  814. default:
  815. panic(fmt.Sprintf("unexpected state machine type: %T", p))
  816. }
  817. }
  818. return &network{
  819. peers: npeers,
  820. dropm: make(map[connem]float64),
  821. ignorem: make(map[int64]bool),
  822. }
  823. }
  824. func (nw *network) send(msgs ...pb.Message) {
  825. for len(msgs) > 0 {
  826. m := msgs[0]
  827. p := nw.peers[m.To]
  828. p.Step(m)
  829. msgs = append(msgs[1:], nw.filter(p.ReadMessages())...)
  830. }
  831. }
  832. func (nw *network) drop(from, to int64, perc float64) {
  833. nw.dropm[connem{from, to}] = perc
  834. }
  835. func (nw *network) cut(one, other int64) {
  836. nw.drop(one, other, 1)
  837. nw.drop(other, one, 1)
  838. }
  839. func (nw *network) isolate(id int64) {
  840. for i := 0; i < len(nw.peers); i++ {
  841. nid := int64(i) + 1
  842. if nid != id {
  843. nw.drop(id, nid, 1.0)
  844. nw.drop(nid, id, 1.0)
  845. }
  846. }
  847. }
  848. func (nw *network) ignore(t int64) {
  849. nw.ignorem[t] = true
  850. }
  851. func (nw *network) recover() {
  852. nw.dropm = make(map[connem]float64)
  853. nw.ignorem = make(map[int64]bool)
  854. }
  855. func (nw *network) filter(msgs []pb.Message) []pb.Message {
  856. mm := make([]pb.Message, 0)
  857. for _, m := range msgs {
  858. if nw.ignorem[m.Type] {
  859. continue
  860. }
  861. switch m.Type {
  862. case msgHup:
  863. // hups never go over the network, so don't drop them but panic
  864. panic("unexpected msgHup")
  865. default:
  866. perc := nw.dropm[connem{m.From, m.To}]
  867. if n := rand.Float64(); n < perc {
  868. continue
  869. }
  870. }
  871. mm = append(mm, m)
  872. }
  873. return mm
  874. }
  875. type connem struct {
  876. from, to int64
  877. }
  878. type blackHole struct{}
  879. func (blackHole) Step(pb.Message) error { return nil }
  880. func (blackHole) ReadMessages() []pb.Message { return nil }
  881. var nopStepper = &blackHole{}