raft_test.go 28 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019
  1. package raft
  2. import (
  3. "bytes"
  4. "math/rand"
  5. "reflect"
  6. "sort"
  7. "testing"
  8. pb "github.com/coreos/etcd/raft/raftpb"
  9. )
// firstId is the id of the first raft machine in the array.
// It implies how ids are assigned to raft machines: the n-th machine has id
// firstId+n, and the machine with id machineId sits at position
// machineId-firstId in the array.
// This is how newNetwork sets ids for raft machines.
// TODO: use a more flexible way to set ids.
const firstId int64 = 0x1000
  16. // nextEnts returns the appliable entries and updates the applied index
  17. func (r *raft) nextEnts() (ents []pb.Entry) {
  18. ents = r.raftLog.nextEnts()
  19. r.raftLog.resetNextEnts()
  20. return ents
  21. }
// Interface is what a peer must implement to be placed in a test network:
// the network delivers messages to it through Step and collects its outgoing
// messages through ReadMessages.
type Interface interface {
	Step(m pb.Message) error
	ReadMessages() []pb.Message
}
  26. func TestLeaderElection(t *testing.T) {
  27. tests := []struct {
  28. *network
  29. state stateType
  30. }{
  31. {newNetwork(nil, nil, nil), stateLeader},
  32. {newNetwork(nil, nil, nopStepper), stateLeader},
  33. {newNetwork(nil, nopStepper, nopStepper), stateCandidate},
  34. {newNetwork(nil, nopStepper, nopStepper, nil), stateCandidate},
  35. {newNetwork(nil, nopStepper, nopStepper, nil, nil), stateLeader},
  36. // three logs further along than 0
  37. {newNetwork(nil, ents(1), ents(2), ents(1, 3), nil), stateFollower},
  38. // logs converge
  39. {newNetwork(ents(1), nil, ents(2), ents(1), nil), stateLeader},
  40. }
  41. for i, tt := range tests {
  42. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  43. sm := tt.network.peers[firstId].(*raft)
  44. if sm.state != tt.state {
  45. t.Errorf("#%d: state = %s, want %s", i, sm.state, tt.state)
  46. }
  47. if g := sm.Term; g != 1 {
  48. t.Errorf("#%d: term = %d, want %d", i, g, 1)
  49. }
  50. }
  51. }
  52. func TestLogReplication(t *testing.T) {
  53. tests := []struct {
  54. *network
  55. msgs []pb.Message
  56. wcommitted int64
  57. }{
  58. {
  59. newNetwork(nil, nil, nil),
  60. []pb.Message{
  61. {From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}},
  62. },
  63. 2,
  64. },
  65. {
  66. newNetwork(nil, nil, nil),
  67. []pb.Message{
  68. {From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}},
  69. {From: firstId, To: firstId + 1, Type: msgHup},
  70. {From: firstId, To: firstId + 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}},
  71. },
  72. 4,
  73. },
  74. }
  75. for i, tt := range tests {
  76. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  77. for _, m := range tt.msgs {
  78. tt.send(m)
  79. }
  80. for j, x := range tt.network.peers {
  81. sm := x.(*raft)
  82. if sm.raftLog.committed != tt.wcommitted {
  83. t.Errorf("#%d.%d: committed = %d, want %d", i, j, sm.raftLog.committed, tt.wcommitted)
  84. }
  85. ents := make([]pb.Entry, 0)
  86. for _, e := range sm.nextEnts() {
  87. if e.Data != nil {
  88. ents = append(ents, e)
  89. }
  90. }
  91. props := make([]pb.Message, 0)
  92. for _, m := range tt.msgs {
  93. if m.Type == msgProp {
  94. props = append(props, m)
  95. }
  96. }
  97. for k, m := range props {
  98. if !bytes.Equal(ents[k].Data, m.Entries[0].Data) {
  99. t.Errorf("#%d.%d: data = %d, want %d", i, j, ents[k].Data, m.Entries[0].Data)
  100. }
  101. }
  102. }
  103. }
  104. }
  105. func TestSingleNodeCommit(t *testing.T) {
  106. tt := newNetwork(nil)
  107. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  108. tt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  109. tt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  110. sm := tt.peers[firstId].(*raft)
  111. if sm.raftLog.committed != 3 {
  112. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 3)
  113. }
  114. }
  115. // TestCannotCommitWithoutNewTermEntry tests the entries cannot be committed
  116. // when leader changes, no new proposal comes in and ChangeTerm proposal is
  117. // filtered.
  118. func TestCannotCommitWithoutNewTermEntry(t *testing.T) {
  119. tt := newNetwork(nil, nil, nil, nil, nil)
  120. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  121. // 0 cannot reach 2,3,4
  122. tt.cut(firstId, firstId+2)
  123. tt.cut(firstId, firstId+3)
  124. tt.cut(firstId, firstId+4)
  125. tt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  126. tt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  127. sm := tt.peers[firstId].(*raft)
  128. if sm.raftLog.committed != 1 {
  129. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 1)
  130. }
  131. // network recovery
  132. tt.recover()
  133. // avoid committing ChangeTerm proposal
  134. tt.ignore(msgApp)
  135. // elect 1 as the new leader with term 2
  136. tt.send(pb.Message{From: firstId + 1, To: firstId + 1, Type: msgHup})
  137. // no log entries from previous term should be committed
  138. sm = tt.peers[firstId+1].(*raft)
  139. if sm.raftLog.committed != 1 {
  140. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 1)
  141. }
  142. tt.recover()
  143. // send out a heartbeat
  144. // after append a ChangeTerm entry from the current term, all entries
  145. // should be committed
  146. tt.send(pb.Message{From: firstId + 1, To: firstId + 1, Type: msgBeat})
  147. if sm.raftLog.committed != 4 {
  148. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 4)
  149. }
  150. // still be able to append a entry
  151. tt.send(pb.Message{From: firstId + 1, To: firstId + 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  152. if sm.raftLog.committed != 5 {
  153. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 5)
  154. }
  155. }
  156. // TestCommitWithoutNewTermEntry tests the entries could be committed
  157. // when leader changes, no new proposal comes in.
  158. func TestCommitWithoutNewTermEntry(t *testing.T) {
  159. tt := newNetwork(nil, nil, nil, nil, nil)
  160. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  161. // 0 cannot reach 2,3,4
  162. tt.cut(firstId, firstId+2)
  163. tt.cut(firstId, firstId+3)
  164. tt.cut(firstId, firstId+4)
  165. tt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  166. tt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: []byte("some data")}}})
  167. sm := tt.peers[firstId].(*raft)
  168. if sm.raftLog.committed != 1 {
  169. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 1)
  170. }
  171. // network recovery
  172. tt.recover()
  173. // elect 1 as the new leader with term 2
  174. // after append a ChangeTerm entry from the current term, all entries
  175. // should be committed
  176. tt.send(pb.Message{From: firstId + 1, To: firstId + 1, Type: msgHup})
  177. if sm.raftLog.committed != 4 {
  178. t.Errorf("committed = %d, want %d", sm.raftLog.committed, 4)
  179. }
  180. }
  181. func TestDuelingCandidates(t *testing.T) {
  182. a := newRaft(-1, nil, 0, 0) // k, id are set later
  183. b := newRaft(-1, nil, 0, 0)
  184. c := newRaft(-1, nil, 0, 0)
  185. nt := newNetwork(a, b, c)
  186. nt.cut(firstId, firstId+2)
  187. nt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  188. nt.send(pb.Message{From: firstId + 2, To: firstId + 2, Type: msgHup})
  189. nt.recover()
  190. nt.send(pb.Message{From: firstId + 2, To: firstId + 2, Type: msgHup})
  191. wlog := &raftLog{ents: []pb.Entry{{}, pb.Entry{Data: nil, Term: 1, Index: 1}}, committed: 1}
  192. tests := []struct {
  193. sm *raft
  194. state stateType
  195. term int64
  196. raftLog *raftLog
  197. }{
  198. {a, stateFollower, 2, wlog},
  199. {b, stateFollower, 2, wlog},
  200. {c, stateFollower, 2, newLog()},
  201. }
  202. for i, tt := range tests {
  203. if g := tt.sm.state; g != tt.state {
  204. t.Errorf("#%d: state = %s, want %s", i, g, tt.state)
  205. }
  206. if g := tt.sm.Term; g != tt.term {
  207. t.Errorf("#%d: term = %d, want %d", i, g, tt.term)
  208. }
  209. base := ltoa(tt.raftLog)
  210. if sm, ok := nt.peers[firstId+int64(i)].(*raft); ok {
  211. l := ltoa(sm.raftLog)
  212. if g := diffu(base, l); g != "" {
  213. t.Errorf("#%d: diff:\n%s", i, g)
  214. }
  215. } else {
  216. t.Logf("#%d: empty log", i)
  217. }
  218. }
  219. }
  220. func TestCandidateConcede(t *testing.T) {
  221. tt := newNetwork(nil, nil, nil)
  222. tt.isolate(firstId)
  223. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  224. tt.send(pb.Message{From: firstId + 2, To: firstId + 2, Type: msgHup})
  225. // heal the partition
  226. tt.recover()
  227. data := []byte("force follower")
  228. // send a proposal to 2 to flush out a msgApp to 0
  229. tt.send(pb.Message{From: firstId + 2, To: firstId + 2, Type: msgProp, Entries: []pb.Entry{{Data: data}}})
  230. a := tt.peers[firstId].(*raft)
  231. if g := a.state; g != stateFollower {
  232. t.Errorf("state = %s, want %s", g, stateFollower)
  233. }
  234. if g := a.Term; g != 1 {
  235. t.Errorf("term = %d, want %d", g, 1)
  236. }
  237. wantLog := ltoa(&raftLog{ents: []pb.Entry{{}, {Data: nil, Term: 1, Index: 1}, {Term: 1, Index: 2, Data: data}}, committed: 2})
  238. for i, p := range tt.peers {
  239. if sm, ok := p.(*raft); ok {
  240. l := ltoa(sm.raftLog)
  241. if g := diffu(wantLog, l); g != "" {
  242. t.Errorf("#%d: diff:\n%s", i, g)
  243. }
  244. } else {
  245. t.Logf("#%d: empty log", i)
  246. }
  247. }
  248. }
  249. func TestSingleNodeCandidate(t *testing.T) {
  250. tt := newNetwork(nil)
  251. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  252. sm := tt.peers[firstId].(*raft)
  253. if sm.state != stateLeader {
  254. t.Errorf("state = %d, want %d", sm.state, stateLeader)
  255. }
  256. }
  257. func TestOldMessages(t *testing.T) {
  258. tt := newNetwork(nil, nil, nil)
  259. // make 0 leader @ term 3
  260. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  261. tt.send(pb.Message{From: firstId + 1, To: firstId + 1, Type: msgHup})
  262. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  263. // pretend we're an old leader trying to make progress
  264. tt.send(pb.Message{From: firstId, To: firstId, Type: msgApp, Term: 1, Entries: []pb.Entry{{Term: 1}}})
  265. l := &raftLog{
  266. ents: []pb.Entry{
  267. {}, {Data: nil, Term: 1, Index: 1},
  268. {Data: nil, Term: 2, Index: 2}, {Data: nil, Term: 3, Index: 3},
  269. },
  270. committed: 3,
  271. }
  272. base := ltoa(l)
  273. for i, p := range tt.peers {
  274. if sm, ok := p.(*raft); ok {
  275. l := ltoa(sm.raftLog)
  276. if g := diffu(base, l); g != "" {
  277. t.Errorf("#%d: diff:\n%s", i, g)
  278. }
  279. } else {
  280. t.Logf("#%d: empty log", i)
  281. }
  282. }
  283. }
  284. // TestOldMessagesReply - optimization - reply with new term.
  285. func TestProposal(t *testing.T) {
  286. tests := []struct {
  287. *network
  288. success bool
  289. }{
  290. {newNetwork(nil, nil, nil), true},
  291. {newNetwork(nil, nil, nopStepper), true},
  292. {newNetwork(nil, nopStepper, nopStepper), false},
  293. {newNetwork(nil, nopStepper, nopStepper, nil), false},
  294. {newNetwork(nil, nopStepper, nopStepper, nil, nil), true},
  295. }
  296. for i, tt := range tests {
  297. send := func(m pb.Message) {
  298. defer func() {
  299. // only recover is we expect it to panic so
  300. // panics we don't expect go up.
  301. if !tt.success {
  302. e := recover()
  303. if e != nil {
  304. t.Logf("#%d: err: %s", i, e)
  305. }
  306. }
  307. }()
  308. tt.send(m)
  309. }
  310. data := []byte("somedata")
  311. // promote 0 the leader
  312. send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  313. send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{Data: data}}})
  314. wantLog := newLog()
  315. if tt.success {
  316. wantLog = &raftLog{ents: []pb.Entry{{}, {Data: nil, Term: 1, Index: 1}, {Term: 1, Index: 2, Data: data}}, committed: 2}
  317. }
  318. base := ltoa(wantLog)
  319. for i, p := range tt.peers {
  320. if sm, ok := p.(*raft); ok {
  321. l := ltoa(sm.raftLog)
  322. if g := diffu(base, l); g != "" {
  323. t.Errorf("#%d: diff:\n%s", i, g)
  324. }
  325. } else {
  326. t.Logf("#%d: empty log", i)
  327. }
  328. }
  329. sm := tt.network.peers[firstId].(*raft)
  330. if g := sm.Term; g != 1 {
  331. t.Errorf("#%d: term = %d, want %d", i, g, 1)
  332. }
  333. }
  334. }
  335. func TestProposalByProxy(t *testing.T) {
  336. data := []byte("somedata")
  337. tests := []*network{
  338. newNetwork(nil, nil, nil),
  339. newNetwork(nil, nil, nopStepper),
  340. }
  341. for i, tt := range tests {
  342. // promote 0 the leader
  343. tt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  344. // propose via follower
  345. tt.send(pb.Message{From: firstId + 1, To: firstId + 1, Type: msgProp, Entries: []pb.Entry{{Data: []byte("somedata")}}})
  346. wantLog := &raftLog{ents: []pb.Entry{{}, {Data: nil, Term: 1, Index: 1}, {Term: 1, Data: data, Index: 2}}, committed: 2}
  347. base := ltoa(wantLog)
  348. for i, p := range tt.peers {
  349. if sm, ok := p.(*raft); ok {
  350. l := ltoa(sm.raftLog)
  351. if g := diffu(base, l); g != "" {
  352. t.Errorf("#%d: diff:\n%s", i, g)
  353. }
  354. } else {
  355. t.Logf("#%d: empty log", i)
  356. }
  357. }
  358. sm := tt.peers[firstId].(*raft)
  359. if g := sm.Term; g != 1 {
  360. t.Errorf("#%d: term = %d, want %d", i, g, 1)
  361. }
  362. }
  363. }
  364. func TestCommit(t *testing.T) {
  365. tests := []struct {
  366. matches []int64
  367. logs []pb.Entry
  368. smTerm int64
  369. w int64
  370. }{
  371. // single
  372. {[]int64{1}, []pb.Entry{{}, {Term: 1}}, 1, 1},
  373. {[]int64{1}, []pb.Entry{{}, {Term: 1}}, 2, 0},
  374. {[]int64{2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 2, 2},
  375. {[]int64{1}, []pb.Entry{{}, {Term: 2}}, 2, 1},
  376. // odd
  377. {[]int64{2, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 1, 1},
  378. {[]int64{2, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  379. {[]int64{2, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 2, 2},
  380. {[]int64{2, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  381. // even
  382. {[]int64{2, 1, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 1, 1},
  383. {[]int64{2, 1, 1, 1}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  384. {[]int64{2, 1, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 1, 1},
  385. {[]int64{2, 1, 1, 2}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  386. {[]int64{2, 1, 2, 2}, []pb.Entry{{}, {Term: 1}, {Term: 2}}, 2, 2},
  387. {[]int64{2, 1, 2, 2}, []pb.Entry{{}, {Term: 1}, {Term: 1}}, 2, 0},
  388. }
  389. for i, tt := range tests {
  390. prs := make(map[int64]*progress)
  391. for j := 0; j < len(tt.matches); j++ {
  392. prs[int64(j)] = &progress{tt.matches[j], tt.matches[j] + 1}
  393. }
  394. sm := &raft{raftLog: &raftLog{ents: tt.logs}, prs: prs, State: pb.State{Term: tt.smTerm}}
  395. sm.maybeCommit()
  396. if g := sm.raftLog.committed; g != tt.w {
  397. t.Errorf("#%d: committed = %d, want %d", i, g, tt.w)
  398. }
  399. }
  400. }
  401. // ensure that the Step function ignores the message from old term and does not pass it to the
  402. // acutal stepX function.
  403. func TestStepIgnoreOldTermMsg(t *testing.T) {
  404. called := false
  405. fakeStep := func(r *raft, m pb.Message) {
  406. called = true
  407. }
  408. sm := newRaft(firstId, []int64{firstId}, 0, 0)
  409. sm.step = fakeStep
  410. sm.Term = 2
  411. sm.Step(pb.Message{Type: msgApp, Term: sm.Term - 1})
  412. if called == true {
  413. t.Errorf("stepFunc called = %v , want %v", called, false)
  414. }
  415. }
  416. // TestHandleMsgApp ensures:
  417. // 1. Reply false if log doesn’t contain an entry at prevLogIndex whose term matches prevLogTerm.
  418. // 2. If an existing entry conflicts with a new one (same index but different terms),
  419. // delete the existing entry and all that follow it; append any new entries not already in the log.
  420. // 3. If leaderCommit > commitIndex, set commitIndex = min(leaderCommit, index of last new entry).
  421. func TestHandleMsgApp(t *testing.T) {
  422. tests := []struct {
  423. m pb.Message
  424. wIndex int64
  425. wCommit int64
  426. wAccept bool
  427. }{
  428. // Ensure 1
  429. {pb.Message{Type: msgApp, Term: 2, LogTerm: 3, Index: 2, Commit: 3}, 2, 0, false}, // previous log mismatch
  430. {pb.Message{Type: msgApp, Term: 2, LogTerm: 3, Index: 3, Commit: 3}, 2, 0, false}, // previous log non-exist
  431. // Ensure 2
  432. {pb.Message{Type: msgApp, Term: 2, LogTerm: 1, Index: 1, Commit: 1}, 2, 1, true},
  433. {pb.Message{Type: msgApp, Term: 2, LogTerm: 0, Index: 0, Commit: 1, Entries: []pb.Entry{{Term: 2}}}, 1, 1, true},
  434. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 3, Entries: []pb.Entry{{Term: 2}, {Term: 2}}}, 4, 3, true},
  435. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 4, Entries: []pb.Entry{{Term: 2}}}, 3, 3, true},
  436. {pb.Message{Type: msgApp, Term: 2, LogTerm: 1, Index: 1, Commit: 4, Entries: []pb.Entry{{Term: 2}}}, 2, 2, true},
  437. // Ensure 3
  438. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 2}, 2, 2, true},
  439. {pb.Message{Type: msgApp, Term: 2, LogTerm: 2, Index: 2, Commit: 4}, 2, 2, true}, // commit upto min(commit, last)
  440. }
  441. for i, tt := range tests {
  442. sm := &raft{
  443. state: stateFollower,
  444. State: pb.State{Term: 2},
  445. raftLog: &raftLog{committed: 0, ents: []pb.Entry{{}, {Term: 1}, {Term: 2}}},
  446. }
  447. sm.handleAppendEntries(tt.m)
  448. if sm.raftLog.lastIndex() != tt.wIndex {
  449. t.Errorf("#%d: lastIndex = %d, want %d", i, sm.raftLog.lastIndex(), tt.wIndex)
  450. }
  451. if sm.raftLog.committed != tt.wCommit {
  452. t.Errorf("#%d: committed = %d, want %d", i, sm.raftLog.committed, tt.wCommit)
  453. }
  454. m := sm.ReadMessages()
  455. if len(m) != 1 {
  456. t.Errorf("#%d: msg = nil, want 1", i)
  457. }
  458. gaccept := true
  459. if m[0].Index == -1 {
  460. gaccept = false
  461. }
  462. if gaccept != tt.wAccept {
  463. t.Errorf("#%d: accept = %v, want %v", i, gaccept, tt.wAccept)
  464. }
  465. }
  466. }
  467. func TestRecvMsgVote(t *testing.T) {
  468. tests := []struct {
  469. state stateType
  470. i, term int64
  471. voteFor int64
  472. w int64
  473. }{
  474. {stateFollower, 0, 0, none, -1},
  475. {stateFollower, 0, 1, none, -1},
  476. {stateFollower, 0, 2, none, -1},
  477. {stateFollower, 0, 3, none, 2},
  478. {stateFollower, 1, 0, none, -1},
  479. {stateFollower, 1, 1, none, -1},
  480. {stateFollower, 1, 2, none, -1},
  481. {stateFollower, 1, 3, none, 2},
  482. {stateFollower, 2, 0, none, -1},
  483. {stateFollower, 2, 1, none, -1},
  484. {stateFollower, 2, 2, none, 2},
  485. {stateFollower, 2, 3, none, 2},
  486. {stateFollower, 3, 0, none, -1},
  487. {stateFollower, 3, 1, none, -1},
  488. {stateFollower, 3, 2, none, 2},
  489. {stateFollower, 3, 3, none, 2},
  490. {stateFollower, 3, 2, firstId + 1, 2},
  491. {stateFollower, 3, 2, firstId, -1},
  492. {stateLeader, 3, 3, firstId, -1},
  493. {stateCandidate, 3, 3, firstId, -1},
  494. }
  495. for i, tt := range tests {
  496. sm := newRaft(firstId, []int64{firstId}, 0, 0)
  497. sm.state = tt.state
  498. switch tt.state {
  499. case stateFollower:
  500. sm.step = stepFollower
  501. case stateCandidate:
  502. sm.step = stepCandidate
  503. case stateLeader:
  504. sm.step = stepLeader
  505. }
  506. sm.State = pb.State{Vote: tt.voteFor}
  507. sm.raftLog = &raftLog{ents: []pb.Entry{{}, {Term: 2}, {Term: 2}}}
  508. sm.Step(pb.Message{Type: msgVote, From: firstId + 1, Index: tt.i, LogTerm: tt.term})
  509. msgs := sm.ReadMessages()
  510. if g := len(msgs); g != 1 {
  511. t.Errorf("#%d: len(msgs) = %d, want 1", i, g)
  512. continue
  513. }
  514. if g := msgs[0].Index; g != tt.w {
  515. t.Errorf("#%d, m.Index = %d, want %d", i, g, tt.w)
  516. }
  517. }
  518. }
  519. func TestStateTransition(t *testing.T) {
  520. tests := []struct {
  521. from stateType
  522. to stateType
  523. wallow bool
  524. wterm int64
  525. wlead int64
  526. }{
  527. {stateFollower, stateFollower, true, 1, none},
  528. {stateFollower, stateCandidate, true, 1, none},
  529. {stateFollower, stateLeader, false, -1, none},
  530. {stateCandidate, stateFollower, true, 0, none},
  531. {stateCandidate, stateCandidate, true, 1, none},
  532. {stateCandidate, stateLeader, true, 0, firstId},
  533. {stateLeader, stateFollower, true, 1, none},
  534. {stateLeader, stateCandidate, false, 1, none},
  535. {stateLeader, stateLeader, true, 0, firstId},
  536. }
  537. for i, tt := range tests {
  538. func() {
  539. defer func() {
  540. if r := recover(); r != nil {
  541. if tt.wallow == true {
  542. t.Errorf("%d: allow = %v, want %v", i, false, true)
  543. }
  544. }
  545. }()
  546. sm := newRaft(firstId, []int64{firstId}, 0, 0)
  547. sm.state = tt.from
  548. switch tt.to {
  549. case stateFollower:
  550. sm.becomeFollower(tt.wterm, tt.wlead)
  551. case stateCandidate:
  552. sm.becomeCandidate()
  553. case stateLeader:
  554. sm.becomeLeader()
  555. }
  556. if sm.Term != tt.wterm {
  557. t.Errorf("%d: term = %d, want %d", i, sm.Term, tt.wterm)
  558. }
  559. if sm.lead != tt.wlead {
  560. t.Errorf("%d: lead = %d, want %d", i, sm.lead, tt.wlead)
  561. }
  562. }()
  563. }
  564. }
  565. func TestAllServerStepdown(t *testing.T) {
  566. tests := []struct {
  567. state stateType
  568. wstate stateType
  569. wterm int64
  570. windex int64
  571. }{
  572. {stateFollower, stateFollower, 3, 1},
  573. {stateCandidate, stateFollower, 3, 1},
  574. {stateLeader, stateFollower, 3, 2},
  575. }
  576. tmsgTypes := [...]int64{msgVote, msgApp}
  577. tterm := int64(3)
  578. for i, tt := range tests {
  579. sm := newRaft(firstId, []int64{firstId, firstId + 1, firstId + 2}, 0, 0)
  580. switch tt.state {
  581. case stateFollower:
  582. sm.becomeFollower(1, none)
  583. case stateCandidate:
  584. sm.becomeCandidate()
  585. case stateLeader:
  586. sm.becomeCandidate()
  587. sm.becomeLeader()
  588. }
  589. for j, msgType := range tmsgTypes {
  590. sm.Step(pb.Message{From: firstId + 1, Type: msgType, Term: tterm, LogTerm: tterm})
  591. if sm.state != tt.wstate {
  592. t.Errorf("#%d.%d state = %v , want %v", i, j, sm.state, tt.wstate)
  593. }
  594. if sm.Term != tt.wterm {
  595. t.Errorf("#%d.%d term = %v , want %v", i, j, sm.Term, tt.wterm)
  596. }
  597. if int64(len(sm.raftLog.ents)) != tt.windex {
  598. t.Errorf("#%d.%d index = %v , want %v", i, j, len(sm.raftLog.ents), tt.windex)
  599. }
  600. wlead := int64(firstId + 1)
  601. if msgType == msgVote {
  602. wlead = none
  603. }
  604. if sm.lead != wlead {
  605. t.Errorf("#%d, sm.lead = %d, want %d", i, sm.lead, none)
  606. }
  607. }
  608. }
  609. }
  610. func TestLeaderAppResp(t *testing.T) {
  611. tests := []struct {
  612. index int64
  613. wmsgNum int
  614. windex int64
  615. wcommitted int64
  616. }{
  617. {-1, 1, 1, 0}, // bad resp; leader does not commit; reply with log entries
  618. {2, 2, 2, 2}, // good resp; leader commits; broadcast with commit index
  619. }
  620. for i, tt := range tests {
  621. // sm term is 1 after it becomes the leader.
  622. // thus the last log term must be 1 to be committed.
  623. sm := newRaft(firstId, []int64{firstId, firstId + 1, firstId + 2}, 0, 0)
  624. sm.raftLog = &raftLog{ents: []pb.Entry{{}, {Term: 0}, {Term: 1}}}
  625. sm.becomeCandidate()
  626. sm.becomeLeader()
  627. sm.ReadMessages()
  628. sm.Step(pb.Message{From: firstId + 1, Type: msgAppResp, Index: tt.index, Term: sm.Term})
  629. msgs := sm.ReadMessages()
  630. if len(msgs) != tt.wmsgNum {
  631. t.Errorf("#%d msgNum = %d, want %d", i, len(msgs), tt.wmsgNum)
  632. }
  633. for j, msg := range msgs {
  634. if msg.Index != tt.windex {
  635. t.Errorf("#%d.%d index = %d, want %d", i, j, msg.Index, tt.windex)
  636. }
  637. if msg.Commit != tt.wcommitted {
  638. t.Errorf("#%d.%d commit = %d, want %d", i, j, msg.Commit, tt.wcommitted)
  639. }
  640. }
  641. }
  642. }
  643. // tests the output of the statemachine when receiving msgBeat
  644. func TestRecvMsgBeat(t *testing.T) {
  645. tests := []struct {
  646. state stateType
  647. wMsg int
  648. }{
  649. {stateLeader, 2},
  650. // candidate and follower should ignore msgBeat
  651. {stateCandidate, 0},
  652. {stateFollower, 0},
  653. }
  654. for i, tt := range tests {
  655. sm := newRaft(firstId, []int64{firstId, firstId + 1, firstId + 2}, 0, 0)
  656. sm.raftLog = &raftLog{ents: []pb.Entry{{}, {Term: 0}, {Term: 1}}}
  657. sm.Term = 1
  658. sm.state = tt.state
  659. switch tt.state {
  660. case stateFollower:
  661. sm.step = stepFollower
  662. case stateCandidate:
  663. sm.step = stepCandidate
  664. case stateLeader:
  665. sm.step = stepLeader
  666. }
  667. sm.Step(pb.Message{From: firstId, To: firstId, Type: msgBeat})
  668. msgs := sm.ReadMessages()
  669. if len(msgs) != tt.wMsg {
  670. t.Errorf("%d: len(msgs) = %d, want %d", i, len(msgs), tt.wMsg)
  671. }
  672. for _, m := range msgs {
  673. if m.Type != msgApp {
  674. t.Errorf("%d: msg.type = %v, want %v", i, m.Type, msgApp)
  675. }
  676. }
  677. }
  678. }
  679. func TestRestore(t *testing.T) {
  680. s := pb.Snapshot{
  681. Index: defaultCompactThreshold + 1,
  682. Term: defaultCompactThreshold + 1,
  683. Nodes: []int64{firstId, firstId + 1, firstId + 2},
  684. }
  685. sm := newRaft(firstId, []int64{firstId, firstId + 1}, 0, 0)
  686. if ok := sm.restore(s); !ok {
  687. t.Fatal("restore fail, want succeed")
  688. }
  689. if sm.raftLog.lastIndex() != s.Index {
  690. t.Errorf("log.lastIndex = %d, want %d", sm.raftLog.lastIndex(), s.Index)
  691. }
  692. if sm.raftLog.term(s.Index) != s.Term {
  693. t.Errorf("log.lastTerm = %d, want %d", sm.raftLog.term(s.Index), s.Term)
  694. }
  695. sg := int64Slice(sm.nodes())
  696. sw := int64Slice(s.Nodes)
  697. sort.Sort(sg)
  698. sort.Sort(sw)
  699. if !reflect.DeepEqual(sg, sw) {
  700. t.Errorf("sm.Nodes = %+v, want %+v", sg, sw)
  701. }
  702. if !reflect.DeepEqual(sm.raftLog.snapshot, s) {
  703. t.Errorf("snapshot = %+v, want %+v", sm.raftLog.snapshot, s)
  704. }
  705. if ok := sm.restore(s); ok {
  706. t.Fatal("restore succeed, want fail")
  707. }
  708. }
  709. func TestProvideSnap(t *testing.T) {
  710. s := pb.Snapshot{
  711. Index: defaultCompactThreshold + 1,
  712. Term: defaultCompactThreshold + 1,
  713. Nodes: []int64{firstId, firstId + 1},
  714. }
  715. sm := newRaft(firstId, []int64{firstId}, 0, 0)
  716. // restore the statemachin from a snapshot
  717. // so it has a compacted log and a snapshot
  718. sm.restore(s)
  719. sm.becomeCandidate()
  720. sm.becomeLeader()
  721. sm.Step(pb.Message{From: firstId, To: firstId, Type: msgBeat})
  722. msgs := sm.ReadMessages()
  723. if len(msgs) != 1 {
  724. t.Errorf("len(msgs) = %d, want 1", len(msgs))
  725. }
  726. m := msgs[0]
  727. if m.Type != msgApp {
  728. t.Errorf("m.Type = %v, want %v", m.Type, msgApp)
  729. }
  730. // force set the next of node 1, so that
  731. // node 1 needs a snapshot
  732. sm.prs[firstId+1].next = sm.raftLog.offset
  733. sm.Step(pb.Message{From: firstId + 1, To: firstId, Type: msgAppResp, Index: -1})
  734. msgs = sm.ReadMessages()
  735. if len(msgs) != 1 {
  736. t.Errorf("len(msgs) = %d, want 1", len(msgs))
  737. }
  738. m = msgs[0]
  739. if m.Type != msgSnap {
  740. t.Errorf("m.Type = %v, want %v", m.Type, msgSnap)
  741. }
  742. }
  743. func TestRestoreFromSnapMsg(t *testing.T) {
  744. s := pb.Snapshot{
  745. Index: defaultCompactThreshold + 1,
  746. Term: defaultCompactThreshold + 1,
  747. Nodes: []int64{firstId, firstId + 1},
  748. }
  749. m := pb.Message{Type: msgSnap, From: firstId, Term: firstId + 1, Snapshot: s}
  750. sm := newRaft(firstId+1, []int64{firstId, firstId + 1}, 0, 0)
  751. sm.Step(m)
  752. if !reflect.DeepEqual(sm.raftLog.snapshot, s) {
  753. t.Errorf("snapshot = %+v, want %+v", sm.raftLog.snapshot, s)
  754. }
  755. }
  756. func TestSlowNodeRestore(t *testing.T) {
  757. nt := newNetwork(nil, nil, nil)
  758. nt.send(pb.Message{From: firstId, To: firstId, Type: msgHup})
  759. nt.isolate(firstId + 2)
  760. for j := 0; j < defaultCompactThreshold+1; j++ {
  761. nt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{}}})
  762. }
  763. lead := nt.peers[firstId].(*raft)
  764. lead.nextEnts()
  765. lead.compact(nil)
  766. nt.recover()
  767. nt.send(pb.Message{From: firstId, To: firstId, Type: msgBeat})
  768. follower := nt.peers[firstId+2].(*raft)
  769. if !reflect.DeepEqual(follower.raftLog.snapshot, lead.raftLog.snapshot) {
  770. t.Errorf("follower.snap = %+v, want %+v", follower.raftLog.snapshot, lead.raftLog.snapshot)
  771. }
  772. committed := follower.raftLog.lastIndex()
  773. nt.send(pb.Message{From: firstId, To: firstId, Type: msgProp, Entries: []pb.Entry{{}}})
  774. if follower.raftLog.committed != committed+1 {
  775. t.Errorf("follower.comitted = %d, want %d", follower.raftLog.committed, committed+1)
  776. }
  777. }
  778. func ents(terms ...int64) *raft {
  779. ents := []pb.Entry{{}}
  780. for _, term := range terms {
  781. ents = append(ents, pb.Entry{Term: term})
  782. }
  783. sm := &raft{raftLog: &raftLog{ents: ents}}
  784. sm.reset(0)
  785. return sm
  786. }
// network is an in-memory message router used by the tests.
type network struct {
	// peers maps a peer id to the peer that receives messages addressed to it.
	peers map[int64]Interface
	// dropm maps a directed connection to the probability (compared against
	// rand.Float64 in filter) that a message on it is dropped.
	dropm map[connem]float64
	// ignorem marks message types that filter discards unconditionally.
	ignorem map[int64]bool
}
  792. // newNetwork initializes a network from peers.
  793. // A nil node will be replaced with a new *stateMachine.
  794. // A *stateMachine will get its k, id.
  795. // When using stateMachine, the address list is always [0, n).
  796. func newNetwork(peers ...Interface) *network {
  797. size := len(peers)
  798. peerAddrs := make([]int64, size)
  799. for i := 0; i < size; i++ {
  800. peerAddrs[i] = firstId + int64(i)
  801. }
  802. npeers := make(map[int64]Interface, size)
  803. for i, p := range peers {
  804. id := peerAddrs[i]
  805. switch v := p.(type) {
  806. case nil:
  807. sm := newRaft(id, peerAddrs, 0, 0)
  808. npeers[id] = sm
  809. case *raft:
  810. v.id = id
  811. v.prs = make(map[int64]*progress)
  812. for i := 0; i < size; i++ {
  813. v.prs[peerAddrs[i]] = &progress{}
  814. }
  815. v.reset(0)
  816. npeers[id] = v
  817. case *blackHole:
  818. npeers[id] = v
  819. default:
  820. panic("unimplemented")
  821. }
  822. }
  823. return &network{
  824. peers: npeers,
  825. dropm: make(map[connem]float64),
  826. ignorem: make(map[int64]bool),
  827. }
  828. }
  829. func (nw *network) send(msgs ...pb.Message) {
  830. for len(msgs) > 0 {
  831. m := msgs[0]
  832. p := nw.peers[m.To]
  833. p.Step(m)
  834. msgs = append(msgs[1:], nw.filter(p.ReadMessages())...)
  835. }
  836. }
  837. func (nw *network) drop(from, to int64, perc float64) {
  838. nw.dropm[connem{from, to}] = perc
  839. }
  840. func (nw *network) cut(one, other int64) {
  841. nw.drop(one, other, 1)
  842. nw.drop(other, one, 1)
  843. }
  844. func (nw *network) isolate(id int64) {
  845. for i := 0; i < len(nw.peers); i++ {
  846. nid := firstId + int64(i)
  847. if nid != id {
  848. nw.drop(id, nid, 1.0)
  849. nw.drop(nid, id, 1.0)
  850. }
  851. }
  852. }
// ignore marks message type t so that filter discards every message of that
// type until recover is called.
func (nw *network) ignore(t int64) {
	nw.ignorem[t] = true
}
  856. func (nw *network) recover() {
  857. nw.dropm = make(map[connem]float64)
  858. nw.ignorem = make(map[int64]bool)
  859. }
  860. func (nw *network) filter(msgs []pb.Message) []pb.Message {
  861. mm := make([]pb.Message, 0)
  862. for _, m := range msgs {
  863. if nw.ignorem[m.Type] {
  864. continue
  865. }
  866. switch m.Type {
  867. case msgHup:
  868. // hups never go over the network, so don't drop them but panic
  869. panic("unexpected msgHup")
  870. default:
  871. perc := nw.dropm[connem{m.From, m.To}]
  872. if n := rand.Float64(); n < perc {
  873. continue
  874. }
  875. }
  876. mm = append(mm, m)
  877. }
  878. return mm
  879. }
// connem identifies a directed connection between two peer ids; it is the
// key type of network.dropm.
type connem struct {
	from, to int64
}
  883. type blackHole struct{}
  884. func (blackHole) Step(pb.Message) error { return nil }
  885. func (blackHole) ReadMessages() []pb.Message { return nil }
  886. var nopStepper = &blackHole{}