mirror of
https://github.com/etcd-io/etcd.git
synced 2024-09-27 06:25:44 +00:00
raft: make leader transferring workable when quorum check is on
This commit is contained in:
parent
8e9097d0c0
commit
e020b2a228
24
raft/raft.go
24
raft/raft.go
@ -15,6 +15,7 @@
|
|||||||
package raft
|
package raft
|
||||||
|
|
||||||
import (
|
import (
|
||||||
|
"bytes"
|
||||||
"errors"
|
"errors"
|
||||||
"fmt"
|
"fmt"
|
||||||
"math"
|
"math"
|
||||||
@ -36,6 +37,17 @@ const (
|
|||||||
StateLeader
|
StateLeader
|
||||||
)
|
)
|
||||||
|
|
||||||
|
// Possible values for CampaignType
|
||||||
|
const (
|
||||||
|
LeaderElection CampaignType = "LeaderElection"
|
||||||
|
LeaderTransfer CampaignType = "LeaderTransfer"
|
||||||
|
)
|
||||||
|
|
||||||
|
// CampaignType represents the type of campaigning
|
||||||
|
// the reason we use the type of string instead of uint64
|
||||||
|
// is because it's simpler to compare and fill in raft entries
|
||||||
|
type CampaignType string
|
||||||
|
|
||||||
// StateType represents the role of a node in a cluster.
|
// StateType represents the role of a node in a cluster.
|
||||||
type StateType uint64
|
type StateType uint64
|
||||||
|
|
||||||
@ -520,7 +532,7 @@ func (r *raft) becomeLeader() {
|
|||||||
r.logger.Infof("%x became leader at term %d", r.id, r.Term)
|
r.logger.Infof("%x became leader at term %d", r.id, r.Term)
|
||||||
}
|
}
|
||||||
|
|
||||||
func (r *raft) campaign() {
|
func (r *raft) campaign(t CampaignType) {
|
||||||
r.becomeCandidate()
|
r.becomeCandidate()
|
||||||
if r.quorum() == r.poll(r.id, true) {
|
if r.quorum() == r.poll(r.id, true) {
|
||||||
r.becomeLeader()
|
r.becomeLeader()
|
||||||
@ -532,7 +544,7 @@ func (r *raft) campaign() {
|
|||||||
}
|
}
|
||||||
r.logger.Infof("%x [logterm: %d, index: %d] sent vote request to %x at term %d",
|
r.logger.Infof("%x [logterm: %d, index: %d] sent vote request to %x at term %d",
|
||||||
r.id, r.raftLog.lastTerm(), r.raftLog.lastIndex(), id, r.Term)
|
r.id, r.raftLog.lastTerm(), r.raftLog.lastIndex(), id, r.Term)
|
||||||
r.send(pb.Message{To: id, Type: pb.MsgVote, Index: r.raftLog.lastIndex(), LogTerm: r.raftLog.lastTerm()})
|
r.send(pb.Message{To: id, Type: pb.MsgVote, Index: r.raftLog.lastIndex(), LogTerm: r.raftLog.lastTerm(), Entries: []pb.Entry{{Data: []byte(t)}}})
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -557,7 +569,7 @@ func (r *raft) Step(m pb.Message) error {
|
|||||||
if m.Type == pb.MsgHup {
|
if m.Type == pb.MsgHup {
|
||||||
if r.state != StateLeader {
|
if r.state != StateLeader {
|
||||||
r.logger.Infof("%x is starting a new election at term %d", r.id, r.Term)
|
r.logger.Infof("%x is starting a new election at term %d", r.id, r.Term)
|
||||||
r.campaign()
|
r.campaign(LeaderElection)
|
||||||
} else {
|
} else {
|
||||||
r.logger.Debugf("%x ignoring MsgHup because already leader", r.id)
|
r.logger.Debugf("%x ignoring MsgHup because already leader", r.id)
|
||||||
}
|
}
|
||||||
@ -575,7 +587,9 @@ func (r *raft) Step(m pb.Message) error {
|
|||||||
case m.Term > r.Term:
|
case m.Term > r.Term:
|
||||||
lead := m.From
|
lead := m.From
|
||||||
if m.Type == pb.MsgVote {
|
if m.Type == pb.MsgVote {
|
||||||
if r.checkQuorum && r.state != StateCandidate && r.electionElapsed < r.electionTimeout {
|
force := len(m.Entries) == 1 && bytes.Equal(m.Entries[0].Data, []byte(LeaderTransfer))
|
||||||
|
inLease := r.checkQuorum && r.state != StateCandidate && r.electionElapsed < r.electionTimeout
|
||||||
|
if !force && inLease {
|
||||||
// If a server receives a RequestVote request within the minimum election timeout
|
// If a server receives a RequestVote request within the minimum election timeout
|
||||||
// of hearing from a current leader, it does not update its term or grant its vote
|
// of hearing from a current leader, it does not update its term or grant its vote
|
||||||
r.logger.Infof("%x [logterm: %d, index: %d, vote: %x] ignored vote from %x [logterm: %d, index: %d] at term %d: lease is not expired (remaining ticks: %d)",
|
r.logger.Infof("%x [logterm: %d, index: %d, vote: %x] ignored vote from %x [logterm: %d, index: %d] at term %d: lease is not expired (remaining ticks: %d)",
|
||||||
@ -842,7 +856,7 @@ func stepFollower(r *raft, m pb.Message) {
|
|||||||
}
|
}
|
||||||
case pb.MsgTimeoutNow:
|
case pb.MsgTimeoutNow:
|
||||||
r.logger.Infof("%x [term %d] received MsgTimeoutNow from %x and starts an election to get leadership.", r.id, r.Term, m.From)
|
r.logger.Infof("%x [term %d] received MsgTimeoutNow from %x and starts an election to get leadership.", r.id, r.Term, m.From)
|
||||||
r.campaign()
|
r.campaign(LeaderTransfer)
|
||||||
case pb.MsgReadIndex:
|
case pb.MsgReadIndex:
|
||||||
if r.lead == None {
|
if r.lead == None {
|
||||||
r.logger.Infof("%x no leader at term %d; dropping index reading msg", r.id, r.Term)
|
r.logger.Infof("%x no leader at term %d; dropping index reading msg", r.id, r.Term)
|
||||||
|
@ -175,8 +175,8 @@ func testNonleaderStartElection(t *testing.T, state StateType) {
|
|||||||
msgs := r.readMessages()
|
msgs := r.readMessages()
|
||||||
sort.Sort(messageSlice(msgs))
|
sort.Sort(messageSlice(msgs))
|
||||||
wmsgs := []pb.Message{
|
wmsgs := []pb.Message{
|
||||||
{From: 1, To: 2, Term: 2, Type: pb.MsgVote},
|
{From: 1, To: 2, Term: 2, Type: pb.MsgVote, Entries: []pb.Entry{{Data: []byte(LeaderElection)}}},
|
||||||
{From: 1, To: 3, Term: 2, Type: pb.MsgVote},
|
{From: 1, To: 3, Term: 2, Type: pb.MsgVote, Entries: []pb.Entry{{Data: []byte(LeaderElection)}}},
|
||||||
}
|
}
|
||||||
if !reflect.DeepEqual(msgs, wmsgs) {
|
if !reflect.DeepEqual(msgs, wmsgs) {
|
||||||
t.Errorf("msgs = %v, want %v", msgs, wmsgs)
|
t.Errorf("msgs = %v, want %v", msgs, wmsgs)
|
||||||
|
@ -2208,6 +2208,41 @@ func TestLeaderTransferToUpToDateNode(t *testing.T) {
|
|||||||
checkLeaderTransferState(t, lead, StateLeader, 1)
|
checkLeaderTransferState(t, lead, StateLeader, 1)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// TestLeaderTransferWithCheckQuorum ensures transferring leader still works
|
||||||
|
// even the current leader is still under its leader lease
|
||||||
|
func TestLeaderTransferWithCheckQuorum(t *testing.T) {
|
||||||
|
nt := newNetwork(nil, nil, nil)
|
||||||
|
for i := 1; i < 4; i++ {
|
||||||
|
r := nt.peers[uint64(i)].(*raft)
|
||||||
|
r.checkQuorum = true
|
||||||
|
}
|
||||||
|
|
||||||
|
f := nt.peers[2].(*raft)
|
||||||
|
for i := 0; i < f.electionTimeout; i++ {
|
||||||
|
f.tick()
|
||||||
|
}
|
||||||
|
|
||||||
|
nt.send(pb.Message{From: 1, To: 1, Type: pb.MsgHup})
|
||||||
|
|
||||||
|
lead := nt.peers[1].(*raft)
|
||||||
|
|
||||||
|
if lead.lead != 1 {
|
||||||
|
t.Fatalf("after election leader is %x, want 1", lead.lead)
|
||||||
|
}
|
||||||
|
|
||||||
|
// Transfer leadership to 2.
|
||||||
|
nt.send(pb.Message{From: 2, To: 1, Type: pb.MsgTransferLeader})
|
||||||
|
|
||||||
|
checkLeaderTransferState(t, lead, StateFollower, 2)
|
||||||
|
|
||||||
|
// After some log replication, transfer leadership back to 1.
|
||||||
|
nt.send(pb.Message{From: 1, To: 1, Type: pb.MsgProp, Entries: []pb.Entry{{}}})
|
||||||
|
|
||||||
|
nt.send(pb.Message{From: 1, To: 2, Type: pb.MsgTransferLeader})
|
||||||
|
|
||||||
|
checkLeaderTransferState(t, lead, StateLeader, 1)
|
||||||
|
}
|
||||||
|
|
||||||
func TestLeaderTransferToSlowFollower(t *testing.T) {
|
func TestLeaderTransferToSlowFollower(t *testing.T) {
|
||||||
defaultLogger.EnableDebug()
|
defaultLogger.EnableDebug()
|
||||||
nt := newNetwork(nil, nil, nil)
|
nt := newNetwork(nil, nil, nil)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user