src/raft/raft.go

package raft

//
// this is an outline of the API that raft must expose to
// the service (or tester). see comments below for
// each of these functions for more details.
//
// rf = Make(...)
//   create a new Raft server.
// rf.Start(command interface{}) (index, term, isleader)
//   start agreement on a new log entry
// rf.GetState() (term, isLeader)
//   ask a Raft for its current term, and whether it thinks it is leader
// ApplyMsg
//   each time a new entry is committed to the log, each Raft peer
//   should send an ApplyMsg to the service (or tester)
//   in the same server.
//

import (
	//	"bytes"
	"bytes"
	"math/rand"
	"sync"
	"sync/atomic"
	"time"

	//	"6.5840/labgob"
	"6.5840/labgob"
	"6.5840/labrpc"
)

// as each Raft peer becomes aware that successive log entries are
// committed, the peer should send an ApplyMsg to the service (or
// tester) on the same server, via the applyCh passed to Make(). set
// CommandValid to true to indicate that the ApplyMsg contains a newly
// committed log entry.
//
// in part 2D you'll want to send other kinds of messages (e.g.,
// snapshots) on the applyCh, but set CommandValid to false for these
// other uses.
type ApplyMsg struct {
	CommandValid bool
	Command      interface{}
	CommandIndex int

	// For 2D:
	SnapshotValid bool
	Snapshot      []byte
	SnapshotTerm  int
	SnapshotIndex int
}

// A Go object implementing a single Raft peer.
type Raft struct {
	mu        sync.Mutex          // Lock to protect shared access to this peer's state
	peers     []*labrpc.ClientEnd // RPC end points of all peers
	persister *Persister          // Object to hold this peer's persisted state
	me        int                 // this peer's index into peers[]
	dead      int32               // set by Kill()

	// Your data here (2A, 2B, 2C).
	// Look at the paper's Figure 2 for a description of what
	// state a Raft server must maintain.
	// 所有服务器上的持久性状态 (在响应 RPC 请求之前，已经更新到了稳定的存储设备)

	CurrentTerm    int           // 服务器的任期号（初始化为 0，持续递增）
	VotedFor       int           // 当前投票的候选人的 Id
	Log            []LogEntry    // 日志条目集；每一个条目包含一个用户状态机执行的指令，和收到时的任期号

	LastLogIndex   int         	 // 最后一条日志条目的索引
	LeaderId       int         	 // 领导人的 Id
	State          State       	 // 节点状态
	ElectionTimer  *time.Timer 	 // 选举定时器
	HeartbeatTimer *time.Timer 	 // 心跳定时器
	ApplyCh 	   chan ApplyMsg // 传递给状态机的消息通道
	ApplyCond      *sync.Cond    // 唤醒applier线程的条件变量

	// 所有服务器上的易失性状态

	CommitIndex       int // 已知已提交的最高的日志条目的索引（初始值为0，单调递增）
	LastApplied 	  int // 已经被应用到状态机的最高的日志条目的索引（初始值为0，单调递增）
	LastIncludedIndex int // 快照中包含的最后日志条目的索引值
	LastIncludedTerm  int // 快照中包含的最后日志条目的任期号

	// 领导人上的易失性状态 (选举后已经重新初始化)

	NextIndex  []int // 对于每一台服务器，发送到该服务器的下一个日志条目的索引（初始值为领导人最后的日志条目的索引+1）
	MatchIndex []int //	对于每一台服务器，已知的已经复制到该服务器的最高日志条目的索引（初始值为0，单调递增）

}

// 节点状态
type State int

const (
	Follower  State = iota // 跟随者
	Candidate              // 候选人
	Leader                 // 领导者
)

// 日志条目
type LogEntry struct {
	Term    int         // 领导者收到此条目时的任期号
	Command interface{} // 状态机执行的命令
}

// return currentTerm and whether this server
// believes it is the leader.
func (rf *Raft) GetState() (int, bool) {
	rf.mu.Lock()
	defer rf.mu.Unlock()

	var term int
	var isleader bool
	// Your code here (2A).
	term = rf.CurrentTerm
	isleader = rf.State == Leader
	return term, isleader
}

// save Raft's persistent state to stable storage,
// where it can later be retrieved after a crash and restart.
// see paper's Figure 2 for a description of what should be persistent.
// before you've implemented snapshots, you should pass nil as the
// second argument to persister.Save().
// after you've implemented snapshots, pass the current snapshot
// (or nil if there's not yet a snapshot).
func (rf *Raft) persist() {
	w := new(bytes.Buffer)
	e := labgob.NewEncoder(w)
	e.Encode(rf.CurrentTerm)
	e.Encode(rf.VotedFor)
	e.Encode(rf.Log)
	e.Encode(rf.LastIncludedIndex)
	e.Encode(rf.LastIncludedTerm)
	raftstate := w.Bytes()
	rf.persister.SaveRaftState(raftstate)
	//DPrintf("raft %v persist, CurrentTerm %v, VotedFor %v, Log %v,  LastIncludedIndex %v, LastIncludedTerm %v", rf.me, rf.CurrentTerm, rf.VotedFor, rf.Log, rf.LastIncludedIndex, rf.LastIncludedTerm)
}

// restore previously persisted state.
func (rf *Raft) readPersist(data []byte) {
	if data == nil || len(data) < 1 { // bootstrap without any state?
		return
	}

	r := bytes.NewBuffer(data)
	d := labgob.NewDecoder(r)
	var CurrentTerm int
	var VotedFor int
	var Log []LogEntry
	var LastIncludedIndex int
	var LastIncludedTerm int
	if d.Decode(&CurrentTerm) != nil || d.Decode(&VotedFor) != nil || d.Decode(&Log) != nil || 
	d.Decode(&LastIncludedIndex) != nil || d.Decode(&LastIncludedTerm) != nil{
		//error
	} else {
		rf.CurrentTerm = CurrentTerm
		rf.VotedFor = VotedFor
		rf.Log = Log
		rf.LastIncludedIndex = LastIncludedIndex
		rf.LastIncludedTerm = LastIncludedTerm
		rf.CommitIndex = rf.LastIncludedIndex
		rf.LastApplied = rf.LastIncludedIndex
		rf.LastLogIndex = rf.LastIncludedIndex + len(rf.Log) - 1


		DPrintf("raft %v readPersist, CurrentTerm %v, VotedFor %v, Log %v, LastLogIndex %v", rf.me, rf.CurrentTerm, rf.VotedFor, rf.Log, rf.LastLogIndex)
	}
}

type InstallSnapshotArgs struct {
	Term              int    //领导者的任期
	LeaderId          int    //领导者的 Id，以便于跟随者重定向请求
	LastIncludedIndex int 	 //快照中包含的最后日志条目的索引值
	LastIncludedTerm  int 	 //快照中包含的最后日志条目的任期号
	Data              []byte //快照数据
}

type InstallSnapshotReply struct {
	Term int  //当前任期号，用于领导者去更新自己
}

// InstallSnapshot RPC handler.
func (rf *Raft) InstallSnapshot(args *InstallSnapshotArgs, reply *InstallSnapshotReply) {
	// Your code here (2D).
	rf.mu.Lock()
	defer rf.mu.Unlock()

	//如果term < currentTerm就立即回复
	if args.Term < rf.CurrentTerm {
		reply.Term = rf.CurrentTerm
		return
	}

	if args.Term > rf.CurrentTerm {
		rf.State = Follower
		rf.VotedFor = -1
		rf.CurrentTerm = args.Term
		rf.LeaderId = -1
		rf.persist()
	}

	rf.State = Follower
	rf.LeaderId = args.LeaderId
	rf.resetElectionTimer()

	//如果args.LastIncludedIndex <= rf.CommitIndex，就立即回复
	if args.LastIncludedIndex <= rf.LastIncludedIndex {
		reply.Term = rf.CurrentTerm
		return
	}

	DPrintf("raft %v recieve InstallSnapshot, rf.LastIncludedIndex %v, args.LastIncludedIndex %v, rf.LastIncludedIndex %v", rf.me, rf.LastIncludedIndex, args.LastIncludedIndex, rf.LastIncludedIndex)

	if args.LastIncludedIndex >= rf.LastLogIndex {
		rf.LastLogIndex = args.LastIncludedIndex
		var newLog []LogEntry = make([]LogEntry, 0)
		newLog = append(newLog, LogEntry{Term: args.LastIncludedTerm})
		rf.Log = newLog
	}else{
		//截断日志
		var newLog []LogEntry = make([]LogEntry, 0)
		newLog = append(newLog, LogEntry{Term: args.LastIncludedTerm})
		newLog = append(newLog, rf.Log[args.LastIncludedIndex + 1 - rf.LastIncludedIndex:]...)
		rf.Log = newLog
	}
	
	//更新rf.LastIncludedIndex 和 rf.LastIncludedTerm
	rf.LastIncludedIndex = args.LastIncludedIndex
	rf.LastIncludedTerm = args.LastIncludedTerm

	//更新rf.CommitIndex 和 rf.LastApplied

	rf.CommitIndex = Max(rf.CommitIndex, rf.LastIncludedIndex)
	rf.LastApplied = Max(rf.LastApplied, rf.LastIncludedIndex)
	

	//保存状态和快照
	rf.savaStateAndSnapshot(args.Data)

	reply.Term = rf.CurrentTerm

	applyMsg := ApplyMsg{
		SnapshotValid: true,
		Snapshot: args.Data,
		SnapshotTerm: args.LastIncludedTerm,
		SnapshotIndex: args.LastIncludedIndex,
	}

	rf.mu.Unlock()

	rf.ApplyCh <- applyMsg
}	


func (rf *Raft) savaStateAndSnapshot(snapshot []byte) {
	w := new(bytes.Buffer)
	e := labgob.NewEncoder(w)
	e.Encode(rf.CurrentTerm)
	e.Encode(rf.VotedFor)
	e.Encode(rf.Log)
	e.Encode(rf.LastIncludedIndex)
	e.Encode(rf.LastIncludedTerm)
	state := w.Bytes()
	rf.persister.Save(state, snapshot)
	DPrintf("raft %v savaStateAndSnapshot, CurrentTerm %v, VotedFor %v, Log %v, LastIncludedIndex %v, LastIncludedTerm %v", rf.me, rf.CurrentTerm, rf.VotedFor, rf.Log, rf.LastIncludedIndex, rf.LastIncludedTerm)
}


// the service says it has created a snapshot that has
// all info up to and including index. this means the
// service no longer needs the log through (and including)
// that index. Raft should now trim its log as much as possible.
func (rf *Raft) Snapshot(index int, snapshot []byte) {
	// Your code here (2D).
	rf.mu.Lock()
	defer rf.mu.Unlock()

	if rf.killed() == true {
		return
	}

	if index <= rf.LastIncludedIndex || index > rf.CommitIndex{
		return
	}
	DPrintf("raft %v Snapshot, index %v, LastIncludedIndex %v, LastIncludedTerm %v, CommitIndex %v, LastApplied %v", rf.me, index, rf.LastIncludedIndex, rf.LastIncludedTerm, rf.CommitIndex, rf.LastApplied)

	//如果index > rf.LastIncludedIndex，就截断日志
	//更新rf.LastIncludedIndex 和 rf.LastIncludedTerm
	rf.LastIncludedTerm = rf.Log[index - rf.LastIncludedIndex].Term
	
	var newLog []LogEntry = make([]LogEntry, 0)
	newLog = append(newLog, LogEntry{Term: rf.LastIncludedTerm})
	newLog = append(newLog, rf.Log[index+ 1 - rf.LastIncludedIndex:]...)
	rf.Log = newLog
	rf.LastIncludedIndex = index

	//保存状态和快照
	rf.savaStateAndSnapshot(snapshot)
}

// example RequestVote RPC arguments structure.
// field names must start with capital letters!
type RequestVoteArgs struct {
	// Your data here (2A, 2B).
	Term         int //候选人的任期号
	CandidateId  int //请求选票的候选人的 ID
	LastLogIndex int //候选人的最后日志条目的索引值
	LastLogTerm  int //候选人最后日志条目的任期号
}

// example RequestVote RPC reply structure.
// field names must start with capital letters!
type RequestVoteReply struct {
	// Your data here (2A).
	Term        int  //当前任期号，以便于候选人去更新自己的任期号
	VoteGranted bool //候选人赢得了此张选票时为真
}

// example RequestVote RPC handler.
func (rf *Raft) RequestVote(args *RequestVoteArgs, reply *RequestVoteReply) {
	// Your code here (2A, 2B).
	rf.mu.Lock()
	defer rf.mu.Unlock()

	//如果args.Term < rf.CurrentTerm, 返回 false
	if args.Term < rf.CurrentTerm {
		reply.VoteGranted = false
		reply.Term = rf.CurrentTerm
		return
	}

	//如果节点已经投票给了其他节点，就不再投票，返回 false
	if args.Term == rf.CurrentTerm && rf.VotedFor != -1 && rf.VotedFor != args.CandidateId {
		reply.VoteGranted = false
		reply.Term = rf.CurrentTerm
		return
	}

	//如果 args.Term  > rf.CurrentTerm, 切换状态为跟随者
	if args.Term > rf.CurrentTerm {
		rf.State = Follower
		rf.VotedFor = -1
		rf.CurrentTerm = args.Term
		rf.LeaderId = -1
		rf.persist()
	}

	//选举限制：如果候选人的日志没有自己新，那么就不投票给他
	//Raft 通过比较两份日志中最后一条日志条目的索引值和任期号定义谁的日志比较新。
	//如果两份日志最后的条目的任期号不同，那么任期号大的日志更加新。
	//如果两份日志最后的条目任期号相同，那么日志比较长的那个就更加新。
	if args.LastLogTerm < rf.Log[rf.LastLogIndex - rf.LastIncludedIndex].Term {
		reply.VoteGranted = false
		reply.Term = rf.CurrentTerm
		return
	}else if args.LastLogTerm == rf.Log[rf.LastLogIndex - rf.LastIncludedIndex].Term {
		if args.LastLogIndex < rf.LastLogIndex {
			reply.VoteGranted = false
			reply.Term = rf.CurrentTerm
			return
		}
	}

	//投票给候选人
	rf.VotedFor = args.CandidateId
	reply.VoteGranted = true
	reply.Term = rf.CurrentTerm
	rf.resetElectionTimer()
	rf.persist()
}

// 追加条目RPC参数
type AppendEntriesArgs struct {
	Term         int        //领导者的任期
	LeaderId     int        //领导者的 Id，以便于跟随者重定向请求
	PrevLogIndex int        //紧邻新日志条目之前的那个日志条目的索引
	PrevLogTerm  int        //紧邻新日志条目之前的那个日志条目的任期
	Entries      []LogEntry //准备存储的日志条目（表示心跳时为空；一次性发送多个是为了提高效率）
	LeaderCommit int        //领导人的已知已提交的最高的日志条目的索引
}

type AppendEntriesReply struct {
	Term          int  //当前任期号，用于领导者去更新自己
	Success       bool //如果跟随者所含有的条目和 prevLogIndex 以及 prevLogTerm 匹配上了，则为 true
	ConflictIndex int  //冲突的日志索引
	ConflictTerm  int  //冲突的日志任期
}

// AppendEntries RPC handler.
func (rf *Raft) AppendEntries(args *AppendEntriesArgs, reply *AppendEntriesReply) {
	// Your code here (2A, 2B).
	rf.mu.Lock()
	defer rf.mu.Unlock()

	//DPrintf("raft %v receive AppendEntries, args.PrevLogIndex %v, args.PrevLogTerm %v, rf.LastLogIndex %v, rf.LastIncludedIndex %v", rf.me, args.PrevLogIndex, args.PrevLogTerm, rf.LastLogIndex, rf.LastIncludedIndex)

	reply.ConflictIndex = -1
	reply.ConflictTerm = -1

	//如果args.Term  < rf.CurrentTerm, 返回 false
	if args.Term < rf.CurrentTerm {
		reply.Success = false
		reply.Term = rf.CurrentTerm
		return
	}

	//如果 args.Term  > rf.CurrentTerm，切换状态为跟随者
	if args.Term > rf.CurrentTerm {
		rf.State = Follower
		rf.VotedFor = -1
		rf.CurrentTerm = args.Term
		rf.persist()
	}

	rf.State = Follower
	rf.LeaderId = args.LeaderId
	rf.resetElectionTimer()

	//如果接收者日志中没有包含这样一个条目，那么就返回 false
	if args.PrevLogIndex < rf.LastIncludedIndex {
		reply.Success = false
		reply.Term = rf.CurrentTerm
		reply.ConflictIndex = rf.LastIncludedIndex + 1
		reply.ConflictTerm = -1
		return
	}


	//在接收者日志中, 如果找不到PrevLogIndex
	//应该返回 conflictIndex = len(log) 和 conflictTerm = None。
	if args.PrevLogIndex > rf.LastLogIndex {
		reply.Success = false
		reply.Term = rf.CurrentTerm
		reply.ConflictIndex = rf.LastLogIndex + 1
		reply.ConflictTerm = -1
		return
	}

	//在接收者日志中, 如果追随者的日志中有 preLogIndex，但是任期不匹配
	//返回 conflictTerm = log[preLogIndex].Term，然后在它的日志中搜索任期等于 conflictTerm 的第一个条目索引。
	if args.PrevLogIndex >= rf.LastIncludedIndex && rf.Log[args.PrevLogIndex - rf.LastIncludedIndex].Term != args.PrevLogTerm {
		reply.Success = false
		reply.Term = rf.CurrentTerm
		reply.ConflictTerm = rf.Log[args.PrevLogIndex - rf.LastIncludedIndex].Term
		index := args.PrevLogIndex
		for index >= rf.LastIncludedIndex && rf.Log[index - rf.LastIncludedIndex].Term == reply.ConflictTerm {
			index--
		}
		reply.ConflictIndex = index + 1
		return
	}

	
	DPrintf("raft %v start AppendEntries, args.PrevLogIndex %v, args.PrevLogTerm %v, rf.LastLogIndex %v, rf.LastIncludedIndex %v", rf.me, args.PrevLogIndex, args.PrevLogTerm, rf.LastLogIndex, rf.LastIncludedIndex)
	//如果一个已经存在的条目和新条目（即刚刚接收到的日志条目）发生了冲突（因为索引相同，任期不同），那么就删除这个已经存在的条目以及它之后的所有条目
	if len(args.Entries) > 0 {
		for i, entry := range args.Entries {
			if args.PrevLogIndex+i+1 > rf.LastLogIndex {
				rf.Log = append(rf.Log, entry)
				rf.LastLogIndex++
			} else {
				if rf.Log[args.PrevLogIndex+i+1 - rf.LastIncludedIndex].Term != entry.Term {
					rf.Log = rf.Log[:args.PrevLogIndex+i+1 - rf.LastIncludedIndex]
					rf.Log = append(rf.Log, entry)
					rf.LastLogIndex = args.PrevLogIndex + i + 1
				}
			}
		}
	}
	
	rf.persist()

	//如果leaderCommit > commitIndex
	//则把commitIndex 重置为  leaderCommit 或者是 上一个新条目的索引 取两者的最小值
	if args.LeaderCommit > rf.CommitIndex {
		rf.CommitIndex = args.LeaderCommit
		if rf.CommitIndex > rf.LastLogIndex {
			rf.CommitIndex = rf.LastLogIndex
		}
		rf.ApplyCond.Broadcast()
	}

	reply.Success = true
	reply.Term = rf.CurrentTerm
}


// example code to send a RequestVote RPC to a server.
// server is the index of the target server in rf.peers[].
// expects RPC arguments in args.
// fills in *reply with RPC reply, so caller should
// pass &reply.
// the types of the args and reply passed to Call() must be
// the same as the types of the arguments declared in the
// handler function (including whether they are pointers).
//
// The labrpc package simulates a lossy network, in which servers
// may be unreachable, and in which requests and replies may be lost.
// Call() sends a request and waits for a reply. If a reply arrives
// within a timeout interval, Call() returns true; otherwise
// Call() returns false. Thus Call() may not return for a while.
// A false return can be caused by a dead server, a live server that
// can't be reached, a lost request, or a lost reply.
//
// Call() is guaranteed to return (perhaps after a delay) *except* if the
// handler function on the server side does not return.  Thus there
// is no need to implement your own timeouts around Call().
//
// look at the comments in ../labrpc/labrpc.go for more details.
//
// if you're having trouble getting RPC to work, check that you've
// capitalized all field names in structs passed over RPC, and
// that the caller passes the address of the reply struct with &, not
// the struct itself.
func (rf *Raft) sendRequestVote(server int, args *RequestVoteArgs, reply *RequestVoteReply) bool {
	ok := rf.peers[server].Call("Raft.RequestVote", args, reply)
	return ok
}

func (rf *Raft) sendAppendEntries(server int, args *AppendEntriesArgs, reply *AppendEntriesReply) bool {
	ok := rf.peers[server].Call("Raft.AppendEntries", args, reply)
	return ok
}

func (rf *Raft) sendInstallSnapshot(server int, args *InstallSnapshotArgs, reply *InstallSnapshotReply) bool {
	ok := rf.peers[server].Call("Raft.InstallSnapshot", args, reply)
	return ok
}

// the service using Raft (e.g. a k/v server) wants to start
// agreement on the next command to be appended to Raft's log. if this
// server isn't the leader, returns false. otherwise start the
// agreement and return immediately. there is no guarantee that this
// command will ever be committed to the Raft log, since the leader
// may fail or lose an election. even if the Raft instance has been killed,
// this function should return gracefully.
//
// the first return value is the index that the command will appear at
// if it's ever committed. the second return value is the current
// term. the third return value is true if this server believes it is
// the leader.
func (rf *Raft) Start(command interface{}) (int, int, bool) {
	rf.mu.Lock()
	defer rf.mu.Unlock()

	index := -1
	term := -1
	isLeader := true

	// Your code here (2B).
	//如果不是领导者，返回 false
	if rf.State != Leader {
		return index, term, false
	}

	//如果是领导者，就把命令追加到自己的日志中
	rf.Log = append(rf.Log, LogEntry{Term: rf.CurrentTerm, Command: command})

	//更新最后一条日志的索引
	rf.LastLogIndex++

	DPrintf("raft %v receive command %v, term %v", rf.me, command, rf.CurrentTerm)

	//持久化
	rf.persist()

	//广播
	rf.broadcast()
	rf.resetHeartbeatTimer()

	//返回值
	index = rf.LastLogIndex
	term = rf.CurrentTerm
	isLeader = true

	return index, term, isLeader
}

// the tester doesn't halt goroutines created by Raft after each test,
// but it does call the Kill() method. your code can use killed() to
// check whether Kill() has been called. the use of atomic avoids the
// need for a lock.
//
// the issue is that long-running goroutines use memory and may chew
// up CPU time, perhaps causing later tests to fail and generating
// confusing debug output. any goroutine with a long-running loop
// should call killed() to check whether it should stop.
func (rf *Raft) Kill() {
	atomic.StoreInt32(&rf.dead, 1)
	// Your code here, if desired.
}

func (rf *Raft) killed() bool {
	z := atomic.LoadInt32(&rf.dead)
	return z == 1
}

func (rf *Raft) ticker() {

	for rf.killed() == false {
		// Your code here (2A)
		// Check if a leader election should be started.

		select {
		case <-rf.ElectionTimer.C:
			rf.mu.Lock()
			if rf.State == Leader {
				rf.mu.Unlock()
				continue
			}
			rf.becomeCandidate()
			rf.startElection()
			rf.resetElectionTimer()
			rf.mu.Unlock()
		case <-rf.HeartbeatTimer.C:
			rf.mu.Lock()
			if rf.State == Leader {
				rf.broadcast()
				rf.resetHeartbeatTimer()
			}
			rf.mu.Unlock()
		}
	}
}

// 转换为候选人，开始新一轮选举
func (rf *Raft) becomeCandidate() {

	//转换为候选人
	rf.State = Candidate
	//增加当前任期号
	rf.CurrentTerm++

	rf.persist()

	DPrintf("raft %v become candidate, term %v", rf.me, rf.CurrentTerm)
}

// 转换为领导者
func (rf *Raft) becomeLeader() {

	if rf.State != Candidate {
		return
	}

	//转换为领导者
	rf.State = Leader
	rf.LeaderId = rf.me
	//初始化 nextIndex 和 matchIndex
	//初始化所有的 nextIndex 值为自己的最后一条日志的 index 加 1
	for i := range rf.peers {
		//rf.NextIndex[i] = rf.LastLogIndex + 1
		rf.NextIndex[i] = Max(rf.LastLogIndex + 1, rf.NextIndex[i])
		rf.MatchIndex[i] = 0
	}

	DPrintf("raft %v become leader, term %v", rf.me, rf.CurrentTerm)
}

// 开始选举
func (rf *Raft) startElection() {

	if rf.State == Candidate {

		//给自己投票
		rf.VotedFor = rf.me
		rf.persist()
		//选票数
		voteCount := 1

		//给所有其他节点发送投票请求
		for peer := range rf.peers {
			if peer != rf.me {
				//异步调用自检
				if rf.State != Candidate {
					return
				}
				args := RequestVoteArgs{}
				args.Term = rf.CurrentTerm
				args.CandidateId = rf.me
				args.LastLogIndex = rf.LastLogIndex
				args.LastLogTerm = rf.Log[args.LastLogIndex - rf.LastIncludedIndex].Term

				reply := RequestVoteReply{}
				DPrintf("raft %v send RequestVote to %v, args.Term %v, args.LastLogIndex %v, args.LastLogTerm %v", rf.me, peer, args.Term, args.LastLogIndex, args.LastLogTerm)
				go rf.requestVote(peer, &args, &reply, &voteCount)
			}
		}
	}
}

// 请求投票
func (rf *Raft) requestVote(peer int, args *RequestVoteArgs, reply *RequestVoteReply, voteCount *int) {

	ok := rf.sendRequestVote(peer, args, reply)

	if ok {
		rf.mu.Lock()
		defer rf.mu.Unlock()
		DPrintf("raft %v receive RequestVote reply from %v, reply.Term %v, reply.VoteGranted %v", rf.me, peer, reply.Term, reply.VoteGranted)

		//如果收到旧的 RPC 的回复，先记录回复中的任期（可能高于您当前的任期），
		//然后将当前任期与您在原始 RPC 中发送的任期进行比较。如果两者不同，请放弃回复并返回
		if rf.CurrentTerm != args.Term || rf.State != Candidate {
			return
		}

		if reply.VoteGranted {
			*voteCount++
			//如果获得了大多数的选票，就成为领导人
			if *voteCount > len(rf.peers)/2 {
				rf.becomeLeader()
				rf.broadcast()
				rf.resetHeartbeatTimer()
			}
		} else if reply.Term > rf.CurrentTerm {
			//如果对方的任期号比自己大，就转换为跟随者
			rf.State = Follower
			rf.VotedFor = -1
			rf.CurrentTerm = reply.Term
			rf.resetElectionTimer()
			rf.persist()
		}
	}
}

// 广播
func (rf *Raft) broadcast() {

	if rf.State != Leader {
		return
	}

	for peer := range rf.peers {
		if peer != rf.me {
			//异步调用自检
			if rf.State != Leader {
				return
			}

			//检查是否发送快照
			if rf.NextIndex[peer] <= rf.LastIncludedIndex {
				args := InstallSnapshotArgs{}
				args.Term = rf.CurrentTerm
				args.LeaderId = rf.me
				args.LastIncludedIndex = rf.LastIncludedIndex
				args.LastIncludedTerm = rf.LastIncludedTerm
				args.Data = rf.persister.ReadSnapshot()

				reply := InstallSnapshotReply{}

				DPrintf("raft %v send InstallSnapshot to %v, args.Term %v, args.LastIncludedIndex %v, args.LastIncludedTerm %v, args.Data %v", rf.me, peer, args.Term, args.LastIncludedIndex, args.LastIncludedTerm, args.Data)
				
				go rf.sendSnapshot(peer, &args, &reply)
			} else {
				//发送日志
				args := AppendEntriesArgs{}
				args.Term = rf.CurrentTerm
				args.LeaderId = rf.me
				args.PrevLogIndex = rf.NextIndex[peer] - 1
				args.PrevLogTerm = rf.Log[args.PrevLogIndex - rf.LastIncludedIndex].Term
				args.LeaderCommit = rf.CommitIndex
				//表示心跳， 为空
				args.Entries = make([]LogEntry, 0)
				//如果存在日志条目要发送，就发送日志条目
				if rf.NextIndex[peer] <= rf.LastLogIndex {
					//深拷贝
					args.Entries = append(args.Entries, rf.Log[rf.NextIndex[peer] - rf.LastIncludedIndex:]...)
				}
			
				reply := AppendEntriesReply{}
				DPrintf("raft %v send AppendEntries to %v, args.Term %v, args.PrevLogIndex %v, args.PrevLogTerm %v, args.LeaderCommit %v, args.Entries %v", rf.me, peer, args.Term, args.PrevLogIndex, args.PrevLogTerm, args.LeaderCommit, args.Entries)
				//DPrintf("raft %v sendLog to %v, before go rf.sendLog(peer), rf.NextIndex[peer] %v, rf.LastIncludedIndex %v", rf.me, peer, rf.NextIndex[peer], rf.LastIncludedIndex)
				go rf.sendLog(peer, &args, &reply)
			}
		}
	}
}

// 发送日志(空时，表示心跳)
func (rf *Raft) sendLog(peer int, args *AppendEntriesArgs, reply *AppendEntriesReply) {

	ok := rf.sendAppendEntries(peer, args, reply)

	if ok {
		rf.mu.Lock()
		defer rf.mu.Unlock()
		DPrintf("raft %v receive AppendEntries reply from %v, reply.Term %v, reply.Success %v, reply.ConflictIndex %v, reply.ConflictTerm %v", rf.me, peer, reply.Term, reply.Success, reply.ConflictIndex, reply.ConflictTerm)

		//如果收到旧的 RPC 的回复，先记录回复中的任期（可能高于您当前的任期），
		//然后将当前任期与您在原始 RPC 中发送的任期进行比较。如果两者不同，请放弃回复并返回
		if rf.CurrentTerm != args.Term || rf.State != Leader {
			return
		}

		//处理返回体
		//如果成功，更新 nextIndex 和 matchIndex
		if reply.Success == true {
			//rf.NextIndex[peer] = args.PrevLogIndex + len(args.Entries) + 1
			//rf.MatchIndex[peer] = args.PrevLogIndex + len(args.Entries)
			rf.NextIndex[peer] = Max(args.PrevLogIndex + len(args.Entries) + 1, rf.NextIndex[peer])
			rf.MatchIndex[peer] = Max(args.PrevLogIndex + len(args.Entries), rf.MatchIndex[peer])

			//如果存在一个满足 N > commitIndex 的 N，并且大多数的 matchIndex[i] ≥ N 成立，并且 log[N].term == currentTerm 成立，那么令 commitIndex 等于这个 N
			for N := rf.CommitIndex + 1; N <= rf.LastLogIndex; N++ {
				if rf.Log[N - rf.LastIncludedIndex].Term == rf.CurrentTerm {
					count := 1
					for i := range rf.peers {
						if i != rf.me && rf.MatchIndex[i] >= N {
							count++
						}
					}
					if count > len(rf.peers)/2 {
						rf.CommitIndex = N
						//break
					}
				}
			}
			rf.ApplyCond.Broadcast()
		} else {
			//如果对方的任期号比自己大，就转换为跟随者
			if reply.Term > rf.CurrentTerm {
				rf.State = Follower
				rf.VotedFor = -1
				rf.CurrentTerm = reply.Term
				rf.resetElectionTimer()
				rf.persist()
			} else {
				//如果失败，就递减 nextIndex 重试
				// rf.NextIndex[peer]--
				// if rf.NextIndex[peer] < 1 {
				// 	rf.NextIndex[peer] = 1
				// }

				if reply.ConflictTerm == -1 {
					rf.NextIndex[peer] = reply.ConflictIndex
				} else {
					conflictIndex := -1
					//在收到一个冲突响应后，领导者首先应该搜索其日志中任期为 conflictTerm 的条目。
					//如果领导者在其日志中找到此任期的一个条目，则应该设置 nextIndex 为其日志中此任期的最后一个条目的索引的下一个。
					for i := args.PrevLogIndex; i >= rf.LastIncludedIndex; i-- {
						if rf.Log[i - rf.LastIncludedIndex].Term == reply.ConflictTerm {
							conflictIndex = i
							break
						}
					}
					//如果领导者没有找到此任期的条目，则应该设置 nextIndex = conflictIndex
					if conflictIndex == -1 {
						rf.NextIndex[peer] = reply.ConflictIndex
					} else {
						rf.NextIndex[peer] = conflictIndex + 1
					}
				}
			}
		}
	}
}


// 发送快照
func (rf *Raft) sendSnapshot(peer int, args *InstallSnapshotArgs, reply *InstallSnapshotReply) {

	ok := rf.sendInstallSnapshot(peer, args, reply)

	if ok {
		rf.mu.Lock()
		defer rf.mu.Unlock()
		DPrintf("raft %v receive InstallSnapshot reply from %v, reply.Term %v", rf.me, peer, reply.Term)

		//如果收到旧的 RPC 的回复，先记录回复中的任期（可能高于您当前的任期），
		//然后将当前任期与您在原始 RPC 中发送的任期进行比较。如果两者不同，请放弃回复并返回
		if rf.CurrentTerm != args.Term || rf.State != Leader {
			return
		}

		//如果对方的任期号比自己大，就转换为跟随者
		if reply.Term > rf.CurrentTerm {
			rf.State = Follower
			rf.VotedFor = -1
			rf.CurrentTerm = reply.Term
			rf.resetElectionTimer()
			rf.persist()
		}else{
			//rf.NextIndex[peer] = rf.LastIncludedIndex + 1
			rf.NextIndex[peer] = Max(args.LastIncludedIndex + 1, rf.NextIndex[peer])
			rf.MatchIndex[peer] = Max(rf.LastIncludedIndex, rf.MatchIndex[peer])
		}
	}
}


func Max(x, y int) int {
    if x > y {
        return x
    }
    return y
}


// 重置选举计时器
func (rf *Raft) resetElectionTimer() {
	rf.ElectionTimer.Stop()
	rf.ElectionTimer.Reset(randomElectionTimeout())
	//DPrintf("raft %v reset election timer", rf.me)
}

// 随机选举超时时间,选举超时应该在 150 到 300 毫秒范围内
func randomElectionTimeout() time.Duration {
	return time.Millisecond * time.Duration(rand.Intn(200)+250)
}

// 重置心跳计时器
func (rf *Raft) resetHeartbeatTimer() {
	rf.HeartbeatTimer.Stop()
	rf.HeartbeatTimer.Reset(fixedHeartbeatTimeout())
}

// 固定心跳超时时间
func fixedHeartbeatTimeout() time.Duration {
	return time.Millisecond * 100
}

// 应用日志,使用applyCond来同步
func (rf *Raft) applier() {
	for rf.killed() == false {
		rf.mu.Lock()
		for rf.LastApplied >= rf.CommitIndex {
			rf.ApplyCond.Wait()
		}

		lastIncludedIndex := rf.LastIncludedIndex
		lastApplied := rf.LastApplied
		commitIndex := rf.CommitIndex
		entries := make([]LogEntry, commitIndex - lastApplied)
		copy(entries, rf.Log[lastApplied + 1 - lastIncludedIndex:commitIndex + 1 - lastIncludedIndex])
		rf.mu.Unlock()
		for i , entry := range entries {
			applymsg := ApplyMsg{CommandValid: true, Command: entry.Command, CommandIndex: lastApplied + 1 + i}
			rf.ApplyCh <- applymsg
		}
		rf.mu.Lock()
		rf.LastApplied = Max(rf.LastApplied, commitIndex)
		rf.mu.Unlock()

		// for rf.LastApplied < rf.CommitIndex {
		// 	rf.LastApplied++
		// 	applymsg := ApplyMsg{CommandValid: true, Command: rf.Log[rf.LastApplied - rf.LastIncludedIndex].Command, CommandIndex: rf.LastApplied}
		// 	DPrintf("raft %v apply log %v, term %v, index %v", rf.me, rf.Log[rf.LastApplied - rf.LastIncludedIndex].Command, rf.Log[rf.LastApplied - rf.LastIncludedIndex].Term, rf.LastApplied)
		// 	rf.mu.Unlock()
		// 	rf.ApplyCh <- applymsg	
		// 	rf.mu.Lock()	
		// }
		// rf.mu.Unlock()
	}
}

// func (rf *Raft) applier() {
// 	for rf.killed() == false {
// 		rf.mu.Lock()
		
// 		//如果 commitIndex > lastApplied，那么就 lastApplied 加一，并把 log[lastApplied] 应用到状态机中
// 		for rf.CommitIndex > rf.LastApplied {
// 			//DPrintf("raft %v applier, rf.CommitIndex %v, rf.LastApplied %v", rf.me, rf.CommitIndex, rf.LastApplied)
// 			rf.LastApplied++
// 			applymsg := ApplyMsg{CommandValid: true, Command: rf.Log[rf.LastApplied - rf.LastIncludedIndex].Command, CommandIndex: rf.LastApplied}
// 			DPrintf("raft %v apply log %v, term %v, index %v", rf.me, rf.Log[rf.LastApplied - rf.LastIncludedIndex].Command, rf.Log[rf.LastApplied - rf.LastIncludedIndex].Term, rf.LastApplied)
// 			rf.mu.Unlock()
// 			rf.ApplyCh <- applymsg	
// 			rf.mu.Lock()	
// 		}
// 		rf.mu.Unlock()
// 		time.Sleep(10 * time.Millisecond)
// 	}
// }


// the service or tester wants to create a Raft server. the ports
// of all the Raft servers (including this one) are in peers[]. this
// server's port is peers[me]. all the servers' peers[] arrays
// have the same order. persister is a place for this server to
// save its persistent state, and also initially holds the most
// recent saved state, if any. applyCh is a channel on which the
// tester or service expects Raft to send ApplyMsg messages.
// Make() must return quickly, so it should start goroutines
// for any long-running work.
func Make(peers []*labrpc.ClientEnd, me int,
	persister *Persister, applyCh chan ApplyMsg) *Raft {
	rf := &Raft{}
	rf.peers = peers
	rf.persister = persister
	rf.me = me

	// Your initialization code here (2A, 2B, 2C).
	//2A
	rf.State = Follower
	rf.VotedFor = -1
	rf.CurrentTerm = 0
	rf.ElectionTimer = time.NewTimer(randomElectionTimeout())
	rf.HeartbeatTimer = time.NewTimer(fixedHeartbeatTimeout())
	//2B
	rf.ApplyCond = sync.NewCond(&rf.mu)
	rf.ApplyCh = applyCh
	rf.NextIndex = make([]int, len(peers))
	rf.MatchIndex = make([]int, len(peers))
	rf.Log = append(rf.Log, LogEntry{Term: 0})
	rf.LastLogIndex = 0
	rf.CommitIndex = 0
	rf.LastApplied = 0
	//2D
	rf.LastIncludedIndex = 0
	rf.LastIncludedTerm = 0

	// initialize from state persisted before a crash
	rf.readPersist(persister.ReadRaftState())
	
	// start ticker goroutine to start elections
	go rf.ticker()

	// start applyCh goroutine to apply committed log entries
	go rf.applier()

	return rf
}