147 lines
5.4 KiB
C
147 lines
5.4 KiB
C
/*
|
|
* Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
|
|
*
|
|
* This program is free software: you can use, redistribute, and/or modify
|
|
* it under the terms of the GNU Affero General Public License, version 3
|
|
* or later ("AGPL"), as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE.
|
|
*
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#define _DEFAULT_SOURCE
|
|
#include "syncRequestVote.h"
|
|
#include "syncMessage.h"
|
|
#include "syncRaftCfg.h"
|
|
#include "syncRaftStore.h"
|
|
#include "syncUtil.h"
|
|
#include "syncVoteMgr.h"
|
|
|
|
// TLA+ Spec
|
|
// HandleRequestVoteRequest(i, j, m) ==
|
|
// LET logOk == \/ m.mlastLogTerm > LastTerm(log[i])
|
|
// \/ /\ m.mlastLogTerm = LastTerm(log[i])
|
|
// /\ m.mlastLogIndex >= Len(log[i])
|
|
// grant == /\ m.mterm = currentTerm[i]
|
|
// /\ logOk
|
|
// /\ votedFor[i] \in {Nil, j}
|
|
// IN /\ m.mterm <= currentTerm[i]
|
|
// /\ \/ grant /\ votedFor' = [votedFor EXCEPT ![i] = j]
|
|
// \/ ~grant /\ UNCHANGED votedFor
|
|
// /\ Reply([mtype |-> RequestVoteResponse,
|
|
// mterm |-> currentTerm[i],
|
|
// mvoteGranted |-> grant,
|
|
// \* mlog is used just for the `elections' history variable for
|
|
// \* the proof. It would not exist in a real implementation.
|
|
// mlog |-> log[i],
|
|
// msource |-> i,
|
|
// mdest |-> j],
|
|
// m)
|
|
// /\ UNCHANGED <<state, currentTerm, candidateVars, leaderVars, logVars>>
|
|
//
|
|
|
|
static bool syncNodeOnRequestVoteLogOK(SSyncNode* ths, SyncRequestVote* pMsg) {
|
|
SyncTerm myLastTerm = syncNodeGetLastTerm(ths);
|
|
SyncIndex myLastIndex = syncNodeGetLastIndex(ths);
|
|
|
|
if (myLastTerm == SYNC_TERM_INVALID) {
|
|
sNTrace(ths,
|
|
"logok:0, {my-lterm:%" PRIu64 ", my-lindex:%" PRId64 ", recv-lterm:%" PRIu64 ", recv-lindex:%" PRId64
|
|
", recv-term:%" PRIu64 "}",
|
|
myLastTerm, myLastIndex, pMsg->lastLogTerm, pMsg->lastLogIndex, pMsg->term);
|
|
return false;
|
|
}
|
|
|
|
if (pMsg->lastLogTerm > myLastTerm) {
|
|
sNTrace(ths,
|
|
"logok:1, {my-lterm:%" PRIu64 ", my-lindex:%" PRId64 ", recv-lterm:%" PRIu64 ", recv-lindex:%" PRId64
|
|
", recv-term:%" PRIu64 "}",
|
|
myLastTerm, myLastIndex, pMsg->lastLogTerm, pMsg->lastLogIndex, pMsg->term);
|
|
|
|
if (pMsg->lastLogIndex < ths->commitIndex) {
|
|
sNWarn(ths,
|
|
"logok:1, commit rollback required. {my-lterm:%" PRIu64 ", my-lindex:%" PRId64 ", recv-lterm:%" PRIu64
|
|
", recv-lindex:%" PRId64 ", recv-term:%" PRIu64 "}",
|
|
myLastTerm, myLastIndex, pMsg->lastLogTerm, pMsg->lastLogIndex, pMsg->term);
|
|
}
|
|
return true;
|
|
}
|
|
|
|
if (pMsg->lastLogTerm == myLastTerm && pMsg->lastLogIndex >= myLastIndex) {
|
|
sNTrace(ths,
|
|
"logok:1, {my-lterm:%" PRIu64 ", my-lindex:%" PRId64 ", recv-lterm:%" PRIu64 ", recv-lindex:%" PRId64
|
|
", recv-term:%" PRIu64 "}",
|
|
myLastTerm, myLastIndex, pMsg->lastLogTerm, pMsg->lastLogIndex, pMsg->term);
|
|
return true;
|
|
}
|
|
|
|
sNTrace(ths,
|
|
"logok:0, {my-lterm:%" PRIu64 ", my-lindex:%" PRId64 ", recv-lterm:%" PRIu64 ", recv-lindex:%" PRId64
|
|
", recv-term:%" PRIu64 "}",
|
|
myLastTerm, myLastIndex, pMsg->lastLogTerm, pMsg->lastLogIndex, pMsg->term);
|
|
return false;
|
|
}
|
|
|
|
int32_t syncNodeOnRequestVote(SSyncNode* ths, const SRpcMsg* pRpcMsg) {
|
|
int32_t ret = 0;
|
|
SyncRequestVote* pMsg = pRpcMsg->pCont;
|
|
bool resetElect = false;
|
|
|
|
syncLogRecvRequestVote(ths, pMsg, -1, "", "recv");
|
|
|
|
// if already drop replica, do not process
|
|
if (!syncNodeInRaftGroup(ths, &pMsg->srcId)) {
|
|
syncLogRecvRequestVote(ths, pMsg, -1, "not in my config", "process");
|
|
|
|
TAOS_RETURN(TSDB_CODE_SYN_MISMATCHED_SIGNATURE);
|
|
}
|
|
|
|
bool logOK = syncNodeOnRequestVoteLogOK(ths, pMsg);
|
|
// maybe update term
|
|
if (pMsg->term > raftStoreGetTerm(ths)) {
|
|
syncNodeStepDown(ths, pMsg->term, pMsg->srcId);
|
|
}
|
|
SyncTerm currentTerm = raftStoreGetTerm(ths);
|
|
if (!(pMsg->term <= currentTerm)) return TSDB_CODE_SYN_INTERNAL_ERROR;
|
|
|
|
sTrace("vgId:%d, begin hasVoted", ths->vgId);
|
|
bool grant = (pMsg->term == currentTerm) && logOK &&
|
|
((!raftStoreHasVoted(ths)) || (syncUtilSameId(&ths->raftStore.voteFor, &pMsg->srcId)));
|
|
if (grant) {
|
|
// maybe has already voted for pMsg->srcId
|
|
// vote again, no harm
|
|
raftStoreVote(ths, &(pMsg->srcId));
|
|
|
|
// candidate ?
|
|
syncNodeStepDown(ths, currentTerm, pMsg->srcId);
|
|
|
|
// forbid elect for this round
|
|
resetElect = true;
|
|
}
|
|
|
|
// send msg
|
|
SRpcMsg rpcMsg = {0};
|
|
|
|
TAOS_CHECK_RETURN(syncBuildRequestVoteReply(&rpcMsg, ths->vgId));
|
|
|
|
SyncRequestVoteReply* pReply = rpcMsg.pCont;
|
|
pReply->srcId = ths->myRaftId;
|
|
pReply->destId = pMsg->srcId;
|
|
pReply->term = currentTerm;
|
|
pReply->voteGranted = grant;
|
|
if (!(!grant || pMsg->term == pReply->term)) return TSDB_CODE_SYN_INTERNAL_ERROR;
|
|
|
|
// trace log
|
|
syncLogRecvRequestVote(ths, pMsg, pReply->voteGranted, "", "proceed");
|
|
syncLogSendRequestVoteReply(ths, pReply, "");
|
|
TAOS_CHECK_RETURN(syncNodeSendMsgById(&pReply->destId, ths, &rpcMsg));
|
|
|
|
if (resetElect) syncNodeResetElectTimer(ths);
|
|
|
|
TAOS_RETURN(TSDB_CODE_SUCCESS);
|
|
}
|