146 lines
3.7 KiB
C
146 lines
3.7 KiB
C
/*
|
|
* Copyright (c) 2019 TAOS Data, Inc. <cli@taosdata.com>
|
|
*
|
|
* This program is free software: you can use, redistribute, and/or modify
|
|
* it under the terms of the GNU Affero General Public License, version 3
|
|
* or later ("AGPL"), as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful, but WITHOUT
|
|
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
* FITNESS FOR A PARTICULAR PURPOSE.
|
|
*
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#ifndef _TD_LIBS_SYNC_RAFT_H
|
|
#define _TD_LIBS_SYNC_RAFT_H
|
|
|
|
#include "sync.h"
|
|
#include "sync_type.h"
|
|
#include "thash.h"
|
|
#include "raft_message.h"
|
|
#include "sync_raft_impl.h"
|
|
#include "sync_raft_quorum.h"
|
|
|
|
typedef struct RaftLeaderState {
|
|
|
|
} RaftLeaderState;
|
|
|
|
typedef struct RaftCandidateState {
|
|
/* true if in pre-vote phase */
|
|
bool inPreVote;
|
|
} RaftCandidateState;
|
|
|
|
typedef struct SSyncRaftIOMethods {
|
|
// send SSyncMessage to node
|
|
int (*send)(const SSyncMessage* pMsg, const SNodeInfo* pNode);
|
|
} SSyncRaftIOMethods;
|
|
|
|
typedef int (*SyncRaftStepFp)(SSyncRaft* pRaft, const SSyncMessage* pMsg);
|
|
typedef void (*SyncRaftTickFp)(SSyncRaft* pRaft);
|
|
|
|
struct SSyncRaft {
|
|
// owner sync node
|
|
SSyncNode* pNode;
|
|
|
|
// hash map nodeId -> SNodeInfo*
|
|
SHashObj* nodeInfoMap;
|
|
|
|
SyncNodeId selfId;
|
|
SyncGroupId selfGroupId;
|
|
|
|
SSyncRaftIOMethods io;
|
|
|
|
SSyncFSM fsm;
|
|
SSyncLogStore logStore;
|
|
SStateManager stateManager;
|
|
|
|
union {
|
|
RaftLeaderState leaderState;
|
|
RaftCandidateState candidateState;
|
|
};
|
|
|
|
SyncTerm term;
|
|
SyncNodeId voteFor;
|
|
|
|
SSyncRaftLog *log;
|
|
|
|
uint64_t maxMsgSize;
|
|
uint64_t maxUncommittedSize;
|
|
SSyncRaftProgressTracker *tracker;
|
|
|
|
ESyncState state;
|
|
|
|
// isLearner is true if the local raft node is a learner.
|
|
bool isLearner;
|
|
|
|
/**
|
|
* the leader id
|
|
**/
|
|
SyncNodeId leaderId;
|
|
|
|
/**
|
|
* leadTransferee is id of the leader transfer target when its value is not zero.
|
|
* Follow the procedure defined in raft thesis 3.10.
|
|
**/
|
|
SyncNodeId leadTransferee;
|
|
|
|
/**
|
|
* Only one conf change may be pending (in the log, but not yet
|
|
* applied) at a time. This is enforced via pendingConfIndex, which
|
|
* is set to a value >= the log index of the latest pending
|
|
* configuration change (if any). Config changes are only allowed to
|
|
* be proposed if the leader's applied index is greater than this
|
|
* value.
|
|
**/
|
|
SyncIndex pendingConfigIndex;
|
|
|
|
/**
|
|
* an estimate of the size of the uncommitted tail of the Raft log. Used to
|
|
* prevent unbounded log growth. Only maintained by the leader. Reset on
|
|
* term changes.
|
|
**/
|
|
uint32_t uncommittedSize;
|
|
|
|
/**
|
|
* number of ticks since it reached last electionTimeout when it is leader
|
|
* or candidate.
|
|
* number of ticks since it reached last electionTimeout or received a
|
|
* valid message from current leader when it is a follower.
|
|
**/
|
|
uint16_t electionElapsed;
|
|
|
|
/**
|
|
* number of ticks since it reached last heartbeatTimeout.
|
|
* only leader keeps heartbeatElapsed.
|
|
**/
|
|
uint16_t heartbeatElapsed;
|
|
|
|
bool preVote;
|
|
bool checkQuorum;
|
|
|
|
int heartbeatTimeout;
|
|
int electionTimeout;
|
|
|
|
/**
|
|
* randomizedElectionTimeout is a random number between
|
|
* [electiontimeout, 2 * electiontimeout - 1]. It gets reset
|
|
* when raft changes its state to follower or candidate.
|
|
**/
|
|
int randomizedElectionTimeout;
|
|
bool disableProposalForwarding;
|
|
|
|
// current tick count since start up
|
|
uint32_t currentTick;
|
|
|
|
SyncRaftStepFp stepFp;
|
|
|
|
SyncRaftTickFp tickFp;
|
|
};
|
|
|
|
int32_t syncRaftStart(SSyncRaft* pRaft, const SSyncInfo* pInfo);
|
|
int32_t syncRaftStep(SSyncRaft* pRaft, const SSyncMessage* pMsg);
|
|
int32_t syncRaftTick(SSyncRaft* pRaft);
|
|
|
|
#endif /* _TD_LIBS_SYNC_RAFT_H */ |