syncElection.c 3.7 KB
Newer Older
M
Minghao Li 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

S
Shengliang Guan 已提交
16
#define _DEFAULT_SOURCE
M
Minghao Li 已提交
17
#include "syncElection.h"
18
#include "syncMessage.h"
M
Minghao Li 已提交
19
#include "syncRaftCfg.h"
M
Minghao Li 已提交
20
#include "syncRaftStore.h"
S
Shengliang Guan 已提交
21
#include "syncUtil.h"
22
#include "syncVoteMgr.h"
M
Minghao Li 已提交
23

M
Minghao Li 已提交
24 25 26 27 28 29 30 31 32 33 34
// TLA+ Spec
// RequestVote(i, j) ==
//    /\ state[i] = Candidate
//    /\ j \notin votesResponded[i]
//    /\ Send([mtype         |-> RequestVoteRequest,
//             mterm         |-> currentTerm[i],
//             mlastLogTerm  |-> LastTerm(log[i]),
//             mlastLogIndex |-> Len(log[i]),
//             msource       |-> i,
//             mdest         |-> j])
//    /\ UNCHANGED <<serverVars, candidateVars, leaderVars, logVars>>
M
Minghao Li 已提交
35

S
Shengliang Guan 已提交
36 37 38 39 40 41 42 43
// Send a RequestVote message to each peer of pNode that is not a learner.
//
// Does nothing unless pNode is currently in the candidate state. For every
// eligible peer a request is built, filled with this node's raft id, the
// peer's raft id, the current term and the last log index/term, and then
// sent. A failure at any step is logged and that peer is skipped; the
// remaining peers are still processed.
//
// Returns 0 in all cases; per-peer failures are only reported via the log.
static int32_t syncNodeRequestVotePeers(SSyncNode* pNode) {
  if (pNode->state != TAOS_SYNC_STATE_CANDIDATE) {
    sNTrace(pNode, "not candidate, stop elect");
    return 0;
  }

  for (int peer = 0; peer < pNode->peersNum; ++peer) {
    // Peers with the learner role are not asked for a vote.
    if (pNode->peersNodeInfo[peer].nodeRole == TAOS_SYNC_ROLE_LEARNER) {
      continue;
    }

    SRpcMsg voteMsg = {0};
    int32_t buildCode = syncBuildRequestVote(&voteMsg, pNode->vgId);
    if (buildCode < 0) {
      sError("vgId:%d, failed to build request-vote msg since %s", pNode->vgId, terrstr());
      continue;
    }

    // Fill in the request header fields.
    SyncRequestVote* pReq = voteMsg.pCont;
    pReq->srcId = pNode->myRaftId;
    pReq->destId = pNode->peersId[peer];
    pReq->term = raftStoreGetTerm(pNode);

    int32_t logCode = syncNodeGetLastIndexTerm(pNode, &pReq->lastLogIndex, &pReq->lastLogTerm);
    if (logCode < 0) {
      // NOTE(review): voteMsg.pCont is not released on this path. If
      // syncBuildRequestVote allocates it and ownership stays with the
      // caller until the send, this leaks one message - confirm.
      sError("vgId:%d, failed to get index and term of last log since %s", pNode->vgId, terrstr());
      continue;
    }

    int32_t sendCode = syncNodeSendMsgById(&pNode->peersId[peer], pNode, &voteMsg);
    if (sendCode < 0) {
      sError("vgId:%d, failed to send msg to peerId:%" PRId64, pNode->vgId, pNode->peersId[peer].addr);
    }
  }

  return 0;
}

M
Minghao Li 已提交
73
// Run one election round on pSyncNode.
//
// Steps, in order:
//   1. Log the start and bump the node's election counter.
//   2. If the node is a follower, switch it to candidate.
//   3. Bail out with -1 if the node is not a candidate at this point.
//   4. Advance the stored term, clear the stored vote, reset both vote
//      trackers for the new term and vote for self.
//   5. If the granted votes already form a majority, or the node has a
//      single replica, promote to leader and return 0.
//   6. Otherwise request votes from the peers and reset the election timer.
//
// Returns -1 when the node cannot stand for election, otherwise the result
// of the vote-request step (0 on the leader-promotion paths).
int32_t syncNodeElect(SSyncNode* pSyncNode) {
  sNInfo(pSyncNode, "begin election");
  pSyncNode->electNum++;

  if (pSyncNode->state == TAOS_SYNC_STATE_FOLLOWER) {
    syncNodeFollower2Candidate(pSyncNode);
  }

  // Only a candidate may run an election.
  if (pSyncNode->state != TAOS_SYNC_STATE_CANDIDATE) {
    sNError(pSyncNode, "not candidate, can not elect");
    return -1;
  }

  // Open a new term and start from a clean voting state.
  raftStoreNextTerm(pSyncNode);
  raftStoreClearVote(pSyncNode);

  SyncTerm electTerm = raftStoreGetTerm(pSyncNode);
  voteGrantedReset(pSyncNode->pVotesGranted, electTerm);
  votesRespondReset(pSyncNode->pVotesRespond, electTerm);
  syncNodeVoteForSelf(pSyncNode, electTerm);

  // The self vote may already be enough to win.
  if (voteGrantedMajority(pSyncNode->pVotesGranted)) {
    ASSERT(!pSyncNode->pVotesGranted->toLeader);
    syncNodeCandidate2Leader(pSyncNode);
    pSyncNode->pVotesGranted->toLeader = true;
    return 0;
  }

  // Single-replica group: refresh the trackers and quorum, then lead.
  if (pSyncNode->replicaNum == 1) {
    voteGrantedUpdate(pSyncNode->pVotesGranted, pSyncNode);
    votesRespondUpdate(pSyncNode->pVotesRespond, pSyncNode);

    pSyncNode->quorum = syncUtilQuorum(pSyncNode->raftCfg.cfg.replicaNum);

    syncNodeCandidate2Leader(pSyncNode);
    pSyncNode->pVotesGranted->toLeader = true;
    return 0;
  }

  // Ask the peers for their votes; the helper reports per-peer failures
  // through the log and returns 0, so the assertion guards that contract.
  int32_t ret = syncNodeRequestVotePeers(pSyncNode);
  ASSERT(ret == 0);

  syncNodeResetElectTimer(pSyncNode);
  return ret;
}