syncElection.c 3.6 KB
Newer Older
M
Minghao Li 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

S
Shengliang Guan 已提交
16
#define _DEFAULT_SOURCE
M
Minghao Li 已提交
17
#include "syncElection.h"
18
#include "syncMessage.h"
M
Minghao Li 已提交
19
#include "syncRaftCfg.h"
M
Minghao Li 已提交
20
#include "syncRaftStore.h"
S
Shengliang Guan 已提交
21
#include "syncUtil.h"
22
#include "syncVoteMgr.h"
M
Minghao Li 已提交
23

// TLA+ Spec
// RequestVote(i, j) ==
//    /\ state[i] = Candidate
//    /\ j \notin votesResponded[i]
//    /\ Send([mtype         |-> RequestVoteRequest,
//             mterm         |-> currentTerm[i],
//             mlastLogTerm  |-> LastTerm(log[i]),
//             mlastLogIndex |-> Len(log[i]),
//             msource       |-> i,
//             mdest         |-> j])
//    /\ UNCHANGED <<serverVars, candidateVars, leaderVars, logVars>>

S
Shengliang Guan 已提交
36 37 38 39 40 41 42 43 44 45
/*
 * Build and send one request-vote message to each entry of pNode->peersId.
 *
 * Nothing is sent unless pNode is currently in candidate state. A failure
 * while building, filling in, or sending the message for one peer is logged
 * and that peer is skipped; the remaining peers are still processed.
 *
 * Returns 0 in every case (per-peer failures are not propagated).
 */
static int32_t syncNodeRequestVotePeers(SSyncNode* pNode) {
  if (pNode->state != TAOS_SYNC_STATE_CANDIDATE) {
    sNTrace(pNode, "not candidate, stop elect");
    return 0;
  }

  int32_t code = 0;
  for (int peer = 0; peer < pNode->peersNum; peer++) {
    SRpcMsg voteMsg = {0};

    code = syncBuildRequestVote(&voteMsg, pNode->vgId);
    if (code < 0) {
      sError("vgId:%d, failed to build request-vote msg since %s", pNode->vgId, terrstr());
      continue;
    }

    // Fill in the request: sender, receiver and the candidate's current term.
    SyncRequestVote* pReq = voteMsg.pCont;
    pReq->srcId = pNode->myRaftId;
    pReq->destId = pNode->peersId[peer];
    pReq->term = raftStoreGetTerm(pNode);

    // The request also carries the index and term of the candidate's last log entry.
    code = syncNodeGetLastIndexTerm(pNode, &pReq->lastLogIndex, &pReq->lastLogTerm);
    if (code < 0) {
      // NOTE(review): voteMsg.pCont is not released on this path — confirm who
      // owns the buffer produced by syncBuildRequestVote.
      sError("vgId:%d, failed to get index and term of last log since %s", pNode->vgId, terrstr());
      continue;
    }

    code = syncNodeSendMsgById(&pNode->peersId[peer], pNode, &voteMsg);
    if (code < 0) {
      sError("vgId:%d, failed to send msg to peerId:%" PRId64, pNode->vgId, pNode->peersId[peer].addr);
    }
  }

  return 0;
}

M
Minghao Li 已提交
71
/*
 * Start a new election round on pSyncNode.
 *
 * Steps, in order:
 *   1. Count the attempt (electNum) and, if the node is a follower, switch it
 *      to candidate.
 *   2. Bail out with -1 if the node is not a candidate at that point.
 *   3. Advance the term, clear the stored vote, reset the granted/responded
 *      vote trackers for the new term and vote for itself.
 *   4. If the self vote already forms a majority, or replicaNum is 1, become
 *      leader immediately and return 0.
 *   5. Otherwise request votes from the peers and reset the election timer.
 *
 * Returns 0 on the become-leader paths, -1 when the node is not a candidate,
 * and otherwise the result of syncNodeRequestVotePeers().
 */
int32_t syncNodeElect(SSyncNode* pSyncNode) {
  sNInfo(pSyncNode, "begin election");
  pSyncNode->electNum++;

  if (pSyncNode->state == TAOS_SYNC_STATE_FOLLOWER) {
    syncNodeFollower2Candidate(pSyncNode);
  }

  if (pSyncNode->state != TAOS_SYNC_STATE_CANDIDATE) {
    sNError(pSyncNode, "not candidate, can not elect");
    return -1;
  }

  // Open a new term and forget any vote stored for the previous one.
  raftStoreNextTerm(pSyncNode);
  raftStoreClearVote(pSyncNode);

  // Restart vote bookkeeping for the new term, then cast our own vote.
  SyncTerm electTerm = raftStoreGetTerm(pSyncNode);
  voteGrantedReset(pSyncNode->pVotesGranted, electTerm);
  votesRespondReset(pSyncNode->pVotesRespond, electTerm);
  syncNodeVoteForSelf(pSyncNode, electTerm);

  if (voteGrantedMajority(pSyncNode->pVotesGranted)) {
    // The self vote alone is a majority: promote without contacting peers.
    ASSERT(!pSyncNode->pVotesGranted->toLeader);
    syncNodeCandidate2Leader(pSyncNode);
    pSyncNode->pVotesGranted->toLeader = true;
    return 0;
  }

  if (pSyncNode->replicaNum == 1) {
    // Single replica: refresh the vote trackers and quorum, then promote.
    voteGrantedUpdate(pSyncNode->pVotesGranted, pSyncNode);
    votesRespondUpdate(pSyncNode->pVotesRespond, pSyncNode);

    pSyncNode->quorum = syncUtilQuorum(pSyncNode->raftCfg.cfg.replicaNum);

    syncNodeCandidate2Leader(pSyncNode);
    pSyncNode->pVotesGranted->toLeader = true;
    return 0;
  }

  // Ask the peers for their votes and reset the election timer for this round.
  int32_t code = syncNodeRequestVotePeers(pSyncNode);
  ASSERT(code == 0);

  syncNodeResetElectTimer(pSyncNode);
  return code;
}