mndMnode.c 20.9 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

S
Shengliang Guan 已提交
16
#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17 18 19
#include "mndMnode.h"
#include "mndDnode.h"
#include "mndShow.h"
S
Shengliang Guan 已提交
20
#include "mndTrans.h"
S
Shengliang Guan 已提交
21

S
Shengliang Guan 已提交
22 23
#define TSDB_MNODE_VER_NUMBER 1
#define TSDB_MNODE_RESERVE_SIZE 64
S
Shengliang Guan 已提交
24

S
Shengliang Guan 已提交
25
static int32_t  mndCreateDefaultMnode(SMnode *pMnode);
S
Shengliang Guan 已提交
26
static SSdbRaw *mndMnodeActionEncode(SMnodeObj *pObj);
S
Shengliang Guan 已提交
27
static SSdbRow *mndMnodeActionDecode(SSdbRaw *pRaw);
S
Shengliang Guan 已提交
28 29
static int32_t  mndMnodeActionInsert(SSdb *pSdb, SMnodeObj *pObj);
static int32_t  mndMnodeActionDelete(SSdb *pSdb, SMnodeObj *pObj);
S
Shengliang Guan 已提交
30 31 32 33 34 35
static int32_t  mndMnodeActionUpdate(SSdb *pSdb, SMnodeObj *pOld, SMnodeObj *pNew);
static int32_t  mndProcessCreateMnodeReq(SMnodeMsg *pReq);
static int32_t  mndProcessDropMnodeReq(SMnodeMsg *pReq);
static int32_t  mndProcessCreateMnodeRsp(SMnodeMsg *pRsp);
static int32_t  mndProcessAlterMnodeRsp(SMnodeMsg *pRsp);
static int32_t  mndProcessDropMnodeRsp(SMnodeMsg *pRsp);
S
Shengliang Guan 已提交
36
static int32_t  mndGetMnodeMeta(SMnodeMsg *pReq, SShowObj *pShow, STableMetaRsp *pMeta);
S
Shengliang Guan 已提交
37
static int32_t  mndRetrieveMnodes(SMnodeMsg *pReq, SShowObj *pShow, char *data, int32_t rows);
S
Shengliang Guan 已提交
38
static void     mndCancelGetNextMnode(SMnode *pMnode, void *pIter);
S
Shengliang Guan 已提交
39 40 41 42 43 44 45 46 47 48 49

/*
 * Register everything the mnode object type needs with the management node:
 * the sdb table callbacks, the request/response message handlers and the
 * "show mnodes" handlers.
 *
 * Returns whatever sdbSetTable() returns.
 */
int32_t mndInitMnode(SMnode *pMnode) {
  // sdb callbacks for the SDB_MNODE table, keyed by a 32-bit integer.
  SSdbTable mnodeTable = {0};
  mnodeTable.sdbType = SDB_MNODE;
  mnodeTable.keyType = SDB_KEY_INT32;
  mnodeTable.deployFp = (SdbDeployFp)mndCreateDefaultMnode;
  mnodeTable.encodeFp = (SdbEncodeFp)mndMnodeActionEncode;
  mnodeTable.decodeFp = (SdbDecodeFp)mndMnodeActionDecode;
  mnodeTable.insertFp = (SdbInsertFp)mndMnodeActionInsert;
  mnodeTable.updateFp = (SdbUpdateFp)mndMnodeActionUpdate;
  mnodeTable.deleteFp = (SdbDeleteFp)mndMnodeActionDelete;

  // Requests handled by the mnode itself.
  mndSetMsgHandle(pMnode, TDMT_MND_CREATE_MNODE, mndProcessCreateMnodeReq);
  mndSetMsgHandle(pMnode, TDMT_MND_DROP_MNODE, mndProcessDropMnodeReq);

  // Responses to the dnode actions issued by create/drop transactions.
  mndSetMsgHandle(pMnode, TDMT_DND_CREATE_MNODE_RSP, mndProcessCreateMnodeRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_ALTER_MNODE_RSP, mndProcessAlterMnodeRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_DROP_MNODE_RSP, mndProcessDropMnodeRsp);

  // Handlers backing the TSDB_MGMT_TABLE_MNODE show table.
  mndAddShowMetaHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndGetMnodeMeta);
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndRetrieveMnodes);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndCancelGetNextMnode);

  return sdbSetTable(pMnode->pSdb, mnodeTable);
}

/* Counterpart of mndInitMnode(); currently there is nothing to tear down. */
void mndCleanupMnode(SMnode *pMnode) {
  (void)pMnode;
}

S
Shengliang Guan 已提交
65
/*
 * Look up the mnode object with the given id via sdbAcquire().
 *
 * Returns the object, or NULL on failure. When the lookup failed with
 * TSDB_CODE_SDB_OBJ_NOT_THERE, terrno is rewritten to the mnode-specific
 * TSDB_CODE_MND_MNODE_NOT_EXIST; any other terrno is left as is.
 * A non-NULL result is handed back with mndReleaseMnode().
 */
static SMnodeObj *mndAcquireMnode(SMnode *pMnode, int32_t mnodeId) {
  SMnodeObj *pMnodeObj = sdbAcquire(pMnode->pSdb, SDB_MNODE, &mnodeId);
  if (pMnodeObj != NULL) {
    return pMnodeObj;
  }

  if (terrno == TSDB_CODE_SDB_OBJ_NOT_THERE) {
    terrno = TSDB_CODE_MND_MNODE_NOT_EXIST;
  }
  return NULL;
}

S
Shengliang Guan 已提交
74
/* Hand an mnode object obtained from mndAcquireMnode() back to the sdb. */
static void mndReleaseMnode(SMnode *pMnode, SMnodeObj *pObj) {
  sdbRelease(pMnode->pSdb, pObj);
}

/*
 * Translate a sync state into the role label shown to users.
 *
 *   TAOS_SYNC_STATE_FOLLOWER  -> "unsynced"
 *   TAOS_SYNC_STATE_CANDIDATE -> "slave"
 *   TAOS_SYNC_STATE_LEADER    -> "master"
 *   anything else             -> "undefined"
 *
 * The returned pointer refers to a string literal and must not be modified
 * or freed by the caller.
 */
char *mndGetRoleStr(int32_t showType) {
  if (showType == TAOS_SYNC_STATE_FOLLOWER) {
    return "unsynced";
  }
  if (showType == TAOS_SYNC_STATE_CANDIDATE) {
    return "slave";
  }
  if (showType == TAOS_SYNC_STATE_LEADER) {
    return "master";
  }
  return "undefined";
}

S
Shengliang Guan 已提交
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109
/*
 * Walk every mnode object in the sdb and overwrite its role: the mnode with
 * id 1 becomes TAOS_SYNC_STATE_LEADER, every other one
 * TAOS_SYNC_STATE_CANDIDATE.
 */
void mndUpdateMnodeRole(SMnode *pMnode) {
  SSdb *pSdb = pMnode->pSdb;
  void *pCursor = NULL;

  for (;;) {
    SMnodeObj *pMnodeObj = NULL;
    pCursor = sdbFetch(pSdb, SDB_MNODE, pCursor, (void **)&pMnodeObj);
    if (pCursor == NULL) {
      break;
    }

    pMnodeObj->role = (pMnodeObj->id == 1) ? TAOS_SYNC_STATE_LEADER : TAOS_SYNC_STATE_CANDIDATE;

    // Each fetched object is released once it has been updated.
    sdbRelease(pSdb, pMnodeObj);
  }
}

S
Shengliang Guan 已提交
110 111 112 113 114 115 116 117 118 119
/*
 * Deploy callback of the mnode table: writes the initial mnode record
 * (id 1, created/updated "now", status SDB_STATUS_READY) into the sdb.
 *
 * Returns -1 if the record cannot be encoded, otherwise the result of
 * sdbWrite().
 */
static int32_t mndCreateDefaultMnode(SMnode *pMnode) {
  SMnodeObj firstMnode = {0};
  firstMnode.id = 1;
  firstMnode.createdTime = taosGetTimestampMs();
  firstMnode.updateTime = firstMnode.createdTime;

  SSdbRaw *pEncoded = mndMnodeActionEncode(&firstMnode);
  if (pEncoded == NULL) {
    return -1;
  }

  sdbSetRawStatus(pEncoded, SDB_STATUS_READY);
  mDebug("mnode:%d, will be created while deploy sdb, raw:%p", firstMnode.id, pEncoded);

  return sdbWrite(pMnode->pSdb, pEncoded);
}

S
Shengliang Guan 已提交
124
/*
 * Serialise an mnode object into a freshly allocated raw sdb record.
 *
 * Layout written, in order: id (int32), createdTime (int64),
 * updateTime (int64), then TSDB_MNODE_RESERVE_SIZE reserved bytes.
 *
 * Returns the raw record, or NULL after logging and freeing the partial
 * record when allocation or any field write fails.
 */
static SSdbRaw *mndMnodeActionEncode(SMnodeObj *pObj) {
  int32_t dataPos = 0;

  // terrno stays at this value until every field has been written, so any
  // jump to the label below is treated as a failure.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  SSdbRaw *pRaw = sdbAllocRaw(SDB_MNODE, TSDB_MNODE_VER_NUMBER, sizeof(SMnodeObj) + TSDB_MNODE_RESERVE_SIZE);
  if (pRaw == NULL) goto MNODE_ENCODE_DONE;

  // The SDB_SET_* macros take the failure label as their last argument.
  SDB_SET_INT32(pRaw, dataPos, pObj->id, MNODE_ENCODE_DONE)
  SDB_SET_INT64(pRaw, dataPos, pObj->createdTime, MNODE_ENCODE_DONE)
  SDB_SET_INT64(pRaw, dataPos, pObj->updateTime, MNODE_ENCODE_DONE)
  SDB_SET_RESERVE(pRaw, dataPos, TSDB_MNODE_RESERVE_SIZE, MNODE_ENCODE_DONE)

  terrno = 0;

MNODE_ENCODE_DONE:
  if (terrno == 0) {
    mTrace("mnode:%d, encode to raw:%p, row:%p", pObj->id, pRaw, pObj);
    return pRaw;
  }

  mError("mnode:%d, failed to encode to raw:%p since %s", pObj->id, pRaw, terrstr());
  sdbFreeRaw(pRaw);
  return NULL;
}

/*
 * Decode a raw sdb record into a newly allocated row holding an SMnodeObj.
 *
 * Fields are read in the order mndMnodeActionEncode() writes them: id,
 * createdTime, updateTime, then the reserved area. A record whose software
 * version differs from TSDB_MNODE_VER_NUMBER is rejected with
 * TSDB_CODE_SDB_INVALID_DATA_VER.
 *
 * Returns the row on success. On failure the row (if any) is freed, an error
 * is logged and NULL is returned.
 */
static SSdbRow *mndMnodeActionDecode(SSdbRaw *pRaw) {
  // Initialised up front: the failure path at MNODE_DECODE_OVER can be reached
  // before the row has been allocated, and must not read indeterminate
  // pointers when logging or freeing.
  SSdbRow   *pRow = NULL;
  SMnodeObj *pObj = NULL;
  int32_t    dataPos = 0;
  int8_t     sver = 0;

  // terrno stays non-zero until every field has been decoded, so any jump to
  // the label below is treated as a failure.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  if (sdbGetRawSoftVer(pRaw, &sver) != 0) return NULL;

  if (sver != TSDB_MNODE_VER_NUMBER) {
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
    goto MNODE_DECODE_OVER;
  }

  pRow = sdbAllocRow(sizeof(SMnodeObj));
  if (pRow == NULL) goto MNODE_DECODE_OVER;

  pObj = sdbGetRowObj(pRow);
  if (pObj == NULL) goto MNODE_DECODE_OVER;

  SDB_GET_INT32(pRaw, dataPos, &pObj->id, MNODE_DECODE_OVER)
  SDB_GET_INT64(pRaw, dataPos, &pObj->createdTime, MNODE_DECODE_OVER)
  SDB_GET_INT64(pRaw, dataPos, &pObj->updateTime, MNODE_DECODE_OVER)
  SDB_GET_RESERVE(pRaw, dataPos, TSDB_MNODE_RESERVE_SIZE, MNODE_DECODE_OVER)

  terrno = 0;

MNODE_DECODE_OVER:
  if (terrno != 0) {
    // pObj is still NULL when the failure happened before the row existed.
    mError("mnode:%d, failed to decode from raw:%p since %s", pObj != NULL ? pObj->id : 0, pRaw, terrstr());
    tfree(pRow);
    return NULL;
  }

  mTrace("mnode:%d, decode from raw:%p, row:%p", pObj->id, pRaw, pObj);
  return pRow;
}

S
Shengliang Guan 已提交
185
/* Put an mnode object into its initial role, TAOS_SYNC_STATE_FOLLOWER. */
static void mnodeResetMnode(SMnodeObj *pObj) {
  pObj->role = TAOS_SYNC_STATE_FOLLOWER;
}
S
Shengliang Guan 已提交
186

S
Shengliang Guan 已提交
187
/*
 * Insert callback of the mnode table.
 *
 * Acquires the dnode whose id equals the mnode id and stores it in
 * pObj->pDnode, then resets the mnode role. The dnode stays held until
 * mndMnodeActionDelete() releases it.
 *
 * Returns 0 on success; -1 with terrno = TSDB_CODE_MND_DNODE_NOT_EXIST when
 * the dnode cannot be acquired.
 */
static int32_t mndMnodeActionInsert(SSdb *pSdb, SMnodeObj *pObj) {
  mTrace("mnode:%d, perform insert action, row:%p", pObj->id, pObj);

  pObj->pDnode = sdbAcquire(pSdb, SDB_DNODE, &pObj->id);
  if (pObj->pDnode != NULL) {
    mnodeResetMnode(pObj);
    return 0;
  }

  terrno = TSDB_CODE_MND_DNODE_NOT_EXIST;
  mError("mnode:%d, failed to perform insert action since %s", pObj->id, terrstr());
  return -1;
}

S
Shengliang Guan 已提交
200
/*
 * Delete callback of the mnode table: releases the dnode stored in
 * pObj->pDnode (if any) and clears the pointer. Always returns 0.
 */
static int32_t mndMnodeActionDelete(SSdb *pSdb, SMnodeObj *pObj) {
  mTrace("mnode:%d, perform delete action, row:%p", pObj->id, pObj);

  if (pObj->pDnode == NULL) {
    return 0;
  }

  sdbRelease(pSdb, pObj->pDnode);
  pObj->pDnode = NULL;
  return 0;
}

S
Shengliang Guan 已提交
210
/*
 * Update callback of the mnode table: only updateTime is carried over from
 * the new row into the existing one. Always returns 0.
 */
static int32_t mndMnodeActionUpdate(SSdb *pSdb, SMnodeObj *pOld, SMnodeObj *pNew) {
  mTrace("mnode:%d, perform update action, old row:%p new row:%p", pOld->id, pOld, pNew);

  pOld->updateTime = pNew->updateTime;

  return 0;
}

/*
 * Report whether an mnode object keyed by dnodeId can be acquired from the
 * sdb. The object is released again before returning.
 */
bool mndIsMnode(SMnode *pMnode, int32_t dnodeId) {
  SSdb      *pSdb = pMnode->pSdb;
  SMnodeObj *pMnodeObj = sdbAcquire(pSdb, SDB_MNODE, &dnodeId);
  bool       exists = (pMnodeObj != NULL);

  if (exists) {
    sdbRelease(pSdb, pMnodeObj);
  }
  return exists;
}

S
Shengliang Guan 已提交
228 229 230 231 232 233 234
/*
 * Fill pEpSet with one endpoint (fqdn + port passed through htons) per mnode
 * found in the sdb.
 *
 * numOfEps is reset to 0 first and then counts the endpoints written. inUse
 * is set to the index of the mnode whose role is TAOS_SYNC_STATE_LEADER; it
 * is not touched when no such mnode is seen.
 *
 * Iteration stops early at the first mnode without an attached dnode.
 */
void mndGetMnodeEpSet(SMnode *pMnode, SEpSet *pEpSet) {
  SSdb *pSdb = pMnode->pSdb;

  pEpSet->numOfEps = 0;

  void *pIter = NULL;
  while (1) {
    SMnodeObj *pObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pObj);
    if (pIter == NULL) break;

    if (pObj->pDnode == NULL) {
      // Leaving the loop early: cancel the iterator and release the fetched
      // object, as the other early exits from sdbFetch loops in this file do.
      sdbCancelFetch(pSdb, pIter);
      sdbRelease(pSdb, pObj);
      break;
    }

    pEpSet->eps[pEpSet->numOfEps].port = htons(pObj->pDnode->port);
    memcpy(pEpSet->eps[pEpSet->numOfEps].fqdn, pObj->pDnode->fqdn, TSDB_FQDN_LEN);

    if (pObj->role == TAOS_SYNC_STATE_LEADER) {
      pEpSet->inUse = pEpSet->numOfEps;
    }

    pEpSet->numOfEps++;
    sdbRelease(pSdb, pObj);
  }
}

251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274
/*
 * Encode pObj, append it to the transaction's redo log and mark the raw
 * record SDB_STATUS_CREATING. Returns 0 on success, -1 if any step fails.
 */
static int32_t mndSetCreateMnodeRedoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);

  // Short-circuit evaluation keeps the steps in order and stops at the first failure.
  if (pRaw == NULL || mndTransAppendRedolog(pTrans, pRaw) != 0 ||
      sdbSetRawStatus(pRaw, SDB_STATUS_CREATING) != 0) {
    return -1;
  }
  return 0;
}

/*
 * Encode pObj, append it to the transaction's undo log and mark the raw
 * record SDB_STATUS_DROPPED. Returns 0 on success, -1 if any step fails.
 */
static int32_t mndSetCreateMnodeUndoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);

  // Short-circuit evaluation keeps the steps in order and stops at the first failure.
  if (pRaw == NULL || mndTransAppendUndolog(pTrans, pRaw) != 0 ||
      sdbSetRawStatus(pRaw, SDB_STATUS_DROPPED) != 0) {
    return -1;
  }
  return 0;
}

/*
 * Encode pObj, append it to the transaction's commit log and mark the raw
 * record SDB_STATUS_READY. Returns 0 on success, -1 if any step fails.
 */
static int32_t mndSetCreateMnodeCommitLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);

  // Short-circuit evaluation keeps the steps in order and stops at the first failure.
  if (pRaw == NULL || mndTransAppendCommitlog(pTrans, pRaw) != 0 ||
      sdbSetRawStatus(pRaw, SDB_STATUS_READY) != 0) {
    return -1;
  }
  return 0;
}

S
Shengliang Guan 已提交
275 276 277 278
/*
 * Append the redo actions of a "create mnode" transaction.
 *
 * Steps:
 *   1. Build the replica list from every mnode currently in the sdb plus the
 *      dnode that is about to host the new mnode.
 *   2. For each existing mnode, append a TDMT_DND_ALTER_MNODE action carrying
 *      that list, addressed to the mnode's dnode.
 *   3. Append a TDMT_DND_CREATE_MNODE action addressed to pDnode.
 *
 * Ids and ports are stored via htonl/htons. Each request buffer is
 * heap-allocated and attached to the action as pCont; this function frees it
 * only when mndTransAppendRedoAction() fails.
 *
 * Returns 0 on success, -1 on failure (terrno is TSDB_CODE_OUT_OF_MEMORY when
 * an allocation failed).
 */
static int32_t mndSetCreateMnodeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb   *pSdb = pMnode->pSdb;
  void   *pIter = NULL;
  int32_t numOfReplicas = 0;

  SDCreateMnodeReq createReq = {0};

  // Step 1a: existing mnodes.
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    SReplica *pReplica = &createReq.replicas[numOfReplicas];
    pReplica->id = htonl(pMObj->id);
    pReplica->port = htons(pMObj->pDnode->port);
    memcpy(pReplica->fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
    numOfReplicas++;

    sdbRelease(pSdb, pMObj);
  }

  // Step 1b: the dnode that will host the new mnode.
  SReplica *pReplica = &createReq.replicas[numOfReplicas];
  pReplica->id = htonl(pDnode->id);
  pReplica->port = htons(pDnode->port);
  memcpy(pReplica->fqdn, pDnode->fqdn, TSDB_FQDN_LEN);
  numOfReplicas++;

  createReq.replica = numOfReplicas;

  // Step 2: one alter action per existing mnode. pIter is NULL again here
  // because the first loop only ends once sdbFetch() returned NULL.
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    STransAction action = {0};

    SDAlterMnodeReq *pReq = malloc(sizeof(SDAlterMnodeReq));
    if (pReq == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      sdbCancelFetch(pSdb, pIter);
      sdbRelease(pSdb, pMObj);
      return -1;
    }
    memcpy(pReq, &createReq, sizeof(SDAlterMnodeReq));

    pReq->dnodeId = htonl(pMObj->id);
    action.epSet = mndGetDnodeEpset(pMObj->pDnode);
    action.pCont = pReq;
    action.contLen = sizeof(SDAlterMnodeReq);
    action.msgType = TDMT_DND_ALTER_MNODE;
    action.acceptableCode = TSDB_CODE_DND_MNODE_ALREADY_DEPLOYED;

    if (mndTransAppendRedoAction(pTrans, &action) != 0) {
      free(pReq);
      sdbCancelFetch(pSdb, pIter);
      sdbRelease(pSdb, pMObj);
      return -1;
    }

    sdbRelease(pSdb, pMObj);
  }

  // Step 3: the create action for the new mnode's dnode.
  {
    STransAction action = {0};

    SDCreateMnodeReq *pReq = malloc(sizeof(SDCreateMnodeReq));
    if (pReq == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    // Source and destination are both SDCreateMnodeReq, so copy exactly that size.
    memcpy(pReq, &createReq, sizeof(SDCreateMnodeReq));
    pReq->dnodeId = htonl(pObj->id);

    action.epSet = mndGetDnodeEpset(pDnode);
    action.pCont = pReq;
    action.contLen = sizeof(SDCreateMnodeReq);
    action.msgType = TDMT_DND_CREATE_MNODE;
    action.acceptableCode = TSDB_CODE_DND_MNODE_ALREADY_DEPLOYED;
    if (mndTransAppendRedoAction(pTrans, &action) != 0) {
      free(pReq);
      return -1;
    }
  }

  return 0;
}

S
Shengliang Guan 已提交
358
/*
 * Build and prepare the transaction that creates an mnode on pDnode.
 *
 * The new mnode object takes the dnode's id and "now" as both created and
 * updated time. The transaction gets redo logs, commit logs and redo actions
 * before mndTransPrepare() is called. mndTransDrop() is always called on the
 * way out, including when mndTransCreate() returned NULL.
 *
 * Returns 0 when every step succeeded, -1 otherwise.
 */
static int32_t mndCreateMnode(SMnode *pMnode, SMnodeMsg *pReq, SDnodeObj *pDnode, SMCreateMnodeReq *pCreate) {
  int32_t code = -1;

  SMnodeObj newMnode = {0};
  newMnode.id = pDnode->id;
  newMnode.createdTime = taosGetTimestampMs();
  newMnode.updateTime = newMnode.createdTime;

  STrans *pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, &pReq->rpcMsg);
  if (pTrans != NULL) {
    mDebug("trans:%d, used to create mnode:%d", pTrans->id, pCreate->dnodeId);

    // Steps run in order; the first failure skips the rest.
    if (mndSetCreateMnodeRedoLogs(pMnode, pTrans, &newMnode) == 0 &&
        mndSetCreateMnodeCommitLogs(pMnode, pTrans, &newMnode) == 0 &&
        mndSetCreateMnodeRedoActions(pMnode, pTrans, pDnode, &newMnode) == 0 &&
        mndTransPrepare(pMnode, pTrans) == 0) {
      code = 0;
    }
  }

  mndTransDrop(pTrans);
  return code;
}

S
Shengliang Guan 已提交
383 384 385
/*
 * Handler for TDMT_MND_CREATE_MNODE.
 *
 * Rejects the request when an mnode with the requested id already exists
 * (TSDB_CODE_MND_MNODE_ALREADY_EXIST), when the lookup failed for any reason
 * other than "not exist", or when the target dnode does not exist
 * (TSDB_CODE_MND_DNODE_NOT_EXIST). Otherwise starts the create transaction.
 *
 * Returns TSDB_CODE_MND_ACTION_IN_PROGRESS once the transaction has been
 * prepared, -1 on failure.
 */
static int32_t mndProcessCreateMnodeReq(SMnodeMsg *pReq) {
  SMnode           *pMnode = pReq->pMnode;
  SMCreateMnodeReq *pCreate = pReq->rpcMsg.pCont;

  // The id is byte-swapped in place; everything below uses the converted value.
  pCreate->dnodeId = htonl(pCreate->dnodeId);

  mDebug("mnode:%d, start to create", pCreate->dnodeId);

  SMnodeObj *pObj = mndAcquireMnode(pMnode, pCreate->dnodeId);
  if (pObj != NULL) {
    // Log before releasing: pObj must not be read once it has been released.
    mError("mnode:%d, mnode already exist", pObj->id);
    mndReleaseMnode(pMnode, pObj);
    terrno = TSDB_CODE_MND_MNODE_ALREADY_EXIST;
    return -1;
  } else if (terrno != TSDB_CODE_MND_MNODE_NOT_EXIST) {
    mError("mnode:%d, failed to create mnode since %s", pCreate->dnodeId, terrstr());
    return -1;
  }

  SDnodeObj *pDnode = mndAcquireDnode(pMnode, pCreate->dnodeId);
  if (pDnode == NULL) {
    mError("mnode:%d, dnode not exist", pCreate->dnodeId);
    terrno = TSDB_CODE_MND_DNODE_NOT_EXIST;
    return -1;
  }

  int32_t code = mndCreateMnode(pMnode, pReq, pDnode, pCreate);
  mndReleaseDnode(pMnode, pDnode);

  if (code != 0) {
    mError("mnode:%d, failed to create since %s", pCreate->dnodeId, terrstr());
    return -1;
  }

  return TSDB_CODE_MND_ACTION_IN_PROGRESS;
}

420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435
/*
 * Encode pObj, append it to the transaction's redo log and mark the raw
 * record SDB_STATUS_DROPPING. Returns 0 on success, -1 if any step fails.
 */
static int32_t mndSetDropMnodeRedoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);

  // Short-circuit evaluation keeps the steps in order and stops at the first failure.
  if (pRaw == NULL || mndTransAppendRedolog(pTrans, pRaw) != 0 ||
      sdbSetRawStatus(pRaw, SDB_STATUS_DROPPING) != 0) {
    return -1;
  }
  return 0;
}

/*
 * Encode pObj, append it to the transaction's commit log and mark the raw
 * record SDB_STATUS_DROPPED. Returns 0 on success, -1 if any step fails.
 */
static int32_t mndSetDropMnodeCommitLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);

  // Short-circuit evaluation keeps the steps in order and stops at the first failure.
  if (pRaw == NULL || mndTransAppendCommitlog(pTrans, pRaw) != 0 ||
      sdbSetRawStatus(pRaw, SDB_STATUS_DROPPED) != 0) {
    return -1;
  }
  return 0;
}

S
Shengliang Guan 已提交
436 437 438 439
/*
 * Append the redo actions of a "drop mnode" transaction.
 *
 * Steps:
 *   1. Build the replica list from every mnode in the sdb except pObj.
 *   2. For each of those remaining mnodes, append a TDMT_DND_ALTER_MNODE
 *      action carrying that list, addressed to the mnode's dnode.
 *   3. Append a TDMT_DND_DROP_MNODE action addressed to pDnode.
 *
 * Ids and ports are stored via htonl/htons. Each request buffer is
 * heap-allocated and attached to the action as pCont; this function frees it
 * only when mndTransAppendRedoAction() fails.
 *
 * Returns 0 on success, -1 on failure (terrno is TSDB_CODE_OUT_OF_MEMORY when
 * an allocation failed).
 */
static int32_t mndSetDropMnodeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb   *pSdb = pMnode->pSdb;
  void   *pIter = NULL;
  int32_t numOfReplicas = 0;

  SDAlterMnodeReq alterReq = {0};

  // Step 1: every mnode other than the one being dropped.
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    if (pMObj->id != pObj->id) {
      SReplica *pReplica = &alterReq.replicas[numOfReplicas];
      pReplica->id = htonl(pMObj->id);
      pReplica->port = htons(pMObj->pDnode->port);
      memcpy(pReplica->fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
      numOfReplicas++;
    }

    sdbRelease(pSdb, pMObj);
  }

  alterReq.replica = numOfReplicas;

  // Step 2: one alter action per remaining mnode. pIter is NULL again here
  // because the first loop only ends once sdbFetch() returned NULL.
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;
    if (pMObj->id != pObj->id) {
      STransAction action = {0};

      SDAlterMnodeReq *pReq = malloc(sizeof(SDAlterMnodeReq));
      if (pReq == NULL) {
        terrno = TSDB_CODE_OUT_OF_MEMORY;
        sdbCancelFetch(pSdb, pIter);
        sdbRelease(pSdb, pMObj);
        return -1;
      }
      memcpy(pReq, &alterReq, sizeof(SDAlterMnodeReq));

      pReq->dnodeId = htonl(pMObj->id);
      action.epSet = mndGetDnodeEpset(pMObj->pDnode);
      action.pCont = pReq;
      action.contLen = sizeof(SDAlterMnodeReq);
      action.msgType = TDMT_DND_ALTER_MNODE;
      action.acceptableCode = TSDB_CODE_DND_MNODE_ALREADY_DEPLOYED;

      if (mndTransAppendRedoAction(pTrans, &action) != 0) {
        free(pReq);
        sdbCancelFetch(pSdb, pIter);
        sdbRelease(pSdb, pMObj);
        return -1;
      }
    }

    sdbRelease(pSdb, pMObj);
  }

  // Step 3: the drop action for the dnode hosting the mnode being removed.
  {
    STransAction action = {0};

    SDDropMnodeReq *pReq = malloc(sizeof(SDDropMnodeReq));
    if (pReq == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    pReq->dnodeId = htonl(pObj->id);

    action.epSet = mndGetDnodeEpset(pDnode);
    action.pCont = pReq;
    action.contLen = sizeof(SDDropMnodeReq);
    action.msgType = TDMT_DND_DROP_MNODE;
    action.acceptableCode = TSDB_CODE_DND_MNODE_NOT_DEPLOYED;
    if (mndTransAppendRedoAction(pTrans, &action) != 0) {
      free(pReq);
      return -1;
    }
  }

  return 0;
}

S
Shengliang Guan 已提交
518
/*
 * Build and prepare the transaction that drops the mnode pObj.
 *
 * The transaction gets redo logs, commit logs and redo actions (addressed
 * through pObj->pDnode) before mndTransPrepare() is called. mndTransDrop()
 * is always called on the way out, including when mndTransCreate() returned
 * NULL.
 *
 * Returns 0 when every step succeeded, -1 otherwise.
 */
static int32_t mndDropMnode(SMnode *pMnode, SMnodeMsg *pReq, SMnodeObj *pObj) {
  int32_t result = -1;

  STrans *pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, &pReq->rpcMsg);
  if (pTrans != NULL) {
    mDebug("trans:%d, used to drop mnode:%d", pTrans->id, pObj->id);

    // Steps run in order; the first failure skips the rest.
    if (mndSetDropMnodeRedoLogs(pMnode, pTrans, pObj) == 0 &&
        mndSetDropMnodeCommitLogs(pMnode, pTrans, pObj) == 0 &&
        mndSetDropMnodeRedoActions(pMnode, pTrans, pObj->pDnode, pObj) == 0 &&
        mndTransPrepare(pMnode, pTrans) == 0) {
      result = 0;
    }
  }

  mndTransDrop(pTrans);
  return result;
}

S
Shengliang Guan 已提交
538 539 540
/*
 * Handler for TDMT_MND_DROP_MNODE.
 *
 * Rejects non-positive ids with TSDB_CODE_SDB_APP_ERROR and unknown mnodes
 * with the terrno left by mndAcquireMnode(). Otherwise starts the drop
 * transaction. The acquired mnode object is released on every path after a
 * successful acquire.
 *
 * Returns TSDB_CODE_MND_ACTION_IN_PROGRESS once the transaction has been
 * prepared, -1 on failure.
 */
static int32_t mndProcessDropMnodeReq(SMnodeMsg *pReq) {
  SMnode         *pMnode = pReq->pMnode;
  SMDropMnodeReq *pDrop = pReq->rpcMsg.pCont;

  // The id is byte-swapped in place; everything below uses the converted value.
  pDrop->dnodeId = htonl(pDrop->dnodeId);

  mDebug("mnode:%d, start to drop", pDrop->dnodeId);

  if (pDrop->dnodeId <= 0) {
    terrno = TSDB_CODE_SDB_APP_ERROR;
    mError("mnode:%d, failed to drop since %s", pDrop->dnodeId, terrstr());
    return -1;
  }

  SMnodeObj *pObj = mndAcquireMnode(pMnode, pDrop->dnodeId);
  if (pObj == NULL) {
    mError("mnode:%d, not exist", pDrop->dnodeId);
    return -1;
  }

  int32_t code = mndDropMnode(pMnode, pReq, pObj);

  // Release on both the success and the failure path.
  sdbRelease(pMnode->pSdb, pObj);

  if (code != 0) {
    // Report the id of the mnode that was to be dropped, like the other
    // messages in this handler.
    mError("mnode:%d, failed to drop since %s", pDrop->dnodeId, terrstr());
    return -1;
  }

  return TSDB_CODE_MND_ACTION_IN_PROGRESS;
}

S
Shengliang Guan 已提交
567 568
/*
 * Handler for TDMT_DND_CREATE_MNODE_RSP: forwards the response to the
 * transaction layer. Always returns 0.
 */
static int32_t mndProcessCreateMnodeRsp(SMnodeMsg *pRsp) {
  mndTransProcessRsp(pRsp);

  return 0;
}

S
Shengliang Guan 已提交
572 573
/*
 * Handler for TDMT_DND_ALTER_MNODE_RSP: forwards the response to the
 * transaction layer. Always returns 0.
 */
static int32_t mndProcessAlterMnodeRsp(SMnodeMsg *pRsp) {
  mndTransProcessRsp(pRsp);

  return 0;
}
S
Shengliang Guan 已提交
576

S
Shengliang Guan 已提交
577 578
/*
 * Handler for TDMT_DND_DROP_MNODE_RSP: forwards the response to the
 * transaction layer. Always returns 0.
 */
static int32_t mndProcessDropMnodeRsp(SMnodeMsg *pRsp) {
  mndTransProcessRsp(pRsp);

  return 0;
}
S
Shengliang Guan 已提交
581

S
Shengliang Guan 已提交
582
/*
 * Meta handler of the "show mnodes" table.
 *
 * Describes five columns (id, endpoint, role, role_time, create_time) in
 * pMeta->pSchema and records their widths in pShow->bytes. Values placed in
 * pMeta are passed through htonl; values in pShow are stored as is. Then
 * derives the per-column offsets and the row size, stores the current number
 * of mnode rows, copies the show-table name into pMeta->tbFname and finally
 * refreshes the mnode roles.
 *
 * Always returns 0.
 */
static int32_t mndGetMnodeMeta(SMnodeMsg *pReq, SShowObj *pShow, STableMetaRsp *pMeta) {
  SMnode  *pMnode = pReq->pMnode;
  SSchema *pSchema = pMeta->pSchema;
  int32_t  cols = 0;

  // Column: id
  strcpy(pSchema[cols].name, "id");
  pSchema[cols].type = TSDB_DATA_TYPE_SMALLINT;
  pShow->bytes[cols] = 2;
  pSchema[cols].bytes = htonl(pShow->bytes[cols]);
  cols++;

  // Column: endpoint (variable-length string with header)
  strcpy(pSchema[cols].name, "endpoint");
  pSchema[cols].type = TSDB_DATA_TYPE_BINARY;
  pShow->bytes[cols] = TSDB_EP_LEN + VARSTR_HEADER_SIZE;
  pSchema[cols].bytes = htonl(pShow->bytes[cols]);
  cols++;

  // Column: role (variable-length string with header)
  strcpy(pSchema[cols].name, "role");
  pSchema[cols].type = TSDB_DATA_TYPE_BINARY;
  pShow->bytes[cols] = 12 + VARSTR_HEADER_SIZE;
  pSchema[cols].bytes = htonl(pShow->bytes[cols]);
  cols++;

  // Column: role_time
  strcpy(pSchema[cols].name, "role_time");
  pSchema[cols].type = TSDB_DATA_TYPE_TIMESTAMP;
  pShow->bytes[cols] = 8;
  pSchema[cols].bytes = htonl(pShow->bytes[cols]);
  cols++;

  // Column: create_time
  strcpy(pSchema[cols].name, "create_time");
  pSchema[cols].type = TSDB_DATA_TYPE_TIMESTAMP;
  pShow->bytes[cols] = 8;
  pSchema[cols].bytes = htonl(pShow->bytes[cols]);
  cols++;

  pShow->numOfColumns = cols;
  pMeta->numOfColumns = htonl(cols);

  // Each column starts where the previous one ends.
  pShow->offset[0] = 0;
  for (int32_t i = 1; i < cols; ++i) {
    pShow->offset[i] = pShow->offset[i - 1] + pShow->bytes[i - 1];
  }

  const int32_t lastCol = cols - 1;
  pShow->numOfRows = sdbGetSize(pMnode->pSdb, SDB_MNODE);
  pShow->rowSize = pShow->offset[lastCol] + pShow->bytes[lastCol];
  strcpy(pMeta->tbFname, mndShowStr(pShow->type));

  mndUpdateMnodeRole(pMnode);
  return 0;
}

S
Shengliang Guan 已提交
635 636
/*
 * Retrieve handler of the "show mnodes" table.
 *
 * Fetches up to `rows` mnode objects, continuing from pShow->pIter, and
 * writes one row per object into `data`. The buffer is laid out column by
 * column: the cell of column c in row r lives at
 * data + offset[c] * rows + bytes[c] * r. Columns written, in order: id
 * (int16), dnode endpoint, role label, roleTime, createdTime.
 *
 * Afterwards mndVacuumResult() is called with the number of rows actually
 * produced, and pShow->numOfReads is advanced by that number.
 *
 * Returns the number of rows written.
 */
static int32_t mndRetrieveMnodes(SMnodeMsg *pReq, SShowObj *pShow, char *data, int32_t rows) {
  SMnode    *pMnode = pReq->pMnode;
  SSdb      *pSdb = pMnode->pSdb;
  SMnodeObj *pObj = NULL;
  int32_t    numOfRows = 0;

  while (numOfRows < rows) {
    pShow->pIter = sdbFetch(pSdb, SDB_MNODE, pShow->pIter, (void **)&pObj);
    if (pShow->pIter == NULL) break;

    int32_t col = 0;
    char   *pCell = NULL;

    // id
    pCell = data + pShow->offset[col] * rows + pShow->bytes[col] * numOfRows;
    *(int16_t *)pCell = pObj->id;
    col++;

    // endpoint
    pCell = data + pShow->offset[col] * rows + pShow->bytes[col] * numOfRows;
    STR_WITH_MAXSIZE_TO_VARSTR(pCell, pObj->pDnode->ep, pShow->bytes[col]);
    col++;

    // role
    pCell = data + pShow->offset[col] * rows + pShow->bytes[col] * numOfRows;
    char *roleLabel = mndGetRoleStr(pObj->role);
    STR_WITH_MAXSIZE_TO_VARSTR(pCell, roleLabel, pShow->bytes[col]);
    col++;

    // role_time
    pCell = data + pShow->offset[col] * rows + pShow->bytes[col] * numOfRows;
    *(int64_t *)pCell = pObj->roleTime;
    col++;

    // create_time
    pCell = data + pShow->offset[col] * rows + pShow->bytes[col] * numOfRows;
    *(int64_t *)pCell = pObj->createdTime;
    col++;

    numOfRows++;
    sdbRelease(pSdb, pObj);
  }

  mndVacuumResult(data, pShow->numOfColumns, numOfRows, rows, pShow);
  pShow->numOfReads += numOfRows;

  return numOfRows;
}

/* Free-iterator handler of the "show mnodes" table: cancels an sdb fetch in progress. */
static void mndCancelGetNextMnode(SMnode *pMnode, void *pIter) {
  sdbCancelFetch(pMnode->pSdb, pIter);
}