mndMnode.c 21.5 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

S
Shengliang Guan 已提交
16
#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17
#include "mndMnode.h"
S
Shengliang Guan 已提交
18
#include "mndAuth.h"
S
Shengliang Guan 已提交
19 20
#include "mndDnode.h"
#include "mndShow.h"
S
Shengliang Guan 已提交
21
#include "mndTrans.h"
S
Shengliang Guan 已提交
22
#include "mndUser.h"
S
Shengliang Guan 已提交
23

S
Shengliang Guan 已提交
24 25
#define TSDB_MNODE_VER_NUMBER 1
#define TSDB_MNODE_RESERVE_SIZE 64
S
Shengliang Guan 已提交
26

S
Shengliang Guan 已提交
27
static int32_t  mndCreateDefaultMnode(SMnode *pMnode);
S
Shengliang Guan 已提交
28
static SSdbRaw *mndMnodeActionEncode(SMnodeObj *pObj);
S
Shengliang Guan 已提交
29
static SSdbRow *mndMnodeActionDecode(SSdbRaw *pRaw);
S
Shengliang Guan 已提交
30 31
static int32_t  mndMnodeActionInsert(SSdb *pSdb, SMnodeObj *pObj);
static int32_t  mndMnodeActionDelete(SSdb *pSdb, SMnodeObj *pObj);
S
Shengliang Guan 已提交
32 33 34 35 36 37
static int32_t  mndMnodeActionUpdate(SSdb *pSdb, SMnodeObj *pOld, SMnodeObj *pNew);
static int32_t  mndProcessCreateMnodeReq(SMnodeMsg *pReq);
static int32_t  mndProcessDropMnodeReq(SMnodeMsg *pReq);
static int32_t  mndProcessCreateMnodeRsp(SMnodeMsg *pRsp);
static int32_t  mndProcessAlterMnodeRsp(SMnodeMsg *pRsp);
static int32_t  mndProcessDropMnodeRsp(SMnodeMsg *pRsp);
S
Shengliang Guan 已提交
38
static int32_t  mndGetMnodeMeta(SMnodeMsg *pReq, SShowObj *pShow, STableMetaRsp *pMeta);
S
Shengliang Guan 已提交
39
static int32_t  mndRetrieveMnodes(SMnodeMsg *pReq, SShowObj *pShow, char *data, int32_t rows);
S
Shengliang Guan 已提交
40
static void     mndCancelGetNextMnode(SMnode *pMnode, void *pIter);
S
Shengliang Guan 已提交
41 42 43 44 45 46 47 48 49 50 51

int32_t mndInitMnode(SMnode *pMnode) {
  SSdbTable table = {.sdbType = SDB_MNODE,
                     .keyType = SDB_KEY_INT32,
                     .deployFp = (SdbDeployFp)mndCreateDefaultMnode,
                     .encodeFp = (SdbEncodeFp)mndMnodeActionEncode,
                     .decodeFp = (SdbDecodeFp)mndMnodeActionDecode,
                     .insertFp = (SdbInsertFp)mndMnodeActionInsert,
                     .updateFp = (SdbUpdateFp)mndMnodeActionUpdate,
                     .deleteFp = (SdbDeleteFp)mndMnodeActionDelete};

H
Hongze Cheng 已提交
52 53 54 55 56
  mndSetMsgHandle(pMnode, TDMT_MND_CREATE_MNODE, mndProcessCreateMnodeReq);
  mndSetMsgHandle(pMnode, TDMT_MND_DROP_MNODE, mndProcessDropMnodeReq);
  mndSetMsgHandle(pMnode, TDMT_DND_CREATE_MNODE_RSP, mndProcessCreateMnodeRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_ALTER_MNODE_RSP, mndProcessAlterMnodeRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_DROP_MNODE_RSP, mndProcessDropMnodeRsp);
S
Shengliang Guan 已提交
57 58 59 60

  mndAddShowMetaHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndGetMnodeMeta);
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndRetrieveMnodes);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndCancelGetNextMnode);
S
Shengliang Guan 已提交
61 62 63 64 65 66

  return sdbSetTable(pMnode->pSdb, table);
}

void mndCleanupMnode(SMnode *pMnode) {}

S
Shengliang Guan 已提交
67
static SMnodeObj *mndAcquireMnode(SMnode *pMnode, int32_t mnodeId) {
S
Shengliang Guan 已提交
68 69
  SSdb      *pSdb = pMnode->pSdb;
  SMnodeObj *pObj = sdbAcquire(pSdb, SDB_MNODE, &mnodeId);
S
Shengliang Guan 已提交
70
  if (pObj == NULL && terrno == TSDB_CODE_SDB_OBJ_NOT_THERE) {
S
Shengliang Guan 已提交
71 72 73
    terrno = TSDB_CODE_MND_MNODE_NOT_EXIST;
  }
  return pObj;
S
Shengliang Guan 已提交
74 75
}

S
Shengliang Guan 已提交
76
static void mndReleaseMnode(SMnode *pMnode, SMnodeObj *pObj) {
S
Shengliang Guan 已提交
77
  SSdb *pSdb = pMnode->pSdb;
S
Shengliang Guan 已提交
78
  sdbRelease(pSdb, pObj);
S
Shengliang Guan 已提交
79 80 81 82 83 84 85 86 87 88 89 90 91 92 93
}

char *mndGetRoleStr(int32_t showType) {
  switch (showType) {
    case TAOS_SYNC_STATE_FOLLOWER:
      return "unsynced";
    case TAOS_SYNC_STATE_CANDIDATE:
      return "slave";
    case TAOS_SYNC_STATE_LEADER:
      return "master";
    default:
      return "undefined";
  }
}

S
Shengliang Guan 已提交
94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
void mndUpdateMnodeRole(SMnode *pMnode) {
  SSdb *pSdb = pMnode->pSdb;
  void *pIter = NULL;
  while (1) {
    SMnodeObj *pObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pObj);
    if (pIter == NULL) break;

    if (pObj->id == 1) {
      pObj->role = TAOS_SYNC_STATE_LEADER;
    } else {
      pObj->role = TAOS_SYNC_STATE_CANDIDATE;
    }

    sdbRelease(pSdb, pObj);
  }
}

S
Shengliang Guan 已提交
112 113 114 115 116 117 118 119 120 121
static int32_t mndCreateDefaultMnode(SMnode *pMnode) {
  SMnodeObj mnodeObj = {0};
  mnodeObj.id = 1;
  mnodeObj.createdTime = taosGetTimestampMs();
  mnodeObj.updateTime = mnodeObj.createdTime;

  SSdbRaw *pRaw = mndMnodeActionEncode(&mnodeObj);
  if (pRaw == NULL) return -1;
  sdbSetRawStatus(pRaw, SDB_STATUS_READY);

122
  mDebug("mnode:%d, will be created while deploy sdb, raw:%p", mnodeObj.id, pRaw);
S
Shengliang Guan 已提交
123 124 125
  return sdbWrite(pMnode->pSdb, pRaw);
}

S
Shengliang Guan 已提交
126
static SSdbRaw *mndMnodeActionEncode(SMnodeObj *pObj) {
127 128
  terrno = TSDB_CODE_OUT_OF_MEMORY;

S
Shengliang Guan 已提交
129
  SSdbRaw *pRaw = sdbAllocRaw(SDB_MNODE, TSDB_MNODE_VER_NUMBER, sizeof(SMnodeObj) + TSDB_MNODE_RESERVE_SIZE);
130
  if (pRaw == NULL) goto MNODE_ENCODE_OVER;
S
Shengliang Guan 已提交
131 132

  int32_t dataPos = 0;
133 134 135 136 137 138 139 140 141 142 143 144 145
  SDB_SET_INT32(pRaw, dataPos, pObj->id, MNODE_ENCODE_OVER)
  SDB_SET_INT64(pRaw, dataPos, pObj->createdTime, MNODE_ENCODE_OVER)
  SDB_SET_INT64(pRaw, dataPos, pObj->updateTime, MNODE_ENCODE_OVER)
  SDB_SET_RESERVE(pRaw, dataPos, TSDB_MNODE_RESERVE_SIZE, MNODE_ENCODE_OVER)

  terrno = 0;

MNODE_ENCODE_OVER:
  if (terrno != 0) {
    mError("mnode:%d, failed to encode to raw:%p since %s", pObj->id, pRaw, terrstr());
    sdbFreeRaw(pRaw);
    return NULL;
  }
S
Shengliang Guan 已提交
146

147
  mTrace("mnode:%d, encode to raw:%p, row:%p", pObj->id, pRaw, pObj);
S
Shengliang Guan 已提交
148 149 150 151
  return pRaw;
}

static SSdbRow *mndMnodeActionDecode(SSdbRaw *pRaw) {
152 153
  terrno = TSDB_CODE_OUT_OF_MEMORY;

S
Shengliang Guan 已提交
154 155 156
  int8_t sver = 0;
  if (sdbGetRawSoftVer(pRaw, &sver) != 0) return NULL;

S
Shengliang Guan 已提交
157
  if (sver != TSDB_MNODE_VER_NUMBER) {
S
Shengliang Guan 已提交
158
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
159
    goto MNODE_DECODE_OVER;
S
Shengliang Guan 已提交
160 161
  }

162 163 164
  SSdbRow *pRow = sdbAllocRow(sizeof(SMnodeObj));
  if (pRow == NULL) goto MNODE_DECODE_OVER;

S
Shengliang Guan 已提交
165
  SMnodeObj *pObj = sdbGetRowObj(pRow);
166
  if (pObj == NULL) goto MNODE_DECODE_OVER;
S
Shengliang Guan 已提交
167 168

  int32_t dataPos = 0;
169 170 171 172 173 174 175 176 177 178 179 180 181
  SDB_GET_INT32(pRaw, dataPos, &pObj->id, MNODE_DECODE_OVER)
  SDB_GET_INT64(pRaw, dataPos, &pObj->createdTime, MNODE_DECODE_OVER)
  SDB_GET_INT64(pRaw, dataPos, &pObj->updateTime, MNODE_DECODE_OVER)
  SDB_GET_RESERVE(pRaw, dataPos, TSDB_MNODE_RESERVE_SIZE, MNODE_DECODE_OVER)

  terrno = 0;

MNODE_DECODE_OVER:
  if (terrno != 0) {
    mError("mnode:%d, failed to decode from raw:%p since %s", pObj->id, pRaw, terrstr());
    tfree(pRow);
    return NULL;
  }
S
Shengliang Guan 已提交
182

183
  mTrace("mnode:%d, decode from raw:%p, row:%p", pObj->id, pRaw, pObj);
S
Shengliang Guan 已提交
184 185 186
  return pRow;
}

S
Shengliang Guan 已提交
187
static void mnodeResetMnode(SMnodeObj *pObj) { pObj->role = TAOS_SYNC_STATE_FOLLOWER; }
S
Shengliang Guan 已提交
188

S
Shengliang Guan 已提交
189
static int32_t mndMnodeActionInsert(SSdb *pSdb, SMnodeObj *pObj) {
190
  mTrace("mnode:%d, perform insert action, row:%p", pObj->id, pObj);
S
Shengliang Guan 已提交
191 192
  pObj->pDnode = sdbAcquire(pSdb, SDB_DNODE, &pObj->id);
  if (pObj->pDnode == NULL) {
S
Shengliang Guan 已提交
193
    terrno = TSDB_CODE_MND_DNODE_NOT_EXIST;
S
Shengliang Guan 已提交
194
    mError("mnode:%d, failed to perform insert action since %s", pObj->id, terrstr());
S
Shengliang Guan 已提交
195 196 197
    return -1;
  }

S
Shengliang Guan 已提交
198
  mnodeResetMnode(pObj);
S
Shengliang Guan 已提交
199 200 201
  return 0;
}

S
Shengliang Guan 已提交
202
static int32_t mndMnodeActionDelete(SSdb *pSdb, SMnodeObj *pObj) {
203
  mTrace("mnode:%d, perform delete action, row:%p", pObj->id, pObj);
S
Shengliang Guan 已提交
204 205 206
  if (pObj->pDnode != NULL) {
    sdbRelease(pSdb, pObj->pDnode);
    pObj->pDnode = NULL;
S
Shengliang Guan 已提交
207 208 209 210 211
  }

  return 0;
}

S
Shengliang Guan 已提交
212
static int32_t mndMnodeActionUpdate(SSdb *pSdb, SMnodeObj *pOld, SMnodeObj *pNew) {
S
Shengliang Guan 已提交
213
  mTrace("mnode:%d, perform update action, old row:%p new row:%p", pOld->id, pOld, pNew);
S
Shengliang Guan 已提交
214
  pOld->updateTime = pNew->updateTime;
S
Shengliang Guan 已提交
215
  return 0;
S
Shengliang Guan 已提交
216 217 218 219 220
}

bool mndIsMnode(SMnode *pMnode, int32_t dnodeId) {
  SSdb *pSdb = pMnode->pSdb;

S
Shengliang Guan 已提交
221 222
  SMnodeObj *pObj = sdbAcquire(pSdb, SDB_MNODE, &dnodeId);
  if (pObj == NULL) {
S
Shengliang Guan 已提交
223 224 225
    return false;
  }

S
Shengliang Guan 已提交
226
  sdbRelease(pSdb, pObj);
S
Shengliang Guan 已提交
227
  return true;
S
Shengliang Guan 已提交
228 229
}

S
Shengliang Guan 已提交
230 231 232 233 234 235 236
void mndGetMnodeEpSet(SMnode *pMnode, SEpSet *pEpSet) {
  SSdb *pSdb = pMnode->pSdb;

  pEpSet->numOfEps = 0;

  void *pIter = NULL;
  while (1) {
S
Shengliang Guan 已提交
237 238
    SMnodeObj *pObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pObj);
S
Shengliang Guan 已提交
239
    if (pIter == NULL) break;
S
Shengliang Guan 已提交
240
    if (pObj->pDnode == NULL) break;
S
Shengliang Guan 已提交
241

S
Shengliang Guan 已提交
242
    if (pObj->role == TAOS_SYNC_STATE_LEADER) {
S
Shengliang Guan 已提交
243 244 245
      pEpSet->inUse = pEpSet->numOfEps;
    }

246
    addEpIntoEpSet(pEpSet, pObj->pDnode->fqdn, htons(pObj->pDnode->port));
S
Shengliang Guan 已提交
247
    sdbRelease(pSdb, pObj);
S
Shengliang Guan 已提交
248
  }
S
Shengliang Guan 已提交
249 250
}

251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274
static int32_t mndSetCreateMnodeRedoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRedoRaw = mndMnodeActionEncode(pObj);
  if (pRedoRaw == NULL) return -1;
  if (mndTransAppendRedolog(pTrans, pRedoRaw) != 0) return -1;
  if (sdbSetRawStatus(pRedoRaw, SDB_STATUS_CREATING) != 0) return -1;
  return 0;
}

static int32_t mndSetCreateMnodeUndoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pUndoRaw = mndMnodeActionEncode(pObj);
  if (pUndoRaw == NULL) return -1;
  if (mndTransAppendUndolog(pTrans, pUndoRaw) != 0) return -1;
  if (sdbSetRawStatus(pUndoRaw, SDB_STATUS_DROPPED) != 0) return -1;
  return 0;
}

static int32_t mndSetCreateMnodeCommitLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pCommitRaw = mndMnodeActionEncode(pObj);
  if (pCommitRaw == NULL) return -1;
  if (mndTransAppendCommitlog(pTrans, pCommitRaw) != 0) return -1;
  if (sdbSetRawStatus(pCommitRaw, SDB_STATUS_READY) != 0) return -1;
  return 0;
}

S
Shengliang Guan 已提交
275 276 277 278
static int32_t mndSetCreateMnodeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb   *pSdb = pMnode->pSdb;
  void   *pIter = NULL;
  int32_t numOfReplicas = 0;
279

S
Shengliang Guan 已提交
280
  SDCreateMnodeReq createReq = {0};
S
Shengliang Guan 已提交
281 282 283 284
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;
285

S
Shengliang Guan 已提交
286
    SReplica *pReplica = &createReq.replicas[numOfReplicas];
S
Shengliang Guan 已提交
287 288 289 290
    pReplica->id = htonl(pMObj->id);
    pReplica->port = htons(pMObj->pDnode->port);
    memcpy(pReplica->fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
    numOfReplicas++;
291

S
Shengliang Guan 已提交
292 293 294
    sdbRelease(pSdb, pMObj);
  }

S
Shengliang Guan 已提交
295
  SReplica *pReplica = &createReq.replicas[numOfReplicas];
S
Shengliang Guan 已提交
296 297 298 299 300
  pReplica->id = htonl(pDnode->id);
  pReplica->port = htons(pDnode->port);
  memcpy(pReplica->fqdn, pDnode->fqdn, TSDB_FQDN_LEN);
  numOfReplicas++;

S
Shengliang Guan 已提交
301
  createReq.replica = numOfReplicas;
S
Shengliang Guan 已提交
302

S
Shengliang Guan 已提交
303 304 305 306 307 308 309
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    STransAction action = {0};

S
Shengliang Guan 已提交
310 311
    SDAlterMnodeReq *pReq = malloc(sizeof(SDAlterMnodeReq));
    if (pReq == NULL) {
S
Shengliang Guan 已提交
312 313 314 315
      sdbCancelFetch(pSdb, pIter);
      sdbRelease(pSdb, pMObj);
      return -1;
    }
S
Shengliang Guan 已提交
316
    memcpy(pReq, &createReq, sizeof(SDAlterMnodeReq));
S
Shengliang Guan 已提交
317

S
Shengliang Guan 已提交
318
    pReq->dnodeId = htonl(pMObj->id);
S
Shengliang Guan 已提交
319
    action.epSet = mndGetDnodeEpset(pMObj->pDnode);
S
Shengliang Guan 已提交
320
    action.pCont = pReq;
S
Shengliang Guan 已提交
321
    action.contLen = sizeof(SDAlterMnodeReq);
H
Hongze Cheng 已提交
322
    action.msgType = TDMT_DND_ALTER_MNODE;
S
Shengliang Guan 已提交
323
    action.acceptableCode = TSDB_CODE_DND_MNODE_ALREADY_DEPLOYED;
S
Shengliang Guan 已提交
324 325

    if (mndTransAppendRedoAction(pTrans, &action) != 0) {
S
Shengliang Guan 已提交
326
      free(pReq);
S
Shengliang Guan 已提交
327 328 329 330 331 332 333 334 335 336 337 338
      sdbCancelFetch(pSdb, pIter);
      sdbRelease(pSdb, pMObj);
      return -1;
    }

    sdbRelease(pSdb, pMObj);
  }

  {
    STransAction action = {0};
    action.epSet = mndGetDnodeEpset(pDnode);

S
Shengliang Guan 已提交
339 340 341 342
    SDCreateMnodeReq *pReq = malloc(sizeof(SDCreateMnodeReq));
    if (pReq == NULL) return -1;
    memcpy(pReq, &createReq, sizeof(SDAlterMnodeReq));
    pReq->dnodeId = htonl(pObj->id);
S
Shengliang Guan 已提交
343 344

    action.epSet = mndGetDnodeEpset(pDnode);
S
Shengliang Guan 已提交
345
    action.pCont = pReq;
S
Shengliang Guan 已提交
346
    action.contLen = sizeof(SDCreateMnodeReq);
H
Hongze Cheng 已提交
347
    action.msgType = TDMT_DND_CREATE_MNODE;
S
Shengliang Guan 已提交
348
    action.acceptableCode = TSDB_CODE_DND_MNODE_ALREADY_DEPLOYED;
S
Shengliang Guan 已提交
349
    if (mndTransAppendRedoAction(pTrans, &action) != 0) {
S
Shengliang Guan 已提交
350
      free(pReq);
S
Shengliang Guan 已提交
351 352
      return -1;
    }
353 354 355 356 357
  }

  return 0;
}

S
Shengliang Guan 已提交
358
static int32_t mndCreateMnode(SMnode *pMnode, SMnodeMsg *pReq, SDnodeObj *pDnode, SMCreateMnodeReq *pCreate) {
S
Shengliang Guan 已提交
359 360
  int32_t code = -1;

S
Shengliang Guan 已提交
361
  SMnodeObj mnodeObj = {0};
S
Shengliang Guan 已提交
362
  mnodeObj.id = pDnode->id;
S
Shengliang Guan 已提交
363 364 365
  mnodeObj.createdTime = taosGetTimestampMs();
  mnodeObj.updateTime = mnodeObj.createdTime;

S
Shengliang Guan 已提交
366
  STrans *pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, &pReq->rpcMsg);
S
Shengliang Guan 已提交
367
  if (pTrans == NULL) goto CREATE_MNODE_OVER;
S
Shengliang Guan 已提交
368

S
Shengliang Guan 已提交
369 370 371 372
  mDebug("trans:%d, used to create mnode:%d", pTrans->id, pCreate->dnodeId);
  if (mndSetCreateMnodeRedoLogs(pMnode, pTrans, &mnodeObj) != 0) goto CREATE_MNODE_OVER;
  if (mndSetCreateMnodeCommitLogs(pMnode, pTrans, &mnodeObj) != 0) goto CREATE_MNODE_OVER;
  if (mndSetCreateMnodeRedoActions(pMnode, pTrans, pDnode, &mnodeObj) != 0) goto CREATE_MNODE_OVER;
S
Shengliang Guan 已提交
373

S
Shengliang Guan 已提交
374
  if (mndTransPrepare(pMnode, pTrans) != 0) goto CREATE_MNODE_OVER;
S
Shengliang Guan 已提交
375

376 377 378
  code = 0;

CREATE_MNODE_OVER:
S
Shengliang Guan 已提交
379
  mndTransDrop(pTrans);
380
  return code;
S
Shengliang Guan 已提交
381 382
}

S
Shengliang Guan 已提交
383
static int32_t mndProcessCreateMnodeReq(SMnodeMsg *pReq) {
S
Shengliang Guan 已提交
384 385 386 387 388 389 390 391 392 393 394
  SMnode          *pMnode = pReq->pMnode;
  int32_t          code = -1;
  SMnodeObj       *pObj = NULL;
  SDnodeObj       *pDnode = NULL;
  SUserObj        *pUser = NULL;
  SMCreateMnodeReq createReq = {0};

  if (tDeserializeSMCreateDropMnodeReq(pReq->rpcMsg.pCont, pReq->rpcMsg.contLen, &createReq) != 0) {
    terrno = TSDB_CODE_INVALID_MSG;
    goto CREATE_MNODE_OVER;
  }
S
Shengliang Guan 已提交
395

S
Shengliang Guan 已提交
396
  mDebug("mnode:%d, start to create", createReq.dnodeId);
S
Shengliang Guan 已提交
397

S
Shengliang Guan 已提交
398
  pObj = mndAcquireMnode(pMnode, createReq.dnodeId);
S
Shengliang Guan 已提交
399
  if (pObj != NULL) {
S
Shengliang Guan 已提交
400
    terrno = TSDB_CODE_MND_MNODE_ALREADY_EXIST;
S
Shengliang Guan 已提交
401
    goto CREATE_MNODE_OVER;
S
Shengliang Guan 已提交
402
  } else if (terrno != TSDB_CODE_MND_MNODE_NOT_EXIST) {
S
Shengliang Guan 已提交
403
    goto CREATE_MNODE_OVER;
S
Shengliang Guan 已提交
404 405
  }

S
Shengliang Guan 已提交
406
  pDnode = mndAcquireDnode(pMnode, createReq.dnodeId);
S
Shengliang Guan 已提交
407 408
  if (pDnode == NULL) {
    terrno = TSDB_CODE_MND_DNODE_NOT_EXIST;
S
Shengliang Guan 已提交
409
    goto CREATE_MNODE_OVER;
S
Shengliang Guan 已提交
410 411
  }

S
Shengliang Guan 已提交
412 413 414 415 416
  pUser = mndAcquireUser(pMnode, pReq->user);
  if (pUser == NULL) {
    terrno = TSDB_CODE_MND_NO_USER_FROM_CONN;
    goto CREATE_MNODE_OVER;
  }
S
Shengliang Guan 已提交
417

S
Shengliang Guan 已提交
418
  if (mndCheckNodeAuth(pUser)) {
S
Shengliang Guan 已提交
419 420 421 422 423 424 425 426 427
    goto CREATE_MNODE_OVER;
  }

  code = mndCreateMnode(pMnode, pReq, pDnode, &createReq);
  if (code == 0) code = TSDB_CODE_MND_ACTION_IN_PROGRESS;

CREATE_MNODE_OVER:
  if (code != 0 && code != TSDB_CODE_MND_ACTION_IN_PROGRESS) {
    mError("mnode:%d, failed to create since %s", createReq.dnodeId, terrstr());
S
Shengliang Guan 已提交
428 429
  }

S
Shengliang Guan 已提交
430 431 432 433 434
  mndReleaseMnode(pMnode, pObj);
  mndReleaseDnode(pMnode, pDnode);
  mndReleaseUser(pMnode, pUser);

  return code;
S
Shengliang Guan 已提交
435 436
}

437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452
static int32_t mndSetDropMnodeRedoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRedoRaw = mndMnodeActionEncode(pObj);
  if (pRedoRaw == NULL) return -1;
  if (mndTransAppendRedolog(pTrans, pRedoRaw) != 0) return -1;
  if (sdbSetRawStatus(pRedoRaw, SDB_STATUS_DROPPING) != 0) return -1;
  return 0;
}

static int32_t mndSetDropMnodeCommitLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pCommitRaw = mndMnodeActionEncode(pObj);
  if (pCommitRaw == NULL) return -1;
  if (mndTransAppendCommitlog(pTrans, pCommitRaw) != 0) return -1;
  if (sdbSetRawStatus(pCommitRaw, SDB_STATUS_DROPPED) != 0) return -1;
  return 0;
}

S
Shengliang Guan 已提交
453 454 455 456
static int32_t mndSetDropMnodeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb   *pSdb = pMnode->pSdb;
  void   *pIter = NULL;
  int32_t numOfReplicas = 0;
457

S
Shengliang Guan 已提交
458
  SDAlterMnodeReq alterReq = {0};
S
Shengliang Guan 已提交
459 460 461 462
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;
463

S
Shengliang Guan 已提交
464
    if (pMObj->id != pObj->id) {
S
Shengliang Guan 已提交
465
      SReplica *pReplica = &alterReq.replicas[numOfReplicas];
S
Shengliang Guan 已提交
466 467 468 469 470
      pReplica->id = htonl(pMObj->id);
      pReplica->port = htons(pMObj->pDnode->port);
      memcpy(pReplica->fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
      numOfReplicas++;
    }
471

S
Shengliang Guan 已提交
472 473 474
    sdbRelease(pSdb, pMObj);
  }

S
Shengliang Guan 已提交
475
  alterReq.replica = numOfReplicas;
S
Shengliang Guan 已提交
476

S
Shengliang Guan 已提交
477 478 479 480 481 482 483
  while (1) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;
    if (pMObj->id != pObj->id) {
      STransAction action = {0};

S
Shengliang Guan 已提交
484 485
      SDAlterMnodeReq *pReq = malloc(sizeof(SDAlterMnodeReq));
      if (pReq == NULL) {
S
Shengliang Guan 已提交
486 487 488 489
        sdbCancelFetch(pSdb, pIter);
        sdbRelease(pSdb, pMObj);
        return -1;
      }
S
Shengliang Guan 已提交
490
      memcpy(pReq, &alterReq, sizeof(SDAlterMnodeReq));
S
Shengliang Guan 已提交
491

S
Shengliang Guan 已提交
492
      pReq->dnodeId = htonl(pMObj->id);
S
Shengliang Guan 已提交
493
      action.epSet = mndGetDnodeEpset(pMObj->pDnode);
S
Shengliang Guan 已提交
494
      action.pCont = pReq;
S
Shengliang Guan 已提交
495
      action.contLen = sizeof(SDAlterMnodeReq);
H
Hongze Cheng 已提交
496
      action.msgType = TDMT_DND_ALTER_MNODE;
S
Shengliang Guan 已提交
497
      action.acceptableCode = TSDB_CODE_DND_MNODE_ALREADY_DEPLOYED;
S
Shengliang Guan 已提交
498 499

      if (mndTransAppendRedoAction(pTrans, &action) != 0) {
S
Shengliang Guan 已提交
500
        free(pReq);
S
Shengliang Guan 已提交
501 502 503 504 505 506 507 508 509 510 511 512 513
        sdbCancelFetch(pSdb, pIter);
        sdbRelease(pSdb, pMObj);
        return -1;
      }
    }

    sdbRelease(pSdb, pMObj);
  }

  {
    STransAction action = {0};
    action.epSet = mndGetDnodeEpset(pDnode);

S
Shengliang Guan 已提交
514 515
    SDDropMnodeReq *pReq = malloc(sizeof(SDDropMnodeReq));
    if (pReq == NULL) {
S
Shengliang Guan 已提交
516 517 518
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
S
Shengliang Guan 已提交
519
    pReq->dnodeId = htonl(pObj->id);
S
Shengliang Guan 已提交
520 521

    action.epSet = mndGetDnodeEpset(pDnode);
S
Shengliang Guan 已提交
522
    action.pCont = pReq;
S
Shengliang Guan 已提交
523
    action.contLen = sizeof(SDDropMnodeReq);
H
Hongze Cheng 已提交
524
    action.msgType = TDMT_DND_DROP_MNODE;
S
Shengliang Guan 已提交
525
    action.acceptableCode = TSDB_CODE_DND_MNODE_NOT_DEPLOYED;
S
Shengliang Guan 已提交
526
    if (mndTransAppendRedoAction(pTrans, &action) != 0) {
S
Shengliang Guan 已提交
527
      free(pReq);
S
Shengliang Guan 已提交
528 529
      return -1;
    }
530 531 532 533 534
  }

  return 0;
}

S
Shengliang Guan 已提交
535
static int32_t mndDropMnode(SMnode *pMnode, SMnodeMsg *pReq, SMnodeObj *pObj) {
536
  int32_t code = -1;
S
Shengliang Guan 已提交
537

S
Shengliang Guan 已提交
538
  STrans *pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, &pReq->rpcMsg);
S
Shengliang Guan 已提交
539
  if (pTrans == NULL) goto DROP_MNODE_OVER;
S
Shengliang Guan 已提交
540

541 542
  mDebug("trans:%d, used to drop mnode:%d", pTrans->id, pObj->id);

S
Shengliang Guan 已提交
543 544 545 546
  if (mndSetDropMnodeRedoLogs(pMnode, pTrans, pObj) != 0) goto DROP_MNODE_OVER;
  if (mndSetDropMnodeCommitLogs(pMnode, pTrans, pObj) != 0) goto DROP_MNODE_OVER;
  if (mndSetDropMnodeRedoActions(pMnode, pTrans, pObj->pDnode, pObj) != 0) goto DROP_MNODE_OVER;
  if (mndTransPrepare(pMnode, pTrans) != 0) goto DROP_MNODE_OVER;
S
Shengliang Guan 已提交
547

548 549 550
  code = 0;

DROP_MNODE_OVER:
S
Shengliang Guan 已提交
551
  mndTransDrop(pTrans);
552
  return code;
S
Shengliang Guan 已提交
553 554
}

S
Shengliang Guan 已提交
555
static int32_t mndProcessDropMnodeReq(SMnodeMsg *pReq) {
S
Shengliang Guan 已提交
556 557 558 559 560 561 562 563 564 565
  SMnode        *pMnode = pReq->pMnode;
  int32_t        code = -1;
  SUserObj      *pUser = NULL;
  SMnodeObj     *pObj = NULL;
  SMDropMnodeReq dropReq = {0};

  if (tDeserializeSMCreateDropMnodeReq(pReq->rpcMsg.pCont, pReq->rpcMsg.contLen, &dropReq) != 0) {
    terrno = TSDB_CODE_INVALID_MSG;
    goto DROP_MNODE_OVER;
  }
S
Shengliang Guan 已提交
566

S
Shengliang Guan 已提交
567
  mDebug("mnode:%d, start to drop", dropReq.dnodeId);
S
Shengliang Guan 已提交
568

S
Shengliang Guan 已提交
569
  if (dropReq.dnodeId <= 0) {
S
Shengliang Guan 已提交
570
    terrno = TSDB_CODE_SDB_APP_ERROR;
S
Shengliang Guan 已提交
571
    goto DROP_MNODE_OVER;
S
Shengliang Guan 已提交
572 573
  }

S
Shengliang Guan 已提交
574
  pObj = mndAcquireMnode(pMnode, dropReq.dnodeId);
S
Shengliang Guan 已提交
575
  if (pObj == NULL) {
S
Shengliang Guan 已提交
576
    goto DROP_MNODE_OVER;
S
Shengliang Guan 已提交
577 578
  }

S
Shengliang Guan 已提交
579 580 581 582 583 584
  pUser = mndAcquireUser(pMnode, pReq->user);
  if (pUser == NULL) {
    terrno = TSDB_CODE_MND_NO_USER_FROM_CONN;
    goto DROP_MNODE_OVER;
  }

S
Shengliang Guan 已提交
585
  if (mndCheckNodeAuth(pUser)) {
S
Shengliang Guan 已提交
586
    goto DROP_MNODE_OVER;
S
Shengliang Guan 已提交
587
  }
S
Shengliang Guan 已提交
588

S
Shengliang Guan 已提交
589 590 591 592 593 594 595 596 597 598 599 600
  code = mndDropMnode(pMnode, pReq, pObj);
  if (code == 0) code = TSDB_CODE_MND_ACTION_IN_PROGRESS;

DROP_MNODE_OVER:
  if (code != 0 && code != TSDB_CODE_MND_ACTION_IN_PROGRESS) {
    mError("mnode:%d, failed to drop since %s", dropReq.dnodeId, terrstr());
  }

  mndReleaseMnode(pMnode, pObj);
  mndReleaseUser(pMnode, pUser);

  return code;
S
Shengliang Guan 已提交
601 602
}

S
Shengliang Guan 已提交
603 604
static int32_t mndProcessCreateMnodeRsp(SMnodeMsg *pRsp) {
  mndTransProcessRsp(pRsp);
S
Shengliang Guan 已提交
605 606 607
  return 0;
}

S
Shengliang Guan 已提交
608 609
static int32_t mndProcessAlterMnodeRsp(SMnodeMsg *pRsp) {
  mndTransProcessRsp(pRsp);
S
Shengliang Guan 已提交
610 611
  return 0;
}
S
Shengliang Guan 已提交
612

S
Shengliang Guan 已提交
613 614
static int32_t mndProcessDropMnodeRsp(SMnodeMsg *pRsp) {
  mndTransProcessRsp(pRsp);
S
Shengliang Guan 已提交
615 616
  return 0;
}
S
Shengliang Guan 已提交
617

S
Shengliang Guan 已提交
618
static int32_t mndGetMnodeMeta(SMnodeMsg *pReq, SShowObj *pShow, STableMetaRsp *pMeta) {
S
Shengliang Guan 已提交
619
  SMnode *pMnode = pReq->pMnode;
S
Shengliang Guan 已提交
620 621 622
  SSdb   *pSdb = pMnode->pSdb;

  int32_t  cols = 0;
S
Shengliang Guan 已提交
623
  SSchema *pSchema = pMeta->pSchemas;
S
Shengliang Guan 已提交
624 625 626 627

  pShow->bytes[cols] = 2;
  pSchema[cols].type = TSDB_DATA_TYPE_SMALLINT;
  strcpy(pSchema[cols].name, "id");
S
Shengliang Guan 已提交
628
  pSchema[cols].bytes = pShow->bytes[cols];
S
Shengliang Guan 已提交
629 630 631 632
  cols++;

  pShow->bytes[cols] = TSDB_EP_LEN + VARSTR_HEADER_SIZE;
  pSchema[cols].type = TSDB_DATA_TYPE_BINARY;
H
Haojun Liao 已提交
633
  strcpy(pSchema[cols].name, "endpoint");
S
Shengliang Guan 已提交
634
  pSchema[cols].bytes = pShow->bytes[cols];
S
Shengliang Guan 已提交
635 636 637 638 639
  cols++;

  pShow->bytes[cols] = 12 + VARSTR_HEADER_SIZE;
  pSchema[cols].type = TSDB_DATA_TYPE_BINARY;
  strcpy(pSchema[cols].name, "role");
S
Shengliang Guan 已提交
640
  pSchema[cols].bytes = pShow->bytes[cols];
S
Shengliang Guan 已提交
641 642 643 644
  cols++;

  pShow->bytes[cols] = 8;
  pSchema[cols].type = TSDB_DATA_TYPE_TIMESTAMP;
S
Shengliang Guan 已提交
645
  strcpy(pSchema[cols].name, "create_time");
S
Shengliang Guan 已提交
646
  pSchema[cols].bytes = pShow->bytes[cols];
S
Shengliang Guan 已提交
647 648 649 650
  cols++;

  pShow->bytes[cols] = 8;
  pSchema[cols].type = TSDB_DATA_TYPE_TIMESTAMP;
S
Shengliang Guan 已提交
651
  strcpy(pSchema[cols].name, "role_time");
S
Shengliang Guan 已提交
652
  pSchema[cols].bytes = pShow->bytes[cols];
S
Shengliang Guan 已提交
653 654
  cols++;

S
Shengliang Guan 已提交
655
  pMeta->numOfColumns = cols;
S
Shengliang Guan 已提交
656 657 658 659 660 661 662 663 664
  pShow->numOfColumns = cols;

  pShow->offset[0] = 0;
  for (int32_t i = 1; i < cols; ++i) {
    pShow->offset[i] = pShow->offset[i - 1] + pShow->bytes[i - 1];
  }

  pShow->numOfRows = sdbGetSize(pSdb, SDB_MNODE);
  pShow->rowSize = pShow->offset[cols - 1] + pShow->bytes[cols - 1];
D
dapan1121 已提交
665
  strcpy(pMeta->tbName, mndShowStr(pShow->type));
S
Shengliang Guan 已提交
666

S
Shengliang Guan 已提交
667
  mndUpdateMnodeRole(pMnode);
S
Shengliang Guan 已提交
668 669 670
  return 0;
}

S
Shengliang Guan 已提交
671 672
static int32_t mndRetrieveMnodes(SMnodeMsg *pReq, SShowObj *pShow, char *data, int32_t rows) {
  SMnode    *pMnode = pReq->pMnode;
S
Shengliang Guan 已提交
673 674 675
  SSdb      *pSdb = pMnode->pSdb;
  int32_t    numOfRows = 0;
  int32_t    cols = 0;
S
Shengliang Guan 已提交
676
  SMnodeObj *pObj = NULL;
S
Shengliang Guan 已提交
677 678 679
  char      *pWrite;

  while (numOfRows < rows) {
S
Shengliang Guan 已提交
680
    pShow->pIter = sdbFetch(pSdb, SDB_MNODE, pShow->pIter, (void **)&pObj);
S
Shengliang Guan 已提交
681 682 683 684 685
    if (pShow->pIter == NULL) break;

    cols = 0;

    pWrite = data + pShow->offset[cols] * rows + pShow->bytes[cols] * numOfRows;
S
Shengliang Guan 已提交
686
    *(int16_t *)pWrite = pObj->id;
S
Shengliang Guan 已提交
687 688 689
    cols++;

    pWrite = data + pShow->offset[cols] * rows + pShow->bytes[cols] * numOfRows;
S
Shengliang Guan 已提交
690
    STR_WITH_MAXSIZE_TO_VARSTR(pWrite, pObj->pDnode->ep, pShow->bytes[cols]);
S
Shengliang Guan 已提交
691 692 693 694

    cols++;

    pWrite = data + pShow->offset[cols] * rows + pShow->bytes[cols] * numOfRows;
S
Shengliang Guan 已提交
695
    char *roles = mndGetRoleStr(pObj->role);
S
Shengliang Guan 已提交
696 697 698 699
    STR_WITH_MAXSIZE_TO_VARSTR(pWrite, roles, pShow->bytes[cols]);
    cols++;

    pWrite = data + pShow->offset[cols] * rows + pShow->bytes[cols] * numOfRows;
S
Shengliang Guan 已提交
700
    *(int64_t *)pWrite = pObj->createdTime;
S
Shengliang Guan 已提交
701 702 703
    cols++;

    pWrite = data + pShow->offset[cols] * rows + pShow->bytes[cols] * numOfRows;
S
Shengliang Guan 已提交
704
    *(int64_t *)pWrite = pObj->roleTime;
S
Shengliang Guan 已提交
705 706 707
    cols++;

    numOfRows++;
S
Shengliang Guan 已提交
708
    sdbRelease(pSdb, pObj);
S
Shengliang Guan 已提交
709 710
  }

S
Shengliang Guan 已提交
711
  mndVacuumResult(data, pShow->numOfColumns, numOfRows, rows, pShow);
S
Shengliang Guan 已提交
712 713 714 715 716 717 718 719 720
  pShow->numOfReads += numOfRows;

  return numOfRows;
}

static void mndCancelGetNextMnode(SMnode *pMnode, void *pIter) {
  SSdb *pSdb = pMnode->pSdb;
  sdbCancelFetch(pSdb, pIter);
}