mndMain.c 31.8 KB
Newer Older
S
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17
#include "mndAcct.h"
S
Shengliang Guan 已提交
18
#include "mndBnode.h"
S
Shengliang Guan 已提交
19
#include "mndCluster.h"
L
Liu Jicong 已提交
20
#include "mndConsumer.h"
S
Shengliang Guan 已提交
21 22 23
#include "mndDb.h"
#include "mndDnode.h"
#include "mndFunc.h"
L
Liu Jicong 已提交
24
#include "mndGrant.h"
S
monitor  
Shengliang Guan 已提交
25
#include "mndInfoSchema.h"
S
Shengliang Guan 已提交
26
#include "mndMnode.h"
L
Liu Jicong 已提交
27
#include "mndOffset.h"
L
Liu Jicong 已提交
28
#include "mndPerfSchema.h"
M
Minghao Li 已提交
29
#include "mndPrivilege.h"
S
Shengliang Guan 已提交
30
#include "mndProfile.h"
S
Shengliang Guan 已提交
31
#include "mndQnode.h"
L
Liu Jicong 已提交
32
#include "mndQuery.h"
S
Shengliang Guan 已提交
33
#include "mndShow.h"
S
sma  
Shengliang Guan 已提交
34
#include "mndSma.h"
S
Shengliang Guan 已提交
35
#include "mndSnode.h"
S
Shengliang Guan 已提交
36
#include "mndStb.h"
L
Liu Jicong 已提交
37
#include "mndStream.h"
L
Liu Jicong 已提交
38
#include "mndSubscribe.h"
S
Shengliang Guan 已提交
39 40
#include "mndSync.h"
#include "mndTelem.h"
L
Liu Jicong 已提交
41
#include "mndTopic.h"
S
Shengliang Guan 已提交
42 43 44
#include "mndTrans.h"
#include "mndUser.h"
#include "mndVgroup.h"
S
Shengliang Guan 已提交
45

S
Shengliang Guan 已提交
46 47 48 49 50 51 52 53 54 55 56 57 58
/*
 * Serialize an empty SMTimerReq into a buffer obtained from rpcMallocCont().
 *
 * Returns the buffer and stores its length in *pContLen on success.
 * Returns NULL (leaving *pContLen untouched) when the length probe yields a
 * non-positive value or when the allocation fails.
 */
static void *mndBuildTimerMsg(int32_t *pContLen) {
  SMTimerReq req = {0};

  // Called with a NULL buffer first; the result is used as the allocation size.
  int32_t len = tSerializeSMTimerMsg(NULL, 0, &req);
  if (len <= 0) {
    return NULL;
  }

  void *pBuf = rpcMallocCont(len);
  if (pBuf != NULL) {
    tSerializeSMTimerMsg(pBuf, len, &req);
    *pContLen = len;
  }
  return pBuf;
}

S
Shengliang Guan 已提交
59 60
/*
 * Post a TDMT_MND_TRANS_TIMER message to the mnode WRITE_QUEUE.
 * Nothing is queued when the timer payload cannot be built.
 */
static void mndPullupTrans(SMnode *pMnode) {
  int32_t len = 0;
  void   *pCont = mndBuildTimerMsg(&len);
  if (pCont == NULL) return;

  SRpcMsg msg = {.msgType = TDMT_MND_TRANS_TIMER, .pCont = pCont, .contLen = len};
  tmsgPutToQueue(&pMnode->msgCb, WRITE_QUEUE, &msg);
}

68
/*
 * Post a TDMT_MND_TTL_TIMER message to the mnode WRITE_QUEUE.
 * Nothing is queued when the timer payload cannot be built.
 */
static void mndPullupTtl(SMnode *pMnode) {
  int32_t contLen = 0;
  void   *pReq = mndBuildTimerMsg(&contLen);
  // mndBuildTimerMsg() returns NULL on serialization or allocation failure;
  // never enqueue a message with a NULL body and zero length.
  if (pReq != NULL) {
    SRpcMsg rpcMsg = {.msgType = TDMT_MND_TTL_TIMER, .pCont = pReq, .contLen = contLen};
    tmsgPutToQueue(&pMnode->msgCb, WRITE_QUEUE, &rpcMsg);
  }
}

S
Shengliang Guan 已提交
75 76
/*
 * Post a TDMT_MND_MQ_TIMER message to the mnode READ_QUEUE.
 * Nothing is queued when the timer payload cannot be built.
 */
static void mndCalMqRebalance(SMnode *pMnode) {
  int32_t len = 0;
  void   *pCont = mndBuildTimerMsg(&len);
  if (pCont == NULL) return;

  SRpcMsg msg = {.msgType = TDMT_MND_MQ_TIMER, .pCont = pCont, .contLen = len};
  tmsgPutToQueue(&pMnode->msgCb, READ_QUEUE, &msg);
}
L
Liu Jicong 已提交
83

S
Shengliang Guan 已提交
84 85
/*
 * Post a TDMT_MND_TELEM_TIMER message to the mnode READ_QUEUE.
 * Nothing is queued when the timer payload cannot be built.
 */
static void mndPullupTelem(SMnode *pMnode) {
  int32_t len = 0;
  void   *pCont = mndBuildTimerMsg(&len);
  if (pCont == NULL) return;

  SRpcMsg msg = {.msgType = TDMT_MND_TELEM_TIMER, .pCont = pCont, .contLen = len};
  tmsgPutToQueue(&pMnode->msgCb, READ_QUEUE, &msg);
}

93
/*
 * Post a TDMT_MND_GRANT_HB_TIMER message to the mnode READ_QUEUE.
 * The message carries the fixed ahandle value 0x9527.
 * Nothing is queued when the timer payload cannot be built.
 */
static void mndPullupGrant(SMnode *pMnode) {
  int32_t len = 0;
  void   *pCont = mndBuildTimerMsg(&len);
  if (pCont == NULL) return;

  SRpcMsg msg = {
      .msgType = TDMT_MND_GRANT_HB_TIMER, .pCont = pCont, .contLen = len, .info.ahandle = (void *)0x9527};
  tmsgPutToQueue(&pMnode->msgCb, READ_QUEUE, &msg);
}

103 104 105 106 107 108 109 110 111 112
/*
 * Post a TDMT_MND_UPTIME_TIMER message to the mnode WRITE_QUEUE.
 * The message carries the fixed ahandle value 0x9528.
 * Nothing is queued when the timer payload cannot be built.
 */
static void mndIncreaseUpTime(SMnode *pMnode) {
  int32_t len = 0;
  void   *pCont = mndBuildTimerMsg(&len);
  if (pCont == NULL) return;

  SRpcMsg msg = {
      .msgType = TDMT_MND_UPTIME_TIMER, .pCont = pCont, .contLen = len, .info.ahandle = (void *)0x9528};
  tmsgPutToQueue(&pMnode->msgCb, WRITE_QUEUE, &msg);
}

S
Shengliang Guan 已提交
113
static void *mndThreadFp(void *param) {
S
Shengliang Guan 已提交
114
  SMnode *pMnode = param;
S
Shengliang Guan 已提交
115 116 117 118 119 120
  int64_t lastTime = 0;
  setThreadName("mnode-timer");

  while (1) {
    lastTime++;
    taosMsleep(100);
S
Shengliang Guan 已提交
121
    if (mndGetStop(pMnode)) break;
122
    if (lastTime % 10 != 0) continue;
S
Shengliang Guan 已提交
123

124 125
    int64_t sec = lastTime / 10;
    if (sec % tsTtlPushInterval == 0) {
126
      mndPullupTtl(pMnode);
wmmhello's avatar
wmmhello 已提交
127 128
    }

129
    if (sec % tsTransPullupInterval == 0) {
S
Shengliang Guan 已提交
130 131 132
      mndPullupTrans(pMnode);
    }

133
    if (sec % tsMqRebalanceInterval == 0) {
S
Shengliang Guan 已提交
134 135 136
      mndCalMqRebalance(pMnode);
    }

S
Shengliang Guan 已提交
137
    if (sec % tsTelemInterval == (TMIN(60, (tsTelemInterval - 1)))) {
S
Shengliang Guan 已提交
138 139
      mndPullupTelem(pMnode);
    }
C
Cary Xu 已提交
140

141
    if (sec % tsGrantHBInterval == 0) {
142
      mndPullupGrant(pMnode);
C
Cary Xu 已提交
143
    }
144

145
    if (sec % tsUptimeInterval == 0) {
146 147
      mndIncreaseUpTime(pMnode);
    }
S
Shengliang Guan 已提交
148 149
  }

S
Shengliang Guan 已提交
150
  return NULL;
L
Liu Jicong 已提交
151 152
}

153
/*
 * Start the joinable "mnode-timer" thread running mndThreadFp().
 *
 * The thread handle is stored in pMnode->thread. Returns 0 on success and -1
 * when the thread cannot be created. The thread attribute object is destroyed
 * on both paths so that it is not leaked when creation fails.
 */
static int32_t mndInitTimer(SMnode *pMnode) {
  TdThreadAttr thAttr;
  taosThreadAttrInit(&thAttr);
  taosThreadAttrSetDetachState(&thAttr, PTHREAD_CREATE_JOINABLE);

  int32_t ret = taosThreadCreate(&pMnode->thread, &thAttr, mndThreadFp, pMnode);
  if (ret != 0) {
    // Log before destroying the attribute so errno cannot be overwritten first.
    mError("failed to create timer thread since %s", strerror(errno));
  }

  taosThreadAttrDestroy(&thAttr);
  if (ret != 0) return -1;

  tmsgReportStartup("mnode-timer", "initialized");
  return 0;
}

167
/*
 * Join the timer thread and clear its handle.
 * Does nothing when pMnode->thread is not a valid thread handle.
 */
static void mndCleanupTimer(SMnode *pMnode) {
  if (!taosCheckPthreadValid(pMnode->thread)) return;

  taosThreadJoin(pMnode->thread, NULL);
  taosThreadClear(&pMnode->thread);
}

S
Shengliang Guan 已提交
174
/*
 * Store a strdup()'ed copy of path in pMnode->path and create that directory.
 *
 * Returns 0 on success. Returns -1 with terrno set to
 * TSDB_CODE_OUT_OF_MEMORY when the copy fails, or to
 * TAOS_SYSTEM_ERROR(errno) when taosMkDir() fails.
 */
static int32_t mndCreateDir(SMnode *pMnode, const char *path) {
  char *pathCopy = strdup(path);
  pMnode->path = pathCopy;
  if (pathCopy == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (taosMkDir(pMnode->path) == 0) {
    return 0;
  }

  terrno = TAOS_SYSTEM_ERROR(errno);
  return -1;
}
S
Shengliang Guan 已提交
188

189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217
/*
 * Open the mnode WAL located at "<pMnode->path><TD_DIRSEP>wal" and store the
 * handle in pMnode->pWal.
 *
 * Returns 0 on success, -1 (after logging terrstr()) when walOpen() fails.
 */
static int32_t mndInitWal(SMnode *pMnode) {
  char walPath[PATH_MAX + 20] = {0};
  snprintf(walPath, sizeof(walPath), "%s%swal", pMnode->path, TD_DIRSEP);

  SWalCfg walCfg = {
      .vgId = 1,
      .level = TAOS_WAL_FSYNC,
      .fsyncPeriod = 0,
      .rollPeriod = -1,
      .segSize = -1,
      .retentionPeriod = -1,
      .retentionSize = -1,
  };

  pMnode->pWal = walOpen(walPath, &walCfg);
  if (pMnode->pWal != NULL) {
    return 0;
  }

  mError("failed to open wal since %s", terrstr());
  return -1;
}

/* Close the mnode WAL if it is open and reset pMnode->pWal to NULL. */
static void mndCloseWal(SMnode *pMnode) {
  if (pMnode->pWal == NULL) return;

  walClose(pMnode->pWal);
  pMnode->pWal = NULL;
}

218 219 220
/*
 * Create the sdb instance for this mnode from its path, its WAL handle and a
 * back-pointer to the mnode itself; the result is stored in pMnode->pSdb.
 *
 * Returns 0 on success, -1 when sdbInit() returns NULL.
 */
static int32_t mndInitSdb(SMnode *pMnode) {
  SSdbOpt sdbOpt = {
      .path = pMnode->path,
      .pMnode = pMnode,
      .pWal = pMnode->pWal,
  };

  pMnode->pSdb = sdbInit(&sdbOpt);
  return (pMnode->pSdb == NULL) ? -1 : 0;
}

232 233 234 235 236 237 238
/*
 * Load sdb from file unless this mnode is being deployed.
 * Returns 0 immediately when pMnode->deploy is set; otherwise returns the
 * result of sdbReadFile().
 */
static int32_t mndOpenSdb(SMnode *pMnode) {
  if (pMnode->deploy) {
    return 0;
  }
  return sdbReadFile(pMnode->pSdb);
}
239 240 241

/* Release the sdb instance if one exists and reset pMnode->pSdb to NULL. */
static void mndCleanupSdb(SMnode *pMnode) {
  if (pMnode->pSdb == NULL) return;

  sdbCleanup(pMnode->pSdb);
  pMnode->pSdb = NULL;
}

247 248 249 250 251
/*
 * Append one init/cleanup step to pMnode->pSteps.
 *
 * name      - label used in log and startup messages for this step
 * initFp    - function run by mndExecSteps(); may be NULL
 * cleanupFp - function run by mndCleanupSteps(); may be NULL
 *
 * Returns 0 on success, -1 with terrno = TSDB_CODE_OUT_OF_MEMORY when the
 * push fails.
 */
static int32_t mndAllocStep(SMnode *pMnode, char *name, MndInitFp initFp, MndCleanupFp cleanupFp) {
  SMnodeStep newStep = {.name = name, .initFp = initFp, .cleanupFp = cleanupFp};

  if (taosArrayPush(pMnode->pSteps, &newStep) != NULL) {
    return 0;
  }

  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return -1;
}

260
/*
 * Register every mnode sub-module as an init/cleanup step, in the order the
 * steps must be initialised. mndExecSteps() later runs the init functions in
 * this order; mndCleanupSteps() runs the cleanup functions in reverse.
 *
 * Returns 0 when all steps were registered, -1 as soon as one registration
 * fails (steps registered before the failure stay in pMnode->pSteps).
 */
static int32_t mndInitSteps(SMnode *pMnode) {
  const struct {
    char        *name;
    MndInitFp    initFp;
    MndCleanupFp cleanupFp;
  } stepTable[] = {
      {"mnode-wal", mndInitWal, mndCloseWal},
      {"mnode-sdb", mndInitSdb, mndCleanupSdb},
      {"mnode-trans", mndInitTrans, mndCleanupTrans},
      {"mnode-cluster", mndInitCluster, mndCleanupCluster},
      {"mnode-mnode", mndInitMnode, mndCleanupMnode},
      {"mnode-qnode", mndInitQnode, mndCleanupQnode},
      {"mnode-snode", mndInitSnode, mndCleanupSnode},
      {"mnode-bnode", mndInitBnode, mndCleanupBnode},
      {"mnode-dnode", mndInitDnode, mndCleanupDnode},
      {"mnode-user", mndInitUser, mndCleanupUser},
      {"mnode-grant", mndInitGrant, mndCleanupGrant},
      {"mnode-privilege", mndInitPrivilege, mndCleanupPrivilege},
      {"mnode-acct", mndInitAcct, mndCleanupAcct},
      {"mnode-stream", mndInitStream, mndCleanupStream},
      {"mnode-topic", mndInitTopic, mndCleanupTopic},
      {"mnode-consumer", mndInitConsumer, mndCleanupConsumer},
      {"mnode-subscribe", mndInitSubscribe, mndCleanupSubscribe},
      {"mnode-offset", mndInitOffset, mndCleanupOffset},
      {"mnode-vgroup", mndInitVgroup, mndCleanupVgroup},
      {"mnode-stb", mndInitStb, mndCleanupStb},
      {"mnode-sma", mndInitSma, mndCleanupSma},
      {"mnode-infos", mndInitInfos, mndCleanupInfos},
      {"mnode-perfs", mndInitPerfs, mndCleanupPerfs},
      {"mnode-db", mndInitDb, mndCleanupDb},
      {"mnode-func", mndInitFunc, mndCleanupFunc},
      // Second "mnode-sdb" entry: runs mndOpenSdb() and has no cleanup.
      {"mnode-sdb", mndOpenSdb, NULL},
      {"mnode-profile", mndInitProfile, mndCleanupProfile},
      {"mnode-show", mndInitShow, mndCleanupShow},
      {"mnode-query", mndInitQuery, mndCleanupQuery},
      {"mnode-sync", mndInitSync, mndCleanupSync},
      {"mnode-telem", mndInitTelem, mndCleanupTelem},
  };

  const int32_t numSteps = (int32_t)(sizeof(stepTable) / sizeof(stepTable[0]));
  for (int32_t i = 0; i < numSteps; ++i) {
    if (mndAllocStep(pMnode, stepTable[i].name, stepTable[i].initFp, stepTable[i].cleanupFp) != 0) {
      return -1;
    }
  }

  return 0;
}

296
/*
 * Run the cleanup functions of the registered steps in reverse order,
 * starting at index pos and going down to 0, then destroy the step array and
 * set pMnode->pSteps to NULL.
 *
 * pos == -1 means "start from the last registered step". Does nothing when
 * pMnode->pSteps is already NULL.
 */
static void mndCleanupSteps(SMnode *pMnode, int32_t pos) {
  if (pMnode->pSteps == NULL) return;

  int32_t idx = pos;
  if (idx == -1) {
    idx = taosArrayGetSize(pMnode->pSteps) - 1;
  }

  while (idx >= 0) {
    SMnodeStep *pStep = taosArrayGet(pMnode->pSteps, idx);
    mInfo("%s will cleanup", pStep->name);
    if (pStep->cleanupFp != NULL) {
      pStep->cleanupFp(pMnode);
    }
    idx--;
  }

  taosArrayClear(pMnode->pSteps);
  taosArrayDestroy(pMnode->pSteps);
  pMnode->pSteps = NULL;
}
S
Shengliang Guan 已提交
315

316
/*
 * Run the init function of every registered step in registration order.
 *
 * On the first failing step, cleanup is run from that step's index down to 0
 * via mndCleanupSteps(), terrno is restored to the failing step's value, and
 * -1 is returned. When every step succeeds, pMnode->clusterId is filled in
 * and 0 is returned.
 */
static int32_t mndExecSteps(SMnode *pMnode) {
  const int32_t numSteps = taosArrayGetSize(pMnode->pSteps);

  for (int32_t i = 0; i < numSteps; i++) {
    SMnodeStep *pStep = taosArrayGet(pMnode->pSteps, i);
    if (pStep->initFp == NULL) continue;

    if (pStep->initFp(pMnode) == 0) {
      mInfo("%s is initialized", pStep->name);
      tmsgReportStartup(pStep->name, "initialized");
      continue;
    }

    // Save terrno: the cleanup below may overwrite it.
    int32_t savedErr = terrno;
    mError("%s exec failed since %s, start to cleanup", pStep->name, terrstr());
    mndCleanupSteps(pMnode, i);
    terrno = savedErr;
    return -1;
  }

  pMnode->clusterId = mndGetClusterId(pMnode);
  return 0;
}
S
Shengliang Guan 已提交
337

S
shm  
Shengliang Guan 已提交
338
/*
 * Copy the caller-supplied options into the mnode: the message callbacks, the
 * id of the dnode hosting this mnode, and the sync replica/standby settings.
 */
static void mndSetOptions(SMnode *pMnode, const SMnodeOpt *pOption) {
  // Sync management settings.
  pMnode->syncMgmt.standby = pOption->standby;
  pMnode->syncMgmt.replica = pOption->replica;

  // Identity and messaging.
  pMnode->selfDnodeId = pOption->dnodeId;
  pMnode->msgCb = pOption->msgCb;
}
344

345
SMnode *mndOpen(const char *path, const SMnodeOpt *pOption) {
346
  mInfo("start to open mnode in %s", path);
S
Shengliang Guan 已提交
347

wafwerar's avatar
wafwerar 已提交
348
  SMnode *pMnode = taosMemoryCalloc(1, sizeof(SMnode));
S
Shengliang Guan 已提交
349 350 351 352 353 354
  if (pMnode == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to open mnode since %s", terrstr());
    return NULL;
  }

S
Shengliang Guan 已提交
355 356
  char timestr[24] = "1970-01-01 00:00:00.00";
  (void)taosParseTime(timestr, &pMnode->checkTime, (int32_t)strlen(timestr), TSDB_TIME_PRECISION_MILLI, 0);
S
shm  
Shengliang Guan 已提交
357
  mndSetOptions(pMnode, pOption);
S
Shengliang Guan 已提交
358

359
  pMnode->deploy = pOption->deploy;
S
Shengliang Guan 已提交
360 361
  pMnode->pSteps = taosArrayInit(24, sizeof(SMnodeStep));
  if (pMnode->pSteps == NULL) {
wafwerar's avatar
wafwerar 已提交
362
    taosMemoryFree(pMnode);
S
Shengliang Guan 已提交
363 364 365 366
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to open mnode since %s", terrstr());
    return NULL;
  }
367

S
Shengliang Guan 已提交
368
  int32_t code = mndCreateDir(pMnode, path);
369
  if (code != 0) {
S
Shengliang Guan 已提交
370 371
    code = terrno;
    mError("failed to open mnode since %s", terrstr());
372 373 374 375 376
    mndClose(pMnode);
    terrno = code;
    return NULL;
  }

377
  code = mndInitSteps(pMnode);
378
  if (code != 0) {
S
Shengliang Guan 已提交
379 380
    code = terrno;
    mError("failed to open mnode since %s", terrstr());
381 382 383 384 385 386 387
    mndClose(pMnode);
    terrno = code;
    return NULL;
  }

  code = mndExecSteps(pMnode);
  if (code != 0) {
S
Shengliang Guan 已提交
388 389
    code = terrno;
    mError("failed to open mnode since %s", terrstr());
390 391 392 393
    mndClose(pMnode);
    terrno = code;
    return NULL;
  }
S
Shengliang Guan 已提交
394

395
  mInfo("mnode open successfully ");
S
Shengliang Guan 已提交
396 397
  return pMnode;
}
S
Shengliang Guan 已提交
398

399 400
/*
 * Prepare the mnode for shutdown: reset the leaderTransferFinish flag and
 * request a sync leader transfer. A NULL pMnode is ignored.
 *
 * Waiting for the transfer to complete is currently compiled out (#if 0).
 */
void mndPreClose(SMnode *pMnode) {
  if (pMnode == NULL) return;

  atomic_store_8(&(pMnode->syncMgmt.leaderTransferFinish), 0);
  syncLeaderTransfer(pMnode->syncMgmt.sync);

#if 0
    mInfo("vgId:1, mnode start leader transfer");
    // wait for leader transfer finish
    while (!atomic_load_8(&(pMnode->syncMgmt.leaderTransferFinish))) {
      taosMsleep(10);
      mInfo("vgId:1, mnode waiting for leader transfer");
    }
    mInfo("vgId:1, mnode finish leader transfer");
#endif
}

416
/*
 * Close an mnode: run every remaining step cleanup in reverse order, then
 * free the stored path and the SMnode itself. A NULL pMnode is ignored.
 */
void mndClose(SMnode *pMnode) {
  if (pMnode == NULL) return;

  mInfo("start to close mnode");
  mndCleanupSteps(pMnode, -1);  // -1: start from the last registered step
  taosMemoryFreeClear(pMnode->path);
  taosMemoryFreeClear(pMnode);
  mInfo("mnode is closed");
}
S
Shengliang Guan 已提交
425

426
/*
 * Start an opened mnode: start sync, deploy sdb when this is a fresh
 * deployment (and mark the mnode as restored), reset grants, and finally
 * start the timer thread.
 *
 * Returns -1 when sdb deployment fails; otherwise returns the result of
 * mndInitTimer().
 */
int32_t mndStart(SMnode *pMnode) {
  mndSyncStart(pMnode);

  if (pMnode->deploy) {
    const int32_t deployCode = sdbDeploy(pMnode->pSdb);
    if (deployCode != 0) {
      mError("failed to deploy sdb while start mnode");
      return -1;
    }
    mndSetRestore(pMnode, true);
  }

  grantReset(pMnode, TSDB_GRANT_ALL, 0);

  return mndInitTimer(pMnode);
}

441
/*
 * Stop a running mnode. The stop flag is raised first so that the timer
 * thread's mndGetStop() check can observe it; sync is stopped next, and the
 * timer thread is joined last.
 */
void mndStop(SMnode *pMnode) {
  mndSetStop(pMnode);
  mndSyncStop(pMnode);
  mndCleanupTimer(pMnode);  // joins the timer thread
}

447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485
/*
 * Handle a sync control message (heartbeat or heartbeat reply) for the mnode.
 *
 * Returns -1 with terrno = TSDB_CODE_SYN_INTERNAL_ERROR when the sync
 * environment is not started or the sync node cannot be acquired. Otherwise
 * returns the handler's result, setting terrno to
 * TSDB_CODE_SYN_INTERNAL_ERROR when that result is non-zero. Message types
 * other than the two handled here fall through and return 0.
 */
int32_t mndProcessSyncCtrlMsg(SRpcMsg *pMsg) {
  SMnode    *pMnode = pMsg->info.node;
  SSyncMgmt *pMgmt = &pMnode->syncMgmt;

  mInfo("vgId:%d, process sync ctrl msg", 1);

  if (!syncEnvIsStart()) {
    mError("failed to process sync msg:%p type:%s since syncEnv stop", pMsg, TMSG_INFO(pMsg->msgType));
    terrno = TSDB_CODE_SYN_INTERNAL_ERROR;
    return -1;
  }

  SSyncNode *pNode = syncNodeAcquire(pMgmt->sync);
  if (pNode == NULL) {
    mError("failed to process sync msg:%p type:%s since syncNode is null", pMsg, TMSG_INFO(pMsg->msgType));
    terrno = TSDB_CODE_SYN_INTERNAL_ERROR;
    return -1;
  }

  int32_t result = 0;
  if (pMsg->msgType == TDMT_SYNC_HEARTBEAT) {
    SyncHeartbeat *pHeartbeat = syncHeartbeatFromRpcMsg2(pMsg);
    result = syncNodeOnHeartbeat(pNode, pHeartbeat);
    syncHeartbeatDestroy(pHeartbeat);
  } else if (pMsg->msgType == TDMT_SYNC_HEARTBEAT_REPLY) {
    SyncHeartbeatReply *pReply = syncHeartbeatReplyFromRpcMsg2(pMsg);
    result = syncNodeOnHeartbeatReply(pNode, pReply);
    syncHeartbeatReplyDestroy(pReply);
  }

  syncNodeRelease(pNode);

  if (result != 0) {
    terrno = TSDB_CODE_SYN_INTERNAL_ERROR;
  }
  return result;
}

M
Minghao Li 已提交
486
/*
 * Dispatch a sync message addressed to the mnode to the matching sync-node
 * handler.
 *
 * Returns -1 with terrno = TSDB_CODE_SYN_INTERNAL_ERROR when the sync
 * environment is not started or the sync node cannot be acquired. Otherwise
 * the handler's result is returned (-1 for an unrecognised message type), and
 * terrno is set to TSDB_CODE_SYN_INTERNAL_ERROR when that result is non-zero.
 *
 * For every decoded message type the typed message is built from the RPC
 * message, passed to its handler, and destroyed again before returning.
 * TDMT_SYNC_SET_MNODE_STANDBY is answered directly with an RPC response that
 * carries the result of syncSetStandby().
 */
int32_t mndProcessSyncMsg(SRpcMsg *pMsg) {
  SMnode    *pMnode = pMsg->info.node;
  SSyncMgmt *pMgmt = &pMnode->syncMgmt;
  int32_t    code = 0;

  if (!syncEnvIsStart()) {
    mError("failed to process sync msg:%p type:%s since syncEnv stop", pMsg, TMSG_INFO(pMsg->msgType));
    terrno = TSDB_CODE_SYN_INTERNAL_ERROR;
    return -1;
  }

  SSyncNode *pSyncNode = syncNodeAcquire(pMgmt->sync);
  if (pSyncNode == NULL) {
    mError("failed to process sync msg:%p type:%s since syncNode is null", pMsg, TMSG_INFO(pMsg->msgType));
    terrno = TSDB_CODE_SYN_INTERNAL_ERROR;
    return -1;
  }

  if (pMsg->msgType == TDMT_SYNC_TIMEOUT) {
    SyncTimeout *pSyncMsg = syncTimeoutFromRpcMsg2(pMsg);
    code = syncNodeOnTimeoutCb(pSyncNode, pSyncMsg);
    syncTimeoutDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_PING) {
    SyncPing *pSyncMsg = syncPingFromRpcMsg2(pMsg);
    code = syncNodeOnPingCb(pSyncNode, pSyncMsg);
    syncPingDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_PING_REPLY) {
    SyncPingReply *pSyncMsg = syncPingReplyFromRpcMsg2(pMsg);
    code = syncNodeOnPingReplyCb(pSyncNode, pSyncMsg);
    syncPingReplyDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_CLIENT_REQUEST) {
    SyncClientRequest *pSyncMsg = syncClientRequestFromRpcMsg2(pMsg);
    code = syncNodeOnClientRequest(pSyncNode, pSyncMsg, NULL);
    syncClientRequestDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_REQUEST_VOTE) {
    SyncRequestVote *pSyncMsg = syncRequestVoteFromRpcMsg2(pMsg);
    code = syncNodeOnRequestVote(pSyncNode, pSyncMsg);
    syncRequestVoteDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_REQUEST_VOTE_REPLY) {
    SyncRequestVoteReply *pSyncMsg = syncRequestVoteReplyFromRpcMsg2(pMsg);
    code = syncNodeOnRequestVoteReply(pSyncNode, pSyncMsg);
    syncRequestVoteReplyDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_APPEND_ENTRIES) {
    SyncAppendEntries *pSyncMsg = syncAppendEntriesFromRpcMsg2(pMsg);
    code = syncNodeOnAppendEntries(pSyncNode, pSyncMsg);
    syncAppendEntriesDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_APPEND_ENTRIES_REPLY) {
    SyncAppendEntriesReply *pSyncMsg = syncAppendEntriesReplyFromRpcMsg2(pMsg);
    code = syncNodeOnAppendEntriesReply(pSyncNode, pSyncMsg);
    syncAppendEntriesReplyDestroy(pSyncMsg);

  } else if (pMsg->msgType == TDMT_SYNC_SET_MNODE_STANDBY) {
    // Answered here: the response carries the result of syncSetStandby().
    code = syncSetStandby(pMgmt->sync);
    SRpcMsg rsp = {.code = code, .info = pMsg->info};
    tmsgSendRsp(&rsp);

  } else {
    mError("failed to process msg:%p since invalid type:%s", pMsg, TMSG_INFO(pMsg->msgType));
    code = -1;
  }

  syncNodeRelease(pSyncNode);

  if (code != 0) {
    terrno = TSDB_CODE_SYN_INTERNAL_ERROR;
  }
  return code;
}

S
Shengliang Guan 已提交
657
/*
 * Decide whether this mnode may process pMsg.
 *
 * Returns 0 (proceed) when:
 *   - the message is not a request, or
 *   - it is one of the scheduler query/fetch/drop-task messages, or
 *   - mndAcquireRpcRef() succeeds.
 *
 * Otherwise returns -1. For the listed internal timer messages nothing else
 * is done. For every other message the failure is logged and, when the mnode
 * ep set is non-empty, a serialized ep set is attached to pMsg->info as the
 * response and terrno is set to TSDB_CODE_RPC_REDIRECT (or
 * TSDB_CODE_OUT_OF_MEMORY when the response buffer cannot be allocated).
 * With an empty ep set terrno is TSDB_CODE_APP_NOT_READY.
 */
static int32_t mndCheckMnodeState(SRpcMsg *pMsg) {
  if (!IsReq(pMsg)) return 0;

  const bool isSchedulerMsg =
      pMsg->msgType == TDMT_SCH_QUERY || pMsg->msgType == TDMT_SCH_MERGE_QUERY ||
      pMsg->msgType == TDMT_SCH_QUERY_CONTINUE || pMsg->msgType == TDMT_SCH_QUERY_HEARTBEAT ||
      pMsg->msgType == TDMT_SCH_FETCH || pMsg->msgType == TDMT_SCH_MERGE_FETCH || pMsg->msgType == TDMT_SCH_DROP_TASK;
  if (isSchedulerMsg) return 0;

  if (mndAcquireRpcRef(pMsg->info.node) == 0) return 0;

  // Internal timer messages are dropped without logging or redirecting.
  const bool isTimerMsg = pMsg->msgType == TDMT_MND_MQ_TIMER || pMsg->msgType == TDMT_MND_TELEM_TIMER ||
                          pMsg->msgType == TDMT_MND_TRANS_TIMER || pMsg->msgType == TDMT_MND_TTL_TIMER ||
                          pMsg->msgType == TDMT_MND_UPTIME_TIMER;
  if (isTimerMsg) return -1;

  SEpSet epSet = {0};
  mndGetMnodeEpSet(pMsg->info.node, &epSet);

  const STraceId *trace = &pMsg->info.traceId;
  mError("msg:%p, failed to check mnode state since %s, type:%s, numOfMnodes:%d inUse:%d", pMsg, terrstr(),
         TMSG_INFO(pMsg->msgType), epSet.numOfEps, epSet.inUse);

  if (epSet.numOfEps <= 0) {
    terrno = TSDB_CODE_APP_NOT_READY;
    return -1;
  }

  for (int32_t i = 0; i < epSet.numOfEps; ++i) {
    mInfo("mnode index:%d, ep:%s:%u", i, epSet.eps[i].fqdn, epSet.eps[i].port);
  }

  // Attach the serialized ep set as the response body.
  int32_t rspLen = tSerializeSEpSet(NULL, 0, &epSet);
  pMsg->info.rsp = rpcMallocCont(rspLen);
  pMsg->info.hasEpSet = 1;
  if (pMsg->info.rsp == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
  } else {
    tSerializeSEpSet(pMsg->info.rsp, rspLen, &epSet);
    pMsg->info.rspLen = rspLen;
    terrno = TSDB_CODE_RPC_REDIRECT;
  }

  return -1;
}

S
Shengliang Guan 已提交
700
/*
 * Verify that a request carries a body.
 *
 * Returns 0 when pMsg is not a request, or when it has both a non-NULL pCont
 * and a non-zero contLen. Otherwise logs the problem, sets terrno to
 * TSDB_CODE_INVALID_MSG_LEN and returns -1.
 */
static int32_t mndCheckMsgContent(SRpcMsg *pMsg) {
  if (!IsReq(pMsg) || (pMsg->contLen != 0 && pMsg->pCont != NULL)) {
    return 0;
  }

  const STraceId *trace = &pMsg->info.traceId;
  mGError("msg:%p, failed to check msg, cont:%p contLen:%d, app:%p type:%s", pMsg, pMsg->pCont, pMsg->contLen,
          pMsg->info.ahandle, TMSG_INFO(pMsg->msgType));
  terrno = TSDB_CODE_INVALID_MSG_LEN;
  return -1;
}

S
Shengliang Guan 已提交
711
/*
 * Entry point for RPC messages addressed to the mnode.
 *
 * Looks up the handler registered for the message type, validates the message
 * body and the mnode state, runs the handler, releases the RPC reference, and
 * logs the outcome.
 *
 * Returns the handler's result. Returns -1 with terrno =
 * TSDB_CODE_MSG_NOT_PROCESSED when no handler is registered or the message
 * type index is outside the handler table, and -1 when either pre-check
 * fails (terrno set by the check).
 */
int32_t mndProcessRpcMsg(SRpcMsg *pMsg) {
  SMnode         *pMnode = pMsg->info.node;
  const STraceId *trace = &pMsg->info.traceId;

  // Bounds-check the index the same way mndSetMsgHandle() does, so that an
  // unexpected message type cannot read past the end of msgFp[].
  tmsg_t   type = TMSG_INDEX(pMsg->msgType);
  MndMsgFp fp = (type < TDMT_MAX) ? pMnode->msgFp[type] : NULL;
  if (fp == NULL) {
    mGError("msg:%p, failed to get msg handle, app:%p type:%s", pMsg, pMsg->info.ahandle, TMSG_INFO(pMsg->msgType));
    terrno = TSDB_CODE_MSG_NOT_PROCESSED;
    return -1;
  }

  if (mndCheckMsgContent(pMsg) != 0) return -1;
  if (mndCheckMnodeState(pMsg) != 0) return -1;

  mGTrace("msg:%p, start to process in mnode, app:%p type:%s", pMsg, pMsg->info.ahandle, TMSG_INFO(pMsg->msgType));
  int32_t code = (*fp)(pMsg);
  mndReleaseRpcRef(pMnode);

  if (code == TSDB_CODE_ACTION_IN_PROGRESS) {
    mGTrace("msg:%p, won't response immediately since in progress", pMsg);
  } else if (code == 0) {
    mGTrace("msg:%p, successfully processed", pMsg);
  } else {
    mGError("msg:%p, failed to process since %s, app:%p type:%s", pMsg, terrstr(), pMsg->info.ahandle,
            TMSG_INFO(pMsg->msgType));
  }

  return code;
}

741 742
// Register `fp` as the handler for `msgType`.
// Message types whose table index is not below TDMT_MAX are silently ignored.
void mndSetMsgHandle(SMnode *pMnode, tmsg_t msgType, MndMsgFp fp) {
  const tmsg_t slot = TMSG_INDEX(msgType);
  if (slot >= TDMT_MAX) return;

  pMnode->msgFp[slot] = fp;
}

D
dapan1121 已提交
748
// Note: uid 0 is reserved
//
// Generate a strictly positive 64-bit uid for `name` (`len` bytes).
//
// Bit layout of the composed value before the sign is folded away:
//   bits 24..63  low 40 bits of the current microsecond timestamp
//   bits  8..23  low 16 bits of MurmurHash3_32(name, len)
//   bits  0..7   low 8 bits of taosRand()
// The absolute value of that pattern (read as a two's-complement int64_t) is
// returned. The function loops with a fresh timestamp/random value until the
// result is usable, so it never returns 0 or a negative number.
int64_t mndGenerateUid(const char *name, int32_t len) {
  int32_t hashval = MurmurHash3_32(name, len);

  for (;;) {
    int64_t us = taosGetTimestampUs();

    // Compose in unsigned arithmetic: shifting a 40-bit signed value left by
    // 24 reaches the sign bit of int64_t, which is undefined behaviour.
    uint64_t bits = ((uint64_t)us & 0x000000FFFFFFFFFFULL) << 24;
    bits += ((uint64_t)hashval & 0xFFFFULL) << 8;
    bits += (uint64_t)taosRand() & 0xFFULL;

    // Magnitude of `bits` interpreted as a two's-complement int64_t.
    uint64_t magnitude = (bits >> 63) ? (0 - bits) : bits;

    // 0 is reserved; 2^63 (the INT64_MIN pattern) has no positive counterpart,
    // and llabs() on it would be undefined. Retry in both cases.
    if (magnitude == 0 || magnitude > (uint64_t)INT64_MAX) continue;

    return (int64_t)magnitude;
  }
}
S
Shengliang Guan 已提交
760 761

int32_t mndGetMonitorInfo(SMnode *pMnode, SMonClusterInfo *pClusterInfo, SMonVgroupInfo *pVgroupInfo,
S
Shengliang Guan 已提交
762
                          SMonStbInfo *pStbInfo, SMonGrantInfo *pGrantInfo) {
S
Shengliang Guan 已提交
763
  if (mndAcquireRpcRef(pMnode) != 0) return -1;
S
Shengliang Guan 已提交
764

M
Minghao Li 已提交
765
  SSdb   *pSdb = pMnode->pSdb;
S
Shengliang Guan 已提交
766 767 768 769 770
  int64_t ms = taosGetTimestampMs();

  pClusterInfo->dnodes = taosArrayInit(sdbGetSize(pSdb, SDB_DNODE), sizeof(SMonDnodeDesc));
  pClusterInfo->mnodes = taosArrayInit(sdbGetSize(pSdb, SDB_MNODE), sizeof(SMonMnodeDesc));
  pVgroupInfo->vgroups = taosArrayInit(sdbGetSize(pSdb, SDB_VGROUP), sizeof(SMonVgroupDesc));
S
Shengliang Guan 已提交
771 772 773
  pStbInfo->stbs = taosArrayInit(sdbGetSize(pSdb, SDB_STB), sizeof(SMonStbDesc));
  if (pClusterInfo->dnodes == NULL || pClusterInfo->mnodes == NULL || pVgroupInfo->vgroups == NULL ||
      pStbInfo->stbs == NULL) {
S
Shengliang Guan 已提交
774
    mndReleaseRpcRef(pMnode);
S
Shengliang Guan 已提交
775 776 777 778
    return -1;
  }

  // cluster info
wmmhello's avatar
wmmhello 已提交
779
  tstrncpy(pClusterInfo->version, version, sizeof(pClusterInfo->version));
S
Shengliang Guan 已提交
780 781
  pClusterInfo->monitor_interval = tsMonitorInterval;
  pClusterInfo->connections_total = mndGetNumOfConnections(pMnode);
782 783
  pClusterInfo->dbs_total = sdbGetSize(pSdb, SDB_DB);
  pClusterInfo->stbs_total = sdbGetSize(pSdb, SDB_STB);
S
Shengliang Guan 已提交
784 785 786 787 788 789 790 791 792 793

  void *pIter = NULL;
  while (1) {
    SDnodeObj *pObj = NULL;
    pIter = sdbFetch(pSdb, SDB_DNODE, pIter, (void **)&pObj);
    if (pIter == NULL) break;

    SMonDnodeDesc desc = {0};
    desc.dnode_id = pObj->id;
    tstrncpy(desc.dnode_ep, pObj->ep, sizeof(desc.dnode_ep));
S
Shengliang Guan 已提交
794
    if (mndIsDnodeOnline(pObj, ms)) {
S
Shengliang Guan 已提交
795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812
      tstrncpy(desc.status, "ready", sizeof(desc.status));
    } else {
      tstrncpy(desc.status, "offline", sizeof(desc.status));
    }
    taosArrayPush(pClusterInfo->dnodes, &desc);
    sdbRelease(pSdb, pObj);
  }

  pIter = NULL;
  while (1) {
    SMnodeObj *pObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pObj);
    if (pIter == NULL) break;

    SMonMnodeDesc desc = {0};
    desc.mnode_id = pObj->id;
    tstrncpy(desc.mnode_ep, pObj->pDnode->ep, sizeof(desc.mnode_ep));

813
    if (pObj->id == pMnode->selfDnodeId) {
S
Shengliang Guan 已提交
814 815
      pClusterInfo->first_ep_dnode_id = pObj->id;
      tstrncpy(pClusterInfo->first_ep, pObj->pDnode->ep, sizeof(pClusterInfo->first_ep));
816 817
      pClusterInfo->master_uptime = mndGetClusterUpTime(pMnode);
      // pClusterInfo->master_uptime = (ms - pObj->stateStartTime) / (86400000.0f);
818 819 820
      tstrncpy(desc.role, syncStr(TAOS_SYNC_STATE_LEADER), sizeof(desc.role));
    } else {
      tstrncpy(desc.role, syncStr(pObj->state), sizeof(desc.role));
S
Shengliang Guan 已提交
821
    }
822 823
    taosArrayPush(pClusterInfo->mnodes, &desc);
    sdbRelease(pSdb, pObj);
S
Shengliang Guan 已提交
824 825 826 827 828 829 830 831 832 833
  }

  // vgroup info
  pIter = NULL;
  while (1) {
    SVgObj *pVgroup = NULL;
    pIter = sdbFetch(pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
    if (pIter == NULL) break;

    pClusterInfo->vgroups_total++;
834
    pClusterInfo->tbs_total += pVgroup->numOfTables;
S
Shengliang Guan 已提交
835 836 837

    SMonVgroupDesc desc = {0};
    desc.vgroup_id = pVgroup->vgId;
838 839 840 841 842

    SName name = {0};
    tNameFromString(&name, pVgroup->dbName, T_NAME_ACCT | T_NAME_DB | T_NAME_TABLE);
    tNameGetDbName(&name, desc.database_name);

S
Shengliang Guan 已提交
843 844 845 846
    desc.tables_num = pVgroup->numOfTables;
    pGrantInfo->timeseries_used += pVgroup->numOfTimeSeries;
    tstrncpy(desc.status, "unsynced", sizeof(desc.status));
    for (int32_t i = 0; i < pVgroup->replica; ++i) {
M
Minghao Li 已提交
847
      SVnodeGid     *pVgid = &pVgroup->vnodeGid[i];
S
Shengliang Guan 已提交
848 849
      SMonVnodeDesc *pVnDesc = &desc.vnodes[i];
      pVnDesc->dnode_id = pVgid->dnodeId;
S
Shengliang Guan 已提交
850
      tstrncpy(pVnDesc->vnode_role, syncStr(pVgid->role), sizeof(pVnDesc->vnode_role));
S
Shengliang Guan 已提交
851 852 853 854
      if (pVgid->role == TAOS_SYNC_STATE_LEADER) {
        tstrncpy(desc.status, "ready", sizeof(desc.status));
        pClusterInfo->vgroups_alive++;
      }
S
Shengliang Guan 已提交
855
      if (pVgid->role != TAOS_SYNC_STATE_ERROR) {
S
Shengliang Guan 已提交
856 857 858 859 860 861 862 863 864
        pClusterInfo->vnodes_alive++;
      }
      pClusterInfo->vnodes_total++;
    }

    taosArrayPush(pVgroupInfo->vgroups, &desc);
    sdbRelease(pSdb, pVgroup);
  }

S
Shengliang Guan 已提交
865 866 867 868 869 870 871
  // stb info
  pIter = NULL;
  while (1) {
    SStbObj *pStb = NULL;
    pIter = sdbFetch(pSdb, SDB_STB, pIter, (void **)&pStb);
    if (pIter == NULL) break;

S
Shengliang Guan 已提交
872
    SMonStbDesc desc = {0};
S
Shengliang Guan 已提交
873 874 875 876 877 878 879 880 881 882 883 884 885

    SName name1 = {0};
    tNameFromString(&name1, pStb->db, T_NAME_ACCT | T_NAME_DB | T_NAME_TABLE);
    tNameGetDbName(&name1, desc.database_name);

    SName name2 = {0};
    tNameFromString(&name2, pStb->name, T_NAME_ACCT | T_NAME_DB | T_NAME_TABLE);
    tstrncpy(desc.stb_name, tNameGetTableName(&name2), TSDB_TABLE_NAME_LEN);

    taosArrayPush(pStbInfo->stbs, &desc);
    sdbRelease(pSdb, pStb);
  }

S
Shengliang Guan 已提交
886 887 888 889 890 891 892 893
  // grant info
  pGrantInfo->expire_time = (pMnode->grant.expireTimeMS - ms) / 86400000.0f;
  pGrantInfo->timeseries_total = pMnode->grant.timeseriesAllowed;
  if (pMnode->grant.expireTimeMS == 0) {
    pGrantInfo->expire_time = INT32_MAX;
    pGrantInfo->timeseries_total = INT32_MAX;
  }

S
Shengliang Guan 已提交
894
  mndReleaseRpcRef(pMnode);
S
Shengliang Guan 已提交
895
  return 0;
L
Liu Jicong 已提交
896
}
S
Shengliang Guan 已提交
897 898

// Report this mnode's load: stores the role returned by syncGetMyRole() in
// pLoad->syncState and traces it. Always returns 0.
int32_t mndGetLoad(SMnode *pMnode, SMnodeLoad *pLoad) {
  pLoad->syncState = syncGetMyRole(pMnode->syncMgmt.sync);

  mTrace("mnode current syncstate is %s", syncStr(pLoad->syncState));

  return 0;
}
S
Shengliang Guan 已提交
903 904 905 906 907

// Take one rpc reference on the mnode.
//
// Under the read lock: fails with -1 (terrno = TSDB_CODE_APP_NOT_READY) when
// the mnode is stopped, fails with -1 when mndIsMaster() is false, otherwise
// atomically increments pMnode->rpcRef and returns 0.
// NOTE(review): terrno is not assigned on the not-master path here; presumably
// mndIsMaster sets it - confirm.
int32_t mndAcquireRpcRef(SMnode *pMnode) {
  int32_t code = 0;
  taosThreadRwlockRdlock(&pMnode->lock);
  if (pMnode->stopped) {
    mTrace("mnode not running");
    terrno = TSDB_CODE_APP_NOT_READY;
    code = -1;
  } else if (!mndIsMaster(pMnode)) {
    mTrace("mnode not ready, role:%s restored:%d", syncGetMyRoleStr(pMnode->syncMgmt.sync), pMnode->restored);
    code = -1;
  } else {
    // The new count is not needed; only the increment matters.
    (void)atomic_add_fetch_32(&pMnode->rpcRef, 1);
  }
  taosThreadRwlockUnlock(&pMnode->lock);
  return code;
}

// Drop one rpc reference: atomically decrements pMnode->rpcRef while holding
// the read lock.
void mndReleaseRpcRef(SMnode *pMnode) {
  taosThreadRwlockRdlock(&pMnode->lock);
  // The new count is not needed; only the decrement matters.
  (void)atomic_sub_fetch_32(&pMnode->rpcRef, 1);
  taosThreadRwlockUnlock(&pMnode->lock);
}

// Set the mnode's restored flag under the write lock.
//
// When the flag is cleared, the call additionally blocks, polling every 3 ms,
// until pMnode->rpcRef is no longer positive.
void mndSetRestore(SMnode *pMnode, bool restored) {
  taosThreadRwlockWrlock(&pMnode->lock);
  pMnode->restored = restored;
  taosThreadRwlockUnlock(&pMnode->lock);
  mTrace("mnode set restored:%d", restored);

  if (restored) return;

  // NOTE(review): rpcRef is read here without the lock or an atomic load.
  while (pMnode->rpcRef > 0) {
    taosMsleep(3);
  }
}

// Return the mnode's restored flag (read without taking pMnode->lock).
bool mndGetRestored(SMnode *pMnode) {
  return pMnode->restored;
}

// Mark the mnode as stopped. The flag is set under the write lock and the
// change is traced afterwards.
void mndSetStop(SMnode *pMnode) {
  taosThreadRwlockWrlock(&pMnode->lock);
  pMnode->stopped = true;
  taosThreadRwlockUnlock(&pMnode->lock);

  mTrace("mnode set stopped");
}

// Return the mnode's stopped flag (read without taking pMnode->lock).
bool mndGetStop(SMnode *pMnode) {
  return pMnode->stopped;
}