mnode.c 12.7 KB
Newer Older
S
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33
#include "mndAcct.h"
#include "mndAuth.h"
#include "mndBalance.h"
#include "mndCluster.h"
#include "mndDb.h"
#include "mndDnode.h"
#include "mndFunc.h"
#include "mndMnode.h"
#include "mndOper.h"
#include "mndProfile.h"
#include "mndShow.h"
#include "mndStable.h"
#include "mndSync.h"
#include "mndTelem.h"
#include "mndTrans.h"
#include "mndUser.h"
#include "mndVgroup.h"
S
Shengliang Guan 已提交
34

35 36 37 38
/*
 * Returns the dnode id stored in the mnode object.
 * Yields -1 when pMnode is NULL.
 */
int32_t mndGetDnodeId(SMnode *pMnode) {
  if (pMnode == NULL) {
    return -1;
  }

  return pMnode->dnodeId;
}
S
Shengliang Guan 已提交
42

43 44 45 46
/*
 * Returns the cluster id stored in the mnode object.
 * Yields -1 when pMnode is NULL.
 */
int64_t mndGetClusterId(SMnode *pMnode) {
  if (pMnode == NULL) {
    return -1;
  }

  return pMnode->clusterId;
}
S
Shengliang Guan 已提交
50

51 52 53 54
/*
 * Returns the timer handle held by the mnode object.
 * Yields NULL when pMnode is NULL.
 */
tmr_h mndGetTimer(SMnode *pMnode) {
  if (pMnode == NULL) {
    return NULL;
  }

  return pMnode->timer;
}

59 60 61 62
/*
 * Forwards pMsg to the endpoint set pEpSet through the sendMsgToDnodeFp
 * callback, passing pMnode->pDnode as the first argument.
 * Does nothing when pMnode or the callback is NULL.
 */
void mndSendMsgToDnode(SMnode *pMnode, SEpSet *pEpSet, SRpcMsg *pMsg) {
  if (pMnode == NULL || pMnode->sendMsgToDnodeFp == NULL) {
    return;
  }

  pMnode->sendMsgToDnodeFp(pMnode->pDnode, pEpSet, pMsg);
}
S
Shengliang Guan 已提交
64

65 66 67 68
/*
 * Forwards pMsg through the sendMsgToMnodeFp callback, passing
 * pMnode->pDnode as the first argument.
 * Does nothing when pMnode or the callback is NULL.
 */
void mndSendMsgToMnode(SMnode *pMnode, SRpcMsg *pMsg) {
  if (pMnode == NULL || pMnode->sendMsgToMnodeFp == NULL) {
    return;
  }

  pMnode->sendMsgToMnodeFp(pMnode->pDnode, pMsg);
}
S
Shengliang Guan 已提交
70

71 72 73 74
/*
 * Hands pMsg to the sendRedirectMsgFp callback, passing pMnode->pDnode as
 * the first argument.
 * Does nothing when pMnode or the callback is NULL.
 */
void mndSendRedirectMsg(SMnode *pMnode, SRpcMsg *pMsg) {
  if (pMnode == NULL || pMnode->sendRedirectMsgFp == NULL) {
    return;
  }

  pMnode->sendRedirectMsgFp(pMnode->pDnode, pMsg);
}
S
Shengliang Guan 已提交
76

77 78 79
/*
 * Init step: makes sure pMnode->timer is set, creating it with taosTmrInit()
 * when it is still NULL.
 *
 * Returns 0 on success; on failure sets terrno to TSDB_CODE_OUT_OF_MEMORY and
 * returns -1.
 */
static int32_t mndInitTimer(SMnode *pMnode) {
  if (pMnode->timer != NULL) {
    return 0;  // already initialized
  }

  pMnode->timer = taosTmrInit(5000, 200, 3600000, "MND");
  if (pMnode->timer != NULL) {
    return 0;
  }

  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return -1;
}

90 91 92 93
/*
 * Cleanup step: releases pMnode->timer via taosTmrCleanUp() and resets the
 * field to NULL. Safe to call when no timer is set.
 */
static void mndCleanupTimer(SMnode *pMnode) {
  if (pMnode->timer == NULL) {
    return;
  }

  taosTmrCleanUp(pMnode->timer);
  pMnode->timer = NULL;
}

97 98 99 100
/*
 * Stores a private copy of `path` in pMnode->path and creates that directory
 * with taosMkDir().
 *
 * Returns 0 on success. On failure returns -1 with terrno set to
 * TSDB_CODE_OUT_OF_MEMORY (copy failed) or TAOS_SYSTEM_ERROR(errno)
 * (taosMkDir failed). The copied path is left in pMnode->path in the latter
 * case; mndClose() frees that field.
 */
static int32_t mnodeCreateDir(SMnode *pMnode, const char *path) {
  pMnode->path = strdup(path);
  if (pMnode->path == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (taosMkDir(pMnode->path) == 0) {
    return 0;
  }

  terrno = TAOS_SYSTEM_ERROR(errno);
  return -1;
}
S
Shengliang Guan 已提交
111

112 113 114
/*
 * Init step: creates the sdb instance with sdbInit(), giving it the mnode
 * path and a back-pointer to the mnode, and stores it in pMnode->pSdb.
 *
 * Returns 0 on success, -1 when sdbInit() returns NULL.
 */
static int32_t mndInitSdb(SMnode *pMnode) {
  SSdbOpt opt = {.path = pMnode->path, .pMnode = pMnode};

  pMnode->pSdb = sdbInit(&opt);
  return (pMnode->pSdb != NULL) ? 0 : -1;
}

125
/* Init step: runs sdbDeploy() on the mnode's sdb and returns its result. */
static int32_t mndDeploySdb(SMnode *pMnode) {
  return sdbDeploy(pMnode->pSdb);
}
S
Shengliang Guan 已提交
126
/* Init step: runs sdbReadFile() on the mnode's sdb and returns its result. */
static int32_t mndReadSdb(SMnode *pMnode) {
  return sdbReadFile(pMnode->pSdb);
}
127 128 129

/*
 * Cleanup step: releases pMnode->pSdb via sdbCleanup() and resets the field
 * to NULL. Safe to call when no sdb is set.
 */
static void mndCleanupSdb(SMnode *pMnode) {
  if (pMnode->pSdb == NULL) {
    return;
  }

  sdbCleanup(pMnode->pSdb);
  pMnode->pSdb = NULL;
}

135 136 137 138 139
/*
 * Appends one step (name + optional init/cleanup callbacks) to pMnode->pSteps.
 *
 * Returns 0 on success; when taosArrayPush() fails, sets terrno to
 * TSDB_CODE_OUT_OF_MEMORY and returns -1.
 */
static int32_t mndAllocStep(SMnode *pMnode, char *name, MndInitFp initFp, MndCleanupFp cleanupFp) {
  SMnodeStep step = {.name = name, .initFp = initFp, .cleanupFp = cleanupFp};

  if (taosArrayPush(pMnode->pSteps, &step) != NULL) {
    return 0;
  }

  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return -1;
}

148
/*
 * Fills pMnode->pSteps with the ordered list of startup steps.
 *
 * Order: the per-module steps, then either the sdb deploy step (when
 * pMnode->clusterId <= 0) or the sdb read step, then the service steps.
 * The timer is split in two entries: its init runs in sequence, while its
 * cleanup is registered last, so mndCleanupSteps(), which walks the list
 * backwards, reaches it first.
 *
 * Returns 0 on success, -1 as soon as one registration fails (terrno is set
 * by mndAllocStep()).
 */
static int32_t mndInitSteps(SMnode *pMnode) {
  typedef struct {
    char        *name;
    MndInitFp    initFp;
    MndCleanupFp cleanupFp;
  } SStepDef;

  static const SStepDef moduleSteps[] = {
      {"mnode-sdb", mndInitSdb, mndCleanupSdb},
      {"mnode-trans", mndInitTrans, mndCleanupTrans},
      {"mnode-cluster", mndInitCluster, mndCleanupCluster},
      {"mnode-dnode", mndInitDnode, mndCleanupDnode},
      {"mnode-mnode", mndInitMnode, mndCleanupMnode},
      {"mnode-acct", mndInitAcct, mndCleanupAcct},
      {"mnode-auth", mndInitAuth, mndCleanupAuth},
      {"mnode-user", mndInitUser, mndCleanupUser},
      {"mnode-db", mndInitDb, mndCleanupDb},
      {"mnode-vgroup", mndInitVgroup, mndCleanupVgroup},
      {"mnode-stable", mndInitStable, mndCleanupStable},
      {"mnode-func", mndInitFunc, mndCleanupFunc},
  };

  static const SStepDef serviceSteps[] = {
      {"mnode-timer", mndInitTimer, NULL},
      {"mnode-balance", mndInitBalance, mndCleanupBalance},
      {"mnode-profile", mndInitProfile, mndCleanupProfile},
      {"mnode-show", mndInitShow, mndCleanupShow},
      {"mnode-sync", mndInitSync, mndCleanupSync},
      {"mnode-telem", mndInitTelem, mndCleanupTelem},
      {"mnode-timer", NULL, mndCleanupTimer},
  };

  const int32_t numOfModuleSteps = (int32_t)(sizeof(moduleSteps) / sizeof(moduleSteps[0]));
  const int32_t numOfServiceSteps = (int32_t)(sizeof(serviceSteps) / sizeof(serviceSteps[0]));

  for (int32_t i = 0; i < numOfModuleSteps; ++i) {
    const SStepDef *pDef = &moduleSteps[i];
    if (mndAllocStep(pMnode, pDef->name, pDef->initFp, pDef->cleanupFp) != 0) {
      return -1;
    }
  }

  // No cluster id yet: deploy a fresh sdb; otherwise load it from file.
  int32_t sdbCode;
  if (pMnode->clusterId <= 0) {
    sdbCode = mndAllocStep(pMnode, "mnode-sdb-deploy", mndDeploySdb, NULL);
  } else {
    sdbCode = mndAllocStep(pMnode, "mnode-sdb-read", mndReadSdb, NULL);
  }
  if (sdbCode != 0) {
    return -1;
  }

  for (int32_t i = 0; i < numOfServiceSteps; ++i) {
    const SStepDef *pDef = &serviceSteps[i];
    if (mndAllocStep(pMnode, pDef->name, pDef->initFp, pDef->cleanupFp) != 0) {
      return -1;
    }
  }

  return 0;
}

177
/*
 * Runs the cleanup callbacks of the registered steps in reverse order,
 * starting at index `pos` and going down to index 0, then destroys the step
 * array and resets pMnode->pSteps to NULL.
 *
 * pos == -1 means "start from the last registered step".
 * Does nothing when pMnode->pSteps is already NULL.
 */
static void mndCleanupSteps(SMnode *pMnode, int32_t pos) {
  if (pMnode->pSteps == NULL) {
    return;
  }

  int32_t idx = pos;
  if (idx == -1) {
    idx = taosArrayGetSize(pMnode->pSteps) - 1;
  }

  while (idx >= 0) {
    SMnodeStep *pStep = taosArrayGet(pMnode->pSteps, idx);
    mDebug("step:%s will cleanup", pStep->name);
    if (pStep->cleanupFp != NULL) {
      pStep->cleanupFp(pMnode);
    }
    idx--;
  }

  taosArrayClear(pMnode->pSteps);
  taosArrayDestroy(pMnode->pSteps);
  pMnode->pSteps = NULL;
}
S
Shengliang Guan 已提交
196

197
/*
 * Runs the init callback of every registered step in registration order.
 * Steps without an init callback are skipped.
 *
 * On the first failing step, mndCleanupSteps() is invoked from that step's
 * index downwards (which also destroys the step array) and -1 is returned.
 * Returns 0 when every step succeeded.
 */
static int32_t mndExecSteps(SMnode *pMnode) {
  const int32_t numOfSteps = taosArrayGetSize(pMnode->pSteps);

  for (int32_t pos = 0; pos < numOfSteps; ++pos) {
    SMnodeStep *pStep = taosArrayGet(pMnode->pSteps, pos);
    if (pStep->initFp != NULL) {
      // (*pMnode->reportProgress)(pStep->name, "start initialize");

      if (pStep->initFp(pMnode) == 0) {
        mDebug("step:%s is initialized", pStep->name);
      } else {
        mError("step:%s exec failed since %s, start to cleanup", pStep->name, terrstr());
        mndCleanupSteps(pMnode, pos);
        return -1;
      }

      // (*pMnode->reportProgress)(pStep->name, "initialize completed");
    }
  }

  return 0;
}
S
Shengliang Guan 已提交
218

219 220 221 222 223 224 225 226 227 228 229
/*
 * Copies the startup options from pOption into the mnode object and
 * validates them.
 *
 * The timezone/locale/charset strings are duplicated with strdup(); they are
 * stored in pMnode even when validation fails, and mndClose() frees them.
 *
 * Returns 0 on success. Returns -1 with terrno set to
 *   TSDB_CODE_MND_APP_ERROR  - a required callback is NULL or a numeric
 *                              option is out of range;
 *   TSDB_CODE_OUT_OF_MEMORY  - one of the string copies failed.
 */
static int32_t mndSetOptions(SMnode *pMnode, const SMnodeOpt *pOption) {
  // Identity and replica layout.
  pMnode->dnodeId = pOption->dnodeId;
  pMnode->clusterId = pOption->clusterId;
  pMnode->replica = pOption->replica;
  pMnode->selfIndex = pOption->selfIndex;
  memcpy(&pMnode->replicas, pOption->replicas, sizeof(SReplica) * TSDB_MAX_REPLICA);

  // Owner handle and the callbacks used to send messages.
  pMnode->pDnode = pOption->pDnode;
  pMnode->putMsgToApplyMsgFp = pOption->putMsgToApplyMsgFp;
  pMnode->sendMsgToDnodeFp = pOption->sendMsgToDnodeFp;
  pMnode->sendMsgToMnodeFp = pOption->sendMsgToMnodeFp;
  pMnode->sendRedirectMsgFp = pOption->sendRedirectMsgFp;

  // Scalar settings and owned string copies.
  pMnode->sver = pOption->sver;
  pMnode->statusInterval = pOption->statusInterval;
  pMnode->mnodeEqualVnodeNum = pOption->mnodeEqualVnodeNum;
  pMnode->timezone = strdup(pOption->timezone);
  pMnode->locale = strdup(pOption->locale);
  pMnode->charset = strdup(pOption->charset);

  const bool missingCallback = pMnode->sendMsgToDnodeFp == NULL || pMnode->sendMsgToMnodeFp == NULL ||
                               pMnode->sendRedirectMsgFp == NULL || pMnode->putMsgToApplyMsgFp == NULL;
  const bool badNumber = pMnode->dnodeId < 0 || pMnode->clusterId < 0 || pMnode->statusInterval < 1 ||
                         pOption->mnodeEqualVnodeNum < 0;
  if (missingCallback || badNumber) {
    terrno = TSDB_CODE_MND_APP_ERROR;
    return -1;
  }

  const bool missingString = pMnode->timezone == NULL || pMnode->locale == NULL || pMnode->charset == NULL;
  if (missingString) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  return 0;
}

252
SMnode *mndOpen(const char *path, const SMnodeOpt *pOption) {
S
Shengliang Guan 已提交
253 254
  mDebug("start to open mnode in %s", path);

255
  SMnode *pMnode = calloc(1, sizeof(SMnode));
S
Shengliang Guan 已提交
256 257 258 259 260 261 262 263 264 265 266 267 268
  if (pMnode == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to open mnode since %s", terrstr());
    return NULL;
  }

  pMnode->pSteps = taosArrayInit(24, sizeof(SMnodeStep));
  if (pMnode->pSteps == NULL) {
    free(pMnode);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to open mnode since %s", terrstr());
    return NULL;
  }
269

270
  int32_t code = mnodeCreateDir(pMnode, path);
271
  if (code != 0) {
S
Shengliang Guan 已提交
272
    mError("failed to open mnode since %s", tstrerror(code));
273 274 275 276 277 278
    mndClose(pMnode);
    terrno = code;
    return NULL;
  }

  code = mndSetOptions(pMnode, pOption);
279
  if (code != 0) {
S
Shengliang Guan 已提交
280
    mError("failed to open mnode since %s", tstrerror(code));
281 282 283 284 285 286 287
    mndClose(pMnode);
    terrno = code;
    return NULL;
  }

  code = mndInitSteps(pMnode);
  if (code != 0) {
S
Shengliang Guan 已提交
288
    mError("failed to open mnode since %s", tstrerror(code));
289 290 291 292 293 294 295
    mndClose(pMnode);
    terrno = code;
    return NULL;
  }

  code = mndExecSteps(pMnode);
  if (code != 0) {
S
Shengliang Guan 已提交
296
    mError("failed to open mnode since %s", tstrerror(code));
297 298 299 300
    mndClose(pMnode);
    terrno = code;
    return NULL;
  }
S
Shengliang Guan 已提交
301

S
Shengliang Guan 已提交
302
  mDebug("mnode open successfully ");
S
Shengliang Guan 已提交
303 304
  return pMnode;
}
S
Shengliang Guan 已提交
305

306
/*
 * Shuts down an mnode and releases everything it owns: runs the cleanup
 * callbacks of all registered steps, stops the timer, frees the duplicated
 * strings and finally the object itself. A NULL pMnode is ignored.
 */
void mndClose(SMnode *pMnode) {
  if (pMnode != NULL) {
    mDebug("start to close mnode");
    mndCleanupSteps(pMnode, -1);

    // The timer cleanup is registered as the LAST step, so when startup fails
    // at a step after the timer was created, the partial cleanup done by
    // mndExecSteps() never reaches it. Release it here before freeing pMnode;
    // this is a no-op when the timer was already cleaned up.
    mndCleanupTimer(pMnode);

    tfree(pMnode->path);
    tfree(pMnode->charset);
    tfree(pMnode->locale);
    tfree(pMnode->timezone);
    tfree(pMnode);
    mDebug("mnode is closed");
  }
}
S
Shengliang Guan 已提交
318

319
/*
 * Placeholder for altering a running mnode: currently only emits two debug
 * log lines and returns 0. Neither argument is used.
 */
int32_t mndAlter(SMnode *pMnode, const SMnodeOpt *pOption) {
  (void)pMnode;
  (void)pOption;

  mDebug("start to alter mnode");
  mDebug("mnode is altered");

  return 0;
}
S
Shengliang Guan 已提交
324

325
/*
 * Removes the mnode directory at `path` via taosRemoveDir(), logging before
 * and after.
 */
void mndDestroy(const char *path) {
  mDebug("start to destroy mnode at %s", path);

  taosRemoveDir(path);

  mDebug("mnode is destroyed");
}
S
Shengliang Guan 已提交
330

331
/*
 * Fills pLoad with the mnode load statistics. Every counter is currently
 * reported as 0 and pMnode is not consulted. Always returns 0.
 */
int32_t mndGetLoad(SMnode *pMnode, SMnodeLoad *pLoad) {
  (void)pMnode;

  // Object counts.
  pLoad->numOfDnode = 0;
  pLoad->numOfMnode = 0;
  pLoad->numOfVgroup = 0;
  pLoad->numOfDatabase = 0;
  pLoad->numOfSuperTable = 0;
  pLoad->numOfChildTable = 0;
  pLoad->numOfColumn = 0;

  // Data volume.
  pLoad->totalPoints = 0;
  pLoad->totalStorage = 0;
  pLoad->compStorage = 0;

  return 0;
}
S
Shengliang Guan 已提交
345

346
/*
 * Wraps an incoming RPC message in a newly allocated queue item.
 *
 * The user name is taken from the connection info of pRpcMsg->handle; the
 * RPC message is copied by value and the creation time is stamped.
 *
 * Returns the new message, or NULL with terrno set to
 *   TSDB_CODE_OUT_OF_MEMORY          - queue item allocation failed;
 *   TSDB_CODE_MND_NO_USER_FROM_CONN  - rpcGetConnInfo() failed.
 */
SMnodeMsg *mndInitMsg(SMnode *pMnode, SRpcMsg *pRpcMsg) {
  SMnodeMsg *pMsg = taosAllocateQitem(sizeof(SMnodeMsg));
  if (pMsg == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to create msg since %s", terrstr());
    return NULL;
  }

  SRpcConnInfo connInfo = {0};
  const bool   hasConnInfo = (rpcGetConnInfo(pRpcMsg->handle, &connInfo) == 0);
  if (!hasConnInfo) {
    mndCleanupMsg(pMsg);
    terrno = TSDB_CODE_MND_NO_USER_FROM_CONN;
    mError("failed to create msg since %s", terrstr());
    return NULL;
  }

  memcpy(pMsg->user, connInfo.user, TSDB_USER_LEN);
  pMsg->pMnode = pMnode;
  pMsg->rpcMsg = *pRpcMsg;
  pMsg->createdTime = taosGetTimestampSec();

  mTrace("msg:%p, is created", pMsg);
  return pMsg;
}

371
/*
 * Releases a message created by mndInitMsg() by returning it to the queue
 * item allocator.
 */
void mndCleanupMsg(SMnodeMsg *pMsg) {
  // Log first: once the item is freed the pointer value is indeterminate and
  // must not be used, not even to print it.
  mTrace("msg:%p, is destroyed", pMsg);
  taosFreeQitem(pMsg);
}

376 377 378 379
/*
 * Sends an RPC response carrying only `code` on the handle of the request
 * stored in pMsg.
 */
void mndSendRsp(SMnodeMsg *pMsg, int32_t code) {
  SRpcMsg rpcRsp = {0};
  rpcRsp.handle = pMsg->rpcMsg.handle;
  rpcRsp.code = code;

  rpcSendResponse(&rpcRsp);
}
S
Shengliang Guan 已提交
380

381 382
/*
 * Dispatches one message to the handler registered for its message type and,
 * for requests, sends the reply.
 *
 * A message is treated as a request when its type is odd. Requests are
 * rejected when this mnode is not the master (a redirect is sent instead) or
 * when they carry no content. Messages whose type is out of range or has no
 * registered handler are answered with TSDB_CODE_MSG_NOT_PROCESSED.
 *
 * Reply for requests:
 *   - TSDB_CODE_APP_NOT_READY -> redirect message;
 *   - any other non-zero code -> response carrying only the code;
 *   - success                 -> response carrying pMsg->pCont / contLen.
 * Non-request messages never get a reply from here.
 */
static void mndProcessRpcMsg(SMnodeMsg *pMsg) {
  SMnode  *pMnode = pMsg->pMnode;
  int32_t  code = 0;
  int32_t  msgType = pMsg->rpcMsg.msgType;
  void    *ahandle = pMsg->rpcMsg.ahandle;
  bool     isReq = (msgType % 2 == 1);
  MndMsgFp fp = NULL;

  mTrace("msg:%p, app:%p will be processed", pMsg, ahandle);

  if (isReq && !mndIsMaster(pMnode)) {
    code = TSDB_CODE_APP_NOT_READY;
    // terrno is not set on this path, so report the reason from `code`.
    mDebug("msg:%p, app:%p failed to process since %s", pMsg, ahandle, tstrerror(code));
    goto PROCESS_RPC_END;
  }

  if (isReq && pMsg->rpcMsg.pCont == NULL) {
    code = TSDB_CODE_MND_INVALID_MSG_LEN;
    mError("msg:%p, app:%p failed to process since %s", pMsg, ahandle, tstrerror(code));
    goto PROCESS_RPC_END;
  }

  // The type comes from the wire: apply the same range check as
  // mndSetMsgHandle() before indexing the handler table.
  if (msgType >= 0 && msgType < TSDB_MSG_TYPE_MAX) {
    fp = pMnode->msgFp[msgType];
  }
  if (fp == NULL) {
    code = TSDB_CODE_MSG_NOT_PROCESSED;
    mError("msg:%p, app:%p failed to process since not handle", pMsg, ahandle);
    goto PROCESS_RPC_END;
  }

  code = (*fp)(pMnode, pMsg);
  if (code != 0) {
    // Handlers report the actual reason through terrno.
    code = terrno;
    mError("msg:%p, app:%p failed to process since %s", pMsg, ahandle, terrstr());
    goto PROCESS_RPC_END;
  } else {
    mTrace("msg:%p, app:%p is processed", pMsg, ahandle);
  }

PROCESS_RPC_END:
  if (isReq) {
    if (code == TSDB_CODE_APP_NOT_READY) {
      mndSendRedirectMsg(pMnode, &pMsg->rpcMsg);
    } else if (code != 0) {
      mndSendRsp(pMsg, code);
    } else {
      SRpcMsg rpcRsp = {.handle = pMsg->rpcMsg.handle, .contLen = pMsg->contLen, .pCont = pMsg->pCont};
      rpcSendResponse(&rpcRsp);
    }
  }
}

432
/*
 * Registers `fp` as the handler for messages of type `msgType`.
 * Types outside [0, TSDB_MSG_TYPE_MAX) are silently ignored.
 */
void mndSetMsgHandle(SMnode *pMnode, int32_t msgType, MndMsgFp fp) {
  if (msgType < 0 || msgType >= TSDB_MSG_TYPE_MAX) {
    return;
  }

  pMnode->msgFp[msgType] = fp;
}

438
/* Entry point for read messages; delegates to mndProcessRpcMsg(). */
void mndProcessReadMsg(SMnodeMsg *pMsg) {
  mndProcessRpcMsg(pMsg);
}
S
Shengliang Guan 已提交
439

440
/* Entry point for write messages; delegates to mndProcessRpcMsg(). */
void mndProcessWriteMsg(SMnodeMsg *pMsg) {
  mndProcessRpcMsg(pMsg);
}
S
Shengliang Guan 已提交
441

442
/* Entry point for sync messages; delegates to mndProcessRpcMsg(). */
void mndProcessSyncMsg(SMnodeMsg *pMsg) {
  mndProcessRpcMsg(pMsg);
}
S
Shengliang Guan 已提交
443

444
/* Entry point for apply messages; currently an empty stub that ignores pMsg. */
void mndProcessApplyMsg(SMnodeMsg *pMsg) {
  (void)pMsg;
}