dmMgmt.c 9.2 KB
Newer Older
S
shm  
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

S
shm  
Shengliang Guan 已提交
16
#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17
#include "dmMgmt.h"
S
Shengliang Guan 已提交
18
#include "dmNodes.h"
S
Shengliang Guan 已提交
19
#include "qworker.h"
S
Shengliang Guan 已提交
20

21
/*
 * Decide whether the node behind pWrapper has to be started in this process.
 *
 * The node's requiredFp callback supplies the initial answer. That answer is
 * forced to false when the node does not belong to the process identified by
 * pDnode->rtype:
 *   - the DNODE wrapper only starts when rtype is DNODE or NODE_END;
 *   - any other wrapper for which OnlyInChildProc() holds only starts when its
 *     ntype equals rtype.
 *
 * Returns true when the node must be started here, false otherwise.
 */
static bool dmRequireNode(SDnode *pDnode, SMgmtWrapper *pWrapper) {
  SMgmtInputOpt opt = dmBuildMgmtInputOpt(pWrapper);
  bool          needStart = false;

  // Only the `needStart` out-parameter is consumed; the callback's return code is not examined.
  (void)(*pWrapper->func.requiredFp)(&opt, &needStart);
  if (!needStart) {
    dDebug("node:%s, does not require startup", pWrapper->name);
  }

  bool notForThisProc;
  if (pWrapper->ntype == DNODE) {
    notForThisProc = (pDnode->rtype != DNODE) && (pDnode->rtype != NODE_END);
  } else {
    notForThisProc = (OnlyInChildProc(pWrapper)) && (pWrapper->ntype != pDnode->rtype);
  }

  if (notForThisProc) {
    dDebug("node:%s, does not require startup in child process", pWrapper->name);
    needStart = false;
  }

  if (needStart) {
    dDebug("node:%s, required to startup", pWrapper->name);
  }

  return needStart;
}
S
Shengliang Guan 已提交
50

51 52
/*
 * Initialize the process-level state of the dnode.
 *
 * Records the requested node type, derives the process type (single, test,
 * parent or child) from tsMultiProcess and rtype, resets the SDnodeData
 * fields, creates the dnode hash and loads the endpoint data via dmReadEps().
 *
 * Returns 0 on success and -1 on failure. When the hash cannot be created
 * terrno is set to TSDB_CODE_OUT_OF_MEMORY. A dnode already marked as dropped
 * is treated as a failure.
 */
static int32_t dmInitVars(SDnode *pDnode, EDndNodeType rtype) {
  pDnode->rtype = rtype;

  if (tsMultiProcess == 0) {
    pDnode->ptype = DND_PROC_SINGLE;
    dInfo("dnode will run in single-process mode");
  } else if (tsMultiProcess > 1) {
    pDnode->ptype = DND_PROC_TEST;
    dInfo("dnode will run in multi-process test mode");
  } else if (pDnode->rtype == DNODE || pDnode->rtype == NODE_END) {
    pDnode->ptype = DND_PROC_PARENT;
    dInfo("dnode will run in parent-process mode");
  } else {
    pDnode->ptype = DND_PROC_CHILD;
    dInfo("dnode will run in child-process mode, node:%s", dmNodeName(pDnode->rtype));
  }

  SDnodeData *pData = &pDnode->data;

  // Create the locks before any step that can fail: when this function returns
  // -1, dmInitDnode() runs dmClearVars(), which write-locks and destroys
  // pData->lock and destroys pDnode->mutex. They must be valid by then.
  taosThreadRwlockInit(&pData->lock, NULL);
  taosThreadMutexInit(&pDnode->mutex, NULL);

  pData->dnodeId = 0;
  pData->clusterId = 0;
  pData->dnodeVer = 0;
  pData->updateTime = 0;
  pData->rebootTime = taosGetTimestampMs();
  pData->dropped = 0;
  pData->stopped = 0;

  pData->dnodeHash = taosHashInit(4, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), true, HASH_NO_LOCK);
  if (pData->dnodeHash == NULL) {
    dError("failed to init dnode hash");
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (dmReadEps(pData) != 0) {
    dError("failed to read file since %s", terrstr());
    return -1;
  }

  // `dropped` was reset above, so a non-zero value here was set by dmReadEps().
  if (pData->dropped) {
    dError("dnode will not start since its already dropped");
    return -1;
  }

  return 0;
}

S
Shengliang Guan 已提交
100
/*
 * Release everything owned directly by the dnode object:
 *   - the path string and rwlock of every management wrapper,
 *   - the data-directory lock file, if one is held,
 *   - the endpoint array and dnode hash (torn down under the data write lock),
 *   - the data rwlock and the dnode mutex.
 */
static void dmClearVars(SDnode *pDnode) {
  for (int32_t idx = DNODE; idx < NODE_END; ++idx) {
    SMgmtWrapper *pNode = &pDnode->wrappers[idx];
    taosMemoryFreeClear(pNode->path);
    taosThreadRwlockDestroy(&pNode->lock);
  }

  if (pDnode->lockfile != NULL) {
    taosUnLockFile(pDnode->lockfile);
    taosCloseFile(&pDnode->lockfile);
    pDnode->lockfile = NULL;
  }

  SDnodeData *pInfo = &pDnode->data;

  taosThreadRwlockWrlock(&pInfo->lock);
  if (pInfo->dnodeEps != NULL) {
    taosArrayDestroy(pInfo->dnodeEps);
    pInfo->dnodeEps = NULL;
  }
  if (pInfo->dnodeHash != NULL) {
    taosHashCleanup(pInfo->dnodeHash);
    pInfo->dnodeHash = NULL;
  }
  taosThreadRwlockUnlock(&pInfo->lock);

  taosThreadRwlockDestroy(&pInfo->lock);

  // Destroy the mutex, then wipe its storage.
  taosThreadMutexDestroy(&pDnode->mutex);
  memset(&pDnode->mutex, 0, sizeof(pDnode->mutex));
}

129
/*
 * Create and initialize the dnode object for the given run type.
 *
 * Steps: initialize process-level variables, bind the management function
 * table of every node type, fill in each wrapper (name, type, process info,
 * data path, "required" flag, shared-memory descriptor), register message
 * handlers, then bring up the transport. The data-directory lock file and the
 * server side are only set up when ptype is SINGLE_PROC or has PARENT_PROC
 * set; the client side is always initialized.
 *
 * Returns 0 on success. On any failure the partially built state is released
 * through dmClearVars() and -1 is returned.
 */
int32_t dmInitDnode(SDnode *pDnode, EDndNodeType rtype) {
  dInfo("start to create dnode");
  int32_t code = -1;
  char    path[PATH_MAX + 100] = {0};

  // Initialize every wrapper lock before anything can fail. The error path
  // below calls dmClearVars(), which destroys the lock of *all* wrappers no
  // matter how far initialization got; destroying a lock that was never
  // initialized must be avoided.
  for (EDndNodeType ntype = DNODE; ntype < NODE_END; ++ntype) {
    taosThreadRwlockInit(&pDnode->wrappers[ntype].lock, NULL);
  }

  if (dmInitVars(pDnode, rtype) != 0) {
    goto _OVER;
  }

  pDnode->wrappers[DNODE].func = dmGetMgmtFunc();
  pDnode->wrappers[MNODE].func = mmGetMgmtFunc();
  pDnode->wrappers[VNODE].func = vmGetMgmtFunc();
  pDnode->wrappers[QNODE].func = qmGetMgmtFunc();
  pDnode->wrappers[SNODE].func = smGetMgmtFunc();
  pDnode->wrappers[BNODE].func = bmGetMgmtFunc();

  for (EDndNodeType ntype = DNODE; ntype < NODE_END; ++ntype) {
    SMgmtWrapper *pWrapper = &pDnode->wrappers[ntype];
    pWrapper->pDnode = pDnode;
    pWrapper->name = dmNodeName(ntype);
    pWrapper->ntype = ntype;
    pWrapper->proc.wrapper = pWrapper;
    pWrapper->proc.shm.id = -1;
    pWrapper->proc.pid = -1;
    pWrapper->proc.ptype = pDnode->ptype;
    if (ntype == DNODE) {
      // The dnode wrapper itself is always handled as single-process.
      pWrapper->proc.ptype = DND_PROC_SINGLE;
    }

    snprintf(path, sizeof(path), "%s%s%s", tsDataDir, TD_DIRSEP, pWrapper->name);
    pWrapper->path = strdup(path);
    if (pWrapper->path == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _OVER;
    }

    pWrapper->required = dmRequireNode(pDnode, pWrapper);

    if (ntype != DNODE && dmReadShmFile(pWrapper->path, pWrapper->name, pDnode->rtype, &pWrapper->proc.shm) != 0) {
      dError("node:%s, failed to read shm file since %s", pWrapper->name, terrstr());
      goto _OVER;
    }
  }

  if (dmInitMsgHandle(pDnode) != 0) {
    dError("failed to init msg handles since %s", terrstr());
    goto _OVER;
  }

  if (pDnode->ptype == SINGLE_PROC || (pDnode->ptype & PARENT_PROC)) {
    pDnode->lockfile = dmCheckRunning(tsDataDir);
    if (pDnode->lockfile == NULL) {
      goto _OVER;
    }

    if (dmInitServer(pDnode) != 0) {
      dError("failed to init transport since %s", terrstr());
      goto _OVER;
    }
  }

  if (dmInitClient(pDnode) != 0) {
    goto _OVER;
  }

  dmReportStartup("dnode-transport", "initialized");
  dDebug("dnode is created, ptr:%p", pDnode);
  code = 0;

_OVER:
  // pDnode has already been dereferenced above, so no NULL test is needed here.
  if (code != 0) {
    dmClearVars(pDnode);
    dError("failed to create dnode since %s", terrstr());
  }

  return code;
}

209
/*
 * Shut down a dnode object: clean up the client side, then the server side,
 * then release the variables owned by the dnode. A NULL pointer is ignored.
 */
void dmCleanupDnode(SDnode *pDnode) {
  if (pDnode != NULL) {
    dmCleanupClient(pDnode);
    dmCleanupServer(pDnode);
    dmClearVars(pDnode);
    dDebug("dnode is closed, ptr:%p", pDnode);
  }
}
S
Shengliang Guan 已提交
217 218 219 220 221 222 223 224 225 226 227 228

/*
 * Move the dnode to a new run status. Nothing is logged or written when the
 * requested status equals the current one.
 */
void dmSetStatus(SDnode *pDnode, EDndRunStatus status) {
  if (pDnode->status == status) {
    return;
  }

  dDebug("dnode status set from %s to %s", dmStatStr(pDnode->status), dmStatStr(status));
  pDnode->status = status;
}

/*
 * Take a reference on the wrapper of the given node type.
 *
 * Under the wrapper's read lock: when the node is deployed its refCount is
 * incremented and the wrapper is returned; otherwise terrno is set to
 * TSDB_CODE_NODE_NOT_DEPLOYED and NULL is returned.
 */
SMgmtWrapper *dmAcquireWrapper(SDnode *pDnode, EDndNodeType ntype) {
  SMgmtWrapper *pNode = &pDnode->wrappers[ntype];
  SMgmtWrapper *pResult = NULL;

  taosThreadRwlockRdlock(&pNode->lock);
  if (!pNode->deployed) {
    terrno = TSDB_CODE_NODE_NOT_DEPLOYED;
  } else {
    (void)atomic_add_fetch_32(&pNode->refCount, 1);
    pResult = pNode;
  }
  taosThreadRwlockUnlock(&pNode->lock);

  return pResult;
}

/*
 * Take a reference on an already known wrapper.
 *
 * Under the wrapper's read lock the refCount is incremented when the node is
 * deployed, or when InParentProc() holds for the wrapper and the node is
 * marked as required. Returns 0 in that case; otherwise sets terrno to
 * TSDB_CODE_NODE_NOT_DEPLOYED and returns -1.
 */
int32_t dmMarkWrapper(SMgmtWrapper *pWrapper) {
  int32_t ret = -1;

  taosThreadRwlockRdlock(&pWrapper->lock);
  if (pWrapper->deployed || (InParentProc(pWrapper) && pWrapper->required)) {
    (void)atomic_add_fetch_32(&pWrapper->refCount, 1);
    ret = 0;
  } else {
    terrno = TSDB_CODE_NODE_NOT_DEPLOYED;
  }
  taosThreadRwlockUnlock(&pWrapper->lock);

  return ret;
}

/*
 * Drop one reference from the wrapper. The decrement is performed while
 * holding the wrapper's read lock. A NULL wrapper is ignored.
 */
void dmReleaseWrapper(SMgmtWrapper *pWrapper) {
  if (pWrapper != NULL) {
    taosThreadRwlockRdlock(&pWrapper->lock);
    (void)atomic_sub_fetch_32(&pWrapper->refCount, 1);
    taosThreadRwlockUnlock(&pWrapper->lock);
  }
}

267
/*
 * Translate the dnode run status into a server status response.
 *
 *   DND_STAT_INIT    -> TSDB_SRV_STATUS_NETWORK_OK, details "<startup name>: <startup desc>"
 *   DND_STAT_STOPPED -> TSDB_SRV_STATUS_EXTING
 *   anything else    -> TSDB_SRV_STATUS_SERVICE_OK
 *
 * The details string is left empty except in the DND_STAT_INIT case.
 */
static void dmGetServerStartupStatus(SDnode *pDnode, SServerStatusRsp *pStatus) {
  pStatus->details[0] = 0;

  switch (pDnode->status) {
    case DND_STAT_INIT:
      pStatus->statusCode = TSDB_SRV_STATUS_NETWORK_OK;
      snprintf(pStatus->details, sizeof(pStatus->details), "%s: %s", pDnode->startup.name, pDnode->startup.desc);
      break;
    case DND_STAT_STOPPED:
      pStatus->statusCode = TSDB_SRV_STATUS_EXTING;
      break;
    default:
      pStatus->statusCode = TSDB_SRV_STATUS_SERVICE_OK;
      break;
  }
}

S
Shengliang Guan 已提交
281
/*
 * Answer a network test request.
 *
 * The response carries a freshly allocated payload of the same length as the
 * request payload. When that allocation fails the response code is set to
 * TSDB_CODE_OUT_OF_MEMORY instead. The request payload is freed after the
 * response has been sent.
 */
void dmProcessNetTestReq(SDnode *pDnode, SRpcMsg *pMsg) {
  dDebug("msg:%p, net test req will be processed", pMsg);

  SRpcMsg reply = {.info = pMsg->info};

  reply.pCont = rpcMallocCont(pMsg->contLen);
  if (reply.pCont != NULL) {
    reply.contLen = pMsg->contLen;
  } else {
    reply.code = TSDB_CODE_OUT_OF_MEMORY;
  }

  rpcSendResponse(&reply);
  rpcFreeCont(pMsg->pCont);
}

S
Shengliang Guan 已提交
296
/*
 * Answer a server startup status request.
 *
 * The current status is collected with dmGetServerStartupStatus(), serialized
 * into a newly allocated response payload and sent back. When the serialized
 * size cannot be computed, or the payload cannot be allocated, the response
 * carries TSDB_CODE_OUT_OF_MEMORY and no payload. The request payload is freed
 * after the response has been sent.
 */
void dmProcessServerStartupStatus(SDnode *pDnode, SRpcMsg *pMsg) {
  dDebug("msg:%p, server startup status req will be processed", pMsg);

  SServerStatusRsp statusRsp = {0};
  dmGetServerStartupStatus(pDnode, &statusRsp);

  SRpcMsg rsp = {.info = pMsg->info};
  // First pass with a NULL buffer only computes the serialized length.
  int32_t contLen = tSerializeSServerStatusRsp(NULL, 0, &statusRsp);
  if (contLen < 0) {
    rsp.code = TSDB_CODE_OUT_OF_MEMORY;
  } else {
    rsp.pCont = rpcMallocCont(contLen);
    if (rsp.pCont != NULL) {
      tSerializeSServerStatusRsp(rsp.pCont, contLen, &statusRsp);
      rsp.contLen = contLen;
    } else {
      // Report the allocation failure instead of sending an empty "success"
      // reply; this matches what dmProcessNetTestReq() does.
      rsp.code = TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  rpcSendResponse(&rsp);
  rpcFreeCont(pMsg->pCont);
}