dndMgmt.c 20.7 KB
Newer Older
S
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17
#include "dndMgmt.h"
S
Shengliang Guan 已提交
18 19 20 21
#include "dndBnode.h"
#include "dndMnode.h"
#include "dndQnode.h"
#include "dndSnode.h"
S
Shengliang Guan 已提交
22 23
#include "dndTransport.h"
#include "dndVnodes.h"
S
Shengliang Guan 已提交
24
#include "dndWorker.h"
S
Shengliang Guan 已提交
25

S
Shengliang Guan 已提交
26
static void dndProcessMgmtQueue(SDnode *pDnode, SRpcMsg *pMsg);
S
Shengliang Guan 已提交
27 28 29 30 31

static int32_t dndReadDnodes(SDnode *pDnode);
static int32_t dndWriteDnodes(SDnode *pDnode);
static void   *dnodeThreadRoutine(void *param);

S
Shengliang Guan 已提交
32 33 34 35
static int32_t dndProcessConfigDnodeReq(SDnode *pDnode, SRpcMsg *pReq);
static void    dndProcessStatusRsp(SDnode *pDnode, SRpcMsg *pRsp);
static void    dndProcessAuthRsp(SDnode *pDnode, SRpcMsg *pRsp);
static void    dndProcessGrantRsp(SDnode *pDnode, SRpcMsg *pRsp);
S
Shengliang Guan 已提交
36

S
Shengliang Guan 已提交
37
// Return this dnode's id. The field is sampled while the management
// read latch is held.
int32_t dndGetDnodeId(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  int32_t     id;

  taosRLockLatch(&pMgmt->latch);
  id = pMgmt->dnodeId;
  taosRUnLockLatch(&pMgmt->latch);

  return id;
}

S
Shengliang Guan 已提交
45
// Return the cluster id stored in the dnode management state. The field
// is sampled while the management read latch is held.
int64_t dndGetClusterId(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  int64_t     id;

  taosRLockLatch(&pMgmt->latch);
  id = pMgmt->clusterId;
  taosRUnLockLatch(&pMgmt->latch);

  return id;
}

S
Shengliang Guan 已提交
53
// Look up dnodeId in the dnode hash and copy its endpoint into whichever
// output pointers are non-NULL:
//   pEp   - "fqdn:port", formatted with a TSDB_EP_LEN bound
//   pFqdn - fqdn only, copied with a TSDB_FQDN_LEN bound
//   pPort - port number
// When the id is not in the hash, none of the outputs are written.
void dndGetDnodeEp(SDnode *pDnode, int32_t dnodeId, char *pEp, char *pFqdn, uint16_t *pPort) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  taosRLockLatch(&pMgmt->latch);

  SDnodeEp *pFound = taosHashGet(pMgmt->dnodeHash, &dnodeId, sizeof(int32_t));
  if (pFound == NULL) {
    taosRUnLockLatch(&pMgmt->latch);
    return;
  }

  if (pPort != NULL) *pPort = pFound->ep.port;
  if (pFqdn != NULL) tstrncpy(pFqdn, pFound->ep.fqdn, TSDB_FQDN_LEN);
  if (pEp != NULL) snprintf(pEp, TSDB_EP_LEN, "%s:%u", pFound->ep.fqdn, pFound->ep.port);

  taosRUnLockLatch(&pMgmt->latch);
}
S
Shengliang Guan 已提交
72

S
Shengliang Guan 已提交
73
// Copy the current mnode endpoint set into *pEpSet. The struct copy is
// made while the management read latch is held.
void dndGetMnodeEpSet(SDnode *pDnode, SEpSet *pEpSet) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  taosRLockLatch(&pMgmt->latch);
  *pEpSet = pMgmt->mnodeEpSet;
  taosRUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
80 81
// Reply to pReq with a redirect carrying a snapshot of the mnode endpoint
// set. If an entry matches this dnode's own fqdn and server port, inUse is
// moved to the entry after it (wrapping around). Every port is passed
// through htons() before the set is handed to rpcSendRedirectRsp().
void dndSendRedirectRsp(SDnode *pDnode, SRpcMsg *pReq) {
  tmsg_t reqType = pReq->msgType;
  SEpSet epSet = {0};

  dndGetMnodeEpSet(pDnode, &epSet);
  dDebug("RPC %p, req:%s is redirected, num:%d use:%d", pReq->handle, TMSG_INFO(reqType), epSet.numOfEps, epSet.inUse);

  int32_t idx = 0;
  while (idx < epSet.numOfEps) {
    dDebug("mnode index:%d %s:%u", idx, epSet.eps[idx].fqdn, epSet.eps[idx].port);

    bool isLocal =
        strcmp(epSet.eps[idx].fqdn, pDnode->cfg.localFqdn) == 0 && epSet.eps[idx].port == pDnode->cfg.serverPort;
    if (isLocal) {
      epSet.inUse = (idx + 1) % epSet.numOfEps;
    }

    epSet.eps[idx].port = htons(epSet.eps[idx].port);
    ++idx;
  }

  rpcSendRedirectRsp(pReq->handle, &epSet);
}

S
Shengliang Guan 已提交
99
// Replace the stored mnode endpoint set with *pEpSet and log every entry.
// The assignment and the per-entry logging happen under the management
// write latch.
static void dndUpdateMnodeEpSet(SDnode *pDnode, SEpSet *pEpSet) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  dInfo("mnode is changed, num:%d use:%d", pEpSet->numOfEps, pEpSet->inUse);

  taosWLockLatch(&pMgmt->latch);

  pMgmt->mnodeEpSet = *pEpSet;

  int32_t idx = 0;
  while (idx < pEpSet->numOfEps) {
    dInfo("mnode index:%d %s:%u", idx, pEpSet->eps[idx].fqdn, pEpSet->eps[idx].port);
    ++idx;
  }

  taosWUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
113 114
// Emit one debug line per entry of pMgmt->pDnodeEps, preceded by a header
// line with the entry count. No latch is taken here.
static void dndPrintDnodes(SDnode *pDnode) {
  SArray *pEps = pDnode->dmgmt.pDnodeEps;
  int32_t total = (int32_t)taosArrayGetSize(pEps);

  dDebug("print dnode ep list, num:%d", total);

  int32_t idx = 0;
  while (idx < total) {
    SDnodeEp *pEp = taosArrayGet(pEps, idx);
    dDebug("dnode:%d, fqdn:%s port:%u isMnode:%d", pEp->id, pEp->ep.fqdn, pEp->ep.port, pEp->isMnode);
    ++idx;
  }
}

S
Shengliang Guan 已提交
124
// Rebuild the derived dnode state from pDnodeEps:
//   1. unless pDnodeEps already is pMgmt->pDnodeEps, replace the stored
//      array with a duplicate of it and destroy the previous one;
//   2. rebuild mnodeEpSet from the entries flagged isMnode, keeping at most
//      TSDB_MAX_REPLICA of them and resetting inUse to 0;
//   3. put every entry into dnodeHash keyed by its id;
//   4. print the resulting list.
// No latch is taken in this function.
static void dndResetDnodes(SDnode *pDnode, SArray *pDnodeEps) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  if (pDnodeEps != pMgmt->pDnodeEps) {
    SArray *pOld = pMgmt->pDnodeEps;
    pMgmt->pDnodeEps = taosArrayDup(pDnodeEps);
    taosArrayDestroy(pOld);
  }

  SEpSet *pMnodeSet = &pMgmt->mnodeEpSet;
  pMnodeSet->inUse = 0;
  pMnodeSet->numOfEps = 0;

  int32_t total = (int32_t)taosArrayGetSize(pDnodeEps);
  int32_t mnodeCnt = 0;

  for (int32_t idx = 0; idx < total; idx++) {
    SDnodeEp *pEntry = taosArrayGet(pDnodeEps, idx);
    if (pEntry->isMnode && mnodeCnt < TSDB_MAX_REPLICA) {
      pMnodeSet->numOfEps++;
      pMnodeSet->eps[mnodeCnt] = pEntry->ep;
      mnodeCnt++;
    }
  }

  for (int32_t idx = 0; idx < total; idx++) {
    SDnodeEp *pEntry = taosArrayGet(pDnodeEps, idx);
    taosHashPut(pMgmt->dnodeHash, &pEntry->id, sizeof(int32_t), pEntry, sizeof(SDnodeEp));
  }

  dndPrintDnodes(pDnode);
}

S
Shengliang Guan 已提交
157
// Return true when dnodeId is present in dnodeHash and its "fqdn:port"
// string differs from pEp. An id that is not in the hash yields false.
static bool dndIsEpChanged(SDnode *pDnode, int32_t dnodeId, char *pEp) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  bool        differs = false;

  taosRLockLatch(&pMgmt->latch);

  SDnodeEp *pKnown = taosHashGet(pMgmt->dnodeHash, &dnodeId, sizeof(int32_t));
  if (pKnown != NULL) {
    char current[TSDB_EP_LEN + 1];
    snprintf(current, TSDB_EP_LEN, "%s:%u", pKnown->ep.fqdn, pKnown->ep.port);
    if (strcmp(pEp, current) != 0) {
      differs = true;
    }
  }

  taosRUnLockLatch(&pMgmt->latch);
  return differs;
}

S
Shengliang Guan 已提交
174 175
static int32_t dndReadDnodes(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
S
Shengliang Guan 已提交
176

S
Shengliang Guan 已提交
177 178 179 180 181 182
  pMgmt->pDnodeEps = taosArrayInit(1, sizeof(SDnodeEp));
  if (pMgmt->pDnodeEps == NULL) {
    dError("failed to calloc dnodeEp array since %s", strerror(errno));
    goto PRASE_DNODE_OVER;
  }

S
Shengliang Guan 已提交
183
  int32_t code = TSDB_CODE_DND_DNODE_READ_FILE_ERROR;
S
Shengliang Guan 已提交
184
  int32_t len = 0;
S
Shengliang Guan 已提交
185
  int32_t maxLen = 256 * 1024;
S
Shengliang Guan 已提交
186 187 188
  char   *content = calloc(1, maxLen + 1);
  cJSON  *root = NULL;

189 190 191
  // fp = fopen(pMgmt->file, "r");
  TdFilePtr pFile = taosOpenFile(pMgmt->file, TD_FILE_READ);
  if (pFile == NULL) {
S
Shengliang Guan 已提交
192 193
    dDebug("file %s not exist", pMgmt->file);
    code = 0;
S
Shengliang Guan 已提交
194
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
195 196
  }

197
  len = (int32_t)taosReadFile(pFile, content, maxLen);
S
Shengliang Guan 已提交
198
  if (len <= 0) {
S
Shengliang Guan 已提交
199
    dError("failed to read %s since content is null", pMgmt->file);
S
Shengliang Guan 已提交
200
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
201 202 203 204 205
  }

  content[len] = 0;
  root = cJSON_Parse(content);
  if (root == NULL) {
S
Shengliang Guan 已提交
206
    dError("failed to read %s since invalid json format", pMgmt->file);
S
Shengliang Guan 已提交
207
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
208 209 210
  }

  cJSON *dnodeId = cJSON_GetObjectItem(root, "dnodeId");
S
Shengliang Guan 已提交
211
  if (!dnodeId || dnodeId->type != cJSON_Number) {
S
Shengliang Guan 已提交
212
    dError("failed to read %s since dnodeId not found", pMgmt->file);
S
Shengliang Guan 已提交
213
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
214
  }
S
Shengliang Guan 已提交
215
  pMgmt->dnodeId = dnodeId->valueint;
S
Shengliang Guan 已提交
216

S
Shengliang Guan 已提交
217
  cJSON *clusterId = cJSON_GetObjectItem(root, "clusterId");
S
Shengliang Guan 已提交
218
  if (!clusterId || clusterId->type != cJSON_String) {
S
Shengliang Guan 已提交
219
    dError("failed to read %s since clusterId not found", pMgmt->file);
S
Shengliang Guan 已提交
220
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
221
  }
S
Shengliang Guan 已提交
222
  pMgmt->clusterId = atoll(clusterId->valuestring);
S
Shengliang Guan 已提交
223

S
Shengliang Guan 已提交
224
  cJSON *dropped = cJSON_GetObjectItem(root, "dropped");
S
Shengliang Guan 已提交
225
  if (!dropped || dropped->type != cJSON_Number) {
S
Shengliang Guan 已提交
226
    dError("failed to read %s since dropped not found", pMgmt->file);
S
Shengliang Guan 已提交
227
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
228
  }
S
Shengliang Guan 已提交
229
  pMgmt->dropped = dropped->valueint;
S
Shengliang Guan 已提交
230

S
Shengliang Guan 已提交
231 232 233
  cJSON *dnodes = cJSON_GetObjectItem(root, "dnodes");
  if (!dnodes || dnodes->type != cJSON_Array) {
    dError("failed to read %s since dnodes not found", pMgmt->file);
S
Shengliang Guan 已提交
234
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
235 236
  }

S
Shengliang Guan 已提交
237 238 239
  int32_t numOfDnodes = cJSON_GetArraySize(dnodes);
  if (numOfDnodes <= 0) {
    dError("failed to read %s since numOfDnodes:%d invalid", pMgmt->file, numOfDnodes);
S
Shengliang Guan 已提交
240
    goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
241 242
  }

S
Shengliang Guan 已提交
243
  for (int32_t i = 0; i < numOfDnodes; ++i) {
S
Shengliang Guan 已提交
244 245
    cJSON *node = cJSON_GetArrayItem(dnodes, i);
    if (node == NULL) break;
S
Shengliang Guan 已提交
246

S
Shengliang Guan 已提交
247
    SDnodeEp dnodeEp = {0};
S
Shengliang Guan 已提交
248

H
Haojun Liao 已提交
249 250
    cJSON *did = cJSON_GetObjectItem(node, "id");
    if (!did || did->type != cJSON_Number) {
S
Shengliang Guan 已提交
251
      dError("failed to read %s since dnodeId not found", pMgmt->file);
S
Shengliang Guan 已提交
252
      goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
253
    }
H
Haojun Liao 已提交
254

S
Shengliang Guan 已提交
255
    dnodeEp.id = dnodeId->valueint;
S
Shengliang Guan 已提交
256

S
Shengliang Guan 已提交
257
    cJSON *dnodeFqdn = cJSON_GetObjectItem(node, "fqdn");
S
Shengliang Guan 已提交
258
    if (!dnodeFqdn || dnodeFqdn->type != cJSON_String || dnodeFqdn->valuestring == NULL) {
S
Shengliang Guan 已提交
259
      dError("failed to read %s since dnodeFqdn not found", pMgmt->file);
S
Shengliang Guan 已提交
260
      goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
261
    }
S
Shengliang Guan 已提交
262
    tstrncpy(dnodeEp.ep.fqdn, dnodeFqdn->valuestring, TSDB_FQDN_LEN);
S
Shengliang Guan 已提交
263

S
Shengliang Guan 已提交
264 265
    cJSON *dnodePort = cJSON_GetObjectItem(node, "port");
    if (!dnodePort || dnodePort->type != cJSON_Number) {
S
Shengliang Guan 已提交
266
      dError("failed to read %s since dnodePort not found", pMgmt->file);
S
Shengliang Guan 已提交
267
      goto PRASE_DNODE_OVER;
S
Shengliang Guan 已提交
268
    }
H
Haojun Liao 已提交
269

S
Shengliang Guan 已提交
270
    dnodeEp.ep.port = dnodePort->valueint;
S
Shengliang Guan 已提交
271 272 273

    cJSON *isMnode = cJSON_GetObjectItem(node, "isMnode");
    if (!isMnode || isMnode->type != cJSON_Number) {
S
Shengliang Guan 已提交
274
      dError("failed to read %s since isMnode not found", pMgmt->file);
S
Shengliang Guan 已提交
275 276
      goto PRASE_DNODE_OVER;
    }
S
Shengliang Guan 已提交
277 278 279
    dnodeEp.isMnode = isMnode->valueint;

    taosArrayPush(pMgmt->pDnodeEps, &dnodeEp);
S
Shengliang Guan 已提交
280 281
  }

S
Shengliang Guan 已提交
282 283 284
  code = 0;
  dInfo("succcessed to read file %s", pMgmt->file);
  dndPrintDnodes(pDnode);
S
Shengliang Guan 已提交
285

S
Shengliang Guan 已提交
286
PRASE_DNODE_OVER:
S
Shengliang Guan 已提交
287 288
  if (content != NULL) free(content);
  if (root != NULL) cJSON_Delete(root);
289
  if (pFile != NULL) taosCloseFile(&pFile);
S
Shengliang Guan 已提交
290

S
Shengliang Guan 已提交
291 292
  if (dndIsEpChanged(pDnode, pMgmt->dnodeId, pDnode->cfg.localEp)) {
    dError("localEp %s different with %s and need reconfigured", pDnode->cfg.localEp, pMgmt->file);
S
Shengliang Guan 已提交
293 294 295
    return -1;
  }

S
Shengliang Guan 已提交
296 297 298
  if (taosArrayGetSize(pMgmt->pDnodeEps) == 0) {
    SDnodeEp dnodeEp = {0};
    dnodeEp.isMnode = 1;
S
Shengliang Guan 已提交
299
    taosGetFqdnPortFromEp(pDnode->cfg.firstEp, &dnodeEp.ep);
S
Shengliang Guan 已提交
300
    taosArrayPush(pMgmt->pDnodeEps, &dnodeEp);
S
Shengliang Guan 已提交
301 302
  }

S
Shengliang Guan 已提交
303
  dndResetDnodes(pDnode, pMgmt->pDnodeEps);
S
Shengliang Guan 已提交
304 305 306 307 308

  terrno = 0;
  return 0;
}

S
Shengliang Guan 已提交
309 310
// Serialise dnodeId, clusterId, dropped and the dnode endpoint list as JSON
// and write it to pMgmt->file, replacing the previous contents.
//
// Returns 0 on success and refreshes pMgmt->updateTime. Returns -1 with
// terrno set when the buffer cannot be allocated, the file cannot be
// opened, or the write comes up short.
//
// No latch is taken here; the callers in this file differ in whether they
// hold the write latch around the call.
static int32_t dndWriteDnodes(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  int32_t len = 0;
  int32_t maxLen = 256 * 1024;

  // Allocate before opening: the open truncates the file, so failing first
  // on memory leaves the existing file untouched.
  char *content = calloc(1, maxLen + 1);
  if (content == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    dError("failed to write %s since out of memory", pMgmt->file);
    return -1;
  }

  TdFilePtr pFile = taosOpenFile(pMgmt->file, TD_FILE_CTEATE | TD_FILE_WRITE | TD_FILE_TRUNC);
  if (pFile == NULL) {
    // Capture errno into terrno before logging can overwrite it.
    terrno = TAOS_SYSTEM_ERROR(errno);
    dError("failed to write %s since %s", pMgmt->file, strerror(errno));
    free(content);
    return -1;
  }

  len += snprintf(content + len, maxLen - len, "{\n");
  len += snprintf(content + len, maxLen - len, "  \"dnodeId\": %d,\n", pMgmt->dnodeId);
  len += snprintf(content + len, maxLen - len, "  \"clusterId\": \"%" PRId64 "\",\n", pMgmt->clusterId);
  len += snprintf(content + len, maxLen - len, "  \"dropped\": %d,\n", pMgmt->dropped);
  len += snprintf(content + len, maxLen - len, "  \"dnodes\": [{\n");

  int32_t numOfEps = (int32_t)taosArrayGetSize(pMgmt->pDnodeEps);
  for (int32_t i = 0; i < numOfEps; ++i) {
    SDnodeEp *pDnodeEp = taosArrayGet(pMgmt->pDnodeEps, i);
    len += snprintf(content + len, maxLen - len, "    \"id\": %d,\n", pDnodeEp->id);
    len += snprintf(content + len, maxLen - len, "    \"fqdn\": \"%s\",\n", pDnodeEp->ep.fqdn);
    len += snprintf(content + len, maxLen - len, "    \"port\": %u,\n", pDnodeEp->ep.port);
    len += snprintf(content + len, maxLen - len, "    \"isMnode\": %d\n", pDnodeEp->isMnode);
    // Close this object; the last one also closes the array.
    if (i < numOfEps - 1) {
      len += snprintf(content + len, maxLen - len, "  },{\n");
    } else {
      len += snprintf(content + len, maxLen - len, "  }]\n");
    }
  }
  len += snprintf(content + len, maxLen - len, "}\n");

  int32_t code = 0;
  if (taosWriteFile(pFile, content, len) != len) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    dError("failed to write %s since %s", pMgmt->file, strerror(errno));
    code = -1;
  } else {
    taosFsyncFile(pFile);
  }

  taosCloseFile(&pFile);
  free(content);
  if (code != 0) return code;

  terrno = 0;
  pMgmt->updateTime = taosGetTimestampMs();
  dDebug("successed to write %s", pMgmt->file);
  return 0;
}

S
Shengliang Guan 已提交
356
// Build a status request from the management state, the local
// configuration and the vnode loads, serialise it, and send it to the
// mnode as TDMT_MND_STATUS.
//
// pMgmt->statusSent is set to 1 just before the request is sent. When the
// request cannot be built (allocation or serialisation failure) nothing is
// sent and statusSent is left unchanged.
void dndSendStatusReq(SDnode *pDnode) {
  SStatusReq  req = {0};
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  // Snapshot the fields under the read latch.
  taosRLockLatch(&pMgmt->latch);
  req.sver = tsVersion;
  req.dver = pMgmt->dver;
  req.dnodeId = pMgmt->dnodeId;
  req.clusterId = pMgmt->clusterId;
  req.rebootTime = pMgmt->rebootTime;
  req.updateTime = pMgmt->updateTime;
  req.numOfCores = tsNumOfCores;
  req.numOfSupportVnodes = pDnode->cfg.numOfSupportVnodes;
  memcpy(req.dnodeEp, pDnode->cfg.localEp, TSDB_EP_LEN);

  req.clusterCfg.statusInterval = tsStatusInterval;
  req.clusterCfg.checkTime = 0;
  // checkTime is whatever taosParseTime() yields for this fixed timestamp string.
  char timestr[32] = "1970-01-01 00:00:00.00";
  (void)taosParseTime(timestr, &req.clusterCfg.checkTime, (int32_t)strlen(timestr), TSDB_TIME_PRECISION_MILLI, 0);
  memcpy(req.clusterCfg.timezone, tsTimezone, TD_TIMEZONE_LEN);
  memcpy(req.clusterCfg.locale, tsLocale, TD_LOCALE_LEN);
  memcpy(req.clusterCfg.charset, tsCharset, TD_LOCALE_LEN);
  taosRUnLockLatch(&pMgmt->latch);

  req.pVloads = taosArrayInit(TSDB_MAX_VNODES, sizeof(SVnodeLoad));
  if (req.pVloads == NULL) {
    dError("failed to send status req since out of memory");
    return;
  }
  dndGetVnodeLoads(pDnode, req.pVloads);

  // First call with a NULL buffer only computes the encoded length.
  int32_t contLen = tSerializeSStatusReq(NULL, 0, &req);
  void   *pHead = (contLen > 0) ? rpcMallocCont(contLen) : NULL;
  if (pHead == NULL) {
    dError("failed to send status req since serialize failed, contLen:%d", contLen);
    taosArrayDestroy(req.pVloads);
    return;
  }

  tSerializeSStatusReq(pHead, contLen, &req);
  taosArrayDestroy(req.pVloads);

  SRpcMsg rpcMsg = {.pCont = pHead, .contLen = contLen, .msgType = TDMT_MND_STATUS, .ahandle = (void *)9527};
  pMgmt->statusSent = 1;

  dTrace("pDnode:%p, send status req to mnode", pDnode);
  dndSendReqToMnode(pDnode, &rpcMsg);
}

S
Shengliang Guan 已提交
395 396
// Adopt the dnodeId and clusterId from pCfg, but only while the local
// dnodeId is still 0. The new values are stored and written to disk under
// the management write latch; the initial dnodeId check is done without it.
static void dndUpdateDnodeCfg(SDnode *pDnode, SDnodeCfg *pCfg) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  if (pMgmt->dnodeId != 0) {
    return;
  }

  dInfo("set dnodeId:%d clusterId:%" PRId64, pCfg->dnodeId, pCfg->clusterId);

  taosWLockLatch(&pMgmt->latch);
  pMgmt->dnodeId = pCfg->dnodeId;
  pMgmt->clusterId = pCfg->clusterId;
  dndWriteDnodes(pDnode);
  taosWUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
407 408 409
// Compare pDnodeEps with the stored endpoint list and, when they differ,
// reset the derived state and rewrite the dnode file. An empty pDnodeEps
// is ignored. "Differ" means a different entry count or, for equal counts,
// a byte-wise difference between the two arrays' data.
static void dndUpdateDnodeEps(SDnode *pDnode, SArray *pDnodeEps) {
  int32_t incoming = taosArrayGetSize(pDnodeEps);
  if (incoming <= 0) return;

  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  taosWLockLatch(&pMgmt->latch);

  int32_t stored = (int32_t)taosArrayGetSize(pMgmt->pDnodeEps);

  // The byte comparison is only reached when the counts match.
  bool changed = (incoming != stored) ||
                 (memcmp(pMgmt->pDnodeEps->pData, pDnodeEps->pData, (int32_t)(incoming * sizeof(SDnodeEp))) != 0);
  if (changed) {
    dndResetDnodes(pDnode, pDnodeEps);
    dndWriteDnodes(pDnode);
  }

  taosWUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
429
// Handle the mnode's reply to a status request.
//   - success: if the body deserialises, take over dver and pass the dnode
//     config and endpoint list on to their update routines;
//   - TSDB_CODE_MND_DNODE_NOT_EXIST while this dnode has an id and is not
//     yet marked dropped: mark it dropped and write the dnode file;
//   - any other error code: nothing is updated.
// In every case statusSent is cleared at the end.
static void dndProcessStatusRsp(SDnode *pDnode, SRpcMsg *pRsp) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  if (pRsp->code == TSDB_CODE_SUCCESS) {
    SStatusRsp statusRsp = {0};
    bool       hasBody = (pRsp->pCont != NULL) && (pRsp->contLen != 0);

    if (hasBody && tDeserializeSStatusRsp(pRsp->pCont, pRsp->contLen, &statusRsp) == 0) {
      pMgmt->dver = statusRsp.dver;
      dndUpdateDnodeCfg(pDnode, &statusRsp.dnodeCfg);
      dndUpdateDnodeEps(pDnode, statusRsp.pDnodeEps);
    }
    taosArrayDestroy(statusRsp.pDnodeEps);
  } else if (pRsp->code == TSDB_CODE_MND_DNODE_NOT_EXIST && !pMgmt->dropped && pMgmt->dnodeId > 0) {
    dInfo("dnode:%d, set to dropped since not exist in mnode", pMgmt->dnodeId);
    pMgmt->dropped = 1;
    dndWriteDnodes(pDnode);
  }

  pMgmt->statusSent = 0;
}
S
Shengliang Guan 已提交
451

S
Shengliang Guan 已提交
452
// Auth responses are not handled: the message is only logged as an error.
static void dndProcessAuthRsp(SDnode *pDnode, SRpcMsg *pReq) {
  (void)pDnode;
  (void)pReq;
  dError("auth rsp is received, but not supported yet");
}
S
Shengliang Guan 已提交
453

S
Shengliang Guan 已提交
454 455 456
// Grant responses are not handled: the message is only logged as an error.
static void dndProcessGrantRsp(SDnode *pDnode, SRpcMsg *pReq) {
  (void)pDnode;
  (void)pReq;
  dError("grant rsp is received, but not supported yet");
}
S
Shengliang Guan 已提交
457

S
Shengliang Guan 已提交
458 459 460
// Config-dnode requests are not implemented: log and report
// TSDB_CODE_OPS_NOT_SUPPORT.
//
// terrno is set as well as returned because dndProcessMgmtQueue() replaces
// any non-zero handler result with terrno when it builds the response.
static int32_t dndProcessConfigDnodeReq(SDnode *pDnode, SRpcMsg *pReq) {
  (void)pDnode;
  (void)pReq;

  dError("config req is received, but not supported yet");
  terrno = TSDB_CODE_OPS_NOT_SUPPORT;
  return TSDB_CODE_OPS_NOT_SUPPORT;
}

S
Shengliang Guan 已提交
464 465
// Answer a startup request with the current startup step obtained from
// dndGetStartup(). If the response buffer cannot be allocated, an
// out-of-memory response is sent instead.
void dndProcessStartupReq(SDnode *pDnode, SRpcMsg *pReq) {
  dDebug("startup req is received");

  SStartupReq *pStartup = rpcMallocCont(sizeof(SStartupReq));
  if (pStartup == NULL) {
    dError("failed to process startup req since out of memory");
    SRpcMsg rsp = {.handle = pReq->handle, .code = TSDB_CODE_OUT_OF_MEMORY};
    rpcSendResponse(&rsp);
    return;
  }

  dndGetStartup(pDnode, pStartup);

  dDebug("startup req is sent, step:%s desc:%s finished:%d", pStartup->name, pStartup->desc, pStartup->finished);

  SRpcMsg rpcRsp = {.handle = pReq->handle, .pCont = pStartup, .contLen = sizeof(SStartupReq)};
  rpcSendResponse(&rpcRsp);
}

static void *dnodeThreadRoutine(void *param) {
477 478
  SDnode     *pDnode = param;
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
S
Shengliang Guan 已提交
479
  int32_t     ms = tsStatusInterval * 1000;
S
Shengliang Guan 已提交
480

H
Haojun Liao 已提交
481 482
  setThreadName("dnode-hb");

S
Shengliang Guan 已提交
483 484
  while (true) {
    pthread_testcancel();
S
Shengliang Guan 已提交
485
    taosMsleep(ms);
S
Shengliang Guan 已提交
486

S
Shengliang Guan 已提交
487
    if (dndGetStat(pDnode) == DND_STAT_RUNNING && !pMgmt->statusSent && !pMgmt->dropped) {
S
Shengliang Guan 已提交
488
      dndSendStatusReq(pDnode);
S
Shengliang Guan 已提交
489
    }
S
Shengliang Guan 已提交
490 491 492
  }
}

S
Shengliang Guan 已提交
493
// Initialise the dnode management state:
//   - reset ids/flags and record the reboot time,
//   - build the dnode.json path and create the dnode hash,
//   - load the persisted state via dndReadDnodes(),
//   - refuse to start when the dnode is marked dropped,
//   - start the "dnode-mgmt" and "dnode-status" workers and the status thread.
// Returns 0 on success and -1 on the first failure. Resources acquired
// before a failure are not released in this function.
int32_t dndInitMgmt(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  pMgmt->dnodeId = 0;
  pMgmt->rebootTime = taosGetTimestampMs();
  pMgmt->dropped = 0;
  pMgmt->clusterId = 0;
  taosInitRWLatch(&pMgmt->latch);

  char path[PATH_MAX];
  snprintf(path, PATH_MAX, "%s/dnode.json", pDnode->dir.dnode);
  pMgmt->file = strdup(path);
  if (pMgmt->file == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  pMgmt->dnodeHash = taosHashInit(4, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), true, HASH_NO_LOCK);
  if (pMgmt->dnodeHash == NULL) {
    dError("failed to init dnode hash");
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (dndReadDnodes(pDnode) != 0) {
    dError("failed to read file:%s since %s", pMgmt->file, terrstr());
    return -1;
  }

  if (pMgmt->dropped) {
    dError("dnode not start since its already dropped");
    return -1;
  }

  // Both workers run the same handler; dndProcessMgmtMsg() picks the
  // worker per message type.
  if (dndInitWorker(pDnode, &pMgmt->mgmtWorker, DND_WORKER_SINGLE, "dnode-mgmt", 1, 1, dndProcessMgmtQueue) != 0) {
    dError("failed to start dnode mgmt worker since %s", terrstr());
    return -1;
  }

  if (dndInitWorker(pDnode, &pMgmt->statusWorker, DND_WORKER_SINGLE, "dnode-status", 1, 1, dndProcessMgmtQueue) != 0) {
    dError("failed to start dnode status worker since %s", terrstr());
    return -1;
  }

  pMgmt->threadId = taosCreateThread(dnodeThreadRoutine, pDnode);
  if (pMgmt->threadId == NULL) {
    dError("failed to init dnode thread");
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  dInfo("dnode-mgmt is initialized");
  return 0;
}

S
Shengliang Guan 已提交
548
// Stop dnode management: clean up the mgmt and status workers, then
// destroy the status thread if one was created.
void dndStopMgmt(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  dndCleanupWorker(&pMgmt->mgmtWorker);
  dndCleanupWorker(&pMgmt->statusWorker);

  if (pMgmt->threadId == NULL) {
    return;
  }

  taosDestoryThread(pMgmt->threadId);
  pMgmt->threadId = NULL;
}
S
Shengliang Guan 已提交
558

S
Shengliang Guan 已提交
559 560
// Release the endpoint array, the dnode hash and the file path string,
// resetting each pointer to NULL. Everything happens under the management
// write latch.
void dndCleanupMgmt(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  taosWLockLatch(&pMgmt->latch);

  if (pMgmt->pDnodeEps != NULL) {
    taosArrayDestroy(pMgmt->pDnodeEps);
    pMgmt->pDnodeEps = NULL;
  }

  if (pMgmt->dnodeHash != NULL) {
    taosHashCleanup(pMgmt->dnodeHash);
    pMgmt->dnodeHash = NULL;
  }

  // free(NULL) is a no-op, so the path needs no guard.
  free(pMgmt->file);
  pMgmt->file = NULL;

  taosWUnLockLatch(&pMgmt->latch);

  dInfo("dnode-mgmt is cleaned up");
}

S
Shengliang Guan 已提交
582
// Entry point for management messages. Status responses first refresh the
// mnode endpoint set (when a non-empty one is supplied) and go to the
// status worker; everything else goes to the mgmt worker. If the message
// cannot be queued, message types with the low bit set get an
// out-of-memory response, and the message content and the message itself
// are freed.
void dndProcessMgmtMsg(SDnode *pDnode, SRpcMsg *pMsg, SEpSet *pEpSet) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  bool        isStatusRsp = (pMsg->msgType == TDMT_MND_STATUS_RSP);

  if (isStatusRsp && pEpSet && pEpSet->numOfEps > 0) {
    dndUpdateMnodeEpSet(pDnode, pEpSet);
  }

  SDnodeWorker *pTarget = isStatusRsp ? &pMgmt->statusWorker : &pMgmt->mgmtWorker;
  if (dndWriteMsgToWorker(pTarget, pMsg, sizeof(SRpcMsg)) == 0) {
    return;
  }

  if (pMsg->msgType & 1u) {
    SRpcMsg rsp = {.handle = pMsg->handle, .code = TSDB_CODE_OUT_OF_MEMORY};
    rpcSendResponse(&rsp);
  }

  rpcFreeCont(pMsg->pCont);
  taosFreeQitem(pMsg);
}

// Worker callback: dispatch one queued message to its handler by msgType.
// Unknown types set terrno to TSDB_CODE_MSG_NOT_PROCESSED. For message
// types with the low bit set, a response is sent whose code is 0 on
// success and terrno otherwise. The message content and the queue item
// are freed before returning.
static void dndProcessMgmtQueue(SDnode *pDnode, SRpcMsg *pMsg) {
  int32_t rc = 0;

  switch (pMsg->msgType) {
    // mnode
    case TDMT_DND_CREATE_MNODE: rc = dndProcessCreateMnodeReq(pDnode, pMsg); break;
    case TDMT_DND_ALTER_MNODE:  rc = dndProcessAlterMnodeReq(pDnode, pMsg); break;
    case TDMT_DND_DROP_MNODE:   rc = dndProcessDropMnodeReq(pDnode, pMsg); break;

    // qnode / snode / bnode
    case TDMT_DND_CREATE_QNODE: rc = dndProcessCreateQnodeReq(pDnode, pMsg); break;
    case TDMT_DND_DROP_QNODE:   rc = dndProcessDropQnodeReq(pDnode, pMsg); break;
    case TDMT_DND_CREATE_SNODE: rc = dndProcessCreateSnodeReq(pDnode, pMsg); break;
    case TDMT_DND_DROP_SNODE:   rc = dndProcessDropSnodeReq(pDnode, pMsg); break;
    case TDMT_DND_CREATE_BNODE: rc = dndProcessCreateBnodeReq(pDnode, pMsg); break;
    case TDMT_DND_DROP_BNODE:   rc = dndProcessDropBnodeReq(pDnode, pMsg); break;

    // dnode config
    case TDMT_DND_CONFIG_DNODE: rc = dndProcessConfigDnodeReq(pDnode, pMsg); break;

    // responses coming back from the mnode (handlers return nothing)
    case TDMT_MND_STATUS_RSP: dndProcessStatusRsp(pDnode, pMsg); break;
    case TDMT_MND_AUTH_RSP:   dndProcessAuthRsp(pDnode, pMsg); break;
    case TDMT_MND_GRANT_RSP:  dndProcessGrantRsp(pDnode, pMsg); break;

    // vnode
    case TDMT_DND_CREATE_VNODE:  rc = dndProcessCreateVnodeReq(pDnode, pMsg); break;
    case TDMT_DND_ALTER_VNODE:   rc = dndProcessAlterVnodeReq(pDnode, pMsg); break;
    case TDMT_DND_DROP_VNODE:    rc = dndProcessDropVnodeReq(pDnode, pMsg); break;
    case TDMT_DND_SYNC_VNODE:    rc = dndProcessSyncVnodeReq(pDnode, pMsg); break;
    case TDMT_DND_COMPACT_VNODE: rc = dndProcessCompactVnodeReq(pDnode, pMsg); break;

    default:
      terrno = TSDB_CODE_MSG_NOT_PROCESSED;
      rc = -1;
      dError("RPC %p, dnode msg:%s not processed", pMsg->handle, TMSG_INFO(pMsg->msgType));
      break;
  }

  if (pMsg->msgType & 1u) {
    // Any failure is reported to the peer as the current terrno.
    int32_t rspCode = (rc != 0) ? terrno : rc;
    SRpcMsg rsp = {.code = rspCode, .handle = pMsg->handle, .ahandle = pMsg->ahandle};
    rpcSendResponse(&rsp);
  }

  rpcFreeCont(pMsg->pCont);
  pMsg->pCont = NULL;
  taosFreeQitem(pMsg);
}