dndMgmt.c 20.7 KB
Newer Older
S
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17
#include "dndMgmt.h"
S
Shengliang Guan 已提交
18 19 20 21
#include "dndBnode.h"
#include "dndMnode.h"
#include "dndQnode.h"
#include "dndSnode.h"
S
Shengliang Guan 已提交
22 23
#include "dndTransport.h"
#include "dndVnodes.h"
S
Shengliang Guan 已提交
24
#include "dndWorker.h"
S
Shengliang Guan 已提交
25

S
Shengliang Guan 已提交
26
/* dnode.json persistence and the periodic status thread. */
static int32_t dndReadDnodes(SDnode *pDnode);
static int32_t dndWriteDnodes(SDnode *pDnode);
static void   *dnodeThreadRoutine(void *param);

/* Per-message handlers invoked from dndProcessMgmtQueue(). */
static int32_t dndProcessConfigDnodeReq(SDnode *pDnode, SRpcMsg *pReq);
static void    dndProcessStatusRsp(SDnode *pDnode, SRpcMsg *pRsp);
static void    dndProcessAuthRsp(SDnode *pDnode, SRpcMsg *pRsp);
static void    dndProcessGrantRsp(SDnode *pDnode, SRpcMsg *pRsp);

/* Callback handed to dndInitWorker(); dispatches one queued message. */
static void dndProcessMgmtQueue(SDnode *pDnode, SRpcMsg *pMsg);
S
Shengliang Guan 已提交
36

S
Shengliang Guan 已提交
37
/*
 * Return the dnode id stored in the management state.
 * The field is read while holding the read latch.
 */
int32_t dndGetDnodeId(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  int32_t     id;

  taosRLockLatch(&pMgmt->latch);
  id = pMgmt->dnodeId;
  taosRUnLockLatch(&pMgmt->latch);

  return id;
}

S
Shengliang Guan 已提交
45
/*
 * Return the cluster id stored in the management state.
 * The field is read while holding the read latch.
 */
int64_t dndGetClusterId(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  int64_t     id;

  taosRLockLatch(&pMgmt->latch);
  id = pMgmt->clusterId;
  taosRUnLockLatch(&pMgmt->latch);

  return id;
}

S
Shengliang Guan 已提交
53
/*
 * Look up the endpoint of `dnodeId` in the dnode hash and copy the requested
 * parts out. Each of pEp ("fqdn:port"), pFqdn and pPort is optional and is
 * skipped when NULL. When the id is not in the hash, no output is written.
 */
void dndGetDnodeEp(SDnode *pDnode, int32_t dnodeId, char *pEp, char *pFqdn, uint16_t *pPort) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  taosRLockLatch(&pMgmt->latch);

  SDnodeEp *pFound = taosHashGet(pMgmt->dnodeHash, &dnodeId, sizeof(int32_t));
  if (pFound == NULL) {
    taosRUnLockLatch(&pMgmt->latch);
    return;
  }

  if (pPort != NULL) *pPort = pFound->ep.port;
  if (pFqdn != NULL) tstrncpy(pFqdn, pFound->ep.fqdn, TSDB_FQDN_LEN);
  if (pEp != NULL) snprintf(pEp, TSDB_EP_LEN, "%s:%u", pFound->ep.fqdn, pFound->ep.port);

  taosRUnLockLatch(&pMgmt->latch);
}
S
Shengliang Guan 已提交
72

S
Shengliang Guan 已提交
73
/* Copy the current mnode endpoint set into *pEpSet under the read latch. */
void dndGetMnodeEpSet(SDnode *pDnode, SEpSet *pEpSet) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  taosRLockLatch(&pMgmt->latch);
  *pEpSet = pMgmt->mnodeEpSet;
  taosRUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
80 81
/*
 * Answer pReq with a redirect that carries the current mnode endpoint set.
 * If one of the endpoints is this dnode itself (same fqdn and port), `inUse`
 * is moved to the entry after it. Every port is converted with htons() before
 * the set is handed to rpcSendRedirectRsp().
 */
void dndSendRedirectRsp(SDnode *pDnode, SRpcMsg *pReq) {
  SEpSet epSet = {0};
  dndGetMnodeEpSet(pDnode, &epSet);

  tmsg_t msgType = pReq->msgType;
  dDebug("RPC %p, req:%s is redirected, num:%d use:%d", pReq->handle, TMSG_INFO(msgType), epSet.numOfEps, epSet.inUse);

  int32_t idx = 0;
  while (idx < epSet.numOfEps) {
    dDebug("mnode index:%d %s:%u", idx, epSet.eps[idx].fqdn, epSet.eps[idx].port);

    // The comparison must use the host-order port, so it happens before htons().
    bool isLocal = strcmp(epSet.eps[idx].fqdn, pDnode->cfg.localFqdn) == 0 &&
                   epSet.eps[idx].port == pDnode->cfg.serverPort;
    if (isLocal) {
      epSet.inUse = (idx + 1) % epSet.numOfEps;
    }

    epSet.eps[idx].port = htons(epSet.eps[idx].port);
    ++idx;
  }

  rpcSendRedirectRsp(pReq->handle, &epSet);
}

S
Shengliang Guan 已提交
99
/* Replace the stored mnode endpoint set with *pEpSet (under the write latch) and log every entry. */
static void dndUpdateMnodeEpSet(SDnode *pDnode, SEpSet *pEpSet) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  dInfo("mnode is changed, num:%d use:%d", pEpSet->numOfEps, pEpSet->inUse);

  taosWLockLatch(&pMgmt->latch);

  pMgmt->mnodeEpSet = *pEpSet;

  int32_t idx = 0;
  while (idx < pEpSet->numOfEps) {
    dInfo("mnode index:%d %s:%u", idx, pEpSet->eps[idx].fqdn, pEpSet->eps[idx].port);
    ++idx;
  }

  taosWUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
113 114
/* Debug-log every entry of pMgmt->pDnodeEps. Takes no latch itself. */
static void dndPrintDnodes(SDnode *pDnode) {
  SArray *pEps = pDnode->dmgmt.pDnodeEps;
  int32_t total = (int32_t)taosArrayGetSize(pEps);

  dDebug("print dnode ep list, num:%d", total);

  for (int32_t idx = 0; idx < total; ++idx) {
    SDnodeEp *pItem = taosArrayGet(pEps, idx);
    dDebug("dnode:%d, fqdn:%s port:%u isMnode:%d", pItem->id, pItem->ep.fqdn, pItem->ep.port, pItem->isMnode);
  }
}

S
Shengliang Guan 已提交
124
/*
 * Make pDnodeEps the current dnode list and rebuild the derived state:
 *   - pMgmt->pDnodeEps becomes a duplicate of pDnodeEps (unless it already is
 *     that very array), and the previous array is destroyed;
 *   - pMgmt->mnodeEpSet is rebuilt from the entries flagged isMnode, capped at
 *     TSDB_MAX_REPLICA entries, with inUse reset to 0;
 *   - every entry is put into pMgmt->dnodeHash keyed by its id.
 * No latch is taken here.
 */
static void dndResetDnodes(SDnode *pDnode, SArray *pDnodeEps) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  if (pMgmt->pDnodeEps != pDnodeEps) {
    SArray *pPrev = pMgmt->pDnodeEps;
    pMgmt->pDnodeEps = taosArrayDup(pDnodeEps);
    taosArrayDestroy(pPrev);
  }

  pMgmt->mnodeEpSet.inUse = 0;
  pMgmt->mnodeEpSet.numOfEps = 0;

  int32_t mnodeCnt = 0;
  int32_t total = (int32_t)taosArrayGetSize(pDnodeEps);

  for (int32_t idx = 0; idx < total; ++idx) {
    SDnodeEp *pItem = taosArrayGet(pDnodeEps, idx);

    if (pItem->isMnode && mnodeCnt < TSDB_MAX_REPLICA) {
      pMgmt->mnodeEpSet.numOfEps++;
      pMgmt->mnodeEpSet.eps[mnodeCnt] = pItem->ep;
      mnodeCnt++;
    }

    taosHashPut(pMgmt->dnodeHash, &pItem->id, sizeof(int32_t), pItem, sizeof(SDnodeEp));
  }

  dndPrintDnodes(pDnode);
}

S
Shengliang Guan 已提交
157
/*
 * Compare pEp with the "fqdn:port" recorded for dnodeId in the dnode hash.
 * Returns true only when the id is in the hash and the strings differ.
 * An id that is not in the hash yields false.
 */
static bool dndIsEpChanged(SDnode *pDnode, int32_t dnodeId, char *pEp) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  bool        differs = false;

  taosRLockLatch(&pMgmt->latch);

  SDnodeEp *pStored = taosHashGet(pMgmt->dnodeHash, &dnodeId, sizeof(int32_t));
  if (pStored != NULL) {
    char storedEp[TSDB_EP_LEN + 1];
    snprintf(storedEp, TSDB_EP_LEN, "%s:%u", pStored->ep.fqdn, pStored->ep.port);
    differs = (strcmp(pEp, storedEp) != 0);
  }

  taosRUnLockLatch(&pMgmt->latch);

  return differs;
}

S
Shengliang Guan 已提交
174 175
/*
 * Load the persisted dnode state from pMgmt->file (JSON) into pMgmt:
 * dnodeId, clusterId, dropped and the list of dnode endpoints.
 *
 * A missing file is not an error. If no endpoint could be loaded, a single
 * mnode entry built from cfg.firstEp is used instead. The list is finally
 * installed through dndResetDnodes().
 *
 * Returns 0 on success; -1 when memory cannot be allocated (terrno is set to
 * TSDB_CODE_OUT_OF_MEMORY) or when the local endpoint check fails.
 */
static int32_t dndReadDnodes(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  // Everything the cleanup label touches is initialised before the first goto,
  // so no jump can reach the cleanup with an indeterminate pointer.
  int32_t code = TSDB_CODE_DND_DNODE_READ_FILE_ERROR;
  int32_t len = 0;
  int32_t maxLen = 256 * 1024;
  char   *content = NULL;
  cJSON  *root = NULL;
  FILE   *fp = NULL;

  pMgmt->pDnodeEps = taosArrayInit(1, sizeof(SDnodeEp));
  if (pMgmt->pDnodeEps == NULL) {
    dError("failed to calloc dnodeEp array since %s", strerror(errno));
    // Nothing below can work without the array, so fail right away.
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  fp = fopen(pMgmt->file, "r");
  if (fp == NULL) {
    dDebug("file %s not exist", pMgmt->file);
    code = 0;
    goto PARSE_DNODE_OVER;
  }

  // The read buffer is only needed once the file is known to exist.
  content = calloc(1, maxLen + 1);
  if (content == NULL) {
    dError("failed to read %s since out of memory", pMgmt->file);
    fclose(fp);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  len = (int32_t)fread(content, 1, maxLen, fp);
  if (len <= 0) {
    dError("failed to read %s since content is null", pMgmt->file);
    goto PARSE_DNODE_OVER;
  }

  content[len] = 0;
  root = cJSON_Parse(content);
  if (root == NULL) {
    dError("failed to read %s since invalid json format", pMgmt->file);
    goto PARSE_DNODE_OVER;
  }

  cJSON *dnodeId = cJSON_GetObjectItem(root, "dnodeId");
  if (!dnodeId || dnodeId->type != cJSON_Number) {
    dError("failed to read %s since dnodeId not found", pMgmt->file);
    goto PARSE_DNODE_OVER;
  }
  pMgmt->dnodeId = dnodeId->valueint;

  // clusterId is stored as a decimal string (see dndWriteDnodes).
  cJSON *clusterId = cJSON_GetObjectItem(root, "clusterId");
  if (!clusterId || clusterId->type != cJSON_String) {
    dError("failed to read %s since clusterId not found", pMgmt->file);
    goto PARSE_DNODE_OVER;
  }
  pMgmt->clusterId = atoll(clusterId->valuestring);

  cJSON *dropped = cJSON_GetObjectItem(root, "dropped");
  if (!dropped || dropped->type != cJSON_Number) {
    dError("failed to read %s since dropped not found", pMgmt->file);
    goto PARSE_DNODE_OVER;
  }
  pMgmt->dropped = dropped->valueint;

  cJSON *dnodes = cJSON_GetObjectItem(root, "dnodes");
  if (!dnodes || dnodes->type != cJSON_Array) {
    dError("failed to read %s since dnodes not found", pMgmt->file);
    goto PARSE_DNODE_OVER;
  }

  int32_t numOfDnodes = cJSON_GetArraySize(dnodes);
  if (numOfDnodes <= 0) {
    dError("failed to read %s since numOfDnodes:%d invalid", pMgmt->file, numOfDnodes);
    goto PARSE_DNODE_OVER;
  }

  for (int32_t i = 0; i < numOfDnodes; ++i) {
    cJSON *node = cJSON_GetArrayItem(dnodes, i);
    if (node == NULL) break;

    SDnodeEp dnodeEp = {0};

    cJSON *did = cJSON_GetObjectItem(node, "id");
    if (!did || did->type != cJSON_Number) {
      dError("failed to read %s since dnodeId not found", pMgmt->file);
      goto PARSE_DNODE_OVER;
    }

    // Use this entry's own "id", not the top-level "dnodeId" of the file.
    dnodeEp.id = did->valueint;

    cJSON *dnodeFqdn = cJSON_GetObjectItem(node, "fqdn");
    if (!dnodeFqdn || dnodeFqdn->type != cJSON_String || dnodeFqdn->valuestring == NULL) {
      dError("failed to read %s since dnodeFqdn not found", pMgmt->file);
      goto PARSE_DNODE_OVER;
    }
    tstrncpy(dnodeEp.ep.fqdn, dnodeFqdn->valuestring, TSDB_FQDN_LEN);

    cJSON *dnodePort = cJSON_GetObjectItem(node, "port");
    if (!dnodePort || dnodePort->type != cJSON_Number) {
      dError("failed to read %s since dnodePort not found", pMgmt->file);
      goto PARSE_DNODE_OVER;
    }

    dnodeEp.ep.port = dnodePort->valueint;

    cJSON *isMnode = cJSON_GetObjectItem(node, "isMnode");
    if (!isMnode || isMnode->type != cJSON_Number) {
      dError("failed to read %s since isMnode not found", pMgmt->file);
      goto PARSE_DNODE_OVER;
    }
    dnodeEp.isMnode = isMnode->valueint;

    taosArrayPush(pMgmt->pDnodeEps, &dnodeEp);
  }

  code = 0;
  dInfo("succcessed to read file %s", pMgmt->file);
  dndPrintDnodes(pDnode);

PARSE_DNODE_OVER:
  free(content);
  if (root != NULL) cJSON_Delete(root);
  if (fp != NULL) fclose(fp);

  // NOTE(review): `code` is not propagated. A parse failure is logged above and
  // then falls through to the steps below - confirm this leniency is intended.
  (void)code;

  // NOTE(review): within this file dnodeHash is only filled by dndResetDnodes(),
  // which runs after this check - confirm the check can actually fire here.
  if (dndIsEpChanged(pDnode, pMgmt->dnodeId, pDnode->cfg.localEp)) {
    dError("localEp %s different with %s and need reconfigured", pDnode->cfg.localEp, pMgmt->file);
    return -1;
  }

  // Nothing loaded: start from the configured first endpoint, flagged as mnode.
  if (taosArrayGetSize(pMgmt->pDnodeEps) == 0) {
    SDnodeEp dnodeEp = {0};
    dnodeEp.isMnode = 1;
    taosGetFqdnPortFromEp(pDnode->cfg.firstEp, &dnodeEp.ep);
    taosArrayPush(pMgmt->pDnodeEps, &dnodeEp);
  }

  dndResetDnodes(pDnode, pMgmt->pDnodeEps);

  terrno = 0;
  return 0;
}

S
Shengliang Guan 已提交
309 310
/*
 * Serialise dnodeId, clusterId, dropped and the dnode endpoint list to
 * pMgmt->file as JSON, then fsync the file and refresh pMgmt->updateTime.
 *
 * The text is built completely in memory before the file is opened, so an
 * allocation failure or an oversized list does not truncate the existing file.
 *
 * Returns 0 on success, -1 on failure with terrno set.
 */
static int32_t dndWriteDnodes(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  int32_t len = 0;
  int32_t maxLen = 256 * 1024;
  char   *content = calloc(1, maxLen + 1);
  if (content == NULL) {
    dError("failed to write %s since out of memory", pMgmt->file);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  // The fixed header is far smaller than maxLen, so these calls cannot truncate.
  len += snprintf(content + len, maxLen - len, "{\n");
  len += snprintf(content + len, maxLen - len, "  \"dnodeId\": %d,\n", pMgmt->dnodeId);
  len += snprintf(content + len, maxLen - len, "  \"clusterId\": \"%" PRId64 "\",\n", pMgmt->clusterId);
  len += snprintf(content + len, maxLen - len, "  \"dropped\": %d,\n", pMgmt->dropped);
  len += snprintf(content + len, maxLen - len, "  \"dnodes\": [{\n");

  // NOTE(review): with an empty list the "[{" opened above is never closed - confirm callers never write an empty list.
  int32_t numOfEps = (int32_t)taosArrayGetSize(pMgmt->pDnodeEps);
  for (int32_t i = 0; i < numOfEps; ++i) {
    SDnodeEp   *pDnodeEp = taosArrayGet(pMgmt->pDnodeEps, i);
    const char *tail = (i < numOfEps - 1) ? "  },{\n" : "  }]\n";

    // One call per entry: snprintf returns the untruncated length, so `len`
    // must be checked before it is used to compute the next remaining size.
    len += snprintf(content + len, maxLen - len,
                    "    \"id\": %d,\n"
                    "    \"fqdn\": \"%s\",\n"
                    "    \"port\": %u,\n"
                    "    \"isMnode\": %d\n"
                    "%s",
                    pDnodeEp->id, pDnodeEp->ep.fqdn, pDnodeEp->ep.port, pDnodeEp->isMnode, tail);
    if (len >= maxLen) break;
  }

  if (len < maxLen) {
    len += snprintf(content + len, maxLen - len, "}\n");
  }

  if (len >= maxLen) {
    dError("failed to write %s since content exceeds %d bytes", pMgmt->file, maxLen);
    free(content);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  FILE *fp = fopen(pMgmt->file, "w");
  if (fp == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    dError("failed to write %s since %s", pMgmt->file, strerror(errno));
    free(content);
    return -1;
  }

  if (fwrite(content, 1, len, fp) != (size_t)len) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    dError("failed to write %s since %s", pMgmt->file, strerror(errno));
    fclose(fp);
    free(content);
    return -1;
  }

  taosFsyncFile(fileno(fp));
  fclose(fp);
  free(content);
  terrno = 0;

  pMgmt->updateTime = taosGetTimestampMs();
  dDebug("successed to write %s", pMgmt->file);
  return 0;
}

S
Shengliang Guan 已提交
355
/*
 * Build a status request from the dnode's environment, configuration and
 * management state, attach the vnode loads, serialise it and send it to the
 * mnode as TDMT_MND_STATUS. pMgmt->statusSent is set to 1 before sending.
 */
void dndSendStatusReq(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  SStatusReq  req = {0};

  taosRLockLatch(&pMgmt->latch);

  // Fields taken from the management state.
  req.dver = pMgmt->dver;
  req.dnodeId = pMgmt->dnodeId;
  req.clusterId = pMgmt->clusterId;
  req.rebootTime = pMgmt->rebootTime;
  req.updateTime = pMgmt->updateTime;

  // Fields taken from the environment and configuration.
  req.sver = pDnode->env.sver;
  req.numOfCores = pDnode->env.numOfCores;
  req.numOfSupportVnodes = pDnode->cfg.numOfSupportVnodes;
  memcpy(req.dnodeEp, pDnode->cfg.localEp, TSDB_EP_LEN);

  req.clusterCfg.statusInterval = pDnode->cfg.statusInterval;
  req.clusterCfg.checkTime = 0;
  char epoch[32] = "1970-01-01 00:00:00.00";
  (void)taosParseTime(epoch, &req.clusterCfg.checkTime, (int32_t)strlen(epoch), TSDB_TIME_PRECISION_MILLI, 0);
  memcpy(req.clusterCfg.timezone, pDnode->env.timezone, TSDB_TIMEZONE_LEN);
  memcpy(req.clusterCfg.locale, pDnode->env.locale, TSDB_LOCALE_LEN);
  memcpy(req.clusterCfg.charset, pDnode->env.charset, TSDB_LOCALE_LEN);

  taosRUnLockLatch(&pMgmt->latch);

  req.pVloads = taosArrayInit(TSDB_MAX_VNODES, sizeof(SVnodeLoad));
  dndGetVnodeLoads(pDnode, req.pVloads);

  // First call with NULL yields the length; the second writes through a cursor.
  int32_t bodyLen = tSerializeSStatusReq(NULL, &req);
  void   *pBody = rpcMallocCont(bodyLen);
  void   *pCursor = pBody;
  tSerializeSStatusReq(&pCursor, &req);
  taosArrayDestroy(req.pVloads);

  SRpcMsg rpcMsg = {0};
  rpcMsg.pCont = pBody;
  rpcMsg.contLen = bodyLen;
  rpcMsg.msgType = TDMT_MND_STATUS;
  rpcMsg.ahandle = (void *)9527;

  pMgmt->statusSent = 1;

  dTrace("pDnode:%p, send status req to mnode", pDnode);
  dndSendReqToMnode(pDnode, &rpcMsg);
}

S
Shengliang Guan 已提交
395 396
/*
 * Adopt the dnodeId / clusterId assigned in pCfg, but only while this dnode
 * has no id yet (dnodeId == 0). The new values are stored and written to the
 * dnode file while holding the write latch.
 */
static void dndUpdateDnodeCfg(SDnode *pDnode, SDnodeCfg *pCfg) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  if (pMgmt->dnodeId != 0) return;

  // clusterId is printed in decimal, so the message carries no "0x" prefix.
  dInfo("set dnodeId:%d clusterId:%" PRId64, pCfg->dnodeId, pCfg->clusterId);

  taosWLockLatch(&pMgmt->latch);
  pMgmt->dnodeId = pCfg->dnodeId;
  pMgmt->clusterId = pCfg->clusterId;
  dndWriteDnodes(pDnode);
  taosWUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
407 408 409
/*
 * Install pDnodeEps as the current dnode list if it differs from the stored
 * one, either in element count or in raw content (memcmp over the array
 * data), and persist the result. An empty list is ignored.
 */
static void dndUpdateDnodeEps(SDnode *pDnode, SArray *pDnodeEps) {
  int32_t newCnt = taosArrayGetSize(pDnodeEps);
  if (newCnt <= 0) return;

  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  taosWLockLatch(&pMgmt->latch);

  int32_t oldCnt = (int32_t)taosArrayGetSize(pMgmt->pDnodeEps);
  bool    changed = (newCnt != oldCnt);
  if (!changed) {
    // Same count: fall back to a byte-wise comparison of the two arrays.
    int32_t bytes = newCnt * sizeof(SDnodeEp);
    changed = (memcmp(pMgmt->pDnodeEps->pData, pDnodeEps->pData, bytes) != 0);
  }

  if (changed) {
    dndResetDnodes(pDnode, pDnodeEps);
    dndWriteDnodes(pDnode);
  }

  taosWUnLockLatch(&pMgmt->latch);
}

S
Shengliang Guan 已提交
429
/*
 * Handle the mnode's answer to a status request.
 *   - Success: deserialise the body and apply dver, the dnode cfg and the
 *     dnode endpoint list.
 *   - TSDB_CODE_MND_DNODE_NOT_EXIST for a dnode that has an id and is not yet
 *     marked dropped: mark it dropped and persist that.
 * In every case statusSent is cleared at the end.
 */
static void dndProcessStatusRsp(SDnode *pDnode, SRpcMsg *pRsp) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  if (pRsp->code == TSDB_CODE_SUCCESS) {
    SStatusRsp statusRsp = {0};
    bool       hasBody = (pRsp->pCont != NULL && pRsp->contLen != 0);

    if (hasBody && tDeserializeSStatusRsp(pRsp->pCont, &statusRsp) != NULL) {
      pMgmt->dver = statusRsp.dver;
      dndUpdateDnodeCfg(pDnode, &statusRsp.dnodeCfg);
      dndUpdateDnodeEps(pDnode, statusRsp.pDnodeEps);
    }

    taosArrayDestroy(statusRsp.pDnodeEps);
  } else if (pRsp->code == TSDB_CODE_MND_DNODE_NOT_EXIST && !pMgmt->dropped && pMgmt->dnodeId > 0) {
    dInfo("dnode:%d, set to dropped since not exist in mnode", pMgmt->dnodeId);
    pMgmt->dropped = 1;
    dndWriteDnodes(pDnode);
  }

  pMgmt->statusSent = 0;
}
S
Shengliang Guan 已提交
450

S
Shengliang Guan 已提交
451
/* Auth responses are not handled yet; only an error is logged. */
static void dndProcessAuthRsp(SDnode *pDnode, SRpcMsg *pReq) {
  (void)pDnode;
  (void)pReq;
  dError("auth rsp is received, but not supported yet");
}
S
Shengliang Guan 已提交
452

S
Shengliang Guan 已提交
453 454 455
/* Grant responses are not handled yet; only an error is logged. */
static void dndProcessGrantRsp(SDnode *pDnode, SRpcMsg *pReq) {
  (void)pDnode;
  (void)pReq;
  dError("grant rsp is received, but not supported yet");
}
S
Shengliang Guan 已提交
456

S
Shengliang Guan 已提交
457 458 459
/*
 * Config-dnode requests are not supported yet.
 * Logs an error and returns TSDB_CODE_OPS_NOT_SUPPORT. terrno is set to the
 * same code because dndProcessMgmtQueue() reports terrno, not the handler's
 * return value, whenever a handler returns non-zero.
 */
static int32_t dndProcessConfigDnodeReq(SDnode *pDnode, SRpcMsg *pReq) {
  (void)pDnode;
  (void)pReq;
  dError("config req is received, but not supported yet");
  terrno = TSDB_CODE_OPS_NOT_SUPPORT;
  return TSDB_CODE_OPS_NOT_SUPPORT;
}

S
Shengliang Guan 已提交
463 464
/*
 * Answer a startup request with the current startup step, filled in by
 * dndGetStartup(). If the response body cannot be allocated, an empty
 * response carrying TSDB_CODE_OUT_OF_MEMORY is sent instead.
 */
void dndProcessStartupReq(SDnode *pDnode, SRpcMsg *pReq) {
  dDebug("startup req is received");

  SStartupReq *pStartup = rpcMallocCont(sizeof(SStartupReq));
  if (pStartup == NULL) {
    // Do not hand a NULL buffer to dndGetStartup(); report the failure instead.
    SRpcMsg rpcErr = {.handle = pReq->handle, .code = TSDB_CODE_OUT_OF_MEMORY};
    rpcSendResponse(&rpcErr);
    return;
  }

  dndGetStartup(pDnode, pStartup);

  dDebug("startup req is sent, step:%s desc:%s finished:%d", pStartup->name, pStartup->desc, pStartup->finished);

  SRpcMsg rpcRsp = {.handle = pReq->handle, .pCont = pStartup, .contLen = sizeof(SStartupReq)};
  rpcSendResponse(&rpcRsp);
}

static void *dnodeThreadRoutine(void *param) {
476 477
  SDnode     *pDnode = param;
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
S
Shengliang Guan 已提交
478
  int32_t     ms = pDnode->cfg.statusInterval * 1000;
S
Shengliang Guan 已提交
479

H
Haojun Liao 已提交
480 481
  setThreadName("dnode-hb");

S
Shengliang Guan 已提交
482 483
  while (true) {
    pthread_testcancel();
S
Shengliang Guan 已提交
484
    taosMsleep(ms);
S
Shengliang Guan 已提交
485

S
Shengliang Guan 已提交
486
    if (dndGetStat(pDnode) == DND_STAT_RUNNING && !pMgmt->statusSent && !pMgmt->dropped) {
S
Shengliang Guan 已提交
487
      dndSendStatusReq(pDnode);
S
Shengliang Guan 已提交
488
    }
S
Shengliang Guan 已提交
489 490 491
  }
}

S
Shengliang Guan 已提交
492
/*
 * Initialise the dnode management state:
 *   1. reset the ids and flags and initialise the latch;
 *   2. record the path "<dir.dnode>/dnode.json" and create the dnode hash;
 *   3. load the persisted state, refusing to start a dropped dnode;
 *   4. start the "dnode-mgmt" and "dnode-status" workers and the status thread.
 *
 * Returns 0 on success, -1 on any failure.
 * NOTE(review): resources acquired before a failing step are not released
 * here - presumably the caller runs dndCleanupMgmt(); confirm.
 */
int32_t dndInitMgmt(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  pMgmt->dnodeId = 0;
  pMgmt->rebootTime = taosGetTimestampMs();
  pMgmt->dropped = 0;
  pMgmt->clusterId = 0;
  taosInitRWLatch(&pMgmt->latch);

  char path[PATH_MAX];
  snprintf(path, PATH_MAX, "%s/dnode.json", pDnode->dir.dnode);
  pMgmt->file = strdup(path);
  if (pMgmt->file == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  pMgmt->dnodeHash = taosHashInit(4, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), true, HASH_NO_LOCK);
  if (pMgmt->dnodeHash == NULL) {
    dError("failed to init dnode hash");
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (dndReadDnodes(pDnode) != 0) {
    dError("failed to read file:%s since %s", pMgmt->file, terrstr());
    return -1;
  }

  if (pMgmt->dropped) {
    dError("dnode not start since its already dropped");
    return -1;
  }

  if (dndInitWorker(pDnode, &pMgmt->mgmtWorker, DND_WORKER_SINGLE, "dnode-mgmt", 1, 1, dndProcessMgmtQueue) != 0) {
    dError("failed to start dnode mgmt worker since %s", terrstr());
    return -1;
  }

  // Status responses get their own worker; both workers share one callback.
  if (dndInitWorker(pDnode, &pMgmt->statusWorker, DND_WORKER_SINGLE, "dnode-status", 1, 1, dndProcessMgmtQueue) != 0) {
    dError("failed to start dnode status worker since %s", terrstr());
    return -1;
  }

  pMgmt->threadId = taosCreateThread(dnodeThreadRoutine, pDnode);
  if (pMgmt->threadId == NULL) {
    dError("failed to init dnode thread");
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  dInfo("dnode-mgmt is initialized");
  return 0;
}

S
Shengliang Guan 已提交
547
/* Clean up both management workers, then destroy the status thread if one was created. */
void dndStopMgmt(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  dndCleanupWorker(&pMgmt->mgmtWorker);
  dndCleanupWorker(&pMgmt->statusWorker);

  if (pMgmt->threadId == NULL) return;

  taosDestoryThread(pMgmt->threadId);
  pMgmt->threadId = NULL;
}
S
Shengliang Guan 已提交
557

S
Shengliang Guan 已提交
558 559
/*
 * Release the dnode endpoint array, the dnode hash and the file path string
 * while holding the write latch, resetting each pointer to NULL.
 */
void dndCleanupMgmt(SDnode *pDnode) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;

  taosWLockLatch(&pMgmt->latch);

  if (pMgmt->pDnodeEps != NULL) {
    taosArrayDestroy(pMgmt->pDnodeEps);
  }
  pMgmt->pDnodeEps = NULL;

  if (pMgmt->dnodeHash != NULL) {
    taosHashCleanup(pMgmt->dnodeHash);
  }
  pMgmt->dnodeHash = NULL;

  // free(NULL) is a no-op, so no guard is needed for the path string.
  free(pMgmt->file);
  pMgmt->file = NULL;

  taosWUnLockLatch(&pMgmt->latch);

  dInfo("dnode-mgmt is cleaned up");
}

S
Shengliang Guan 已提交
581
/*
 * Entry point for management messages.
 * A status response that carries a non-empty endpoint set first refreshes the
 * stored mnode endpoint set. The message is then queued on the status worker
 * (status responses) or on the mgmt worker (everything else).
 * If queueing fails, requests (odd msgType) are answered with
 * TSDB_CODE_OUT_OF_MEMORY and the message is released.
 */
void dndProcessMgmtMsg(SDnode *pDnode, SRpcMsg *pMsg, SEpSet *pEpSet) {
  SDnodeMgmt *pMgmt = &pDnode->dmgmt;
  bool        isStatusRsp = (pMsg->msgType == TDMT_MND_STATUS_RSP);

  if (isStatusRsp && pEpSet && pEpSet->numOfEps > 0) {
    dndUpdateMnodeEpSet(pDnode, pEpSet);
  }

  SDnodeWorker *pWorker = isStatusRsp ? &pMgmt->statusWorker : &pMgmt->mgmtWorker;
  if (dndWriteMsgToWorker(pWorker, pMsg, sizeof(SRpcMsg)) == 0) {
    return;
  }

  if (pMsg->msgType & 1u) {
    SRpcMsg rsp = {.handle = pMsg->handle, .code = TSDB_CODE_OUT_OF_MEMORY};
    rpcSendResponse(&rsp);
  }

  rpcFreeCont(pMsg->pCont);
  taosFreeQitem(pMsg);
}

/*
 * Worker callback: dispatch one queued message to its handler by msgType.
 * Unknown types set terrno to TSDB_CODE_MSG_NOT_PROCESSED. For requests (odd
 * msgType) a response is sent carrying 0 on success, or terrno when the
 * handler returned non-zero. The message body and the queue item are freed
 * afterwards.
 */
static void dndProcessMgmtQueue(SDnode *pDnode, SRpcMsg *pMsg) {
  int32_t ret = 0;

  switch (pMsg->msgType) {
    /* mnode management */
    case TDMT_DND_CREATE_MNODE:
      ret = dndProcessCreateMnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_ALTER_MNODE:
      ret = dndProcessAlterMnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_DROP_MNODE:
      ret = dndProcessDropMnodeReq(pDnode, pMsg);
      break;

    /* qnode / snode / bnode management */
    case TDMT_DND_CREATE_QNODE:
      ret = dndProcessCreateQnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_DROP_QNODE:
      ret = dndProcessDropQnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_CREATE_SNODE:
      ret = dndProcessCreateSnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_DROP_SNODE:
      ret = dndProcessDropSnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_CREATE_BNODE:
      ret = dndProcessCreateBnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_DROP_BNODE:
      ret = dndProcessDropBnodeReq(pDnode, pMsg);
      break;

    /* vnode management */
    case TDMT_DND_CREATE_VNODE:
      ret = dndProcessCreateVnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_ALTER_VNODE:
      ret = dndProcessAlterVnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_DROP_VNODE:
      ret = dndProcessDropVnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_AUTH_VNODE:
      ret = dndProcessAuthVnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_SYNC_VNODE:
      ret = dndProcessSyncVnodeReq(pDnode, pMsg);
      break;
    case TDMT_DND_COMPACT_VNODE:
      ret = dndProcessCompactVnodeReq(pDnode, pMsg);
      break;

    /* dnode configuration */
    case TDMT_DND_CONFIG_DNODE:
      ret = dndProcessConfigDnodeReq(pDnode, pMsg);
      break;

    /* responses from the mnode; these handlers return nothing */
    case TDMT_MND_STATUS_RSP:
      dndProcessStatusRsp(pDnode, pMsg);
      break;
    case TDMT_MND_AUTH_RSP:
      dndProcessAuthRsp(pDnode, pMsg);
      break;
    case TDMT_MND_GRANT_RSP:
      dndProcessGrantRsp(pDnode, pMsg);
      break;

    default:
      terrno = TSDB_CODE_MSG_NOT_PROCESSED;
      ret = -1;
      dError("RPC %p, dnode msg:%s not processed", pMsg->handle, TMSG_INFO(pMsg->msgType));
      break;
  }

  if (pMsg->msgType & 1u) {
    // The handler's own return value is only a success/failure flag; the code
    // reported to the peer on failure is terrno.
    int32_t rspCode = (ret != 0) ? terrno : ret;
    SRpcMsg rsp = {.code = rspCode, .handle = pMsg->handle, .ahandle = pMsg->ahandle};
    rpcSendResponse(&rsp);
  }

  rpcFreeCont(pMsg->pCont);
  pMsg->pCont = NULL;
  taosFreeQitem(pMsg);
}