clientHb.c 23.5 KB
Newer Older
L
Liu Jicong 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

D
dapan1121 已提交
16
#include "catalog.h"
L
fix  
Liu Jicong 已提交
17
#include "clientInt.h"
D
dapan1121 已提交
18
#include "clientLog.h"
L
Liu Jicong 已提交
19
#include "scheduler.h"
L
fix  
Liu Jicong 已提交
20
#include "trpc.h"
L
Liu Jicong 已提交
21 22 23 24 25 26

/* Heartbeat manager state shared by every function in this file. */
static SClientHbMgr clientHbMgr = {0};

/*
 * Forward declarations of the heartbeat thread helpers defined further down.
 * Declared with (void) so they are real prototypes rather than old-style
 * declarations with an unspecified parameter list.
 */
static int32_t hbCreateThread(void);
static void    hbStopThread(void);

L
Liu Jicong 已提交
27 28
/*
 * Request-side heartbeat handler registered for CONN_TYPE__TMQ.
 * It adds nothing to the request and always reports success (0).
 */
static int32_t hbMqHbReqHandle(SClientHbKey *connKey, void *param, SClientHbReq *req) {
  (void)connKey;
  (void)param;
  (void)req;
  return 0;
}

L
Liu Jicong 已提交
29
/*
 * Response-side heartbeat handler registered for CONN_TYPE__TMQ.
 * The response is ignored and success (0) is always returned.
 */
static int32_t hbMqHbRspHandle(SAppHbMgr *pAppHbMgr, SClientHbRsp *pRsp) {
  (void)pAppHbMgr;
  (void)pRsp;
  return 0;
}
L
Liu Jicong 已提交
30

D
dapan 已提交
31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
static int32_t hbProcessUserAuthInfoRsp(void *value, int32_t valueLen, struct SCatalog *pCatalog) {
  int32_t code = 0;

  SUserAuthBatchRsp batchRsp = {0};
  if (tDeserializeSUserAuthBatchRsp(value, valueLen, &batchRsp) != 0) {
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int32_t numOfBatchs = taosArrayGetSize(batchRsp.pArray);
  for (int32_t i = 0; i < numOfBatchs; ++i) {
    SGetUserAuthRsp *rsp = taosArrayGet(batchRsp.pArray, i);
    tscDebug("hb user auth rsp, user:%s, version:%d", rsp->user, rsp->version);

    catalogUpdateUserAuthInfo(pCatalog, rsp);
  }

D
dapan1121 已提交
48
  taosArrayDestroy(batchRsp.pArray);
D
dapan 已提交
49 50 51
  return TSDB_CODE_SUCCESS;
}

D
dapan1121 已提交
52 53 54
static int32_t hbProcessDBInfoRsp(void *value, int32_t valueLen, struct SCatalog *pCatalog) {
  int32_t code = 0;

S
Shengliang Guan 已提交
55 56 57 58 59
  SUseDbBatchRsp batchUseRsp = {0};
  if (tDeserializeSUseDbBatchRsp(value, valueLen, &batchUseRsp) != 0) {
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }
D
dapan1121 已提交
60

S
Shengliang Guan 已提交
61 62 63
  int32_t numOfBatchs = taosArrayGetSize(batchUseRsp.pArray);
  for (int32_t i = 0; i < numOfBatchs; ++i) {
    SUseDbRsp *rsp = taosArrayGet(batchUseRsp.pArray, i);
L
fix  
Liu Jicong 已提交
64 65
    tscDebug("hb db rsp, db:%s, vgVersion:%d, uid:%" PRIx64, rsp->db, rsp->vgVersion, rsp->uid);

D
dapan1121 已提交
66
    if (rsp->vgVersion < 0) {
D
dapan1121 已提交
67
      code = catalogRemoveDB(pCatalog, rsp->db, rsp->uid);
D
dapan1121 已提交
68
    } else {
D
dapan1121 已提交
69
      SDBVgInfo vgInfo = {0};
D
dapan1121 已提交
70 71
      vgInfo.vgVersion = rsp->vgVersion;
      vgInfo.hashMethod = rsp->hashMethod;
D
dapan1121 已提交
72 73
      vgInfo.vgHash = taosHashInit(rsp->vgNum, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), true, HASH_ENTRY_LOCK);
      if (NULL == vgInfo.vgHash) {
D
dapan1121 已提交
74 75 76 77
        tscError("hash init[%d] failed", rsp->vgNum);
        return TSDB_CODE_TSC_OUT_OF_MEMORY;
      }

S
Shengliang Guan 已提交
78 79 80
      for (int32_t j = 0; j < rsp->vgNum; ++j) {
        SVgroupInfo *pInfo = taosArrayGet(rsp->pVgroupInfos, j);
        if (taosHashPut(vgInfo.vgHash, &pInfo->vgId, sizeof(int32_t), pInfo, sizeof(SVgroupInfo)) != 0) {
D
dapan1121 已提交
81
          tscError("hash push failed, errno:%d", errno);
D
dapan1121 已提交
82
          taosHashCleanup(vgInfo.vgHash);
D
dapan1121 已提交
83 84
          return TSDB_CODE_TSC_OUT_OF_MEMORY;
        }
L
fix  
Liu Jicong 已提交
85 86
      }

D
dapan1121 已提交
87
      catalogUpdateDBVgInfo(pCatalog, rsp->db, rsp->uid, &vgInfo);
D
dapan1121 已提交
88 89 90 91 92 93 94
    }

    if (code) {
      return code;
    }
  }

S
Shengliang Guan 已提交
95
  tFreeSUseDbBatchRsp(&batchUseRsp);
D
dapan1121 已提交
96 97 98
  return TSDB_CODE_SUCCESS;
}

D
dapan 已提交
99 100 101
static int32_t hbProcessStbInfoRsp(void *value, int32_t valueLen, struct SCatalog *pCatalog) {
  int32_t code = 0;

D
dapan1121 已提交
102 103
  SSTbHbRsp hbRsp = {0};
  if (tDeserializeSSTbHbRsp(value, valueLen, &hbRsp) != 0) {
S
Shengliang Guan 已提交
104 105 106 107
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

D
dapan1121 已提交
108 109 110
  int32_t numOfMeta = taosArrayGetSize(hbRsp.pMetaRsp);
  for (int32_t i = 0; i < numOfMeta; ++i) {
    STableMetaRsp *rsp = taosArrayGet(hbRsp.pMetaRsp, i);
S
Shengliang Guan 已提交
111

D
dapan 已提交
112 113
    if (rsp->numOfColumns < 0) {
      tscDebug("hb remove stb, db:%s, stb:%s", rsp->dbFName, rsp->stbName);
D
dapan1121 已提交
114
      catalogRemoveStbMeta(pCatalog, rsp->dbFName, rsp->dbId, rsp->stbName, rsp->suid);
D
dapan 已提交
115
    } else {
D
dapan1121 已提交
116
      tscDebug("hb update stb, db:%s, stb:%s", rsp->dbFName, rsp->stbName);
S
Shengliang Guan 已提交
117
      if (rsp->pSchemas[0].colId != PRIMARYKEY_TIMESTAMP_COL_ID) {
118
        tscError("invalid colId[%" PRIi16 "] for the first column in table meta rsp msg", rsp->pSchemas[0].colId);
D
dapan1121 已提交
119
        tFreeSSTbHbRsp(&hbRsp);
D
dapan1121 已提交
120
        return TSDB_CODE_TSC_INVALID_VALUE;
D
dapan 已提交
121 122
      }

D
dapan1121 已提交
123
      catalogUpdateTableMeta(pCatalog, rsp);
D
dapan 已提交
124 125 126
    }
  }

D
dapan1121 已提交
127 128 129 130 131 132 133 134 135 136
  int32_t numOfIndex = taosArrayGetSize(hbRsp.pIndexRsp);
  for (int32_t i = 0; i < numOfIndex; ++i) {
    STableIndexRsp *rsp = taosArrayGet(hbRsp.pIndexRsp, i);

    catalogUpdateTableIndex(pCatalog, rsp);
  }

  taosArrayDestroy(hbRsp.pIndexRsp);
  hbRsp.pIndexRsp = NULL;

D
dapan1121 已提交
137
  tFreeSSTbHbRsp(&hbRsp);
D
dapan 已提交
138 139 140
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
141
/*
 * Response-side heartbeat handler registered for CONN_TYPE__QUERY.
 *
 * Step 1: if the response carries a query section and the connection object
 *         can still be acquired, refresh the mnode epset (when it changed and
 *         the cluster reports more than one dnode), store the connection id,
 *         stop the request named by killRid, close the connection when
 *         killConnection is set, and update the qnode list.
 * Step 2: walk the kv list in the response and dispatch each entry by key to
 *         the user-auth / db / stb processors above.
 *
 * pAppHbMgr  heartbeat manager whose activeInfo holds the registered requests
 * pRsp       one decoded heartbeat response
 *
 * Always returns TSDB_CODE_SUCCESS; failures of individual kv entries are
 * logged and skipped.
 */
static int32_t hbQueryHbRspHandle(SAppHbMgr *pAppHbMgr, SClientHbRsp *pRsp) {
  SClientHbReq *pReq = taosHashGet(pAppHbMgr->activeInfo, &pRsp->connKey, sizeof(SClientHbKey));
  if (pReq == NULL) {
    tscWarn("pReq to get activeInfo, may be dropped, refId:%" PRIx64 ", type:%d", pRsp->connKey.tscRid,
            pRsp->connKey.connType);
    return TSDB_CODE_SUCCESS;
  }

  if (pRsp->query) {
    STscObj *pTscObj = (STscObj *)acquireTscObj(pRsp->connKey.tscRid);
    if (pTscObj != NULL) {
      if (pRsp->query->totalDnodes > 1 && !isEpsetEqual(&pTscObj->pAppInfo->mgmtEp.epSet, &pRsp->query->epSet)) {
        SEpSet *pCurSet = &pTscObj->pAppInfo->mgmtEp.epSet;
        SEp    *pCurEp = &pCurSet->eps[pCurSet->inUse];
        SEp    *pNextEp = &pRsp->query->epSet.eps[pRsp->query->epSet.inUse];
        tscDebug("mnode epset updated from %d/%d=>%s:%d to %d/%d=>%s:%d in hb",
                 pCurSet->inUse, pCurSet->numOfEps, pCurEp->fqdn, pCurEp->port,
                 pRsp->query->epSet.inUse, pRsp->query->epSet.numOfEps, pNextEp->fqdn, pNextEp->port);

        updateEpSet_s(&pTscObj->pAppInfo->mgmtEp, &pRsp->query->epSet);
      }

      pTscObj->connId = pRsp->query->connId;

      if (pRsp->query->killRid) {
        SRequestObj *pVictim = acquireRequest(pRsp->query->killRid);
        if (pVictim != NULL) {
          taos_stop_query((TAOS_RES *)pVictim);
          releaseRequest(pRsp->query->killRid);
        } else {
          tscDebug("request 0x%" PRIx64 " not exist to kill", pRsp->query->killRid);
        }
      }

      if (pRsp->query->killConnection) {
        taos_close_internal(pTscObj);
      }

      if (pRsp->query->pQnodeList) {
        updateQnodeList(pTscObj->pAppInfo, pRsp->query->pQnodeList);
      }

      releaseTscObj(pRsp->connKey.tscRid);
    } else {
      tscDebug("tscObj rid %" PRIx64 " not exist", pRsp->connKey.tscRid);
    }
  }

  int32_t kvNum = 0;
  if (pRsp->info) {
    kvNum = taosArrayGetSize(pRsp->info);
  }

  tscDebug("hb got %d rsp kv", kvNum);

  for (int32_t idx = 0; idx < kvNum; ++idx) {
    SKv *kv = taosArrayGet(pRsp->info, idx);

    switch (kv->key) {
      case HEARTBEAT_KEY_USER_AUTHINFO: {
        if (kv->valueLen > 0 && NULL != kv->value) {
          struct SCatalog *pCatalog = NULL;
          int32_t          rc = catalogGetHandle(pReq->clusterId, &pCatalog);
          if (TSDB_CODE_SUCCESS == rc) {
            hbProcessUserAuthInfoRsp(kv->value, kv->valueLen, pCatalog);
          } else {
            tscWarn("catalogGetHandle failed, clusterId:%" PRIx64 ", error:%s", pReq->clusterId, tstrerror(rc));
          }
        } else {
          tscError("invalid hb user auth info, len:%d, value:%p", kv->valueLen, kv->value);
        }
        break;
      }
      case HEARTBEAT_KEY_DBINFO: {
        if (kv->valueLen > 0 && NULL != kv->value) {
          struct SCatalog *pCatalog = NULL;
          int32_t          rc = catalogGetHandle(pReq->clusterId, &pCatalog);
          if (TSDB_CODE_SUCCESS == rc) {
            hbProcessDBInfoRsp(kv->value, kv->valueLen, pCatalog);
          } else {
            tscWarn("catalogGetHandle failed, clusterId:%" PRIx64 ", error:%s", pReq->clusterId, tstrerror(rc));
          }
        } else {
          tscError("invalid hb db info, len:%d, value:%p", kv->valueLen, kv->value);
        }
        break;
      }
      case HEARTBEAT_KEY_STBINFO: {
        if (kv->valueLen > 0 && NULL != kv->value) {
          struct SCatalog *pCatalog = NULL;
          int32_t          rc = catalogGetHandle(pReq->clusterId, &pCatalog);
          if (TSDB_CODE_SUCCESS == rc) {
            hbProcessStbInfoRsp(kv->value, kv->valueLen, pCatalog);
          } else {
            tscWarn("catalogGetHandle failed, clusterId:%" PRIx64 ", error:%s", pReq->clusterId, tstrerror(rc));
          }
        } else {
          tscError("invalid hb stb info, len:%d, value:%p", kv->valueLen, kv->value);
        }
        break;
      }
      default:
        tscError("invalid hb key type:%d", kv->key);
        break;
    }
  }

  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
255
static int32_t hbAsyncCallBack(void *param, const SDataBuf *pMsg, int32_t code) {
D
dapan1121 已提交
256
  static int32_t emptyRspNum = 0;
L
Liu Jicong 已提交
257
  if (code != 0) {
wafwerar's avatar
wafwerar 已提交
258
    taosMemoryFreeClear(param);
L
Liu Jicong 已提交
259 260
    return -1;
  }
S
Shengliang Guan 已提交
261

L
fix  
Liu Jicong 已提交
262
  char             *key = (char *)param;
D
dapan1121 已提交
263
  SClientHbBatchRsp pRsp = {0};
S
Shengliang Guan 已提交
264
  tDeserializeSClientHbBatchRsp(pMsg->pData, pMsg->len, &pRsp);
L
fix  
Liu Jicong 已提交
265

D
dapan1121 已提交
266
  int32_t rspNum = taosArrayGetSize(pRsp.rsps);
D
dapan1121 已提交
267

L
fix  
Liu Jicong 已提交
268
  SAppInstInfo **pInst = taosHashGet(appInfo.pInstMap, key, strlen(key));
D
dapan1121 已提交
269
  if (pInst == NULL || NULL == *pInst) {
L
fix  
Liu Jicong 已提交
270
    tscError("cluster not exist, key:%s", key);
wafwerar's avatar
wafwerar 已提交
271
    taosMemoryFreeClear(param);
D
dapan1121 已提交
272
    tFreeClientHbBatchRsp(&pRsp);
D
dapan1121 已提交
273 274 275
    return -1;
  }

wafwerar's avatar
wafwerar 已提交
276
  taosMemoryFreeClear(param);
D
dapan1121 已提交
277 278

  if (rspNum) {
L
fix  
Liu Jicong 已提交
279 280
    tscDebug("hb got %d rsp, %d empty rsp received before", rspNum,
             atomic_val_compare_exchange_32(&emptyRspNum, emptyRspNum, 0));
D
dapan1121 已提交
281 282 283 284 285
  } else {
    atomic_add_fetch_32(&emptyRspNum, 1);
  }

  for (int32_t i = 0; i < rspNum; ++i) {
L
fix  
Liu Jicong 已提交
286
    SClientHbRsp *rsp = taosArrayGet(pRsp.rsps, i);
D
dapan1121 已提交
287
    code = (*clientHbMgr.rspHandle[rsp->connKey.connType])((*pInst)->pAppHbMgr, rsp);
D
dapan1121 已提交
288 289 290 291
    if (code) {
      break;
    }
  }
D
dapan1121 已提交
292 293

  tFreeClientHbBatchRsp(&pRsp);
L
fix  
Liu Jicong 已提交
294

D
dapan1121 已提交
295
  return code;
L
Liu Jicong 已提交
296 297
}

D
dapan1121 已提交
298
/*
 * Append one SQueryDesc to hbBasic->queryDesc for every request of pObj that
 * can still be acquired.
 *
 * hbBasic  heartbeat query section being built; queryDesc must already be an
 *          initialized array, and pid is copied into every descriptor
 * pObj     connection object whose pRequests hash is walked
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_OUT_OF_MEMORY when a sub-task
 * array cannot be allocated or a descriptor cannot be appended. Descriptors
 * appended before a failure stay in hbBasic->queryDesc.
 *
 * A failure of schedulerGetTasksStatus() is not fatal: the descriptor is still
 * reported, just without sub-task details.
 *
 * Both early-return paths cancel the hash iteration before leaving the loop.
 */
int32_t hbBuildQueryDesc(SQueryHbReqBasic *hbBasic, STscObj *pObj) {
  int64_t    now = taosGetTimestampUs();
  SQueryDesc desc = {0};
  int32_t    code = 0;

  void *pIter = taosHashIterate(pObj->pRequests, NULL);
  while (pIter != NULL) {
    int64_t     *rid = pIter;
    SRequestObj *pRequest = acquireRequest(*rid);
    if (NULL == pRequest) {
      pIter = taosHashIterate(pObj->pRequests, pIter);
      continue;
    }

    tstrncpy(desc.sql, pRequest->sqlstr, sizeof(desc.sql));
    desc.stime = pRequest->metric.start / 1000;
    desc.queryId = pRequest->requestId;
    desc.useconds = now - pRequest->metric.start;
    desc.reqRid = pRequest->self;
    desc.pid = hbBasic->pid;
    desc.stableQuery = pRequest->stableQuery;
    taosGetFqdn(desc.fqdn);
    desc.subPlanNum = pRequest->body.pDag ? pRequest->body.pDag->numOfSubplans : 0;

    if (desc.subPlanNum) {
      desc.subDesc = taosArrayInit(desc.subPlanNum, sizeof(SQuerySubDesc));
      if (NULL == desc.subDesc) {
        releaseRequest(*rid);
        /* leaving the loop early: the iterator must be cancelled explicitly */
        taosHashCancelIterate(pObj->pRequests, pIter);
        return TSDB_CODE_QRY_OUT_OF_MEMORY;
      }

      code = schedulerGetTasksStatus(pRequest->body.queryJob, desc.subDesc);
      if (code) {
        taosArrayDestroy(desc.subDesc);
        desc.subDesc = NULL;
        desc.subPlanNum = 0;
      }
    } else {
      desc.subDesc = NULL;
    }

    releaseRequest(*rid);
    if (NULL == taosArrayPush(hbBasic->queryDesc, &desc)) {
      /* the descriptor was not stored, so nobody else owns its sub array */
      if (desc.subDesc) {
        taosArrayDestroy(desc.subDesc);
        desc.subDesc = NULL;
      }
      taosHashCancelIterate(pObj->pRequests, pIter);
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }

    pIter = taosHashIterate(pObj->pRequests, pIter);
  }

  return TSDB_CODE_SUCCESS;
}

/*
 * Build the query section (SQueryHbReqBasic) of a heartbeat request for one
 * connection and store it in req->query.
 *
 * connKey  identifies the connection; tscRid is used to acquire the STscObj
 * req      heartbeat request that receives the new query section
 *
 * Returns TSDB_CODE_SUCCESS on success; TSDB_CODE_QRY_APP_ERROR when the
 * connection object no longer exists; TSDB_CODE_QRY_OUT_OF_MEMORY on
 * allocation failure; or the error from hbBuildQueryDesc(). req->query is
 * only assigned on success.
 *
 * When hbBuildQueryDesc() fails, the descriptors it had already collected
 * (and their sub-task arrays) are released together with hbBasic.
 */
int32_t hbGetQueryBasicInfo(SClientHbKey *connKey, SClientHbReq *req) {
  STscObj *pTscObj = (STscObj *)acquireTscObj(connKey->tscRid);
  if (NULL == pTscObj) {
    tscWarn("tscObj rid %" PRIx64 " not exist", connKey->tscRid);
    return TSDB_CODE_QRY_APP_ERROR;
  }

  SQueryHbReqBasic *hbBasic = (SQueryHbReqBasic *)taosMemoryCalloc(1, sizeof(SQueryHbReqBasic));
  if (NULL == hbBasic) {
    tscError("calloc %d failed", (int32_t)sizeof(SQueryHbReqBasic));
    releaseTscObj(connKey->tscRid);
    return TSDB_CODE_QRY_OUT_OF_MEMORY;
  }

  hbBasic->connId = pTscObj->connId;
  hbBasic->pid = taosGetPId();
  taosGetAppName(hbBasic->app, NULL);

  int32_t numOfQueries = pTscObj->pRequests ? taosHashGetSize(pTscObj->pRequests) : 0;
  if (numOfQueries <= 0) {
    /* nothing running: report the basic info with queryDesc left NULL */
    req->query = hbBasic;
    releaseTscObj(connKey->tscRid);
    tscDebug("no queries on connection");
    return TSDB_CODE_SUCCESS;
  }

  hbBasic->queryDesc = taosArrayInit(numOfQueries, sizeof(SQueryDesc));
  if (NULL == hbBasic->queryDesc) {
    tscWarn("taosArrayInit %d queryDesc failed", numOfQueries);
    releaseTscObj(connKey->tscRid);
    taosMemoryFree(hbBasic);
    return TSDB_CODE_QRY_OUT_OF_MEMORY;
  }

  int32_t code = hbBuildQueryDesc(hbBasic, pTscObj);
  if (code) {
    releaseTscObj(connKey->tscRid);

    /* release whatever was collected before the failure */
    int32_t built = taosArrayGetSize(hbBasic->queryDesc);
    for (int32_t i = 0; i < built; ++i) {
      SQueryDesc *pDesc = taosArrayGet(hbBasic->queryDesc, i);
      if (pDesc->subDesc) {
        taosArrayDestroy(pDesc->subDesc);
        pDesc->subDesc = NULL;
      }
    }
    taosArrayDestroy(hbBasic->queryDesc);
    hbBasic->queryDesc = NULL;

    taosMemoryFree(hbBasic);
    return code;
  }

  req->query = hbBasic;
  releaseTscObj(connKey->tscRid);

  return TSDB_CODE_SUCCESS;
}

D
dapan 已提交
396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422
/*
 * Attach the list of expired user-auth versions to a heartbeat request.
 *
 * connKey   not used by this function
 * pCatalog  catalog queried through catalogGetExpiredUsers()
 * req       heartbeat request; req->info is created on demand and receives one
 *           kv entry keyed by HEARTBEAT_KEY_USER_AUTHINFO
 *
 * Each version field is converted with htonl() in place before the array is
 * attached. Returns TSDB_CODE_SUCCESS (also when nothing has expired), the
 * catalog error, or TSDB_CODE_TSC_OUT_OF_MEMORY when the kv cannot be stored.
 *
 * NOTE(review): on the failure paths the array is released with
 * taosMemoryFree(); this assumes the catalog allocated it with the taosMemory*
 * family - confirm against catalogGetExpiredUsers().
 */
int32_t hbGetExpiredUserInfo(SClientHbKey *connKey, struct SCatalog *pCatalog, SClientHbReq *req) {
  SUserAuthVersion *users = NULL;
  uint32_t          userNum = 0;
  int32_t           code = 0;

  code = catalogGetExpiredUsers(pCatalog, &users, &userNum);
  if (TSDB_CODE_SUCCESS != code) {
    return code;
  }

  if (0 == userNum) {
    return TSDB_CODE_SUCCESS;
  }

  for (uint32_t i = 0; i < userNum; ++i) {
    SUserAuthVersion *user = &users[i];
    user->version = htonl(user->version);
  }

  SKv kv = {
      .key = HEARTBEAT_KEY_USER_AUTHINFO,
      .valueLen = sizeof(SUserAuthVersion) * userNum,
      .value = users,
  };

  tscDebug("hb got %d expired users, valueLen:%d", userNum, kv.valueLen);

  if (NULL == req->info) {
    req->info = taosHashInit(64, hbKeyHashFunc, 1, HASH_ENTRY_LOCK);
    if (NULL == req->info) {
      taosMemoryFree(users);
      return TSDB_CODE_TSC_OUT_OF_MEMORY;
    }
  }

  /* the kv struct is copied into the hash; the users array itself is shared by pointer */
  if (taosHashPut(req->info, &kv.key, sizeof(kv.key), &kv, sizeof(kv)) != 0) {
    taosMemoryFree(users);
    return TSDB_CODE_TSC_OUT_OF_MEMORY;
  }

  return TSDB_CODE_SUCCESS;
}


D
dapan1121 已提交
433 434
/*
 * Attach the list of expired database vgroup versions to a heartbeat request.
 *
 * connKey   not used by this function
 * pCatalog  catalog queried through catalogGetExpiredDBs()
 * req       heartbeat request; req->info is created on demand and receives one
 *           kv entry keyed by HEARTBEAT_KEY_DBINFO
 *
 * dbId is converted with htobe64() and vgVersion/numOfTable with htonl(), in
 * place, before the array is attached. Returns TSDB_CODE_SUCCESS (also when
 * nothing has expired), the catalog error, or TSDB_CODE_TSC_OUT_OF_MEMORY when
 * the kv cannot be stored.
 *
 * NOTE(review): on the failure paths the array is released with
 * taosMemoryFree(); this assumes the catalog allocated it with the taosMemory*
 * family - confirm against catalogGetExpiredDBs().
 */
int32_t hbGetExpiredDBInfo(SClientHbKey *connKey, struct SCatalog *pCatalog, SClientHbReq *req) {
  SDbVgVersion *dbs = NULL;
  uint32_t      dbNum = 0;
  int32_t       code = 0;

  code = catalogGetExpiredDBs(pCatalog, &dbs, &dbNum);
  if (TSDB_CODE_SUCCESS != code) {
    return code;
  }

  if (0 == dbNum) {
    return TSDB_CODE_SUCCESS;
  }

  for (uint32_t i = 0; i < dbNum; ++i) {
    SDbVgVersion *db = &dbs[i];
    db->dbId = htobe64(db->dbId);
    db->vgVersion = htonl(db->vgVersion);
    db->numOfTable = htonl(db->numOfTable);
  }

  SKv kv = {
      .key = HEARTBEAT_KEY_DBINFO,
      .valueLen = sizeof(SDbVgVersion) * dbNum,
      .value = dbs,
  };

  tscDebug("hb got %d expired db, valueLen:%d", dbNum, kv.valueLen);

  if (NULL == req->info) {
    req->info = taosHashInit(64, hbKeyHashFunc, 1, HASH_ENTRY_LOCK);
    if (NULL == req->info) {
      taosMemoryFree(dbs);
      return TSDB_CODE_TSC_OUT_OF_MEMORY;
    }
  }

  /* the kv struct is copied into the hash; the dbs array itself is shared by pointer */
  if (taosHashPut(req->info, &kv.key, sizeof(kv.key), &kv, sizeof(kv)) != 0) {
    taosMemoryFree(dbs);
    return TSDB_CODE_TSC_OUT_OF_MEMORY;
  }

  return TSDB_CODE_SUCCESS;
}

D
dapan 已提交
471
/*
 * Attach the list of expired super-table versions to a heartbeat request.
 *
 * connKey   not used by this function
 * pCatalog  catalog queried through catalogGetExpiredSTables()
 * req       heartbeat request; req->info is created on demand and receives one
 *           kv entry keyed by HEARTBEAT_KEY_STBINFO
 *
 * suid is converted with htobe64(), sversion/tversion with htons() and smaVer
 * with htonl(), in place, before the array is attached. Returns
 * TSDB_CODE_SUCCESS (also when nothing has expired), the catalog error, or
 * TSDB_CODE_TSC_OUT_OF_MEMORY when the kv cannot be stored.
 *
 * NOTE(review): on the failure paths the array is released with
 * taosMemoryFree(); this assumes the catalog allocated it with the taosMemory*
 * family - confirm against catalogGetExpiredSTables().
 */
int32_t hbGetExpiredStbInfo(SClientHbKey *connKey, struct SCatalog *pCatalog, SClientHbReq *req) {
  SSTableVersion *stbs = NULL;
  uint32_t        stbNum = 0;
  int32_t         code = 0;

  code = catalogGetExpiredSTables(pCatalog, &stbs, &stbNum);
  if (TSDB_CODE_SUCCESS != code) {
    return code;
  }

  if (0 == stbNum) {
    return TSDB_CODE_SUCCESS;
  }

  for (uint32_t i = 0; i < stbNum; ++i) {
    SSTableVersion *stb = &stbs[i];
    stb->suid = htobe64(stb->suid);
    stb->sversion = htons(stb->sversion);
    stb->tversion = htons(stb->tversion);
    stb->smaVer = htonl(stb->smaVer);
  }

  SKv kv = {
      .key = HEARTBEAT_KEY_STBINFO,
      .valueLen = sizeof(SSTableVersion) * stbNum,
      .value = stbs,
  };

  tscDebug("hb got %d expired stb, valueLen:%d", stbNum, kv.valueLen);

  if (NULL == req->info) {
    req->info = taosHashInit(64, hbKeyHashFunc, 1, HASH_ENTRY_LOCK);
    if (NULL == req->info) {
      taosMemoryFree(stbs);
      return TSDB_CODE_TSC_OUT_OF_MEMORY;
    }
  }

  /* the kv struct is copied into the hash; the stbs array itself is shared by pointer */
  if (taosHashPut(req->info, &kv.key, sizeof(kv.key), &kv, sizeof(kv)) != 0) {
    taosMemoryFree(stbs);
    return TSDB_CODE_TSC_OUT_OF_MEMORY;
  }

  return TSDB_CODE_SUCCESS;
}

L
fix  
Liu Jicong 已提交
510 511
/*
 * Request-side heartbeat handler registered for CONN_TYPE__QUERY.
 *
 * connKey  connection the request belongs to
 * param    points at the int64_t cluster id used to look up the catalog
 * req      heartbeat request to fill in
 *
 * Fills in the query section, then the expired user, db and stb lists, in that
 * order. The result of hbGetQueryBasicInfo() is not checked; the first failure
 * among the three "expired" collectors stops the sequence and is returned.
 * Returns TSDB_CODE_SUCCESS when all of them succeed, or the
 * catalogGetHandle() error when the catalog cannot be obtained.
 */
int32_t hbQueryHbReqHandle(SClientHbKey *connKey, void *param, SClientHbReq *req) {
  int64_t         *pClusterId = (int64_t *)param;
  struct SCatalog *pCatalog = NULL;

  int32_t code = catalogGetHandle(*pClusterId, &pCatalog);
  if (TSDB_CODE_SUCCESS != code) {
    tscWarn("catalogGetHandle failed, clusterId:%" PRIx64 ", error:%s", *pClusterId, tstrerror(code));
    return code;
  }

  hbGetQueryBasicInfo(connKey, req);

  code = hbGetExpiredUserInfo(connKey, pCatalog, req);
  if (TSDB_CODE_SUCCESS == code) {
    code = hbGetExpiredDBInfo(connKey, pCatalog, req);
  }
  if (TSDB_CODE_SUCCESS == code) {
    code = hbGetExpiredStbInfo(connKey, pCatalog, req);
  }

  return code;
}

void hbMgrInitMqHbHandle() {
D
dapan1121 已提交
541 542
  clientHbMgr.reqHandle[CONN_TYPE__QUERY] = hbQueryHbReqHandle;
  clientHbMgr.reqHandle[CONN_TYPE__TMQ] = hbMqHbReqHandle;
L
Liu Jicong 已提交
543

D
dapan1121 已提交
544 545
  clientHbMgr.rspHandle[CONN_TYPE__QUERY] = hbQueryHbRspHandle;
  clientHbMgr.rspHandle[CONN_TYPE__TMQ] = hbMqHbRspHandle;
L
Liu Jicong 已提交
546 547
}

L
Liu Jicong 已提交
548 549
/* Install every heartbeat handler; currently this only delegates to hbMgrInitMqHbHandle(). */
static FORCE_INLINE void hbMgrInitHandle() {
  hbMgrInitMqHbHandle();
}

L
fix  
Liu Jicong 已提交
553
/*
 * Build one batch heartbeat request containing a copy of every registered
 * connection request of pAppHbMgr, each filled in by the handler for its
 * connection type.
 *
 * Returns a heap-allocated batch the caller must release with
 * tFreeClientHbBatchReq(), or NULL with terrno = TSDB_CODE_TSC_OUT_OF_MEMORY
 * when the batch or its array cannot be allocated.
 *
 * A handler failure only affects its own connection: the request stays in the
 * batch in whatever state the handler left it and the walk continues. A
 * request that cannot be appended to the batch is skipped.
 */
SClientHbBatchReq *hbGatherAllInfo(SAppHbMgr *pAppHbMgr) {
  SClientHbBatchReq *pBatchReq = taosMemoryCalloc(1, sizeof(SClientHbBatchReq));
  if (pBatchReq == NULL) {
    terrno = TSDB_CODE_TSC_OUT_OF_MEMORY;
    return NULL;
  }

  int32_t connKeyCnt = atomic_load_32(&pAppHbMgr->connKeyCnt);
  pBatchReq->reqs = taosArrayInit(connKeyCnt, sizeof(SClientHbReq));
  if (pBatchReq->reqs == NULL) {
    terrno = TSDB_CODE_TSC_OUT_OF_MEMORY;
    taosMemoryFree(pBatchReq);
    return NULL;
  }

  void *pIter = taosHashIterate(pAppHbMgr->activeInfo, NULL);
  while (pIter != NULL) {
    /* work on the copy stored in the batch, not on the registered entry */
    SClientHbReq *pOneReq = taosArrayPush(pBatchReq->reqs, pIter);
    if (pOneReq != NULL) {
      (void)(*clientHbMgr.reqHandle[pOneReq->connKey.connType])(&pOneReq->connKey, &pOneReq->clusterId, pOneReq);
    } else {
      tscWarn("hb failed to add one req to batch");
    }

    pIter = taosHashIterate(pAppHbMgr->activeInfo, pIter);
  }

  return pBatchReq;
}

wafwerar's avatar
wafwerar 已提交
588 589 590 591
/*
 * Mark the heartbeat thread as stopped by storing 2 into
 * clientHbMgr.threadStop, the value hbStopThread() waits for.
 * hbThreadFunc() registers this with atexit() on Windows when running inside
 * a DLL.
 */
void hbThreadFuncUnexpectedStopped(void) {
  atomic_store_8(&clientHbMgr.threadStop, 2);
}

L
fix  
Liu Jicong 已提交
592
static void *hbThreadFunc(void *param) {
L
Liu Jicong 已提交
593
  setThreadName("hb");
wafwerar's avatar
wafwerar 已提交
594
#ifdef WINDOWS
wafwerar's avatar
wafwerar 已提交
595 596 597
  if (taosCheckCurrentInDll()) {
    atexit(hbThreadFuncUnexpectedStopped);
  }
wafwerar's avatar
wafwerar 已提交
598
#endif
L
Liu Jicong 已提交
599
  while (1) {
600
    int8_t threadStop = atomic_val_compare_exchange_8(&clientHbMgr.threadStop, 1, 2);
L
fix  
Liu Jicong 已提交
601
    if (1 == threadStop) {
L
Liu Jicong 已提交
602 603 604
      break;
    }

wafwerar's avatar
wafwerar 已提交
605
    taosThreadMutexLock(&clientHbMgr.lock);
606

L
Liu Jicong 已提交
607
    int sz = taosArrayGetSize(clientHbMgr.appHbMgrs);
L
fix  
Liu Jicong 已提交
608 609
    for (int i = 0; i < sz; i++) {
      SAppHbMgr *pAppHbMgr = taosArrayGetP(clientHbMgr.appHbMgrs, i);
L
Liu Jicong 已提交
610

L
Liu Jicong 已提交
611 612 613 614
      int32_t connCnt = atomic_load_32(&pAppHbMgr->connKeyCnt);
      if (connCnt == 0) {
        continue;
      }
L
fix  
Liu Jicong 已提交
615
      SClientHbBatchReq *pReq = hbGatherAllInfo(pAppHbMgr);
L
Liu Jicong 已提交
616 617 618
      if (pReq == NULL) {
        continue;
      }
L
fix  
Liu Jicong 已提交
619
      int   tlen = tSerializeSClientHbBatchReq(NULL, 0, pReq);
wafwerar's avatar
wafwerar 已提交
620
      void *buf = taosMemoryMalloc(tlen);
L
Liu Jicong 已提交
621
      if (buf == NULL) {
D
dapan1121 已提交
622
        terrno = TSDB_CODE_TSC_OUT_OF_MEMORY;
D
dapan1121 已提交
623 624
        tFreeClientHbBatchReq(pReq);
        //hbClearReqInfo(pAppHbMgr);
L
Liu Jicong 已提交
625 626
        break;
      }
L
fix  
Liu Jicong 已提交
627

S
Shengliang Guan 已提交
628
      tSerializeSClientHbBatchReq(buf, tlen, pReq);
wafwerar's avatar
wafwerar 已提交
629
      SMsgSendInfo *pInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
630

L
Liu Jicong 已提交
631 632
      if (pInfo == NULL) {
        terrno = TSDB_CODE_TSC_OUT_OF_MEMORY;
D
dapan1121 已提交
633 634
        tFreeClientHbBatchReq(pReq);
        //hbClearReqInfo(pAppHbMgr);
wafwerar's avatar
wafwerar 已提交
635
        taosMemoryFree(buf);
L
Liu Jicong 已提交
636 637
        break;
      }
L
Liu Jicong 已提交
638
      pInfo->fp = hbAsyncCallBack;
L
Liu Jicong 已提交
639 640 641
      pInfo->msgInfo.pData = buf;
      pInfo->msgInfo.len = tlen;
      pInfo->msgType = TDMT_MND_HEARTBEAT;
D
dapan1121 已提交
642
      pInfo->param = strdup(pAppHbMgr->key);
L
Liu Jicong 已提交
643 644
      pInfo->requestId = generateRequestId();
      pInfo->requestObjRefId = 0;
L
Liu Jicong 已提交
645 646

      SAppInstInfo *pAppInstInfo = pAppHbMgr->pAppInstInfo;
L
fix  
Liu Jicong 已提交
647 648
      int64_t       transporterId = 0;
      SEpSet        epSet = getEpSet_s(&pAppInstInfo->mgmtEp);
L
Liu Jicong 已提交
649
      asyncSendMsgToServer(pAppInstInfo->pTransporter, &epSet, &transporterId, pInfo);
D
dapan1121 已提交
650 651
      tFreeClientHbBatchReq(pReq);
      //hbClearReqInfo(pAppHbMgr);
L
Liu Jicong 已提交
652 653 654

      atomic_add_fetch_32(&pAppHbMgr->reportCnt, 1);
    }
655

wafwerar's avatar
wafwerar 已提交
656
    taosThreadMutexUnlock(&clientHbMgr.lock);
L
fix  
Liu Jicong 已提交
657

L
Liu Jicong 已提交
658
    taosMsleep(HEARTBEAT_INTERVAL);
L
Liu Jicong 已提交
659 660 661 662 663
  }
  return NULL;
}

static int32_t hbCreateThread() {
wafwerar's avatar
wafwerar 已提交
664 665 666
  TdThreadAttr thAttr;
  taosThreadAttrInit(&thAttr);
  taosThreadAttrSetDetachState(&thAttr, PTHREAD_CREATE_JOINABLE);
L
Liu Jicong 已提交
667

D
dapan1121 已提交
668 669 670
  if (taosThreadCreate(&clientHbMgr.thread, &thAttr, hbThreadFunc, NULL) != 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
L
Liu Jicong 已提交
671
  }
D
dapan1121 已提交
672
  taosThreadAttrDestroy(&thAttr);
L
Liu Jicong 已提交
673 674 675
  return 0;
}

L
Liu Jicong 已提交
676
static void hbStopThread() {
D
dapan1121 已提交
677 678 679
  if (0 == atomic_load_8(&clientHbMgr.inited)) {
    return;
  }
680
  if (atomic_val_compare_exchange_8(&clientHbMgr.threadStop, 0, 1)) {
D
dapan1121 已提交
681
    tscDebug("hb thread already stopped");
682 683
    return;
  }
L
fix  
Liu Jicong 已提交
684

685
  while (2 != atomic_load_8(&clientHbMgr.threadStop)) {
wafwerar's avatar
wafwerar 已提交
686
    taosUsleep(10);
687
  }
D
dapan1121 已提交
688

L
fix  
Liu Jicong 已提交
689
  tscDebug("hb thread stopped");
L
Liu Jicong 已提交
690 691
}

L
fix  
Liu Jicong 已提交
692
/*
 * Create the heartbeat manager for one app instance and register it in
 * clientHbMgr.appHbMgrs.
 *
 * pAppInstInfo  app instance the manager reports for (stored, not copied)
 * key           instance key; a private copy is kept in the manager
 *
 * Returns the new manager, or NULL with terrno = TSDB_CODE_OUT_OF_MEMORY when
 * an allocation fails. Nothing is leaked on the failure paths: the key copy is
 * released together with the manager.
 */
SAppHbMgr *appHbMgrInit(SAppInstInfo *pAppInstInfo, char *key) {
  /* make sure the global manager (and its thread) exists; a no-op after the first call */
  hbMgrInit();
  SAppHbMgr *pAppHbMgr = taosMemoryMalloc(sizeof(SAppHbMgr));
  if (pAppHbMgr == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  // init stat
  pAppHbMgr->startTime = taosGetTimestampMs();
  pAppHbMgr->connKeyCnt = 0;
  pAppHbMgr->reportCnt = 0;
  pAppHbMgr->reportBytes = 0;
  pAppHbMgr->key = strdup(key);
  if (pAppHbMgr->key == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFree(pAppHbMgr);
    return NULL;
  }

  // init app info
  pAppHbMgr->pAppInstInfo = pAppInstInfo;

  // init hash info
  pAppHbMgr->activeInfo = taosHashInit(64, hbKeyHashFunc, 1, HASH_ENTRY_LOCK);

  if (pAppHbMgr->activeInfo == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    /* same release call appHbMgrCleanup() uses for the key */
    taosMemoryFree(pAppHbMgr->key);
    taosMemoryFree(pAppHbMgr);
    return NULL;
  }

  taosThreadMutexLock(&clientHbMgr.lock);
  taosArrayPush(clientHbMgr.appHbMgrs, &pAppHbMgr);
  taosThreadMutexUnlock(&clientHbMgr.lock);

  return pAppHbMgr;
}

D
dapan1121 已提交
727
void appHbMgrCleanup(void) {
L
Liu Jicong 已提交
728 729
  int sz = taosArrayGetSize(clientHbMgr.appHbMgrs);
  for (int i = 0; i < sz; i++) {
L
fix  
Liu Jicong 已提交
730
    SAppHbMgr *pTarget = taosArrayGetP(clientHbMgr.appHbMgrs, i);
L
Liu Jicong 已提交
731 732

    void *pIter = taosHashIterate(pTarget->activeInfo, NULL);
D
dapan1121 已提交
733 734
    while (pIter != NULL) {
      SClientHbReq *pOneReq = pIter;
D
dapan1121 已提交
735
      tFreeClientHbReq(pOneReq);
D
dapan1121 已提交
736
      pIter = taosHashIterate(pTarget->activeInfo, pIter);
L
Liu Jicong 已提交
737
    }
D
dapan1121 已提交
738 739
    taosHashCleanup(pTarget->activeInfo);
    pTarget->activeInfo = NULL;
D
dapan1121 已提交
740 741 742

    taosMemoryFree(pTarget->key);
    taosMemoryFree(pTarget);
L
Liu Jicong 已提交
743 744 745 746
  }
}

int hbMgrInit() {
L
Liu Jicong 已提交
747 748 749 750
  // init once
  int8_t old = atomic_val_compare_exchange_8(&clientHbMgr.inited, 0, 1);
  if (old == 1) return 0;

L
fix  
Liu Jicong 已提交
751
  clientHbMgr.appHbMgrs = taosArrayInit(0, sizeof(void *));
wafwerar's avatar
wafwerar 已提交
752
  taosThreadMutexInit(&clientHbMgr.lock, NULL);
L
Liu Jicong 已提交
753 754 755 756 757

  // init handle funcs
  hbMgrInitHandle();

  // init backgroud thread
D
dapan1121 已提交
758
  hbCreateThread();
L
Liu Jicong 已提交
759

L
Liu Jicong 已提交
760 761 762 763
  return 0;
}

void hbMgrCleanUp() {
D
dapan1121 已提交
764
  hbStopThread();
L
fix  
Liu Jicong 已提交
765

L
Liu Jicong 已提交
766
  // destroy all appHbMgr
L
Liu Jicong 已提交
767 768 769
  int8_t old = atomic_val_compare_exchange_8(&clientHbMgr.inited, 1, 0);
  if (old == 0) return;

wafwerar's avatar
wafwerar 已提交
770
  taosThreadMutexLock(&clientHbMgr.lock);
D
dapan1121 已提交
771
  appHbMgrCleanup();
L
fix  
Liu Jicong 已提交
772
  taosArrayDestroy(clientHbMgr.appHbMgrs);
wafwerar's avatar
wafwerar 已提交
773
  taosThreadMutexUnlock(&clientHbMgr.lock);
L
fix  
Liu Jicong 已提交
774

775
  clientHbMgr.appHbMgrs = NULL;
L
Liu Jicong 已提交
776 777
}

D
dapan1121 已提交
778
/*
 * Register a connection in pAppHbMgr->activeInfo so that it is included in
 * subsequent heartbeats.
 *
 * pAppHbMgr  manager that owns the activeInfo hash
 * connKey    key of the connection (copied into the stored request)
 * clusterId  cluster id stored with the request
 *
 * Returns 0 when the connection is registered or was already present, and
 * TSDB_CODE_TSC_OUT_OF_MEMORY when the entry cannot be stored. connKeyCnt is
 * only incremented after a successful insert, so the counter cannot run ahead
 * of the hash content.
 */
int hbRegisterConnImpl(SAppHbMgr *pAppHbMgr, SClientHbKey connKey, int64_t clusterId) {
  // init hash in activeinfo
  void *data = taosHashGet(pAppHbMgr->activeInfo, &connKey, sizeof(SClientHbKey));
  if (data != NULL) {
    return 0;
  }
  SClientHbReq hbReq = {0};
  hbReq.connKey = connKey;
  hbReq.clusterId = clusterId;

  if (taosHashPut(pAppHbMgr->activeInfo, &connKey, sizeof(SClientHbKey), &hbReq, sizeof(SClientHbReq)) != 0) {
    tscError("hb failed to register conn, refId:%" PRIx64, connKey.tscRid);
    return TSDB_CODE_TSC_OUT_OF_MEMORY;
  }

  atomic_add_fetch_32(&pAppHbMgr->connKeyCnt, 1);
  return 0;
}

D
dapan1121 已提交
795
/*
 * Register a connection for heartbeats.
 *
 * Only CONN_TYPE__QUERY connections are actually registered (through
 * hbRegisterConnImpl()); every other connection type, CONN_TYPE__TMQ
 * included, is accepted and ignored with a return value of 0.
 */
int hbRegisterConn(SAppHbMgr *pAppHbMgr, int64_t tscRefId, int64_t clusterId, int8_t connType) {
  SClientHbKey connKey = {
      .tscRid = tscRefId,
      .connType = connType,
  };

  if (CONN_TYPE__QUERY == connType) {
    return hbRegisterConnImpl(pAppHbMgr, connKey, clusterId);
  }

  return 0;
}

L
fix  
Liu Jicong 已提交
813
/*
 * Remove a connection from pAppHbMgr->activeInfo.
 *
 * When the connection is registered, its request is released with
 * tFreeClientHbReq(), the hash entry is removed and connKeyCnt is decremented.
 * An unknown connection is ignored.
 */
void hbDeregisterConn(SAppHbMgr *pAppHbMgr, SClientHbKey connKey) {
  SClientHbReq *pEntry = taosHashGet(pAppHbMgr->activeInfo, &connKey, sizeof(SClientHbKey));
  if (NULL == pEntry) {
    return;
  }

  tFreeClientHbReq(pEntry);
  taosHashRemove(pAppHbMgr->activeInfo, &connKey, sizeof(SClientHbKey));

  atomic_sub_fetch_32(&pAppHbMgr->connKeyCnt, 1);
}