tq.c 50.4 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
S
Shengliang Guan 已提交
14 15
 */

H
Hongze Cheng 已提交
16
#include "tq.h"
S
Shengliang Guan 已提交
17

dengyihao's avatar
dengyihao 已提交
18 19 20
// 0: not init
// 1: already inited
// 2: wait to be inited or cleaup
21
#define WAL_READ_TASKS_ID (-1)
22

23
static int32_t tqInitialize(STQ* pTq);
dengyihao's avatar
dengyihao 已提交
24

wmmhello's avatar
wmmhello 已提交
25
static FORCE_INLINE bool tqIsHandleExec(STqHandle* pHandle) { return TMQ_HANDLE_STATUS_EXEC == pHandle->status; }
dengyihao's avatar
dengyihao 已提交
26 27
static FORCE_INLINE void tqSetHandleExec(STqHandle* pHandle) { pHandle->status = TMQ_HANDLE_STATUS_EXEC; }
static FORCE_INLINE void tqSetHandleIdle(STqHandle* pHandle) { pHandle->status = TMQ_HANDLE_STATUS_IDLE; }
wmmhello's avatar
wmmhello 已提交
28

L
Liu Jicong 已提交
29
int32_t tqInit() {
L
Liu Jicong 已提交
30 31 32 33 34 35
  int8_t old;
  while (1) {
    old = atomic_val_compare_exchange_8(&tqMgmt.inited, 0, 2);
    if (old != 2) break;
  }

36 37 38 39 40 41
  if (old == 0) {
    tqMgmt.timer = taosTmrInit(10000, 100, 10000, "TQ");
    if (tqMgmt.timer == NULL) {
      atomic_store_8(&tqMgmt.inited, 0);
      return -1;
    }
42 43 44
    if (streamInit() < 0) {
      return -1;
    }
L
Liu Jicong 已提交
45
    atomic_store_8(&tqMgmt.inited, 1);
46
  }
47

L
Liu Jicong 已提交
48 49
  return 0;
}
L
Liu Jicong 已提交
50

51
void tqCleanUp() {
L
Liu Jicong 已提交
52 53 54 55 56 57 58 59
  int8_t old;
  while (1) {
    old = atomic_val_compare_exchange_8(&tqMgmt.inited, 1, 2);
    if (old != 2) break;
  }

  if (old == 1) {
    taosTmrCleanUp(tqMgmt.timer);
L
Liu Jicong 已提交
60
    streamCleanUp();
L
Liu Jicong 已提交
61 62
    atomic_store_8(&tqMgmt.inited, 0);
  }
63
}
L
Liu Jicong 已提交
64

65
static void destroyTqHandle(void* data) {
66 67
  STqHandle* pData = (STqHandle*)data;
  qDestroyTask(pData->execHandle.task);
wmmhello's avatar
wmmhello 已提交
68

69
  if (pData->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
L
Liu Jicong 已提交
70
    taosMemoryFreeClear(pData->execHandle.execCol.qmsg);
71
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__DB) {
72
    tqReaderClose(pData->execHandle.pTqReader);
73 74
    walCloseReader(pData->pWalReader);
    taosHashCleanup(pData->execHandle.execDb.pFilterOutTbUid);
L
Liu Jicong 已提交
75
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__TABLE) {
76
    walCloseReader(pData->pWalReader);
77
    tqReaderClose(pData->execHandle.pTqReader);
78 79
    taosMemoryFreeClear(pData->execHandle.execTb.qmsg);
    nodesDestroyNode(pData->execHandle.execTb.node);
80
  }
dengyihao's avatar
dengyihao 已提交
81
  if (pData->msg != NULL) {
82 83 84
    rpcFreeCont(pData->msg->pCont);
    taosMemoryFree(pData->msg);
    pData->msg = NULL;
D
dapan1121 已提交
85
  }
L
Liu Jicong 已提交
86 87
}

88 89 90 91 92
static bool tqOffsetLessOrEqual(const STqOffset* pLeft, const STqOffset* pRight) {
  return pLeft->val.type == TMQ_OFFSET__LOG && pRight->val.type == TMQ_OFFSET__LOG &&
         pLeft->val.version <= pRight->val.version;
}

L
Liu Jicong 已提交
93
STQ* tqOpen(const char* path, SVnode* pVnode) {
94
  STQ* pTq = taosMemoryCalloc(1, sizeof(STQ));
L
Liu Jicong 已提交
95
  if (pTq == NULL) {
S
Shengliang Guan 已提交
96
    terrno = TSDB_CODE_OUT_OF_MEMORY;
L
Liu Jicong 已提交
97 98
    return NULL;
  }
99

100
  pTq->path = taosStrdup(path);
L
Liu Jicong 已提交
101
  pTq->pVnode = pVnode;
L
Liu Jicong 已提交
102
  pTq->walLogLastVer = pVnode->pWal->vers.lastVer;
103

104
  pTq->pHandle = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);
105
  taosHashSetFreeFp(pTq->pHandle, destroyTqHandle);
106

107
  taosInitRWLatch(&pTq->lock);
108
  pTq->pPushMgr = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
L
Liu Jicong 已提交
109

110
  pTq->pCheckInfo = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);
L
Liu Jicong 已提交
111
  taosHashSetFreeFp(pTq->pCheckInfo, (FDelete)tDeleteSTqCheckInfo);
L
Liu Jicong 已提交
112

113 114 115 116 117 118 119
  int32_t code = tqInitialize(pTq);
  if (code != TSDB_CODE_SUCCESS) {
    tqClose(pTq);
    return NULL;
  } else {
    return pTq;
  }
120 121 122
}

int32_t tqInitialize(STQ* pTq) {
L
Liu Jicong 已提交
123
  if (tqMetaOpen(pTq) < 0) {
124
    return -1;
125 126
  }

L
Liu Jicong 已提交
127 128
  pTq->pOffsetStore = tqOffsetOpen(pTq);
  if (pTq->pOffsetStore == NULL) {
129
    return -1;
130 131
  }

132
  pTq->pStreamMeta = streamMetaOpen(pTq->path, pTq, (FTaskExpand*)tqExpandTask, pTq->pVnode->config.vgId);
L
Liu Jicong 已提交
133
  if (pTq->pStreamMeta == NULL) {
134
    return -1;
L
Liu Jicong 已提交
135 136
  }

137 138
  // the version is kept in task's meta data
  // todo check if this version is required or not
139 140
  if (streamLoadTasks(pTq->pStreamMeta, walGetCommittedVer(pTq->pVnode->pWal)) < 0) {
    return -1;
L
Liu Jicong 已提交
141 142
  }

143
  return 0;
L
Liu Jicong 已提交
144
}
L
Liu Jicong 已提交
145

L
Liu Jicong 已提交
146
void tqClose(STQ* pTq) {
147 148
  if (pTq == NULL) {
    return;
H
Hongze Cheng 已提交
149
  }
150 151 152 153 154 155 156 157 158

  tqOffsetClose(pTq->pOffsetStore);
  taosHashCleanup(pTq->pHandle);
  taosHashCleanup(pTq->pPushMgr);
  taosHashCleanup(pTq->pCheckInfo);
  taosMemoryFree(pTq->path);
  tqMetaClose(pTq);
  streamMetaClose(pTq->pStreamMeta);
  taosMemoryFree(pTq);
L
Liu Jicong 已提交
159
}
L
Liu Jicong 已提交
160

H
Haojun Liao 已提交
161 162 163 164 165 166 167 168 169 170 171 172 173
void tqNotifyClose(STQ* pTq) {
  if (pTq != NULL) {
    taosWLockLatch(&pTq->pStreamMeta->lock);

    void* pIter = NULL;
    while (1) {
      pIter = taosHashIterate(pTq->pStreamMeta->pTasks, pIter);
      if (pIter == NULL) {
        break;
      }

      SStreamTask* pTask = *(SStreamTask**)pIter;
      tqDebug("vgId:%d s-task:%s set dropping flag", pTq->pStreamMeta->vgId, pTask->id.idStr);
174 175 176
      pTask->status.taskStatus = TASK_STATUS__STOP;

      int64_t st = taosGetTimestampMs();
H
Haojun Liao 已提交
177
      qKillTask(pTask->exec.pExecutor, TSDB_CODE_SUCCESS);
178
      int64_t el = taosGetTimestampMs() - st;
H
Haojun Liao 已提交
179
      tqDebug("vgId:%d s-task:%s is closed in %" PRId64 " ms", pTq->pStreamMeta->vgId, pTask->id.idStr, el);
H
Haojun Liao 已提交
180 181 182 183 184 185
    }

    taosWUnLockLatch(&pTq->pStreamMeta->lock);
  }
}

D
dapan1121 已提交
186 187
static int32_t doSendDataRsp(const SRpcHandleInfo* pRpcHandleInfo, const SMqDataRsp* pRsp, int32_t epoch,
                             int64_t consumerId, int32_t type) {
L
Liu Jicong 已提交
188 189
  int32_t len = 0;
  int32_t code = 0;
D
dapan1121 已提交
190 191

  if (type == TMQ_MSG_TYPE__POLL_RSP) {
H
Haojun Liao 已提交
192
    tEncodeSize(tEncodeMqDataRsp, pRsp, len, code);
D
dapan1121 已提交
193 194 195
  } else if (type == TMQ_MSG_TYPE__TAOSX_RSP) {
    tEncodeSize(tEncodeSTaosxRsp, (STaosxRsp*)pRsp, len, code);
  }
L
Liu Jicong 已提交
196 197 198 199 200 201 202 203 204 205 206

  if (code < 0) {
    return -1;
  }

  int32_t tlen = sizeof(SMqRspHead) + len;
  void*   buf = rpcMallocCont(tlen);
  if (buf == NULL) {
    return -1;
  }

D
dapan1121 已提交
207 208 209
  ((SMqRspHead*)buf)->mqMsgType = type;
  ((SMqRspHead*)buf)->epoch = epoch;
  ((SMqRspHead*)buf)->consumerId = consumerId;
L
Liu Jicong 已提交
210 211 212 213 214 215

  void* abuf = POINTER_SHIFT(buf, sizeof(SMqRspHead));

  SEncoder encoder = {0};
  tEncoderInit(&encoder, abuf, len);

D
dapan1121 已提交
216
  if (type == TMQ_MSG_TYPE__POLL_RSP) {
H
Haojun Liao 已提交
217
    tEncodeMqDataRsp(&encoder, pRsp);
D
dapan1121 已提交
218
  } else if (type == TMQ_MSG_TYPE__TAOSX_RSP) {
X
Xiaoyu Wang 已提交
219
    tEncodeSTaosxRsp(&encoder, (STaosxRsp*)pRsp);
dengyihao's avatar
dengyihao 已提交
220
  }
L
Liu Jicong 已提交
221

wmmhello's avatar
wmmhello 已提交
222
  tEncoderClear(&encoder);
L
Liu Jicong 已提交
223 224

  SRpcMsg rsp = {
D
dapan1121 已提交
225
      .info = *pRpcHandleInfo,
L
Liu Jicong 已提交
226 227 228 229
      .pCont = buf,
      .contLen = tlen,
      .code = 0,
  };
L
Liu Jicong 已提交
230

L
Liu Jicong 已提交
231
  tmsgSendRsp(&rsp);
L
Liu Jicong 已提交
232 233
  return 0;
}
L
Liu Jicong 已提交
234

H
Haojun Liao 已提交
235
int32_t tqPushDataRsp(STqHandle* pHandle, int32_t vgId) {
236 237 238 239
  SMqDataRsp dataRsp = {0};
  dataRsp.head.consumerId = pHandle->consumerId;
  dataRsp.head.epoch = pHandle->epoch;
  dataRsp.head.mqMsgType = TMQ_MSG_TYPE__POLL_RSP;
240 241

  int64_t sver = 0, ever = 0;
H
Haojun Liao 已提交
242
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);
dengyihao's avatar
dengyihao 已提交
243 244
  tqDoSendDataRsp(&pHandle->msg->info, &dataRsp, pHandle->epoch, pHandle->consumerId, TMQ_MSG_TYPE__POLL_RSP, sver,
                  ever);
D
dapan1121 已提交
245

246 247
  char buf1[TSDB_OFFSET_LEN] = {0};
  char buf2[TSDB_OFFSET_LEN] = {0};
248 249
  tFormatOffset(buf1, tListLen(buf1), &dataRsp.reqOffset);
  tFormatOffset(buf2, tListLen(buf2), &dataRsp.rspOffset);
dengyihao's avatar
dengyihao 已提交
250 251
  tqDebug("vgId:%d, from consumer:0x%" PRIx64 " (epoch %d) push rsp, block num: %d, req:%s, rsp:%s", vgId,
          dataRsp.head.consumerId, dataRsp.head.epoch, dataRsp.blockNum, buf1, buf2);
L
Liu Jicong 已提交
252 253 254
  return 0;
}

255 256 257 258 259 260
int32_t tqSendDataRsp(STqHandle* pHandle, const SRpcMsg* pMsg, const SMqPollReq* pReq, const SMqDataRsp* pRsp,
                      int32_t type, int32_t vgId) {
  int64_t sver = 0, ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);

  tqDoSendDataRsp(&pMsg->info, pRsp, pReq->epoch, pReq->consumerId, type, sver, ever);
261

262 263 264 265
  char buf1[TSDB_OFFSET_LEN] = {0};
  char buf2[TSDB_OFFSET_LEN] = {0};
  tFormatOffset(buf1, TSDB_OFFSET_LEN, &pRsp->reqOffset);
  tFormatOffset(buf2, TSDB_OFFSET_LEN, &pRsp->rspOffset);
266

dengyihao's avatar
dengyihao 已提交
267 268
  tqDebug("vgId:%d consumer:0x%" PRIx64 " (epoch %d) send rsp, block num:%d, req:%s, rsp:%s, reqId:0x%" PRIx64, vgId,
          pReq->consumerId, pReq->epoch, pRsp->blockNum, buf1, buf2, pReq->reqId);
269 270 271 272

  return 0;
}

273
int32_t tqProcessOffsetCommitReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
274 275
  SMqVgOffset vgOffset = {0};
  int32_t     vgId = TD_VID(pTq->pVnode);
276

X
Xiaoyu Wang 已提交
277 278
  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
279
  if (tDecodeMqVgOffset(&decoder, &vgOffset) < 0) {
280 281
    return -1;
  }
282

283 284
  tDecoderClear(&decoder);

285 286 287
  STqOffset* pOffset = &vgOffset.offset;

  if (pOffset->val.type == TMQ_OFFSET__SNAPSHOT_DATA || pOffset->val.type == TMQ_OFFSET__SNAPSHOT_META) {
L
Liu Jicong 已提交
288
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:snapshot) uid:%" PRId64 ", ts:%" PRId64,
289 290 291 292 293 294
            pOffset->subKey, vgId, pOffset->val.uid, pOffset->val.ts);
  } else if (pOffset->val.type == TMQ_OFFSET__LOG) {
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:log) version:%" PRId64, pOffset->subKey, vgId,
            pOffset->val.version);
    if (pOffset->val.version + 1 == sversion) {
      pOffset->val.version += 1;
295
    }
296
  } else {
297
    tqError("invalid commit offset type:%d", pOffset->val.type);
298
    return -1;
299
  }
300

301 302
  STqOffset* pSavedOffset = tqOffsetRead(pTq->pOffsetStore, pOffset->subKey);
  if (pSavedOffset != NULL && tqOffsetLessOrEqual(pOffset, pSavedOffset)) {
303
    tqDebug("not update the offset, vgId:%d sub:%s since committed:%" PRId64 " less than/equal to existed:%" PRId64,
304
            vgId, pOffset->subKey, pOffset->val.version, pSavedOffset->val.version);
305
    return 0;  // no need to update the offset value
306 307
  }

308
  // save the new offset value
309
  if (tqOffsetWrite(pTq->pOffsetStore, pOffset) < 0) {
310
    return -1;
311
  }
312

313 314 315
  return 0;
}

316
int32_t tqProcessSeekReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
317 318
  SMqVgOffset vgOffset = {0};
  int32_t     vgId = TD_VID(pTq->pVnode);
319 320 321

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
322
  if (tDecodeMqVgOffset(&decoder, &vgOffset) < 0) {
H
Haojun Liao 已提交
323
    tqError("vgId:%d failed to decode seek msg", vgId);
324 325 326 327 328
    return -1;
  }

  tDecoderClear(&decoder);

H
Haojun Liao 已提交
329 330 331
  tqDebug("topic:%s, vgId:%d process offset seek by consumer:0x%" PRIx64 ", req offset:%" PRId64,
          vgOffset.offset.subKey, vgId, vgOffset.consumerId, vgOffset.offset.val.version);

332 333 334
  STqOffset* pOffset = &vgOffset.offset;
  if (pOffset->val.type != TMQ_OFFSET__LOG) {
    tqError("vgId:%d, subKey:%s invalid seek offset type:%d", vgId, pOffset->subKey, pOffset->val.type);
335 336 337
    return -1;
  }

338 339
  STqHandle* pHandle = taosHashGet(pTq->pHandle, pOffset->subKey, strlen(pOffset->subKey));
  if (pHandle == NULL) {
dengyihao's avatar
dengyihao 已提交
340
    tqError("tmq seek: consumer:0x%" PRIx64 " vgId:%d subkey %s not found", vgOffset.consumerId, vgId, pOffset->subKey);
341 342
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
343 344
  }

345 346 347 348 349 350 351 352
  // 2. check consumer-vg assignment status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != vgOffset.consumerId) {
    tqDebug("ERROR tmq seek: consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            vgOffset.consumerId, vgId, pOffset->subKey, pHandle->consumerId);
    terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    taosRUnLockLatch(&pTq->lock);
    return -1;
353
  }
354 355
  taosRUnLockLatch(&pTq->lock);

dengyihao's avatar
dengyihao 已提交
356
  // 3. check the offset info
357 358 359 360 361 362
  STqOffset* pSavedOffset = tqOffsetRead(pTq->pOffsetStore, pOffset->subKey);
  if (pSavedOffset != NULL) {
    if (pSavedOffset->val.type != TMQ_OFFSET__LOG) {
      tqError("invalid saved offset type, vgId:%d sub:%s", vgId, pOffset->subKey);
      return 0;  // no need to update the offset value
    }
363

364 365 366 367 368 369
    if (pSavedOffset->val.version == pOffset->val.version) {
      tqDebug("vgId:%d subKey:%s no need to seek to %" PRId64 " prev offset:%" PRId64, vgId, pOffset->subKey,
              pOffset->val.version, pSavedOffset->val.version);
      return 0;
    }
  }
370 371 372

  int64_t sver = 0, ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);
373 374 375 376
  if (pOffset->val.version < sver) {
    pOffset->val.version = sver;
  } else if (pOffset->val.version > ever) {
    pOffset->val.version = ever;
377 378 379
  }

  // save the new offset value
380 381 382 383
  if (pSavedOffset != NULL) {
    tqDebug("vgId:%d sub:%s seek to:%" PRId64 " prev offset:%" PRId64, vgId, pOffset->subKey, pOffset->val.version,
            pSavedOffset->val.version);
  } else {
dengyihao's avatar
dengyihao 已提交
384
    tqDebug("vgId:%d sub:%s seek to:%" PRId64 " not saved yet", vgId, pOffset->subKey, pOffset->val.version);
385
  }
386

387 388
  if (tqOffsetWrite(pTq->pOffsetStore, pOffset) < 0) {
    tqError("failed to save offset, vgId:%d sub:%s seek to %" PRId64, vgId, pOffset->subKey, pOffset->val.version);
389 390 391
    return -1;
  }

H
Haojun Liao 已提交
392 393 394
  tqDebug("topic:%s, vgId:%d consumer:0x%" PRIx64 " offset is update to:%" PRId64, vgOffset.offset.subKey, vgId,
          vgOffset.consumerId, vgOffset.offset.val.version);

395 396 397
  return 0;
}

L
Liu Jicong 已提交
398
int32_t tqCheckColModifiable(STQ* pTq, int64_t tbUid, int32_t colId) {
L
Liu Jicong 已提交
399
  void* pIter = NULL;
400

L
Liu Jicong 已提交
401
  while (1) {
402
    pIter = taosHashIterate(pTq->pCheckInfo, pIter);
403 404 405 406
    if (pIter == NULL) {
      break;
    }

407
    STqCheckInfo* pCheck = (STqCheckInfo*)pIter;
408

L
Liu Jicong 已提交
409 410
    if (pCheck->ntbUid == tbUid) {
      int32_t sz = taosArrayGetSize(pCheck->colIdList);
L
Liu Jicong 已提交
411
      for (int32_t i = 0; i < sz; i++) {
L
Liu Jicong 已提交
412 413
        int16_t forbidColId = *(int16_t*)taosArrayGet(pCheck->colIdList, i);
        if (forbidColId == colId) {
414
          taosHashCancelIterate(pTq->pCheckInfo, pIter);
L
Liu Jicong 已提交
415 416 417 418 419
          return -1;
        }
      }
    }
  }
420

L
Liu Jicong 已提交
421 422 423
  return 0;
}

D
dapan1121 已提交
424
int32_t tqProcessPollReq(STQ* pTq, SRpcMsg* pMsg) {
X
Xiaoyu Wang 已提交
425
  SMqPollReq req = {0};
dengyihao's avatar
dengyihao 已提交
426
  int        code = 0;
D
dapan1121 已提交
427 428 429 430 431 432 433 434 435 436
  if (tDeserializeSMqPollReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pMsg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int64_t      consumerId = req.consumerId;
  int32_t      reqEpoch = req.epoch;
  STqOffsetVal reqOffset = req.reqOffset;
  int32_t      vgId = TD_VID(pTq->pVnode);
wmmhello's avatar
wmmhello 已提交
437
  STqHandle*   pHandle = NULL;
D
dapan1121 已提交
438

wmmhello's avatar
wmmhello 已提交
439 440 441 442 443 444 445 446 447 448
  while (1) {
    taosWLockLatch(&pTq->lock);
    // 1. find handle
    pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
    if (pHandle == NULL) {
      tqError("tmq poll: consumer:0x%" PRIx64 " vgId:%d subkey %s not found", consumerId, vgId, req.subKey);
      terrno = TSDB_CODE_INVALID_MSG;
      taosWUnLockLatch(&pTq->lock);
      return -1;
    }
D
dapan1121 已提交
449

450 451
    // 2. check re-balance status
    if (pHandle->consumerId != consumerId) {
dengyihao's avatar
dengyihao 已提交
452 453
      tqError("ERROR tmq poll: consumer:0x%" PRIx64
              " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
454
              consumerId, TD_VID(pTq->pVnode), req.subKey, pHandle->consumerId);
455
      terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
456 457 458
      taosWUnLockLatch(&pTq->lock);
      return -1;
    }
wmmhello's avatar
wmmhello 已提交
459

wmmhello's avatar
wmmhello 已提交
460
    bool exec = tqIsHandleExec(pHandle);
dengyihao's avatar
dengyihao 已提交
461
    if (!exec) {
wmmhello's avatar
wmmhello 已提交
462
      tqSetHandleExec(pHandle);
dengyihao's avatar
dengyihao 已提交
463 464 465
      //      qSetTaskCode(pHandle->execHandle.task, TDB_CODE_SUCCESS);
      tqDebug("tmq poll: consumer:0x%" PRIx64 "vgId:%d, topic:%s, set handle exec, pHandle:%p", consumerId, vgId,
              req.subKey, pHandle);
wmmhello's avatar
wmmhello 已提交
466 467 468
      taosWUnLockLatch(&pTq->lock);
      break;
    }
469
    taosWUnLockLatch(&pTq->lock);
470

dengyihao's avatar
dengyihao 已提交
471 472 473
    tqDebug("tmq poll: consumer:0x%" PRIx64
            "vgId:%d, topic:%s, subscription is executing, wait for 10ms and retry, pHandle:%p",
            consumerId, vgId, req.subKey, pHandle);
wmmhello's avatar
wmmhello 已提交
474
    taosMsleep(10);
D
dapan1121 已提交
475 476 477
  }

  // 3. update the epoch value
478
  if (pHandle->epoch < reqEpoch) {
dengyihao's avatar
dengyihao 已提交
479
    tqDebug("tmq poll: consumer:0x%" PRIx64 " epoch update from %d to %d by poll req", consumerId, pHandle->epoch,
X
Xiaoyu Wang 已提交
480
            reqEpoch);
D
dapan1121 已提交
481 482 483
    pHandle->epoch = reqEpoch;
  }

484 485
  char buf[TSDB_OFFSET_LEN];
  tFormatOffset(buf, TSDB_OFFSET_LEN, &reqOffset);
D
dapan1121 已提交
486 487 488
  tqDebug("tmq poll: consumer:0x%" PRIx64 " (epoch %d), subkey %s, recv poll req vgId:%d, req:%s, reqId:0x%" PRIx64,
          consumerId, req.epoch, pHandle->subKey, vgId, buf, req.reqId);

wmmhello's avatar
wmmhello 已提交
489
  code = tqExtractDataForMq(pTq, pHandle, &req, pMsg);
490
  tqSetHandleIdle(pHandle);
491

dengyihao's avatar
dengyihao 已提交
492 493
  tqDebug("tmq poll: consumer:0x%" PRIx64 "vgId:%d, topic:%s, , set handle idle, pHandle:%p", consumerId, vgId,
          req.subKey, pHandle);
494
  return code;
D
dapan1121 已提交
495 496
}

497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554
int32_t tqProcessVgWalInfoReq(STQ* pTq, SRpcMsg* pMsg) {
  SMqPollReq req = {0};
  if (tDeserializeSMqPollReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pMsg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int64_t      consumerId = req.consumerId;
  STqOffsetVal reqOffset = req.reqOffset;
  int32_t      vgId = TD_VID(pTq->pVnode);

  // 1. find handle
  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
  if (pHandle == NULL) {
    tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s not found", consumerId, vgId, req.subKey);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  // 2. check re-balance status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != consumerId) {
    tqDebug("ERROR consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            consumerId, vgId, req.subKey, pHandle->consumerId);
    terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    taosRUnLockLatch(&pTq->lock);
    return -1;
  }
  taosRUnLockLatch(&pTq->lock);

  int64_t sver = 0, ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);

  SMqDataRsp dataRsp = {0};
  tqInitDataRsp(&dataRsp, &req);

  STqOffset* pOffset = tqOffsetRead(pTq->pOffsetStore, req.subKey);
  if (pOffset != NULL) {
    if (pOffset->val.type != TMQ_OFFSET__LOG) {
      tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s use snapshot, no valid wal info", consumerId, vgId, req.subKey);
      terrno = TSDB_CODE_INVALID_PARA;
      tDeleteMqDataRsp(&dataRsp);
      return -1;
    }

    dataRsp.rspOffset.type = TMQ_OFFSET__LOG;
    dataRsp.rspOffset.version = pOffset->val.version;
  } else {
    if (req.useSnapshot == true) {
      tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s snapshot not support wal info", consumerId, vgId, req.subKey);
      terrno = TSDB_CODE_INVALID_PARA;
      tDeleteMqDataRsp(&dataRsp);
      return -1;
    }

    dataRsp.rspOffset.type = TMQ_OFFSET__LOG;

555
    if (reqOffset.type == TMQ_OFFSET__LOG) {
556
      int64_t currentVer = walReaderGetCurrentVer(pHandle->execHandle.pTqReader->pWalReader);
dengyihao's avatar
dengyihao 已提交
557
      if (currentVer == -1) {  // not start to read data from wal yet, return req offset directly
558 559 560 561
        dataRsp.rspOffset.version = reqOffset.version;
      } else {
        dataRsp.rspOffset.version = currentVer;  // return current consume offset value
      }
562 563
    } else if (reqOffset.type == TMQ_OFFSET__RESET_EARLIEAST) {
      dataRsp.rspOffset.version = sver;  // not consume yet, set the earliest position
564 565 566 567 568 569 570 571 572 573 574 575 576 577 578
    } else if (reqOffset.type == TMQ_OFFSET__RESET_LATEST) {
      dataRsp.rspOffset.version = ever;
    } else {
      tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s invalid offset type:%d", consumerId, vgId, req.subKey,
              reqOffset.type);
      terrno = TSDB_CODE_INVALID_PARA;
      tDeleteMqDataRsp(&dataRsp);
      return -1;
    }
  }

  tqDoSendDataRsp(&pMsg->info, &dataRsp, req.epoch, req.consumerId, TMQ_MSG_TYPE__WALINFO_RSP, sver, ever);
  return 0;
}

579
int32_t tqProcessDeleteSubReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
L
Liu Jicong 已提交
580
  SMqVDeleteReq* pReq = (SMqVDeleteReq*)msg;
dengyihao's avatar
dengyihao 已提交
581
  int32_t        vgId = TD_VID(pTq->pVnode);
L
Liu Jicong 已提交
582

583
  tqDebug("vgId:%d, tq process delete sub req %s", vgId, pReq->subKey);
wmmhello's avatar
wmmhello 已提交
584
  int32_t code = 0;
L
Liu Jicong 已提交
585

wmmhello's avatar
wmmhello 已提交
586
  taosWLockLatch(&pTq->lock);
L
Liu Jicong 已提交
587 588
  STqHandle* pHandle = taosHashGet(pTq->pHandle, pReq->subKey, strlen(pReq->subKey));
  if (pHandle) {
wmmhello's avatar
wmmhello 已提交
589
    while (tqIsHandleExec(pHandle)) {
dengyihao's avatar
dengyihao 已提交
590 591
      tqDebug("vgId:%d, topic:%s, subscription is executing, wait for 10ms and retry, pHandle:%p", vgId,
              pHandle->subKey, pHandle);
wmmhello's avatar
wmmhello 已提交
592
      taosMsleep(10);
593
    }
594

L
Liu Jicong 已提交
595 596 597
    if (pHandle->pRef) {
      walCloseRef(pTq->pVnode->pWal, pHandle->pRef->refId);
    }
598

L
Liu Jicong 已提交
599 600 601 602
    code = taosHashRemove(pTq->pHandle, pReq->subKey, strlen(pReq->subKey));
    if (code != 0) {
      tqError("cannot process tq delete req %s, since no such handle", pReq->subKey);
    }
L
Liu Jicong 已提交
603
  }
604

L
Liu Jicong 已提交
605 606
  code = tqOffsetDelete(pTq->pOffsetStore, pReq->subKey);
  if (code != 0) {
607
    tqError("cannot process tq delete req %s, since no such offset in cache", pReq->subKey);
L
Liu Jicong 已提交
608
  }
L
Liu Jicong 已提交
609

L
Liu Jicong 已提交
610
  if (tqMetaDeleteHandle(pTq, pReq->subKey) < 0) {
L
Liu Jicong 已提交
611
    tqError("cannot process tq delete req %s, since no such offset in tdb", pReq->subKey);
612
  }
wmmhello's avatar
wmmhello 已提交
613 614
  taosWUnLockLatch(&pTq->lock);

L
Liu Jicong 已提交
615
  return 0;
L
Liu Jicong 已提交
616 617
}

618
int32_t tqProcessAddCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
619 620
  STqCheckInfo info = {0};
  SDecoder     decoder;
X
Xiaoyu Wang 已提交
621
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
622
  if (tDecodeSTqCheckInfo(&decoder, &info) < 0) {
L
Liu Jicong 已提交
623 624 625 626
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  tDecoderClear(&decoder);
627 628 629 630 631
  if (taosHashPut(pTq->pCheckInfo, info.topic, strlen(info.topic), &info, sizeof(STqCheckInfo)) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  if (tqMetaSaveCheckInfo(pTq, info.topic, msg, msgLen) < 0) {
L
Liu Jicong 已提交
632 633 634 635 636 637
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  return 0;
}

638
int32_t tqProcessDelCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
639 640 641 642 643 644 645 646 647 648 649
  if (taosHashRemove(pTq->pCheckInfo, msg, strlen(msg)) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  if (tqMetaDeleteCheckInfo(pTq, msg) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  return 0;
}

650
int32_t tqProcessSubscribeReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
dengyihao's avatar
dengyihao 已提交
651
  int         ret = 0;
L
Liu Jicong 已提交
652
  SMqRebVgReq req = {0};
dengyihao's avatar
dengyihao 已提交
653
  SDecoder    dc = {0};
654 655 656 657 658 659 660 661 662

  tDecoderInit(&dc, msg, msgLen);

  // decode req
  if (tDecodeSMqRebVgReq(&dc, &req) < 0) {
    terrno = TSDB_CODE_INVALID_MSG;
    tDecoderClear(&dc);
    return -1;
  }
L
Liu Jicong 已提交
663

D
dapan1121 已提交
664 665 666
  SVnode* pVnode = pTq->pVnode;
  int32_t vgId = TD_VID(pVnode);

667
  tqDebug("vgId:%d, tq process sub req:%s, Id:0x%" PRIx64 " -> Id:0x%" PRIx64, pVnode->config.vgId, req.subKey,
D
dapan1121 已提交
668
          req.oldConsumerId, req.newConsumerId);
L
Liu Jicong 已提交
669

670
  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
L
Liu Jicong 已提交
671
  if (pHandle == NULL) {
L
Liu Jicong 已提交
672
    if (req.oldConsumerId != -1) {
673
      tqError("vgId:%d, build new consumer handle %s for consumer:0x%" PRIx64 ", but old consumerId:0x%" PRIx64,
674
              req.vgId, req.subKey, req.newConsumerId, req.oldConsumerId);
L
Liu Jicong 已提交
675
    }
D
dapan1121 已提交
676

L
Liu Jicong 已提交
677
    if (req.newConsumerId == -1) {
678
      tqError("vgId:%d, tq invalid re-balance request, new consumerId %" PRId64 "", req.vgId, req.newConsumerId);
679
      goto end;
L
Liu Jicong 已提交
680
    }
D
dapan1121 已提交
681

L
Liu Jicong 已提交
682 683
    STqHandle tqHandle = {0};
    pHandle = &tqHandle;
L
Liu Jicong 已提交
684

L
Liu Jicong 已提交
685 686 687
    memcpy(pHandle->subKey, req.subKey, TSDB_SUBSCRIBE_KEY_LEN);
    pHandle->consumerId = req.newConsumerId;
    pHandle->epoch = -1;
L
Liu Jicong 已提交
688

L
Liu Jicong 已提交
689
    pHandle->execHandle.subType = req.subType;
L
Liu Jicong 已提交
690
    pHandle->fetchMeta = req.withMeta;
wmmhello's avatar
wmmhello 已提交
691

692
    // TODO version should be assigned and refed during preprocess
D
dapan1121 已提交
693
    SWalRef* pRef = walRefCommittedVer(pVnode->pWal);
694
    if (pRef == NULL) {
695 696
      ret = -1;
      goto end;
697
    }
D
dapan1121 已提交
698

699 700
    int64_t ver = pRef->refVer;
    pHandle->pRef = pRef;
L
Liu Jicong 已提交
701

702
    SReadHandle handle = {.vnode = pVnode, .initTableReader = true, .initTqReader = true, .version = ver};
H
Haojun Liao 已提交
703 704
    initStorageAPI(&handle.api);

wmmhello's avatar
wmmhello 已提交
705
    pHandle->snapshotVer = ver;
706

L
Liu Jicong 已提交
707
    if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
dengyihao's avatar
dengyihao 已提交
708
      pHandle->execHandle.execCol.qmsg = taosStrdup(req.qmsg);
709

X
Xiaoyu Wang 已提交
710 711
      pHandle->execHandle.task = qCreateQueueExecTaskInfo(pHandle->execHandle.execCol.qmsg, &handle, vgId,
                                                          &pHandle->execHandle.numOfCols, req.newConsumerId);
L
Liu Jicong 已提交
712
      void* scanner = NULL;
713
      qExtractStreamScanner(pHandle->execHandle.task, &scanner);
714
      pHandle->execHandle.pTqReader = qExtractReaderFromStreamScanner(scanner);
L
Liu Jicong 已提交
715
    } else if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__DB) {
D
dapan1121 已提交
716
      pHandle->pWalReader = walOpenReader(pVnode->pWal, NULL);
717
      pHandle->execHandle.pTqReader = tqReaderOpen(pVnode);
D
dapan1121 已提交
718

L
Liu Jicong 已提交
719
      pHandle->execHandle.execDb.pFilterOutTbUid =
wmmhello's avatar
wmmhello 已提交
720
          taosHashInit(64, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_ENTRY_LOCK);
721
      buildSnapContext(handle.vnode, handle.version, 0, pHandle->execHandle.subType, pHandle->fetchMeta,
722
                       (SSnapContext**)(&handle.sContext));
723

724
      pHandle->execHandle.task = qCreateQueueExecTaskInfo(NULL, &handle, vgId, NULL, req.newConsumerId);
L
Liu Jicong 已提交
725
    } else if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__TABLE) {
D
dapan1121 已提交
726
      pHandle->pWalReader = walOpenReader(pVnode->pWal, NULL);
wmmhello's avatar
wmmhello 已提交
727
      pHandle->execHandle.execTb.suid = req.suid;
728
      pHandle->execHandle.execTb.qmsg = taosStrdup(req.qmsg);
wmmhello's avatar
wmmhello 已提交
729

dengyihao's avatar
dengyihao 已提交
730
      if (strcmp(pHandle->execHandle.execTb.qmsg, "") != 0) {
731 732 733 734 735
        if (nodesStringToNode(pHandle->execHandle.execTb.qmsg, &pHandle->execHandle.execTb.node) != 0) {
          tqError("nodesStringToNode error in sub stable, since %s, vgId:%d, subkey:%s consumer:0x%" PRIx64, terrstr(),
                  pVnode->config.vgId, req.subKey, pHandle->consumerId);
          return -1;
        }
L
Liu Jicong 已提交
736
      }
737

738
      buildSnapContext(handle.vnode, handle.version, req.suid, pHandle->execHandle.subType, pHandle->fetchMeta,
L
Liu Jicong 已提交
739
                       (SSnapContext**)(&handle.sContext));
740
      pHandle->execHandle.task = qCreateQueueExecTaskInfo(NULL, &handle, vgId, NULL, req.newConsumerId);
wmmhello's avatar
wmmhello 已提交
741

742
      SArray* tbUidList = NULL;
wmmhello's avatar
wmmhello 已提交
743
      ret = qGetTableList(req.suid, pVnode, pHandle->execHandle.execTb.node, &tbUidList, pHandle->execHandle.task);
dengyihao's avatar
dengyihao 已提交
744 745 746
      if (ret != TDB_CODE_SUCCESS) {
        tqError("qGetTableList error:%d vgId:%d, subkey:%s consumer:0x%" PRIx64, ret, pVnode->config.vgId, req.subKey,
                pHandle->consumerId);
747 748
        taosArrayDestroy(tbUidList);
        goto end;
L
Liu Jicong 已提交
749
      }
dengyihao's avatar
dengyihao 已提交
750 751
      tqDebug("tq try to get ctb for stb subscribe, vgId:%d, subkey:%s consumer:0x%" PRIx64 " suid:%" PRId64,
              pVnode->config.vgId, req.subKey, pHandle->consumerId, req.suid);
752
      pHandle->execHandle.pTqReader = tqReaderOpen(pVnode);
H
Haojun Liao 已提交
753
      tqReaderSetTbUidList(pHandle->execHandle.pTqReader, tbUidList, NULL);
L
Liu Jicong 已提交
754
      taosArrayDestroy(tbUidList);
L
Liu Jicong 已提交
755
    }
H
Haojun Liao 已提交
756

757
    taosHashPut(pTq->pHandle, req.subKey, strlen(req.subKey), pHandle, sizeof(STqHandle));
dengyihao's avatar
dengyihao 已提交
758
    tqDebug("try to persist handle %s consumer:0x%" PRIx64, req.subKey, pHandle->consumerId);
759 760
    ret = tqMetaSaveHandle(pTq, req.subKey, pHandle);
    goto end;
L
Liu Jicong 已提交
761
  } else {
762
    taosWLockLatch(&pTq->lock);
wmmhello's avatar
wmmhello 已提交
763

D
dapan1121 已提交
764
    if (pHandle->consumerId == req.newConsumerId) {  // do nothing
dengyihao's avatar
dengyihao 已提交
765 766
      tqInfo("vgId:%d consumer:0x%" PRIx64 " remains, no switch occurs, should not reach here", req.vgId,
             req.newConsumerId);
767 768 769
    } else {
      tqInfo("vgId:%d switch consumer from Id:0x%" PRIx64 " to Id:0x%" PRIx64, req.vgId, pHandle->consumerId,
             req.newConsumerId);
770 771
      atomic_store_64(&pHandle->consumerId, req.newConsumerId);
    }
dengyihao's avatar
dengyihao 已提交
772
    //    atomic_add_fetch_32(&pHandle->epoch, 1);
773

774
    // kill executing task
dengyihao's avatar
dengyihao 已提交
775 776 777 778 779 780 781 782 783 784
    //    if(tqIsHandleExec(pHandle)) {
    //      qTaskInfo_t pTaskInfo = pHandle->execHandle.task;
    //      if (pTaskInfo != NULL) {
    //        qKillTask(pTaskInfo, TSDB_CODE_SUCCESS);
    //      }

    //      if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
    //        qStreamCloseTsdbReader(pTaskInfo);
    //      }
    //    }
wmmhello's avatar
wmmhello 已提交
785 786
    // remove if it has been register in the push manager, and return one empty block to consumer
    tqUnregisterPushHandle(pTq, pHandle);
787
    taosWUnLockLatch(&pTq->lock);
788
    ret = tqMetaSaveHandle(pTq, req.subKey, pHandle);
L
Liu Jicong 已提交
789
  }
L
Liu Jicong 已提交
790

791
end:
792
  tDecoderClear(&dc);
793
  return ret;
L
Liu Jicong 已提交
794
}
795

dengyihao's avatar
dengyihao 已提交
796
void freePtr(void* ptr) { taosMemoryFree(*(void**)ptr); }
L
liuyao 已提交
797

798
int32_t tqExpandTask(STQ* pTq, SStreamTask* pTask, int64_t ver) {
D
dapan1121 已提交
799
  int32_t vgId = TD_VID(pTq->pVnode);
800

801
  pTask->id.idStr = createStreamTaskIdStr(pTask->id.streamId, pTask->id.taskId);
L
Liu Jicong 已提交
802
  pTask->refCnt = 1;
803
  pTask->status.schedStatus = TASK_SCHED_STATUS__INACTIVE;
dengyihao's avatar
dengyihao 已提交
804 805
  pTask->inputQueue = streamQueueOpen(512 << 10);
  pTask->outputQueue = streamQueueOpen(512 << 10);
L
Liu Jicong 已提交
806 807

  if (pTask->inputQueue == NULL || pTask->outputQueue == NULL) {
L
Liu Jicong 已提交
808
    return -1;
L
Liu Jicong 已提交
809 810
  }

L
Liu Jicong 已提交
811 812
  pTask->inputStatus = TASK_INPUT_STATUS__NORMAL;
  pTask->outputStatus = TASK_OUTPUT_STATUS__NORMAL;
813
  pTask->pMsgCb = &pTq->pVnode->msgCb;
814
  pTask->pMeta = pTq->pStreamMeta;
815
  pTask->chkInfo.version = ver;
816
  pTask->chkInfo.currentVer = ver;
817

818
  // expand executor
dengyihao's avatar
dengyihao 已提交
819
  pTask->status.taskStatus = (pTask->fillHistory) ? TASK_STATUS__WAIT_DOWNSTREAM : TASK_STATUS__NORMAL;
820

821
  if (pTask->taskLevel == TASK_LEVEL__SOURCE) {
822
    pTask->pState = streamStateOpen(pTq->pStreamMeta->path, pTask, false, -1, -1);
823 824 825 826
    if (pTask->pState == NULL) {
      return -1;
    }

827
    SReadHandle handle = {.vnode = pTq->pVnode, .initTqReader = 1, .pStateBackend = pTask->pState};
828
    initStorageAPI(&handle.api);
829

830 831
    pTask->exec.pExecutor = qCreateStreamExecTaskInfo(pTask->exec.qmsg, &handle, vgId);
    if (pTask->exec.pExecutor == NULL) {
L
Liu Jicong 已提交
832 833
      return -1;
    }
834

835
    qSetTaskId(pTask->exec.pExecutor, pTask->id.taskId, pTask->id.streamId);
836
  } else if (pTask->taskLevel == TASK_LEVEL__AGG) {
837
    pTask->pState = streamStateOpen(pTq->pStreamMeta->path, pTask, false, -1, -1);
838 839 840
    if (pTask->pState == NULL) {
      return -1;
    }
841

842
    int32_t     numOfVgroups = (int32_t)taosArrayGetSize(pTask->childEpInfo);
843 844
    SReadHandle handle = {.vnode = NULL, .numOfVgroups = numOfVgroups, .pStateBackend = pTask->pState};
    initStorageAPI(&handle.api);
845

846
    pTask->exec.pExecutor = qCreateStreamExecTaskInfo(pTask->exec.qmsg, &handle, vgId);
847
    if (pTask->exec.pExecutor == NULL) {
L
Liu Jicong 已提交
848 849
      return -1;
    }
850 851

    qSetTaskId(pTask->exec.pExecutor, pTask->id.taskId, pTask->id.streamId);
L
Liu Jicong 已提交
852
  }
L
Liu Jicong 已提交
853 854

  // sink
855
  if (pTask->outputType == TASK_OUTPUT__SMA) {
L
Liu Jicong 已提交
856
    pTask->smaSink.vnode = pTq->pVnode;
L
Liu Jicong 已提交
857
    pTask->smaSink.smaSink = smaHandleRes;
858
  } else if (pTask->outputType == TASK_OUTPUT__TABLE) {
L
Liu Jicong 已提交
859
    pTask->tbSink.vnode = pTq->pVnode;
H
Haojun Liao 已提交
860
    pTask->tbSink.tbSinkFunc = tqSinkToTablePipeline;
L
Liu Jicong 已提交
861

X
Xiaoyu Wang 已提交
862
    int32_t   ver1 = 1;
5
54liuyao 已提交
863
    SMetaInfo info = {0};
dengyihao's avatar
dengyihao 已提交
864
    int32_t   code = metaGetInfo(pTq->pVnode->pMeta, pTask->tbSink.stbUid, &info, NULL);
5
54liuyao 已提交
865
    if (code == TSDB_CODE_SUCCESS) {
D
dapan1121 已提交
866
      ver1 = info.skmVer;
5
54liuyao 已提交
867
    }
L
Liu Jicong 已提交
868

869 870
    SSchemaWrapper* pschemaWrapper = pTask->tbSink.pSchemaWrapper;
    pTask->tbSink.pTSchema = tBuildTSchema(pschemaWrapper->pSchema, pschemaWrapper->nCols, ver1);
871
    if (pTask->tbSink.pTSchema == NULL) {
D
dapan1121 已提交
872 873
      return -1;
    }
L
liuyao 已提交
874 875
    pTask->tbSink.pTblInfo = tSimpleHashInit(10240, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT));
    tSimpleHashSetFreeFp(pTask->tbSink.pTblInfo, freePtr);
L
Liu Jicong 已提交
876
  }
877

878
  if (pTask->taskLevel == TASK_LEVEL__SOURCE) {
879
    SWalFilterCond cond = {.deleteMsg = 1};  // delete msg also extract from wal files
880
    pTask->exec.pWalReader = walOpenReader(pTq->pVnode->pWal, &cond);
881 882
  }

883
  streamSetupTrigger(pTask);
884

dengyihao's avatar
dengyihao 已提交
885 886
  tqInfo("vgId:%d expand stream task, s-task:%s, checkpoint ver:%" PRId64 " child id:%d, level:%d", vgId,
         pTask->id.idStr, pTask->chkInfo.version, pTask->selfChildId, pTask->taskLevel);
887 888 889

  // next valid version will add one
  pTask->chkInfo.version += 1;
L
Liu Jicong 已提交
890
  return 0;
L
Liu Jicong 已提交
891
}
L
Liu Jicong 已提交
892

893
int32_t tqProcessStreamTaskCheckReq(STQ* pTq, SRpcMsg* pMsg) {
894 895 896 897
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

898 899
  SStreamTaskCheckReq req;
  SDecoder            decoder;
900

X
Xiaoyu Wang 已提交
901
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
902 903
  tDecodeSStreamTaskCheckReq(&decoder, &req);
  tDecoderClear(&decoder);
904

905 906 907 908 909 910 911 912 913 914
  int32_t             taskId = req.downstreamTaskId;
  SStreamTaskCheckRsp rsp = {
      .reqId = req.reqId,
      .streamId = req.streamId,
      .childId = req.childId,
      .downstreamNodeId = req.downstreamNodeId,
      .downstreamTaskId = req.downstreamTaskId,
      .upstreamNodeId = req.upstreamNodeId,
      .upstreamTaskId = req.upstreamTaskId,
  };
915

L
Liu Jicong 已提交
916
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
917

918
  if (pTask != NULL) {
919
    rsp.status = streamTaskCheckStatus(pTask);
920 921
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);

922
    tqDebug("s-task:%s recv task check req(reqId:0x%" PRIx64
923
            ") %d at node %d task status:%d, check req from task %d at node %d, rsp status %d",
924 925
            pTask->id.idStr, rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, pTask->status.taskStatus,
            rsp.upstreamTaskId, rsp.upstreamNodeId, rsp.status);
926 927
  } else {
    rsp.status = 0;
928 929
    tqDebug("tq recv task check(taskId:0x%x not built yet) req(reqId:0x%" PRIx64
            ") %d at node %d, check req from task:0x%x at node %d, rsp status %d",
930 931
            taskId, rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, rsp.upstreamTaskId, rsp.upstreamNodeId,
            rsp.status);
932 933 934 935 936
  }

  SEncoder encoder;
  int32_t  code;
  int32_t  len;
937

938 939
  tEncodeSize(tEncodeSStreamTaskCheckRsp, &rsp, len, code);
  if (code < 0) {
940
    tqError("vgId:%d failed to encode task check rsp, task:0x%x", pTq->pStreamMeta->vgId, taskId);
L
Liu Jicong 已提交
941
    return -1;
942
  }
L
Liu Jicong 已提交
943

944 945 946 947 948 949 950 951
  void* buf = rpcMallocCont(sizeof(SMsgHead) + len);
  ((SMsgHead*)buf)->vgId = htonl(req.upstreamNodeId);

  void* abuf = POINTER_SHIFT(buf, sizeof(SMsgHead));
  tEncoderInit(&encoder, (uint8_t*)abuf, len);
  tEncodeSStreamTaskCheckRsp(&encoder, &rsp);
  tEncoderClear(&encoder);

952
  SRpcMsg rspMsg = {.code = 0, .pCont = buf, .contLen = sizeof(SMsgHead) + len, .info = pMsg->info};
953

954 955 956 957
  tmsgSendRsp(&rspMsg);
  return 0;
}

958
int32_t tqProcessStreamTaskCheckRsp(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
959 960 961 962 963 964
  int32_t             code;
  SStreamTaskCheckRsp rsp;

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  code = tDecodeSStreamTaskCheckRsp(&decoder, &rsp);
965

966 967 968 969 970
  if (code < 0) {
    tDecoderClear(&decoder);
    return -1;
  }

971
  tDecoderClear(&decoder);
972
  tqDebug("tq recv task check rsp(reqId:0x%" PRIx64 ") %d at node %d check req from task:0x%x at node %d, status %d",
973 974
          rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, rsp.upstreamTaskId, rsp.upstreamNodeId, rsp.status);

L
Liu Jicong 已提交
975
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, rsp.upstreamTaskId);
976
  if (pTask == NULL) {
977 978
    tqError("tq failed to locate the stream task:0x%x vgId:%d, it may have been destroyed", rsp.upstreamTaskId,
            pTq->pStreamMeta->vgId);
979 980 981
    return -1;
  }

982
  code = streamProcessTaskCheckRsp(pTask, &rsp, sversion);
L
Liu Jicong 已提交
983 984
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return code;
985 986
}

987
int32_t tqProcessTaskDeployReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
988 989 990
  int32_t code = 0;
  int32_t vgId = TD_VID(pTq->pVnode);

5
54liuyao 已提交
991 992 993
  if (tsDisableStream) {
    return 0;
  }
994 995 996 997

  // 1.deserialize msg and build task
  SStreamTask* pTask = taosMemoryCalloc(1, sizeof(SStreamTask));
  if (pTask == NULL) {
998
    terrno = TSDB_CODE_OUT_OF_MEMORY;
dengyihao's avatar
dengyihao 已提交
999 1000
    tqError("vgId:%d failed to create stream task due to out of memory, alloc size:%d", vgId,
            (int32_t)sizeof(SStreamTask));
1001 1002
    return -1;
  }
1003

1004 1005
  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
1006
  code = tDecodeStreamTask(&decoder, pTask);
1007 1008 1009 1010 1011
  if (code < 0) {
    tDecoderClear(&decoder);
    taosMemoryFree(pTask);
    return -1;
  }
1012

1013 1014
  tDecoderClear(&decoder);

1015
  // 2.save task, use the newest commit version as the initial start version of stream task.
1016
  taosWLockLatch(&pTq->pStreamMeta->lock);
1017
  code = streamMetaAddDeployedTask(pTq->pStreamMeta, sversion, pTask);
1018
  int32_t numOfTasks = streamMetaGetNumOfTasks(pTq->pStreamMeta);
1019
  if (code < 0) {
1020
    tqError("vgId:%d failed to add s-task:%s, total:%d", vgId, pTask->id.idStr, numOfTasks);
1021
    taosWUnLockLatch(&pTq->pStreamMeta->lock);
1022 1023 1024
    return -1;
  }

1025 1026
  taosWUnLockLatch(&pTq->pStreamMeta->lock);

1027 1028
  // 3.go through recover steps to fill history
  if (pTask->fillHistory) {
1029
    streamTaskCheckDownstream(pTask, sversion);
1030 1031
  }

1032
  tqDebug("vgId:%d s-task:%s is deployed and add meta from mnd, status:%d, total:%d", vgId, pTask->id.idStr,
1033
          pTask->status.taskStatus, numOfTasks);
1034 1035 1036
  return 0;
}

L
Liu Jicong 已提交
1037 1038 1039 1040 1041
int32_t tqProcessTaskRecover1Req(STQ* pTq, SRpcMsg* pMsg) {
  int32_t code;
  char*   msg = pMsg->pCont;
  int32_t msgLen = pMsg->contLen;

1042
  SStreamRecoverStep1Req* pReq = (SStreamRecoverStep1Req*)msg;
L
Liu Jicong 已提交
1043
  SStreamTask*            pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
1044 1045 1046 1047 1048
  if (pTask == NULL) {
    return -1;
  }

  // check param
1049
  int64_t fillVer1 = pTask->chkInfo.version;
1050
  if (fillVer1 <= 0) {
L
Liu Jicong 已提交
1051
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1052 1053 1054 1055
    return -1;
  }

  // do recovery step 1
H
Haojun Liao 已提交
1056
  tqDebug("s-task:%s start non-blocking recover stage(step 1) scan", pTask->id.idStr);
H
Haojun Liao 已提交
1057
  int64_t st = taosGetTimestampMs();
1058

H
Haojun Liao 已提交
1059
  streamSourceRecoverScanStep1(pTask);
1060
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
H
Haojun Liao 已提交
1061 1062
    tqDebug("s-task:%s is dropped, abort recover in step1", pTask->id.idStr);

L
Liu Jicong 已提交
1063 1064 1065 1066
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    return 0;
  }

H
Haojun Liao 已提交
1067
  double el = (taosGetTimestampMs() - st) / 1000.0;
H
Haojun Liao 已提交
1068
  tqDebug("s-task:%s non-blocking recover stage(step 1) ended, elapsed time:%.2fs", pTask->id.idStr, el);
H
Haojun Liao 已提交
1069

1070 1071 1072 1073
  // build msg to launch next step
  SStreamRecoverStep2Req req;
  code = streamBuildSourceRecover2Req(pTask, &req);
  if (code < 0) {
L
Liu Jicong 已提交
1074
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1075 1076 1077
    return -1;
  }

L
Liu Jicong 已提交
1078
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1079
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
L
Liu Jicong 已提交
1080 1081 1082
    return 0;
  }

1083
  // serialize msg
L
Liu Jicong 已提交
1084 1085 1086 1087
  int32_t len = sizeof(SStreamRecoverStep1Req);

  void* serializedReq = rpcMallocCont(len);
  if (serializedReq == NULL) {
H
Haojun Liao 已提交
1088
    tqError("s-task:%s failed to prepare the step2 stage, out of memory", pTask->id.idStr);
L
Liu Jicong 已提交
1089 1090 1091 1092
    return -1;
  }

  memcpy(serializedReq, &req, len);
1093 1094

  // dispatch msg
H
Haojun Liao 已提交
1095
  tqDebug("s-task:%s start recover block stage", pTask->id.idStr);
1096

H
Haojun Liao 已提交
1097 1098
  SRpcMsg rpcMsg = {
      .code = 0, .contLen = len, .msgType = TDMT_VND_STREAM_RECOVER_BLOCKING_STAGE, .pCont = serializedReq};
1099 1100 1101 1102
  tmsgPutToQueue(&pTq->pVnode->msgCb, WRITE_QUEUE, &rpcMsg);
  return 0;
}

1103
int32_t tqProcessTaskRecover2Req(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
H
Haojun Liao 已提交
1104 1105
  int32_t code = 0;

1106
  SStreamRecoverStep2Req* pReq = (SStreamRecoverStep2Req*)msg;
H
Haojun Liao 已提交
1107 1108

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
1109 1110 1111 1112 1113
  if (pTask == NULL) {
    return -1;
  }

  // do recovery step 2
H
Haojun Liao 已提交
1114
  int64_t st = taosGetTimestampMs();
dengyihao's avatar
dengyihao 已提交
1115
  tqDebug("s-task:%s start step2 recover, ts:%" PRId64, pTask->id.idStr, st);
H
Haojun Liao 已提交
1116

1117
  code = streamSourceRecoverScanStep2(pTask, sversion);
1118
  if (code < 0) {
L
Liu Jicong 已提交
1119
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1120 1121 1122
    return -1;
  }

1123
  qDebug("s-task:%s set start wal scan start ver:%"PRId64, pTask->id.idStr, sversion);
1124

1125
  walReaderSeekVer(pTask->exec.pWalReader, sversion);
L
liuyao 已提交
1126
  pTask->chkInfo.currentVer = sversion;
1127

1128
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
L
Liu Jicong 已提交
1129 1130 1131 1132
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    return 0;
  }

1133 1134 1135
  // restore param
  code = streamRestoreParam(pTask);
  if (code < 0) {
L
Liu Jicong 已提交
1136
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1137 1138 1139 1140
    return -1;
  }

  // set status normal
H
Haojun Liao 已提交
1141
  tqDebug("s-task:%s blocking stage completed, set the status to be normal", pTask->id.idStr);
1142 1143
  code = streamSetStatusNormal(pTask);
  if (code < 0) {
L
Liu Jicong 已提交
1144
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1145 1146 1147
    return -1;
  }

dengyihao's avatar
dengyihao 已提交
1148
  double el = (taosGetTimestampMs() - st) / 1000.0;
H
Haojun Liao 已提交
1149
  tqDebug("s-task:%s step2 recover finished, el:%.2fs", pTask->id.idStr, el);
H
Haojun Liao 已提交
1150

1151 1152 1153
  // dispatch recover finish req to all related downstream task
  code = streamDispatchRecoverFinishReq(pTask);
  if (code < 0) {
L
Liu Jicong 已提交
1154
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1155 1156 1157
    return -1;
  }

L
Liu Jicong 已提交
1158 1159 1160
  atomic_store_8(&pTask->fillHistory, 0);
  streamMetaSaveTask(pTq->pStreamMeta, pTask);

L
Liu Jicong 已提交
1161
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1162 1163 1164
  return 0;
}

L
Liu Jicong 已提交
1165 1166 1167
int32_t tqProcessTaskRecoverFinishReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msg = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);
1168 1169

  // deserialize
1170 1171 1172
  SStreamRecoverFinishReq req;

  SDecoder decoder;
X
Xiaoyu Wang 已提交
1173
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
1174 1175 1176
  tDecodeSStreamRecoverFinishReq(&decoder, &req);
  tDecoderClear(&decoder);

1177
  // find task
L
Liu Jicong 已提交
1178
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.taskId);
1179 1180 1181
  if (pTask == NULL) {
    return -1;
  }
1182
  // do process request
1183
  if (streamProcessRecoverFinishReq(pTask, req.childId) < 0) {
L
Liu Jicong 已提交
1184
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1185 1186 1187
    return -1;
  }

L
Liu Jicong 已提交
1188
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1189
  return 0;
L
Liu Jicong 已提交
1190
}
L
Liu Jicong 已提交
1191

L
Liu Jicong 已提交
1192 1193 1194 1195 1196
int32_t tqProcessTaskRecoverFinishRsp(STQ* pTq, SRpcMsg* pMsg) {
  //
  return 0;
}

1197 1198 1199 1200
int32_t extractDelDataBlock(const void* pData, int32_t len, int64_t ver, SStreamRefDataBlock** pRefBlock) {
  SDecoder*   pCoder = &(SDecoder){0};
  SDeleteRes* pRes = &(SDeleteRes){0};

H
Haojun Liao 已提交
1201 1202
  *pRefBlock = NULL;

1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249
  pRes->uidList = taosArrayInit(0, sizeof(tb_uid_t));
  if (pRes->uidList == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  tDecoderInit(pCoder, (uint8_t*)pData, len);
  tDecodeDeleteRes(pCoder, pRes);
  tDecoderClear(pCoder);

  int32_t numOfTables = taosArrayGetSize(pRes->uidList);
  if (numOfTables == 0 || pRes->affectedRows == 0) {
    taosArrayDestroy(pRes->uidList);
    return TSDB_CODE_SUCCESS;
  }

  SSDataBlock* pDelBlock = createSpecialDataBlock(STREAM_DELETE_DATA);
  blockDataEnsureCapacity(pDelBlock, numOfTables);
  pDelBlock->info.rows = numOfTables;
  pDelBlock->info.version = ver;

  for (int32_t i = 0; i < numOfTables; i++) {
    // start key column
    SColumnInfoData* pStartCol = taosArrayGet(pDelBlock->pDataBlock, START_TS_COLUMN_INDEX);
    colDataSetVal(pStartCol, i, (const char*)&pRes->skey, false);  // end key column
    SColumnInfoData* pEndCol = taosArrayGet(pDelBlock->pDataBlock, END_TS_COLUMN_INDEX);
    colDataSetVal(pEndCol, i, (const char*)&pRes->ekey, false);
    // uid column
    SColumnInfoData* pUidCol = taosArrayGet(pDelBlock->pDataBlock, UID_COLUMN_INDEX);
    int64_t*         pUid = taosArrayGet(pRes->uidList, i);
    colDataSetVal(pUidCol, i, (const char*)pUid, false);

    colDataSetNULL(taosArrayGet(pDelBlock->pDataBlock, GROUPID_COLUMN_INDEX), i);
    colDataSetNULL(taosArrayGet(pDelBlock->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX), i);
    colDataSetNULL(taosArrayGet(pDelBlock->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX), i);
  }

  taosArrayDestroy(pRes->uidList);
  *pRefBlock = taosAllocateQitem(sizeof(SStreamRefDataBlock), DEF_QITEM, 0);
  if (pRefBlock == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  (*pRefBlock)->type = STREAM_INPUT__REF_DATA_BLOCK;
  (*pRefBlock)->pBlock = pDelBlock;
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1250 1251
int32_t tqProcessTaskRunReq(STQ* pTq, SRpcMsg* pMsg) {
  SStreamTaskRunReq* pReq = pMsg->pCont;
1252 1253 1254 1255

  int32_t taskId = pReq->taskId;
  int32_t vgId = TD_VID(pTq->pVnode);

1256 1257
  if (taskId == WAL_READ_TASKS_ID) {  // all tasks are extracted submit data from the wal
    tqStreamTasksScanWal(pTq);
L
Liu Jicong 已提交
1258
    return 0;
1259
  }
1260

1261
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
1262 1263
  if (pTask != NULL) {
    if (pTask->status.taskStatus == TASK_STATUS__NORMAL) {
dengyihao's avatar
dengyihao 已提交
1264 1265
      tqDebug("vgId:%d s-task:%s start to process block from wal, last chk point:%" PRId64, vgId, pTask->id.idStr,
              pTask->chkInfo.version);
1266
      streamProcessRunReq(pTask);
1267
    } else {
L
liuyao 已提交
1268
      if (streamTaskShouldPause(&pTask->status)) {
L
liuyao 已提交
1269
        atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);
L
liuyao 已提交
1270
      }
1271
      tqDebug("vgId:%d s-task:%s ignore run req since not in ready state", vgId, pTask->id.idStr);
1272
    }
1273

L
Liu Jicong 已提交
1274
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1275
    tqStartStreamTasks(pTq);
L
Liu Jicong 已提交
1276
    return 0;
1277
  } else {
1278
    tqError("vgId:%d failed to found s-task, taskId:%d", vgId, taskId);
1279
    return -1;
L
Liu Jicong 已提交
1280
  }
L
Liu Jicong 已提交
1281 1282
}

L
Liu Jicong 已提交
1283
int32_t tqProcessTaskDispatchReq(STQ* pTq, SRpcMsg* pMsg, bool exec) {
dengyihao's avatar
dengyihao 已提交
1284 1285 1286
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);
1287 1288 1289 1290

  SStreamDispatchReq req = {0};

  SDecoder decoder;
L
Liu Jicong 已提交
1291
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
1292
  tDecodeStreamDispatchReq(&decoder, &req);
L
Liu Jicong 已提交
1293

1294
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.taskId);
L
Liu Jicong 已提交
1295
  if (pTask) {
1296
    SRpcMsg rsp = {.info = pMsg->info, .code = 0};
1297
    streamProcessDispatchMsg(pTask, &req, &rsp, exec);
L
Liu Jicong 已提交
1298
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
L
Liu Jicong 已提交
1299
    return 0;
1300
  } else {
L
liuyao 已提交
1301
    tDeleteStreamDispatchReq(&req);
1302
    return -1;
L
Liu Jicong 已提交
1303
  }
L
Liu Jicong 已提交
1304 1305
}

L
Liu Jicong 已提交
1306 1307
int32_t tqProcessTaskDispatchRsp(STQ* pTq, SRpcMsg* pMsg) {
  SStreamDispatchRsp* pRsp = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
1308
  int32_t             taskId = ntohl(pRsp->upstreamTaskId);
L
Liu Jicong 已提交
1309
  SStreamTask*        pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
1310 1311

  int32_t vgId = pTq->pStreamMeta->vgId;
L
Liu Jicong 已提交
1312
  if (pTask) {
1313
    streamProcessDispatchRsp(pTask, pRsp, pMsg->code);
L
Liu Jicong 已提交
1314
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
L
Liu Jicong 已提交
1315
    return 0;
1316
  } else {
1317
    tqDebug("vgId:%d failed to handle the dispatch rsp, since find task:0x%x failed", vgId, taskId);
1318
    return TSDB_CODE_INVALID_MSG;
L
Liu Jicong 已提交
1319
  }
L
Liu Jicong 已提交
1320
}
L
Liu Jicong 已提交
1321

1322
int32_t tqProcessTaskDropReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
L
Liu Jicong 已提交
1323
  SVDropStreamTaskReq* pReq = (SVDropStreamTaskReq*)msg;
1324 1325
  tqDebug("vgId:%d receive msg to drop stream task:0x%x", TD_VID(pTq->pVnode), pReq->taskId);

1326
  streamMetaRemoveTask(pTq->pStreamMeta, pReq->taskId);
L
Liu Jicong 已提交
1327
  return 0;
L
Liu Jicong 已提交
1328
}
L
Liu Jicong 已提交
1329

5
54liuyao 已提交
1330 1331
int32_t tqProcessTaskPauseReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SVPauseStreamTaskReq* pReq = (SVPauseStreamTaskReq*)msg;
dengyihao's avatar
dengyihao 已提交
1332
  SStreamTask*          pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
L
liuyao 已提交
1333 1334
  if (pTask) {
    tqDebug("vgId:%d s-task:%s set pause flag", pTq->pStreamMeta->vgId, pTask->id.idStr);
L
liuyao 已提交
1335
    atomic_store_8(&pTask->status.keepTaskStatus, pTask->status.taskStatus);
L
liuyao 已提交
1336 1337 1338
    atomic_store_8(&pTask->status.taskStatus, TASK_STATUS__PAUSE);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  }
5
54liuyao 已提交
1339 1340 1341 1342 1343
  return 0;
}

int32_t tqProcessTaskResumeReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SVResumeStreamTaskReq* pReq = (SVResumeStreamTaskReq*)msg;
1344 1345

  int32_t      vgId = pTq->pStreamMeta->vgId;
L
liuyao 已提交
1346 1347
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
  if (pTask) {
L
liuyao 已提交
1348
    atomic_store_8(&pTask->status.taskStatus, pTask->status.keepTaskStatus);
1349 1350

    // no lock needs to secure the access of the version
1351 1352 1353 1354 1355 1356
    if (pReq->igUntreated && pTask->taskLevel == TASK_LEVEL__SOURCE) {
      // discard all the data  when the stream task is suspended.
      walReaderSetSkipToVersion(pTask->exec.pWalReader, sversion);
      tqDebug("vgId:%d s-task:%s resume to exec, prev paused version:%" PRId64 ", start from vnode ver:%" PRId64
              ", schedStatus:%d",
              vgId, pTask->id.idStr, pTask->chkInfo.currentVer, sversion, pTask->status.schedStatus);
1357
    } else {  // from the previous paused version and go on
1358 1359
      tqDebug("vgId:%d s-task:%s resume to exec, from paused ver:%" PRId64 ", vnode ver:%" PRId64 ", schedStatus:%d",
              vgId, pTask->id.idStr, pTask->chkInfo.currentVer, sversion, pTask->status.schedStatus);
1360 1361
    }

L
liuyao 已提交
1362
    if (pTask->taskLevel == TASK_LEVEL__SOURCE && taosQueueItemSize(pTask->inputQueue->queue) == 0) {
L
liuyao 已提交
1363 1364 1365 1366
      tqStartStreamTasks(pTq);
    } else {
      streamSchedExec(pTask);
    }
L
liuyao 已提交
1367
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1368 1369
  } else {
    tqError("vgId:%d failed to find the s-task:0x%x for resume stream task", vgId, pReq->taskId);
L
liuyao 已提交
1370
  }
1371

5
54liuyao 已提交
1372 1373 1374
  return 0;
}

L
Liu Jicong 已提交
1375 1376 1377 1378 1379 1380
int32_t tqProcessTaskRetrieveReq(STQ* pTq, SRpcMsg* pMsg) {
  char*              msgStr = pMsg->pCont;
  char*              msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t            msgLen = pMsg->contLen - sizeof(SMsgHead);
  SStreamRetrieveReq req;
  SDecoder           decoder;
1381
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
L
Liu Jicong 已提交
1382
  tDecodeStreamRetrieveReq(&decoder, &req);
L
Liu Jicong 已提交
1383
  tDecoderClear(&decoder);
L
Liu Jicong 已提交
1384
  int32_t      taskId = req.dstTaskId;
L
Liu Jicong 已提交
1385
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
L
Liu Jicong 已提交
1386
  if (pTask) {
1387
    SRpcMsg rsp = {.info = pMsg->info, .code = 0};
L
Liu Jicong 已提交
1388
    streamProcessRetrieveReq(pTask, &req, &rsp);
L
Liu Jicong 已提交
1389
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
L
Liu Jicong 已提交
1390
    tDeleteStreamRetrieveReq(&req);
L
Liu Jicong 已提交
1391
    return 0;
L
Liu Jicong 已提交
1392
  } else {
L
liuyao 已提交
1393
    tDeleteStreamRetrieveReq(&req);
L
Liu Jicong 已提交
1394
    return -1;
L
Liu Jicong 已提交
1395 1396 1397 1398 1399 1400 1401
  }
}

int32_t tqProcessTaskRetrieveRsp(STQ* pTq, SRpcMsg* pMsg) {
  //
  return 0;
}
L
Liu Jicong 已提交
1402

1403 1404 1405 1406 1407 1408
int32_t vnodeEnqueueStreamMsg(SVnode* pVnode, SRpcMsg* pMsg) {
  STQ*      pTq = pVnode->pTq;
  SMsgHead* msgStr = pMsg->pCont;
  char*     msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t   msgLen = pMsg->contLen - sizeof(SMsgHead);
  int32_t   code = 0;
L
Liu Jicong 已提交
1409 1410 1411

  SStreamDispatchReq req;
  SDecoder           decoder;
1412
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
L
Liu Jicong 已提交
1413 1414
  if (tDecodeStreamDispatchReq(&decoder, &req) < 0) {
    code = TSDB_CODE_MSG_DECODE_ERROR;
L
Liu Jicong 已提交
1415
    tDecoderClear(&decoder);
L
Liu Jicong 已提交
1416 1417
    goto FAIL;
  }
L
Liu Jicong 已提交
1418
  tDecoderClear(&decoder);
L
Liu Jicong 已提交
1419

L
Liu Jicong 已提交
1420
  int32_t taskId = req.taskId;
L
Liu Jicong 已提交
1421

L
Liu Jicong 已提交
1422
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
L
Liu Jicong 已提交
1423
  if (pTask) {
1424
    SRpcMsg rsp = {.info = pMsg->info, .code = 0};
1425
    streamProcessDispatchMsg(pTask, &req, &rsp, false);
L
Liu Jicong 已提交
1426
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
L
Liu Jicong 已提交
1427 1428
    rpcFreeCont(pMsg->pCont);
    taosFreeQitem(pMsg);
1429
    return 0;
5
54liuyao 已提交
1430 1431
  } else {
    tDeleteStreamDispatchReq(&req);
L
Liu Jicong 已提交
1432
  }
L
Liu Jicong 已提交
1433

1434 1435
  code = TSDB_CODE_STREAM_TASK_NOT_EXIST;

L
Liu Jicong 已提交
1436
FAIL:
1437 1438 1439 1440
  if (pMsg->info.handle == NULL) return -1;

  SMsgHead* pRspHead = rpcMallocCont(sizeof(SMsgHead) + sizeof(SStreamDispatchRsp));
  if (pRspHead == NULL) {
1441
    SRpcMsg rsp = {.code = TSDB_CODE_OUT_OF_MEMORY, .info = pMsg->info};
1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457
    tqDebug("send dispatch error rsp, code: %x", code);
    tmsgSendRsp(&rsp);
    rpcFreeCont(pMsg->pCont);
    taosFreeQitem(pMsg);
    return -1;
  }

  pRspHead->vgId = htonl(req.upstreamNodeId);
  SStreamDispatchRsp* pRsp = POINTER_SHIFT(pRspHead, sizeof(SMsgHead));
  pRsp->streamId = htobe64(req.streamId);
  pRsp->upstreamTaskId = htonl(req.upstreamTaskId);
  pRsp->upstreamNodeId = htonl(req.upstreamNodeId);
  pRsp->downstreamNodeId = htonl(pVnode->config.vgId);
  pRsp->downstreamTaskId = htonl(req.taskId);
  pRsp->inputStatus = TASK_OUTPUT_STATUS__NORMAL;

L
Liu Jicong 已提交
1458
  SRpcMsg rsp = {
1459
      .code = code, .info = pMsg->info, .contLen = sizeof(SMsgHead) + sizeof(SStreamDispatchRsp), .pCont = pRspHead};
1460
  tqDebug("send dispatch error rsp, code: %x", code);
L
Liu Jicong 已提交
1461
  tmsgSendRsp(&rsp);
L
Liu Jicong 已提交
1462 1463
  rpcFreeCont(pMsg->pCont);
  taosFreeQitem(pMsg);
1464
  return -1;
L
Liu Jicong 已提交
1465
}
L
Liu Jicong 已提交
1466

1467
int32_t tqCheckLogInWal(STQ* pTq, int64_t sversion) { return sversion <= pTq->walLogLastVer; }
1468

1469
int32_t tqStartStreamTasks(STQ* pTq) {
1470
  int32_t      vgId = TD_VID(pTq->pVnode);
1471
  SStreamMeta* pMeta = pTq->pStreamMeta;
1472

1473
  taosWLockLatch(&pMeta->lock);
1474

1475
  int32_t numOfTasks = taosArrayGetSize(pMeta->pTaskList);
1476
  if (numOfTasks == 0) {
1477
    tqInfo("vgId:%d no stream tasks exist", vgId);
1478
    taosWUnLockLatch(&pMeta->lock);
1479 1480 1481
    return 0;
  }

1482
  pMeta->walScanCounter += 1;
1483

1484 1485
  if (pMeta->walScanCounter > 1) {
    tqDebug("vgId:%d wal read task has been launched, remain scan times:%d", vgId, pMeta->walScanCounter);
1486
    taosWUnLockLatch(&pMeta->lock);
1487 1488 1489
    return 0;
  }

1490 1491 1492
  SStreamTaskRunReq* pRunReq = rpcMallocCont(sizeof(SStreamTaskRunReq));
  if (pRunReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
H
Haojun Liao 已提交
1493
    tqError("vgId:%d failed to create msg to start wal scanning to launch stream tasks, code:%s", vgId, terrstr());
1494
    taosWUnLockLatch(&pMeta->lock);
1495 1496 1497
    return -1;
  }

H
Haojun Liao 已提交
1498
  tqDebug("vgId:%d create msg to start wal scan to launch stream tasks, numOfTasks:%d", vgId, numOfTasks);
1499 1500
  pRunReq->head.vgId = vgId;
  pRunReq->streamId = 0;
1501
  pRunReq->taskId = WAL_READ_TASKS_ID;
1502 1503 1504

  SRpcMsg msg = {.msgType = TDMT_STREAM_TASK_RUN, .pCont = pRunReq, .contLen = sizeof(SStreamTaskRunReq)};
  tmsgPutToQueue(&pTq->pVnode->msgCb, STREAM_QUEUE, &msg);
1505
  taosWUnLockLatch(&pMeta->lock);
1506 1507 1508

  return 0;
}