tq.c 45.2 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
S
Shengliang Guan 已提交
14 15
 */

H
Hongze Cheng 已提交
16
#include "tq.h"
S
Shengliang Guan 已提交
17

dengyihao's avatar
dengyihao 已提交
18 19 20
// 0: not init
// 1: already inited
// 2: wait to be inited or cleaned up
21
#define WAL_READ_TASKS_ID (-1)
22

23
static int32_t tqInitialize(STQ* pTq);
dengyihao's avatar
dengyihao 已提交
24

L
Liu Jicong 已提交
25
// Initialize the process-wide TQ state: the shared timer and the stream module.
//
// tqMgmt.inited is used as a small state flag:
//   0 - not initialized, 1 - initialized, 2 - an init or cleanup is in progress.
// The caller that moves the flag from 0 to 2 performs the initialization; callers that
// observe 2 spin until the in-progress transition finishes.
//
// Returns 0 on success (including when the module was already initialized), -1 on failure.
// On any failure the flag is put back to 0 so that a later call can retry.
int32_t tqInit() {
  int8_t old;
  while (1) {
    old = atomic_val_compare_exchange_8(&tqMgmt.inited, 0, 2);
    if (old != 2) break;
  }

  if (old == 0) {
    tqMgmt.timer = taosTmrInit(10000, 100, 10000, "TQ");
    if (tqMgmt.timer == NULL) {
      atomic_store_8(&tqMgmt.inited, 0);
      return -1;
    }

    if (streamInit() < 0) {
      // Undo the timer setup and release the transitional state; leaving the flag at 2
      // would make every later tqInit()/tqCleanUp() spin forever.
      taosTmrCleanUp(tqMgmt.timer);
      tqMgmt.timer = NULL;
      atomic_store_8(&tqMgmt.inited, 0);
      return -1;
    }

    atomic_store_8(&tqMgmt.inited, 1);
  }

  return 0;
}
L
Liu Jicong 已提交
46

47
// Tear down the process-wide TQ state set up by tqInit().
//
// Only the caller that moves tqMgmt.inited from 1 to 2 performs the teardown; while the
// flag reads 2 (another init/cleanup in progress) the call spins. If the module was not
// initialized, nothing is done.
void tqCleanUp() {
  int8_t prev;
  do {
    prev = atomic_val_compare_exchange_8(&tqMgmt.inited, 1, 2);
  } while (prev == 2);

  if (prev != 1) {
    return;
  }

  taosTmrCleanUp(tqMgmt.timer);
  streamCleanUp();
  atomic_store_8(&tqMgmt.inited, 0);
}
L
Liu Jicong 已提交
60

61
static void destroyTqHandle(void* data) {
62 63 64
  STqHandle* pData = (STqHandle*)data;
  qDestroyTask(pData->execHandle.task);
  if (pData->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
L
Liu Jicong 已提交
65
    taosMemoryFreeClear(pData->execHandle.execCol.qmsg);
66
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__DB) {
67
    tqCloseReader(pData->execHandle.pTqReader);
68 69
    walCloseReader(pData->pWalReader);
    taosHashCleanup(pData->execHandle.execDb.pFilterOutTbUid);
L
Liu Jicong 已提交
70
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__TABLE) {
71
    walCloseReader(pData->pWalReader);
72
    tqCloseReader(pData->execHandle.pTqReader);
73
  }
74 75 76 77
  if(pData->msg != NULL) {
    rpcFreeCont(pData->msg->pCont);
    taosMemoryFree(pData->msg);
    pData->msg = NULL;
D
dapan1121 已提交
78
  }
L
Liu Jicong 已提交
79 80
}

81 82 83 84 85
// Returns true only when both offsets are of type TMQ_OFFSET__LOG and the left
// version is not greater than the right one; any other type combination yields false.
static bool tqOffsetLessOrEqual(const STqOffset* pLeft, const STqOffset* pRight) {
  if (pLeft->val.type != TMQ_OFFSET__LOG || pRight->val.type != TMQ_OFFSET__LOG) {
    return false;
  }
  return pLeft->val.version <= pRight->val.version;
}

L
Liu Jicong 已提交
86
// Create and initialize the TQ object of one vnode.
//
// path   - directory path of the tq data; duplicated into the returned object.
// pVnode - owning vnode; its WAL's last version is recorded in walLogLastVer.
//
// Returns the new STQ, or NULL on failure. On allocation failure terrno is set to
// TSDB_CODE_OUT_OF_MEMORY. When tqInitialize() fails the object is released via tqClose().
STQ* tqOpen(const char* path, SVnode* pVnode) {
  STQ* pTq = taosMemoryCalloc(1, sizeof(STQ));
  if (pTq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pTq->path = taosStrdup(path);
  pTq->pVnode = pVnode;
  pTq->walLogLastVer = pVnode->pWal->vers.lastVer;

  pTq->pHandle = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);
  pTq->pPushMgr = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
  pTq->pCheckInfo = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);

  // None of the later steps can work without these containers, so bail out early and
  // release only what was actually allocated here.
  if (pTq->path == NULL || pTq->pHandle == NULL || pTq->pPushMgr == NULL || pTq->pCheckInfo == NULL) {
    if (pTq->pHandle != NULL) taosHashCleanup(pTq->pHandle);
    if (pTq->pPushMgr != NULL) taosHashCleanup(pTq->pPushMgr);
    if (pTq->pCheckInfo != NULL) taosHashCleanup(pTq->pCheckInfo);
    if (pTq->path != NULL) taosMemoryFree(pTq->path);
    taosMemoryFree(pTq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // entries removed from these tables are released by the registered destructors
  taosHashSetFreeFp(pTq->pHandle, destroyTqHandle);
  taosHashSetFreeFp(pTq->pCheckInfo, (FDelete)tDeleteSTqCheckInfo);

  taosInitRWLatch(&pTq->lock);

  int32_t code = tqInitialize(pTq);
  if (code != TSDB_CODE_SUCCESS) {
    tqClose(pTq);
    return NULL;
  }

  return pTq;
}

// Second stage of tqOpen(): open the tq meta store, the offset store and the stream meta,
// then load the stream tasks. Returns 0 on success, -1 as soon as any step fails
// (nothing is rolled back here; tqOpen() calls tqClose() on failure).
int32_t tqInitialize(STQ* pTq) {
  int32_t code = tqMetaOpen(pTq);
  if (code < 0) {
    return -1;
  }

  pTq->pOffsetStore = tqOffsetOpen(pTq);
  if (!pTq->pOffsetStore) {
    return -1;
  }

  pTq->pStreamMeta = streamMetaOpen(pTq->path, pTq, (FTaskExpand*)tqExpandTask, pTq->pVnode->config.vgId);
  if (!pTq->pStreamMeta) {
    return -1;
  }

  // the version is kept in task's meta data
  // todo check if this version is required or not
  code = streamLoadTasks(pTq->pStreamMeta, walGetCommittedVer(pTq->pVnode->pWal));
  return (code < 0) ? -1 : 0;
}
L
Liu Jicong 已提交
138

L
Liu Jicong 已提交
139
// Release a TQ object created by tqOpen(): the offset store, the three hash tables,
// the duplicated path, the tq meta store, the stream meta and finally the object itself.
// A NULL pTq is ignored.
void tqClose(STQ* pTq) {
  if (pTq != NULL) {
    tqOffsetClose(pTq->pOffsetStore);

    taosHashCleanup(pTq->pHandle);
    taosHashCleanup(pTq->pPushMgr);
    taosHashCleanup(pTq->pCheckInfo);

    taosMemoryFree(pTq->path);

    tqMetaClose(pTq);
    streamMetaClose(pTq->pStreamMeta);

    taosMemoryFree(pTq);
  }
}
L
Liu Jicong 已提交
153

H
Haojun Liao 已提交
154 155 156 157 158 159 160 161 162 163 164 165 166
// Mark every stream task of this TQ as stopped and kill its executor.
// The whole walk over the task table happens under the stream meta write latch.
// A NULL pTq is ignored.
void tqNotifyClose(STQ* pTq) {
  if (pTq == NULL) {
    return;
  }

  taosWLockLatch(&pTq->pStreamMeta->lock);

  for (void* pIter = taosHashIterate(pTq->pStreamMeta->pTasks, NULL); pIter != NULL;
       pIter = taosHashIterate(pTq->pStreamMeta->pTasks, pIter)) {
    // each table entry stores a pointer to the task
    SStreamTask* pTask = *(SStreamTask**)pIter;

    tqDebug("vgId:%d s-task:%s set dropping flag", pTq->pStreamMeta->vgId, pTask->id.idStr);
    pTask->status.taskStatus = TASK_STATUS__STOP;

    // measure how long killing the executor takes, for the debug log only
    int64_t startMs = taosGetTimestampMs();
    qKillTask(pTask->exec.pExecutor, TSDB_CODE_SUCCESS);
    int64_t elapsedMs = taosGetTimestampMs() - startMs;

    tqDebug("vgId:%d s-task:%s is closed in %" PRId64 " ms", pTq->pStreamMeta->vgId, pTask->id.idStr, elapsedMs);
  }

  taosWUnLockLatch(&pTq->pStreamMeta->lock);
}

D
dapan1121 已提交
179 180
static int32_t doSendDataRsp(const SRpcHandleInfo* pRpcHandleInfo, const SMqDataRsp* pRsp, int32_t epoch,
                             int64_t consumerId, int32_t type) {
L
Liu Jicong 已提交
181 182
  int32_t len = 0;
  int32_t code = 0;
D
dapan1121 已提交
183 184 185 186 187 188

  if (type == TMQ_MSG_TYPE__POLL_RSP) {
    tEncodeSize(tEncodeSMqDataRsp, pRsp, len, code);
  } else if (type == TMQ_MSG_TYPE__TAOSX_RSP) {
    tEncodeSize(tEncodeSTaosxRsp, (STaosxRsp*)pRsp, len, code);
  }
L
Liu Jicong 已提交
189 190 191 192 193 194 195 196 197 198 199

  if (code < 0) {
    return -1;
  }

  int32_t tlen = sizeof(SMqRspHead) + len;
  void*   buf = rpcMallocCont(tlen);
  if (buf == NULL) {
    return -1;
  }

D
dapan1121 已提交
200 201 202
  ((SMqRspHead*)buf)->mqMsgType = type;
  ((SMqRspHead*)buf)->epoch = epoch;
  ((SMqRspHead*)buf)->consumerId = consumerId;
L
Liu Jicong 已提交
203 204 205 206 207 208

  void* abuf = POINTER_SHIFT(buf, sizeof(SMqRspHead));

  SEncoder encoder = {0};
  tEncoderInit(&encoder, abuf, len);

D
dapan1121 已提交
209 210 211
  if (type == TMQ_MSG_TYPE__POLL_RSP) {
    tEncodeSMqDataRsp(&encoder, pRsp);
  } else if (type == TMQ_MSG_TYPE__TAOSX_RSP) {
X
Xiaoyu Wang 已提交
212
    tEncodeSTaosxRsp(&encoder, (STaosxRsp*)pRsp);
dengyihao's avatar
dengyihao 已提交
213
  }
L
Liu Jicong 已提交
214

wmmhello's avatar
wmmhello 已提交
215
  tEncoderClear(&encoder);
L
Liu Jicong 已提交
216 217

  SRpcMsg rsp = {
D
dapan1121 已提交
218
      .info = *pRpcHandleInfo,
L
Liu Jicong 已提交
219 220 221 222
      .pCont = buf,
      .contLen = tlen,
      .code = 0,
  };
L
Liu Jicong 已提交
223

L
Liu Jicong 已提交
224
  tmsgSendRsp(&rsp);
L
Liu Jicong 已提交
225 226
  return 0;
}
L
Liu Jicong 已提交
227

228 229 230 231 232 233
// Send an empty poll response for the request stored in pHandle->msg, using the consumer id
// and epoch saved in the handle, and log it. The result of doSendDataRsp() is not checked;
// the function always returns 0.
int32_t tqPushDataRsp(STQ* pTq, STqHandle* pHandle) {
  SMqDataRsp dataRsp = {
      .head = {.consumerId = pHandle->consumerId, .epoch = pHandle->epoch, .mqMsgType = TMQ_MSG_TYPE__POLL_RSP},
  };

  doSendDataRsp(&pHandle->msg->info, &dataRsp, pHandle->epoch, pHandle->consumerId, TMQ_MSG_TYPE__POLL_RSP);

  // printable forms of the request/response offsets, for the debug log only
  char reqStr[80] = {0};
  char rspStr[80] = {0};
  tFormatOffset(reqStr, tListLen(reqStr), &dataRsp.reqOffset);
  tFormatOffset(rspStr, tListLen(rspStr), &dataRsp.rspOffset);

  tqDebug("vgId:%d, from consumer:0x%" PRIx64 " (epoch %d) push rsp, block num: %d, req:%s, rsp:%s",
          TD_VID(pTq->pVnode), dataRsp.head.consumerId, dataRsp.head.epoch, dataRsp.blockNum, reqStr, rspStr);
  return 0;
}

D
dapan1121 已提交
244 245
// Send pRsp as the answer to poll request pReq (epoch and consumer id are taken from the
// request) and log it. The result of doSendDataRsp() is not checked; always returns 0.
int32_t tqSendDataRsp(STQ* pTq, const SRpcMsg* pMsg, const SMqPollReq* pReq, const SMqDataRsp* pRsp, int32_t type) {
  doSendDataRsp(&pMsg->info, pRsp, pReq->epoch, pReq->consumerId, type);

  // printable forms of the request/response offsets, for the debug log only
  char reqStr[80] = {0};
  char rspStr[80] = {0};
  tFormatOffset(reqStr, sizeof(reqStr), &pRsp->reqOffset);
  tFormatOffset(rspStr, sizeof(rspStr), &pRsp->rspOffset);

  tqDebug("vgId:%d consumer:0x%" PRIx64 " (epoch %d) send rsp, block num:%d, req:%s, rsp:%s, reqId:0x%" PRIx64,
          TD_VID(pTq->pVnode), pReq->consumerId, pReq->epoch, pRsp->blockNum, reqStr, rspStr, pReq->reqId);

  return 0;
}

258
// Process an offset-commit message for one subscription key.
//
// msg/msgLen - encoded STqOffset.
// sversion   - version passed in by the caller; when a log-type offset equals sversion - 1
//              the committed version is advanced by one.
//
// The offset is written to the offset store unless a saved log offset is already at or
// beyond it. For log offsets, the WAL reference of the matching handle (if any) is moved
// to the committed version.
//
// Returns 0 on success or when no update is needed, -1 on decode failure, invalid offset
// type, offset store write failure or WAL reference failure.
int32_t tqProcessOffsetCommitReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  STqOffset offset = {0};
  int32_t   vgId = TD_VID(pTq->pVnode);

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  if (tDecodeSTqOffset(&decoder, &offset) < 0) {
    // release the decoder on the failure path as well
    tDecoderClear(&decoder);
    return -1;
  }

  tDecoderClear(&decoder);

  if (offset.val.type == TMQ_OFFSET__SNAPSHOT_DATA || offset.val.type == TMQ_OFFSET__SNAPSHOT_META) {
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:snapshot) uid:%" PRId64 ", ts:%" PRId64,
            offset.subKey, vgId, offset.val.uid, offset.val.ts);
  } else if (offset.val.type == TMQ_OFFSET__LOG) {
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:log) version:%" PRId64, offset.subKey, vgId,
            offset.val.version);
    if (offset.val.version + 1 == sversion) {
      offset.val.version += 1;
    }
  } else {
    tqError("invalid commit offset type:%d", offset.val.type);
    return -1;
  }

  STqOffset* pSavedOffset = tqOffsetRead(pTq->pOffsetStore, offset.subKey);
  if (pSavedOffset != NULL && tqOffsetLessOrEqual(&offset, pSavedOffset)) {
    return 0;  // no need to update the offset value
  }

  // save the new offset value
  if (tqOffsetWrite(pTq->pOffsetStore, &offset) < 0) {
    return -1;
  }

  if (offset.val.type == TMQ_OFFSET__LOG) {
    STqHandle* pHandle = taosHashGet(pTq->pHandle, offset.subKey, strlen(offset.subKey));
    if (pHandle && (walRefVer(pHandle->pRef, offset.val.version) < 0)) {
      return -1;
    }
  }

  return 0;
}

L
Liu Jicong 已提交
304
// Check whether column colId of table tbUid may be modified.
// Walks every entry of pTq->pCheckInfo; if an entry for tbUid lists colId in its
// colIdList, the iteration is cancelled and -1 is returned. Otherwise returns 0.
int32_t tqCheckColModifiable(STQ* pTq, int64_t tbUid, int32_t colId) {
  for (void* pIter = taosHashIterate(pTq->pCheckInfo, NULL); pIter != NULL;
       pIter = taosHashIterate(pTq->pCheckInfo, pIter)) {
    STqCheckInfo* pInfo = (STqCheckInfo*)pIter;
    if (pInfo->ntbUid != tbUid) {
      continue;
    }

    int32_t numOfCols = taosArrayGetSize(pInfo->colIdList);
    for (int32_t idx = 0; idx < numOfCols; ++idx) {
      int16_t* pForbidden = (int16_t*)taosArrayGet(pInfo->colIdList, idx);
      if (*pForbidden == colId) {
        // leaving the loop early: the iterator must be cancelled explicitly
        taosHashCancelIterate(pTq->pCheckInfo, pIter);
        return -1;
      }
    }
  }

  return 0;
}

D
dapan1121 已提交
330
// Process a consumer poll request.
//
// Steps: deserialize the request, look up the handle for the subscription key, verify that
// the handle belongs to the requesting consumer, raise the saved epoch to the request epoch
// if the latter is newer, then hand over to tqExtractDataForMq().
//
// Returns the result of tqExtractDataForMq(), or -1 with terrno set to
// TSDB_CODE_INVALID_MSG (bad message / unknown subkey) or
// TSDB_CODE_TMQ_CONSUMER_MISMATCH (handle owned by another consumer).
int32_t tqProcessPollReq(STQ* pTq, SRpcMsg* pMsg) {
  SMqPollReq req = {0};
  if (tDeserializeSMqPollReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pMsg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int64_t      consumerId = req.consumerId;
  int32_t      reqEpoch = req.epoch;
  STqOffsetVal reqOffset = req.reqOffset;
  int32_t      vgId = TD_VID(pTq->pVnode);

  // 1. find handle
  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
  if (pHandle == NULL) {
    tqError("tmq poll: consumer:0x%" PRIx64 " vgId:%d subkey %s not found", consumerId, vgId, req.subKey);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  // 2. check re-balance status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != consumerId) {
    tqDebug("ERROR tmq poll: consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            consumerId, vgId, req.subKey, pHandle->consumerId);
    terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    taosRUnLockLatch(&pTq->lock);
    return -1;
  }
  taosRUnLockLatch(&pTq->lock);

  // 3. update the epoch value
  taosWLockLatch(&pTq->lock);
  int32_t savedEpoch = pHandle->epoch;
  if (savedEpoch < reqEpoch) {
    tqDebug("tmq poll: consumer:0x%" PRIx64 " epoch update from %d to %d by poll req", consumerId, savedEpoch,
            reqEpoch);
    pHandle->epoch = reqEpoch;
  }
  taosWUnLockLatch(&pTq->lock);

  // Zero-initialized like the offset buffers in tqSendDataRsp()/tqPushDataRsp(), so the
  // "%s" below always sees a terminated string even if the formatter writes nothing.
  char buf[80] = {0};
  tFormatOffset(buf, sizeof(buf), &reqOffset);
  tqDebug("tmq poll: consumer:0x%" PRIx64 " (epoch %d), subkey %s, recv poll req vgId:%d, req:%s, reqId:0x%" PRIx64,
          consumerId, req.epoch, pHandle->subKey, vgId, buf, req.reqId);

  return tqExtractDataForMq(pTq, pHandle, &req, pMsg);
}

380
// Process a "delete subscription" request: msg is interpreted directly as an SMqVDeleteReq.
//
// Removes the handle for the subscription key (closing its WAL reference first, if it has
// one), then deletes the offset from the offset store and the handle from the tq meta store.
// Failures of the individual steps are only logged; the function always returns 0.
// sversion and msgLen are not used here.
int32_t tqProcessDeleteSubReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SMqVDeleteReq* pReq = (SMqVDeleteReq*)msg;

  tqDebug("vgId:%d, tq process delete sub req %s", pTq->pVnode->config.vgId, pReq->subKey);

  STqHandle* pHandle = taosHashGet(pTq->pHandle, pReq->subKey, strlen(pReq->subKey));
  if (pHandle != NULL) {
    if (pHandle->pRef != NULL) {
      walCloseRef(pTq->pVnode->pWal, pHandle->pRef->refId);
    }

    if (taosHashRemove(pTq->pHandle, pReq->subKey, strlen(pReq->subKey)) != 0) {
      tqError("cannot process tq delete req %s, since no such handle", pReq->subKey);
    }
  }

  if (tqOffsetDelete(pTq->pOffsetStore, pReq->subKey) != 0) {
    tqError("cannot process tq delete req %s, since no such offset in cache", pReq->subKey);
  }

  if (tqMetaDeleteHandle(pTq, pReq->subKey) < 0) {
    tqError("cannot process tq delete req %s, since no such offset in tdb", pReq->subKey);
  }

  return 0;
}

415
// Process an "add check info" request.
//
// msg/msgLen hold an encoded STqCheckInfo. The decoded info is stored in pTq->pCheckInfo
// keyed by its topic name, and the raw message is persisted through tqMetaSaveCheckInfo().
//
// Returns 0 on success; on any failure returns -1 with terrno set to
// TSDB_CODE_OUT_OF_MEMORY. sversion is not used here.
int32_t tqProcessAddCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  STqCheckInfo info = {0};
  SDecoder     decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  if (tDecodeSTqCheckInfo(&decoder, &info) < 0) {
    // release the decoder on the failure path as well
    tDecoderClear(&decoder);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  tDecoderClear(&decoder);

  if (taosHashPut(pTq->pCheckInfo, info.topic, strlen(info.topic), &info, sizeof(STqCheckInfo)) < 0) {
    // The table did not take the entry, so its registered destructor will never run for it;
    // release the decoded content here with the same function.
    tDeleteSTqCheckInfo(&info);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  // from here on the hash table entry holds what was decoded into info
  if (tqMetaSaveCheckInfo(pTq, info.topic, msg, msgLen) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  return 0;
}

435
// Process a "delete check info" request: msg is used as the NUL-terminated key.
// The entry is removed from pTq->pCheckInfo first and then from the tq meta store; the
// second step is skipped when the first one fails.
// Returns 0 on success, -1 with terrno = TSDB_CODE_OUT_OF_MEMORY if either step fails.
// sversion and msgLen are not used here.
int32_t tqProcessDelCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  if (taosHashRemove(pTq->pCheckInfo, msg, strlen(msg)) < 0 || tqMetaDeleteCheckInfo(pTq, msg) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  return 0;
}

447
// Process a re-balance (subscribe) request for one subscription key.
//
// Three cases, depending on the handle currently stored for req.subKey:
//   * handle exists, same consumer    - reset the epoch and persist the handle;
//   * handle exists, another consumer - kill the running task, switch the handle over to the
//                                       new consumer under pTq->lock and persist it;
//   * no handle yet                   - build a new handle (WAL ref, readers, exec task
//                                       according to the subscription type), store it in
//                                       pTq->pHandle and persist it.
//
// req.qmsg is either handed over to the new handle (column subscription) or freed before
// returning. Returns 0 on success (also for an invalid request with newConsumerId == -1),
// -1 if the WAL reference cannot be obtained or persisting the handle fails; in the
// "same consumer" case the result of tqMetaSaveHandle() is returned directly.
// sversion and msgLen are not used here.
int32_t tqProcessSubscribeReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SMqRebVgReq req = {0};
  tDecodeSMqRebVgReq(msg, &req);

  SVnode* pVnode = pTq->pVnode;
  int32_t vgId = TD_VID(pVnode);

  tqDebug("vgId:%d, tq process sub req:%s, Id:0x%" PRIx64 " -> Id:0x%" PRIx64, pVnode->config.vgId, req.subKey,
          req.oldConsumerId, req.newConsumerId);

  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));

  if (pHandle != NULL) {
    // ---- existing handle, consumer unchanged ----
    if (pHandle->consumerId == req.newConsumerId) {  // do nothing
      tqInfo("vgId:%d consumer:0x%" PRIx64 " remains, no switch occurs", req.vgId, req.newConsumerId);
      atomic_store_32(&pHandle->epoch, -1);
      atomic_add_fetch_32(&pHandle->epoch, 1);
      taosMemoryFree(req.qmsg);
      return tqMetaSaveHandle(pTq, req.subKey, pHandle);
    }

    // ---- existing handle, switch to another consumer ----
    tqInfo("vgId:%d switch consumer from Id:0x%" PRIx64 " to Id:0x%" PRIx64, req.vgId, pHandle->consumerId,
           req.newConsumerId);

    // kill executing task
    qTaskInfo_t pTaskInfo = pHandle->execHandle.task;
    if (pTaskInfo != NULL) {
      qKillTask(pTaskInfo, TSDB_CODE_SUCCESS);
    }

    taosWLockLatch(&pTq->lock);
    atomic_store_32(&pHandle->epoch, 0);

    // remove if it has been register in the push manager, and return one empty block to consumer
    tqUnregisterPushHandle(pTq, pHandle);

    atomic_store_64(&pHandle->consumerId, req.newConsumerId);

    if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
      qStreamCloseTsdbReader(pTaskInfo);
    }
    taosWUnLockLatch(&pTq->lock);

    int32_t ret = (tqMetaSaveHandle(pTq, req.subKey, pHandle) < 0) ? -1 : 0;
    taosMemoryFree(req.qmsg);
    return ret;
  }

  // ---- no handle yet: build a new one ----
  if (req.oldConsumerId != -1) {
    tqError("vgId:%d, build new consumer handle %s for consumer:0x%" PRIx64 ", but old consumerId:0x%" PRIx64,
            req.vgId, req.subKey, req.newConsumerId, req.oldConsumerId);
  }

  if (req.newConsumerId == -1) {
    tqError("vgId:%d, tq invalid re-balance request, new consumerId %" PRId64 "", req.vgId, req.newConsumerId);
    taosMemoryFree(req.qmsg);
    return 0;
  }

  // the handle is assembled on the stack and copied into the hash table below
  STqHandle newHandle = {0};
  pHandle = &newHandle;

  // read from the freshly zeroed handle, i.e. before the new consumer id is assigned
  uint64_t oldConsumerId = pHandle->consumerId;

  memcpy(pHandle->subKey, req.subKey, TSDB_SUBSCRIBE_KEY_LEN);
  pHandle->consumerId = req.newConsumerId;
  pHandle->epoch = -1;
  pHandle->execHandle.subType = req.subType;
  pHandle->fetchMeta = req.withMeta;

  // TODO version should be assigned and refed during preprocess
  SWalRef* pRef = walRefCommittedVer(pVnode->pWal);
  if (pRef == NULL) {
    taosMemoryFree(req.qmsg);
    return -1;
  }

  int64_t ver = pRef->refVer;
  pHandle->pRef = pRef;
  pHandle->snapshotVer = ver;

  SReadHandle handle = {
      .meta = pVnode->pMeta, .vnode = pVnode, .initTableReader = true, .initTqReader = true, .version = ver};

  switch (pHandle->execHandle.subType) {
    case TOPIC_SUB_TYPE__COLUMN: {
      // the handle takes over the query message; clear req.qmsg so it is not freed below
      pHandle->execHandle.execCol.qmsg = req.qmsg;
      req.qmsg = NULL;

      pHandle->execHandle.task = qCreateQueueExecTaskInfo(pHandle->execHandle.execCol.qmsg, &handle, vgId,
                                                          &pHandle->execHandle.numOfCols, req.newConsumerId);
      void* scanner = NULL;
      qExtractStreamScanner(pHandle->execHandle.task, &scanner);
      pHandle->execHandle.pTqReader = qExtractReaderFromStreamScanner(scanner);
      break;
    }
    case TOPIC_SUB_TYPE__DB: {
      pHandle->pWalReader = walOpenReader(pVnode->pWal, NULL);
      pHandle->execHandle.pTqReader = tqReaderOpen(pVnode);

      pHandle->execHandle.execDb.pFilterOutTbUid =
          taosHashInit(64, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_NO_LOCK);
      buildSnapContext(handle.meta, handle.version, 0, pHandle->execHandle.subType, pHandle->fetchMeta,
                       (SSnapContext**)(&handle.sContext));

      pHandle->execHandle.task = qCreateQueueExecTaskInfo(NULL, &handle, vgId, NULL, req.newConsumerId);
      break;
    }
    case TOPIC_SUB_TYPE__TABLE: {
      pHandle->pWalReader = walOpenReader(pVnode->pWal, NULL);
      pHandle->execHandle.execTb.suid = req.suid;

      // collect the child tables of the super table; the list is only needed to seed the reader
      SArray* childUids = taosArrayInit(0, sizeof(int64_t));
      vnodeGetCtbIdList(pVnode, req.suid, childUids);
      tqDebug("vgId:%d, tq try to get all ctb, suid:%" PRId64, pVnode->config.vgId, req.suid);

      int32_t numOfUids = (int32_t)taosArrayGetSize(childUids);
      for (int32_t i = 0; i < numOfUids; i++) {
        int64_t tbUid = *(int64_t*)taosArrayGet(childUids, i);
        tqDebug("vgId:%d, idx %d, uid:%" PRId64, vgId, i, tbUid);
      }

      pHandle->execHandle.pTqReader = tqReaderOpen(pVnode);
      tqReaderSetTbUidList(pHandle->execHandle.pTqReader, childUids);
      taosArrayDestroy(childUids);

      buildSnapContext(handle.meta, handle.version, req.suid, pHandle->execHandle.subType, pHandle->fetchMeta,
                       (SSnapContext**)(&handle.sContext));
      pHandle->execHandle.task = qCreateQueueExecTaskInfo(NULL, &handle, vgId, NULL, req.newConsumerId);
      break;
    }
    default:
      break;
  }

  taosHashPut(pTq->pHandle, req.subKey, strlen(req.subKey), pHandle, sizeof(STqHandle));
  tqDebug("try to persist handle %s consumer:0x%" PRIx64 " , old consumer:0x%" PRIx64, req.subKey,
          pHandle->consumerId, oldConsumerId);

  int32_t ret = (tqMetaSaveHandle(pTq, req.subKey, pHandle) < 0) ? -1 : 0;
  taosMemoryFree(req.qmsg);
  return ret;
}
581

582
// Fill in the runtime part of a stream task: id string, input/output queues, status fields,
// state backend and executor (source and agg levels), sink callbacks (SMA / table output),
// WAL reader (source level) and trigger.
//
// ver is stored as both the checkpoint version and the current version; after logging,
// chkInfo.version is advanced by one.
//
// Returns 0 on success, -1 if a queue, the state backend, the executor or the sink table
// schema cannot be created. Nothing created so far is released here on failure.
int32_t tqExpandTask(STQ* pTq, SStreamTask* pTask, int64_t ver) {
  int32_t vgId = TD_VID(pTq->pVnode);

  pTask->id.idStr = createStreamTaskIdStr(pTask->id.streamId, pTask->id.taskId);
  pTask->refCnt = 1;
  pTask->status.schedStatus = TASK_SCHED_STATUS__INACTIVE;

  pTask->inputQueue = streamQueueOpen(512 << 10);
  pTask->outputQueue = streamQueueOpen(512 << 10);
  if (pTask->inputQueue == NULL || pTask->outputQueue == NULL) {
    return -1;
  }

  pTask->inputStatus = TASK_INPUT_STATUS__NORMAL;
  pTask->outputStatus = TASK_OUTPUT_STATUS__NORMAL;
  pTask->pMsgCb = &pTq->pVnode->msgCb;
  pTask->pMeta = pTq->pStreamMeta;
  pTask->chkInfo.version = ver;
  pTask->chkInfo.currentVer = ver;

  // tasks that must fill history start out waiting for their downstream tasks
  if (pTask->fillHistory) {
    pTask->status.taskStatus = TASK_STATUS__WAIT_DOWNSTREAM;
  } else {
    pTask->status.taskStatus = TASK_STATUS__NORMAL;
  }

  // expand executor
  switch (pTask->taskLevel) {
    case TASK_LEVEL__SOURCE: {
      pTask->pState = streamStateOpen(pTq->pStreamMeta->path, pTask, false, -1, -1);
      if (pTask->pState == NULL) {
        return -1;
      }

      SReadHandle handle = {
          .meta = pTq->pVnode->pMeta, .vnode = pTq->pVnode, .initTqReader = 1, .pStateBackend = pTask->pState};

      pTask->exec.pExecutor = qCreateStreamExecTaskInfo(pTask->exec.qmsg, &handle, vgId);
      if (pTask->exec.pExecutor == NULL) {
        return -1;
      }
      break;
    }
    case TASK_LEVEL__AGG: {
      pTask->pState = streamStateOpen(pTq->pStreamMeta->path, pTask, false, -1, -1);
      if (pTask->pState == NULL) {
        return -1;
      }

      int32_t     numOfVgroups = (int32_t)taosArrayGetSize(pTask->childEpInfo);
      SReadHandle mgHandle = {.vnode = NULL, .numOfVgroups = numOfVgroups, .pStateBackend = pTask->pState};

      pTask->exec.pExecutor = qCreateStreamExecTaskInfo(pTask->exec.qmsg, &mgHandle, vgId);
      if (pTask->exec.pExecutor == NULL) {
        return -1;
      }
      break;
    }
    default:
      break;
  }

  // sink
  switch (pTask->outputType) {
    case TASK_OUTPUT__SMA:
      pTask->smaSink.vnode = pTq->pVnode;
      pTask->smaSink.smaSink = smaHandleRes;
      break;
    case TASK_OUTPUT__TABLE: {
      pTask->tbSink.vnode = pTq->pVnode;
      pTask->tbSink.tbSinkFunc = tqSinkToTablePipeline2;

      // use the schema version reported by the meta store for the sink table, or 1 when the
      // lookup does not succeed
      SMetaInfo info = {0};
      int32_t   schemaVer = 1;
      if (metaGetInfo(pTq->pVnode->pMeta, pTask->tbSink.stbUid, &info, NULL) == TSDB_CODE_SUCCESS) {
        schemaVer = info.skmVer;
      }

      SSchemaWrapper* pWrapper = pTask->tbSink.pSchemaWrapper;
      pTask->tbSink.pTSchema = tBuildTSchema(pWrapper->pSchema, pWrapper->nCols, schemaVer);
      if (pTask->tbSink.pTSchema == NULL) {
        return -1;
      }
      break;
    }
    default:
      break;
  }

  if (pTask->taskLevel == TASK_LEVEL__SOURCE) {
    pTask->exec.pWalReader = walOpenReader(pTq->pVnode->pWal, NULL);
  }

  streamSetupTrigger(pTask);

  tqInfo("vgId:%d expand stream task, s-task:%s, checkpoint ver:%" PRId64 " child id:%d, level:%d", vgId, pTask->id.idStr,
         pTask->chkInfo.version, pTask->selfChildId, pTask->taskLevel);

  // next valid version will add one
  pTask->chkInfo.version += 1;
  return 0;
}
L
Liu Jicong 已提交
669

670 671 672 673 674 675
// Answer a stream task check request sent by an upstream task.
//
// The request body follows an SMsgHead in pMsg->pCont. The response echoes the ids of the
// request and carries the status reported by streamTaskCheckStatus() for the downstream
// task, or 0 when that task is not present in the stream meta.
//
// Returns 0 once the response has been handed to tmsgSendRsp(); -1 if the request cannot be
// decoded, the response cannot be encoded, or the response buffer cannot be allocated
// (terrno = TSDB_CODE_OUT_OF_MEMORY in the last case).
int32_t tqProcessStreamTaskCheckReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  SStreamTaskCheckReq req = {0};
  SDecoder            decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  if (tDecodeSStreamTaskCheckReq(&decoder, &req) < 0) {
    // do not build a response out of a partially decoded request
    tDecoderClear(&decoder);
    tqError("unable to decode task check req %d", __LINE__);
    return -1;
  }
  tDecoderClear(&decoder);

  int32_t             taskId = req.downstreamTaskId;
  SStreamTaskCheckRsp rsp = {
      .reqId = req.reqId,
      .streamId = req.streamId,
      .childId = req.childId,
      .downstreamNodeId = req.downstreamNodeId,
      .downstreamTaskId = req.downstreamTaskId,
      .upstreamNodeId = req.upstreamNodeId,
      .upstreamTaskId = req.upstreamTaskId,
  };

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);

  if (pTask) {
    rsp.status = streamTaskCheckStatus(pTask);

    // log while the task is still acquired; pTask must not be touched after the release
    tqDebug("tq recv task check req(reqId:0x%" PRIx64
            ") %d at node %d task status:%d, check req from task %d at node %d, rsp status %d",
            rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, pTask->status.taskStatus, rsp.upstreamTaskId,
            rsp.upstreamNodeId, rsp.status);

    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  } else {
    rsp.status = 0;
    tqDebug("tq recv task check(taskId:%d not built yet) req(reqId:0x%" PRIx64
            ") %d at node %d, check req from task %d at node %d, rsp status %d",
            taskId, rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, rsp.upstreamTaskId, rsp.upstreamNodeId,
            rsp.status);
  }

  SEncoder encoder;
  int32_t  code;
  int32_t  len;
  tEncodeSize(tEncodeSStreamTaskCheckRsp, &rsp, len, code);
  if (code < 0) {
    tqError("unable to encode rsp %d", __LINE__);
    return -1;
  }

  void* buf = rpcMallocCont(sizeof(SMsgHead) + len);
  if (buf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  ((SMsgHead*)buf)->vgId = htonl(req.upstreamNodeId);

  void* abuf = POINTER_SHIFT(buf, sizeof(SMsgHead));
  tEncoderInit(&encoder, (uint8_t*)abuf, len);
  tEncodeSStreamTaskCheckRsp(&encoder, &rsp);
  tEncoderClear(&encoder);

  SRpcMsg rspMsg = {.code = 0, .pCont = buf, .contLen = sizeof(SMsgHead) + len, .info = pMsg->info};
  tmsgSendRsp(&rspMsg);
  return 0;
}

730
// Process the response to a stream task check request.
// Decodes the response, looks up the upstream task it is addressed to and forwards it to
// streamProcessTaskCheckRsp() together with sversion.
// Returns that function's result, or -1 if decoding fails or the task is not found.
int32_t tqProcessStreamTaskCheckRsp(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SStreamTaskCheckRsp rsp;
  SDecoder            decoder;

  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t code = tDecodeSStreamTaskCheckRsp(&decoder, &rsp);
  // the decoder is released on both the success and the failure path
  tDecoderClear(&decoder);
  if (code < 0) {
    return -1;
  }

  tqDebug("tq recv task check rsp(reqId:0x%" PRIx64 ") %d at node %d check req from task %d at node %d, status %d",
          rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, rsp.upstreamTaskId, rsp.upstreamNodeId, rsp.status);

  SStreamTask* pUpstream = streamMetaAcquireTask(pTq->pStreamMeta, rsp.upstreamTaskId);
  if (!pUpstream) {
    return -1;
  }

  code = streamProcessTaskCheckRsp(pUpstream, &rsp, sversion);
  streamMetaReleaseTask(pTq->pStreamMeta, pUpstream);
  return code;
}

756
// Deploy a stream task described by an encoded message.
//
// Does nothing (returns 0) when tsDisableStream is set. Otherwise the task is decoded into a
// newly allocated SStreamTask, registered in the stream meta under its write latch with
// sversion as the version, and, for fill-history tasks, the downstream check is started.
//
// Returns 0 on success, -1 if the allocation, the decoding or the registration fails.
int32_t tqProcessTaskDeployReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  if (tsDisableStream) {
    return 0;
  }

  // 1.deserialize msg and build task
  SStreamTask* pTask = taosMemoryCalloc(1, sizeof(SStreamTask));
  if (!pTask) {
    return -1;
  }

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t code = tDecodeStreamTask(&decoder, pTask);
  tDecoderClear(&decoder);
  if (code < 0) {
    taosMemoryFree(pTask);
    return -1;
  }

  // 2.save task, use the newest commit version as the initial start version of stream task.
  taosWLockLatch(&pTq->pStreamMeta->lock);
  code = streamMetaAddDeployedTask(pTq->pStreamMeta, sversion, pTask);
  if (code < 0) {
    // NOTE(review): pTask is still read here after the failed add; confirm the callee
    // leaves it valid on failure.
    tqError("vgId:%d failed to add s-task:%s, total:%d", TD_VID(pTq->pVnode), pTask->id.idStr,
            streamMetaGetNumOfTasks(pTq->pStreamMeta));
    taosWUnLockLatch(&pTq->pStreamMeta->lock);
    return -1;
  }
  taosWUnLockLatch(&pTq->pStreamMeta->lock);

  // 3.go through recover steps to fill history
  if (pTask->fillHistory) {
    streamTaskCheckDownstream(pTask, sversion);
  }

  tqDebug("vgId:%d s-task:%s is deployed and add meta from mnd, status:%d, total:%d", TD_VID(pTq->pVnode),
          pTask->id.idStr, pTask->status.taskStatus, streamMetaGetNumOfTasks(pTq->pStreamMeta));
  return 0;
}

L
Liu Jicong 已提交
805 806 807 808 809
int32_t tqProcessTaskRecover1Req(STQ* pTq, SRpcMsg* pMsg) {
  int32_t code;
  char*   msg = pMsg->pCont;
  int32_t msgLen = pMsg->contLen;

810
  SStreamRecoverStep1Req* pReq = (SStreamRecoverStep1Req*)msg;
L
Liu Jicong 已提交
811
  SStreamTask*            pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
812 813 814 815 816
  if (pTask == NULL) {
    return -1;
  }

  // check param
817
  int64_t fillVer1 = pTask->chkInfo.version;
818
  if (fillVer1 <= 0) {
L
Liu Jicong 已提交
819
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
820 821 822 823
    return -1;
  }

  // do recovery step 1
H
Haojun Liao 已提交
824
  tqDebug("s-task:%s start non-blocking recover stage(step 1) scan", pTask->id.idStr);
H
Haojun Liao 已提交
825
  int64_t st = taosGetTimestampMs();
826

H
Haojun Liao 已提交
827
  streamSourceRecoverScanStep1(pTask);
828
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
H
Haojun Liao 已提交
829 830
    tqDebug("s-task:%s is dropped, abort recover in step1", pTask->id.idStr);

L
Liu Jicong 已提交
831 832 833 834
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    return 0;
  }

H
Haojun Liao 已提交
835
  double el = (taosGetTimestampMs() - st) / 1000.0;
H
Haojun Liao 已提交
836
  tqDebug("s-task:%s non-blocking recover stage(step 1) ended, elapsed time:%.2fs", pTask->id.idStr, el);
H
Haojun Liao 已提交
837

838 839 840 841
  // build msg to launch next step
  SStreamRecoverStep2Req req;
  code = streamBuildSourceRecover2Req(pTask, &req);
  if (code < 0) {
L
Liu Jicong 已提交
842
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
843 844 845
    return -1;
  }

L
Liu Jicong 已提交
846
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
847
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
L
Liu Jicong 已提交
848 849 850
    return 0;
  }

851
  // serialize msg
L
Liu Jicong 已提交
852 853 854 855
  int32_t len = sizeof(SStreamRecoverStep1Req);

  void* serializedReq = rpcMallocCont(len);
  if (serializedReq == NULL) {
H
Haojun Liao 已提交
856
    tqError("s-task:%s failed to prepare the step2 stage, out of memory", pTask->id.idStr);
L
Liu Jicong 已提交
857 858 859 860
    return -1;
  }

  memcpy(serializedReq, &req, len);
861 862

  // dispatch msg
H
Haojun Liao 已提交
863
  tqDebug("s-task:%s step 1 finished, send msg to start blocking recover stage(step 2)", pTask->id.idStr);
864

H
Haojun Liao 已提交
865 866
  SRpcMsg rpcMsg = {
      .code = 0, .contLen = len, .msgType = TDMT_VND_STREAM_RECOVER_BLOCKING_STAGE, .pCont = serializedReq};
867 868 869 870
  tmsgPutToQueue(&pTq->pVnode->msgCb, WRITE_QUEUE, &rpcMsg);
  return 0;
}

871
int32_t tqProcessTaskRecover2Req(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
H
Haojun Liao 已提交
872 873
  int32_t code = 0;

874
  SStreamRecoverStep2Req* pReq = (SStreamRecoverStep2Req*)msg;
H
Haojun Liao 已提交
875 876

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
877 878 879 880 881
  if (pTask == NULL) {
    return -1;
  }

  // do recovery step 2
H
Haojun Liao 已提交
882 883 884
  int64_t st = taosGetTimestampMs();
  tqDebug("s-task:%s start step2 recover, ts:%"PRId64, pTask->id.idStr, st);

885
  code = streamSourceRecoverScanStep2(pTask, sversion);
886
  if (code < 0) {
L
Liu Jicong 已提交
887
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
888 889 890
    return -1;
  }

891
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
L
Liu Jicong 已提交
892 893 894 895
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    return 0;
  }

896 897 898
  // restore param
  code = streamRestoreParam(pTask);
  if (code < 0) {
L
Liu Jicong 已提交
899
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
900 901 902 903
    return -1;
  }

  // set status normal
H
Haojun Liao 已提交
904
  tqDebug("s-task:%s blocking stage completed, set the status to be normal", pTask->id.idStr);
905 906
  code = streamSetStatusNormal(pTask);
  if (code < 0) {
L
Liu Jicong 已提交
907
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
908 909 910
    return -1;
  }

H
Haojun Liao 已提交
911
  double el = (taosGetTimestampMs() - st)/ 1000.0;
H
Haojun Liao 已提交
912
  tqDebug("s-task:%s step2 recover finished, el:%.2fs", pTask->id.idStr, el);
H
Haojun Liao 已提交
913

914 915 916
  // dispatch recover finish req to all related downstream task
  code = streamDispatchRecoverFinishReq(pTask);
  if (code < 0) {
L
Liu Jicong 已提交
917
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
918 919 920
    return -1;
  }

L
Liu Jicong 已提交
921 922 923
  atomic_store_8(&pTask->fillHistory, 0);
  streamMetaSaveTask(pTq->pStreamMeta, pTask);

L
Liu Jicong 已提交
924
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
925 926 927
  return 0;
}

L
Liu Jicong 已提交
928 929 930
// Process a "recover finished" notification sent to one of this vnode's tasks.
//
// The payload follows an SMsgHead inside pMsg->pCont and is decoded as an SStreamRecoverFinishReq.
//
// Returns 0 on success; -1 when the payload cannot be decoded, the task cannot be acquired, or
// streamProcessRecoverFinishReq() fails.
int32_t tqProcessTaskRecoverFinishReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msg = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  // deserialize; zero-init so a partially decoded request never exposes stack garbage
  SStreamRecoverFinishReq req = {0};

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decodeRet = tDecodeSStreamRecoverFinishReq(&decoder, &req);
  tDecoderClear(&decoder);
  if (decodeRet < 0) {
    // do not look up a task from a request that failed to decode
    return -1;
  }

  // find task
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.taskId);
  if (pTask == NULL) {
    return -1;
  }

  // do process request
  int32_t code = (streamProcessRecoverFinishReq(pTask, req.childId) < 0) ? -1 : 0;

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return code;
}
L
Liu Jicong 已提交
954

L
Liu Jicong 已提交
955 956 957 958 959
// Placeholder handler for the recover-finish response: nothing is done with the message yet.
// Always returns 0.
int32_t tqProcessTaskRecoverFinishRsp(STQ* pTq, SRpcMsg* pMsg) {
  (void)pTq;
  (void)pMsg;
  return 0;
}

L
Liu Jicong 已提交
960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975
// Turn a delete result into a STREAM_DELETE_DATA block and push it to every source-level stream task.
//
// pReq/len hold an encoded SDeleteRes; ver is stored as the block version. One row is produced per
// uid in the delete result (start key, end key, uid; the group id and calculate-range columns are
// set to NULL). The block is shared between tasks through a heap-allocated reference counter: this
// function holds one reference, each queued item adds one, and this function destroys the block
// itself only if its own reference is the last one.
//
// Returns 0 normally (including when there is nothing to delete); -1 with terrno set to
// TSDB_CODE_OUT_OF_MEMORY when the block or its reference counter cannot be allocated.
int32_t tqProcessDelReq(STQ* pTq, void* pReq, int32_t len, int64_t ver) {
  bool        failed = false;
  SDecoder*   pCoder = &(SDecoder){0};
  SDeleteRes* pRes = &(SDeleteRes){0};

  pRes->uidList = taosArrayInit(0, sizeof(tb_uid_t));
  if (pRes->uidList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    failed = true;
  }

  tDecoderInit(pCoder, pReq, len);
  tDecodeDeleteRes(pCoder, pRes);
  tDecoderClear(pCoder);

  int32_t sz = taosArrayGetSize(pRes->uidList);
  if (sz == 0 || pRes->affectedRows == 0) {
    taosArrayDestroy(pRes->uidList);
    return 0;
  }

  SSDataBlock* pDelBlock = createSpecialDataBlock(STREAM_DELETE_DATA);
  if (pDelBlock == NULL) {
    taosArrayDestroy(pRes->uidList);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  blockDataEnsureCapacity(pDelBlock, sz);
  pDelBlock->info.rows = sz;
  pDelBlock->info.version = ver;

  // The column descriptors do not change while rows are filled in, so look them up once.
  SColumnInfoData* pStartCol = taosArrayGet(pDelBlock->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pEndCol = taosArrayGet(pDelBlock->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pUidCol = taosArrayGet(pDelBlock->pDataBlock, UID_COLUMN_INDEX);
  SColumnInfoData* pGroupCol = taosArrayGet(pDelBlock->pDataBlock, GROUPID_COLUMN_INDEX);
  SColumnInfoData* pCalcStartCol = taosArrayGet(pDelBlock->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX);
  SColumnInfoData* pCalcEndCol = taosArrayGet(pDelBlock->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX);

  for (int32_t i = 0; i < sz; i++) {
    // start key column
    colDataSetVal(pStartCol, i, (const char*)&pRes->skey, false);
    // end key column
    colDataSetVal(pEndCol, i, (const char*)&pRes->ekey, false);
    // uid column
    int64_t* pUid = taosArrayGet(pRes->uidList, i);
    colDataSetVal(pUidCol, i, (const char*)pUid, false);

    colDataSetNULL(pGroupCol, i);
    colDataSetNULL(pCalcStartCol, i);
    colDataSetNULL(pCalcEndCol, i);
  }

  taosArrayDestroy(pRes->uidList);

  // reference counter shared by all queued items; starts at 1 for this function's own reference
  int32_t* pRef = taosMemoryMalloc(sizeof(int32_t));
  if (pRef == NULL) {
    blockDataDestroy(pDelBlock);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  *pRef = 1;

  taosWLockLatch(&pTq->pStreamMeta->lock);

  void* pIter = NULL;
  while (1) {
    pIter = taosHashIterate(pTq->pStreamMeta->pTasks, pIter);
    if (pIter == NULL) {
      break;
    }

    SStreamTask* pTask = *(SStreamTask**)pIter;
    if (pTask->taskLevel != TASK_LEVEL__SOURCE) {
      continue;
    }

    qDebug("s-task:%s delete req enqueue, ver: %" PRId64, pTask->id.idStr, ver);

    if (failed) {
      streamTaskInputFail(pTask);
      continue;
    }

    SStreamRefDataBlock* pRefBlock = taosAllocateQitem(sizeof(SStreamRefDataBlock), DEF_QITEM, 0);
    if (pRefBlock == NULL) {
      // treat an allocation failure like any other failed input instead of dereferencing NULL
      streamTaskInputFail(pTask);
      continue;
    }

    pRefBlock->type = STREAM_INPUT__REF_DATA_BLOCK;
    pRefBlock->pBlock = pDelBlock;
    pRefBlock->dataRef = pRef;
    atomic_add_fetch_32(pRefBlock->dataRef, 1);

    if (tAppendDataToInputQueue(pTask, (SStreamQueueItem*)pRefBlock) < 0) {
      // the item never reached the queue: give back its reference and free it here
      atomic_sub_fetch_32(pRef, 1);
      taosFreeQitem(pRefBlock);
      continue;
    }

    if (streamSchedExec(pTask) < 0) {
      qError("s-task:%s stream task launch failed", pTask->id.idStr);
      continue;
    }
  }

  taosWUnLockLatch(&pTq->pStreamMeta->lock);

  // drop this function's own reference; destroy the block only if nobody else still holds it
  int32_t ref = atomic_sub_fetch_32(pRef, 1);
  if (ref == 0) {
    blockDataDestroy(pDelBlock);
    taosMemoryFree(pRef);
  }

  return 0;
}

1081 1082 1083 1084
// Re-issue every pending consume request parked in pTq->pPushMgr.
//
// Under the tq write latch, each handle's saved message is re-posted to the query queue as a
// TDMT_VND_TMQ_CONSUME message, the saved SRpcMsg wrapper is freed, and finally the push manager is
// cleared. Iteration stops early if a handle has no saved message. Always returns 0.
//
// NOTE(review): the early break leaves the hash iterator without an explicit cancel - confirm that
// taosHashIterate() does not require one before taosHashClear().
int32_t tqProcessSubmitReqForSubscribe(STQ* pTq) {
  int32_t vgId = TD_VID(pTq->pVnode);

  taosWLockLatch(&pTq->lock);

  if (taosHashGetSize(pTq->pPushMgr) <= 0) {
    taosWUnLockLatch(&pTq->lock);
    return 0;
  }

  for (void* pIter = taosHashIterate(pTq->pPushMgr, NULL); pIter != NULL;
       pIter = taosHashIterate(pTq->pPushMgr, pIter)) {
    STqHandle* pHandle = *(STqHandle**)pIter;
    tqDebug("vgId:%d start set submit for pHandle:%p, consume id:0x%" PRIx64, vgId, pHandle, pHandle->consumerId);

    if (ASSERT(pHandle->msg != NULL)) {
      tqError("pHandle->msg should not be null");
      break;
    }

    SRpcMsg consumeMsg = {.msgType = TDMT_VND_TMQ_CONSUME,
                          .pCont = pHandle->msg->pCont,
                          .contLen = pHandle->msg->contLen,
                          .info = pHandle->msg->info};
    tmsgPutToQueue(&pTq->pVnode->msgCb, QUERY_QUEUE, &consumeMsg);

    // only the wrapper is freed here; the payload pointer was handed to the queue above
    taosMemoryFree(pHandle->msg);
    pHandle->msg = NULL;
  }

  taosHashClear(pTq->pPushMgr);

  // unlock
  taosWUnLockLatch(&pTq->lock);
  return 0;
}

L
Liu Jicong 已提交
1109
// Notify the stream subsystem that new data has been submitted.
//
// The submitted payload itself is not consumed here: the function only calls tqStartStreamTasks().
// `submit` is kept in the signature for the existing callers. Always returns 0; the result of
// tqStartStreamTasks() is not propagated.
//
// The former per-task enqueue logic that was compiled out with `#if 0` has been removed.
int32_t tqProcessSubmitReq(STQ* pTq, SPackedData submit) {
  tqStartStreamTasks(pTq);
  return 0;
}

L
Liu Jicong 已提交
1173 1174
// Handle a "run task" request.
//
// A request whose taskId equals WAL_READ_TASKS_ID triggers tqStreamTasksScanWal() and nothing else.
// Otherwise the named task is acquired and, if its status is TASK_STATUS__NORMAL, run through
// streamProcessRunReq(); afterwards tqStartStreamTasks() is called.
//
// Returns 0 on those paths, -1 when the task cannot be acquired.
int32_t tqProcessTaskRunReq(STQ* pTq, SRpcMsg* pMsg) {
  SStreamTaskRunReq* pReq = pMsg->pCont;

  int32_t taskId = pReq->taskId;
  int32_t vgId = TD_VID(pTq->pVnode);

  // all tasks are extracted submit data from the wal
  if (taskId == WAL_READ_TASKS_ID) {
    tqStreamTasksScanWal(pTq);
    return 0;
  }

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
  if (pTask == NULL) {
    tqError("vgId:%d failed to found s-task, taskId:%d", vgId, taskId);
    return -1;
  }

  if (pTask->status.taskStatus != TASK_STATUS__NORMAL) {
    tqDebug("vgId:%d s-task:%s ignore run req since not in ready state", vgId, pTask->id.idStr);
  } else {
    tqDebug("vgId:%d s-task:%s start to process block from wal, last chk point:%" PRId64, vgId,
            pTask->id.idStr, pTask->chkInfo.version);
    streamProcessRunReq(pTask);
  }

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  tqStartStreamTasks(pTq);
  return 0;
}

L
Liu Jicong 已提交
1203
// Process a dispatch request sent by an upstream task.
//
// The payload follows an SMsgHead inside pMsg->pCont and is decoded as an SStreamDispatchReq. If the
// destination task exists, the request is passed to streamProcessDispatchReq() together with a
// response skeleton built from pMsg->info; `exec` is forwarded unchanged.
//
// Returns 0 when the request was handed to the task; -1 when the payload cannot be decoded or the
// task cannot be acquired (in the latter case the decoded request is released with
// tDeleteStreamDispatchReq()).
int32_t tqProcessTaskDispatchReq(STQ* pTq, SRpcMsg* pMsg, bool exec) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  SStreamDispatchReq req = {0};
  SDecoder           decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  int32_t decodeRet = tDecodeStreamDispatchReq(&decoder, &req);
  // clear the decoder right after decoding, as vnodeEnqueueStreamMsg() does for the same message
  tDecoderClear(&decoder);
  if (decodeRet < 0) {
    return -1;
  }

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.taskId);
  if (pTask == NULL) {
    tDeleteStreamDispatchReq(&req);
    return -1;
  }

  SRpcMsg rsp = {.info = pMsg->info, .code = 0};
  streamProcessDispatchReq(pTask, &req, &rsp, exec);
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return 0;
}

L
Liu Jicong 已提交
1224 1225
// Process the response to a dispatch previously sent by one of this vnode's tasks.
//
// The SStreamDispatchRsp sits after an SMsgHead in pMsg->pCont; its upstreamTaskId is converted with
// ntohl() and used to look up the task, which then receives the response and pMsg->code.
//
// Returns 0 when the task was found, -1 otherwise.
int32_t tqProcessTaskDispatchRsp(STQ* pTq, SRpcMsg* pMsg) {
  SStreamDispatchRsp* pRsp = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t             upstreamTaskId = ntohl(pRsp->upstreamTaskId);

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, upstreamTaskId);
  tqDebug("recv dispatch rsp, code:%x", pMsg->code);

  if (pTask == NULL) {
    return -1;
  }

  streamProcessDispatchRsp(pTask, pRsp, pMsg->code);
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return 0;
}
L
Liu Jicong 已提交
1237

1238
// Drop a stream task: msg is read as an SVDropStreamTaskReq and its taskId is passed to
// streamMetaRemoveTask(). sversion and msgLen are not used. Always returns 0.
int32_t tqProcessTaskDropReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  const SVDropStreamTaskReq* pDropReq = (SVDropStreamTaskReq*)msg;

  streamMetaRemoveTask(pTq->pStreamMeta, pDropReq->taskId);
  return 0;
}
L
Liu Jicong 已提交
1243

5
54liuyao 已提交
1244 1245
// Pause a stream task.
//
// msg is read as an SVPauseStreamTaskReq. If the task exists and is not already paused, its current
// status is saved in status.keepTaskStatus and the status becomes TASK_STATUS__PAUSE. A task that is
// already paused is left untouched, so a repeated pause request cannot overwrite the saved status
// with TASK_STATUS__PAUSE (which would make a later resume restore "paused").
//
// Always returns 0, including when the task does not exist.
int32_t tqProcessTaskPauseReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SVPauseStreamTaskReq* pReq = (SVPauseStreamTaskReq*)msg;

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
  if (pTask == NULL) {
    return 0;
  }

  tqDebug("vgId:%d s-task:%s set pause flag", pTq->pStreamMeta->vgId, pTask->id.idStr);

  int8_t curStatus = atomic_load_8(&pTask->status.taskStatus);
  if (curStatus != TASK_STATUS__PAUSE) {
    // remember the status to return to on resume before switching to paused
    atomic_store_8(&pTask->status.keepTaskStatus, curStatus);
    atomic_store_8(&pTask->status.taskStatus, TASK_STATUS__PAUSE);
  }

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return 0;
}

// Resume a stream task.
//
// msg is read as an SVResumeStreamTaskReq. If the task exists, its status is set back to
// status.keepTaskStatus; when igUntreated is set, chkInfo.currentVer is moved to sversion so data
// written while the task was suspended is skipped. tqStartStreamTasks() is called afterwards.
//
// Always returns 0, including when the task does not exist.
int32_t tqProcessTaskResumeReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SVResumeStreamTaskReq* pReq = (SVResumeStreamTaskReq*)msg;

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
  if (pTask == NULL) {
    return 0;
  }

  atomic_store_8(&pTask->status.taskStatus, pTask->status.keepTaskStatus);

  // no lock needs to secure the access of the version
  if (!pReq->igUntreated) {
    // from the previous paused version and go on
    tqDebug("vgId:%d s-task:%s resume to normal from paused ver:%" PRId64 ", vnode ver:%" PRId64, pTq->pStreamMeta->vgId,
            pTask->id.idStr, pTask->chkInfo.currentVer, sversion);
  } else {
    // discard all the data when the stream task is suspended.
    pTask->chkInfo.currentVer = sversion;
    tqDebug("vgId:%d s-task:%s resume to normal from the latest version:%" PRId64 ", vnode ver:%" PRId64, pTq->pStreamMeta->vgId,
            pTask->id.idStr, pTask->chkInfo.currentVer, sversion);
  }

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  tqStartStreamTasks(pTq);
  return 0;
}

L
Liu Jicong 已提交
1279 1280 1281 1282 1283 1284
// Process a retrieve request addressed to one of this vnode's tasks.
//
// The payload follows an SMsgHead inside pMsg->pCont and is decoded as an SStreamRetrieveReq. If the
// task named by req.dstTaskId exists, the request is passed to streamProcessRetrieveReq() with a
// response skeleton built from pMsg->info. The decoded request is released with
// tDeleteStreamRetrieveReq() whether or not the task was found.
//
// Returns 0 when the task handled the request; -1 when the payload cannot be decoded or the task
// cannot be acquired.
int32_t tqProcessTaskRetrieveReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  // zero-init so nothing downstream ever sees stack garbage from a partial decode
  SStreamRetrieveReq req = {0};
  SDecoder           decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  int32_t decodeRet = tDecodeStreamRetrieveReq(&decoder, &req);
  tDecoderClear(&decoder);
  if (decodeRet < 0) {
    return -1;
  }

  int32_t code = -1;

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.dstTaskId);
  if (pTask != NULL) {
    SRpcMsg rsp = {.info = pMsg->info, .code = 0};
    streamProcessRetrieveReq(pTask, &req, &rsp);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    code = 0;
  }

  tDeleteStreamRetrieveReq(&req);
  return code;
}

// Placeholder handler for the retrieve response: the message is not inspected. Always returns 0.
int32_t tqProcessTaskRetrieveRsp(STQ* pTq, SRpcMsg* pMsg) {
  (void)pTq;
  (void)pMsg;
  return 0;
}
L
Liu Jicong 已提交
1306

1307 1308 1309 1310 1311 1312
// Decode a stream dispatch message and hand it straight to the destination task.
//
// On success the request is passed to streamProcessDispatchReq() (exec = false), pMsg->pCont and
// pMsg are freed, and 0 is returned.
//
// On failure (payload cannot be decoded, or the task does not exist) -1 is returned. If the message
// carries an RPC handle, an SStreamDispatchRsp with the error code is sent back first. pMsg->pCont
// and pMsg are freed on every failure exit, including the one without an RPC handle, so all exits
// treat the message the same way.
int32_t vnodeEnqueueStreamMsg(SVnode* pVnode, SRpcMsg* pMsg) {
  STQ*      pTq = pVnode->pTq;
  SMsgHead* msgStr = pMsg->pCont;
  char*     msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t   msgLen = pMsg->contLen - sizeof(SMsgHead);
  int32_t   code = 0;

  // zero-init: the error response below reads fields of req even when decoding failed
  SStreamDispatchReq req = {0};
  SDecoder           decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  int32_t decodeRet = tDecodeStreamDispatchReq(&decoder, &req);
  tDecoderClear(&decoder);

  if (decodeRet < 0) {
    code = TSDB_CODE_MSG_DECODE_ERROR;
  } else {
    SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.taskId);
    if (pTask != NULL) {
      SRpcMsg rsp = {.info = pMsg->info, .code = 0};
      streamProcessDispatchReq(pTask, &req, &rsp, false);
      streamMetaReleaseTask(pTq->pStreamMeta, pTask);
      rpcFreeCont(pMsg->pCont);
      taosFreeQitem(pMsg);
      return 0;
    }

    tDeleteStreamDispatchReq(&req);
    code = TSDB_CODE_STREAM_TASK_NOT_EXIST;
  }

  // failure: answer the sender if there is someone to answer to
  if (pMsg->info.handle != NULL) {
    SMsgHead* pRspHead = rpcMallocCont(sizeof(SMsgHead) + sizeof(SStreamDispatchRsp));
    if (pRspHead == NULL) {
      // no room for a full response body; report out-of-memory with an empty body
      code = TSDB_CODE_OUT_OF_MEMORY;
      SRpcMsg rsp = {.code = code, .info = pMsg->info};
      tqDebug("send dispatch error rsp, code: %x", code);
      tmsgSendRsp(&rsp);
    } else {
      pRspHead->vgId = htonl(req.upstreamNodeId);

      SStreamDispatchRsp* pRsp = POINTER_SHIFT(pRspHead, sizeof(SMsgHead));
      pRsp->streamId = htobe64(req.streamId);
      pRsp->upstreamTaskId = htonl(req.upstreamTaskId);
      pRsp->upstreamNodeId = htonl(req.upstreamNodeId);
      pRsp->downstreamNodeId = htonl(pVnode->config.vgId);
      pRsp->downstreamTaskId = htonl(req.taskId);
      pRsp->inputStatus = TASK_OUTPUT_STATUS__NORMAL;

      SRpcMsg rsp = {
          .code = code, .info = pMsg->info, .contLen = sizeof(SMsgHead) + sizeof(SStreamDispatchRsp), .pCont = pRspHead};
      tqDebug("send dispatch error rsp, code: %x", code);
      tmsgSendRsp(&rsp);
    }
  }

  rpcFreeCont(pMsg->pCont);
  taosFreeQitem(pMsg);
  return -1;
}
L
Liu Jicong 已提交
1370

1371
// Returns 1 when sversion is not greater than pTq->walLogLastVer, 0 otherwise.
int32_t tqCheckLogInWal(STQ* pTq, int64_t sversion) {
  if (sversion <= pTq->walLogLastVer) {
    return 1;
  }
  return 0;
}
1372

1373
// Schedule a WAL scan for the stream tasks of this vnode.
//
// Under the stream-meta write latch: if there are no tasks, nothing happens. Otherwise
// walScanCounter is incremented; only the caller that moves it from 0 to 1 posts a
// TDMT_STREAM_TASK_RUN message with taskId = WAL_READ_TASKS_ID to the stream queue, later callers
// just leave their increment behind as a pending scan request.
//
// Returns 0 on those paths; -1 with terrno = TSDB_CODE_OUT_OF_MEMORY when the message cannot be
// allocated. In that case the counter increment is undone, so that a later call can schedule the
// scan instead of assuming one is already in flight.
int32_t tqStartStreamTasks(STQ* pTq) {
  int32_t      vgId = TD_VID(pTq->pVnode);
  SStreamMeta* pMeta = pTq->pStreamMeta;

  taosWLockLatch(&pMeta->lock);

  int32_t numOfTasks = taosArrayGetSize(pMeta->pTaskList);
  if (numOfTasks == 0) {
    tqInfo("vgId:%d no stream tasks exist", vgId);
    taosWUnLockLatch(&pMeta->lock);
    return 0;
  }

  pMeta->walScanCounter += 1;

  if (pMeta->walScanCounter > 1) {
    tqDebug("vgId:%d wal read task has been launched, remain scan times:%d", vgId, pMeta->walScanCounter);
    taosWUnLockLatch(&pMeta->lock);
    return 0;
  }

  SStreamTaskRunReq* pRunReq = rpcMallocCont(sizeof(SStreamTaskRunReq));
  if (pRunReq == NULL) {
    // nothing was scheduled: take the increment back while still holding the latch
    pMeta->walScanCounter -= 1;
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    tqError("vgId:%d failed to create msg to start wal scanning to launch stream tasks, code:%s", vgId, terrstr());
    taosWUnLockLatch(&pMeta->lock);
    return -1;
  }

  tqDebug("vgId:%d create msg to start wal scan to launch stream tasks, numOfTasks:%d", vgId, numOfTasks);
  pRunReq->head.vgId = vgId;
  pRunReq->streamId = 0;
  pRunReq->taskId = WAL_READ_TASKS_ID;

  // NOTE(review): the result of tmsgPutToQueue() is not checked; confirm who owns pRunReq on failure.
  SRpcMsg msg = {.msgType = TDMT_STREAM_TASK_RUN, .pCont = pRunReq, .contLen = sizeof(SStreamTaskRunReq)};
  tmsgPutToQueue(&pTq->pVnode->msgCb, STREAM_QUEUE, &msg);
  taosWUnLockLatch(&pMeta->lock);

  return 0;
}