tq.c 61.3 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
S
Shengliang Guan 已提交
14 15
 */

H
Hongze Cheng 已提交
16
#include "tq.h"
S
Shengliang Guan 已提交
17

dengyihao's avatar
dengyihao 已提交
18 19 20
// 0: not init
// 1: already inited
// 2: waiting to be initialized or cleaned up
21
static int32_t tqInitialize(STQ* pTq);
dengyihao's avatar
dengyihao 已提交
22

wmmhello's avatar
wmmhello 已提交
23
// Returns true when the handle's status field equals TMQ_HANDLE_STATUS_EXEC.
static FORCE_INLINE bool tqIsHandleExec(STqHandle* pHandle) {
  return pHandle->status == TMQ_HANDLE_STATUS_EXEC;
}
dengyihao's avatar
dengyihao 已提交
24 25
// Stores TMQ_HANDLE_STATUS_EXEC into the handle's status field.
static FORCE_INLINE void tqSetHandleExec(STqHandle* pHandle) {
  pHandle->status = TMQ_HANDLE_STATUS_EXEC;
}
// Stores TMQ_HANDLE_STATUS_IDLE into the handle's status field.
static FORCE_INLINE void tqSetHandleIdle(STqHandle* pHandle) {
  pHandle->status = TMQ_HANDLE_STATUS_IDLE;
}
wmmhello's avatar
wmmhello 已提交
26

L
Liu Jicong 已提交
27
int32_t tqInit() {
L
Liu Jicong 已提交
28 29 30 31 32 33
  int8_t old;
  while (1) {
    old = atomic_val_compare_exchange_8(&tqMgmt.inited, 0, 2);
    if (old != 2) break;
  }

34 35 36 37 38 39
  if (old == 0) {
    tqMgmt.timer = taosTmrInit(10000, 100, 10000, "TQ");
    if (tqMgmt.timer == NULL) {
      atomic_store_8(&tqMgmt.inited, 0);
      return -1;
    }
40 41 42
    if (streamInit() < 0) {
      return -1;
    }
L
Liu Jicong 已提交
43
    atomic_store_8(&tqMgmt.inited, 1);
44
  }
45

L
Liu Jicong 已提交
46 47
  return 0;
}
L
Liu Jicong 已提交
48

49
void tqCleanUp() {
L
Liu Jicong 已提交
50 51 52 53 54 55 56 57
  int8_t old;
  while (1) {
    old = atomic_val_compare_exchange_8(&tqMgmt.inited, 1, 2);
    if (old != 2) break;
  }

  if (old == 1) {
    taosTmrCleanUp(tqMgmt.timer);
L
Liu Jicong 已提交
58
    streamCleanUp();
L
Liu Jicong 已提交
59 60
    atomic_store_8(&tqMgmt.inited, 0);
  }
61
}
L
Liu Jicong 已提交
62

63
void tqDestroyTqHandle(void* data) {
64 65
  STqHandle* pData = (STqHandle*)data;
  qDestroyTask(pData->execHandle.task);
wmmhello's avatar
wmmhello 已提交
66

67
  if (pData->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
L
Liu Jicong 已提交
68
    taosMemoryFreeClear(pData->execHandle.execCol.qmsg);
69
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__DB) {
70
    tqReaderClose(pData->execHandle.pTqReader);
71 72
    walCloseReader(pData->pWalReader);
    taosHashCleanup(pData->execHandle.execDb.pFilterOutTbUid);
L
Liu Jicong 已提交
73
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__TABLE) {
74
    walCloseReader(pData->pWalReader);
75
    tqReaderClose(pData->execHandle.pTqReader);
76 77
    taosMemoryFreeClear(pData->execHandle.execTb.qmsg);
    nodesDestroyNode(pData->execHandle.execTb.node);
78
  }
dengyihao's avatar
dengyihao 已提交
79
  if (pData->msg != NULL) {
80 81 82
    rpcFreeCont(pData->msg->pCont);
    taosMemoryFree(pData->msg);
    pData->msg = NULL;
D
dapan1121 已提交
83
  }
L
Liu Jicong 已提交
84 85
}

86
static bool tqOffsetEqual(const STqOffset* pLeft, const STqOffset* pRight) {
87
  return pLeft->val.type == TMQ_OFFSET__LOG && pRight->val.type == TMQ_OFFSET__LOG &&
88
         pLeft->val.version == pRight->val.version;
89 90
}

L
Liu Jicong 已提交
91
// Allocates and opens a TQ instance for the given vnode.
//
// path   - directory path; duplicated into the returned object.
// pVnode - owning vnode; its WAL's last version is recorded in walLogLastVer.
//
// Returns the new STQ on success. Returns NULL on failure; allocation failures set terrno to
// TSDB_CODE_OUT_OF_MEMORY, and a failure in tqInitialize() closes the half-built object via
// tqClose() before returning.
STQ* tqOpen(const char* path, SVnode* pVnode) {
  STQ* pTq = taosMemoryCalloc(1, sizeof(STQ));
  if (pTq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pTq->path = taosStrdup(path);
  pTq->pVnode = pVnode;
  pTq->walLogLastVer = pVnode->pWal->vers.lastVer;
  taosInitRWLatch(&pTq->lock);

  pTq->pHandle = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);
  pTq->pPushMgr = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
  pTq->pCheckInfo = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);

  // Verify every allocation before any of them is used; release whatever succeeded.
  if (pTq->path == NULL || pTq->pHandle == NULL || pTq->pPushMgr == NULL || pTq->pCheckInfo == NULL) {
    taosHashCleanup(pTq->pHandle);
    taosHashCleanup(pTq->pPushMgr);
    taosHashCleanup(pTq->pCheckInfo);
    taosMemoryFree(pTq->path);
    taosMemoryFree(pTq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  taosHashSetFreeFp(pTq->pHandle, tqDestroyTqHandle);
  taosHashSetFreeFp(pTq->pCheckInfo, (FDelete)tDeleteSTqCheckInfo);

  if (tqInitialize(pTq) != TSDB_CODE_SUCCESS) {
    tqClose(pTq);
    return NULL;
  }

  return pTq;
}

// Opens the persistent parts of a TQ instance in order: meta store, offset store, stream
// meta, and finally loads the stream tasks. Returns 0 on success and -1 as soon as any step
// fails; nothing opened so far is released here.
int32_t tqInitialize(STQ* pTq) {
  if (tqMetaOpen(pTq) < 0) {
    return -1;
  }

  if ((pTq->pOffsetStore = tqOffsetOpen(pTq)) == NULL) {
    return -1;
  }

  pTq->pStreamMeta = streamMetaOpen(pTq->path, pTq, (FTaskExpand*)tqExpandTask, pTq->pVnode->config.vgId);
  if (NULL == pTq->pStreamMeta) {
    return -1;
  }

  // the version is kept in task's meta data
  // todo check if this version is required or not
  int32_t loaded = streamLoadTasks(pTq->pStreamMeta, walGetCommittedVer(pTq->pVnode->pWal));
  return (loaded < 0) ? -1 : 0;
}
L
Liu Jicong 已提交
143

L
Liu Jicong 已提交
144
// Closes a TQ instance and frees it. A NULL argument is ignored.
// Every handle still registered in the push manager with a pending poll message first gets
// an empty data response, and that message is released, before the stores are torn down.
void tqClose(STQ* pTq) {
  if (pTq == NULL) {
    return;
  }

  for (void* pIter = taosHashIterate(pTq->pPushMgr, NULL); pIter != NULL;
       pIter = taosHashIterate(pTq->pPushMgr, pIter)) {
    STqHandle* pHandle = *(STqHandle**)pIter;
    int32_t    vgId = TD_VID(pTq->pVnode);

    if (pHandle->msg == NULL) {
      continue;
    }

    // Answer the waiting consumer, then drop the stored request.
    tqPushEmptyDataRsp(pHandle, vgId);
    rpcFreeCont(pHandle->msg->pCont);
    taosMemoryFree(pHandle->msg);
    pHandle->msg = NULL;
  }

  tqOffsetClose(pTq->pOffsetStore);
  taosHashCleanup(pTq->pHandle);
  taosHashCleanup(pTq->pPushMgr);
  taosHashCleanup(pTq->pCheckInfo);
  taosMemoryFree(pTq->path);
  tqMetaClose(pTq);
  streamMetaClose(pTq->pStreamMeta);
  taosMemoryFree(pTq);
}
L
Liu Jicong 已提交
172

173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195
// Scans all tasks in pMeta->pTasks while holding the meta write latch and reports whether at
// least one of them has status.timerActive == 1. The scan always visits every task.
static bool hasStreamTaskInTimer(SStreamMeta* pMeta) {
  bool found = false;

  taosWLockLatch(&pMeta->lock);

  for (void* pIter = taosHashIterate(pMeta->pTasks, NULL); pIter != NULL;
       pIter = taosHashIterate(pMeta->pTasks, pIter)) {
    SStreamTask* pTask = *(SStreamTask**)pIter;
    if (pTask->status.timerActive == 1) {
      found = true;
    }
  }

  taosWUnLockLatch(&pMeta->lock);

  return found;
}

H
Haojun Liao 已提交
196 197 198 199 200 201 202 203 204 205 206 207
// Prepares a TQ instance for shutdown. A NULL argument is ignored.
// Phase 1 (under the stream-meta write latch): mark every stream task as TASK_STATUS__STOP
// and kill its executor. Phase 2: poll every 100ms until no task reports an active timer.
void tqNotifyClose(STQ* pTq) {
  if (pTq == NULL) {
    return;
  }

  SStreamMeta* pMeta = pTq->pStreamMeta;

  taosWLockLatch(&pMeta->lock);

  for (void* pIter = taosHashIterate(pMeta->pTasks, NULL); pIter != NULL;
       pIter = taosHashIterate(pMeta->pTasks, pIter)) {
    SStreamTask* pTask = *(SStreamTask**)pIter;

    tqDebug("vgId:%d s-task:%s set closing flag", pTq->pStreamMeta->vgId, pTask->id.idStr);
    pTask->status.taskStatus = TASK_STATUS__STOP;

    // Measure how long killing the executor takes, for the debug log only.
    int64_t killStart = taosGetTimestampMs();
    qKillTask(pTask->exec.pExecutor, TSDB_CODE_SUCCESS);
    int64_t killElapsed = taosGetTimestampMs() - killStart;

    tqDebug("vgId:%d s-task:%s is closed in %" PRId64 " ms", pTq->pStreamMeta->vgId, pTask->id.idStr, killElapsed);
  }

  taosWUnLockLatch(&pMeta->lock);

  tqDebug("vgId:%d start to check all tasks", pTq->pStreamMeta->vgId);

  int64_t waitStart = taosGetTimestampMs();

  while (hasStreamTaskInTimer(pTq->pStreamMeta)) {
    tqDebug("vgId:%d some tasks in timer, wait for 100ms and recheck", pTq->pStreamMeta->vgId);
    taosMsleep(100);
  }

  int64_t waitElapsed = taosGetTimestampMs() - waitStart;
  tqDebug("vgId:%d all stream tasks are not in timer, continue close, elapsed time:%" PRId64 " ms",
          pTq->pStreamMeta->vgId, waitElapsed);
}

234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281
//static int32_t doSendDataRsp(const SRpcHandleInfo* pRpcHandleInfo, const SMqDataRsp* pRsp, int32_t epoch,
//                             int64_t consumerId, int32_t type) {
//  int32_t len = 0;
//  int32_t code = 0;
//
//  if (type == TMQ_MSG_TYPE__POLL_DATA_RSP) {
//    tEncodeSize(tEncodeMqDataRsp, pRsp, len, code);
//  } else if (type == TMQ_MSG_TYPE__POLL_DATA_META_RSP) {
//    tEncodeSize(tEncodeSTaosxRsp, (STaosxRsp*)pRsp, len, code);
//  }
//
//  if (code < 0) {
//    return -1;
//  }
//
//  int32_t tlen = sizeof(SMqRspHead) + len;
//  void*   buf = rpcMallocCont(tlen);
//  if (buf == NULL) {
//    return -1;
//  }
//
//  ((SMqRspHead*)buf)->mqMsgType = type;
//  ((SMqRspHead*)buf)->epoch = epoch;
//  ((SMqRspHead*)buf)->consumerId = consumerId;
//
//  void* abuf = POINTER_SHIFT(buf, sizeof(SMqRspHead));
//
//  SEncoder encoder = {0};
//  tEncoderInit(&encoder, abuf, len);
//
//  if (type == TMQ_MSG_TYPE__POLL_DATA_RSP) {
//    tEncodeMqDataRsp(&encoder, pRsp);
//  } else if (type == TMQ_MSG_TYPE__POLL_DATA_META_RSP) {
//    tEncodeSTaosxRsp(&encoder, (STaosxRsp*)pRsp);
//  }
//
//  tEncoderClear(&encoder);
//
//  SRpcMsg rsp = {
//      .info = *pRpcHandleInfo,
//      .pCont = buf,
//      .contLen = tlen,
//      .code = 0,
//  };
//
//  tmsgSendRsp(&rsp);
//  return 0;
//}
L
Liu Jicong 已提交
282

283 284 285 286 287 288 289
// Answers the poll request stored in pHandle->msg with a data response that contains no
// blocks and whose response offset equals the request offset.
// The caller must ensure pHandle->msg is not NULL; it is dereferenced unconditionally.
// Returns 0 on success, or -1 with terrno = TSDB_CODE_INVALID_MSG when the stored request
// cannot be deserialized.
int32_t tqPushEmptyDataRsp(STqHandle* pHandle, int32_t vgId) {
  SMqPollReq pollReq = {0};
  if (tDeserializeSMqPollReq(pHandle->msg->pCont, pHandle->msg->contLen, &pollReq) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pHandle->msg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  SMqDataRsp emptyRsp = {0};
  tqInitDataRsp(&emptyRsp, &pollReq);
  emptyRsp.blockNum = 0;
  emptyRsp.rspOffset = emptyRsp.reqOffset;

  char offsetStr[TSDB_OFFSET_LEN] = {0};
  tFormatOffset(offsetStr, TSDB_OFFSET_LEN, &emptyRsp.reqOffset);
  tqInfo("tqPushEmptyDataRsp to consumer:0x%" PRIx64 " vgId:%d, offset:%s, reqId:0x%" PRIx64, pollReq.consumerId,
         vgId, offsetStr, pollReq.reqId);

  tqSendDataRsp(pHandle, pHandle->msg, &pollReq, &emptyRsp, TMQ_MSG_TYPE__POLL_DATA_RSP, vgId);
  tDeleteMqDataRsp(&emptyRsp);
  return 0;
}

304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323
//int32_t tqPushDataRsp(STqHandle* pHandle, int32_t vgId) {
//  SMqDataRsp dataRsp = {0};
//  dataRsp.head.consumerId = pHandle->consumerId;
//  dataRsp.head.epoch = pHandle->epoch;
//  dataRsp.head.mqMsgType = TMQ_MSG_TYPE__POLL_RSP;
//
//  int64_t sver = 0, ever = 0;
//  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);
//  tqDoSendDataRsp(&pHandle->msg->info, &dataRsp, pHandle->epoch, pHandle->consumerId, TMQ_MSG_TYPE__POLL_RSP, sver,
//                  ever);
//
//  char buf1[TSDB_OFFSET_LEN] = {0};
//  char buf2[TSDB_OFFSET_LEN] = {0};
//  tFormatOffset(buf1, tListLen(buf1), &dataRsp.reqOffset);
//  tFormatOffset(buf2, tListLen(buf2), &dataRsp.rspOffset);
//  tqDebug("vgId:%d, from consumer:0x%" PRIx64 " (epoch %d) push rsp, block num: %d, req:%s, rsp:%s", vgId,
//          dataRsp.head.consumerId, dataRsp.head.epoch, dataRsp.blockNum, buf1, buf2);
//  return 0;
//}

324 325 326 327 328 329
// Sends a data response for a poll request and logs the request/response offsets.
// The valid WAL version range of the handle's reader is looked up first and forwarded to
// tqDoSendDataRsp together with the epoch and consumer id taken from pReq.
// Always returns 0.
int32_t tqSendDataRsp(STqHandle* pHandle, const SRpcMsg* pMsg, const SMqPollReq* pReq, const SMqDataRsp* pRsp,
                      int32_t type, int32_t vgId) {
  int64_t startVer = 0;
  int64_t endVer = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &startVer, &endVer);

  tqDoSendDataRsp(&pMsg->info, pRsp, pReq->epoch, pReq->consumerId, type, startVer, endVer);

  char reqOffsetStr[TSDB_OFFSET_LEN] = {0};
  char rspOffsetStr[TSDB_OFFSET_LEN] = {0};
  tFormatOffset(reqOffsetStr, TSDB_OFFSET_LEN, &pRsp->reqOffset);
  tFormatOffset(rspOffsetStr, TSDB_OFFSET_LEN, &pRsp->rspOffset);

  tqDebug("tmq poll vgId:%d consumer:0x%" PRIx64 " (epoch %d) send rsp, block num:%d, req:%s, rsp:%s, reqId:0x%" PRIx64,
          vgId, pReq->consumerId, pReq->epoch, pRsp->blockNum, reqOffsetStr, rspOffsetStr, pReq->reqId);

  return 0;
}

342
// Handles an offset-commit message: decodes an SMqVgOffset from msg and stores it in the
// offset store unless an identical log offset is already saved.
//
// sversion is not used by this function.
// Returns 0 when the offset was stored or was already up to date; -1 when the message cannot
// be decoded, the offset type is not snapshot/log, or the write to the store fails.
int32_t tqProcessOffsetCommitReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SMqVgOffset vgOffset = {0};
  int32_t     vgId = TD_VID(pTq->pVnode);

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  if (tDecodeMqVgOffset(&decoder, &vgOffset) < 0) {
    // Release the decoder on the failure path as well, as tqProcessSubscribeReq does.
    tDecoderClear(&decoder);
    return -1;
  }

  tDecoderClear(&decoder);

  STqOffset* pOffset = &vgOffset.offset;

  if (pOffset->val.type == TMQ_OFFSET__SNAPSHOT_DATA || pOffset->val.type == TMQ_OFFSET__SNAPSHOT_META) {
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:snapshot) uid:%" PRId64 ", ts:%" PRId64,
            pOffset->subKey, vgId, pOffset->val.uid, pOffset->val.ts);
  } else if (pOffset->val.type == TMQ_OFFSET__LOG) {
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:log) version:%" PRId64, pOffset->subKey, vgId,
            pOffset->val.version);
  } else {
    tqError("invalid commit offset type:%d", pOffset->val.type);
    return -1;
  }

  // Skip the write when the stored offset is a log offset with the same version.
  STqOffset* pSavedOffset = tqOffsetRead(pTq->pOffsetStore, pOffset->subKey);
  if (pSavedOffset != NULL && tqOffsetEqual(pOffset, pSavedOffset)) {
    tqInfo("not update the offset, vgId:%d sub:%s since committed:%" PRId64 " less than/equal to existed:%" PRId64,
            vgId, pOffset->subKey, pOffset->val.version, pSavedOffset->val.version);
    return 0;  // no need to update the offset value
  }

  // save the new offset value
  if (tqOffsetWrite(pTq->pOffsetStore, pOffset) < 0) {
    return -1;
  }

  return 0;
}

382 383
// Handles a consumer seek request.
//
// The request is deserialized, the subscription handle is looked up by subKey, and the
// consumer id is checked against the handle under the TQ read latch. If everything matches,
// the handle is unregistered from the push manager. No offset is modified here.
//
// A response is always sent through tmsgSendRsp with rsp.code set to:
//   0                               - success, or the subKey has no handle (only a warning is logged)
//   TSDB_CODE_OUT_OF_MEMORY         - the request could not be deserialized
//   TSDB_CODE_TMQ_CONSUMER_MISMATCH - the handle belongs to a different consumer
// The function itself always returns 0.
int32_t tqProcessSeekReq(STQ* pTq, SRpcMsg* pMsg) {
  SMqSeekReq req = {0};
  int32_t    vgId = TD_VID(pTq->pVnode);
  SRpcMsg    rsp = {.info = pMsg->info};
  int        code = 0;

  if (tDeserializeSMqSeekReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  tqDebug("tmq seek: consumer:0x%" PRIx64 " vgId:%d, subkey %s", req.consumerId, vgId, req.subKey);

  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
  if (pHandle == NULL) {
    tqWarn("tmq seek: consumer:0x%" PRIx64 " vgId:%d subkey %s not found", req.consumerId, vgId, req.subKey);
    code = 0;
    goto end;
  }

  // 2. check consumer-vg assignment status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != req.consumerId) {
    tqError("ERROR tmq seek: consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            req.consumerId, vgId, req.subKey, pHandle->consumerId);
    taosRUnLockLatch(&pTq->lock);
    code = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    goto end;
  }

  // if consumer register to push manager, push empty to consumer to change vg status from TMQ_VG_STATUS__WAIT to
  // TMQ_VG_STATUS__IDLE, otherwise poll data failed after seek.
  tqUnregisterPushHandle(pTq, pHandle);
  taosRUnLockLatch(&pTq->lock);

end:
  rsp.code = code;
  tmsgSendRsp(&rsp);
  return 0;
}

L
Liu Jicong 已提交
503
// Checks whether column colId of table tbUid may be modified.
// Walks every entry of pTq->pCheckInfo; an entry whose ntbUid equals tbUid and whose
// colIdList contains colId forbids the change.
// Returns -1 when such an entry exists (the hash iteration is cancelled first), 0 otherwise.
int32_t tqCheckColModifiable(STQ* pTq, int64_t tbUid, int32_t colId) {
  for (void* pIter = taosHashIterate(pTq->pCheckInfo, NULL); pIter != NULL;
       pIter = taosHashIterate(pTq->pCheckInfo, pIter)) {
    STqCheckInfo* pCheck = (STqCheckInfo*)pIter;
    if (pCheck->ntbUid != tbUid) {
      continue;
    }

    int32_t numOfCols = taosArrayGetSize(pCheck->colIdList);
    for (int32_t idx = 0; idx < numOfCols; ++idx) {
      int16_t forbidColId = *(int16_t*)taosArrayGet(pCheck->colIdList, idx);
      if (forbidColId == colId) {
        // Leaving the iteration early requires an explicit cancel.
        taosHashCancelIterate(pTq->pCheckInfo, pIter);
        return -1;
      }
    }
  }

  return 0;
}

529 530 531 532 533 534 535 536
// Re-submits every poll request parked in the push manager to the query queue as a
// TDMT_VND_TMQ_CONSUME message, then empties the push manager. Runs under the TQ write latch.
// pMsg is not used. Always returns 0.
int32_t tqProcessPollPush(STQ* pTq, SRpcMsg* pMsg) {
  int32_t vgId = TD_VID(pTq->pVnode);

  taosWLockLatch(&pTq->lock);

  if (taosHashGetSize(pTq->pPushMgr) > 0) {
    for (void* pIter = taosHashIterate(pTq->pPushMgr, NULL); pIter != NULL;
         pIter = taosHashIterate(pTq->pPushMgr, pIter)) {
      STqHandle* pHandle = *(STqHandle**)pIter;
      tqInfo("vgId:%d start set submit for pHandle:%p, consumer:0x%" PRIx64, vgId, pHandle, pHandle->consumerId);

      // A registered handle without a stored request is unexpected: stop the scan.
      if (ASSERT(pHandle->msg != NULL)) {
        tqError("pHandle->msg should not be null");
        taosHashCancelIterate(pTq->pPushMgr, pIter);
        break;
      }

      // The message content is handed over to the queue; only the SRpcMsg shell is freed here.
      SRpcMsg msg = {.msgType = TDMT_VND_TMQ_CONSUME,
                     .pCont = pHandle->msg->pCont,
                     .contLen = pHandle->msg->contLen,
                     .info = pHandle->msg->info};
      tmsgPutToQueue(&pTq->pVnode->msgCb, QUERY_QUEUE, &msg);
      taosMemoryFree(pHandle->msg);
      pHandle->msg = NULL;
    }

    taosHashClear(pTq->pPushMgr);
  }

  taosWUnLockLatch(&pTq->lock);
  return 0;
}

D
dapan1121 已提交
559
// Handles a consumer poll request.
//
// Steps:
//   1. Deserialize the request.
//   2. Under the TQ write latch, find the subscription handle (falling back to tqMetaGetHandle
//      when it is not in the in-memory table), verify that it belongs to the requesting
//      consumer, and mark it as executing. If the handle is already executing, release the
//      latch, sleep 10ms and retry.
//   3. Raise the handle's epoch if the request carries a newer one.
//   4. Extract the data via tqExtractDataForMq and mark the handle idle again.
//
// Returns the result of tqExtractDataForMq, or -1 with terrno set to TSDB_CODE_INVALID_MSG
// (bad request / unknown subKey) or TSDB_CODE_TMQ_CONSUMER_MISMATCH.
int32_t tqProcessPollReq(STQ* pTq, SRpcMsg* pMsg) {
  SMqPollReq req = {0};
  int        code = 0;
  if (tDeserializeSMqPollReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pMsg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int64_t      consumerId = req.consumerId;
  int32_t      reqEpoch = req.epoch;
  STqOffsetVal reqOffset = req.reqOffset;
  int32_t      vgId = TD_VID(pTq->pVnode);
  STqHandle*   pHandle = NULL;

  while (1) {
    taosWLockLatch(&pTq->lock);

    // 1. find handle; if it is not cached, try to bring it in through tqMetaGetHandle
    pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
    if (pHandle == NULL && tqMetaGetHandle(pTq, req.subKey) == 0) {
      pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
    }

    if (pHandle == NULL) {
      tqError("tmq poll: consumer:0x%" PRIx64 " vgId:%d subkey %s not found", consumerId, vgId, req.subKey);
      terrno = TSDB_CODE_INVALID_MSG;
      taosWUnLockLatch(&pTq->lock);
      return -1;
    }

    // 2. check re-balance status
    if (pHandle->consumerId != consumerId) {
      tqError("ERROR tmq poll: consumer:0x%" PRIx64
              " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
              consumerId, TD_VID(pTq->pVnode), req.subKey, pHandle->consumerId);
      terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
      taosWUnLockLatch(&pTq->lock);
      return -1;
    }

    if (!tqIsHandleExec(pHandle)) {
      // Claim the handle for this request while still holding the latch.
      tqSetHandleExec(pHandle);
      tqDebug("tmq poll: consumer:0x%" PRIx64 " vgId:%d, topic:%s, set handle exec, pHandle:%p", consumerId, vgId,
              req.subKey, pHandle);
      taosWUnLockLatch(&pTq->lock);
      break;
    }
    taosWUnLockLatch(&pTq->lock);

    // Another request is using the handle: back off without holding the latch.
    tqDebug("tmq poll: consumer:0x%" PRIx64
            " vgId:%d, topic:%s, subscription is executing, wait for 10ms and retry, pHandle:%p",
            consumerId, vgId, req.subKey, pHandle);
    taosMsleep(10);
  }

  // 3. update the epoch value
  if (pHandle->epoch < reqEpoch) {
    tqDebug("tmq poll: consumer:0x%" PRIx64 " epoch update from %d to %d by poll req", consumerId, pHandle->epoch,
            reqEpoch);
    pHandle->epoch = reqEpoch;
  }

  char buf[TSDB_OFFSET_LEN] = {0};
  tFormatOffset(buf, TSDB_OFFSET_LEN, &reqOffset);
  tqDebug("tmq poll: consumer:0x%" PRIx64 " (epoch %d), subkey %s, recv poll req vgId:%d, req:%s, reqId:0x%" PRIx64,
          consumerId, req.epoch, pHandle->subKey, vgId, buf, req.reqId);

  code = tqExtractDataForMq(pTq, pHandle, &req, pMsg);
  tqSetHandleIdle(pHandle);

  tqDebug("tmq poll: consumer:0x%" PRIx64 " vgId:%d, topic:%s, set handle idle, pHandle:%p", consumerId, vgId,
          req.subKey, pHandle);
  return code;
}

640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666
// Answers a "committed offset" query for one subscription.
//
// The payload following the SMsgHead is decoded as an SMqVgOffset; the saved offset for its
// subKey is read from the offset store, encoded, and sent back through tmsgSendRsp.
//
// Returns 0 after the response has been sent, or one of:
//   TSDB_CODE_OUT_OF_MEMORY    - the request could not be decoded, or the response buffer
//                                could not be allocated
//   TSDB_CODE_TMQ_NO_COMMITTED - no offset is stored for the subKey
//   TSDB_CODE_INVALID_PARA     - the stored offset could not be encoded
int32_t tqProcessVgCommittedInfoReq(STQ* pTq, SRpcMsg* pMsg) {
  void*   data = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t len = pMsg->contLen - sizeof(SMsgHead);

  SMqVgOffset vgOffset = {0};

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)data, len);
  if (tDecodeMqVgOffset(&decoder, &vgOffset) < 0) {
    // Release the decoder on the failure path too.
    tDecoderClear(&decoder);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  tDecoderClear(&decoder);

  STqOffset* pOffset = &vgOffset.offset;
  STqOffset* pSavedOffset = tqOffsetRead(pTq->pOffsetStore, pOffset->subKey);
  if (pSavedOffset == NULL) {
    return TSDB_CODE_TMQ_NO_COMMITTED;
  }
  vgOffset.offset = *pSavedOffset;

  // From here on, len holds the encoded size of the response.
  int32_t code = 0;
  tEncodeSize(tEncodeMqVgOffset, &vgOffset, len, code);
  if (code < 0) {
    return TSDB_CODE_INVALID_PARA;
  }

  void* buf = rpcMallocCont(len);
  if (buf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  SEncoder encoder;
  tEncoderInit(&encoder, buf, len);
  if (tEncodeMqVgOffset(&encoder, &vgOffset) < 0) {
    // Do not send a partially written buffer.
    tEncoderClear(&encoder);
    rpcFreeCont(buf);
    return TSDB_CODE_INVALID_PARA;
  }
  tEncoderClear(&encoder);

  SRpcMsg rsp = {.info = pMsg->info, .pCont = buf, .contLen = len, .code = 0};

  tmsgSendRsp(&rsp);

  return 0;
}

683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719
// Answers a WAL-info query: reports the valid WAL version range of the subscription's reader
// together with a log offset chosen as follows:
//   - request offset is a log offset      -> its version is echoed back
//   - request offset type is negative     -> the stored offset's version if one exists,
//                                            otherwise sver for RESET_EARLIEST or ever for
//                                            RESET_LATEST
// Returns 0 after sending the response. Returns -1 with terrno set to TSDB_CODE_INVALID_MSG
// (bad request / unknown subKey), TSDB_CODE_TMQ_CONSUMER_MISMATCH, or TSDB_CODE_INVALID_PARA
// (snapshot requested, stored offset is not a log offset, or unsupported offset type).
int32_t tqProcessVgWalInfoReq(STQ* pTq, SRpcMsg* pMsg) {
  SMqPollReq req = {0};
  if (tDeserializeSMqPollReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pMsg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int64_t      consumerId = req.consumerId;
  STqOffsetVal reqOffset = req.reqOffset;
  int32_t      vgId = TD_VID(pTq->pVnode);

  // 1. find handle
  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
  if (NULL == pHandle) {
    tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s not found", consumerId, vgId, req.subKey);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  // 2. check re-balance status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != consumerId) {
    tqDebug("ERROR consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            consumerId, vgId, req.subKey, pHandle->consumerId);
    terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    taosRUnLockLatch(&pTq->lock);
    return -1;
  }
  taosRUnLockLatch(&pTq->lock);

  int64_t sver = 0;
  int64_t ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);

  SMqDataRsp dataRsp = {0};
  tqInitDataRsp(&dataRsp, &req);

  if (req.useSnapshot == true) {
    tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s snapshot not support wal info", consumerId, vgId, req.subKey);
    goto _invalid_para;
  }

  dataRsp.rspOffset.type = TMQ_OFFSET__LOG;

  if (reqOffset.type == TMQ_OFFSET__LOG) {
    dataRsp.rspOffset.version = reqOffset.version;
  } else if (reqOffset.type < 0) {
    STqOffset* pOffset = tqOffsetRead(pTq->pOffsetStore, req.subKey);
    if (pOffset == NULL) {
      // Nothing committed yet: derive the position from the reset policy.
      if (reqOffset.type == TMQ_OFFSET__RESET_EARLIEST) {
        dataRsp.rspOffset.version = sver;  // not consume yet, set the earliest position
      } else if (reqOffset.type == TMQ_OFFSET__RESET_LATEST) {
        dataRsp.rspOffset.version = ever;
      }
      tqInfo("consumer:0x%" PRIx64 " vgId:%d subkey:%s get assignment from init:%" PRId64, consumerId, vgId,
             req.subKey, dataRsp.rspOffset.version);
    } else if (pOffset->val.type != TMQ_OFFSET__LOG) {
      tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s, no valid wal info", consumerId, vgId, req.subKey);
      goto _invalid_para;
    } else {
      dataRsp.rspOffset.version = pOffset->val.version;
      tqInfo("consumer:0x%" PRIx64 " vgId:%d subkey:%s get assignment from store:%" PRId64, consumerId, vgId,
             req.subKey, dataRsp.rspOffset.version);
    }
  } else {
    tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s invalid offset type:%d", consumerId, vgId, req.subKey,
            reqOffset.type);
    goto _invalid_para;
  }

  tqDoSendDataRsp(&pMsg->info, &dataRsp, req.epoch, req.consumerId, TMQ_MSG_TYPE__WALINFO_RSP, sver, ever);
  tDeleteMqDataRsp(&dataRsp);
  return 0;

_invalid_para:
  // Shared exit for every "invalid parameter" rejection after dataRsp was initialized.
  terrno = TSDB_CODE_INVALID_PARA;
  tDeleteMqDataRsp(&dataRsp);
  return -1;
}

764
// Handles a "delete subscription" request. msg is interpreted as an SMqVDeleteReq.
// Under the TQ write latch: waits (10ms steps) until the handle is no longer executing,
// closes its WAL reference if any, removes it from the in-memory table, then deletes the
// offset and the persisted handle for the subKey.
// Individual failures are only logged; sversion and msgLen are not used. Always returns 0.
int32_t tqProcessDeleteSubReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SMqVDeleteReq* pReq = (SMqVDeleteReq*)msg;
  int32_t        vgId = TD_VID(pTq->pVnode);
  int32_t        code = 0;

  tqInfo("vgId:%d, tq process delete sub req %s", vgId, pReq->subKey);

  taosWLockLatch(&pTq->lock);

  STqHandle* pHandle = taosHashGet(pTq->pHandle, pReq->subKey, strlen(pReq->subKey));
  if (pHandle != NULL) {
    // Do not pull the handle out from under a poll that is still running on it.
    while (tqIsHandleExec(pHandle)) {
      tqDebug("vgId:%d, topic:%s, subscription is executing, wait for 10ms and retry, pHandle:%p", vgId,
              pHandle->subKey, pHandle);
      taosMsleep(10);
    }

    if (pHandle->pRef) {
      walCloseRef(pTq->pVnode->pWal, pHandle->pRef->refId);
    }

    code = taosHashRemove(pTq->pHandle, pReq->subKey, strlen(pReq->subKey));
    if (code != 0) {
      tqError("cannot process tq delete req %s, since no such handle", pReq->subKey);
    }
  }

  code = tqOffsetDelete(pTq->pOffsetStore, pReq->subKey);
  if (code != 0) {
    tqError("cannot process tq delete req %s, since no such offset in cache", pReq->subKey);
  }

  if (tqMetaDeleteHandle(pTq, pReq->subKey) < 0) {
    tqError("cannot process tq delete req %s, since no such offset in tdb", pReq->subKey);
  }

  taosWUnLockLatch(&pTq->lock);

  return 0;
}

803
// Process an "add check info" request: decode an STqCheckInfo from msg, put it into the in-memory
// check-info hash table keyed by its topic name, and persist the raw message through
// tqMetaSaveCheckInfo().
//
// Returns 0 on success. On any failure returns -1 with terrno set to TSDB_CODE_OUT_OF_MEMORY
// (the same code is used for decode, hash and meta-store failures, as callers may rely on it).
// sversion is not used here.
int32_t tqProcessAddCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  STqCheckInfo info = {0};
  SDecoder     decoder;

  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decoded = tDecodeSTqCheckInfo(&decoder, &info);
  // the decoder is released on both the success and the failure path
  tDecoderClear(&decoder);

  if (decoded < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (taosHashPut(pTq->pCheckInfo, info.topic, strlen(info.topic), &info, sizeof(STqCheckInfo)) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (tqMetaSaveCheckInfo(pTq, info.topic, msg, msgLen) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  return 0;
}

823
// Process a "delete check info" request: remove the entry keyed by msg from the in-memory
// check-info hash table and from the tq meta store.
//
// msg is used directly as the key and its length is taken with strlen(); msgLen and sversion are
// not used. NOTE(review): this assumes msg is a NUL-terminated topic name -- confirm with the sender.
//
// Returns 0 on success, -1 with terrno = TSDB_CODE_OUT_OF_MEMORY if either removal fails.
int32_t tqProcessDelCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  if (taosHashRemove(pTq->pCheckInfo, msg, strlen(msg)) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (tqMetaDeleteCheckInfo(pTq, msg) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  return 0;
}

835
// Process a subscribe / re-balance request (SMqRebVgReq) for one subscription key.
//
// - If no handle exists for req.subKey (neither in memory nor loadable through tqMetaGetHandle()),
//   a new handle is created for req.newConsumerId and saved to the meta store. A request whose
//   newConsumerId is -1 is rejected with an error log and the function returns 0.
// - If a handle exists, its consumer id is switched to req.newConsumerId under the tq write latch,
//   the handle is unregistered from the push manager and saved again. If the consumer id is
//   already the requested one, nothing is changed.
//
// Returns -1 with terrno = TSDB_CODE_INVALID_MSG when the request cannot be decoded; otherwise the
// result of tqCreateHandle()/tqMetaSaveHandle(), or 0 when nothing had to be saved.
// sversion is not used here.
int32_t tqProcessSubscribeReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  int         ret = 0;
  SMqRebVgReq req = {0};
  SDecoder    dc = {0};

  tDecoderInit(&dc, (uint8_t*)msg, msgLen);

  // decode req
  if (tDecodeSMqRebVgReq(&dc, &req) < 0) {
    terrno = TSDB_CODE_INVALID_MSG;
    tDecoderClear(&dc);
    return -1;
  }

  tqInfo("vgId:%d, tq process sub req:%s, Id:0x%" PRIx64 " -> Id:0x%" PRIx64, pTq->pVnode->config.vgId, req.subKey,
         req.oldConsumerId, req.newConsumerId);

  // Look the handle up in memory; when it is missing, ask the meta store for it and look again.
  // The loop ends once the handle is found or the meta store reports a failure.
  // NOTE(review): this presumes a successful tqMetaGetHandle() inserts the handle into
  // pTq->pHandle; otherwise the loop would not terminate -- confirm.
  STqHandle* pHandle = NULL;
  while (1) {
    pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
    if (pHandle || tqMetaGetHandle(pTq, req.subKey) < 0) {
      break;
    }
  }

  if (pHandle == NULL) {
    if (req.oldConsumerId != -1) {
      tqError("vgId:%d, build new consumer handle %s for consumer:0x%" PRIx64 ", but old consumerId:0x%" PRIx64,
              req.vgId, req.subKey, req.newConsumerId, req.oldConsumerId);
    }

    if (req.newConsumerId == -1) {
      tqError("vgId:%d, tq invalid re-balance request, new consumerId %" PRId64 "", req.vgId, req.newConsumerId);
      goto end;
    }

    STqHandle handle = {0};
    ret = tqCreateHandle(pTq, &req, &handle);
    if (ret < 0) {
      tqDestroyTqHandle(&handle);
      goto end;
    }

    ret = tqMetaSaveHandle(pTq, req.subKey, &handle);
  } else {
    taosWLockLatch(&pTq->lock);

    if (pHandle->consumerId == req.newConsumerId) {  // do nothing
      tqInfo("vgId:%d no switch consumer:0x%" PRIx64 " remains, because redo wal log", req.vgId, req.newConsumerId);
    } else {
      tqInfo("vgId:%d switch consumer from Id:0x%" PRIx64 " to Id:0x%" PRIx64, req.vgId, pHandle->consumerId,
             req.newConsumerId);
      atomic_store_64(&pHandle->consumerId, req.newConsumerId);

      // The epoch bump and the kill of a still-executing task are intentionally not performed here.

      // remove if it has been register in the push manager, and return one empty block to consumer
      tqUnregisterPushHandle(pTq, pHandle);
      ret = tqMetaSaveHandle(pTq, req.subKey, pHandle);
    }

    taosWUnLockLatch(&pTq->lock);
  }

end:
  tDecoderClear(&dc);
  return ret;
}
908

dengyihao's avatar
dengyihao 已提交
909
// Free-callback for containers that store pointers: ptr is the address of a stored pointer, and
// the memory that stored pointer refers to is released with taosMemoryFree().
void freePtr(void* ptr) {
  void** ppItem = (void**)ptr;
  taosMemoryFree(*ppItem);
}
L
liuyao 已提交
910

911
// Expand a decoded stream task into a runnable one on this vnode.
//
// Steps performed, in order:
//   - build the id string, open the input/output queues and set the initial status fields;
//   - initialize checkpoint version and data version range from ver;
//   - for SOURCE and AGG level tasks: open the state backend and create the executor;
//   - set up the sink (SMA or table sink, including the table schema and the table-info hash);
//   - for SOURCE level tasks: open a WAL reader that also extracts delete messages;
//   - reset a persisted PAUSE status to NORMAL, init the task mutex and the schedule trigger.
//
// pTq   - tq instance owning the vnode, WAL and stream meta
// pTask - task to expand; its fields are filled in place
// ver   - initial checkpoint/data version; chkInfo.version ends up as ver + 1
//
// Returns 0 on success and -1 as soon as a required resource cannot be created. Resources created
// before the failing step are left attached to pTask; this function does not release them.
int32_t tqExpandTask(STQ* pTq, SStreamTask* pTask, int64_t ver) {
  int32_t vgId = TD_VID(pTq->pVnode);

  pTask->id.idStr = createStreamTaskIdStr(pTask->id.streamId, pTask->id.taskId);
  pTask->refCnt = 1;
  pTask->status.schedStatus = TASK_SCHED_STATUS__INACTIVE;
  pTask->inputQueue = streamQueueOpen(512 << 10);
  pTask->outputInfo.queue = streamQueueOpen(512 << 10);

  if (pTask->inputQueue == NULL || pTask->outputInfo.queue == NULL) {
    tqError("s-task:%s failed to prepare the input/output queue, initialize task failed", pTask->id.idStr);
    return -1;
  }

  pTask->tsInfo.init = taosGetTimestampMs();
  pTask->inputStatus = TASK_INPUT_STATUS__NORMAL;
  pTask->outputInfo.status = TASK_OUTPUT_STATUS__NORMAL;
  pTask->pMsgCb = &pTq->pVnode->msgCb;
  pTask->pMeta = pTq->pStreamMeta;

  // start both the checkpoint info and the data version range at the given version
  pTask->chkInfo.version = ver;
  pTask->chkInfo.currentVer = ver;

  pTask->dataRange.range.maxVer = ver;
  pTask->dataRange.range.minVer = ver;

  const bool isSource = (pTask->info.taskLevel == TASK_LEVEL__SOURCE);
  const bool isAgg = (pTask->info.taskLevel == TASK_LEVEL__AGG);

  if (isSource || isAgg) {
    // A fill-history task opens the state backend under the id of its related stream task
    // (streamTaskId) instead of its own id; a temporary task object carries that id.
    SStreamTask* pStateTask = pTask;
    SStreamTask  task = {0};
    if (pTask->info.fillHistory) {
      task.id = pTask->streamTaskId;
      task.pMeta = pTask->pMeta;
      pStateTask = &task;
    }

    pTask->pState = streamStateOpen(pTq->pStreamMeta->path, pStateTask, false, -1, -1);
    if (pTask->pState == NULL) {
      return -1;
    }

    // members not named here are zero-initialized (vnode == NULL for agg tasks)
    SReadHandle handle = {.pStateBackend = pTask->pState,
                          .fillHistory = pTask->info.fillHistory,
                          .winRange = pTask->dataRange.window};
    if (isSource) {
      handle.vnode = pTq->pVnode;
      handle.initTqReader = 1;
    } else {
      handle.numOfVgroups = (int32_t)taosArrayGetSize(pTask->pUpstreamEpInfoList);
    }
    initStorageAPI(&handle.api);

    pTask->exec.pExecutor = qCreateStreamExecTaskInfo(pTask->exec.qmsg, &handle, vgId, pTask->id.taskId);
    if (pTask->exec.pExecutor == NULL) {
      return -1;
    }

    qSetTaskId(pTask->exec.pExecutor, pTask->id.taskId, pTask->id.streamId);
  }

  // sink
  if (pTask->outputInfo.type == TASK_OUTPUT__SMA) {
    pTask->smaSink.vnode = pTq->pVnode;
    pTask->smaSink.smaSink = smaHandleRes;
  } else if (pTask->outputInfo.type == TASK_OUTPUT__TABLE) {
    pTask->tbSink.vnode = pTq->pVnode;
    pTask->tbSink.tbSinkFunc = tqSinkToTablePipeline;

    // use the schema version stored in meta when the target super table is known, else 1
    int32_t   ver1 = 1;
    SMetaInfo info = {0};
    int32_t   code = metaGetInfo(pTq->pVnode->pMeta, pTask->tbSink.stbUid, &info, NULL);
    if (code == TSDB_CODE_SUCCESS) {
      ver1 = info.skmVer;
    }

    SSchemaWrapper* pschemaWrapper = pTask->tbSink.pSchemaWrapper;
    pTask->tbSink.pTSchema = tBuildTSchema(pschemaWrapper->pSchema, pschemaWrapper->nCols, ver1);
    if (pTask->tbSink.pTSchema == NULL) {
      return -1;
    }

    pTask->tbSink.pTblInfo = tSimpleHashInit(10240, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT));
    if (pTask->tbSink.pTblInfo == NULL) {
      tqError("s-task:%s failed to create the table info hash of table sink, initialize task failed",
              pTask->id.idStr);
      return -1;
    }
    tSimpleHashSetFreeFp(pTask->tbSink.pTblInfo, freePtr);
  }

  if (isSource) {
    SWalFilterCond cond = {.deleteMsg = 1};  // delete msg also extract from wal files
    pTask->exec.pWalReader = walOpenReader(pTq->pVnode->pWal, &cond);
    if (pTask->exec.pWalReader == NULL) {
      tqError("s-task:%s failed to open the wal reader, initialize task failed", pTask->id.idStr);
      return -1;
    }
  }

  // reset the task status from unfinished transaction
  if (pTask->status.taskStatus == TASK_STATUS__PAUSE) {
    tqWarn("s-task:%s reset task status to be normal, kept in meta status: Paused", pTask->id.idStr);
    pTask->status.taskStatus = TASK_STATUS__NORMAL;
  }

  taosThreadMutexInit(&pTask->lock, NULL);
  streamSetupScheduleTrigger(pTask);

  tqInfo("vgId:%d expand stream task, s-task:%s, checkpoint ver:%" PRId64
         " child id:%d, level:%d, fill-history:%d, trigger:%" PRId64 " ms, disable pause",
         vgId, pTask->id.idStr, pTask->chkInfo.version, pTask->info.selfChildId, pTask->info.taskLevel,
         pTask->info.fillHistory, pTask->triggerParam);

  // next valid version will add one
  pTask->chkInfo.version += 1;
  return 0;
}
L
Liu Jicong 已提交
1040

1041
// Handle a downstream-readiness check request sent by an upstream stream task.
//
// The request is decoded from the message body (after the SMsgHead). The response echoes the ids
// of the request; its status is the result of streamTaskCheckStatus() when the downstream task
// exists on this vnode and 0 when it has not been built yet. The response is sent through
// streamSendCheckRsp(), whose result is returned.
//
// Returns -1 with terrno = TSDB_CODE_INVALID_MSG when the request cannot be decoded.
int32_t tqProcessStreamTaskCheckReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  SStreamTaskCheckReq req = {0};
  SDecoder            decoder;

  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  int32_t decoded = tDecodeStreamTaskCheckReq(&decoder, &req);
  tDecoderClear(&decoder);

  if (decoded < 0) {
    // nothing trustworthy to answer: the ids needed for the response were not decoded
    tqError("vgId:%d failed to decode the stream task check req", pTq->pStreamMeta->vgId);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int32_t taskId = req.downstreamTaskId;

  SStreamTaskCheckRsp rsp = {
      .reqId = req.reqId,
      .streamId = req.streamId,
      .childId = req.childId,
      .downstreamNodeId = req.downstreamNodeId,
      .downstreamTaskId = req.downstreamTaskId,
      .upstreamNodeId = req.upstreamNodeId,
      .upstreamTaskId = req.upstreamTaskId,
  };

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.streamId, taskId);
  if (pTask != NULL) {
    rsp.status = streamTaskCheckStatus(pTask);

    const char* pStatus = streamGetTaskStatusStr(pTask->status.taskStatus);
    tqDebug("s-task:%s status:%s, recv task check req(reqId:0x%" PRIx64 ") task:0x%x (vgId:%d), ready:%d",
            pTask->id.idStr, pStatus, rsp.reqId, rsp.upstreamTaskId, rsp.upstreamNodeId, rsp.status);

    // release only after the last access to pTask
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  } else {
    rsp.status = 0;
    tqDebug("tq recv task check(taskId:0x%x not built yet) req(reqId:0x%" PRIx64 ") from task:0x%x (vgId:%d), rsp status %d",
            taskId, rsp.reqId, rsp.upstreamTaskId, rsp.upstreamNodeId, rsp.status);
  }

  return streamSendCheckRsp(pTq->pStreamMeta, &req, &rsp, &pMsg->info, taskId);
}

1082 1083 1084 1085
// Handle the response of a downstream-readiness check on the upstream side.
//
// The response is decoded from the message body (after the SMsgHead), the upstream task named in
// it is looked up in the stream meta and the response is passed to streamProcessCheckRsp().
//
// Returns the result of streamProcessCheckRsp(), or -1 when the message cannot be decoded or the
// upstream task no longer exists (terrno = TSDB_CODE_STREAM_TASK_NOT_EXIST in the latter case).
// sversion is not used here.
int32_t tqProcessStreamTaskCheckRsp(STQ* pTq, int64_t sversion, SRpcMsg* pMsg) {
  char*   pReq = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t len = pMsg->contLen - sizeof(SMsgHead);

  SStreamTaskCheckRsp rsp = {0};
  SDecoder            decoder;

  tDecoderInit(&decoder, (uint8_t*)pReq, len);
  int32_t code = tDecodeStreamTaskCheckRsp(&decoder, &rsp);
  tDecoderClear(&decoder);

  if (code < 0) {
    return -1;
  }

  tqDebug("tq task:0x%x (vgId:%d) recv check rsp(reqId:0x%" PRIx64 ") from 0x%x (vgId:%d) status %d",
          rsp.upstreamTaskId, rsp.upstreamNodeId, rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, rsp.status);

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, rsp.streamId, rsp.upstreamTaskId);
  if (pTask == NULL) {
    tqError("tq failed to locate the stream task:0x%x (vgId:%d), it may have been destroyed", rsp.upstreamTaskId,
            pTq->pStreamMeta->vgId);
    terrno = TSDB_CODE_STREAM_TASK_NOT_EXIST;
    return -1;
  }

  code = streamProcessCheckRsp(pTask, &rsp);
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return code;
}

1115
// Deploy a stream task on this vnode.
//
// The task is decoded from msg into a freshly allocated SStreamTask and registered in the stream
// meta under the meta write latch, using sversion as its start version. When the task was newly
// added, the check of its downstream tasks is started; when a task with the same id already
// exists, the decoded copy is freed and a warning is logged.
//
// Returns 0 on success (also when streams are disabled or the task already exists) and -1 when
// allocation, decoding or registration fails.
int32_t tqProcessTaskDeployReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  int32_t code = 0;
  int32_t vgId = TD_VID(pTq->pVnode);

  if (tsDisableStream) {
    return 0;
  }

  // 1.deserialize msg and build task
  SStreamTask* pTask = taosMemoryCalloc(1, sizeof(SStreamTask));
  if (pTask == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    tqError("vgId:%d failed to create stream task due to out of memory, alloc size:%d", vgId,
            (int32_t)sizeof(SStreamTask));
    return -1;
  }

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  code = tDecodeStreamTask(&decoder, pTask);
  tDecoderClear(&decoder);

  if (code < 0) {
    taosMemoryFree(pTask);
    return -1;
  }

  SStreamMeta* pStreamMeta = pTq->pStreamMeta;

  // 2.save task, use the newest commit version as the initial start version of stream task.
  int32_t taskId = pTask->id.taskId;
  bool    added = false;

  taosWLockLatch(&pStreamMeta->lock);
  code = streamMetaRegisterTask(pStreamMeta, sversion, pTask, &added);
  int32_t numOfTasks = streamMetaGetNumOfTasks(pStreamMeta);
  taosWUnLockLatch(&pStreamMeta->lock);

  if (code < 0) {
    tqError("vgId:%d failed to add s-task:0x%x, total:%d", vgId, taskId, numOfTasks);
    tFreeStreamTask(pTask);
    return -1;
  }

  if (added) {
    // newly added into the meta store: start checking the downstream tasks
    tqDebug("vgId:%d s-task:0x%x is deployed and add into meta, numOfTasks:%d", vgId, taskId, numOfTasks);
    SStreamTask* p = streamMetaAcquireTask(pStreamMeta, pTask->id.streamId, taskId);
    if (p != NULL) {  // reset the downstreamReady flag.
      streamTaskCheckDownstreamTasks(p);
      // release only what was actually acquired
      streamMetaReleaseTask(pStreamMeta, p);
    }
  } else {
    // a task with this id is already in the meta store: drop the decoded copy
    tqWarn("vgId:%d failed to add s-task:0x%x, already exists in meta store", vgId, taskId);
    tFreeStreamTask(pTask);
  }

  return 0;
}

1176
// Run the scan-history stage (step 1) of a stream task and prepare what follows it.
//
// The task named in the request is acquired from the stream meta and its sched-status is switched
// from INACTIVE to WAITING; if it is not INACTIVE the scan is considered already started and the
// function returns 0. After streamSourceScanHistoryData():
//   - if the task got paused, its sched-status is reset to INACTIVE and the function returns 0;
//   - for a fill-history task, the related stream task is halted once it has left the
//     SCAN_HISTORY status, the version range of step 2 is computed from the current version of
//     the stream task's WAL reader, and either the WAL scan is ended immediately or the WAL reader
//     of this task is positioned for the secondary scan and the stream tasks are started;
//   - for a normal stream task, the time window is reset when no fill-history task is related,
//     and streamTaskScanHistoryDataComplete() is invoked.
//
// Every exit path after a successful acquire releases the task reference again.
//
// Returns 0 on success, -1 when the task (or the related stream task of a fill-history task)
// cannot be found, or the result of streamTaskScanHistoryDataComplete() for normal stream tasks.
int32_t tqProcessTaskScanHistory(STQ* pTq, SRpcMsg* pMsg) {
  SStreamScanHistoryReq* pReq = (SStreamScanHistoryReq*)pMsg->pCont;
  SStreamMeta*           pMeta = pTq->pStreamMeta;

  int32_t      code = TSDB_CODE_SUCCESS;
  SStreamTask* pTask = streamMetaAcquireTask(pMeta, pReq->streamId, pReq->taskId);
  if (pTask == NULL) {
    tqError("vgId:%d failed to acquire stream task:0x%x during stream recover, task may have been destroyed",
            pMeta->vgId, pReq->taskId);
    return -1;
  }

  // do recovery step1
  const char* id = pTask->id.idStr;
  const char* pStatus = streamGetTaskStatusStr(pTask->status.taskStatus);
  tqDebug("s-task:%s start scan-history stage(step 1), status:%s", id, pStatus);

  if (pTask->tsInfo.step1Start == 0) {
    // first attempt: record the start time; only fill-history tasks may be paused from now on
    ASSERT(pTask->status.pauseAllowed == false);
    pTask->tsInfo.step1Start = taosGetTimestampMs();
    if (pTask->info.fillHistory == 1) {
      streamTaskEnablePause(pTask);
    }
  } else {
    tqDebug("s-task:%s resume from paused, start ts:%" PRId64, pTask->id.idStr, pTask->tsInfo.step1Start);
  }

  // we have to continue retrying to successfully execute the scan history task.
  int8_t schedStatus = atomic_val_compare_exchange_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE,
                                                     TASK_SCHED_STATUS__WAITING);
  if (schedStatus != TASK_SCHED_STATUS__INACTIVE) {
    tqError(
        "s-task:%s failed to start scan-history in first stream time window since already started, unexpected "
        "sched-status:%d",
        id, schedStatus);
    streamMetaReleaseTask(pMeta, pTask);
    return 0;
  }

  if (pTask->info.fillHistory == 1) {
    ASSERT(pTask->status.pauseAllowed == true);
  }

  streamSourceScanHistoryData(pTask);
  if (pTask->status.taskStatus == TASK_STATUS__PAUSE) {
    double el = (taosGetTimestampMs() - pTask->tsInfo.step1Start) / 1000.0;
    tqDebug("s-task:%s is paused in the step1, elapsed time:%.2fs, sched-status:%d", pTask->id.idStr, el,
            TASK_SCHED_STATUS__INACTIVE);
    atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);
    streamMetaReleaseTask(pMeta, pTask);
    return 0;
  }

  // the following procedure should be executed, no matter status is stop/pause or not
  double el = (taosGetTimestampMs() - pTask->tsInfo.step1Start) / 1000.0;
  tqDebug("s-task:%s scan-history stage(step 1) ended, elapsed time:%.2fs", id, el);

  if (pTask->info.fillHistory) {
    SVersionRange* pRange = NULL;
    SStreamTask*   pStreamTask = NULL;
    bool           done = false;

    // 1. get the related stream task
    pStreamTask = streamMetaAcquireTask(pMeta, pTask->streamTaskId.streamId, pTask->streamTaskId.taskId);
    if (pStreamTask == NULL) {
      // todo delete this task, if the related stream task is dropped
      tqError("failed to find s-task:0x%x, it may have been destroyed, drop fill-history task:%s",
              pTask->streamTaskId.taskId, pTask->id.idStr);

      tqDebug("s-task:%s fill-history task set status to be dropping", id);

      streamMetaUnregisterTask(pMeta, pTask->id.streamId, pTask->id.taskId);
      streamMetaReleaseTask(pMeta, pTask);
      return -1;
    }

    ASSERT(pStreamTask->info.taskLevel == TASK_LEVEL__SOURCE);

    // 2. it cannot be paused, when the stream task in TASK_STATUS__SCAN_HISTORY status. Let's wait for the
    // stream task get ready for scan history data
    while (pStreamTask->status.taskStatus == TASK_STATUS__SCAN_HISTORY) {
      tqDebug(
          "s-task:%s level:%d related stream task:%s(status:%s) not ready for halt, wait for it and recheck in 100ms",
          id, pTask->info.taskLevel, pStreamTask->id.idStr, streamGetTaskStatusStr(pStreamTask->status.taskStatus));
      taosMsleep(100);
    }

    // now we can stop the stream task execution
    streamTaskHalt(pStreamTask);

    tqDebug("s-task:%s level:%d sched-status:%d is halt by fill-history task:%s", pStreamTask->id.idStr,
            pStreamTask->info.taskLevel, pStreamTask->status.schedStatus, id);

    // if it's an source task, extract the last version in wal.
    pRange = &pTask->dataRange.range;
    int64_t latestVer = walReaderGetCurrentVer(pStreamTask->exec.pWalReader);
    done = streamHistoryTaskSetVerRangeStep2(pTask, latestVer);

    if (done) {
      // no WAL data left for step 2: finish the WAL scan right away
      pTask->tsInfo.step2Start = taosGetTimestampMs();
      streamTaskEndScanWAL(pTask);
    } else {
      STimeWindow* pWindow = &pTask->dataRange.window;
      tqDebug("s-task:%s level:%d verRange:%" PRId64 " - %" PRId64 " window:%" PRId64 "-%" PRId64
              ", do secondary scan-history from WAL after halt the related stream task:%s",
              id, pTask->info.taskLevel, pRange->minVer, pRange->maxVer, pWindow->skey, pWindow->ekey,
              pStreamTask->id.idStr);
      ASSERT(pTask->status.schedStatus == TASK_SCHED_STATUS__WAITING);

      pTask->tsInfo.step2Start = taosGetTimestampMs();
      streamSetParamForStreamScannerStep2(pTask, pRange, pWindow);

      // position the WAL reader one version before the first version of the step-2 range
      int64_t dstVer = pTask->dataRange.range.minVer - 1;

      pTask->chkInfo.currentVer = dstVer;
      walReaderSetSkipToVersion(pTask->exec.pWalReader, dstVer);
      tqDebug("s-task:%s wal reader start scan WAL verRange:%" PRId64 "-%" PRId64 ", set sched-status:%d", id, dstVer,
              pTask->dataRange.range.maxVer, TASK_SCHED_STATUS__INACTIVE);

      atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);

      // set the fill-history task to be normal
      if (pTask->info.fillHistory == 1) {
        streamSetStatusNormal(pTask);
      }

      tqStartStreamTasks(pTq);
    }

    streamMetaReleaseTask(pMeta, pTask);
    streamMetaReleaseTask(pMeta, pStreamTask);
  } else {
    // todo update the chkInfo version for current task.
    // this task has an associated history stream task, so we need to scan wal from the end version of
    // history scan. The current version of chkInfo.current is not updated during the history scan
    STimeWindow* pWindow = &pTask->dataRange.window;

    if (pTask->historyTaskId.taskId == 0) {
      *pWindow = (STimeWindow){INT64_MIN, INT64_MAX};
      tqDebug(
          "s-task:%s scan-history in stream time window completed, no related fill-history task, reset the time "
          "window:%" PRId64 " - %" PRId64,
          id, pWindow->skey, pWindow->ekey);
      qStreamInfoResetTimewindowFilter(pTask->exec.pExecutor);
    } else {
      // when related fill-history task exists, update the fill-history time window only when the
      // state transfer is completed.
      tqDebug(
          "s-task:%s scan-history in stream time window completed, now start to handle data from WAL, start "
          "ver:%" PRId64 ", window:%" PRId64 " - %" PRId64,
          id, pTask->chkInfo.currentVer, pWindow->skey, pWindow->ekey);
    }

    // notify the downstream agg tasks that upstream tasks are ready to processing the WAL data
    code = streamTaskScanHistoryDataComplete(pTask);
    streamMetaReleaseTask(pMeta, pTask);

    // when all source task complete to scan history data in stream time window, they are allowed to handle stream data
    // at the same time.
    return code;
  }

  return 0;
}

H
Haojun Liao 已提交
1339
// notify the downstream tasks to transfer executor state after handle all history blocks.
H
Haojun Liao 已提交
1340 1341 1342 1343 1344
int32_t tqProcessTaskTransferStateReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   pReq = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t len = pMsg->contLen - sizeof(SMsgHead);

  SStreamTransferReq req = {0};
H
Haojun Liao 已提交
1345

1346
  SDecoder decoder;
H
Haojun Liao 已提交
1347
  tDecoderInit(&decoder, (uint8_t*)pReq, len);
1348
  int32_t code = tDecodeStreamScanHistoryFinishReq(&decoder, &req);
H
Haojun Liao 已提交
1349
  tDecoderClear(&decoder);
H
Haojun Liao 已提交
1350

1351
  tqDebug("vgId:%d start to process transfer state msg, from s-task:0x%x", pTq->pStreamMeta->vgId, req.downstreamTaskId);
1352

1353
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.streamId, req.downstreamTaskId);
1354
  if (pTask == NULL) {
1355
    tqError("failed to find task:0x%x, it may have been dropped already. process transfer state failed", req.downstreamTaskId);
1356 1357 1358
    return -1;
  }

H
Haojun Liao 已提交
1359 1360
  int32_t remain = streamAlignTransferState(pTask);
  if (remain > 0) {
1361
    tqDebug("s-task:%s receive upstream transfer state msg, remain:%d", pTask->id.idStr, remain);
H
Haojun Liao 已提交
1362
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
H
Haojun Liao 已提交
1363 1364 1365
    return 0;
  }

L
liuyao 已提交
1366
  // transfer the ownership of executor state
1367 1368
  tqDebug("s-task:%s all upstream tasks send transfer msg, open transfer state flag", pTask->id.idStr);
  ASSERT(pTask->streamTaskId.taskId != 0 && pTask->info.fillHistory == 1);
1369

1370
  pTask->status.transferState = true;
L
Liu Jicong 已提交
1371

H
Haojun Liao 已提交
1372
  streamSchedExec(pTask);
L
Liu Jicong 已提交
1373
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
1374 1375 1376
  return 0;
}

1377
// Handle a "scan-history finished" request sent by an upstream task to a downstream task on this
// vnode.
//
// The request is decoded from the message body (after the SMsgHead), the downstream task is
// looked up in the stream meta and the request is passed to streamProcessScanHistoryFinishReq()
// together with the rpc info of the message.
//
// Returns the result of streamProcessScanHistoryFinishReq(), or -1 when the request cannot be
// decoded (terrno = TSDB_CODE_INVALID_MSG) or the downstream task cannot be found.
int32_t tqProcessTaskScanHistoryFinishReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msg = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  // deserialize
  SStreamScanHistoryFinishReq req = {0};

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decoded = tDecodeStreamScanHistoryFinishReq(&decoder, &req);
  tDecoderClear(&decoder);

  if (decoded < 0) {
    tqError("vgId:%d failed to decode the scan history finish msg", pTq->pStreamMeta->vgId);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.streamId, req.downstreamTaskId);
  if (pTask == NULL) {
    tqError("vgId:%d process scan history finish msg, failed to find task:0x%x, it may be destroyed",
            pTq->pStreamMeta->vgId, req.downstreamTaskId);
    return -1;
  }

  tqDebug("s-task:%s receive scan-history finish msg from task:0x%x", pTask->id.idStr, req.upstreamTaskId);

  int32_t code = streamProcessScanHistoryFinishReq(pTask, &req, &pMsg->info);
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return code;
}
L
Liu Jicong 已提交
1402

1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414
// Handle the response to a "scan-history finished" message on the upstream side.
//
// The response is decoded from the message body (after the SMsgHead) and the upstream task is
// looked up in the stream meta. Each response decrements the notReadyTasks counter of the task;
// when the counter reaches zero (or below), streamProcessScanHistoryFinishRsp() is invoked.
//
// Returns 0 on success, -1 when the response cannot be decoded (terrno = TSDB_CODE_INVALID_MSG)
// or the upstream task cannot be found.
int32_t tqProcessTaskScanHistoryFinishRsp(STQ* pTq, SRpcMsg* pMsg) {
  char*   msg = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  // deserialize
  SStreamCompleteHistoryMsg req = {0};

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decoded = tDecodeCompleteHistoryDataMsg(&decoder, &req);
  tDecoderClear(&decoder);

  if (decoded < 0) {
    tqError("vgId:%d failed to decode the scan history finish rsp", pTq->pStreamMeta->vgId);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.streamId, req.upstreamTaskId);
  if (pTask == NULL) {
    tqError("vgId:%d process scan history finish rsp, failed to find task:0x%x, it may be destroyed",
            pTq->pStreamMeta->vgId, req.upstreamTaskId);
    return -1;
  }

  // one more downstream task has answered
  int32_t remain = atomic_sub_fetch_32(&pTask->notReadyTasks, 1);
  if (remain > 0) {
    tqDebug("s-task:%s scan-history finish rsp received from downstream task:0x%x, remain:%d not send finish rsp",
            pTask->id.idStr, req.downstreamId, remain);
  } else {
    tqDebug(
        "s-task:%s scan-history finish rsp received from downstream task:0x%x, all downstream tasks rsp scan-history "
        "completed msg", pTask->id.idStr, req.downstreamId);
    streamProcessScanHistoryFinishRsp(pTask);
  }

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return 0;
}

1437 1438 1439 1440
// Build a STREAM_DELETE_DATA block from an encoded delete result.
//
// pData/len  - encoded SDeleteRes
// ver        - version stored in the info of the produced block
// pRefBlock  - out: set to NULL first; on success with at least one affected table it receives a
//              newly allocated queue item of type STREAM_INPUT__REF_DATA_BLOCK that references
//              the delete block. It stays NULL when the delete result lists no tables or
//              affected no rows.
//
// The block gets one row per table uid, carrying the start key, end key and uid of the delete;
// the group id and the two calculate-ts columns are set to NULL.
//
// Returns TSDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY when an allocation fails, or the error of
// blockDataEnsureCapacity(). On failure nothing allocated here is left behind.
int32_t extractDelDataBlock(const void* pData, int32_t len, int64_t ver, SStreamRefDataBlock** pRefBlock) {
  SDecoder*   pCoder = &(SDecoder){0};
  SDeleteRes* pRes = &(SDeleteRes){0};

  (*pRefBlock) = NULL;

  pRes->uidList = taosArrayInit(0, sizeof(tb_uid_t));
  if (pRes->uidList == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  tDecoderInit(pCoder, (uint8_t*)pData, len);
  tDecodeDeleteRes(pCoder, pRes);
  tDecoderClear(pCoder);

  int32_t numOfTables = taosArrayGetSize(pRes->uidList);
  if (numOfTables == 0 || pRes->affectedRows == 0) {
    taosArrayDestroy(pRes->uidList);
    return TSDB_CODE_SUCCESS;
  }

  SSDataBlock* pDelBlock = createSpecialDataBlock(STREAM_DELETE_DATA);
  if (pDelBlock == NULL) {
    taosArrayDestroy(pRes->uidList);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t code = blockDataEnsureCapacity(pDelBlock, numOfTables);
  if (code != TSDB_CODE_SUCCESS) {
    blockDataDestroy(pDelBlock);
    taosArrayDestroy(pRes->uidList);
    return code;
  }

  pDelBlock->info.rows = numOfTables;
  pDelBlock->info.version = ver;

  // the columns do not change while the rows are filled, so look them up once
  SColumnInfoData* pStartCol = taosArrayGet(pDelBlock->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pEndCol = taosArrayGet(pDelBlock->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pUidCol = taosArrayGet(pDelBlock->pDataBlock, UID_COLUMN_INDEX);
  SColumnInfoData* pGroupIdCol = taosArrayGet(pDelBlock->pDataBlock, GROUPID_COLUMN_INDEX);
  SColumnInfoData* pCalStartCol = taosArrayGet(pDelBlock->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX);
  SColumnInfoData* pCalEndCol = taosArrayGet(pDelBlock->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX);

  for (int32_t i = 0; i < numOfTables; i++) {
    int64_t* pUid = taosArrayGet(pRes->uidList, i);

    colDataSetVal(pStartCol, i, (const char*)&pRes->skey, false);  // start key column
    colDataSetVal(pEndCol, i, (const char*)&pRes->ekey, false);    // end key column
    colDataSetVal(pUidCol, i, (const char*)pUid, false);           // uid column

    colDataSetNULL(pGroupIdCol, i);
    colDataSetNULL(pCalStartCol, i);
    colDataSetNULL(pCalEndCol, i);
  }

  taosArrayDestroy(pRes->uidList);

  *pRefBlock = taosAllocateQitem(sizeof(SStreamRefDataBlock), DEF_QITEM, 0);
  if ((*pRefBlock) == NULL) {
    // the block has no owner yet, release it here
    blockDataDestroy(pDelBlock);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  (*pRefBlock)->type = STREAM_INPUT__REF_DATA_BLOCK;
  (*pRefBlock)->pBlock = pDelBlock;
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1490 1491
// Handle a "run" request for a stream task.
//
// Two reserved task ids trigger vnode-wide actions instead of running a single task:
//   STREAM_TASK_STATUS_CHECK_ID -> tqStreamTasksStatusCheck()
//   EXTRACT_DATA_FROM_WAL_ID    -> tqStreamTasksScanWal()
// For a regular task id, the task is acquired from the stream meta and, when its status is NORMAL
// or SCAN_HISTORY, streamProcessRunReq() is invoked on it; in any other status the request is
// ignored and the sched-status of the task is reset to INACTIVE. Afterwards the stream tasks are
// started through tqStartStreamTasks().
//
// Returns 0 on success and -1 when the task cannot be found.
int32_t tqProcessTaskRunReq(STQ* pTq, SRpcMsg* pMsg) {
  SStreamTaskRunReq* pReq = pMsg->pCont;

  int32_t taskId = pReq->taskId;
  int32_t vgId = TD_VID(pTq->pVnode);

  if (taskId == STREAM_TASK_STATUS_CHECK_ID) {
    tqStreamTasksStatusCheck(pTq);
    return 0;
  }

  if (taskId == EXTRACT_DATA_FROM_WAL_ID) {  // all tasks are extracted submit data from the wal
    tqStreamTasksScanWal(pTq);
    return 0;
  }

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->streamId, taskId);
  if (pTask == NULL) {
    // NOTE: pTask->status.schedStatus is not updated since it is not be handled by the run exec.
    // todo add one function to handle this
    tqError("vgId:%d failed to found s-task, taskId:0x%x may have been dropped", vgId, taskId);
    return -1;
  }

  // even in halt status, the data in inputQ must be processed
  int8_t st = pTask->status.taskStatus;
  if (st == TASK_STATUS__NORMAL || st == TASK_STATUS__SCAN_HISTORY) {
    tqDebug("vgId:%d s-task:%s start to process block from inputQ, last chk point:%" PRId64, vgId, pTask->id.idStr,
            pTask->chkInfo.version);
    streamProcessRunReq(pTask);
  } else {
    atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);
    tqDebug("vgId:%d s-task:%s ignore run req since not in ready state, status:%s, sched-status:%d", vgId,
            pTask->id.idStr, streamGetTaskStatusStr(pTask->status.taskStatus), pTask->status.schedStatus);
  }

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  tqStartStreamTasks(pTq);
  return 0;
}

L
Liu Jicong 已提交
1530
// Decode a stream dispatch request from the RPC payload (which follows an
// SMsgHead) and hand it to the destination stream task.
//
// pTq   - tq instance that owns the stream meta used for the task lookup
// pMsg  - incoming RPC message; pMsg->info is copied into the response skeleton
// exec  - forwarded unchanged to streamProcessDispatchMsg()
//
// Returns 0 when the task was found and the request was handed over, -1 when
// the payload cannot be decoded or the destination task does not exist.
int32_t tqProcessTaskDispatchReq(STQ* pTq, SRpcMsg* pMsg, bool exec) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  SStreamDispatchReq req = {0};

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  int32_t decodeRet = tDecodeStreamDispatchReq(&decoder, &req);
  // the decoder is only needed while decoding; always release it, as vnodeEnqueueStreamMsg() does
  tDecoderClear(&decoder);

  if (decodeRet < 0) {
    // NOTE(review): a partially decoded req is not released here, mirroring the decode-failure
    // path of vnodeEnqueueStreamMsg() - confirm whether tDeleteStreamDispatchReq() is needed.
    tqError("vgId:%d failed to decode stream dispatch req", TD_VID(pTq->pVnode));
    return -1;
  }

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.streamId, req.taskId);
  if (pTask == NULL) {
    // nobody will consume the request, release what the decoder allocated for it
    tDeleteStreamDispatchReq(&req);
    return -1;
  }

  SRpcMsg rsp = {.info = pMsg->info, .code = 0};
  streamProcessDispatchMsg(pTask, &req, &rsp, exec);
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return 0;
}

L
Liu Jicong 已提交
1553 1554
// Handle the response to a dispatch message previously sent by an upstream
// task hosted on this vnode.
//
// The response body follows an SMsgHead and carries its ids in network byte
// order: the error response built in vnodeEnqueueStreamMsg() stores streamId
// with htobe64() and the task ids with htonl(). Both ids are therefore
// converted back to host order before they are used for the task lookup.
//
// Returns 0 when the upstream task was found and the response was processed,
// TSDB_CODE_INVALID_MSG when the task does not exist.
int32_t tqProcessTaskDispatchRsp(STQ* pTq, SRpcMsg* pMsg) {
  SStreamDispatchRsp* pRsp = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t             taskId = ntohl(pRsp->upstreamTaskId);
  // htobe64() is its own inverse (byte swap or no-op), so it also converts big-endian -> host.
  // A local copy is used so that pRsp is passed on to streamProcessDispatchRsp() unmodified.
  int64_t             streamId = (int64_t)htobe64(pRsp->streamId);
  SStreamTask*        pTask = streamMetaAcquireTask(pTq->pStreamMeta, streamId, taskId);

  int32_t vgId = pTq->pStreamMeta->vgId;
  if (pTask == NULL) {
    tqDebug("vgId:%d failed to handle the dispatch rsp, since find task:0x%x failed", vgId, taskId);
    return TSDB_CODE_INVALID_MSG;
  }

  streamProcessDispatchRsp(pTask, pRsp, pMsg->code);
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return 0;
}
L
Liu Jicong 已提交
1568

1569
// Drop a stream task from this vnode's stream meta.
//
// msg is interpreted as an SVDropStreamTaskReq; sversion and msgLen are not
// used. A task that cannot be acquired is only logged as an error.
//
// Always returns 0.
int32_t tqProcessTaskDropReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SVDropStreamTaskReq* pDropReq = (SVDropStreamTaskReq*)msg;
  tqDebug("vgId:%d receive msg to drop stream task:0x%x", TD_VID(pTq->pVnode), pDropReq->taskId);

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pDropReq->streamId, pDropReq->taskId);
  if (pTask != NULL) {
    // unregister while the reference is still held, then drop that reference
    streamMetaUnregisterTask(pTq->pStreamMeta, pDropReq->streamId, pDropReq->taskId);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  } else {
    tqError("vgId:%d failed to acquire s-task:0x%x when dropping it", pTq->pStreamMeta->vgId, pDropReq->taskId);
  }

  return 0;
}
L
Liu Jicong 已提交
1582

5
54liuyao 已提交
1583 1584
// Pause a stream task and, when it has one, its related fill-history task.
//
// msg is interpreted as an SVPauseStreamTaskReq; sversion and msgLen are not
// used. A task (or fill-history task) that cannot be acquired is logged and
// treated as already paused.
//
// Always returns TSDB_CODE_SUCCESS.
int32_t tqProcessTaskPauseReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SVPauseStreamTaskReq* pPauseReq = (SVPauseStreamTaskReq*)msg;
  SStreamMeta*          pMeta = pTq->pStreamMeta;

  SStreamTask* pTask = streamMetaAcquireTask(pMeta, pPauseReq->streamId, pPauseReq->taskId);
  if (pTask == NULL) {
    tqError("vgId:%d process pause req, failed to acquire task:0x%x, it may have been dropped already", pMeta->vgId,
            pPauseReq->taskId);
    // since task is in [STOP|DROPPING] state, it is safe to assume the pause is active
    return TSDB_CODE_SUCCESS;
  }

  tqDebug("s-task:%s receive pause msg from mnode", pTask->id.idStr);
  streamTaskPause(pTask);

  // a history task id of 0 means there is no related fill-history task to pause
  if (pTask->historyTaskId.taskId != 0) {
    SStreamTask* pHistoryTask =
        streamMetaAcquireTask(pMeta, pTask->historyTaskId.streamId, pTask->historyTaskId.taskId);

    if (pHistoryTask != NULL) {
      tqDebug("s-task:%s fill-history task handle paused along with related stream task", pHistoryTask->id.idStr);
      streamTaskPause(pHistoryTask);
      streamMetaReleaseTask(pMeta, pHistoryTask);
    } else {
      // since task is in [STOP|DROPPING] state, it is safe to assume the pause is active
      tqError("vgId:%d process pause req, failed to acquire fill-history task:0x%x, it may have been dropped already",
              pMeta->vgId, pTask->historyTaskId.taskId);
    }
  }

  streamMetaReleaseTask(pMeta, pTask);
  return TSDB_CODE_SUCCESS;
}

// Resume one stream task and schedule its next piece of work.
//
// pTask       - task to resume; NULL is rejected with -1. On every other path
//               the reference is released through streamMetaReleaseTask()
//               before returning, so the caller must not use pTask afterwards.
// sversion    - vnode version; used as the WAL skip-to version when untreated
//               data is discarded, and printed in the debug logs
// igUntreated - when set, a non-fill-history source task discards the data
//               that arrived while it was suspended
//
// Returns 0 on success, -1 when pTask is NULL.
int32_t tqProcessTaskResumeImpl(STQ* pTq, SStreamTask* pTask, int64_t sversion, int8_t igUntreated) {
  int32_t vgId = pTq->pStreamMeta->vgId;
  if (pTask == NULL) {
    return -1;
  }

  // todo: handle the case: resume from halt to pause/ from halt to normal/ from pause to normal
  streamTaskResume(pTask);

  int32_t level = pTask->info.taskLevel;
  int8_t  status = pTask->status.taskStatus;
  bool    isSource = (level == TASK_LEVEL__SOURCE);

  // only a task that ended up in NORMAL or SCAN_HISTORY status gets scheduled again
  if (status != TASK_STATUS__NORMAL && status != TASK_STATUS__SCAN_HISTORY) {
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    return 0;
  }

  // no lock needs to secure the access of the version
  if (igUntreated && isSource && !pTask->info.fillHistory) {
    // discard all the data when the stream task is suspended.
    walReaderSetSkipToVersion(pTask->exec.pWalReader, sversion);
    tqDebug("vgId:%d s-task:%s resume to exec, prev paused version:%" PRId64 ", start from vnode ver:%" PRId64
            ", schedStatus:%d",
            vgId, pTask->id.idStr, pTask->chkInfo.currentVer, sversion, pTask->status.schedStatus);
  } else {
    // from the previous paused version and go on
    tqDebug("vgId:%d s-task:%s resume to exec, from paused ver:%" PRId64 ", vnode ver:%" PRId64 ", schedStatus:%d",
            vgId, pTask->id.idStr, pTask->chkInfo.currentVer, sversion, pTask->status.schedStatus);
  }

  if (isSource && pTask->info.fillHistory && pTask->status.taskStatus == TASK_STATUS__SCAN_HISTORY) {
    streamStartScanHistoryAsync(pTask, igUntreated);
  } else if (isSource && (taosQueueItemSize(pTask->inputQueue->queue) == 0)) {
    // source task with an empty input queue
    tqStartStreamTasks(pTq);
  } else {
    streamSchedExec(pTask);
  }

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return 0;
}

// Resume a stream task and, when one can be acquired, its related
// fill-history task.
//
// msg is interpreted as an SVResumeStreamTaskReq; msgLen is not used.
//
// tqProcessTaskResumeImpl() releases the task reference it is given, so the
// stream task must not be touched after it has been resumed. The fill-history
// task is therefore looked up first, while the stream task reference is still
// held.
//
// Returns -1 when the stream task cannot be acquired, otherwise the result of
// the last tqProcessTaskResumeImpl() call.
int32_t tqProcessTaskResumeReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SVResumeStreamTaskReq* pReq = (SVResumeStreamTaskReq*)msg;
  SStreamMeta*           pMeta = pTq->pStreamMeta;

  SStreamTask* pTask = streamMetaAcquireTask(pMeta, pReq->streamId, pReq->taskId);
  if (pTask == NULL) {
    return -1;
  }

  // read pTask->historyTaskId now: pTask is released inside tqProcessTaskResumeImpl() below
  SStreamTask* pHistoryTask =
      streamMetaAcquireTask(pMeta, pTask->historyTaskId.streamId, pTask->historyTaskId.taskId);

  int32_t code = tqProcessTaskResumeImpl(pTq, pTask, sversion, pReq->igUntreated);
  pTask = NULL;  // reference handed over, do not use it any more

  if (code != 0) {
    // the history task is not going to be resumed, give back its reference
    if (pHistoryTask != NULL) {
      streamMetaReleaseTask(pMeta, pHistoryTask);
    }
    return code;
  }

  if (pHistoryTask != NULL) {
    code = tqProcessTaskResumeImpl(pTq, pHistoryTask, sversion, pReq->igUntreated);
  }

  return code;
}

L
Liu Jicong 已提交
1673
// Decode a stream retrieve request from the RPC payload (which follows an
// SMsgHead) and pass it to the destination stream task.
//
// The decoded request is always released with tDeleteStreamRetrieveReq()
// before returning. It is zero-initialized so that this release never sees
// indeterminate fields when decoding stops early.
//
// Returns 0 when the destination task was found and the request was processed,
// -1 when the payload cannot be decoded or the task does not exist.
int32_t tqProcessTaskRetrieveReq(STQ* pTq, SRpcMsg* pMsg) {
  char*    msgStr = pMsg->pCont;
  char*    msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t  msgLen = pMsg->contLen - sizeof(SMsgHead);
  SDecoder decoder;

  SStreamRetrieveReq req = {0};
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  // NOTE(review): assumes a negative return means decode failure, like tDecodeStreamDispatchReq() - confirm
  int32_t decodeRet = tDecodeStreamRetrieveReq(&decoder, &req);
  tDecoderClear(&decoder);

  int32_t code = -1;
  if (decodeRet >= 0) {
    SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.streamId, req.dstTaskId);
    if (pTask != NULL) {
      SRpcMsg rsp = {.info = pMsg->info, .code = 0};
      streamProcessRetrieveReq(pTask, &req, &rsp);
      streamMetaReleaseTask(pTq->pStreamMeta, pTask);
      code = 0;
    }
  } else {
    tqError("vgId:%d failed to decode stream retrieve req", TD_VID(pTq->pVnode));
  }

  tDeleteStreamRetrieveReq(&req);
  return code;
}

// Handler for stream retrieve responses. Currently a stub: both arguments are
// ignored and success (0) is reported unconditionally.
int32_t tqProcessTaskRetrieveRsp(STQ* pTq, SRpcMsg* pMsg) {
  (void)pTq;
  (void)pMsg;
  return 0;
}
L
Liu Jicong 已提交
1703

1704 1705 1706 1707 1708 1709
// Decode a stream dispatch request and hand it to the destination stream task
// of this vnode.
//
// On success the request is passed to streamProcessDispatchMsg(), then
// pMsg->pCont and the queue item pMsg are freed and 0 is returned.
//
// On failure (payload cannot be decoded, or the destination task does not
// exist) an error SStreamDispatchRsp is sent back to the upstream node, then
// pMsg->pCont and pMsg are freed and -1 is returned. When the message carries
// no rpc handle no response can be sent and -1 is returned immediately.
//
// `req` and `taskId` are initialized up front because the FAIL path reads them
// even when decoding failed before they could be filled in.
int32_t vnodeEnqueueStreamMsg(SVnode* pVnode, SRpcMsg* pMsg) {
  STQ*      pTq = pVnode->pTq;
  SMsgHead* msgStr = pMsg->pCont;
  char*     msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t   msgLen = pMsg->contLen - sizeof(SMsgHead);
  int32_t   code = 0;
  int32_t   taskId = 0;

  SStreamTask*       pTask = NULL;
  SStreamDispatchReq req = {0};
  SDecoder           decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  if (tDecodeStreamDispatchReq(&decoder, &req) < 0) {
    code = TSDB_CODE_MSG_DECODE_ERROR;
    tDecoderClear(&decoder);
    goto FAIL;
  }
  tDecoderClear(&decoder);

  taskId = req.taskId;
  pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.streamId, req.taskId);
  if (pTask != NULL) {
    SRpcMsg rsp = {.info = pMsg->info, .code = 0};
    streamProcessDispatchMsg(pTask, &req, &rsp, false);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    rpcFreeCont(pMsg->pCont);
    taosFreeQitem(pMsg);
    return 0;
  }

  // no task will consume the request: release its payload, the scalar ids are still used below
  tDeleteStreamDispatchReq(&req);
  code = TSDB_CODE_STREAM_TASK_NOT_EXIST;

FAIL:
  if (pMsg->info.handle == NULL) {
    // NOTE(review): pMsg->pCont and pMsg are not freed on this path, unlike every other exit - confirm
    // that the caller keeps ownership of the message in this case.
    tqError("s-task:0x%x vgId:%d msg handle is null, abort enqueue dispatch msg", taskId, pTq->pStreamMeta->vgId);
    return -1;
  }

  SMsgHead* pRspHead = rpcMallocCont(sizeof(SMsgHead) + sizeof(SStreamDispatchRsp));
  if (pRspHead == NULL) {
    // no memory for a response body: answer with a bare out-of-memory code instead
    SRpcMsg rsp = {.code = TSDB_CODE_OUT_OF_MEMORY, .info = pMsg->info};
    tqError("s-task:0x%x send dispatch error rsp, code:%s", taskId, tstrerror(rsp.code));
    tmsgSendRsp(&rsp);
    rpcFreeCont(pMsg->pCont);
    taosFreeQitem(pMsg);
    return -1;
  }

  // all ids travel in network byte order
  pRspHead->vgId = htonl(req.upstreamNodeId);
  SStreamDispatchRsp* pRsp = POINTER_SHIFT(pRspHead, sizeof(SMsgHead));
  pRsp->streamId = htobe64(req.streamId);
  pRsp->upstreamTaskId = htonl(req.upstreamTaskId);
  pRsp->upstreamNodeId = htonl(req.upstreamNodeId);
  pRsp->downstreamNodeId = htonl(pVnode->config.vgId);
  pRsp->downstreamTaskId = htonl(req.taskId);
  pRsp->inputStatus = TASK_OUTPUT_STATUS__NORMAL;

  int32_t len = sizeof(SMsgHead) + sizeof(SStreamDispatchRsp);
  SRpcMsg rsp = {.code = code, .info = pMsg->info, .contLen = len, .pCont = pRspHead};
  tqError("s-task:0x%x send dispatch error rsp, code:%s", taskId, tstrerror(code));

  tmsgSendRsp(&rsp);
  rpcFreeCont(pMsg->pCont);
  taosFreeQitem(pMsg);
  return -1;
}
L
Liu Jicong 已提交
1771

1772
// Compare sversion against pTq->walLogLastVer.
// Returns 1 when sversion is not greater than pTq->walLogLastVer, 0 otherwise.
int32_t tqCheckLogInWal(STQ* pTq, int64_t sversion) {
  if (sversion <= pTq->walLogLastVer) {
    return 1;
  }
  return 0;
}
1773