tq.c 46.6 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
S
Shengliang Guan 已提交
14 15
 */

H
Hongze Cheng 已提交
16
#include "tq.h"
S
Shengliang Guan 已提交
17

dengyihao's avatar
dengyihao 已提交
18 19 20
// 0: not init
// 1: already inited
// 2: waiting to be initialized or cleaned up
21
#define WAL_READ_TASKS_ID       (-1)
22

23 24
static int32_t tqInitialize(STQ* pTq);

L
Liu Jicong 已提交
25
/**
 * Initialize the process-wide TQ module (timer and stream subsystem) once.
 *
 * tqMgmt.inited is used as a small state machine:
 *   0 - not initialized, 1 - initialized, 2 - an init/cleanup is in progress.
 *
 * @return 0 on success or when the module was already initialized, -1 on failure.
 *         On failure the state is rolled back to 0 so that a later call may retry.
 */
int32_t tqInit() {
  int8_t old;
  // Spin while another thread holds the transitional state (2).
  while (1) {
    old = atomic_val_compare_exchange_8(&tqMgmt.inited, 0, 2);
    if (old != 2) break;
  }

  if (old == 0) {
    tqMgmt.timer = taosTmrInit(10000, 100, 10000, "TQ");
    if (tqMgmt.timer == NULL) {
      atomic_store_8(&tqMgmt.inited, 0);
      return -1;
    }

    if (streamInit() < 0) {
      // Undo the partial initialization. Leaving the state at 2 would make every
      // subsequent tqInit()/tqCleanUp() spin forever in the loop above.
      taosTmrCleanUp(tqMgmt.timer);
      tqMgmt.timer = NULL;
      atomic_store_8(&tqMgmt.inited, 0);
      return -1;
    }

    atomic_store_8(&tqMgmt.inited, 1);
  }

  return 0;
}
L
Liu Jicong 已提交
46

47
/**
 * Tear down the process-wide TQ module if it is currently initialized.
 *
 * Moves tqMgmt.inited from 1 to the transitional value 2, releases the timer
 * and the stream subsystem, then stores 0. Does nothing when the module is
 * not in the initialized state.
 */
void tqCleanUp() {
  int8_t prev;

  // Retry while another thread is in the middle of init/cleanup (state 2).
  do {
    prev = atomic_val_compare_exchange_8(&tqMgmt.inited, 1, 2);
  } while (prev == 2);

  if (prev != 1) {
    return;
  }

  taosTmrCleanUp(tqMgmt.timer);
  streamCleanUp();
  atomic_store_8(&tqMgmt.inited, 0);
}
L
Liu Jicong 已提交
60

61
static void destroyTqHandle(void* data) {
62 63 64
  STqHandle* pData = (STqHandle*)data;
  qDestroyTask(pData->execHandle.task);
  if (pData->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
L
Liu Jicong 已提交
65
    taosMemoryFreeClear(pData->execHandle.execCol.qmsg);
66
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__DB) {
67
    tqCloseReader(pData->execHandle.pTqReader);
68 69
    walCloseReader(pData->pWalReader);
    taosHashCleanup(pData->execHandle.execDb.pFilterOutTbUid);
L
Liu Jicong 已提交
70
  } else if (pData->execHandle.subType == TOPIC_SUB_TYPE__TABLE) {
71
    walCloseReader(pData->pWalReader);
72
    tqCloseReader(pData->execHandle.pTqReader);
73
  }
74 75 76 77
  if(pData->msg != NULL) {
    rpcFreeCont(pData->msg->pCont);
    taosMemoryFree(pData->msg);
    pData->msg = NULL;
H
Haojun Liao 已提交
78
  }
L
Liu Jicong 已提交
79 80
}

81 82 83 84 85
/**
 * Compare two offsets by WAL version.
 *
 * @return true only when both offsets are of type TMQ_OFFSET__LOG and the
 *         left version is less than or equal to the right version.
 */
static bool tqOffsetLessOrEqual(const STqOffset* pLeft, const STqOffset* pRight) {
  if (pLeft->val.type != TMQ_OFFSET__LOG || pRight->val.type != TMQ_OFFSET__LOG) {
    return false;
  }

  return pLeft->val.version <= pRight->val.version;
}

L
Liu Jicong 已提交
86
/**
 * Allocate and open a TQ instance for a vnode.
 *
 * @param path   directory path of the TQ; a private copy is stored in the instance.
 * @param pVnode owning vnode; its WAL last version is recorded in walLogLastVer.
 * @return the new STQ on success, NULL on failure. terrno is set to
 *         TSDB_CODE_OUT_OF_MEMORY when an allocation fails.
 */
STQ* tqOpen(const char* path, SVnode* pVnode) {
  STQ* pTq = taosMemoryCalloc(1, sizeof(STQ));
  if (pTq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pTq->path = taosStrdup(path);
  pTq->pVnode = pVnode;
  pTq->walLogLastVer = pVnode->pWal->vers.lastVer;

  taosInitRWLatch(&pTq->lock);

  pTq->pHandle = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);
  pTq->pPushMgr = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
  pTq->pCheckInfo = taosHashInit(64, MurmurHash3_32, true, HASH_ENTRY_LOCK);

  // Fail fast when any allocation above failed instead of using a NULL path or
  // hash table later on.
  // NOTE(review): this reuses tqClose() for cleanup, exactly like the existing
  // tqInitialize() failure path below, so it relies on tqClose() tolerating
  // members that were never opened - confirm.
  if (pTq->path == NULL || pTq->pHandle == NULL || pTq->pPushMgr == NULL || pTq->pCheckInfo == NULL) {
    tqClose(pTq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  taosHashSetFreeFp(pTq->pHandle, destroyTqHandle);
  taosHashSetFreeFp(pTq->pCheckInfo, (FDelete)tDeleteSTqCheckInfo);

  int32_t code = tqInitialize(pTq);
  if (code != TSDB_CODE_SUCCESS) {
    tqClose(pTq);
    return NULL;
  }

  return pTq;
}

/**
 * Open the persistent parts of a TQ instance: the meta store, the offset
 * store and the stream meta, then load the stream tasks.
 *
 * @param pTq the TQ instance being opened.
 * @return 0 on success, -1 as soon as any step fails. Already opened parts are
 *         left in place for the caller to release.
 */
int32_t tqInitialize(STQ* pTq) {
  if (tqMetaOpen(pTq) < 0) return -1;

  pTq->pOffsetStore = tqOffsetOpen(pTq);
  if (pTq->pOffsetStore == NULL) return -1;

  pTq->pStreamMeta = streamMetaOpen(pTq->path, pTq, (FTaskExpand*)tqExpandTask, pTq->pVnode->config.vgId);
  if (pTq->pStreamMeta == NULL) return -1;

  // the version is kept in task's meta data
  // todo check if this version is required or not
  return (streamLoadTasks(pTq->pStreamMeta, walGetCommittedVer(pTq->pVnode->pWal)) < 0) ? -1 : 0;
}
L
Liu Jicong 已提交
138

L
Liu Jicong 已提交
139
/**
 * Release every resource owned by a TQ instance and free the instance.
 *
 * @param pTq instance to close; NULL is accepted and ignored.
 */
void tqClose(STQ* pTq) {
  if (pTq != NULL) {
    // in-memory stores
    tqOffsetClose(pTq->pOffsetStore);
    taosHashCleanup(pTq->pHandle);
    taosHashCleanup(pTq->pPushMgr);
    taosHashCleanup(pTq->pCheckInfo);
    taosMemoryFree(pTq->path);

    // persistent stores
    tqMetaClose(pTq);
    streamMetaClose(pTq->pStreamMeta);

    taosMemoryFree(pTq);
  }
}
L
Liu Jicong 已提交
153

H
Haojun Liao 已提交
154 155 156
/**
 * Mark every stream task of this TQ as stopped and kill its executor.
 *
 * Runs under the write lock of the stream meta. The time spent killing each
 * task is logged at debug level.
 *
 * @param pTq TQ instance; NULL is accepted and ignored.
 */
void tqNotifyClose(STQ* pTq) {
  if (pTq == NULL) {
    return;
  }

  taosWLockLatch(&pTq->pStreamMeta->lock);

  for (void* pIter = taosHashIterate(pTq->pStreamMeta->pTasks, NULL); pIter != NULL;
       pIter = taosHashIterate(pTq->pStreamMeta->pTasks, pIter)) {
    // each hash entry stores a pointer to the task
    SStreamTask* pTask = *(SStreamTask**)pIter;
    tqDebug("vgId:%d s-task:%s set dropping flag", pTq->pStreamMeta->vgId, pTask->id.idStr);
    pTask->status.taskStatus = TASK_STATUS__STOP;

    int64_t startMs = taosGetTimestampMs();
    qKillTask(pTask->exec.pExecutor, TSDB_CODE_SUCCESS);
    int64_t elapsedMs = taosGetTimestampMs() - startMs;
    tqDebug("vgId:%d s-task:%s is closed in %" PRId64 "ms", pTq->pStreamMeta->vgId, pTask->id.idStr, elapsedMs);
  }

  taosWUnLockLatch(&pTq->pStreamMeta->lock);
}

H
Haojun Liao 已提交
179 180
static int32_t doSendDataRsp(const SRpcHandleInfo* pRpcHandleInfo, const SMqDataRsp* pRsp, int32_t epoch,
                             int64_t consumerId, int32_t type) {
L
Liu Jicong 已提交
181 182
  int32_t len = 0;
  int32_t code = 0;
H
Haojun Liao 已提交
183 184

  if (type == TMQ_MSG_TYPE__POLL_RSP) {
H
Haojun Liao 已提交
185
    tEncodeSize(tEncodeMqDataRsp, pRsp, len, code);
H
Haojun Liao 已提交
186 187 188
  } else if (type == TMQ_MSG_TYPE__TAOSX_RSP) {
    tEncodeSize(tEncodeSTaosxRsp, (STaosxRsp*)pRsp, len, code);
  }
189

L
Liu Jicong 已提交
190 191 192 193 194 195 196 197 198 199
  if (code < 0) {
    return -1;
  }

  int32_t tlen = sizeof(SMqRspHead) + len;
  void*   buf = rpcMallocCont(tlen);
  if (buf == NULL) {
    return -1;
  }

H
Haojun Liao 已提交
200 201 202
  ((SMqRspHead*)buf)->mqMsgType = type;
  ((SMqRspHead*)buf)->epoch = epoch;
  ((SMqRspHead*)buf)->consumerId = consumerId;
L
Liu Jicong 已提交
203 204 205 206 207

  void* abuf = POINTER_SHIFT(buf, sizeof(SMqRspHead));

  SEncoder encoder = {0};
  tEncoderInit(&encoder, abuf, len);
H
Haojun Liao 已提交
208 209

  if (type == TMQ_MSG_TYPE__POLL_RSP) {
H
Haojun Liao 已提交
210
    tEncodeMqDataRsp(&encoder, pRsp);
H
Haojun Liao 已提交
211
  } else if (type == TMQ_MSG_TYPE__TAOSX_RSP) {
X
Xiaoyu Wang 已提交
212
    tEncodeSTaosxRsp(&encoder, (STaosxRsp*)pRsp);
H
Haojun Liao 已提交
213 214
  }

L
Liu Jicong 已提交
215 216 217
  tEncoderClear(&encoder);

  SRpcMsg rsp = {
H
Haojun Liao 已提交
218
      .info = *pRpcHandleInfo,
L
Liu Jicong 已提交
219 220 221 222 223 224 225 226 227
      .pCont = buf,
      .contLen = tlen,
      .code = 0,
  };

  tmsgSendRsp(&rsp);
  return 0;
}

H
Haojun Liao 已提交
228
/**
 * Push an (otherwise empty) poll response to the consumer recorded in the
 * handle, replying to the rpc message cached in pHandle->msg.
 *
 * @param pHandle subscription handle providing consumer id, epoch and the cached message.
 * @param vgId    vgroup id, used for logging only.
 * @return always 0.
 */
int32_t tqPushDataRsp(STqHandle* pHandle, int32_t vgId) {
  SMqDataRsp dataRsp = {
      .head.consumerId = pHandle->consumerId,
      .head.epoch = pHandle->epoch,
      .head.mqMsgType = TMQ_MSG_TYPE__POLL_RSP,
  };

  // valid WAL version range of the reader, forwarded with the response
  int64_t sver = 0;
  int64_t ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);
  tqDoSendDataRsp(&pHandle->msg->info, &dataRsp, pHandle->epoch, pHandle->consumerId, TMQ_MSG_TYPE__POLL_RSP, sver, ever);

  char reqOffsetStr[80] = {0};
  char rspOffsetStr[80] = {0};
  tFormatOffset(reqOffsetStr, tListLen(reqOffsetStr), &dataRsp.reqOffset);
  tFormatOffset(rspOffsetStr, tListLen(rspOffsetStr), &dataRsp.rspOffset);
  tqDebug("vgId:%d, from consumer:0x%" PRIx64 " (epoch %d) push rsp, block num: %d, req:%s, rsp:%s",
          vgId, dataRsp.head.consumerId, dataRsp.head.epoch, dataRsp.blockNum, reqOffsetStr, rspOffsetStr);
  return 0;
}

247 248 249 250 251 252
/**
 * Send a data response for a poll request and log the request/response offsets.
 *
 * @param pHandle subscription handle; its reader supplies the valid WAL version range.
 * @param pMsg    rpc message being answered.
 * @param pReq    decoded poll request (epoch, consumer id, request id).
 * @param pRsp    response to send.
 * @param type    response message type.
 * @param vgId    vgroup id, used for logging only.
 * @return always 0.
 */
int32_t tqSendDataRsp(STqHandle* pHandle, const SRpcMsg* pMsg, const SMqPollReq* pReq, const SMqDataRsp* pRsp,
                      int32_t type, int32_t vgId) {
  int64_t sver = 0;
  int64_t ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);

  tqDoSendDataRsp(&pMsg->info, pRsp, pReq->epoch, pReq->consumerId, type, sver, ever);

  char reqOffsetStr[80] = {0};
  char rspOffsetStr[80] = {0};
  tFormatOffset(reqOffsetStr, sizeof(reqOffsetStr), &pRsp->reqOffset);
  tFormatOffset(rspOffsetStr, sizeof(rspOffsetStr), &pRsp->rspOffset);

  tqDebug("vgId:%d consumer:0x%" PRIx64 " (epoch %d) send rsp, block num:%d, req:%s, rsp:%s, reqId:0x%" PRIx64,
          vgId, pReq->consumerId, pReq->epoch, pRsp->blockNum, reqOffsetStr, rspOffsetStr, pReq->reqId);

  return 0;
}

265
/**
 * Handle an offset-commit request: decode it, persist the new offset unless it
 * is not ahead of the saved one, and move the handle's WAL reference forward.
 *
 * @param pTq      TQ instance.
 * @param sversion version associated with this request; a committed log
 *                 version equal to sversion - 1 is bumped to sversion.
 * @param msg      encoded SMqVgOffset.
 * @param msgLen   length of msg in bytes.
 * @return 0 on success (including "nothing to update"), -1 on decode failure,
 *         invalid offset type, or a failure to write the offset / move the
 *         WAL reference.
 */
int32_t tqProcessOffsetCommitReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SMqVgOffset vgOffset = {0};
  int32_t     vgId = TD_VID(pTq->pVnode);

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decodeRes = tDecodeMqVgOffset(&decoder, &vgOffset);
  // Always release the decoder, also when decoding failed.
  tDecoderClear(&decoder);
  if (decodeRes < 0) {
    return -1;
  }

  STqOffset* pOffset = &vgOffset.offset;

  if (pOffset->val.type == TMQ_OFFSET__SNAPSHOT_DATA || pOffset->val.type == TMQ_OFFSET__SNAPSHOT_META) {
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:snapshot) uid:%" PRId64 ", ts:%" PRId64,
            pOffset->subKey, vgId, pOffset->val.uid, pOffset->val.ts);
  } else if (pOffset->val.type == TMQ_OFFSET__LOG) {
    tqDebug("receive offset commit msg to %s on vgId:%d, offset(type:log) version:%" PRId64, pOffset->subKey, vgId,
            pOffset->val.version);
    if (pOffset->val.version + 1 == sversion) {
      pOffset->val.version += 1;
    }
  } else {
    tqError("invalid commit offset type:%d", pOffset->val.type);
    return -1;
  }

  STqOffset* pSavedOffset = tqOffsetRead(pTq->pOffsetStore, pOffset->subKey);
  if (pSavedOffset != NULL && tqOffsetLessOrEqual(pOffset, pSavedOffset)) {
    tqDebug("not update the offset, vgId:%d sub:%s since committed:%" PRId64 " less than/equal to existed:%" PRId64,
            vgId, pOffset->subKey, pOffset->val.version, pSavedOffset->val.version);
    return 0;  // no need to update the offset value
  }

  // save the new offset value
  if (tqOffsetWrite(pTq->pOffsetStore, pOffset) < 0) {
    return -1;
  }

  // for log offsets, also move the WAL reference held by the handle (if any)
  if (pOffset->val.type == TMQ_OFFSET__LOG) {
    STqHandle* pHandle = taosHashGet(pTq->pHandle, pOffset->subKey, strlen(pOffset->subKey));
    if (pHandle && (walRefVer(pHandle->pRef, pOffset->val.version) < 0)) {
      return -1;
    }
  }

  return 0;
}

315
/**
 * Handle a seek request: validate it against the subscription handle and the
 * saved offset, clamp the target version into the valid WAL range and persist it.
 *
 * @param pTq      TQ instance.
 * @param sversion version associated with this request (not used here).
 * @param msg      encoded SMqVgOffset.
 * @param msgLen   length of msg in bytes.
 * @return 0 on success or when no update is needed; -1 on decode failure,
 *         non-log offset type, unknown subKey (terrno = TSDB_CODE_INVALID_MSG),
 *         consumer mismatch (terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH) or a
 *         failure to write the offset.
 */
int32_t tqProcessSeekReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SMqVgOffset vgOffset = {0};
  int32_t     vgId = TD_VID(pTq->pVnode);

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decodeRes = tDecodeMqVgOffset(&decoder, &vgOffset);
  // Always release the decoder, also when decoding failed.
  tDecoderClear(&decoder);
  if (decodeRes < 0) {
    return -1;
  }

  STqOffset* pOffset = &vgOffset.offset;
  if (pOffset->val.type != TMQ_OFFSET__LOG) {
    tqError("vgId:%d, subKey:%s invalid seek offset type:%d", vgId, pOffset->subKey, pOffset->val.type);
    return -1;
  }

  // 1. find the handle
  STqHandle* pHandle = taosHashGet(pTq->pHandle, pOffset->subKey, strlen(pOffset->subKey));
  if (pHandle == NULL) {
    tqError("tmq seek: consumer:0x%" PRIx64 " vgId:%d subkey %s not found", vgOffset.consumerId, vgId,
        pOffset->subKey);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  // 2. check consumer-vg assignment status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != vgOffset.consumerId) {
    tqDebug("ERROR tmq seek: consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            vgOffset.consumerId, vgId, pOffset->subKey, pHandle->consumerId);
    terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    taosRUnLockLatch(&pTq->lock);
    return -1;
  }
  taosRUnLockLatch(&pTq->lock);

  // 3. check the offset info
  STqOffset* pSavedOffset = tqOffsetRead(pTq->pOffsetStore, pOffset->subKey);
  if (pSavedOffset != NULL) {
    if (pSavedOffset->val.type != TMQ_OFFSET__LOG) {
      tqError("invalid saved offset type, vgId:%d sub:%s", vgId, pOffset->subKey);
      return 0;  // no need to update the offset value
    }

    if (pSavedOffset->val.version == pOffset->val.version) {
      tqDebug("vgId:%d subKey:%s no need to seek to %" PRId64 " prev offset:%" PRId64, vgId, pOffset->subKey,
              pOffset->val.version, pSavedOffset->val.version);
      return 0;
    }
  }

  // 4. clamp the requested version into the valid WAL range [sver, ever]
  int64_t sver = 0, ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);
  if (pOffset->val.version < sver) {
    pOffset->val.version = sver;
  } else if (pOffset->val.version > ever) {
    pOffset->val.version = ever;
  }

  // save the new offset value
  if (pSavedOffset != NULL) {
    tqDebug("vgId:%d sub:%s seek to:%" PRId64 " prev offset:%" PRId64, vgId, pOffset->subKey, pOffset->val.version,
            pSavedOffset->val.version);
  } else {
    tqDebug("vgId:%d sub:%s seek to:%"PRId64" not saved yet", vgId, pOffset->subKey, pOffset->val.version);
  }

  if (tqOffsetWrite(pTq->pOffsetStore, pOffset) < 0) {
    tqError("failed to save offset, vgId:%d sub:%s seek to %" PRId64, vgId, pOffset->subKey, pOffset->val.version);
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
391
/**
 * Check whether a column of a table may be modified, i.e. whether it is not
 * listed in any check-info entry registered for that table.
 *
 * @param pTq   TQ instance holding the check-info table.
 * @param tbUid uid of the table being altered.
 * @param colId id of the column being altered.
 * @return 0 when the column is not listed, -1 when some entry for tbUid lists it.
 */
int32_t tqCheckColModifiable(STQ* pTq, int64_t tbUid, int32_t colId) {
  for (void* pIter = taosHashIterate(pTq->pCheckInfo, NULL); pIter != NULL;
       pIter = taosHashIterate(pTq->pCheckInfo, pIter)) {
    STqCheckInfo* pCheck = (STqCheckInfo*)pIter;
    if (pCheck->ntbUid != tbUid) {
      continue;
    }

    int32_t numOfCols = taosArrayGetSize(pCheck->colIdList);
    for (int32_t idx = 0; idx < numOfCols; ++idx) {
      int16_t forbidColId = *(int16_t*)taosArrayGet(pCheck->colIdList, idx);
      if (forbidColId == colId) {
        // leaving the iteration early: cancel it before returning
        taosHashCancelIterate(pTq->pCheckInfo, pIter);
        return -1;
      }
    }
  }

  return 0;
}

417
/**
 * Handle a consumer poll request: locate the subscription handle, verify the
 * consumer owns it, raise the handle's epoch if the request carries a newer
 * one, then extract data for the consumer.
 *
 * @param pTq  TQ instance.
 * @param pMsg rpc message carrying a serialized SMqPollReq.
 * @return the result of tqExtractDataForMq(); -1 when the request cannot be
 *         deserialized or the subKey is unknown (terrno = TSDB_CODE_INVALID_MSG),
 *         or when the consumer does not match the handle
 *         (terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH).
 */
int32_t tqProcessPollReq(STQ* pTq, SRpcMsg* pMsg) {
  SMqPollReq req = {0};
  if (tDeserializeSMqPollReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pMsg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int32_t      vgId = TD_VID(pTq->pVnode);
  int64_t      consumerId = req.consumerId;
  int32_t      reqEpoch = req.epoch;
  STqOffsetVal reqOffset = req.reqOffset;

  // 1. find handle
  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
  if (pHandle == NULL) {
    tqError("tmq poll: consumer:0x%" PRIx64 " vgId:%d subkey %s not found", consumerId, vgId, req.subKey);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  // 2. check re-balance status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != consumerId) {
    tqDebug("ERROR tmq poll: consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            consumerId, TD_VID(pTq->pVnode), req.subKey, pHandle->consumerId);
    terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    taosRUnLockLatch(&pTq->lock);
    return -1;
  }
  taosRUnLockLatch(&pTq->lock);

  // 3. update the epoch value
  taosWLockLatch(&pTq->lock);
  int32_t savedEpoch = pHandle->epoch;
  if (reqEpoch > savedEpoch) {
    tqDebug("tmq poll: consumer:0x%" PRIx64 " epoch update from %d to %d by poll req", consumerId, savedEpoch,
            reqEpoch);
    pHandle->epoch = reqEpoch;
  }
  taosWUnLockLatch(&pTq->lock);

  char offsetStr[80];
  tFormatOffset(offsetStr, 80, &reqOffset);
  tqDebug("tmq poll: consumer:0x%" PRIx64 " (epoch %d), subkey %s, recv poll req vgId:%d, req:%s, reqId:0x%" PRIx64,
          consumerId, req.epoch, pHandle->subKey, vgId, offsetStr, req.reqId);

  return tqExtractDataForMq(pTq, pHandle, &req, pMsg);
}

467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541
/**
 * Handle a WAL-info request: report the consumer's current log offset in this
 * vgroup (or the earliest/latest valid WAL version when no offset is saved).
 *
 * @param pTq  TQ instance.
 * @param pMsg rpc message carrying a serialized SMqPollReq.
 * @return 0 after the response was sent; -1 on failure with terrno set to
 *         TSDB_CODE_INVALID_MSG (bad request / unknown subKey),
 *         TSDB_CODE_TMQ_CONSUMER_MISMATCH (handle owned by another consumer) or
 *         TSDB_CODE_INVALID_PARA (snapshot offset / unsupported offset type).
 */
int32_t tqProcessVgWalInfoReq(STQ* pTq, SRpcMsg* pMsg) {
  SMqPollReq req = {0};
  if (tDeserializeSMqPollReq(pMsg->pCont, pMsg->contLen, &req) < 0) {
    tqError("tDeserializeSMqPollReq %d failed", pMsg->contLen);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  int64_t      consumerId = req.consumerId;
  STqOffsetVal reqOffset = req.reqOffset;
  int32_t      vgId = TD_VID(pTq->pVnode);

  // 1. find handle
  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
  if (pHandle == NULL) {
    tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s not found", consumerId, vgId, req.subKey);
    terrno = TSDB_CODE_INVALID_MSG;
    return -1;
  }

  // 2. check re-balance status
  taosRLockLatch(&pTq->lock);
  if (pHandle->consumerId != consumerId) {
    tqDebug("ERROR consumer:0x%" PRIx64 " vgId:%d, subkey %s, mismatch for saved handle consumer:0x%" PRIx64,
            consumerId, vgId, req.subKey, pHandle->consumerId);
    terrno = TSDB_CODE_TMQ_CONSUMER_MISMATCH;
    taosRUnLockLatch(&pTq->lock);
    return -1;
  }
  taosRUnLockLatch(&pTq->lock);

  int32_t code = -1;
  int64_t sver = 0, ever = 0;
  walReaderValidVersionRange(pHandle->execHandle.pTqReader->pWalReader, &sver, &ever);

  // From here on dataRsp must be released on every path, success included.
  SMqDataRsp dataRsp = {0};
  tqInitDataRsp(&dataRsp, &req);

  STqOffset* pOffset = tqOffsetRead(pTq->pOffsetStore, req.subKey);
  if (pOffset != NULL) {
    if (pOffset->val.type != TMQ_OFFSET__LOG) {
      tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s use snapshot, no valid wal info", consumerId, vgId, req.subKey);
      terrno = TSDB_CODE_INVALID_PARA;
      goto end;
    }

    dataRsp.rspOffset.type = TMQ_OFFSET__LOG;
    dataRsp.rspOffset.version = pOffset->val.version;
  } else {
    if (req.useSnapshot == true) {
      tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s snapshot not support wal info", consumerId, vgId, req.subKey);
      terrno = TSDB_CODE_INVALID_PARA;
      goto end;
    }

    dataRsp.rspOffset.type = TMQ_OFFSET__LOG;

    // no saved offset: answer according to the reset policy in the request
    if (reqOffset.type == TMQ_OFFSET__RESET_EARLIEAST) {
      dataRsp.rspOffset.version = sver;
    } else if (reqOffset.type == TMQ_OFFSET__RESET_LATEST) {
      dataRsp.rspOffset.version = ever;
    } else {
      tqError("consumer:0x%" PRIx64 " vgId:%d subkey:%s invalid offset type:%d", consumerId, vgId, req.subKey,
              reqOffset.type);
      terrno = TSDB_CODE_INVALID_PARA;
      goto end;
    }
  }

  tqDoSendDataRsp(&pMsg->info, &dataRsp, req.epoch, req.consumerId, TMQ_MSG_TYPE__WALINFO_RSP, sver, ever);
  code = 0;

end:
  tDeleteMqDataRsp(&dataRsp);
  return code;
}

542
/**
 * Handle a delete-subscription request: drop the handle (closing its WAL
 * reference first), then remove the offset from the offset store and the
 * handle from the meta store. Individual failures are logged, not propagated.
 *
 * NOTE: an earlier revision also removed the subKey from pTq->pPushMgr under
 * pTq->lock; that step is disabled here.
 *
 * @param pTq      TQ instance.
 * @param sversion version associated with this request (not used here).
 * @param msg      raw SMqVDeleteReq.
 * @param msgLen   length of msg in bytes (not used here).
 * @return always 0.
 */
int32_t tqProcessDeleteSubReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SMqVDeleteReq* pReq = (SMqVDeleteReq*)msg;

  tqDebug("vgId:%d, tq process delete sub req %s", pTq->pVnode->config.vgId, pReq->subKey);

  STqHandle* pHandle = taosHashGet(pTq->pHandle, pReq->subKey, strlen(pReq->subKey));
  if (pHandle != NULL) {
    // release the WAL reference before the handle entry goes away
    if (pHandle->pRef) {
      walCloseRef(pTq->pVnode->pWal, pHandle->pRef->refId);
    }

    if (taosHashRemove(pTq->pHandle, pReq->subKey, strlen(pReq->subKey)) != 0) {
      tqError("cannot process tq delete req %s, since no such handle", pReq->subKey);
    }
  }

  if (tqOffsetDelete(pTq->pOffsetStore, pReq->subKey) != 0) {
    tqError("cannot process tq delete req %s, since no such offset in cache", pReq->subKey);
  }

  if (tqMetaDeleteHandle(pTq, pReq->subKey) < 0) {
    tqError("cannot process tq delete req %s, since no such offset in tdb", pReq->subKey);
  }

  return 0;
}

577
/**
 * Handle an add-check-info request: decode the STqCheckInfo, register it in
 * pTq->pCheckInfo keyed by topic, and persist the raw message in the meta store.
 *
 * @param pTq      TQ instance.
 * @param sversion version associated with this request (not used here).
 * @param msg      encoded STqCheckInfo.
 * @param msgLen   length of msg in bytes.
 * @return 0 on success, -1 on failure (terrno = TSDB_CODE_OUT_OF_MEMORY).
 */
int32_t tqProcessAddCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  STqCheckInfo info = {0};
  SDecoder     decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decodeRes = tDecodeSTqCheckInfo(&decoder, &info);
  // Always release the decoder, also when decoding failed.
  tDecoderClear(&decoder);
  if (decodeRes < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  // NOTE(review): if taosHashPut fails, anything the decoder allocated inside
  // `info` appears to be left unreleased - confirm and free it here if so.
  if (taosHashPut(pTq->pCheckInfo, info.topic, strlen(info.topic), &info, sizeof(STqCheckInfo)) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (tqMetaSaveCheckInfo(pTq, info.topic, msg, msgLen) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  return 0;
}

597
/**
 * Handle a delete-check-info request: remove the entry keyed by the
 * NUL-terminated string in msg from pTq->pCheckInfo, then from the meta store.
 *
 * @param pTq      TQ instance.
 * @param sversion version associated with this request (not used here).
 * @param msg      key of the check-info entry to remove.
 * @param msgLen   length of msg in bytes (not used here).
 * @return 0 on success, -1 when either removal fails
 *         (terrno = TSDB_CODE_OUT_OF_MEMORY).
 */
int32_t tqProcessDelCheckInfoReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  // The meta store is only touched when the in-memory removal succeeded.
  if (taosHashRemove(pTq->pCheckInfo, msg, strlen(msg)) < 0 || tqMetaDeleteCheckInfo(pTq, msg) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  return 0;
}

609
/**
 * Handle a subscribe / re-balance request for one subscription key.
 *
 * - When a handle already exists for req.subKey, the consumer is kept (epoch
 *   incremented) or switched (epoch reset to 0), the running task is killed,
 *   the handle is unregistered from the push manager and saved again.
 * - Otherwise a new handle is built according to the subscription type
 *   (column / db / table), put into pTq->pHandle and saved.
 *
 * @param pTq      TQ instance.
 * @param sversion version associated with this request (not used here).
 * @param msg      encoded SMqRebVgReq.
 * @param msgLen   length of msg in bytes (not used here).
 * @return the result of tqMetaSaveHandle(); -1 when no WAL reference can be
 *         obtained for a new handle; 0 when a new handle is requested with
 *         newConsumerId == -1 (the request is logged and ignored).
 */
int32_t tqProcessSubscribeReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  int         ret = 0;
  SMqRebVgReq req = {0};
  tDecodeSMqRebVgReq(msg, &req);

  SVnode* pVnode = pTq->pVnode;
  int32_t vgId = TD_VID(pVnode);

  tqDebug("vgId:%d, tq process sub req:%s, Id:0x%" PRIx64 " -> Id:0x%" PRIx64, pVnode->config.vgId, req.subKey,
          req.oldConsumerId, req.newConsumerId);

  STqHandle* pHandle = taosHashGet(pTq->pHandle, req.subKey, strlen(req.subKey));
  if (pHandle != NULL) {
    // ---- existing handle: keep or switch the consumer ----
    if (pHandle->consumerId == req.newConsumerId) {  // do nothing
      tqInfo("vgId:%d consumer:0x%" PRIx64 " remains, no switch occurs", req.vgId, req.newConsumerId);
      atomic_add_fetch_32(&pHandle->epoch, 1);
    } else {
      tqInfo("vgId:%d switch consumer from Id:0x%" PRIx64 " to Id:0x%" PRIx64, req.vgId, pHandle->consumerId,
             req.newConsumerId);
      atomic_store_64(&pHandle->consumerId, req.newConsumerId);
      atomic_store_32(&pHandle->epoch, 0);
    }

    // kill executing task
    qTaskInfo_t pTaskInfo = pHandle->execHandle.task;
    if (pTaskInfo != NULL) {
      qKillTask(pTaskInfo, TSDB_CODE_SUCCESS);
    }

    taosWLockLatch(&pTq->lock);
    // remove if it has been register in the push manager, and return one empty block to consumer
    tqUnregisterPushHandle(pTq, pHandle);

    if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
      qStreamCloseTsdbReader(pTaskInfo);
    }
    taosWUnLockLatch(&pTq->lock);

    ret = tqMetaSaveHandle(pTq, req.subKey, pHandle);
  } else {
    // ---- no handle yet: build a new one ----
    if (req.oldConsumerId != -1) {
      tqError("vgId:%d, build new consumer handle %s for consumer:0x%" PRIx64 ", but old consumerId:0x%" PRIx64,
              req.vgId, req.subKey, req.newConsumerId, req.oldConsumerId);
    }

    if (req.newConsumerId == -1) {
      tqError("vgId:%d, tq invalid re-balance request, new consumerId %" PRId64 "", req.vgId, req.newConsumerId);
      goto end;
    }

    // The handle is assembled on the stack and handed to taosHashPut() below.
    STqHandle newHandle = {0};
    pHandle = &newHandle;

    uint64_t oldConsumerId = pHandle->consumerId;
    memcpy(pHandle->subKey, req.subKey, TSDB_SUBSCRIBE_KEY_LEN);
    pHandle->consumerId = req.newConsumerId;
    pHandle->epoch = -1;

    pHandle->execHandle.subType = req.subType;
    pHandle->fetchMeta = req.withMeta;

    // TODO version should be assigned and refed during preprocess
    SWalRef* pWalRef = walRefCommittedVer(pVnode->pWal);
    if (pWalRef == NULL) {
      ret = -1;
      goto end;
    }

    int64_t refVer = pWalRef->refVer;
    pHandle->pRef = pWalRef;

    SReadHandle readHandle = {
        .meta = pVnode->pMeta, .vnode = pVnode, .initTableReader = true, .initTqReader = true, .version = refVer};
    pHandle->snapshotVer = refVer;

    if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__COLUMN) {
      // the handle takes over req.qmsg; clearing it keeps the exit path from freeing it
      pHandle->execHandle.execCol.qmsg = req.qmsg;
      req.qmsg = NULL;

      pHandle->execHandle.task = qCreateQueueExecTaskInfo(pHandle->execHandle.execCol.qmsg, &readHandle, vgId,
                                                          &pHandle->execHandle.numOfCols, req.newConsumerId);
      void* pScanner = NULL;
      qExtractStreamScanner(pHandle->execHandle.task, &pScanner);
      pHandle->execHandle.pTqReader = qExtractReaderFromStreamScanner(pScanner);
    } else if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__DB) {
      pHandle->pWalReader = walOpenReader(pVnode->pWal, NULL);
      pHandle->execHandle.pTqReader = tqReaderOpen(pVnode);

      pHandle->execHandle.execDb.pFilterOutTbUid =
          taosHashInit(64, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_NO_LOCK);
      buildSnapContext(readHandle.meta, readHandle.version, 0, pHandle->execHandle.subType, pHandle->fetchMeta,
                       (SSnapContext**)(&readHandle.sContext));

      pHandle->execHandle.task = qCreateQueueExecTaskInfo(NULL, &readHandle, vgId, NULL, req.newConsumerId);
    } else if (pHandle->execHandle.subType == TOPIC_SUB_TYPE__TABLE) {
      pHandle->pWalReader = walOpenReader(pVnode->pWal, NULL);
      pHandle->execHandle.execTb.suid = req.suid;

      // collect the child tables of the super table and restrict the reader to them
      SArray* pCtbUids = taosArrayInit(0, sizeof(int64_t));
      vnodeGetCtbIdList(pVnode, req.suid, pCtbUids);
      tqDebug("vgId:%d, tq try to get all ctb, suid:%" PRId64, pVnode->config.vgId, req.suid);
      for (int32_t i = 0; i < taosArrayGetSize(pCtbUids); i++) {
        int64_t tbUid = *(int64_t*)taosArrayGet(pCtbUids, i);
        tqDebug("vgId:%d, idx %d, uid:%" PRId64, vgId, i, tbUid);
      }
      pHandle->execHandle.pTqReader = tqReaderOpen(pVnode);
      tqReaderSetTbUidList(pHandle->execHandle.pTqReader, pCtbUids);
      taosArrayDestroy(pCtbUids);

      buildSnapContext(readHandle.meta, readHandle.version, req.suid, pHandle->execHandle.subType, pHandle->fetchMeta,
                       (SSnapContext**)(&readHandle.sContext));
      pHandle->execHandle.task = qCreateQueueExecTaskInfo(NULL, &readHandle, vgId, NULL, req.newConsumerId);
    }

    taosHashPut(pTq->pHandle, req.subKey, strlen(req.subKey), pHandle, sizeof(STqHandle));
    tqDebug("try to persist handle %s consumer:0x%" PRIx64 " , old consumer:0x%" PRIx64, req.subKey,
            pHandle->consumerId, oldConsumerId);
    ret = tqMetaSaveHandle(pTq, req.subKey, pHandle);
  }

end:
  taosMemoryFree(req.qmsg);
  return ret;
}
736

737
// Populate the runtime-only members of a stream task: queues, status fields,
// state backend, executor, sink callbacks, WAL reader and trigger.
//
// pTq   - tq instance whose vnode and stream meta the task is bound to
// pTask - task to expand; modified in place
// ver   - stored as both chkInfo.version and chkInfo.currentVer; chkInfo.version
//         is bumped by one right before a successful return
//
// Returns 0 on success, -1 when a queue, the state backend, the executor or the
// table schema cannot be created. Members already assigned are left in place on
// failure. NOTE(review): presumably the caller releases them -- confirm.
int32_t tqExpandTask(STQ* pTq, SStreamTask* pTask, int64_t ver) {
  SVnode* pVnode = pTq->pVnode;
  int32_t vgId = TD_VID(pVnode);

  pTask->id.idStr = createStreamTaskIdStr(pTask->id.streamId, pTask->id.taskId);
  pTask->refCnt = 1;
  pTask->status.schedStatus = TASK_SCHED_STATUS__INACTIVE;

  pTask->inputQueue = streamQueueOpen();
  pTask->outputQueue = streamQueueOpen();
  if (NULL == pTask->inputQueue || NULL == pTask->outputQueue) {
    return -1;
  }

  pTask->inputStatus = TASK_INPUT_STATUS__NORMAL;
  pTask->outputStatus = TASK_OUTPUT_STATUS__NORMAL;
  pTask->pMsgCb = &pVnode->msgCb;
  pTask->pMeta = pTq->pStreamMeta;
  pTask->chkInfo.version = ver;
  pTask->chkInfo.currentVer = ver;

  // a task that has to fill history first waits for its downstream tasks
  if (pTask->fillHistory) {
    pTask->status.taskStatus = TASK_STATUS__WAIT_DOWNSTREAM;
  } else {
    pTask->status.taskStatus = TASK_STATUS__NORMAL;
  }

  // source and agg tasks both own a state backend and an executor; they only
  // differ in how the read handle is filled in
  if (pTask->taskLevel == TASK_LEVEL__SOURCE || pTask->taskLevel == TASK_LEVEL__AGG) {
    pTask->pState = streamStateOpen(pTq->pStreamMeta->path, pTask, false, -1, -1);
    if (NULL == pTask->pState) {
      return -1;
    }

    SReadHandle handle = {0};
    handle.pStateBackend = pTask->pState;
    if (pTask->taskLevel == TASK_LEVEL__SOURCE) {
      handle.meta = pVnode->pMeta;
      handle.vnode = pVnode;
      handle.initTqReader = 1;
    } else {
      handle.vnode = NULL;
      handle.numOfVgroups = (int32_t)taosArrayGetSize(pTask->childEpInfo);
    }

    pTask->exec.pExecutor = qCreateStreamExecTaskInfo(pTask->exec.qmsg, &handle, vgId);
    if (NULL == pTask->exec.pExecutor) {
      return -1;
    }
  }

  // sink
  if (pTask->outputType == TASK_OUTPUT__SMA) {
    pTask->smaSink.vnode = pVnode;
    pTask->smaSink.smaSink = smaHandleRes;
  } else if (pTask->outputType == TASK_OUTPUT__TABLE) {
    pTask->tbSink.vnode = pVnode;
    pTask->tbSink.tbSinkFunc = tqSinkToTablePipeline2;

    // use the schema version recorded in meta when the lookup succeeds, 1 otherwise
    int32_t   schemaVer = 1;
    SMetaInfo info = {0};
    if (metaGetInfo(pVnode->pMeta, pTask->tbSink.stbUid, &info, NULL) == TSDB_CODE_SUCCESS) {
      schemaVer = info.skmVer;
    }

    SSchemaWrapper* pWrapper = pTask->tbSink.pSchemaWrapper;
    pTask->tbSink.pTSchema = tBuildTSchema(pWrapper->pSchema, pWrapper->nCols, schemaVer);
    if (NULL == pTask->tbSink.pTSchema) {
      return -1;
    }
  }

  if (pTask->taskLevel == TASK_LEVEL__SOURCE) {
    pTask->exec.pWalReader = walOpenReader(pVnode->pWal, NULL);
  }

  streamSetupTrigger(pTask);

  tqInfo("vgId:%d expand stream task, s-task:%s, checkpoint ver:%" PRId64 " child id:%d, level:%d", vgId, pTask->id.idStr,
         pTask->chkInfo.version, pTask->selfChildId, pTask->taskLevel);

  // next valid version will add one
  pTask->chkInfo.version += 1;
  return 0;
}
L
Liu Jicong 已提交
824

825 826 827 828 829 830
// Handle a task-check request sent by an upstream task: look up the downstream
// task named in the request, report its check status (0 when the task does not
// exist yet) and send the encoded response back through pMsg->info.
//
// Returns 0 once the response has been handed to tmsgSendRsp, -1 when the
// request cannot be decoded or the response cannot be encoded/allocated.
int32_t tqProcessStreamTaskCheckReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  SStreamTaskCheckReq req = {0};
  SDecoder            decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  if (tDecodeSStreamTaskCheckReq(&decoder, &req) < 0) {
    // do not build a response out of a request that failed to decode
    tDecoderClear(&decoder);
    tqError("unable to decode task check req %d", __LINE__);
    return -1;
  }
  tDecoderClear(&decoder);

  int32_t             taskId = req.downstreamTaskId;
  SStreamTaskCheckRsp rsp = {
      .reqId = req.reqId,
      .streamId = req.streamId,
      .childId = req.childId,
      .downstreamNodeId = req.downstreamNodeId,
      .downstreamTaskId = req.downstreamTaskId,
      .upstreamNodeId = req.upstreamNodeId,
      .upstreamTaskId = req.upstreamTaskId,
  };

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);

  if (pTask) {
    rsp.status = streamTaskCheckStatus(pTask);

    // log while the reference is still held; pTask must not be touched after release
    tqDebug("tq recv task check req(reqId:0x%" PRIx64
            ") %d at node %d task status:%d, check req from task %d at node %d, rsp status %d",
            rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, pTask->status.taskStatus, rsp.upstreamTaskId,
            rsp.upstreamNodeId, rsp.status);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  } else {
    rsp.status = 0;
    tqDebug("tq recv task check(taskId:%d not built yet) req(reqId:0x%" PRIx64
            ") %d at node %d, check req from task %d at node %d, rsp status %d",
            taskId, rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, rsp.upstreamTaskId, rsp.upstreamNodeId,
            rsp.status);
  }

  SEncoder encoder;
  int32_t  code;
  int32_t  len;
  tEncodeSize(tEncodeSStreamTaskCheckRsp, &rsp, len, code);
  if (code < 0) {
    tqError("unable to encode rsp %d", __LINE__);
    return -1;
  }

  void* buf = rpcMallocCont(sizeof(SMsgHead) + len);
  if (buf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    tqError("unable to allocate rsp %d", __LINE__);
    return -1;
  }
  ((SMsgHead*)buf)->vgId = htonl(req.upstreamNodeId);

  // the encoded response follows the message head
  void* abuf = POINTER_SHIFT(buf, sizeof(SMsgHead));
  tEncoderInit(&encoder, (uint8_t*)abuf, len);
  tEncodeSStreamTaskCheckRsp(&encoder, &rsp);
  tEncoderClear(&encoder);

  SRpcMsg rspMsg = { .code = 0, .pCont = buf, .contLen = sizeof(SMsgHead) + len, .info = pMsg->info };
  tmsgSendRsp(&rspMsg);
  return 0;
}

885
// Decode a task-check response and forward it to the upstream task it names.
//
// Returns -1 when the message cannot be decoded or the upstream task cannot be
// acquired; otherwise the result of streamProcessTaskCheckRsp.
int32_t tqProcessStreamTaskCheckRsp(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SStreamTaskCheckRsp rsp;
  SDecoder            decoder;

  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t decoded = tDecodeSStreamTaskCheckRsp(&decoder, &rsp);
  tDecoderClear(&decoder);  // the decoder is cleared on both outcomes
  if (decoded < 0) {
    return -1;
  }

  tqDebug("tq recv task check rsp(reqId:0x%" PRIx64 ") %d at node %d check req from task %d at node %d, status %d",
          rsp.reqId, rsp.downstreamTaskId, rsp.downstreamNodeId, rsp.upstreamTaskId, rsp.upstreamNodeId, rsp.status);

  SStreamTask* pUpstream = streamMetaAcquireTask(pTq->pStreamMeta, rsp.upstreamTaskId);
  if (NULL == pUpstream) {
    return -1;
  }

  int32_t result = streamProcessTaskCheckRsp(pUpstream, &rsp, sversion);
  streamMetaReleaseTask(pTq->pStreamMeta, pUpstream);
  return result;
}

911
// Deploy a stream task: deserialize it from msg, register it in the stream meta
// under the meta write lock, and start the downstream check when the task has
// to fill history.
//
// Returns 0 on success or when streams are disabled (tsDisableStream), -1 on
// allocation, decode or registration failure.
int32_t tqProcessTaskDeployReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  if (tsDisableStream) {
    return 0;
  }

  // 1.deserialize msg and build task
  SStreamTask* pTask = taosMemoryCalloc(1, sizeof(SStreamTask));
  if (NULL == pTask) {
    return -1;
  }

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t code = tDecodeStreamTask(&decoder, pTask);
  tDecoderClear(&decoder);
  if (code < 0) {
    taosMemoryFree(pTask);
    return -1;
  }

  // 2.save task, use the newest commit version as the initial start version of stream task.
  SStreamMeta* pMeta = pTq->pStreamMeta;

  taosWLockLatch(&pMeta->lock);
  code = streamMetaAddDeployedTask(pMeta, sversion, pTask);
  if (code < 0) {
    // NOTE(review): pTask is still dereferenced here after the failed add;
    // confirm streamMetaAddDeployedTask does not free it on failure.
    tqError("vgId:%d failed to add s-task:%s, total:%d", TD_VID(pTq->pVnode), pTask->id.idStr,
            streamMetaGetNumOfTasks(pMeta));
    taosWUnLockLatch(&pMeta->lock);
    return -1;
  }
  taosWUnLockLatch(&pMeta->lock);

  // 3.go through recover steps to fill history
  if (pTask->fillHistory) {
    streamTaskCheckDownstream(pTask, sversion);
  }

  tqDebug("vgId:%d s-task:%s is deployed and add meta from mnd, status:%d, total:%d", TD_VID(pTq->pVnode),
          pTask->id.idStr, pTask->status.taskStatus, streamMetaGetNumOfTasks(pMeta));
  return 0;
}

L
Liu Jicong 已提交
960 961 962 963 964
// Run recovery step 1 (history scan) for the task named in the request, then
// enqueue a step-2 request on the vnode write queue.
//
// The task reference is held until the last access to pTask, so the task is
// never touched after it has been released.
//
// Returns 0 when the step-2 request was enqueued or the task is being dropped,
// -1 when the task is missing, its checkpoint version is not positive, or the
// step-2 request cannot be built/allocated.
int32_t tqProcessTaskRecover1Req(STQ* pTq, SRpcMsg* pMsg) {
  int32_t                 code = -1;
  SStreamRecoverStep1Req* pReq = (SStreamRecoverStep1Req*)pMsg->pCont;

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
  if (pTask == NULL) {
    return -1;
  }

  // check param
  int64_t fillVer1 = pTask->chkInfo.version;
  if (fillVer1 <= 0) {
    goto end;
  }

  // do recovery step 1
  tqDebug("s-task:%s start recover step 1 scan", pTask->id.idStr);
  int64_t st = taosGetTimestampMs();

  streamSourceRecoverScanStep1(pTask);
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
    code = 0;
    goto end;
  }

  double el = (taosGetTimestampMs() - st) / 1000.0;
  tqDebug("s-task:%s recover step 1 ended, elapsed time:%.2fs", pTask->id.idStr, el);

  // build msg to launch next step
  SStreamRecoverStep2Req req;
  if (streamBuildSourceRecover2Req(pTask, &req) < 0) {
    goto end;
  }

  // the task may have been dropped while the step-2 request was being built
  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
    code = 0;
    goto end;
  }

  // serialize msg; size it from the object that is actually copied
  int32_t len = sizeof(req);

  void* serializedReq = rpcMallocCont(len);
  if (serializedReq == NULL) {
    goto end;
  }

  memcpy(serializedReq, &req, len);

  // dispatch msg
  tqDebug("s-task:%s start recover block stage", pTask->id.idStr);

  SRpcMsg rpcMsg = {
      .code = 0, .contLen = len, .msgType = TDMT_VND_STREAM_RECOVER_BLOCKING_STAGE, .pCont = serializedReq};
  tmsgPutToQueue(&pTq->pVnode->msgCb, WRITE_QUEUE, &rpcMsg);
  code = 0;

end:
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return code;
}

1024
// Run recovery step 2 for the task named in the request and, unless the task is
// being dropped, restore its parameters, switch it to normal status, notify the
// downstream tasks and persist the task with fillHistory cleared.
//
// Returns 0 on success or when the task is being dropped, -1 when the task is
// missing or any recovery stage reports an error.
int32_t tqProcessTaskRecover2Req(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  SStreamRecoverStep2Req* pReq = (SStreamRecoverStep2Req*)msg;

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, pReq->taskId);
  if (NULL == pTask) {
    return -1;
  }

  int32_t ret = -1;

  // do recovery step 2
  if (streamSourceRecoverScanStep2(pTask, sversion) < 0) {
    goto done;
  }

  if (atomic_load_8(&pTask->status.taskStatus) == TASK_STATUS__DROPPING) {
    ret = 0;
    goto done;
  }

  // restore param -> set status normal -> dispatch recover finish req to all
  // related downstream tasks; the first failing stage aborts the sequence
  if (streamRestoreParam(pTask) < 0 || streamSetStatusNormal(pTask) < 0 ||
      streamDispatchRecoverFinishReq(pTask) < 0) {
    goto done;
  }

  atomic_store_8(&pTask->fillHistory, 0);
  streamMetaSaveTask(pTq->pStreamMeta, pTask);
  ret = 0;

done:
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  return ret;
}

L
Liu Jicong 已提交
1074 1075 1076
// Handle a recover-finish request: decode it and pass the reporting child id to
// the task it targets.
//
// Returns 0 on success, -1 when the request cannot be decoded, the task cannot
// be acquired, or streamProcessRecoverFinishReq fails.
int32_t tqProcessTaskRecoverFinishReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msg = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  // deserialize
  SStreamRecoverFinishReq req = {0};

  SDecoder decoder;
  tDecoderInit(&decoder, (uint8_t*)msg, msgLen);
  int32_t code = tDecodeSStreamRecoverFinishReq(&decoder, &req);
  tDecoderClear(&decoder);
  if (code < 0) {
    // never look a task up from a request that failed to decode
    return -1;
  }

  // find task
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.taskId);
  if (pTask == NULL) {
    return -1;
  }

  // do process request
  code = streamProcessRecoverFinishReq(pTask, req.childId);
  streamMetaReleaseTask(pTq->pStreamMeta, pTask);

  return (code < 0) ? -1 : 0;
}
L
Liu Jicong 已提交
1100

L
Liu Jicong 已提交
1101 1102 1103 1104 1105
// Recover-finish responses need no processing; the message is accepted as-is.
// Always returns 0.
int32_t tqProcessTaskRecoverFinishRsp(STQ* pTq, SRpcMsg* pMsg) {
  (void)pTq;
  (void)pMsg;
  return 0;
}

L
Liu Jicong 已提交
1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121
// Turn a delete result into a STREAM_DELETE_DATA block and hand it to every
// source-level stream task.
//
// The block is shared: each task receives an SStreamRefDataBlock pointing at
// the same SSDataBlock, guarded by a heap-allocated reference counter. This
// function holds one reference itself and drops it at the end; whoever drops
// the last reference destroys the block.
//
// When the shared block or its counter cannot be allocated, or a queue item
// cannot be allocated, the affected source tasks are marked with
// streamTaskInputFail instead of receiving the block.
//
// pReq/len - encoded SDeleteRes
// ver      - version stamped on the delete block
//
// Always returns 0 (terrno is set to TSDB_CODE_OUT_OF_MEMORY on allocation
// failures).
int32_t tqProcessDelReq(STQ* pTq, void* pReq, int32_t len, int64_t ver) {
  bool        failed = false;
  SDecoder*   pCoder = &(SDecoder){0};
  SDeleteRes* pRes = &(SDeleteRes){0};

  pRes->uidList = taosArrayInit(0, sizeof(tb_uid_t));
  if (pRes->uidList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    failed = true;
  }

  tDecoderInit(pCoder, pReq, len);
  tDecodeDeleteRes(pCoder, pRes);
  tDecoderClear(pCoder);

  int32_t sz = taosArrayGetSize(pRes->uidList);
  if (sz == 0 || pRes->affectedRows == 0) {
    // nothing was deleted, so there is nothing to propagate
    taosArrayDestroy(pRes->uidList);
    return 0;
  }

  SSDataBlock* pDelBlock = createSpecialDataBlock(STREAM_DELETE_DATA);
  if (pDelBlock == NULL || blockDataEnsureCapacity(pDelBlock, sz) != TSDB_CODE_SUCCESS) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    failed = true;
  }

  if (!failed) {
    pDelBlock->info.rows = sz;
    pDelBlock->info.version = ver;

    // the column objects do not change per row, look them up once
    SColumnInfoData* pStartCol = taosArrayGet(pDelBlock->pDataBlock, START_TS_COLUMN_INDEX);
    SColumnInfoData* pEndCol = taosArrayGet(pDelBlock->pDataBlock, END_TS_COLUMN_INDEX);
    SColumnInfoData* pUidCol = taosArrayGet(pDelBlock->pDataBlock, UID_COLUMN_INDEX);
    SColumnInfoData* pGroupCol = taosArrayGet(pDelBlock->pDataBlock, GROUPID_COLUMN_INDEX);
    SColumnInfoData* pCalStartCol = taosArrayGet(pDelBlock->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX);
    SColumnInfoData* pCalEndCol = taosArrayGet(pDelBlock->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX);

    for (int32_t i = 0; i < sz; i++) {
      // start key column
      colDataSetVal(pStartCol, i, (const char*)&pRes->skey, false);
      // end key column
      colDataSetVal(pEndCol, i, (const char*)&pRes->ekey, false);
      // uid column
      int64_t* pUid = taosArrayGet(pRes->uidList, i);
      colDataSetVal(pUidCol, i, (const char*)pUid, false);

      colDataSetNULL(pGroupCol, i);
      colDataSetNULL(pCalStartCol, i);
      colDataSetNULL(pCalEndCol, i);
    }
  }

  taosArrayDestroy(pRes->uidList);

  // reference counter of the shared block; this function owns the first reference
  int32_t* pRef = NULL;
  if (!failed) {
    pRef = taosMemoryMalloc(sizeof(int32_t));
    if (pRef == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      failed = true;
    } else {
      *pRef = 1;
    }
  }

  taosWLockLatch(&pTq->pStreamMeta->lock);

  void* pIter = NULL;
  while (1) {
    pIter = taosHashIterate(pTq->pStreamMeta->pTasks, pIter);
    if (pIter == NULL) {
      break;
    }

    SStreamTask* pTask = *(SStreamTask**)pIter;
    if (pTask->taskLevel != TASK_LEVEL__SOURCE) {
      continue;
    }

    qDebug("s-task:%s delete req enqueue, ver: %" PRId64, pTask->id.idStr, ver);

    if (failed) {
      streamTaskInputFail(pTask);
      continue;
    }

    SStreamRefDataBlock* pRefBlock = taosAllocateQitem(sizeof(SStreamRefDataBlock), DEF_QITEM, 0);
    if (pRefBlock == NULL) {
      // this task cannot receive the block; treat it like any other input failure
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      streamTaskInputFail(pTask);
      continue;
    }

    pRefBlock->type = STREAM_INPUT__REF_DATA_BLOCK;
    pRefBlock->pBlock = pDelBlock;
    pRefBlock->dataRef = pRef;
    atomic_add_fetch_32(pRefBlock->dataRef, 1);

    if (tAppendDataToInputQueue(pTask, (SStreamQueueItem*)pRefBlock) < 0) {
      // the item never reached the queue: give its reference back
      atomic_sub_fetch_32(pRef, 1);
      taosFreeQitem(pRefBlock);
      continue;
    }

    if (streamSchedExec(pTask) < 0) {
      qError("s-task:%s stream task launch failed", pTask->id.idStr);
      continue;
    }
  }

  taosWUnLockLatch(&pTq->pStreamMeta->lock);

  if (pRef != NULL) {
    // drop the reference held by this function
    int32_t ref = atomic_sub_fetch_32(pRef, 1);
    if (ref == 0) {
      blockDataDestroy(pDelBlock);
      taosMemoryFree(pRef);
    }
  } else if (pDelBlock != NULL) {
    // the block was never shared with any task
    blockDataDestroy(pDelBlock);
  }

  return 0;
}

1227 1228
// Re-submit every consume request parked in pTq->pPushMgr to the query queue
// and empty the push manager. Runs entirely under the tq write lock.
//
// Each handle's stored message wrapper is freed after its content has been
// handed to the queue. Always returns 0.
int32_t tqProcessSubmitReqForSubscribe(STQ* pTq) {
  int32_t vgId = TD_VID(pTq->pVnode);

  taosWLockLatch(&pTq->lock);

  if (taosHashGetSize(pTq->pPushMgr) > 0) {
    void* pIter = taosHashIterate(pTq->pPushMgr, NULL);

    while (pIter) {
      STqHandle* pHandle = *(STqHandle**)pIter;
      tqDebug("vgId:%d start set submit for pHandle:%p, consumer:0x%" PRIx64, vgId, pHandle, pHandle->consumerId);

      if (ASSERT(pHandle->msg != NULL)) {
        tqError("pHandle->msg should not be null");
        // the iteration is abandoned midway, so the iterator must be cancelled
        taosHashCancelIterate(pTq->pPushMgr, pIter);
        break;
      }

      SRpcMsg msg = {.msgType = TDMT_VND_TMQ_CONSUME, .pCont = pHandle->msg->pCont, .contLen = pHandle->msg->contLen, .info = pHandle->msg->info};
      tmsgPutToQueue(&pTq->pVnode->msgCb, QUERY_QUEUE, &msg);
      taosMemoryFree(pHandle->msg);
      pHandle->msg = NULL;

      pIter = taosHashIterate(pTq->pPushMgr, pIter);
    }

    taosHashClear(pTq->pPushMgr);
  }

  // unlock
  taosWUnLockLatch(&pTq->lock);
  return 0;
}

L
Liu Jicong 已提交
1260 1261
// Handle a task run request. The special id WAL_READ_TASKS_ID triggers a WAL
// scan for all tasks; any other id runs that single task (only when it is in
// normal status) and then schedules another round of stream tasks.
//
// Returns 0 on success, -1 when the task id is unknown.
int32_t tqProcessTaskRunReq(STQ* pTq, SRpcMsg* pMsg) {
  SStreamTaskRunReq* pReq = pMsg->pCont;
  int32_t            vgId = TD_VID(pTq->pVnode);
  int32_t            taskId = pReq->taskId;

  // all tasks are extracted submit data from the wal
  if (WAL_READ_TASKS_ID == taskId) {
    tqStreamTasksScanWal(pTq);
    return 0;
  }

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
  if (NULL == pTask) {
    tqError("vgId:%d failed to found s-task, taskId:%d", vgId, taskId);
    return -1;
  }

  if (pTask->status.taskStatus != TASK_STATUS__NORMAL) {
    tqDebug("vgId:%d s-task:%s ignore run req since not in ready state", vgId, pTask->id.idStr);
  } else {
    tqDebug("vgId:%d s-task:%s start to process block from wal, last chk point:%" PRId64, vgId,
            pTask->id.idStr, pTask->chkInfo.version);
    streamProcessRunReq(pTask);
  }

  streamMetaReleaseTask(pTq->pStreamMeta, pTask);
  tqStartStreamTasks(pTq);
  return 0;
}

L
Liu Jicong 已提交
1290
// Decode a stream dispatch request and deliver it to the task it targets.
//
// exec is forwarded unchanged to streamProcessDispatchReq.
//
// Returns 0 when the request was delivered, -1 when it cannot be decoded or the
// target task does not exist (the decoded request is released in that case).
int32_t tqProcessTaskDispatchReq(STQ* pTq, SRpcMsg* pMsg, bool exec) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  SStreamDispatchReq req = {0};
  SDecoder           decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  if (tDecodeStreamDispatchReq(&decoder, &req) < 0) {
    // NOTE(review): a partially decoded req is not released here, mirroring
    // vnodeEnqueueStreamMsg -- confirm the decoder leaves nothing allocated.
    tDecoderClear(&decoder);
    return -1;
  }
  // the decoder is cleared before req is used, as everywhere else in this file
  tDecoderClear(&decoder);

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, req.taskId);
  if (pTask) {
    SRpcMsg rsp = { .info = pMsg->info, .code = 0 };
    streamProcessDispatchReq(pTask, &req, &rsp, exec);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    return 0;
  } else {
    tDeleteStreamDispatchReq(&req);
    return -1;
  }
}

L
Liu Jicong 已提交
1311 1312
// Route a dispatch response to the upstream task named in it (the id arrives in
// network byte order).
//
// Returns 0 when the task was found and the response processed, -1 otherwise.
int32_t tqProcessTaskDispatchRsp(STQ* pTq, SRpcMsg* pMsg) {
  SStreamDispatchRsp* pRsp = POINTER_SHIFT(pMsg->pCont, sizeof(SMsgHead));
  int32_t             upstreamTaskId = ntohl(pRsp->upstreamTaskId);

  SStreamTask* pUpstream = streamMetaAcquireTask(pTq->pStreamMeta, upstreamTaskId);
  tqDebug("recv dispatch rsp, code:%x", pMsg->code);
  if (NULL == pUpstream) {
    return -1;
  }

  streamProcessDispatchRsp(pUpstream, pRsp, pMsg->code);
  streamMetaReleaseTask(pTq->pStreamMeta, pUpstream);
  return 0;
}
L
Liu Jicong 已提交
1324

1325
// Remove the task named in the drop request from the stream meta.
// sversion and msgLen are not used. Always returns 0.
int32_t tqProcessTaskDropReq(STQ* pTq, int64_t sversion, char* msg, int32_t msgLen) {
  (void)sversion;
  (void)msgLen;

  SVDropStreamTaskReq* pDropReq = (SVDropStreamTaskReq*)msg;
  streamMetaRemoveTask(pTq->pStreamMeta, pDropReq->taskId);

  return 0;
}
L
Liu Jicong 已提交
1330 1331 1332 1333 1334 1335 1336

// Decode a stream retrieve request and deliver it to its destination task.
// The decoded request is released before returning, whether or not the task
// was found.
//
// Returns 0 when the request was delivered, -1 when it cannot be decoded or the
// destination task does not exist.
int32_t tqProcessTaskRetrieveReq(STQ* pTq, SRpcMsg* pMsg) {
  char*   msgStr = pMsg->pCont;
  char*   msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t msgLen = pMsg->contLen - sizeof(SMsgHead);

  SStreamRetrieveReq req = {0};
  SDecoder           decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  if (tDecodeStreamRetrieveReq(&decoder, &req) < 0) {
    // NOTE(review): a partially decoded req is not released on this path --
    // confirm the decoder leaves nothing allocated when it fails.
    tDecoderClear(&decoder);
    return -1;
  }
  tDecoderClear(&decoder);

  int32_t      code = -1;
  int32_t      taskId = req.dstTaskId;
  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
  if (pTask) {
    SRpcMsg rsp = { .info = pMsg->info, .code = 0 };
    streamProcessRetrieveReq(pTask, &req, &rsp);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    code = 0;
  }

  tDeleteStreamRetrieveReq(&req);
  return code;
}

// Retrieve responses need no processing; the message is accepted as-is.
// Always returns 0.
int32_t tqProcessTaskRetrieveRsp(STQ* pTq, SRpcMsg* pMsg) {
  (void)pTq;
  (void)pMsg;
  return 0;
}
L
Liu Jicong 已提交
1358

1359 1360 1361 1362 1363 1364
// Deliver a stream dispatch message directly to its target task (without
// executing it), or answer the sender with an error response when the message
// cannot be decoded or the task does not exist.
//
// On every path that gets past the NULL-handle check, pMsg->pCont and pMsg are
// freed here.
//
// Returns 0 when the request was delivered, -1 otherwise.
int32_t vnodeEnqueueStreamMsg(SVnode* pVnode, SRpcMsg* pMsg) {
  STQ*      pTq = pVnode->pTq;
  SMsgHead* msgStr = pMsg->pCont;
  char*     msgBody = POINTER_SHIFT(msgStr, sizeof(SMsgHead));
  int32_t   msgLen = pMsg->contLen - sizeof(SMsgHead);
  int32_t   code = 0;

  // zero-initialized: the FAIL path reads req fields even when decoding failed
  SStreamDispatchReq req = {0};
  SDecoder           decoder;
  tDecoderInit(&decoder, (uint8_t*)msgBody, msgLen);
  if (tDecodeStreamDispatchReq(&decoder, &req) < 0) {
    code = TSDB_CODE_MSG_DECODE_ERROR;
    tDecoderClear(&decoder);
    goto FAIL;
  }
  tDecoderClear(&decoder);

  int32_t taskId = req.taskId;

  SStreamTask* pTask = streamMetaAcquireTask(pTq->pStreamMeta, taskId);
  if (pTask) {
    SRpcMsg rsp = { .info = pMsg->info, .code = 0 };
    streamProcessDispatchReq(pTask, &req, &rsp, false);
    streamMetaReleaseTask(pTq->pStreamMeta, pTask);
    rpcFreeCont(pMsg->pCont);
    taosFreeQitem(pMsg);
    return 0;
  } else {
    tDeleteStreamDispatchReq(&req);
  }

  code = TSDB_CODE_STREAM_TASK_NOT_EXIST;

FAIL:
  // NOTE(review): pMsg and its content are not freed on this early return,
  // unlike the other exits -- confirm who owns them when there is no handle.
  if (pMsg->info.handle == NULL) return -1;

  SMsgHead* pRspHead = rpcMallocCont(sizeof(SMsgHead) + sizeof(SStreamDispatchRsp));
  if (pRspHead == NULL) {
    // no room for a full response body: send a bare out-of-memory response
    SRpcMsg rsp = { .code = TSDB_CODE_OUT_OF_MEMORY, .info = pMsg->info };
    tqDebug("send dispatch error rsp, code: %x", code);
    tmsgSendRsp(&rsp);
    rpcFreeCont(pMsg->pCont);
    taosFreeQitem(pMsg);
    return -1;
  }

  // response fields are sent in network byte order
  pRspHead->vgId = htonl(req.upstreamNodeId);
  SStreamDispatchRsp* pRsp = POINTER_SHIFT(pRspHead, sizeof(SMsgHead));
  pRsp->streamId = htobe64(req.streamId);
  pRsp->upstreamTaskId = htonl(req.upstreamTaskId);
  pRsp->upstreamNodeId = htonl(req.upstreamNodeId);
  pRsp->downstreamNodeId = htonl(pVnode->config.vgId);
  pRsp->downstreamTaskId = htonl(req.taskId);
  // NOTE(review): an output-status constant is stored into inputStatus;
  // confirm whether TASK_INPUT_STATUS__NORMAL was intended.
  pRsp->inputStatus = TASK_OUTPUT_STATUS__NORMAL;

  SRpcMsg rsp = {
      .code = code, .info = pMsg->info, .contLen = sizeof(SMsgHead) + sizeof(SStreamDispatchRsp), .pCont = pRspHead};
  tqDebug("send dispatch error rsp, code: %x", code);
  tmsgSendRsp(&rsp);
  rpcFreeCont(pMsg->pCont);
  taosFreeQitem(pMsg);
  return -1;
}
L
Liu Jicong 已提交
1422

1423
// Returns 1 when sversion is not greater than pTq->walLogLastVer, 0 otherwise.
int32_t tqCheckLogInWal(STQ* pTq, int64_t sversion) {
  return (pTq->walLogLastVer >= sversion) ? 1 : 0;
}
1424

1425
// Request a WAL scan for the stream tasks of this vnode by putting one
// WAL_READ_TASKS_ID run request on the stream queue.
//
// pMeta->walScanCounter is incremented on every call; a run request is only
// enqueued when the counter goes from 0 to 1, otherwise the call just records
// that another scan round was asked for. All of this happens under the stream
// meta write lock.
//
// Returns 0 on success (including "no tasks" and "scan already pending"), -1
// when the run request cannot be allocated.
int32_t tqStartStreamTasks(STQ* pTq) {
  int32_t      vgId = TD_VID(pTq->pVnode);
  SStreamMeta* pMeta = pTq->pStreamMeta;

  taosWLockLatch(&pMeta->lock);

  int32_t numOfTasks = taosArrayGetSize(pMeta->pTaskList);
  if (numOfTasks == 0) {
    tqInfo("vgId:%d no stream tasks exists", vgId);
    taosWUnLockLatch(&pMeta->lock);
    return 0;
  }

  pMeta->walScanCounter += 1;

  if (pMeta->walScanCounter > 1) {
    tqDebug("vgId:%d wal read task has been launched, remain scan times:%d", vgId, pMeta->walScanCounter);
    taosWUnLockLatch(&pMeta->lock);
    return 0;
  }

  SStreamTaskRunReq* pRunReq = rpcMallocCont(sizeof(SStreamTaskRunReq));
  if (pRunReq == NULL) {
    // no scan was launched: undo the increment, otherwise every later call
    // would take the "already launched" branch and never start a scan
    pMeta->walScanCounter -= 1;
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    tqError("vgId:%d failed restore stream tasks, code:%s", vgId, terrstr(terrno));
    taosWUnLockLatch(&pMeta->lock);
    return -1;
  }

  tqDebug("vgId:%d start wal scan stream tasks, tasks:%d", vgId, numOfTasks);
  pRunReq->head.vgId = vgId;
  pRunReq->streamId = 0;
  pRunReq->taskId = WAL_READ_TASKS_ID;

  // NOTE(review): the result of tmsgPutToQueue is ignored; if the enqueue can
  // fail, the counter stays raised with no scan pending -- confirm.
  SRpcMsg msg = {.msgType = TDMT_STREAM_TASK_RUN, .pCont = pRunReq, .contLen = sizeof(SStreamTaskRunReq)};
  tmsgPutToQueue(&pTq->pVnode->msgCb, STREAM_QUEUE, &msg);
  taosWUnLockLatch(&pMeta->lock);

  return 0;
}