/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "streamInc.h"
// Threshold for the merged-input batch counter: merging of queued items stops once the counter exceeds this value.
#define STREAM_EXEC_MAX_BATCH_NUM (1024)
/*
 * Tell whether a task has been asked to terminate.
 *
 * Atomically reads pStatus->taskStatus and returns true when it is
 * TASK_STATUS__STOP or TASK_STATUS__DROPPING, false for any other value.
 */
bool streamTaskShouldStop(const SStreamStatus* pStatus) {
  int32_t taskStatus = atomic_load_8((int8_t*) &pStatus->taskStatus);
  if (taskStatus == TASK_STATUS__STOP) {
    return true;
  }
  return taskStatus == TASK_STATUS__DROPPING;
}

/*
 * Feed one input item to the task's executor and collect every block it produces.
 *
 * pTask: task whose executor (pTask->exec.pExecutor) is driven.
 * data:  input queue item; its SStreamQueueItem type selects how it is handed to
 *        qSetMultiStreamInput (trigger, submit, data/retrieve block, merged submit,
 *        or referenced data block). Any other type hits ASSERT(0).
 * pRes:  array of SSDataBlock; a copy of each produced block is appended here.
 *
 * Always returns 0, including when the task is asked to stop part-way through.
 */
static int32_t streamTaskExecImpl(SStreamTask* pTask, const void* data, SArray* pRes) {
  int32_t code = TSDB_CODE_SUCCESS;
  void*   pExecutor = pTask->exec.pExecutor;

  // A source task only proceeds in NORMAL or RESTORE state; poll every 2ms until then.
  while (pTask->taskLevel == TASK_LEVEL__SOURCE) {
    int8_t status = atomic_load_8(&pTask->status.taskStatus);
    if (status == TASK_STATUS__NORMAL || status == TASK_STATUS__RESTORE) {
      break;
    }

    // A stopping/dropping task would otherwise spin in this loop indefinitely, since
    // the loop is only left on NORMAL/RESTORE. Bail out the same way the execution
    // loop below does.
    if (streamTaskShouldStop(&pTask->status)) {
      return 0;
    }

    qError("stream task wait for the end of fill history, s-task:%s, status:%d", pTask->id.idStr, status);
    taosMsleep(2);
  }

  // set input
  const SStreamQueueItem* pItem = (const SStreamQueueItem*)data;
  if (pItem->type == STREAM_INPUT__GET_RES) {
    const SStreamTrigger* pTrigger = (const SStreamTrigger*)data;
    qSetMultiStreamInput(pExecutor, pTrigger->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
  } else if (pItem->type == STREAM_INPUT__DATA_SUBMIT) {
    ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);
    const SStreamDataSubmit2* pSubmit = (const SStreamDataSubmit2*)data;
    qSetMultiStreamInput(pExecutor, &pSubmit->submit, 1, STREAM_INPUT__DATA_SUBMIT);
    qDebug("s-task:%s set submit blocks as source block completed, %p %p len:%d ver:%" PRId64, pTask->id.idStr, pSubmit, pSubmit->submit.msgStr,
           pSubmit->submit.msgLen, pSubmit->submit.ver);
  } else if (pItem->type == STREAM_INPUT__DATA_BLOCK || pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
    const SStreamDataBlock* pBlock = (const SStreamDataBlock*)data;

    SArray* pBlockList = pBlock->blocks;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
    qDebug("s-task:%s set sdata blocks as input num:%d, ver:%"PRId64, pTask->id.idStr, numOfBlocks, pBlock->sourceVer);
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__DATA_BLOCK);
  } else if (pItem->type == STREAM_INPUT__MERGED_SUBMIT) {
    const SStreamMergedSubmit2* pMerged = (const SStreamMergedSubmit2*)data;

    SArray* pBlockList = pMerged->submits;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
    qDebug("st-task:%s %p set submit input (merged), batch num:%d", pTask->id.idStr, pTask, numOfBlocks);
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__MERGED_SUBMIT);
  } else if (pItem->type == STREAM_INPUT__REF_DATA_BLOCK) {
    const SStreamRefDataBlock* pRefBlock = (const SStreamRefDataBlock*)data;
    qSetMultiStreamInput(pExecutor, pRefBlock->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
  } else {
    ASSERT(0);
  }

  // Run the executor until it yields no more output for this input.
  while (1) {
    if (streamTaskShouldStop(&pTask->status)) {
      return 0;
    }

    SSDataBlock* output = NULL;
    uint64_t     ts = 0;
    if ((code = qExecTask(pExecutor, &output, &ts)) < 0) {
      if (code == TSDB_CODE_QRY_IN_EXEC) {
        resetTaskInfo(pExecutor);
      }

      // NOTE(review): a persistent executor error is retried here without bound; only
      // the stop check at the top of the loop ends it.
      qError("unexpected stream execution, s-task:%s since %s", pTask->id.idStr, terrstr());
      continue;
    }

    if (output == NULL) {
      // Executor drained. For a retrieve request, answer with a copy of the request
      // block re-tagged as STREAM_PULL_OVER.
      if (pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
        SSDataBlock block = {0};

        const SStreamDataBlock* pRetrieveBlock = (const SStreamDataBlock*)data;
        ASSERT(taosArrayGetSize(pRetrieveBlock->blocks) == 1);

        assignOneDataBlock(&block, taosArrayGet(pRetrieveBlock->blocks, 0));
        block.info.type = STREAM_PULL_OVER;
        block.info.childId = pTask->selfChildId;
        taosArrayPush(pRes, &block);

        qDebug("task %d(child %d) processed retrieve, reqId %" PRId64, pTask->id.taskId, pTask->selfChildId,
               pRetrieveBlock->reqId);
      }
      break;
    }

    // Retrieve blocks are broadcast to children instead of being collected in pRes.
    if (output->info.type == STREAM_RETRIEVE) {
      if (streamBroadcastToChildren(pTask, output) < 0) {
        // TODO
      }
      continue;
    }

    qDebug("s-task:%s (child %d) executed and get block", pTask->id.idStr, pTask->selfChildId);

    SSDataBlock block = {0};
    assignOneDataBlock(&block, output);
    block.info.childId = pTask->selfChildId;
    taosArrayPush(pRes, &block);
  }

  return 0;
}

/*
 * Repeatedly run a source task's executor, pack the produced blocks into batches of at
 * most batchSz blocks, and hand each batch to streamTaskOutput (followed by
 * streamDispatch for fixed/shuffle dispatch outputs) until
 * qStreamRecoverScanFinished() reports completion.
 *
 * pTask:   source-level task (asserted).
 * batchSz: maximum number of blocks collected before a batch is emitted.
 *
 * Returns 0 on completion or when the task is asked to stop, -1 with terrno set to
 * TSDB_CODE_OUT_OF_MEMORY on allocation failure, or
 * TSDB_CODE_UTIL_QUEUE_OUT_OF_MEMORY when streamTaskOutput reports it.
 */
int32_t streamScanExec(SStreamTask* pTask, int32_t batchSz) {
  int32_t code = 0;

  ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);

  void* exec = pTask->exec.pExecutor;

  qSetStreamOpOpen(exec);
  bool finished = false;

  while (1) {
    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
    if (pRes == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    int32_t batchCnt = 0;
    while (1) {
      if (streamTaskShouldStop(&pTask->status)) {
        // pRes may already hold copied blocks; release their payload too, as the
        // other error paths in this function do.
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        return 0;
      }

      SSDataBlock* output = NULL;
      uint64_t     ts = 0;
      if (qExecTask(exec, &output, &ts) < 0) {
        continue;
      }
      if (output == NULL) {
        if (qStreamRecoverScanFinished(exec)) {
          finished = true;
        } else {
          qSetStreamOpOpen(exec);
        }
        break;
      }

      SSDataBlock block = {0};
      assignOneDataBlock(&block, output);
      block.info.childId = pTask->selfChildId;
      taosArrayPush(pRes, &block);

      batchCnt++;

      qDebug("task %d scan exec block num %d, block limit %d", pTask->id.taskId, batchCnt, batchSz);

      if (batchCnt >= batchSz) break;
    }

    if (taosArrayGetSize(pRes) == 0) {
      // Nothing to emit in this round: the empty array is released on both paths so
      // that retrying does not leak one array per iteration.
      taosArrayDestroy(pRes);
      if (finished) {
        qDebug("task %d finish recover exec task ", pTask->id.taskId);
        break;
      } else {
        qDebug("task %d continue recover exec task ", pTask->id.taskId);
        continue;
      }
    }

    SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
    if (qRes == NULL) {
      taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    qRes->type = STREAM_INPUT__DATA_BLOCK;
    qRes->blocks = pRes;
    code = streamTaskOutput(pTask, qRes);
    if (code == TSDB_CODE_UTIL_QUEUE_OUT_OF_MEMORY) {
      // The batch was not accepted: release the block array and the queue item
      // separately (pRes is an SArray, not a queue item).
      taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
      taosFreeQitem(qRes);
      return code;
    }

    if (pTask->outputType == TASK_OUTPUT__FIXED_DISPATCH || pTask->outputType == TASK_OUTPUT__SHUFFLE_DISPATCH) {
      qDebug("task %d scan exec dispatch block num %d", pTask->id.taskId, batchCnt);
      streamDispatch(pTask);
    }

    if (finished) {
      break;
    }
  }
  return 0;
}

#if 0
// Disabled draft of a batch-oriented executor; kept for reference only and never compiled.
int32_t streamBatchExec(SStreamTask* pTask, int32_t batchLimit) {
  // fetch all queue item, merge according to batchLimit
  int32_t numOfItems = taosReadAllQitems(pTask->inputQueue1, pTask->inputQall);
  if (numOfItems == 0) {
    qDebug("task: %d, stream task exec over, queue empty", pTask->id.taskId);
    return 0;
  }

  SStreamQueueItem* pMerged = NULL;
  SStreamQueueItem* pItem = NULL;
  taosGetQitem(pTask->inputQall, (void**)&pItem);
  if (pItem == NULL) {
    if (pMerged == NULL) {
      return 0;
    }
    // process merged item
  }

  // if drop
  if (pItem->type == STREAM_INPUT__DESTROY) {
    // set status drop
    return -1;
  }

  if (pTask->taskLevel == TASK_LEVEL__SINK) {
    ASSERT(((SStreamQueueItem*)pItem)->type == STREAM_INPUT__DATA_BLOCK);
    streamTaskOutput(pTask, (SStreamDataBlock*)pItem);
  }

  // exec impl

  // output
  // try dispatch
  return 0;
}
#endif
/*
 * Drain the task's input queue: merge consecutive items into a batch, execute the batch
 * (or forward it directly for sink tasks), persist the checkpoint when the executor's
 * data version advanced, and push any produced blocks downstream via streamTaskOutput.
 *
 * Returns 0 when the queue is empty or the task is asked to stop, and -1 on allocation
 * failure, meta commit failure, or when streamTaskOutput reports
 * TSDB_CODE_UTIL_QUEUE_OUT_OF_MEMORY.
 */
int32_t streamExecForAll(SStreamTask* pTask) {
  int32_t code = 0;
  while (1) {
    int32_t batchSize = 1;
    void*   pInput = NULL;

    // merge multiple input data if possible in the input queue.
    while (1) {
      SStreamQueueItem* qItem = streamQueueNextItem(pTask->inputQueue);
      if (qItem == NULL) {
        // queue is empty
        break;
      }

      if (pInput == NULL) {
        pInput = qItem;
        streamQueueProcessSuccess(pTask->inputQueue);
        // sink tasks forward items one at a time, without merging
        if (pTask->taskLevel == TASK_LEVEL__SINK) {
          break;
        }
      } else {
        void* newRet = NULL;
        if ((newRet = streamMergeQueueItem(pInput, qItem)) == NULL) {
          // item could not be merged into the current batch
          streamQueueProcessFail(pTask->inputQueue);
          break;
        } else {
          batchSize++;
          pInput = newRet;
          streamQueueProcessSuccess(pTask->inputQueue);
          if (batchSize > STREAM_EXEC_MAX_BATCH_NUM) {
            break;
          }
        }
      }
    }

    if (streamTaskShouldStop(&pTask->status)) {
      if (pInput) {
        streamFreeQitem(pInput);
      }
      return 0;
    }

    if (pInput == NULL) {
      break;
    }

    if (pTask->taskLevel == TASK_LEVEL__SINK) {
      ASSERT(((SStreamQueueItem*)pInput)->type == STREAM_INPUT__DATA_BLOCK);
      qDebug("s-task:%s sink node start to sink result. numOfBlocks:%d", pTask->id.idStr, batchSize);
      // pInput is not freed here; presumably streamTaskOutput takes it over -- confirm against its implementation
      streamTaskOutput(pTask, pInput);
      continue;
    }

    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
    if (pRes == NULL) {
      // Without a result array there is nowhere to collect output; give up on this batch.
      qError("s-task:%s failed to allocate result array", pTask->id.idStr);
      streamFreeQitem(pInput);
      return -1;
    }
    qDebug("s-task:%s exec begin, numOfBlocks:%d", pTask->id.idStr, batchSize);

    streamTaskExecImpl(pTask, pInput, pRes);

    int64_t ckId = 0;
    int64_t dataVer = 0;
    qGetCheckpointVersion(pTask->exec.pExecutor, &dataVer, &ckId);
    if (dataVer > pTask->chkInfo.version) {    // save it since the checkpoint is updated
      qDebug("s-task:%s exec end, start to update check point, ver from %" PRId64 " to %" PRId64
             ", checkPoint id:%" PRId64 " -> %" PRId64,
             pTask->id.idStr, pTask->chkInfo.version, dataVer, pTask->chkInfo.id, ckId);

      pTask->chkInfo = (SCheckpointInfo) {.version = dataVer, .id = ckId, .currentVer = pTask->chkInfo.currentVer};

      taosWLockLatch(&pTask->pMeta->lock);
      streamMetaSaveTask(pTask->pMeta, pTask);
      if (streamMetaCommit(pTask->pMeta) < 0) {
        taosWUnLockLatch(&pTask->pMeta->lock);
        qError("s-task:%s failed to commit stream meta, since %s", pTask->id.idStr, terrstr());
        // Release the collected output and the input batch before bailing out.
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        return -1;
      } else {
        taosWUnLockLatch(&pTask->pMeta->lock);
        qDebug("s-task:%s update checkpoint ver succeed", pTask->id.idStr);
      }
    } else {
      qDebug("s-task:%s exec end", pTask->id.idStr);
    }

    if (taosArrayGetSize(pRes) != 0) {
      SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
      if (qRes == NULL) {
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        return -1;
      }

      qRes->type = STREAM_INPUT__DATA_BLOCK;
      qRes->blocks = pRes;

      // Submit-derived results carry the source version and this task's child id.
      if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__DATA_SUBMIT) {
        SStreamDataSubmit2* pSubmit = (SStreamDataSubmit2*)pInput;
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pSubmit->ver;
      } else if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__MERGED_SUBMIT) {
        SStreamMergedSubmit2* pMerged = (SStreamMergedSubmit2*)pInput;
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pMerged->ver;
      }

      code = streamTaskOutput(pTask, qRes);
      if (code == TSDB_CODE_UTIL_QUEUE_OUT_OF_MEMORY) {
        // backpressure and record position
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        taosFreeQitem(qRes);
        return -1;
      }
    } else {
      taosArrayDestroy(pRes);
    }
    streamFreeQitem(pInput);
  }
  return 0;
}

/*
 * Try to claim the task for execution and, if claimed, process its input queue.
 *
 * The schedule status is atomically switched from WAITING to ACTIVE; callers that do
 * not observe WAITING return 0 without doing any work. On success the status becomes
 * INACTIVE and the task is rescheduled if input is still queued and the task is not
 * stopping. On failure of streamExecForAll the status becomes FAILED and -1 is returned.
 */
int32_t streamTryExec(SStreamTask* pTask) {
  // this function may be executed by multi-threads, so status check is required.
  int8_t prevSched =
      atomic_val_compare_exchange_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__WAITING, TASK_SCHED_STATUS__ACTIVE);
  if (prevSched != TASK_SCHED_STATUS__WAITING) {
    return 0;
  }

  int32_t execCode = streamExecForAll(pTask);
  if (execCode < 0) {
    atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__FAILED);
    return -1;
  }

  // todo the task should be commit here
  atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);
  qDebug("s-task:%s exec completed", pTask->id.idStr);

  // Items may have arrived after the queue was drained; schedule another round for them.
  bool hasPendingInput = !taosQueueEmpty(pTask->inputQueue->queue);
  if (hasPendingInput && !streamTaskShouldStop(&pTask->status)) {
    streamSchedExec(pTask);
  }

  return 0;
}