streamExec.c 12.3 KB
Newer Older
L
Liu Jicong 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "streamInc.h"
L
Liu Jicong 已提交
17

5
54liuyao 已提交
18 19
// Threshold used by streamExecForAll() while merging input queue items into one batch:
// merging stops as soon as the number of merged items exceeds this value.
#define STREAM_EXEC_MAX_BATCH_NUM 100

20 21 22 23 24
// Tells whether the task is stopping or being dropped.
// The status byte is fetched with an atomic load; const is cast away only to match the loader's parameter type.
bool streamTaskShouldStop(const SStreamStatus* pStatus) {
  const int32_t taskStatus = atomic_load_8((int8_t*)&pStatus->taskStatus);

  if (taskStatus == TASK_STATUS__STOP) {
    return true;
  }
  return taskStatus == TASK_STATUS__DROPPING;
}

L
Liu Jicong 已提交
25
/**
 * Feed one input item into the task's executor and collect every block the executor produces.
 *
 * @param pTask task whose executor (pTask->exec.pExecutor) is driven
 * @param data  input item; it is first read as a SStreamQueueItem and then re-interpreted
 *              according to its type field
 * @param pRes  array of SSDataBlock; a copy of each produced block is appended to it
 * @return always 0, including the early returns taken when the task is stopping or being dropped
 */
static int32_t streamTaskExecImpl(SStreamTask* pTask, const void* data, SArray* pRes) {
  int32_t code = TSDB_CODE_SUCCESS;
  void*   pExecutor = pTask->exec.pExecutor;

  // a source task only starts executing once its status is TASK_STATUS__NORMAL
  while (pTask->taskLevel == TASK_LEVEL__SOURCE) {
    int8_t status = atomic_load_8(&pTask->status.taskStatus);
    if (status == TASK_STATUS__NORMAL) {
      break;
    }

    // without this check the loop keeps spinning for as long as the status stays STOP/DROPPING;
    // bail out the same way the execution loop below does
    if (streamTaskShouldStop(&pTask->status)) {
      return 0;
    }

    qError("stream task wait for the end of fill history, s-task:%s, status:%d", pTask->id.idStr, status);
    taosMsleep(2);
  }

  // set input
  const SStreamQueueItem* pItem = (const SStreamQueueItem*)data;
  if (pItem->type == STREAM_INPUT__GET_RES) {
    const SStreamTrigger* pTrigger = (const SStreamTrigger*)data;
    qSetMultiStreamInput(pExecutor, pTrigger->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
  } else if (pItem->type == STREAM_INPUT__DATA_SUBMIT) {
    ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);
    const SStreamDataSubmit2* pSubmit = (const SStreamDataSubmit2*)data;
    qSetMultiStreamInput(pExecutor, &pSubmit->submit, 1, STREAM_INPUT__DATA_SUBMIT);
    qDebug("s-task:%s set submit blocks as source block completed, %p %p len:%d ver:%" PRId64, pTask->id.idStr, pSubmit, pSubmit->submit.msgStr,
           pSubmit->submit.msgLen, pSubmit->submit.ver);
  } else if (pItem->type == STREAM_INPUT__DATA_BLOCK || pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
    const SStreamDataBlock* pBlock = (const SStreamDataBlock*)data;

    SArray* pBlockList = pBlock->blocks;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
    qDebug("s-task:%s set sdata blocks as input num:%d, ver:%"PRId64, pTask->id.idStr, numOfBlocks, pBlock->sourceVer);
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__DATA_BLOCK);
  } else if (pItem->type == STREAM_INPUT__MERGED_SUBMIT) {
    const SStreamMergedSubmit2* pMerged = (const SStreamMergedSubmit2*)data;

    SArray* pBlockList = pMerged->submits;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
    qDebug("st-task:%s %p set submit input (merged), batch num:%d", pTask->id.idStr, pTask, numOfBlocks);
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__MERGED_SUBMIT);
  } else if (pItem->type == STREAM_INPUT__REF_DATA_BLOCK) {
    const SStreamRefDataBlock* pRefBlock = (const SStreamRefDataBlock*)data;
    qSetMultiStreamInput(pExecutor, pRefBlock->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
  } else {
    // no other input type is handled here
    ASSERT(0);
  }

  // run the executor until it yields no more output
  while (1) {
    if (streamTaskShouldStop(&pTask->status)) {
      return 0;
    }

    SSDataBlock* output = NULL;
    uint64_t     ts = 0;
    if ((code = qExecTask(pExecutor, &output, &ts)) < 0) {
      if (code == TSDB_CODE_QRY_IN_EXEC) {
        resetTaskInfo(pExecutor);
      }

      // the failed call is logged and then retried
      qError("unexpected stream execution, s-task:%s since %s", pTask->id.idStr, terrstr());
      continue;
    }

    if (output == NULL) {
      // for a retrieve request, append a copy of the request block re-typed as STREAM_PULL_OVER
      if (pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
        SSDataBlock block = {0};

        const SStreamDataBlock* pRetrieveBlock = (const SStreamDataBlock*)data;
        ASSERT(taosArrayGetSize(pRetrieveBlock->blocks) == 1);

        assignOneDataBlock(&block, taosArrayGet(pRetrieveBlock->blocks, 0));
        block.info.type = STREAM_PULL_OVER;
        block.info.childId = pTask->selfChildId;
        taosArrayPush(pRes, &block);

        qDebug("task %d(child %d) processed retrieve, reqId %" PRId64, pTask->id.taskId, pTask->selfChildId,
               pRetrieveBlock->reqId);
      }
      break;
    }

    // retrieve blocks are broadcast to the children and are not added to the result array
    if (output->info.type == STREAM_RETRIEVE) {
      if (streamBroadcastToChildren(pTask, output) < 0) {
        // TODO
      }
      continue;
    }

    qDebug("s-task:%s (child %d) executed and get block", pTask->id.idStr, pTask->selfChildId);

    // append a copy of the produced block, tagged with this task's child id
    SSDataBlock block = {0};
    assignOneDataBlock(&block, output);
    block.info.childId = pTask->selfChildId;
    taosArrayPush(pRes, &block);
  }

  return 0;
}

125
/**
 * Drive the executor of a source task in scan mode and forward the produced blocks in batches.
 *
 * Each round collects up to batchSz blocks, wraps them in a SStreamDataBlock queue item and hands
 * the item to streamTaskOutput(); dispatch is triggered for fixed/shuffle dispatch outputs. Rounds
 * repeat until qStreamRecoverScanFinished() reports that the scan is finished.
 *
 * @param pTask   source-level task (asserted)
 * @param batchSz number of blocks after which a batch is flushed
 * @return 0 on completion or when the task is stopping/dropping; -1 with terrno set to
 *         TSDB_CODE_OUT_OF_MEMORY when an allocation fails
 */
int32_t streamScanExec(SStreamTask* pTask, int32_t batchSz) {
  ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);

  void* exec = pTask->exec.pExecutor;

  qSetStreamOpOpen(exec);
  bool finished = false;

  while (1) {
    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
    if (pRes == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    int32_t batchCnt = 0;
    while (1) {
      if (streamTaskShouldStop(&pTask->status)) {
        // blocks may already have been collected in this round: release them together with the
        // array, the same way the allocation-failure path below does
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        return 0;
      }

      SSDataBlock* output = NULL;
      uint64_t     ts = 0;
      if (qExecTask(exec, &output, &ts) < 0) {
        continue;
      }

      if (output == NULL) {
        if (qStreamRecoverScanFinished(exec)) {
          finished = true;
        } else {
          qSetStreamOpOpen(exec);
        }
        break;
      }

      SSDataBlock block = {0};
      assignOneDataBlock(&block, output);
      block.info.childId = pTask->selfChildId;
      taosArrayPush(pRes, &block);

      batchCnt++;

      qDebug("s-task:%s scan exec block num %d, block limit %d", pTask->id.idStr, batchCnt, batchSz);

      if (batchCnt >= batchSz) {
        break;
      }
    }

    if (taosArrayGetSize(pRes) == 0) {
      // nothing was produced in this round; the empty array must be released on both paths,
      // otherwise every empty round leaks one array before the next one is allocated
      taosArrayDestroy(pRes);

      if (finished) {
        qDebug("s-task:%s finish recover exec task ", pTask->id.idStr);
        break;
      } else {
        qDebug("s-task:%s continue recover exec task ", pTask->id.idStr);
        continue;
      }
    }

    SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
    if (qRes == NULL) {
      taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    // the queue item now carries the collected blocks
    qRes->type = STREAM_INPUT__DATA_BLOCK;
    qRes->blocks = pRes;
    streamTaskOutput(pTask, qRes);

    if (pTask->outputType == TASK_OUTPUT__FIXED_DISPATCH || pTask->outputType == TASK_OUTPUT__SHUFFLE_DISPATCH) {
      qDebug("task %d scan exec dispatch block num %d", pTask->id.taskId, batchCnt);
      streamDispatch(pTask);
    }

    if (finished) {
      break;
    }
  }
  return 0;
}

#if 0
// Disabled draft of a batch executor. Only the input fetching and the sink shortcut exist;
// merging, execution, output and dispatch are still placeholders.
int32_t streamBatchExec(SStreamTask* pTask, int32_t batchLimit) {
  // fetch all queue item, merge according to batchLimit
  int32_t nFetched = taosReadAllQitems(pTask->inputQueue1, pTask->inputQall);
  if (nFetched == 0) {
    qDebug("task: %d, stream task exec over, queue empty", pTask->id.taskId);
    return 0;
  }

  SStreamQueueItem* pMerged = NULL;
  SStreamQueueItem* pItem = NULL;
  taosGetQitem(pTask->inputQall, (void**)&pItem);

  // nothing fetched and nothing merged so far: done
  if (pItem == NULL && pMerged == NULL) {
    return 0;
  }
  // (pItem == NULL with a pending merged item: process merged item -- not implemented yet)

  // if drop
  if (pItem->type == STREAM_INPUT__DESTROY) {
    // set status drop
    return -1;
  }

  // a sink task forwards the item directly
  if (pTask->taskLevel == TASK_LEVEL__SINK) {
    ASSERT(((SStreamQueueItem*)pItem)->type == STREAM_INPUT__DATA_BLOCK);
    streamTaskOutput(pTask, (SStreamDataBlock*)pItem);
  }

  // exec impl

  // output
  // try dispatch
  return 0;
}
#endif
L
Liu Jicong 已提交
246

L
Liu Jicong 已提交
247
/**
 * Drain the task's input queue: merge queued items into batches, execute each batch and forward
 * the produced blocks.
 *
 * For every batch the function
 *   1. pulls items from pTask->inputQueue and merges them with streamMergeQueueItem();
 *   2. for a sink task, passes the (unmerged) item straight to streamTaskOutput();
 *   3. otherwise runs streamTaskExecImpl(), persists the checkpoint info when the executor reports
 *      a newer data version, and outputs the result blocks as one SStreamDataBlock item.
 *
 * @param pTask task to run
 * @return 0 when the queue is drained or the task is stopping/dropping; -1 on allocation failure,
 *         on failure to commit the stream meta, or when streamTaskOutput() fails
 */
int32_t streamExecForAll(SStreamTask* pTask) {
  while (1) {
    int32_t batchSize = 1;
    void*   pInput = NULL;

    // merge multiple input data if possible in the input queue.
    qDebug("s-task:%s start to extract data block from inputQ", pTask->id.idStr);

    while (1) {
      SStreamQueueItem* qItem = streamQueueNextItem(pTask->inputQueue);
      if (qItem == NULL) {
        break;
      }

      if (pInput == NULL) {
        pInput = qItem;
        streamQueueProcessSuccess(pTask->inputQueue);
        // a sink task handles one item at a time, no merging
        if (pTask->taskLevel == TASK_LEVEL__SINK) {
          break;
        }
      } else {
        void* newRet = NULL;
        if ((newRet = streamMergeQueueItem(pInput, qItem)) == NULL) {
          // the item could not be merged into the current batch
          streamQueueProcessFail(pTask->inputQueue);
          break;
        } else {
          batchSize++;
          pInput = newRet;
          streamQueueProcessSuccess(pTask->inputQueue);
          if (batchSize > STREAM_EXEC_MAX_BATCH_NUM) {
            break;
          }
        }
      }
    }

    if (streamTaskShouldStop(&pTask->status)) {
      if (pInput) {
        streamFreeQitem(pInput);
      }
      return 0;
    }

    // input queue is empty
    if (pInput == NULL) {
      break;
    }

    if (pTask->taskLevel == TASK_LEVEL__SINK) {
      ASSERT(((SStreamQueueItem*)pInput)->type == STREAM_INPUT__DATA_BLOCK);
      qDebug("s-task:%s sink node start to sink result. numOfBlocks:%d", pTask->id.idStr, batchSize);
      streamTaskOutput(pTask, pInput);
      continue;
    }

    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
    if (pRes == NULL) {
      // without a result array the batch cannot be executed; release the dequeued input
      streamFreeQitem(pInput);
      return -1;
    }

    qDebug("s-task:%s start to execute, numOfBlocks:%d", pTask->id.idStr, batchSize);

    streamTaskExecImpl(pTask, pInput, pRes);

    int64_t ckId = 0;
    int64_t dataVer = 0;
    qGetCheckpointVersion(pTask->exec.pExecutor, &dataVer, &ckId);
    if (dataVer > pTask->chkInfo.version) {    // save it since the checkpoint is updated
      qDebug("s-task:%s exec end, start to update check point, ver from %" PRId64 " to %" PRId64
             ", checkPoint id:%" PRId64 " -> %" PRId64,
             pTask->id.idStr, pTask->chkInfo.version, dataVer, pTask->chkInfo.id, ckId);

      pTask->chkInfo = (SCheckpointInfo) {.version = dataVer, .id = ckId, .currentVer = pTask->chkInfo.currentVer};

      taosWLockLatch(&pTask->pMeta->lock);

      streamMetaSaveTask(pTask->pMeta, pTask);
      if (streamMetaCommit(pTask->pMeta) < 0) {
        taosWUnLockLatch(&pTask->pMeta->lock);
        qError("s-task:%s failed to commit stream meta, since %s", pTask->id.idStr, terrstr());

        // release the produced blocks and the input item, as the other error returns below do
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        return -1;
      } else {
        taosWUnLockLatch(&pTask->pMeta->lock);
        qDebug("s-task:%s update checkpoint ver succeed", pTask->id.idStr);
      }
    } else {
      qDebug("s-task:%s exec end", pTask->id.idStr);
    }

    if (taosArrayGetSize(pRes) != 0) {
      SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
      if (qRes == NULL) {
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        return -1;
      }

      qRes->type = STREAM_INPUT__DATA_BLOCK;
      qRes->blocks = pRes;

      // results of submit inputs carry this task's child id and the version of the input
      if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__DATA_SUBMIT) {
        SStreamDataSubmit2* pSubmit = (SStreamDataSubmit2*)pInput;
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pSubmit->ver;
      } else if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__MERGED_SUBMIT) {
        SStreamMergedSubmit2* pMerged = (SStreamMergedSubmit2*)pInput;
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pMerged->ver;
      }

      if (streamTaskOutput(pTask, qRes) < 0) {
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        taosFreeQitem(qRes);
        return -1;
      }
    } else {
      taosArrayDestroy(pRes);
    }
    streamFreeQitem(pInput);
  }
  return 0;
}

L
Liu Jicong 已提交
366
/**
 * Run the task if it is currently waiting to be scheduled.
 *
 * The schedule status is switched WAITING -> ACTIVE with a compare-and-exchange, so only the caller
 * that performs the switch runs streamExecForAll(). Afterwards the status becomes INACTIVE (or
 * FAILED when execution fails), and the task is scheduled again if its input queue is not empty
 * and the task is not stopping.
 *
 * @return -1 when streamExecForAll() fails, 0 otherwise (including when the task was not waiting)
 */
int32_t streamTryExec(SStreamTask* pTask) {
  // this function may be executed by multi-threads, so status check is required.
  int8_t prevStatus =
      atomic_val_compare_exchange_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__WAITING, TASK_SCHED_STATUS__ACTIVE);
  if (prevStatus != TASK_SCHED_STATUS__WAITING) {
    return 0;
  }

  if (streamExecForAll(pTask) < 0) {
    atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__FAILED);
    return -1;
  }

  // todo the task should be commit here
  atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);
  qDebug("s-task:%s exec completed", pTask->id.idStr);

  // items may still be queued after the run: ask for another round
  bool hasPending = !taosQueueEmpty(pTask->inputQueue->queue);
  if (hasPending && !streamTaskShouldStop(&pTask->status)) {
    streamSchedExec(pTask);
  }

  return 0;
}