streamExec.c 12.3 KB
Newer Older
L
Liu Jicong 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "streamInc.h"
L
Liu Jicong 已提交
17

5
54liuyao 已提交
18 19
// Cap used by streamExecForAll() while merging input-queue items into a single
// executor input: merging stops once the running batch size exceeds this value.
#define STREAM_EXEC_MAX_BATCH_NUM 100

20 21 22 23 24
/**
 * Report whether a task has been asked to terminate.
 *
 * @param pStatus status record of the task; taskStatus is read atomically
 * @return true when the task status is TASK_STATUS__STOP or TASK_STATUS__DROPPING
 */
bool streamTaskShouldStop(const SStreamStatus* pStatus) {
  int32_t curStatus = atomic_load_8((int8_t*) &pStatus->taskStatus);

  if (curStatus == TASK_STATUS__STOP) {
    return true;
  }
  if (curStatus == TASK_STATUS__DROPPING) {
    return true;
  }
  return false;
}

L
Liu Jicong 已提交
25
/**
 * Hand one (possibly merged) input item to the task's executor and drain the
 * executor, appending every produced block to pRes.
 *
 * @param pTask task whose executor (pTask->exec.pExecutor) is driven
 * @param data  input queue item; SStreamQueueItem.type selects how it is interpreted
 * @param pRes  array of SSDataBlock; each output block is run through
 *              assignOneDataBlock() into a fresh SSDataBlock that is pushed here
 * @return 0 once the executor yields no more output, or when the task is
 *         stopping/dropping; -1 with terrno set when a block cannot be
 *         appended to pRes
 */
static int32_t streamTaskExecImpl(SStreamTask* pTask, const void* data, SArray* pRes) {
  int32_t code = TSDB_CODE_SUCCESS;
  void*   pExecutor = pTask->exec.pExecutor;

  // A source task proceeds only in NORMAL or RESTORE status; otherwise poll every 2ms.
  while (pTask->taskLevel == TASK_LEVEL__SOURCE) {
    int8_t status = atomic_load_8(&pTask->status.taskStatus);
    if (status == TASK_STATUS__NORMAL || status == TASK_STATUS__RESTORE) {
      break;
    }

    // A stopping/dropping task must not keep polling here; leave the same way
    // the executor loop below does when it observes a stop request.
    if (status == TASK_STATUS__STOP || status == TASK_STATUS__DROPPING) {
      return 0;
    }

    // log the value that was actually tested instead of re-reading the status
    qError("stream task wait for the end of fill history, s-task:%s, status:%d", pTask->id.idStr, status);
    taosMsleep(2);
  }

  // set input
  const SStreamQueueItem* pItem = (const SStreamQueueItem*)data;
  if (pItem->type == STREAM_INPUT__GET_RES) {
    const SStreamTrigger* pTrigger = (const SStreamTrigger*)data;
    qSetMultiStreamInput(pExecutor, pTrigger->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
  } else if (pItem->type == STREAM_INPUT__DATA_SUBMIT) {
    ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);
    const SStreamDataSubmit2* pSubmit = (const SStreamDataSubmit2*)data;
    qSetMultiStreamInput(pExecutor, &pSubmit->submit, 1, STREAM_INPUT__DATA_SUBMIT);
    qDebug("s-task:%s set submit blocks as source block completed, %p %p len:%d ver:%" PRId64, pTask->id.idStr, pSubmit, pSubmit->submit.msgStr,
           pSubmit->submit.msgLen, pSubmit->submit.ver);
  } else if (pItem->type == STREAM_INPUT__DATA_BLOCK || pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
    const SStreamDataBlock* pBlock = (const SStreamDataBlock*)data;

    SArray* pBlockList = pBlock->blocks;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
    qDebug("s-task:%s set sdata blocks as input num:%d, ver:%"PRId64, pTask->id.idStr, numOfBlocks, pBlock->sourceVer);
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__DATA_BLOCK);
  } else if (pItem->type == STREAM_INPUT__MERGED_SUBMIT) {
    const SStreamMergedSubmit2* pMerged = (const SStreamMergedSubmit2*)data;

    SArray* pBlockList = pMerged->submits;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
    // prefix fixed from "st-task" to the "s-task" used by every other message
    qDebug("s-task:%s %p set submit input (merged), batch num:%d", pTask->id.idStr, pTask, numOfBlocks);
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__MERGED_SUBMIT);
  } else if (pItem->type == STREAM_INPUT__REF_DATA_BLOCK) {
    const SStreamRefDataBlock* pRefBlock = (const SStreamRefDataBlock*)data;
    qSetMultiStreamInput(pExecutor, pRefBlock->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
  } else {
    ASSERT(0);
  }

  // drain the executor
  while (1) {
    if (streamTaskShouldStop(&pTask->status)) {
      return 0;
    }

    SSDataBlock* output = NULL;
    uint64_t     ts = 0;
    if ((code = qExecTask(pExecutor, &output, &ts)) < 0) {
      if (code == TSDB_CODE_QRY_IN_EXEC) {
        resetTaskInfo(pExecutor);
      }

      qError("unexpected stream execution, s-task:%s since %s", pTask->id.idStr, terrstr());
      continue;
    }

    if (output == NULL) {
      // No more output. For a retrieve request, answer with a STREAM_PULL_OVER
      // block built from the single block carried by the request.
      if (pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
        SSDataBlock block = {0};

        const SStreamDataBlock* pRetrieveBlock = (const SStreamDataBlock*)data;
        ASSERT(taosArrayGetSize(pRetrieveBlock->blocks) == 1);

        assignOneDataBlock(&block, taosArrayGet(pRetrieveBlock->blocks, 0));
        block.info.type = STREAM_PULL_OVER;
        block.info.childId = pTask->selfChildId;
        if (taosArrayPush(pRes, &block) == NULL) {
          // the array did not take ownership, so release the block here
          blockDataFreeRes(&block);
          terrno = TSDB_CODE_OUT_OF_MEMORY;
          return -1;
        }

        qDebug("task %d(child %d) processed retrieve, reqId %" PRId64, pTask->id.taskId, pTask->selfChildId,
               pRetrieveBlock->reqId);
      }
      break;
    }

    if (output->info.type == STREAM_RETRIEVE) {
      if (streamBroadcastToChildren(pTask, output) < 0) {
        // TODO
      }
      continue;
    }

    qDebug("s-task:%s (child %d) executed and get block", pTask->id.idStr, pTask->selfChildId);

    SSDataBlock block = {0};
    assignOneDataBlock(&block, output);
    block.info.childId = pTask->selfChildId;
    if (taosArrayPush(pRes, &block) == NULL) {
      // the array did not take ownership, so release the block here
      blockDataFreeRes(&block);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
  }

  return 0;
}

125
/**
 * Run the executor of a source task in scan mode and emit its output in
 * batches of at most batchSz blocks until qStreamRecoverScanFinished()
 * reports that the scan is done.
 *
 * Each batch is wrapped in an SStreamDataBlock queue item and handed to
 * streamTaskOutput(); for fixed/shuffle dispatch outputs streamDispatch() is
 * triggered afterwards.
 *
 * @param pTask   source-level task (asserted)
 * @param batchSz maximum number of blocks collected before a batch is emitted
 * @return 0 when the scan finished or the task is stopping/dropping;
 *         -1 with terrno = TSDB_CODE_OUT_OF_MEMORY on allocation failure
 */
int32_t streamScanExec(SStreamTask* pTask, int32_t batchSz) {
  ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);

  void* exec = pTask->exec.pExecutor;

  qSetStreamOpOpen(exec);
  bool finished = false;

  while (1) {
    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
    if (pRes == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    int32_t batchCnt = 0;
    while (1) {
      if (streamTaskShouldStop(&pTask->status)) {
        // pRes may already hold blocks collected earlier in this batch, so
        // their contents must be released together with the array.
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        return 0;
      }

      SSDataBlock* output = NULL;
      uint64_t     ts = 0;
      if (qExecTask(exec, &output, &ts) < 0) {
        continue;
      }
      if (output == NULL) {
        if (qStreamRecoverScanFinished(exec)) {
          finished = true;
        } else {
          qSetStreamOpOpen(exec);
        }
        break;
      }

      SSDataBlock block = {0};
      assignOneDataBlock(&block, output);
      block.info.childId = pTask->selfChildId;
      if (taosArrayPush(pRes, &block) == NULL) {
        // the array did not take ownership of this block; free it and the batch
        blockDataFreeRes(&block);
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        terrno = TSDB_CODE_OUT_OF_MEMORY;
        return -1;
      }

      batchCnt++;

      qDebug("task %d scan exec block num %d, block limit %d", pTask->id.taskId, batchCnt, batchSz);

      if (batchCnt >= batchSz) break;
    }

    if (taosArrayGetSize(pRes) == 0) {
      // nothing collected: the empty array is released on both paths, since
      // the next outer iteration allocates a fresh one
      taosArrayDestroy(pRes);
      if (finished) {
        qDebug("task %d finish recover exec task ", pTask->id.taskId);
        break;
      } else {
        qDebug("task %d continue recover exec task ", pTask->id.taskId);
        continue;
      }
    }

    SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
    if (qRes == NULL) {
      taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    qRes->type = STREAM_INPUT__DATA_BLOCK;
    qRes->blocks = pRes;
    // NOTE(review): the return value is ignored here while streamExecForAll()
    // checks it; confirm whether streamTaskOutput() can fail on this path.
    streamTaskOutput(pTask, qRes);

    if (pTask->outputType == TASK_OUTPUT__FIXED_DISPATCH || pTask->outputType == TASK_OUTPUT__SHUFFLE_DISPATCH) {
      qDebug("task %d scan exec dispatch block num %d", pTask->id.taskId, batchCnt);
      streamDispatch(pTask);
    }

    if (finished) {
      break;
    }
  }
  return 0;
}

#if 0
// Compiled-out draft of a batch-oriented executor; only the skeleton exists.
int32_t streamBatchExec(SStreamTask* pTask, int32_t batchLimit) {
  // fetch all queue item, merge according to batchLimit
  int32_t nFetched = taosReadAllQitems(pTask->inputQueue1, pTask->inputQall);
  if (nFetched == 0) {
    qDebug("task: %d, stream task exec over, queue empty", pTask->id.taskId);
    return 0;
  }

  SStreamQueueItem* pMerged = NULL;
  SStreamQueueItem* pItem = NULL;
  taosGetQitem(pTask->inputQall, (void**)&pItem);
  if (pItem == NULL && pMerged == NULL) {
    return 0;
  }
  // pItem == NULL with a pending merged item: process merged item (not written yet)

  // if drop
  if (pItem->type == STREAM_INPUT__DESTROY) {
    // set status drop
    return -1;
  }

  if (pTask->taskLevel == TASK_LEVEL__SINK) {
    ASSERT(((SStreamQueueItem*)pItem)->type == STREAM_INPUT__DATA_BLOCK);
    streamTaskOutput(pTask, (SStreamDataBlock*)pItem);
  }

  // exec impl

  // output
  // try dispatch
  return 0;
}
#endif
L
Liu Jicong 已提交
242

L
Liu Jicong 已提交
243
/**
 * Consume the task's input queue until it is empty: merge queued items into
 * batches, run each batch through the executor, persist the checkpoint when
 * the executor reports a newer data version, and forward the results.
 *
 * Sink-level tasks skip the executor and pass each input item straight to
 * streamTaskOutput().
 *
 * @param pTask task to execute
 * @return 0 when the queue is drained or the task is stopping/dropping;
 *         -1 when an allocation, the meta commit, or the output step fails
 */
int32_t streamExecForAll(SStreamTask* pTask) {
  while (1) {
    int32_t batchSize = 1;
    void*   pInput = NULL;

    // merge multiple input data if possible in the input queue.
    while (1) {
      SStreamQueueItem* qItem = streamQueueNextItem(pTask->inputQueue);
      if (qItem == NULL) {
        // input queue is empty
        break;
      }

      if (pInput == NULL) {
        pInput = qItem;
        streamQueueProcessSuccess(pTask->inputQueue);
        if (pTask->taskLevel == TASK_LEVEL__SINK) {
          // sink tasks handle one item at a time, no merging
          break;
        }
      } else {
        void* newRet = NULL;
        if ((newRet = streamMergeQueueItem(pInput, qItem)) == NULL) {
          // item cannot be merged into the current batch; leave it for the next round
          streamQueueProcessFail(pTask->inputQueue);
          break;
        } else {
          batchSize++;
          pInput = newRet;
          streamQueueProcessSuccess(pTask->inputQueue);
          if (batchSize > STREAM_EXEC_MAX_BATCH_NUM) {
            break;
          }
        }
      }
    }

    if (streamTaskShouldStop(&pTask->status)) {
      if (pInput) {
        streamFreeQitem(pInput);
      }
      return 0;
    }

    if (pInput == NULL) {
      break;
    }

    if (pTask->taskLevel == TASK_LEVEL__SINK) {
      ASSERT(((SStreamQueueItem*)pInput)->type == STREAM_INPUT__DATA_BLOCK);
      qDebug("s-task:%s sink node start to sink result. numOfBlocks:%d", pTask->id.idStr, batchSize);
      streamTaskOutput(pTask, pInput);
      continue;
    }

    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
    if (pRes == NULL) {
      // same handling as streamScanExec(); the input was already taken off the queue
      streamFreeQitem(pInput);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    qDebug("s-task:%s exec begin, numOfBlocks:%d", pTask->id.idStr, batchSize);

    streamTaskExecImpl(pTask, pInput, pRes);

    int64_t ckId = 0;
    int64_t dataVer = 0;
    qGetCheckpointVersion(pTask->exec.pExecutor, &dataVer, &ckId);
    if (dataVer > pTask->chkInfo.version) {    // save it since the checkpoint is updated
      qDebug("s-task:%s exec end, start to update check point, ver from %" PRId64 " to %" PRId64
             ", checkPoint id:%" PRId64 " -> %" PRId64,
             pTask->id.idStr, pTask->chkInfo.version, dataVer, pTask->chkInfo.id, ckId);

      pTask->chkInfo = (SCheckpointInfo) {.version = dataVer, .id = ckId, .currentVer = pTask->chkInfo.currentVer};

      taosWLockLatch(&pTask->pMeta->lock);
      streamMetaSaveTask(pTask->pMeta, pTask);
      if (streamMetaCommit(pTask->pMeta) < 0) {
        taosWUnLockLatch(&pTask->pMeta->lock);
        qError("s-task:%s failed to commit stream meta, since %s", pTask->id.idStr, terrstr());
        // release the results and the consumed input before bailing out
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        return -1;
      } else {
        taosWUnLockLatch(&pTask->pMeta->lock);
        qDebug("s-task:%s update checkpoint ver succeed", pTask->id.idStr);
      }
    } else {
      qDebug("s-task:%s exec end", pTask->id.idStr);
    }

    if (taosArrayGetSize(pRes) != 0) {
      SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
      if (qRes == NULL) {
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        return -1;
      }

      qRes->type = STREAM_INPUT__DATA_BLOCK;
      qRes->blocks = pRes;

      // results of submit-type inputs carry this task's child id and the input's version
      if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__DATA_SUBMIT) {
        SStreamDataSubmit2* pSubmit = (SStreamDataSubmit2*)pInput;
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pSubmit->ver;
      } else if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__MERGED_SUBMIT) {
        SStreamMergedSubmit2* pMerged = (SStreamMergedSubmit2*)pInput;
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pMerged->ver;
      }

      if (streamTaskOutput(pTask, qRes) < 0) {
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
        streamFreeQitem(pInput);
        taosFreeQitem(qRes);
        return -1;
      }
    } else {
      taosArrayDestroy(pRes);
    }
    streamFreeQitem(pInput);
  }
  return 0;
}

L
Liu Jicong 已提交
360
/**
 * Try to run the task once. Several threads may call this concurrently, so the
 * run is gated on switching schedStatus from WAITING to ACTIVE.
 *
 * @param pTask task to execute
 * @return 0 when the task ran to completion or was not in WAITING state;
 *         -1 when streamExecForAll() failed (schedStatus is set to FAILED)
 */
int32_t streamTryExec(SStreamTask* pTask) {
  int8_t prevSched =
      atomic_val_compare_exchange_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__WAITING, TASK_SCHED_STATUS__ACTIVE);

  // anything other than WAITING means this call must not execute the task
  if (prevSched != TASK_SCHED_STATUS__WAITING) {
    return 0;
  }

  if (streamExecForAll(pTask) < 0) {
    atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__FAILED);
    return -1;
  }

  // todo the task should be commit here
  atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);
  qDebug("s-task:%s exec completed", pTask->id.idStr);

  // input that arrived in the meantime gets another scheduling round, unless the task is stopping
  bool hasPendingInput = !taosQueueEmpty(pTask->inputQueue->queue);
  if (hasPendingInput && !streamTaskShouldStop(&pTask->status)) {
    streamSchedExec(pTask);
  }

  return 0;
}