streamExec.c 13.9 KB
Newer Older
L
Liu Jicong 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "streamInc.h"
L
Liu Jicong 已提交
17

H
Haojun Liao 已提交
18 19
// maximum allowed processed block batches. One block may include several submit blocks
#define MAX_STREAM_EXEC_BATCH_NUM 128
L
liuyao 已提交
20
#define MIN_STREAM_EXEC_BATCH_NUM 16
5
54liuyao 已提交
21

22
bool streamTaskShouldStop(const SStreamStatus* pStatus) {
dengyihao's avatar
dengyihao 已提交
23
  int32_t status = atomic_load_8((int8_t*)&pStatus->taskStatus);
24 25 26
  return (status == TASK_STATUS__STOP) || (status == TASK_STATUS__DROPPING);
}

L
liuyao 已提交
27
bool streamTaskShouldPause(const SStreamStatus* pStatus) {
dengyihao's avatar
dengyihao 已提交
28
  int32_t status = atomic_load_8((int8_t*)&pStatus->taskStatus);
L
liuyao 已提交
29 30 31
  return (status == TASK_STATUS__PAUSE);
}

H
Haojun Liao 已提交
32
static int32_t streamTaskExecImpl(SStreamTask* pTask, const void* data, SArray* pRes, int64_t* resSize) {
33 34
  int32_t code = TSDB_CODE_SUCCESS;
  void*   pExecutor = pTask->exec.pExecutor;
H
Haojun Liao 已提交
35
  *resSize = 0;
36

37
  while (pTask->taskLevel == TASK_LEVEL__SOURCE) {
38
    int8_t status = atomic_load_8(&pTask->status.taskStatus);
L
liuyao 已提交
39
    if (status != TASK_STATUS__NORMAL && status != TASK_STATUS__PAUSE) {
40
      qError("stream task wait for the end of fill history, s-task:%s, status:%d", pTask->id.idStr,
41
             atomic_load_8(&pTask->status.taskStatus));
42 43 44 45
      taosMsleep(2);
    } else {
      break;
    }
5
54liuyao 已提交
46
  }
L
Liu Jicong 已提交
47 48

  // set input
L
Liu Jicong 已提交
49
  const SStreamQueueItem* pItem = (const SStreamQueueItem*)data;
L
Liu Jicong 已提交
50
  if (pItem->type == STREAM_INPUT__GET_RES) {
L
Liu Jicong 已提交
51
    const SStreamTrigger* pTrigger = (const SStreamTrigger*)data;
52
    qSetMultiStreamInput(pExecutor, pTrigger->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
53
  } else if (pItem->type == STREAM_INPUT__DATA_SUBMIT) {
54
    ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);
55
    const SStreamDataSubmit* pSubmit = (const SStreamDataSubmit*)data;
56
    qSetMultiStreamInput(pExecutor, &pSubmit->submit, 1, STREAM_INPUT__DATA_SUBMIT);
dengyihao's avatar
dengyihao 已提交
57 58
    qDebug("s-task:%s set submit blocks as source block completed, %p %p len:%d ver:%" PRId64, pTask->id.idStr, pSubmit,
           pSubmit->submit.msgStr, pSubmit->submit.msgLen, pSubmit->submit.ver);
59
  } else if (pItem->type == STREAM_INPUT__DATA_BLOCK || pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
L
Liu Jicong 已提交
60
    const SStreamDataBlock* pBlock = (const SStreamDataBlock*)data;
61 62 63

    SArray* pBlockList = pBlock->blocks;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
dengyihao's avatar
dengyihao 已提交
64
    qDebug("s-task:%s set sdata blocks as input num:%d, ver:%" PRId64, pTask->id.idStr, numOfBlocks, pBlock->sourceVer);
65
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__DATA_BLOCK);
66
  } else if (pItem->type == STREAM_INPUT__MERGED_SUBMIT) {
67
    const SStreamMergedSubmit* pMerged = (const SStreamMergedSubmit*)data;
68 69 70

    SArray* pBlockList = pMerged->submits;
    int32_t numOfBlocks = taosArrayGetSize(pBlockList);
71
    qDebug("s-task:%s %p set submit input (merged), batch num:%d", pTask->id.idStr, pTask, numOfBlocks);
72
    qSetMultiStreamInput(pExecutor, pBlockList->pData, numOfBlocks, STREAM_INPUT__MERGED_SUBMIT);
L
Liu Jicong 已提交
73 74
  } else if (pItem->type == STREAM_INPUT__REF_DATA_BLOCK) {
    const SStreamRefDataBlock* pRefBlock = (const SStreamRefDataBlock*)data;
75
    qSetMultiStreamInput(pExecutor, pRefBlock->pBlock, 1, STREAM_INPUT__DATA_BLOCK);
76
  } else {
77
    ASSERT(0);
L
Liu Jicong 已提交
78 79
  }

80
  // pExecutor
L
Liu Jicong 已提交
81
  while (1) {
82
    if (streamTaskShouldStop(&pTask->status)) {
L
Liu Jicong 已提交
83 84 85
      return 0;
    }

L
Liu Jicong 已提交
86 87
    SSDataBlock* output = NULL;
    uint64_t     ts = 0;
88
    if ((code = qExecTask(pExecutor, &output, &ts)) < 0) {
5
54liuyao 已提交
89
      if (code == TSDB_CODE_QRY_IN_EXEC) {
90
        resetTaskInfo(pExecutor);
5
54liuyao 已提交
91
      }
92 93

      qError("unexpected stream execution, s-task:%s since %s", pTask->id.idStr, terrstr());
L
Liu Jicong 已提交
94
      continue;
L
Liu Jicong 已提交
95
    }
96

97
    if (output == NULL) {
5
54liuyao 已提交
98
      if (pItem->type == STREAM_INPUT__DATA_RETRIEVE) {
99 100
        SSDataBlock block = {0};

L
Liu Jicong 已提交
101
        const SStreamDataBlock* pRetrieveBlock = (const SStreamDataBlock*)data;
102
        ASSERT(taosArrayGetSize(pRetrieveBlock->blocks) == 1);
103

L
Liu Jicong 已提交
104
        assignOneDataBlock(&block, taosArrayGet(pRetrieveBlock->blocks, 0));
L
Liu Jicong 已提交
105
        block.info.type = STREAM_PULL_OVER;
L
Liu Jicong 已提交
106 107
        block.info.childId = pTask->selfChildId;
        taosArrayPush(pRes, &block);
L
Liu Jicong 已提交
108

H
Haojun Liao 已提交
109
        qDebug("s-task:%s(child %d) processed retrieve, reqId:0x%" PRIx64, pTask->id.idStr, pTask->selfChildId,
L
Liu Jicong 已提交
110
               pRetrieveBlock->reqId);
111
      }
H
Haojun Liao 已提交
112

113 114
      break;
    }
L
Liu Jicong 已提交
115 116 117 118 119 120 121 122

    if (output->info.type == STREAM_RETRIEVE) {
      if (streamBroadcastToChildren(pTask, output) < 0) {
        // TODO
      }
      continue;
    }

L
Liu Jicong 已提交
123 124 125
    SSDataBlock block = {0};
    assignOneDataBlock(&block, output);
    block.info.childId = pTask->selfChildId;
H
Haojun Liao 已提交
126 127

    (*resSize) += blockDataGetSize(output);
L
Liu Jicong 已提交
128
    taosArrayPush(pRes, &block);
H
Haojun Liao 已提交
129

H
Haojun Liao 已提交
130 131
    qDebug("s-task:%s (child %d) executed and get block, total blocks:%d, size:%.2fMiB", pTask->id.idStr, pTask->selfChildId, (int32_t)taosArrayGetSize(pRes),
        (*resSize)/1048576.0);
L
Liu Jicong 已提交
132
  }
133

L
Liu Jicong 已提交
134 135 136
  return 0;
}

137
int32_t streamScanExec(SStreamTask* pTask, int32_t batchSz) {
dengyihao's avatar
dengyihao 已提交
138
  int32_t code = 0;
139

dengyihao's avatar
dengyihao 已提交
140
  ASSERT(pTask->taskLevel == TASK_LEVEL__SOURCE);
141

142
  void* exec = pTask->exec.pExecutor;
143

L
Liu Jicong 已提交
144
  qSetStreamOpOpen(exec);
L
Liu Jicong 已提交
145
  bool finished = false;
L
Liu Jicong 已提交
146

147 148 149 150 151 152 153 154 155
  while (1) {
    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
    if (pRes == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    int32_t batchCnt = 0;
    while (1) {
L
liuyao 已提交
156
      if (streamTaskShouldStop(&pTask->status) || streamTaskShouldPause(&pTask->status)) {
L
liuyao 已提交
157
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
L
Liu Jicong 已提交
158 159 160
        return 0;
      }

161 162 163
      SSDataBlock* output = NULL;
      uint64_t     ts = 0;
      if (qExecTask(exec, &output, &ts) < 0) {
5
54liuyao 已提交
164
        continue;
165
      }
L
Liu Jicong 已提交
166
      if (output == NULL) {
L
Liu Jicong 已提交
167 168 169 170 171
        if (qStreamRecoverScanFinished(exec)) {
          finished = true;
        } else {
          qSetStreamOpOpen(exec);
        }
L
Liu Jicong 已提交
172 173
        break;
      }
174 175 176 177 178 179

      SSDataBlock block = {0};
      assignOneDataBlock(&block, output);
      block.info.childId = pTask->selfChildId;
      taosArrayPush(pRes, &block);

L
Liu Jicong 已提交
180 181
      batchCnt++;

182
      qDebug("s-task:%s scan exec numOfBlocks:%d, limit:%d", pTask->id.idStr, batchCnt, batchSz);
H
Haojun Liao 已提交
183 184 185
      if (batchCnt >= batchSz) {
        break;
      }
186
    }
H
Haojun Liao 已提交
187

188
    if (taosArrayGetSize(pRes) == 0) {
189 190
      if (finished) {
        taosArrayDestroy(pRes);
H
Haojun Liao 已提交
191
        qDebug("s-task:%s finish recover exec task ", pTask->id.idStr);
192 193
        break;
      } else {
H
Haojun Liao 已提交
194
        qDebug("s-task:%s continue recover exec task ", pTask->id.idStr);
195 196
        continue;
      }
197
    }
H
Haojun Liao 已提交
198

S
Shengliang Guan 已提交
199
    SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
200 201 202 203 204 205 206 207
    if (qRes == NULL) {
      taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    qRes->type = STREAM_INPUT__DATA_BLOCK;
    qRes->blocks = pRes;
dengyihao's avatar
dengyihao 已提交
208 209
    code = streamTaskOutput(pTask, qRes);
    if (code == TSDB_CODE_UTIL_QUEUE_OUT_OF_MEMORY) {
dengyihao's avatar
dengyihao 已提交
210
      taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
dengyihao's avatar
dengyihao 已提交
211
      taosFreeQitem(qRes);
dengyihao's avatar
dengyihao 已提交
212 213
      return code;
    }
L
Liu Jicong 已提交
214 215

    if (pTask->outputType == TASK_OUTPUT__FIXED_DISPATCH || pTask->outputType == TASK_OUTPUT__SHUFFLE_DISPATCH) {
216
      qDebug("s-task:%s scan exec dispatch blocks:%d", pTask->id.idStr, batchCnt);
L
Liu Jicong 已提交
217 218
      streamDispatch(pTask);
    }
219 220 221 222

    if (finished) {
      break;
    }
223 224 225 226 227
  }
  return 0;
}

#if 0
228 229 230 231
int32_t streamBatchExec(SStreamTask* pTask, int32_t batchLimit) {
  // fetch all queue item, merge according to batchLimit
  int32_t numOfItems = taosReadAllQitems(pTask->inputQueue1, pTask->inputQall);
  if (numOfItems == 0) {
232
    qDebug("task: %d, stream task exec over, queue empty", pTask->id.taskId);
233 234 235 236 237 238 239 240 241 242
    return 0;
  }
  SStreamQueueItem* pMerged = NULL;
  SStreamQueueItem* pItem = NULL;
  taosGetQitem(pTask->inputQall, (void**)&pItem);
  if (pItem == NULL) {
    if (pMerged != NULL) {
      // process merged item
    } else {
      return 0;
243
    }
244
  }
245

246 247 248 249 250
  // if drop
  if (pItem->type == STREAM_INPUT__DESTROY) {
    // set status drop
    return -1;
  }
251

252
  if (pTask->taskLevel == TASK_LEVEL__SINK) {
253
    ASSERT(((SStreamQueueItem*)pItem)->type == STREAM_INPUT__DATA_BLOCK);
254
    streamTaskOutput(pTask, (SStreamDataBlock*)pItem);
255 256
  }

257 258 259 260
  // exec impl

  // output
  // try dispatch
261 262
  return 0;
}
263
#endif
L
Liu Jicong 已提交
264

L
Liu Jicong 已提交
265
int32_t streamExecForAll(SStreamTask* pTask) {
dengyihao's avatar
dengyihao 已提交
266
  int32_t code = 0;
L
Liu Jicong 已提交
267
  while (1) {
268
    int32_t batchSize = 1;
L
liuyao 已提交
269
    int16_t times = 0;
270

271 272
    SStreamQueueItem* pInput = NULL;

273
    // merge multiple input data if possible in the input queue.
H
Haojun Liao 已提交
274 275
    qDebug("s-task:%s start to extract data block from inputQ", pTask->id.idStr);

L
Liu Jicong 已提交
276
    while (1) {
L
liuyao 已提交
277 278 279
      if (streamTaskShouldPause(&pTask->status)) {
        return 0;
      }
280

L
Liu Jicong 已提交
281 282
      SStreamQueueItem* qItem = streamQueueNextItem(pTask->inputQueue);
      if (qItem == NULL) {
L
liuyao 已提交
283 284 285
        if (pTask->taskLevel == TASK_LEVEL__SOURCE && batchSize < MIN_STREAM_EXEC_BATCH_NUM && times < 5) {
          times++;
          taosMsleep(1);
286
          qDebug("===stream===try again batchSize:%d", batchSize);
L
liuyao 已提交
287 288
          continue;
        }
289

L
liuyao 已提交
290
        qDebug("===stream===break batchSize:%d", batchSize);
L
Liu Jicong 已提交
291
        break;
L
Liu Jicong 已提交
292
      }
293 294 295

      if (pInput == NULL) {
        pInput = qItem;
296
        streamQueueProcessSuccess(pTask->inputQueue);
297
        if (pTask->taskLevel == TASK_LEVEL__SINK) {
L
Liu Jicong 已提交
298
          break;
L
Liu Jicong 已提交
299
        }
L
Liu Jicong 已提交
300
      } else {
301
        // todo we need to sort the data block, instead of just appending into the array list.
302 303
        void* newRet = NULL;
        if ((newRet = streamMergeQueueItem(pInput, qItem)) == NULL) {
L
Liu Jicong 已提交
304 305 306
          streamQueueProcessFail(pTask->inputQueue);
          break;
        } else {
307 308
          batchSize++;
          pInput = newRet;
L
Liu Jicong 已提交
309
          streamQueueProcessSuccess(pTask->inputQueue);
L
liuyao 已提交
310
          if (batchSize > MAX_STREAM_EXEC_BATCH_NUM) {
H
Haojun Liao 已提交
311
            qDebug("maximum batch limit:%d reached, processing, %s", MAX_STREAM_EXEC_BATCH_NUM, pTask->id.idStr);
5
54liuyao 已提交
312 313
            break;
          }
L
Liu Jicong 已提交
314
        }
L
Liu Jicong 已提交
315 316
      }
    }
317

318
    if (streamTaskShouldStop(&pTask->status)) {
319 320 321
      if (pInput) {
        streamFreeQitem(pInput);
      }
322

L
Liu Jicong 已提交
323
      return 0;
L
Liu Jicong 已提交
324
    }
L
Liu Jicong 已提交
325

326
    if (pInput == NULL) {
L
Liu Jicong 已提交
327 328 329
      break;
    }

330
    if (pTask->taskLevel == TASK_LEVEL__SINK) {
331
      ASSERT(pInput->type == STREAM_INPUT__DATA_BLOCK);
332
      qDebug("s-task:%s sink node start to sink result. numOfBlocks:%d", pTask->id.idStr, batchSize);
333
      streamTaskOutput(pTask, (SStreamDataBlock*)pInput);
L
Liu Jicong 已提交
334
      continue;
L
Liu Jicong 已提交
335
    }
L
Liu Jicong 已提交
336

H
Haojun Liao 已提交
337 338
    int64_t resSize = 0;
    int64_t st = taosGetTimestampMs();
L
Liu Jicong 已提交
339
    SArray* pRes = taosArrayInit(0, sizeof(SSDataBlock));
340
    qDebug("s-task:%s start to execute, block batches:%d", pTask->id.idStr, batchSize);
L
Liu Jicong 已提交
341

H
Haojun Liao 已提交
342
    streamTaskExecImpl(pTask, pInput, pRes, &resSize);
343

L
liuyao 已提交
344 345 346
    int64_t ckId = 0;
    int64_t dataVer = 0;
    qGetCheckpointVersion(pTask->exec.pExecutor, &dataVer, &ckId);
dengyihao's avatar
dengyihao 已提交
347
    if (ckId > pTask->chkInfo.id) {  // save it since the checkpoint is updated
348 349 350
      qDebug("s-task:%s exec end, start to update check point, ver from %" PRId64 " to %" PRId64
             ", checkPoint id:%" PRId64 " -> %" PRId64,
             pTask->id.idStr, pTask->chkInfo.version, dataVer, pTask->chkInfo.id, ckId);
L
Liu Jicong 已提交
351

dengyihao's avatar
dengyihao 已提交
352
      pTask->chkInfo = (SCheckpointInfo){.version = dataVer, .id = ckId, .currentVer = pTask->chkInfo.currentVer};
353

354
      taosWLockLatch(&pTask->pMeta->lock);
355

356
      streamMetaSaveTask(pTask->pMeta, pTask);
357
      if (streamMetaCommit(pTask->pMeta) < 0) {
358 359
        taosWUnLockLatch(&pTask->pMeta->lock);
        qError("s-task:%s failed to commit stream meta, since %s", pTask->id.idStr, terrstr());
360
        return -1;
361 362 363
      } else {
        taosWUnLockLatch(&pTask->pMeta->lock);
        qDebug("s-task:%s update checkpoint ver succeed", pTask->id.idStr);
364 365
      }
    }
366

H
Haojun Liao 已提交
367 368 369
    double el = (taosGetTimestampMs() - st) / 1000.0;
    qDebug("s-task:%s exec end, elapsed time:%.2fs, result size:%.2fMiB", pTask->id.idStr, el, resSize/1048576.0);

L
Liu Jicong 已提交
370
    if (taosArrayGetSize(pRes) != 0) {
S
Shengliang Guan 已提交
371
      SStreamDataBlock* qRes = taosAllocateQitem(sizeof(SStreamDataBlock), DEF_QITEM, 0);
L
Liu Jicong 已提交
372
      if (qRes == NULL) {
L
Liu Jicong 已提交
373
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
374
        streamFreeQitem(pInput);
L
Liu Jicong 已提交
375
        return -1;
L
Liu Jicong 已提交
376
      }
377

L
Liu Jicong 已提交
378 379
      qRes->type = STREAM_INPUT__DATA_BLOCK;
      qRes->blocks = pRes;
L
Liu Jicong 已提交
380

381
      if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__DATA_SUBMIT) {
382
        SStreamDataSubmit* pSubmit = (SStreamDataSubmit*)pInput;
L
Liu Jicong 已提交
383 384
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pSubmit->ver;
385
      } else if (((SStreamQueueItem*)pInput)->type == STREAM_INPUT__MERGED_SUBMIT) {
386
        SStreamMergedSubmit* pMerged = (SStreamMergedSubmit*)pInput;
L
Liu Jicong 已提交
387 388
        qRes->childId = pTask->selfChildId;
        qRes->sourceVer = pMerged->ver;
L
Liu Jicong 已提交
389
      }
L
Liu Jicong 已提交
390

dengyihao's avatar
dengyihao 已提交
391 392 393
      code = streamTaskOutput(pTask, qRes);
      if (code == TSDB_CODE_UTIL_QUEUE_OUT_OF_MEMORY) {
        // backpressure and record position
L
Liu Jicong 已提交
394
        taosArrayDestroyEx(pRes, (FDelete)blockDataFreeRes);
395
        streamFreeQitem(pInput);
L
Liu Jicong 已提交
396
        taosFreeQitem(qRes);
L
Liu Jicong 已提交
397 398
        return -1;
      }
L
Liu Jicong 已提交
399 400
    } else {
      taosArrayDestroy(pRes);
L
Liu Jicong 已提交
401
    }
402
    streamFreeQitem(pInput);
L
Liu Jicong 已提交
403
  }
L
Liu Jicong 已提交
404
  return 0;
L
Liu Jicong 已提交
405 406
}

L
Liu Jicong 已提交
407
int32_t streamTryExec(SStreamTask* pTask) {
408
  // this function may be executed by multi-threads, so status check is required.
L
Liu Jicong 已提交
409
  int8_t schedStatus =
410
      atomic_val_compare_exchange_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__WAITING, TASK_SCHED_STATUS__ACTIVE);
411

L
Liu Jicong 已提交
412 413 414
  if (schedStatus == TASK_SCHED_STATUS__WAITING) {
    int32_t code = streamExecForAll(pTask);
    if (code < 0) {
415
      atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__FAILED);
L
Liu Jicong 已提交
416 417
      return -1;
    }
418

419
    // todo the task should be commit here
420
    atomic_store_8(&pTask->status.schedStatus, TASK_SCHED_STATUS__INACTIVE);
421
    qDebug("s-task:%s exec completed", pTask->id.idStr);
L
Liu Jicong 已提交
422

dengyihao's avatar
dengyihao 已提交
423 424
    if (!taosQueueEmpty(pTask->inputQueue->queue) && (!streamTaskShouldStop(&pTask->status)) &&
        (!streamTaskShouldPause(&pTask->status))) {
L
Liu Jicong 已提交
425
      streamSchedExec(pTask);
L
Liu Jicong 已提交
426 427
    }
  }
428

L
Liu Jicong 已提交
429
  return 0;
L
Liu Jicong 已提交
430
}