executorimpl.c 181.5 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

16
#include <executorimpl.h>
H
Haojun Liao 已提交
17 18
#include "filter.h"
#include "function.h"
19 20
#include "functionMgt.h"
#include "os.h"
H
Haojun Liao 已提交
21
#include "querynodes.h"
22
#include "tfill.h"
dengyihao's avatar
dengyihao 已提交
23
#include "tname.h"
X
Xiaoyu Wang 已提交
24
#include "tref.h"
25

H
Haojun Liao 已提交
26
#include "tdatablock.h"
27
#include "tglobal.h"
H
Haojun Liao 已提交
28
#include "tmsg.h"
H
Haojun Liao 已提交
29
#include "tsort.h"
30
#include "ttime.h"
H
Haojun Liao 已提交
31

32
#include "executorimpl.h"
dengyihao's avatar
dengyihao 已提交
33
#include "index.h"
34
#include "query.h"
35 36
#include "tcompare.h"
#include "tcompression.h"
H
Haojun Liao 已提交
37
#include "thash.h"
38
#include "ttypes.h"
dengyihao's avatar
dengyihao 已提交
39
#include "vnode.h"
40

H
Haojun Liao 已提交
41
#define IS_MAIN_SCAN(runtime)          ((runtime)->scanFlag == MAIN_SCAN)
42 43 44 45
#define SET_REVERSE_SCAN_FLAG(runtime) ((runtime)->scanFlag = REVERSE_SCAN)

#define GET_FORWARD_DIRECTION_FACTOR(ord) (((ord) == TSDB_ORDER_ASC) ? QUERY_ASC_FORWARD_STEP : QUERY_DESC_FORWARD_STEP)

46 47 48 49 50
enum {
  PROJECT_RETRIEVE_CONTINUE = 0x1,
  PROJECT_RETRIEVE_DONE = 0x2,
};

51 52
#if 0
static UNUSED_FUNC void *u_malloc (size_t __size) {
wafwerar's avatar
wafwerar 已提交
53
  uint32_t v = taosRand();
54 55 56 57

  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
58
    return taosMemoryMalloc(__size);
59 60 61 62
  }
}

static UNUSED_FUNC void* u_calloc(size_t num, size_t __size) {
wafwerar's avatar
wafwerar 已提交
63
  uint32_t v = taosRand();
64 65 66
  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
67
    return taosMemoryCalloc(num, __size);
68 69 70 71
  }
}

static UNUSED_FUNC void* u_realloc(void* p, size_t __size) {
wafwerar's avatar
wafwerar 已提交
72
  uint32_t v = taosRand();
73 74 75
  if (v % 5 <= 1) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
76
    return taosMemoryRealloc(p, __size);
77 78 79 80 81 82 83 84
  }
}

#define calloc  u_calloc
#define malloc  u_malloc
#define realloc u_realloc
#endif

X
Xiaoyu Wang 已提交
85
#define CLEAR_QUERY_STATUS(q, st)   ((q)->status &= (~(st)))
86 87
#define QUERY_IS_INTERVAL_QUERY(_q) ((_q)->interval.interval > 0)

L
Liu Jicong 已提交
88 89 90
int32_t getMaximumIdleDurationSec() { return tsShellActivityTimer * 2; }

static int32_t getExprFunctionId(SExprInfo* pExprInfo) {
91
  assert(pExprInfo != NULL && pExprInfo->pExpr != NULL && pExprInfo->pExpr->nodeType == TEXPR_UNARYEXPR_NODE);
92
  return 0;
93 94 95 96
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes);

97
static void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExpr, SSDataBlock* pSDataBlock);
98

X
Xiaoyu Wang 已提交
99
static void releaseQueryBuf(size_t numOfTables);
100 101 102 103 104

static void destroySFillOperatorInfo(void* param, int32_t numOfOutput);
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput);
static void destroyOrderOperatorInfo(void* param, int32_t numOfOutput);
static void destroyAggOperatorInfo(void* param, int32_t numOfOutput);
X
Xiaoyu Wang 已提交
105

H
Haojun Liao 已提交
106
static void destroyIntervalOperatorInfo(void* param, int32_t numOfOutput);
H
Haojun Liao 已提交
107 108
static void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput);

109 110
static void destroyOperatorInfo(SOperatorInfo* pOperator);

111
void doSetOperatorCompleted(SOperatorInfo* pOperator) {
112
  pOperator->status = OP_EXEC_DONE;
113

114
  pOperator->cost.totalCost = (taosGetTimestampUs() - pOperator->pTaskInfo->cost.start * 1000) / 1000.0;
H
Haojun Liao 已提交
115
  if (pOperator->pTaskInfo != NULL) {
116
    setTaskStatus(pOperator->pTaskInfo, TASK_COMPLETED);
117 118
  }
}
119

H
Haojun Liao 已提交
120
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator) {
121
  OPTR_SET_OPENED(pOperator);
122
  pOperator->cost.openCost = 0;
H
Haojun Liao 已提交
123
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
124 125
}

126
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
L
Liu Jicong 已提交
127
                                   __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
128
                                   __optr_decode_fn_t decode, __optr_explain_fn_t explain) {
129 130 131 132 133 134 135 136 137 138 139 140 141 142
  SOperatorFpSet fpSet = {
      ._openFn = openFn,
      .getNextFn = nextFn,
      .getStreamResFn = streamFn,
      .cleanupFn = cleanup,
      .closeFn = closeFn,
      .encodeResultRow = encode,
      .decodeResultRow = decode,
      .getExplainFn = explain,
  };

  return fpSet;
}

H
Haojun Liao 已提交
143
void operatorDummyCloseFn(void* param, int32_t numOfCols) {}
H
Haojun Liao 已提交
144

X
Xiaoyu Wang 已提交
145 146 147
static int32_t doCopyToSDataBlock(SExecTaskInfo* taskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo,
                                  SDiskbasedBuf* pBuf, SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset,
                                  SqlFunctionCtx* pCtx, int32_t numOfExprs);
H
Haojun Liao 已提交
148

149
static void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size);
L
Liu Jicong 已提交
150 151
static void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                                     uint64_t groupId);
152

L
Liu Jicong 已提交
153 154
// setup the output buffer for each operator
static bool hasNull(SColumn* pColumn, SColumnDataAgg* pStatis) {
dengyihao's avatar
dengyihao 已提交
155 156
  if (TSDB_COL_IS_TAG(pColumn->flag) || TSDB_COL_IS_UD_COL(pColumn->flag) ||
      pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
157 158 159 160 161 162 163 164 165 166
    return false;
  }

  if (pStatis != NULL && pStatis->numOfNull == 0) {
    return false;
  }

  return true;
}

167
#if 0
L
Liu Jicong 已提交
168 169
static bool chkResultRowFromKey(STaskRuntimeEnv* pRuntimeEnv, SResultRowInfo* pResultRowInfo, char* pData,
                                int16_t bytes, bool masterscan, uint64_t uid) {
170 171 172
  bool existed = false;
  SET_RES_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid);

L
Liu Jicong 已提交
173 174
  SResultRow** p1 =
      (SResultRow**)taosHashGet(pRuntimeEnv->pResultRowHashTable, pRuntimeEnv->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
175 176 177 178 179 180 181 182 183 184 185

  // in case of repeat scan/reverse scan, no new time window added.
  if (QUERY_IS_INTERVAL_QUERY(pRuntimeEnv->pQueryAttr)) {
    if (!masterscan) {  // the *p1 may be NULL in case of sliding+offset exists.
      return p1 != NULL;
    }

    if (p1 != NULL) {
      if (pResultRowInfo->size == 0) {
        existed = false;
      } else if (pResultRowInfo->size == 1) {
dengyihao's avatar
dengyihao 已提交
186
        //        existed = (pResultRowInfo->pResult[0] == (*p1));
187 188
      } else {  // check if current pResultRowInfo contains the existed pResultRow
        SET_RES_EXT_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid, pResultRowInfo);
L
Liu Jicong 已提交
189 190
        int64_t* index =
            taosHashGet(pRuntimeEnv->pResultRowListSet, pRuntimeEnv->keyBuf, GET_RES_EXT_WINDOW_KEY_LEN(bytes));
191 192 193 194 195 196 197 198 199 200 201 202 203
        if (index != NULL) {
          existed = true;
        } else {
          existed = false;
        }
      }
    }

    return existed;
  }

  return p1 != NULL;
}
204
#endif
205

206
SResultRow* getNewResultRow(SDiskbasedBuf* pResultBuf, int64_t tableGroupId, int32_t interBufSize) {
L
Liu Jicong 已提交
207
  SFilePage* pData = NULL;
208 209 210 211 212 213 214 215 216 217 218 219 220

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tableGroupId);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
    pData->num = sizeof(SFilePage);
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

wmmhello's avatar
wmmhello 已提交
221
    if (pData->num + interBufSize > getBufPageSize(pResultBuf)) {
222 223 224 225 226 227 228 229 230 231 232 233 234 235
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return NULL;
  }

236 237
  setBufPageDirty(pData, true);

238 239 240 241 242
  // set the number of rows in current disk page
  SResultRow* pResultRow = (SResultRow*)((char*)pData + pData->num);
  pResultRow->pageId = pageId;
  pResultRow->offset = (int32_t)pData->num;

wmmhello's avatar
wmmhello 已提交
243
  pData->num += interBufSize;
244 245 246 247

  return pResultRow;
}

248 249 250 251 252 253 254
/**
 * the struct of key in hash table
 * +----------+---------------+
 * | group id |   key data    |
 * | 8 bytes  | actual length |
 * +----------+---------------+
 */
255 256 257
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo, char* pData,
                                   int16_t bytes, bool masterscan, uint64_t groupId, SExecTaskInfo* pTaskInfo,
                                   bool isIntervalQuery, SAggSupporter* pSup) {
258
  SET_RES_WINDOW_KEY(pSup->keyBuf, pData, bytes, groupId);
H
Haojun Liao 已提交
259

dengyihao's avatar
dengyihao 已提交
260 261
  SResultRowPosition* p1 =
      (SResultRowPosition*)taosHashGet(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
H
Haojun Liao 已提交
262

263 264
  SResultRow* pResult = NULL;

H
Haojun Liao 已提交
265 266
  // in case of repeat scan/reverse scan, no new time window added.
  if (isIntervalQuery) {
267 268
    if (masterscan && p1 != NULL) {  // the *p1 may be NULL in case of sliding+offset exists.
      pResult = getResultRowByPos(pResultBuf, p1);
269
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
H
Haojun Liao 已提交
270 271
    }
  } else {
dengyihao's avatar
dengyihao 已提交
272 273
    // In case of group by column query, the required SResultRow object must be existInCurrentResusltRowInfo in the
    // pResultRowInfo object.
H
Haojun Liao 已提交
274
    if (p1 != NULL) {
275
      // todo
276
      pResult = getResultRowByPos(pResultBuf, p1);
277
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
H
Haojun Liao 已提交
278 279 280
    }
  }

L
Liu Jicong 已提交
281
  // 1. close current opened time window
282
  if (pResultRowInfo->cur.pageId != -1 && ((pResult == NULL) || (pResult->pageId != pResultRowInfo->cur.pageId))) {
283
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
284
    qDebug("page_1");
285
#endif
286
    SResultRowPosition pos = pResultRowInfo->cur;
X
Xiaoyu Wang 已提交
287
    SFilePage*         pPage = getBufPage(pResultBuf, pos.pageId);
288 289 290 291 292
    releaseBufPage(pResultBuf, pPage);
  }

  // allocate a new buffer page
  if (pResult == NULL) {
293
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
294
    qDebug("page_2");
295
#endif
H
Haojun Liao 已提交
296
    ASSERT(pSup->resultRowSize > 0);
297 298
    pResult = getNewResultRow(pResultBuf, groupId, pSup->resultRowSize);

299
    initResultRow(pResult);
H
Haojun Liao 已提交
300

301 302
    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = pResult->pageId, .offset = pResult->offset};
X
Xiaoyu Wang 已提交
303 304
    taosHashPut(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes), &pos,
                sizeof(SResultRowPosition));
H
Haojun Liao 已提交
305 306
  }

307 308 309
  // 2. set the new time window to be the new active time window
  pResultRowInfo->cur = (SResultRowPosition){.pageId = pResult->pageId, .offset = pResult->offset};

H
Haojun Liao 已提交
310
  // too many time window in query
311
  if (taosHashGetSize(pSup->pResultRowHashTable) > MAX_INTERVAL_TIME_WINDOW) {
H
Haojun Liao 已提交
312 313 314
    longjmp(pTaskInfo->env, TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW);
  }

H
Haojun Liao 已提交
315
  return pResult;
H
Haojun Liao 已提交
316 317
}

318
// a new buffer page for each table. Needs to opt this design
L
Liu Jicong 已提交
319
static int32_t addNewWindowResultBuf(SResultRow* pWindowRes, SDiskbasedBuf* pResultBuf, int32_t tid, uint32_t size) {
320 321 322 323
  if (pWindowRes->pageId != -1) {
    return 0;
  }

L
Liu Jicong 已提交
324
  SFilePage* pData = NULL;
325 326 327 328 329 330

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tid);

  if (taosArrayGetSize(list) == 0) {
H
Haojun Liao 已提交
331
    pData = getNewBufPage(pResultBuf, tid, &pageId);
332
    pData->num = sizeof(SFilePage);
333 334
  } else {
    SPageInfo* pi = getLastPageInfo(list);
335
    pData = getBufPage(pResultBuf, getPageId(pi));
336
    pageId = getPageId(pi);
337

338
    if (pData->num + size > getBufPageSize(pResultBuf)) {
339
      // release current page first, and prepare the next one
340
      releaseBufPageInfo(pResultBuf, pi);
341

H
Haojun Liao 已提交
342
      pData = getNewBufPage(pResultBuf, tid, &pageId);
343
      if (pData != NULL) {
344
        pData->num = sizeof(SFilePage);
345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364
      }
    }
  }

  if (pData == NULL) {
    return -1;
  }

  // set the number of rows in current disk page
  if (pWindowRes->pageId == -1) {  // not allocated yet, allocate new buffer
    pWindowRes->pageId = pageId;
    pWindowRes->offset = (int32_t)pData->num;

    pData->num += size;
    assert(pWindowRes->pageId >= 0);
  }

  return 0;
}

365
//  query_range_start, query_range_end, window_duration, window_start, window_end
366
void initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow) {
367 368 369
  pColData->info.type = TSDB_DATA_TYPE_TIMESTAMP;
  pColData->info.bytes = sizeof(int64_t);

370
  colInfoDataEnsureCapacity(pColData, 5);
371 372 373 374 375 376 377 378 379
  colDataAppendInt64(pColData, 0, &pQueryWindow->skey);
  colDataAppendInt64(pColData, 1, &pQueryWindow->ekey);

  int64_t interval = 0;
  colDataAppendInt64(pColData, 2, &interval);  // this value may be variable in case of 'n' and 'y'.
  colDataAppendInt64(pColData, 3, &pQueryWindow->skey);
  colDataAppendInt64(pColData, 4, &pQueryWindow->ekey);
}

X
Xiaoyu Wang 已提交
380 381 382
void doApplyFunctions(SExecTaskInfo* taskInfo, SqlFunctionCtx* pCtx, STimeWindow* pWin,
                      SColumnInfoData* pTimeWindowData, int32_t offset, int32_t forwardStep, TSKEY* tsCol,
                      int32_t numOfTotal, int32_t numOfOutput, int32_t order) {
383
  for (int32_t k = 0; k < numOfOutput; ++k) {
H
Haojun Liao 已提交
384
    // keep it temporarily
385
    // todo no need this??
dengyihao's avatar
dengyihao 已提交
386 387
    bool    hasAgg = pCtx[k].input.colDataAggIsSet;
    int32_t numOfRows = pCtx[k].input.numOfRows;
H
Haojun Liao 已提交
388
    int32_t startOffset = pCtx[k].input.startRowIndex;
389

390
    pCtx[k].input.startRowIndex = offset;
391
    pCtx[k].input.numOfRows = forwardStep;
392 393 394

    // not a whole block involved in query processing, statistics data can not be used
    // NOTE: the original value of isSet have been changed here
395 396
    if (pCtx[k].input.colDataAggIsSet && forwardStep < numOfTotal) {
      pCtx[k].input.colDataAggIsSet = false;
397 398
    }

399 400
    if (fmIsWindowPseudoColumnFunc(pCtx[k].functionId)) {
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(&pCtx[k]);
401 402

      char* p = GET_ROWCELL_INTERBUF(pEntryInfo);
403

404
      SColumnInfoData idata = {0};
dengyihao's avatar
dengyihao 已提交
405
      idata.info.type = TSDB_DATA_TYPE_BIGINT;
406
      idata.info.bytes = tDataTypes[TSDB_DATA_TYPE_BIGINT].bytes;
dengyihao's avatar
dengyihao 已提交
407
      idata.pData = p;
408 409 410 411

      SScalarParam out = {.columnData = &idata};
      SScalarParam tw = {.numOfRows = 5, .columnData = pTimeWindowData};
      pCtx[k].sfp.process(&tw, 1, &out);
412
      pEntryInfo->numOfRes = 1;
413 414 415 416 417 418 419 420 421 422
    } else {
      int32_t code = TSDB_CODE_SUCCESS;
      if (functionNeedToExecute(&pCtx[k]) && pCtx[k].fpSet.process != NULL) {
        code = pCtx[k].fpSet.process(&pCtx[k]);

        if (code != TSDB_CODE_SUCCESS) {
          qError("%s apply functions error, code: %s", GET_TASKID(taskInfo), tstrerror(code));
          taskInfo->code = code;
          longjmp(taskInfo->env, code);
        }
423
      }
424

425 426 427 428 429
      // restore it
      pCtx[k].input.colDataAggIsSet = hasAgg;
      pCtx[k].input.startRowIndex = startOffset;
      pCtx[k].input.numOfRows = numOfRows;
    }
430 431 432
  }
}

dengyihao's avatar
dengyihao 已提交
433
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
434
                                   int32_t scanFlag, bool createDummyCol);
435

dengyihao's avatar
dengyihao 已提交
436 437
static void doSetInputDataBlockInfo(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock,
                                    int32_t order) {
438
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
439
    pCtx[i].order = order;
440
    pCtx[i].input.numOfRows = pBlock->info.rows;
441
    setBlockStatisInfo(&pCtx[i], &pOperator->exprSupp.pExprInfo[i], pBlock);
442 443 444
  }
}

X
Xiaoyu Wang 已提交
445 446
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                       int32_t scanFlag, bool createDummyCol) {
447
  if (pBlock->pBlockAgg != NULL) {
H
Haojun Liao 已提交
448
    doSetInputDataBlockInfo(pOperator, pCtx, pBlock, order);
449
  } else {
450
    doSetInputDataBlock(pOperator, pCtx, pBlock, order, scanFlag, createDummyCol);
H
Haojun Liao 已提交
451
  }
452 453
}

L
Liu Jicong 已提交
454 455
static int32_t doCreateConstantValColumnInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t paramIndex,
                                             int32_t numOfRows) {
456 457 458 459 460 461 462 463
  SColumnInfoData* pColInfo = NULL;
  if (pInput->pData[paramIndex] == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
464 465
    pColInfo->info.type = pFuncParam->param.nType;
    pColInfo->info.bytes = pFuncParam->param.nLen;
466 467

    pInput->pData[paramIndex] = pColInfo;
468 469
  } else {
    pColInfo = pInput->pData[paramIndex];
470 471
  }

472
  colInfoDataEnsureCapacity(pColInfo, numOfRows);
473

474
  int8_t type = pFuncParam->param.nType;
475 476
  if (type == TSDB_DATA_TYPE_BIGINT || type == TSDB_DATA_TYPE_UBIGINT) {
    int64_t v = pFuncParam->param.i;
dengyihao's avatar
dengyihao 已提交
477
    for (int32_t i = 0; i < numOfRows; ++i) {
478 479 480 481
      colDataAppendInt64(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
dengyihao's avatar
dengyihao 已提交
482
    for (int32_t i = 0; i < numOfRows; ++i) {
483 484
      colDataAppendDouble(pColInfo, i, &v);
    }
485
  } else if (type == TSDB_DATA_TYPE_VARCHAR) {
L
Liu Jicong 已提交
486
    char* tmp = taosMemoryMalloc(pFuncParam->param.nLen + VARSTR_HEADER_SIZE);
487
    STR_WITH_SIZE_TO_VARSTR(tmp, pFuncParam->param.pz, pFuncParam->param.nLen);
L
Liu Jicong 已提交
488
    for (int32_t i = 0; i < numOfRows; ++i) {
489 490
      colDataAppend(pColInfo, i, tmp, false);
    }
491 492 493 494 495
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
496
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
X
Xiaoyu Wang 已提交
497
                                   int32_t scanFlag, bool createDummyCol) {
498 499
  int32_t code = TSDB_CODE_SUCCESS;

500
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
L
Liu Jicong 已提交
501
    pCtx[i].order = order;
502 503
    pCtx[i].input.numOfRows = pBlock->info.rows;

L
Liu Jicong 已提交
504
    pCtx[i].pSrcBlock = pBlock;
X
Xiaoyu Wang 已提交
505
    pCtx[i].scanFlag = scanFlag;
H
Haojun Liao 已提交
506

507
    SInputColumnInfoData* pInput = &pCtx[i].input;
508
    pInput->uid = pBlock->info.uid;
C
Cary Xu 已提交
509
    pInput->colDataAggIsSet = false;
510

511
    SExprInfo* pOneExpr = &pOperator->exprSupp.pExprInfo[i];
512
    for (int32_t j = 0; j < pOneExpr->base.numOfParams; ++j) {
dengyihao's avatar
dengyihao 已提交
513
      SFunctParam* pFuncParam = &pOneExpr->base.pParam[j];
G
Ganlin Zhao 已提交
514 515
      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
dengyihao's avatar
dengyihao 已提交
516
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
517 518 519
        pInput->totalRows = pBlock->info.rows;
        pInput->numOfRows = pBlock->info.rows;
        pInput->startRowIndex = 0;
520

521
        // NOTE: the last parameter is the primary timestamp column
H
Haojun Liao 已提交
522 523 524 525
        // todo: refactor this
        if (fmIsTimelineFunc(pCtx[i].functionId) && (j == pOneExpr->base.numOfParams - 1)) {
          pInput->pPTS = pInput->pData[j];   // in case of merge function, this is not always the ts column data.
//          ASSERT(pInput->pPTS->info.type == TSDB_DATA_TYPE_TIMESTAMP);
526
        }
527 528
        ASSERT(pInput->pData[j] != NULL);
      } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
529 530 531
        // todo avoid case: top(k, 12), 12 is the value parameter.
        // sum(11), 11 is also the value parameter.
        if (createDummyCol && pOneExpr->base.numOfParams == 1) {
532 533 534 535
          pInput->totalRows = pBlock->info.rows;
          pInput->numOfRows = pBlock->info.rows;
          pInput->startRowIndex = 0;

536
          code = doCreateConstantValColumnInfo(pInput, pFuncParam, j, pBlock->info.rows);
537 538 539
          if (code != TSDB_CODE_SUCCESS) {
            return code;
          }
540
        }
G
Ganlin Zhao 已提交
541 542
      }
    }
H
Haojun Liao 已提交
543
  }
544 545

  return code;
H
Haojun Liao 已提交
546 547
}

548
static int32_t doAggregateImpl(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx) {
549
  for (int32_t k = 0; k < pOperator->exprSupp.numOfExprs; ++k) {
H
Haojun Liao 已提交
550
    if (functionNeedToExecute(&pCtx[k])) {
551
      // todo add a dummy funtion to avoid process check
552 553 554
      if (pCtx[k].fpSet.process == NULL) {
        continue;
      }
H
Haojun Liao 已提交
555

556 557 558 559
      int32_t code = pCtx[k].fpSet.process(&pCtx[k]);
      if (code != TSDB_CODE_SUCCESS) {
        qError("%s aggregate function error happens, code: %s", GET_TASKID(pOperator->pTaskInfo), tstrerror(code));
        return code;
560
      }
561 562
    }
  }
563 564

  return TSDB_CODE_SUCCESS;
565 566
}

H
Haojun Liao 已提交
567
static void setPseudoOutputColInfo(SSDataBlock* pResult, SqlFunctionCtx* pCtx, SArray* pPseudoList) {
dengyihao's avatar
dengyihao 已提交
568
  size_t num = (pPseudoList != NULL) ? taosArrayGetSize(pPseudoList) : 0;
H
Haojun Liao 已提交
569 570 571 572 573
  for (int32_t i = 0; i < num; ++i) {
    pCtx[i].pOutput = taosArrayGet(pResult->pDataBlock, i);
  }
}

574
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
X
Xiaoyu Wang 已提交
575
                              int32_t numOfOutput, SArray* pPseudoList) {
H
Haojun Liao 已提交
576
  setPseudoOutputColInfo(pResult, pCtx, pPseudoList);
H
Haojun Liao 已提交
577
  pResult->info.groupId = pSrcBlock->info.groupId;
H
Haojun Liao 已提交
578

579 580
  // if the source equals to the destination, it is to create a new column as the result of scalar
  // function or some operators.
581 582
  bool createNewColModel = (pResult == pSrcBlock);

583 584
  int32_t numOfRows = 0;

585
  for (int32_t k = 0; k < numOfOutput; ++k) {
586 587
    int32_t               outputSlotId = pExpr[k].base.resSchema.slotId;
    SqlFunctionCtx*       pfCtx = &pCtx[k];
588
    SInputColumnInfoData* pInputData = &pfCtx->input;
589

L
Liu Jicong 已提交
590
    if (pExpr[k].pExpr->nodeType == QUERY_NODE_COLUMN) {  // it is a project query
591
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
592
      if (pResult->info.rows > 0 && !createNewColModel) {
593 594
        colDataMergeCol(pColInfoData, pResult->info.rows, &pResult->info.capacity, pInputData->pData[0],
                        pInputData->numOfRows);
595
      } else {
596
        colDataAssign(pColInfoData, pInputData->pData[0], pInputData->numOfRows, &pResult->info);
597
      }
598

599
      numOfRows = pInputData->numOfRows;
600
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE) {
601
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
602

dengyihao's avatar
dengyihao 已提交
603
      int32_t offset = createNewColModel ? 0 : pResult->info.rows;
604 605 606 607 608 609 610 611

      int32_t type = pExpr[k].base.pParam[0].param.nType;
      if (TSDB_DATA_TYPE_NULL == type) {
        colDataAppendNNULL(pColInfoData, offset, pSrcBlock->info.rows);
      } else {
        for (int32_t i = 0; i < pSrcBlock->info.rows; ++i) {
          colDataAppend(pColInfoData, i + offset, taosVariantGet(&pExpr[k].base.pParam[0].param, type), false);
        }
612
      }
613 614

      numOfRows = pSrcBlock->info.rows;
H
Haojun Liao 已提交
615
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_OPERATOR) {
616 617 618
      SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
      taosArrayPush(pBlockList, &pSrcBlock);

619
      SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
620
      SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
621

622
      SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
623
      int32_t      code = scalarCalculate(pExpr[k].pExpr->_optrRoot.pRootNode, pBlockList, &dest);
624 625 626 627
      if (code != TSDB_CODE_SUCCESS) {
        taosArrayDestroy(pBlockList);
        return code;
      }
628

dengyihao's avatar
dengyihao 已提交
629
      int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
630
      ASSERT(pResult->info.capacity > 0);
631
      colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
632 633
      colDataDestroy(&idata);
      
634
      numOfRows = dest.numOfRows;
635 636
      taosArrayDestroy(pBlockList);
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_FUNCTION) {
637 638
      // _rowts/_c0, not tbname column
      if (fmIsPseudoColumnFunc(pfCtx->functionId) && (!fmIsScanPseudoColumnFunc(pfCtx->functionId))) {
H
Haojun Liao 已提交
639
        // do nothing
640
      } else if (fmIsIndefiniteRowsFunc(pfCtx->functionId)) {
641 642
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pfCtx);
        pfCtx->fpSet.init(pfCtx, pResInfo);
643 644 645 646 647 648 649 650 651 652 653

        pfCtx->pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
        pfCtx->offset = createNewColModel ? 0 : pResult->info.rows;  // set the start offset

        // set the timestamp(_rowts) output buffer
        if (taosArrayGetSize(pPseudoList) > 0) {
          int32_t* outputColIndex = taosArrayGet(pPseudoList, 0);
          pfCtx->pTsOutput = (SColumnInfoData*)pCtx[*outputColIndex].pOutput;
        }

        numOfRows = pfCtx->fpSet.process(pfCtx);
H
Haojun Liao 已提交
654
      } else if (fmIsAggFunc(pfCtx->functionId)) {
655 656
        // _group_key function for "partition by tbname" + csum(col_name) query
        SColumnInfoData* pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
657
        int32_t          slotId = pfCtx->param[0].pCol->slotId;
658 659 660

        // todo handle the json tag
        SColumnInfoData* pInput = taosArrayGet(pSrcBlock->pDataBlock, slotId);
661
        for (int32_t f = 0; f < pSrcBlock->info.rows; ++f) {
662 663 664 665 666 667 668 669 670
          bool isNull = colDataIsNull_s(pInput, f);
          if (isNull) {
            colDataAppendNULL(pOutput, pResult->info.rows + f);
          } else {
            char* data = colDataGetData(pInput, f);
            colDataAppend(pOutput, pResult->info.rows + f, data, isNull);
          }
        }

H
Haojun Liao 已提交
671 672 673
      } else {
        SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
        taosArrayPush(pBlockList, &pSrcBlock);
G
Ganlin Zhao 已提交
674

675
        SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
676
        SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
H
Haojun Liao 已提交
677

678
        SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
679
        int32_t      code = scalarCalculate((SNode*)pExpr[k].pExpr->_function.pFunctNode, pBlockList, &dest);
680 681 682 683
        if (code != TSDB_CODE_SUCCESS) {
          taosArrayDestroy(pBlockList);
          return code;
        }
684

dengyihao's avatar
dengyihao 已提交
685
        int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
686
        ASSERT(pResult->info.capacity > 0);
687
        colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
688
        colDataDestroy(&idata);
689 690

        numOfRows = dest.numOfRows;
H
Haojun Liao 已提交
691 692
        taosArrayDestroy(pBlockList);
      }
693
    } else {
694
      ASSERT(0);
695 696
    }
  }
697

698 699 700
  if (!createNewColModel) {
    pResult->info.rows += numOfRows;
  }
701 702

  return TSDB_CODE_SUCCESS;
703 704
}

5
54liuyao 已提交
705
bool functionNeedToExecute(SqlFunctionCtx* pCtx) {
706
  struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);
707

708 709 710 711 712
  // in case of timestamp column, always generated results.
  int32_t functionId = pCtx->functionId;
  if (functionId == -1) {
    return false;
  }
713

714 715
  if (pCtx->scanFlag == REPEAT_SCAN) {
    return fmIsRepeatScanFunc(pCtx->functionId);
716 717
  }

718 719
  if (isRowEntryCompleted(pResInfo)) {
    return false;
720 721
  }

722 723 724
  return true;
}

725 726 727 728 729 730 731
static int32_t doCreateConstantValColumnAggInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t type,
                                                int32_t paramIndex, int32_t numOfRows) {
  if (pInput->pData[paramIndex] == NULL) {
    pInput->pData[paramIndex] = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pInput->pData[paramIndex] == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
732

733 734 735
    // Set the correct column info (data type and bytes)
    pInput->pData[paramIndex]->info.type = type;
    pInput->pData[paramIndex]->info.bytes = tDataTypes[type].bytes;
736
  }
H
Haojun Liao 已提交
737

738 739 740 741 742 743
  SColumnDataAgg* da = NULL;
  if (pInput->pColumnDataAgg[paramIndex] == NULL) {
    da = taosMemoryCalloc(1, sizeof(SColumnDataAgg));
    pInput->pColumnDataAgg[paramIndex] = da;
    if (da == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
744 745
    }
  } else {
746
    da = pInput->pColumnDataAgg[paramIndex];
747 748
  }

749
  ASSERT(!IS_VAR_DATA_TYPE(type));
750

751 752
  if (type == TSDB_DATA_TYPE_BIGINT) {
    int64_t v = pFuncParam->param.i;
753
    *da = (SColumnDataAgg){.numOfNull = 0, .min = v, .max = v, .sum = v * numOfRows};
754 755
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
756
    *da = (SColumnDataAgg){.numOfNull = 0};
757

758 759 760 761 762 763
    *(double*)&da->min = v;
    *(double*)&da->max = v;
    *(double*)&da->sum = v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_BOOL) {  // todo validate this data type
    bool v = pFuncParam->param.i;

764
    *da = (SColumnDataAgg){.numOfNull = 0};
765 766 767 768 769
    *(bool*)&da->min = 0;
    *(bool*)&da->max = v;
    *(bool*)&da->sum = v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_TIMESTAMP) {
    // do nothing
770
  } else {
771
    ASSERT(0);
772 773
  }

774 775
  return TSDB_CODE_SUCCESS;
}
776 777 778 779 780 781 782 783 784 785 786

void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, SSDataBlock* pBlock) {
  int32_t numOfRows = pBlock->info.rows;

  SInputColumnInfoData* pInput = &pCtx->input;
  pInput->numOfRows = numOfRows;
  pInput->totalRows = numOfRows;

  if (pBlock->pBlockAgg != NULL) {
    pInput->colDataAggIsSet = true;

787 788
    for (int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pExprInfo->base.pParam[j];
789

790 791
      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
792 793 794 795
        pInput->pColumnDataAgg[j] = pBlock->pBlockAgg[slotId];
        if (pInput->pColumnDataAgg[j] == NULL) {
          pInput->colDataAggIsSet = false;
        }
796 797 798 799

        // Here we set the column info data since the data type for each column data is required, but
        // the data in the corresponding SColumnInfoData will not be used.
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
800 801
      } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
        doCreateConstantValColumnAggInfo(pInput, pFuncParam, pFuncParam->param.nType, j, pBlock->info.rows);
802 803
      }
    }
804
  } else {
805
    pInput->colDataAggIsSet = false;
806 807 808
  }

  // set the statistics data for primary time stamp column
809 810 811 812 813
  //  if (pCtx->functionId == FUNCTION_SPREAD && pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
  //    pCtx->isAggSet = true;
  //    pCtx->agg.min = pBlock->info.window.skey;
  //    pCtx->agg.max = pBlock->info.window.ekey;
  //  }
814 815
}

L
Liu Jicong 已提交
816
bool isTaskKilled(SExecTaskInfo* pTaskInfo) {
817 818
  // query has been executed more than tsShellActivityTimer, and the retrieve has not arrived
  // abort current query execution.
L
Liu Jicong 已提交
819 820
  if (pTaskInfo->owner != 0 &&
      ((taosGetTimestampSec() - pTaskInfo->cost.start / 1000) > 10 * getMaximumIdleDurationSec())
821 822
      /*(!needBuildResAfterQueryComplete(pTaskInfo))*/) {
    assert(pTaskInfo->cost.start != 0);
L
Liu Jicong 已提交
823 824 825
    //    qDebug("QInfo:%" PRIu64 " retrieve not arrive beyond %d ms, abort current query execution, start:%" PRId64
    //           ", current:%d", pQInfo->qId, 1, pQInfo->startExecTs, taosGetTimestampSec());
    //    return true;
826 827 828 829 830
  }

  return false;
}

L
Liu Jicong 已提交
831
void setTaskKilled(SExecTaskInfo* pTaskInfo) { pTaskInfo->code = TSDB_CODE_TSC_QUERY_CANCELLED; }
832 833

/////////////////////////////////////////////////////////////////////////////////////////////
L
Liu Jicong 已提交
834
// todo refactor : return window
835
void getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key, STimeWindow* win) {
H
Haojun Liao 已提交
836
  win->skey = taosTimeTruncate(key, pInterval, precision);
837 838

  /*
H
Haojun Liao 已提交
839
   * if the realSkey > INT64_MAX - pInterval->interval, the query duration between
840 841
   * realSkey and realEkey must be less than one interval.Therefore, no need to adjust the query ranges.
   */
842 843
  win->ekey = taosTimeAdd(win->skey, pInterval->interval, pInterval->intervalUnit, precision) - 1;
  if (win->ekey < win->skey) {
844 845 846 847
    win->ekey = INT64_MAX;
  }
}

848
#if 0
L
Liu Jicong 已提交
849
static int32_t updateBlockLoadStatus(STaskAttr* pQuery, int32_t status) {
850

851 852 853
  bool hasFirstLastFunc = false;
  bool hasOtherFunc = false;

854
  if (status == BLK_DATA_DATA_LOAD || status == BLK_DATA_FILTEROUT) {
855 856 857 858 859
    return status;
  }

  for (int32_t i = 0; i < pQuery->numOfOutput; ++i) {
    int32_t functionId = getExprFunctionId(&pQuery->pExpr1[i]);
860

861 862 863 864 865 866 867 868 869 870
    if (functionId == FUNCTION_TS || functionId == FUNCTION_TS_DUMMY || functionId == FUNCTION_TAG ||
        functionId == FUNCTION_TAG_DUMMY) {
      continue;
    }

    if (functionId == FUNCTION_FIRST_DST || functionId == FUNCTION_LAST_DST) {
      hasFirstLastFunc = true;
    } else {
      hasOtherFunc = true;
    }
871

872 873
  }

874
  if (hasFirstLastFunc && status == BLK_DATA_NOT_LOAD) {
L
Liu Jicong 已提交
875
    if (!hasOtherFunc) {
876
      return BLK_DATA_FILTEROUT;
877
    } else {
878
      return BLK_DATA_DATA_LOAD;
879 880 881 882 883 884
    }
  }

  return status;
}

885 886
#endif

L
Liu Jicong 已提交
887 888
// static void updateDataCheckOrder(SQInfo *pQInfo, SQueryTableReq* pQueryMsg, bool stableQuery) {
//   STaskAttr* pQueryAttr = pQInfo->runtimeEnv.pQueryAttr;
H
Haojun Liao 已提交
889
//
L
Liu Jicong 已提交
890 891 892 893
//   // in case of point-interpolation query, use asc order scan
//   char msg[] = "QInfo:0x%"PRIx64" scan order changed for %s query, old:%d, new:%d, qrange exchanged, old qrange:%"
//   PRId64
//                "-%" PRId64 ", new qrange:%" PRId64 "-%" PRId64;
H
Haojun Liao 已提交
894
//
L
Liu Jicong 已提交
895 896 897 898 899
//   // todo handle the case the the order irrelevant query type mixed up with order critical query type
//   // descending order query for last_row query
//   if (isFirstLastRowQuery(pQueryAttr)) {
//     //qDebug("QInfo:0x%"PRIx64" scan order changed for last_row query, old:%d, new:%d", pQInfo->qId,
//     pQueryAttr->order.order, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
900
//
L
Liu Jicong 已提交
901 902
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
903
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
904
//     }
H
Haojun Liao 已提交
905
//
L
Liu Jicong 已提交
906 907 908
//     pQueryAttr->needReverseScan = false;
//     return;
//   }
H
Haojun Liao 已提交
909
//
L
Liu Jicong 已提交
910 911 912
//   if (pQueryAttr->groupbyColumn && pQueryAttr->order.order == TSDB_ORDER_DESC) {
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
913
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
914
//     }
H
Haojun Liao 已提交
915
//
L
Liu Jicong 已提交
916 917 918 919
//     pQueryAttr->needReverseScan = false;
//     doUpdateLastKey(pQueryAttr);
//     return;
//   }
H
Haojun Liao 已提交
920
//
L
Liu Jicong 已提交
921 922 923 924 925 926
//   if (pQueryAttr->pointInterpQuery && pQueryAttr->interval.interval == 0) {
//     if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       //qDebug(msg, pQInfo->qId, "interp", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey); TSWAP(pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, TSKEY);
//     }
H
Haojun Liao 已提交
927
//
L
Liu Jicong 已提交
928 929 930
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     return;
//   }
H
Haojun Liao 已提交
931
//
L
Liu Jicong 已提交
932 933 934 935
//   if (pQueryAttr->interval.interval == 0) {
//     if (onlyFirstQuery(pQueryAttr)) {
//       if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//         //qDebug(msg, pQInfo->qId, "only-first", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
H
Haojun Liao 已提交
936 937
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
938
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
939 940 941 942 943 944 945 946 947 948
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_ASC;
//      pQueryAttr->needReverseScan = false;
//    } else if (onlyLastQuery(pQueryAttr) && notContainSessionOrStateWindow(pQueryAttr)) {
//      if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//        //qDebug(msg, pQInfo->qId, "only-last", pQueryAttr->order.order, TSDB_ORDER_DESC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
949
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
950 951 952 953 954 955 956 957 958 959 960 961
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_DESC;
//      pQueryAttr->needReverseScan = false;
//    }
//
//  } else {  // interval query
//    if (stableQuery) {
//      if (onlyFirstQuery(pQueryAttr)) {
//        if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-first stable", pQueryAttr->order.order, TSDB_ORDER_ASC,
L
Liu Jicong 已提交
962 963
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
964
//
wafwerar's avatar
wafwerar 已提交
965
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
966 967 968 969 970 971 972 973
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_ASC;
//        pQueryAttr->needReverseScan = false;
//      } else if (onlyLastQuery(pQueryAttr)) {
//        if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-last stable", pQueryAttr->order.order, TSDB_ORDER_DESC,
L
Liu Jicong 已提交
974 975
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
976
//
wafwerar's avatar
wafwerar 已提交
977
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
978 979 980 981 982 983 984 985 986
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_DESC;
//        pQueryAttr->needReverseScan = false;
//      }
//    }
//  }
//}
987

L
Liu Jicong 已提交
988 989 990
// static FORCE_INLINE bool doFilterByBlockStatistics(STaskRuntimeEnv* pRuntimeEnv, SDataStatis *pDataStatis,
// SqlFunctionCtx *pCtx, int32_t numOfRows) {
//   STaskAttr* pQueryAttr = pRuntimeEnv->pQueryAttr;
991
//
L
Liu Jicong 已提交
992 993 994
//   if (pDataStatis == NULL || pQueryAttr->pFilters == NULL) {
//     return true;
//   }
995
//
L
Liu Jicong 已提交
996 997
//   return filterRangeExecute(pQueryAttr->pFilters, pDataStatis, pQueryAttr->numOfCols, numOfRows);
// }
998
#if 0
H
Haojun Liao 已提交
999
static bool overlapWithTimeWindow(STaskAttr* pQueryAttr, SDataBlockInfo* pBlockInfo) {
1000 1001
  STimeWindow w = {0};

dengyihao's avatar
dengyihao 已提交
1002 1003
  TSKEY sk = TMIN(pQueryAttr->window.skey, pQueryAttr->window.ekey);
  TSKEY ek = TMAX(pQueryAttr->window.skey, pQueryAttr->window.ekey);
1004

1005
  if (true) {
L
Liu Jicong 已提交
1006
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.skey, sk, ek, &w);
1007 1008 1009 1010 1011 1012
    assert(w.ekey >= pBlockInfo->window.skey);

    if (w.ekey < pBlockInfo->window.ekey) {
      return true;
    }

L
Liu Jicong 已提交
1013 1014
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1015 1016 1017 1018 1019 1020 1021 1022 1023 1024
      if (w.skey > pBlockInfo->window.ekey) {
        break;
      }

      assert(w.ekey > pBlockInfo->window.ekey);
      if (w.skey <= pBlockInfo->window.ekey && w.skey > pBlockInfo->window.skey) {
        return true;
      }
    }
  } else {
L
Liu Jicong 已提交
1025
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.ekey, sk, ek, &w);
1026 1027 1028 1029 1030 1031
    assert(w.skey <= pBlockInfo->window.ekey);

    if (w.skey > pBlockInfo->window.skey) {
      return true;
    }

L
Liu Jicong 已提交
1032 1033
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045 1046
      if (w.ekey < pBlockInfo->window.skey) {
        break;
      }

      assert(w.skey < pBlockInfo->window.skey);
      if (w.ekey < pBlockInfo->window.ekey && w.ekey >= pBlockInfo->window.skey) {
        return true;
      }
    }
  }

  return false;
}
1047
#endif
1048 1049

static uint32_t doFilterByBlockTimeWindow(STableScanInfo* pTableScanInfo, SSDataBlock* pBlock) {
H
Haojun Liao 已提交
1050
#if 0
H
Haojun Liao 已提交
1051
  SqlFunctionCtx* pCtx = pTableScanInfo->pCtx;
1052
  uint32_t        status = BLK_DATA_NOT_LOAD;
1053

L
Liu Jicong 已提交
1054
  int32_t numOfOutput = 0;  // pTableScanInfo->numOfOutput;
1055 1056
  for (int32_t i = 0; i < numOfOutput; ++i) {
    int32_t functionId = pCtx[i].functionId;
H
Haojun Liao 已提交
1057
    int32_t colId = pTableScanInfo->pExpr[i].base.pParam[0].pCol->colId;
1058 1059 1060

    // group by + first/last should not apply the first/last block filter
    if (functionId < 0) {
1061
      status |= BLK_DATA_DATA_LOAD;
1062 1063
      return status;
    } else {
L
Liu Jicong 已提交
1064
      //      status |= aAggs[functionId].dataReqFunc(&pTableScanInfo->pCtx[i], &pBlock->info.window, colId);
1065
      //      if ((status & BLK_DATA_DATA_LOAD) == BLK_DATA_DATA_LOAD) {
L
Liu Jicong 已提交
1066 1067
      //        return status;
      //      }
1068 1069 1070 1071
    }
  }

  return status;
H
Haojun Liao 已提交
1072 1073
#endif
  return 0;
1074 1075
}

L
Liu Jicong 已提交
1076 1077
int32_t loadDataBlockOnDemand(SExecTaskInfo* pTaskInfo, STableScanInfo* pTableScanInfo, SSDataBlock* pBlock,
                              uint32_t* status) {
1078
  *status = BLK_DATA_NOT_LOAD;
1079

H
Haojun Liao 已提交
1080
  pBlock->pDataBlock = NULL;
L
Liu Jicong 已提交
1081
  pBlock->pBlockAgg = NULL;
H
Haojun Liao 已提交
1082

L
Liu Jicong 已提交
1083 1084
  //  int64_t groupId = pRuntimeEnv->current->groupIndex;
  //  bool    ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1085

H
Haojun Liao 已提交
1086
  STaskCostInfo* pCost = &pTaskInfo->cost;
1087

1088 1089
//  pCost->totalBlocks += 1;
//  pCost->totalRows += pBlock->info.rows;
H
Haojun Liao 已提交
1090
#if 0
1091 1092 1093
  // Calculate all time windows that are overlapping or contain current data block.
  // If current data block is contained by all possible time window, do not load current data block.
  if (/*pQueryAttr->pFilters || */pQueryAttr->groupbyColumn || pQueryAttr->sw.gap > 0 ||
H
Haojun Liao 已提交
1094
      (QUERY_IS_INTERVAL_QUERY(pQueryAttr) && overlapWithTimeWindow(pTaskInfo, &pBlock->info))) {
1095
    (*status) = BLK_DATA_DATA_LOAD;
1096 1097 1098
  }

  // check if this data block is required to load
1099
  if ((*status) != BLK_DATA_DATA_LOAD) {
1100 1101 1102 1103 1104 1105 1106
    bool needFilter = true;

    // the pCtx[i] result is belonged to previous time window since the outputBuf has not been set yet,
    // the filter result may be incorrect. So in case of interval query, we need to set the correct time output buffer
    if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
      SResultRow* pResult = NULL;

H
Haojun Liao 已提交
1107
      bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
1108 1109 1110 1111 1112 1113
      TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

      STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
      if (pQueryAttr->pointInterpQuery) {
        needFilter = chkWindowOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1114
                                    pTableScanInfo->rowEntryInfoOffset);
1115 1116 1117
      } else {
        if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1118
                                    pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
1119 1120 1121 1122 1123
          longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
        }
      }
    } else if (pQueryAttr->stableQuery && (!pQueryAttr->tsCompQuery) && (!pQueryAttr->diffQuery)) { // stable aggregate, not interval aggregate or normal column aggregate
      doSetTableGroupOutputBuf(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pTableScanInfo->pCtx,
1124
                               pTableScanInfo->rowEntryInfoOffset, pTableScanInfo->numOfOutput,
1125 1126 1127 1128 1129 1130
                               pRuntimeEnv->current->groupIndex);
    }

    if (needFilter) {
      (*status) = doFilterByBlockTimeWindow(pTableScanInfo, pBlock);
    } else {
1131
      (*status) = BLK_DATA_DATA_LOAD;
1132 1133 1134 1135
    }
  }

  SDataBlockInfo* pBlockInfo = &pBlock->info;
H
Haojun Liao 已提交
1136
//  *status = updateBlockLoadStatus(pRuntimeEnv->pQueryAttr, *status);
1137

1138
  if ((*status) == BLK_DATA_NOT_LOAD || (*status) == BLK_DATA_FILTEROUT) {
1139 1140
    //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//           pBlockInfo->window.ekey, pBlockInfo->rows);
1141
    pCost->skipBlocks += 1;
1142
  } else if ((*status) == BLK_DATA_SMA_LOAD) {
1143 1144
    // this function never returns error?
    pCost->loadBlockStatis += 1;
1145
//    tsdbRetrieveDatablockSMA(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);
1146 1147

    if (pBlock->pBlockAgg == NULL) {  // data block statistics does not exist, load data block
1148
//      pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
1149 1150 1151
      pCost->totalCheckedRows += pBlock->info.rows;
    }
  } else {
1152
    assert((*status) == BLK_DATA_DATA_LOAD);
1153 1154 1155

    // load the data block statistics to perform further filter
    pCost->loadBlockStatis += 1;
1156
//    tsdbRetrieveDatablockSMA(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);
1157 1158 1159 1160 1161 1162

    if (pQueryAttr->topBotQuery && pBlock->pBlockAgg != NULL) {
      { // set previous window
        if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
          SResultRow* pResult = NULL;

H
Haojun Liao 已提交
1163
          bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
1164 1165 1166 1167 1168
          TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

          STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
          if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                      pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1169
                                      pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180
            longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
          }
        }
      }
      bool load = false;
      for (int32_t i = 0; i < pQueryAttr->numOfOutput; ++i) {
        int32_t functionId = pTableScanInfo->pCtx[i].functionId;
        if (functionId == FUNCTION_TOP || functionId == FUNCTION_BOTTOM) {
//          load = topbot_datablock_filter(&pTableScanInfo->pCtx[i], (char*)&(pBlock->pBlockAgg[i].min),
//                                         (char*)&(pBlock->pBlockAgg[i].max));
          if (!load) { // current block has been discard due to filter applied
1181
            pCost->skipBlocks += 1;
1182 1183
            //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId,
//                   pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
1184
            (*status) = BLK_DATA_FILTEROUT;
1185 1186 1187 1188 1189 1190 1191 1192
            return TSDB_CODE_SUCCESS;
          }
        }
      }
    }

    // current block has been discard due to filter applied
//    if (!doFilterByBlockStatistics(pRuntimeEnv, pBlock->pBlockAgg, pTableScanInfo->pCtx, pBlockInfo->rows)) {
1193
//      pCost->skipBlocks += 1;
1194 1195
//      qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//             pBlockInfo->window.ekey, pBlockInfo->rows);
1196
//      (*status) = BLK_DATA_FILTEROUT;
1197 1198 1199 1200 1201
//      return TSDB_CODE_SUCCESS;
//    }

    pCost->totalCheckedRows += pBlockInfo->rows;
    pCost->loadBlocks += 1;
1202
//    pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
1203 1204 1205 1206 1207
//    if (pBlock->pDataBlock == NULL) {
//      return terrno;
//    }

//    if (pQueryAttr->pFilters != NULL) {
1208
//      filterSetColFieldData(pQueryAttr->pFilters, taosArrayGetSize(pBlock->pDataBlock), pBlock->pDataBlock);
1209
//    }
1210

1211 1212 1213 1214
//    if (pQueryAttr->pFilters != NULL || pRuntimeEnv->pTsBuf != NULL) {
//      filterColRowsInDataBlock(pRuntimeEnv, pBlock, ascQuery);
//    }
  }
H
Haojun Liao 已提交
1215
#endif
1216 1217 1218
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1219
static void updateTableQueryInfoForReverseScan(STableQueryInfo* pTableQueryInfo) {
1220 1221 1222 1223
  if (pTableQueryInfo == NULL) {
    return;
  }

wafwerar's avatar
wafwerar 已提交
1224
  //  TSWAP(pTableQueryInfo->win.skey, pTableQueryInfo->win.ekey);
L
Liu Jicong 已提交
1225
  //  pTableQueryInfo->lastKey = pTableQueryInfo->win.skey;
1226

L
Liu Jicong 已提交
1227 1228
  //  SWITCH_ORDER(pTableQueryInfo->cur.order);
  //  pTableQueryInfo->cur.vgroupIndex = -1;
1229 1230

  // set the index to be the end slot of result rows array
dengyihao's avatar
dengyihao 已提交
1231 1232 1233 1234 1235 1236
  //  SResultRowInfo* pResultRowInfo = &pTableQueryInfo->resInfo;
  //  if (pResultRowInfo->size > 0) {
  //    pResultRowInfo->curPos = pResultRowInfo->size - 1;
  //  } else {
  //    pResultRowInfo->curPos = -1;
  //  }
1237 1238
}

H
Haojun Liao 已提交
1239
void initResultRow(SResultRow* pResultRow) {
X
Xiaoyu Wang 已提交
1240
  //  pResultRow->pEntryInfo = (struct SResultRowEntryInfo*)((char*)pResultRow + sizeof(SResultRow));
1241 1242 1243 1244 1245
}

/*
 * The start of each column SResultRowEntryInfo is denote by RowCellInfoOffset.
 * Note that in case of top/bottom query, the whole multiple rows of result is treated as only one row of results.
H
Haojun Liao 已提交
1246 1247 1248
 * +------------+-----------------result column 1------------+------------------result column 2-----------+
 * | SResultRow | SResultRowEntryInfo | intermediate buffer1 | SResultRowEntryInfo | intermediate buffer 2|
 * +------------+--------------------------------------------+--------------------------------------------+
1249 1250
 *           offset[0]                                  offset[1]                                   offset[2]
 */
1251
// TODO refactor: some function move away
L
Liu Jicong 已提交
1252 1253 1254
void setFunctionResultOutput(SOperatorInfo* pOperator, SOptrBasicInfo* pInfo, SAggSupporter* pSup, int32_t stage,
                             int32_t numOfExprs) {
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
1255 1256
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;
H
Haojun Liao 已提交
1257

H
Haojun Liao 已提交
1258
  SResultRowInfo* pResultRowInfo = &pInfo->resultRowInfo;
1259
  initResultRowInfo(pResultRowInfo);
H
Haojun Liao 已提交
1260

L
Liu Jicong 已提交
1261 1262
  int64_t     tid = 0;
  int64_t     groupId = 0;
1263 1264
  SResultRow* pRow = doSetResultOutBufByKey(pSup->pResultBuf, pResultRowInfo, (char*)&tid, sizeof(tid), true, groupId,
                                            pTaskInfo, false, pSup);
H
Haojun Liao 已提交
1265

1266
  for (int32_t i = 0; i < numOfExprs; ++i) {
1267
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, i, rowEntryInfoOffset);
H
Haojun Liao 已提交
1268 1269
    cleanupResultRowEntry(pEntry);

L
Liu Jicong 已提交
1270
    pCtx[i].resultInfo = pEntry;
1271
    pCtx[i].scanFlag = stage;
H
Haojun Liao 已提交
1272 1273
  }

1274
  initCtxOutputBuffer(pCtx, numOfExprs);
H
Haojun Liao 已提交
1275 1276
}

H
Haojun Liao 已提交
1277
void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size) {
1278 1279
  for (int32_t j = 0; j < size; ++j) {
    struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(&pCtx[j]);
dengyihao's avatar
dengyihao 已提交
1280 1281
    if (isRowEntryInitialized(pResInfo) || fmIsPseudoColumnFunc(pCtx[j].functionId) || pCtx[j].functionId == -1 ||
        fmIsScalarFunc(pCtx[j].functionId)) {
1282 1283 1284
      continue;
    }

H
Haojun Liao 已提交
1285
    pCtx[j].fpSet.init(&pCtx[j], pCtx[j].resultInfo);
1286 1287 1288
  }
}

L
Liu Jicong 已提交
1289
void setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status) {
1290
  if (status == TASK_NOT_COMPLETED) {
H
Haojun Liao 已提交
1291
    pTaskInfo->status = status;
1292 1293
  } else {
    // QUERY_NOT_COMPLETED is not compatible with any other status, so clear its position first
1294
    CLEAR_QUERY_STATUS(pTaskInfo, TASK_NOT_COMPLETED);
H
Haojun Liao 已提交
1295
    pTaskInfo->status |= status;
1296 1297 1298
  }
}

L
Liu Jicong 已提交
1299
void destroyTableQueryInfoImpl(STableQueryInfo* pTableQueryInfo) {
1300 1301 1302 1303
  if (pTableQueryInfo == NULL) {
    return;
  }

L
Liu Jicong 已提交
1304
  //  taosVariantDestroy(&pTableQueryInfo->tag);
dengyihao's avatar
dengyihao 已提交
1305
  //  cleanupResultRowInfo(&pTableQueryInfo->resInfo);
1306 1307
}

1308
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowEntryInfoOffset) {
1309
  for (int32_t i = 0; i < numOfOutput; ++i) {
1310
    pCtx[i].resultInfo = getResultEntryInfo(pResult, i, rowEntryInfoOffset);
1311 1312 1313 1314 1315

    struct SResultRowEntryInfo* pResInfo = pCtx[i].resultInfo;
    if (isRowEntryCompleted(pResInfo) && isRowEntryInitialized(pResInfo)) {
      continue;
    }
1316 1317 1318 1319 1320

    if (fmIsWindowPseudoColumnFunc(pCtx[i].functionId)) {
      continue;
    }

1321 1322 1323 1324 1325 1326
    if (!pResInfo->initialized) {
      if (pCtx[i].functionId != -1) {
        pCtx[i].fpSet.init(&pCtx[i], pResInfo);
      } else {
        pResInfo->initialized = true;
      }
1327 1328 1329 1330
    }
  }
}

H
Haojun Liao 已提交
1331
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep);
1332

1333
void doFilter(const SNode* pFilterNode, SSDataBlock* pBlock) {
1334 1335 1336 1337 1338
  if (pFilterNode == NULL) {
    return;
  }

  SFilterInfo* filter = NULL;
H
Haojun Liao 已提交
1339

H
Haojun Liao 已提交
1340
  // todo move to the initialization function
H
Haojun Liao 已提交
1341
  int32_t code = filterInitFromNode((SNode*)pFilterNode, &filter, 0);
1342

1343
  size_t             numOfCols = taosArrayGetSize(pBlock->pDataBlock);
1344
  SFilterColumnParam param1 = {.numOfCols = numOfCols, .pDataBlock = pBlock->pDataBlock};
1345 1346 1347
  code = filterSetDataFromSlotId(filter, &param1);

  int8_t* rowRes = NULL;
1348

1349
  // todo the keep seems never to be True??
1350
  bool keep = filterExecute(filter, pBlock, &rowRes, NULL, param1.numOfCols);
D
dapan1121 已提交
1351
  filterFreeInfo(filter);
1352

H
Haojun Liao 已提交
1353
  extractQualifiedTupleByFilterResult(pBlock, rowRes, keep);
1354
  blockDataUpdateTsWindow(pBlock, 0);
H
Haojun Liao 已提交
1355 1356

  taosMemoryFree(rowRes);
1357 1358
}

H
Haojun Liao 已提交
1359
void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep) {
1360 1361 1362 1363 1364
  if (keep) {
    return;
  }

  if (rowRes != NULL) {
L
Liu Jicong 已提交
1365
    int32_t      totalRows = pBlock->info.rows;
1366
    SSDataBlock* px = createOneDataBlock(pBlock, true);
1367

1368 1369
    size_t numOfCols = taosArrayGetSize(pBlock->pDataBlock);
    for (int32_t i = 0; i < numOfCols; ++i) {
1370 1371
      SColumnInfoData* pSrc = taosArrayGet(px->pDataBlock, i);
      SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, i);
1372
      // it is a reserved column for scalar function, and no data in this column yet.
1373
      if (pDst->pData == NULL || pSrc->pData == NULL) {
1374 1375 1376
        continue;
      }

1377 1378
      colInfoDataCleanup(pDst, pBlock->info.rows);

1379
      int32_t numOfRows = 0;
1380
      for (int32_t j = 0; j < totalRows; ++j) {
D
dapan1121 已提交
1381 1382 1383
        if (rowRes[j] == 0) {
          continue;
        }
1384

D
dapan1121 已提交
1385
        if (colDataIsNull_s(pSrc, j)) {
1386
          colDataAppendNULL(pDst, numOfRows);
D
dapan1121 已提交
1387
        } else {
1388
          colDataAppend(pDst, numOfRows, colDataGetData(pSrc, j), false);
D
dapan1121 已提交
1389
        }
1390
        numOfRows += 1;
H
Haojun Liao 已提交
1391
      }
1392

1393 1394 1395 1396 1397
      if (pBlock->info.rows == totalRows) {
        pBlock->info.rows = numOfRows;
      } else {
        ASSERT(pBlock->info.rows == numOfRows);
      }
1398
    }
1399

dengyihao's avatar
dengyihao 已提交
1400
    blockDataDestroy(px);  // fix memory leak
1401 1402 1403
  } else {
    // do nothing
    pBlock->info.rows = 0;
1404 1405 1406
  }
}

L
Liu Jicong 已提交
1407 1408
void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                              uint64_t groupId) {
1409
  // for simple group by query without interval, all the tables belong to one group result.
L
Liu Jicong 已提交
1410
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
1411
  SResultRowInfo* pResultRowInfo = &pAggInfo->binfo.resultRowInfo;
1412 1413
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;
1414

1415
  SResultRow* pResultRow = doSetResultOutBufByKey(pAggInfo->aggSup.pResultBuf, pResultRowInfo, (char*)&groupId,
L
Liu Jicong 已提交
1416
                                                  sizeof(groupId), true, groupId, pTaskInfo, false, &pAggInfo->aggSup);
L
Liu Jicong 已提交
1417
  assert(pResultRow != NULL);
1418 1419 1420 1421 1422 1423

  /*
   * not assign result buffer yet, add new result buffer
   * all group belong to one result set, and each group result has different group id so set the id to be one
   */
  if (pResultRow->pageId == -1) {
dengyihao's avatar
dengyihao 已提交
1424 1425
    int32_t ret =
        addNewWindowResultBuf(pResultRow, pAggInfo->aggSup.pResultBuf, groupId, pAggInfo->binfo.pRes->info.rowSize);
1426 1427 1428 1429 1430
    if (ret != TSDB_CODE_SUCCESS) {
      return;
    }
  }

1431
  setResultRowInitCtx(pResultRow, pCtx, numOfOutput, rowEntryInfoOffset);
1432 1433
}

1434
void setExecutionContext(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId, SAggOperatorInfo* pAggInfo) {
H
Haojun Liao 已提交
1435
  if (pAggInfo->groupId != INT32_MIN && pAggInfo->groupId == groupId) {
1436 1437
    return;
  }
1438
#ifdef BUF_PAGE_DEBUG
L
Liu Jicong 已提交
1439
  qDebug("page_setbuf, groupId:%" PRIu64, groupId);
1440
#endif
1441
  doSetTableGroupOutputBuf(pOperator, pAggInfo, numOfOutput, groupId);
1442 1443

  // record the current active group id
H
Haojun Liao 已提交
1444
  pAggInfo->groupId = groupId;
1445 1446
}

1447 1448
static void doUpdateNumOfRows(SResultRow* pRow, int32_t numOfExprs, const int32_t* rowCellOffset) {
  for (int32_t j = 0; j < numOfExprs; ++j) {
1449
    struct SResultRowEntryInfo* pResInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1450 1451 1452 1453 1454 1455 1456 1457 1458 1459
    if (!isRowEntryInitialized(pResInfo)) {
      continue;
    }

    if (pRow->numOfRows < pResInfo->numOfRes) {
      pRow->numOfRows = pResInfo->numOfRes;
    }
  }
}

1460
int32_t finalizeResultRowIntoResultDataBlock(SDiskbasedBuf* pBuf, SResultRowPosition* resultRowPosition,
S
shenglian zhou 已提交
1461 1462 1463
                                             SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, int32_t numOfExprs,
                                             const int32_t* rowCellOffset, SSDataBlock* pBlock,
                                             SExecTaskInfo* pTaskInfo) {
1464 1465 1466 1467 1468 1469 1470 1471 1472
  SFilePage*  page = getBufPage(pBuf, resultRowPosition->pageId);
  SResultRow* pRow = (SResultRow*)((char*)page + resultRowPosition->offset);

  doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
  if (pRow->numOfRows == 0) {
    releaseBufPage(pBuf, page);
    return 0;
  }

1473 1474 1475 1476 1477 1478 1479
  while (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
    int32_t code = blockDataEnsureCapacity(pBlock, pBlock->info.capacity * 1.25);
    if (TAOS_FAILED(code)) {
      releaseBufPage(pBuf, page);
      qError("%s ensure result data capacity failed, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
      longjmp(pTaskInfo->env, code);
    }
1480 1481 1482 1483 1484
  }

  for (int32_t j = 0; j < numOfExprs; ++j) {
    int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1485
    pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1486 1487 1488 1489 1490 1491 1492 1493 1494
    if (pCtx[j].fpSet.finalize) {
      int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
      if (TAOS_FAILED(code)) {
        qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
        longjmp(pTaskInfo->env, code);
      }
    } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
      // do nothing, todo refactor
    } else {
1495 1496
      // expand the result into multiple rows. E.g., _wstart, top(k, 20)
      // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
1497 1498 1499 1500 1501 1502 1503 1504 1505
      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
      char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
      for (int32_t k = 0; k < pRow->numOfRows; ++k) {
        colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
      }
    }
  }

  releaseBufPage(pBuf, page);
1506
  pBlock->info.rows += pRow->numOfRows;
1507 1508 1509 1510

  return 0;
}

X
Xiaoyu Wang 已提交
1511 1512 1513
int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo, SDiskbasedBuf* pBuf,
                           SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset, SqlFunctionCtx* pCtx,
                           int32_t numOfExprs) {
1514
  int32_t numOfRows = getNumOfTotalRes(pGroupResInfo);
1515
  int32_t start = pGroupResInfo->index;
1516

1517
  for (int32_t i = start; i < numOfRows; i += 1) {
L
Liu Jicong 已提交
1518 1519
    SResKeyPos* pPos = taosArrayGetP(pGroupResInfo->pRows, i);
    SFilePage*  page = getBufPage(pBuf, pPos->pos.pageId);
1520

1521
    SResultRow* pRow = (SResultRow*)((char*)page + pPos->pos.offset);
1522 1523

    doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
1524 1525
    if (pRow->numOfRows == 0) {
      pGroupResInfo->index += 1;
1526
      releaseBufPage(pBuf, page);
1527 1528 1529
      continue;
    }

1530 1531 1532 1533 1534
    if (pBlock->info.groupId == 0) {
      pBlock->info.groupId = pPos->groupId;
    } else {
      // current value belongs to different group, it can't be packed into one datablock
      if (pBlock->info.groupId != pPos->groupId) {
1535
        releaseBufPage(pBuf, page);
1536 1537 1538 1539
        break;
      }
    }

1540
    if (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
1541
      releaseBufPage(pBuf, page);
1542 1543 1544 1545 1546
      break;
    }

    pGroupResInfo->index += 1;

1547
    for (int32_t j = 0; j < numOfExprs; ++j) {
1548 1549
      int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1550
      pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1551
      if (pCtx[j].fpSet.finalize) {
1552
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
1553
        qDebug("\npage_finalize %d", numOfExprs);
1554
#endif
1555
        int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
1556
        if (TAOS_FAILED(code)) {
1557 1558
          qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
          longjmp(pTaskInfo->env, code);
1559
        }
1560 1561
      } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
        // do nothing, todo refactor
1562
      } else {
1563 1564
        // expand the result into multiple rows. E.g., _wstart, top(k, 20)
        // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
X
Xiaoyu Wang 已提交
1565 1566
        SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
        char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
1567
        if (pCtx[j].increase) {
L
Liu Jicong 已提交
1568
          int64_t ts = *(int64_t*)in;
1569
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
L
Liu Jicong 已提交
1570
            colDataAppend(pColInfoData, pBlock->info.rows + k, (const char*)&ts, pCtx[j].resultInfo->isNullRes);
1571 1572 1573 1574 1575 1576
            ts++;
          }
        } else {
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
          }
X
Xiaoyu Wang 已提交
1577
        }
1578
      }
1579 1580
    }

1581
    releaseBufPage(pBuf, page);
1582
    pBlock->info.rows += pRow->numOfRows;
L
Liu Jicong 已提交
1583 1584 1585
    //    if (pBlock->info.rows >= pBlock->info.capacity) {  // output buffer is full
    //      break;
    //    }
1586 1587
  }

X
Xiaoyu Wang 已提交
1588 1589
  qDebug("%s result generated, rows:%d, groupId:%" PRIu64, GET_TASKID(pTaskInfo), pBlock->info.rows,
         pBlock->info.groupId);
1590
  blockDataUpdateTsWindow(pBlock, 0);
1591 1592 1593
  return 0;
}

X
Xiaoyu Wang 已提交
1594 1595
void doBuildResultDatablock(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
                            SDiskbasedBuf* pBuf) {
1596 1597
  SExprInfo*     pExprInfo = pOperator->exprSupp.pExprInfo;
  int32_t        numOfExprs = pOperator->exprSupp.numOfExprs;
1598 1599
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

1600
  int32_t*        rowCellOffset = pOperator->exprSupp.rowEntryInfoOffset;
X
Xiaoyu Wang 已提交
1601
  SSDataBlock*    pBlock = pbInfo->pRes;
1602
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
1603

1604
  blockDataCleanup(pBlock);
1605
  if (!hasDataInGroupInfo(pGroupResInfo)) {
1606 1607 1608
    return;
  }

1609 1610
  // clear the existed group id
  pBlock->info.groupId = 0;
1611
  doCopyToSDataBlock(pTaskInfo, pBlock, pExprInfo, pBuf, pGroupResInfo, rowCellOffset, pCtx, numOfExprs);
1612 1613
}

L
Liu Jicong 已提交
1614
static void updateNumOfRowsInResultRows(SqlFunctionCtx* pCtx, int32_t numOfOutput, SResultRowInfo* pResultRowInfo,
1615
                                        int32_t* rowEntryInfoOffset) {
1616
  // update the number of result for each, only update the number of rows for the corresponding window result.
L
Liu Jicong 已提交
1617 1618 1619
  //  if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
  //    return;
  //  }
H
Haojun Liao 已提交
1620
#if 0
1621
  for (int32_t i = 0; i < pResultRowInfo->size; ++i) {
L
Liu Jicong 已提交
1622
    SResultRow* pResult = pResultRowInfo->pResult[i];
1623 1624 1625 1626 1627 1628 1629

    for (int32_t j = 0; j < numOfOutput; ++j) {
      int32_t functionId = pCtx[j].functionId;
      if (functionId == FUNCTION_TS || functionId == FUNCTION_TAG || functionId == FUNCTION_TAGPRJ) {
        continue;
      }

1630
      SResultRowEntryInfo* pCell = getResultEntryInfo(pResult, j, rowEntryInfoOffset);
1631
      pResult->numOfRows = (uint16_t)(TMAX(pResult->numOfRows, pCell->numOfRes));
1632 1633
    }
  }
H
Haojun Liao 已提交
1634
#endif
1635 1636
}

L
Liu Jicong 已提交
1637
static int32_t compressQueryColData(SColumnInfoData* pColRes, int32_t numOfRows, char* data, int8_t compressed) {
1638 1639
  int32_t colSize = pColRes->info.bytes * numOfRows;
  return (*(tDataTypes[pColRes->info.type].compFunc))(pColRes->pData, colSize, numOfRows, data,
L
Liu Jicong 已提交
1640
                                                      colSize + COMP_OVERFLOW_BYTES, compressed, NULL, 0);
1641 1642
}

1643 1644 1645
int32_t doFillTimeIntervalGapsInResults(struct SFillInfo* pFillInfo, SSDataBlock* pBlock, int32_t capacity) {
  int32_t numOfRows = (int32_t)taosFillResultDataBlock(pFillInfo, pBlock, capacity - pBlock->info.rows);
  return pBlock->info.rows;
1646 1647
}

L
Liu Jicong 已提交
1648 1649
void queryCostStatis(SExecTaskInfo* pTaskInfo) {
  STaskCostInfo* pSummary = &pTaskInfo->cost;
1650

L
Liu Jicong 已提交
1651 1652 1653
  //  uint64_t hashSize = taosHashGetMemSize(pQInfo->runtimeEnv.pResultRowHashTable);
  //  hashSize += taosHashGetMemSize(pRuntimeEnv->tableqinfoGroupInfo.map);
  //  pSummary->hashSize = hashSize;
1654 1655 1656 1657

  // add the merge time
  pSummary->elapsedTime += pSummary->firstStageMergeTime;

L
Liu Jicong 已提交
1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668
  //  SResultRowPool* p = pTaskInfo->pool;
  //  if (p != NULL) {
  //    pSummary->winInfoSize = getResultRowPoolMemSize(p);
  //    pSummary->numOfTimeWindows = getNumOfAllocatedResultRows(p);
  //  } else {
  //    pSummary->winInfoSize = 0;
  //    pSummary->numOfTimeWindows = 0;
  //  }
  //
  //  calculateOperatorProfResults(pQInfo);

1669 1670
  SFileBlockLoadRecorder* pRecorder = pSummary->pRecoder;
  if (pSummary->pRecoder != NULL) {
X
Xiaoyu Wang 已提交
1671 1672
    qDebug("%s :cost summary: elapsed time:%" PRId64 " us, first merge:%" PRId64
           " us, total blocks:%d, "
1673 1674 1675 1676
           "load block statis:%d, load data block:%d, total rows:%" PRId64 ", check rows:%" PRId64,
           GET_TASKID(pTaskInfo), pSummary->elapsedTime, pSummary->firstStageMergeTime, pRecorder->totalBlocks,
           pRecorder->loadBlockStatis, pRecorder->loadBlocks, pRecorder->totalRows, pRecorder->totalCheckedRows);
  }
L
Liu Jicong 已提交
1677 1678 1679
  // qDebug("QInfo:0x%"PRIx64" :cost summary: winResPool size:%.2f Kb, numOfWin:%"PRId64", tableInfoSize:%.2f Kb,
  // hashTable:%.2f Kb", pQInfo->qId, pSummary->winInfoSize/1024.0,
  //      pSummary->numOfTimeWindows, pSummary->tableInfoSize/1024.0, pSummary->hashSize/1024.0);
1680 1681
}

L
Liu Jicong 已提交
1682 1683 1684
// static void updateOffsetVal(STaskRuntimeEnv *pRuntimeEnv, SDataBlockInfo *pBlockInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
1685
//
L
Liu Jicong 已提交
1686
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1687
//
L
Liu Jicong 已提交
1688 1689 1690 1691
//   if (pQueryAttr->limit.offset == pBlockInfo->rows) {  // current block will ignore completed
//     pTableQueryInfo->lastKey = QUERY_IS_ASC_QUERY(pQueryAttr) ? pBlockInfo->window.ekey + step :
//     pBlockInfo->window.skey + step; pQueryAttr->limit.offset = 0; return;
//   }
1692
//
L
Liu Jicong 已提交
1693 1694 1695 1696 1697
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     pQueryAttr->pos = (int32_t)pQueryAttr->limit.offset;
//   } else {
//     pQueryAttr->pos = pBlockInfo->rows - (int32_t)pQueryAttr->limit.offset - 1;
//   }
1698
//
L
Liu Jicong 已提交
1699
//   assert(pQueryAttr->pos >= 0 && pQueryAttr->pos <= pBlockInfo->rows - 1);
1700
//
L
Liu Jicong 已提交
1701 1702
//   SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//   SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1703
//
L
Liu Jicong 已提交
1704 1705
//   // update the pQueryAttr->limit.offset value, and pQueryAttr->pos value
//   TSKEY *keys = (TSKEY *) pColInfoData->pData;
1706
//
L
Liu Jicong 已提交
1707 1708 1709
//   // update the offset value
//   pTableQueryInfo->lastKey = keys[pQueryAttr->pos];
//   pQueryAttr->limit.offset = 0;
1710
//
L
Liu Jicong 已提交
1711
//   int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
1712
//
L
Liu Jicong 已提交
1713 1714 1715 1716
//   //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numBlocksOfStep:%d, numOfRes:%d,
//   lastKey:%"PRId64, GET_TASKID(pRuntimeEnv),
//          pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes, pQuery->current->lastKey);
// }
1717

L
Liu Jicong 已提交
1718 1719
// void skipBlocks(STaskRuntimeEnv *pRuntimeEnv) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
1720
//
L
Liu Jicong 已提交
1721 1722 1723
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0) {
//     return;
//   }
1724
//
L
Liu Jicong 已提交
1725 1726
//   pQueryAttr->pos = 0;
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1727
//
L
Liu Jicong 已提交
1728 1729
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
//   TsdbQueryHandleT pTsdbReadHandle = pRuntimeEnv->pTsdbReadHandle;
1730
//
L
Liu Jicong 已提交
1731 1732 1733 1734 1735
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pTsdbReadHandle)) {
//     if (isTaskKilled(pRuntimeEnv->qinfo)) {
//       longjmp(pRuntimeEnv->env, TSDB_CODE_TSC_QUERY_CANCELLED);
//     }
1736
//
L
Liu Jicong 已提交
1737
//     tsdbRetrieveDataBlockInfo(pTsdbReadHandle, &blockInfo);
1738
//
L
Liu Jicong 已提交
1739 1740 1741 1742
//     if (pQueryAttr->limit.offset > blockInfo.rows) {
//       pQueryAttr->limit.offset -= blockInfo.rows;
//       pTableQueryInfo->lastKey = (QUERY_IS_ASC_QUERY(pQueryAttr)) ? blockInfo.window.ekey : blockInfo.window.skey;
//       pTableQueryInfo->lastKey += step;
1743
//
L
Liu Jicong 已提交
1744 1745 1746 1747 1748 1749 1750
//       //qDebug("QInfo:0x%"PRIx64" skip rows:%d, offset:%" PRId64, GET_TASKID(pRuntimeEnv), blockInfo.rows,
//              pQuery->limit.offset);
//     } else {  // find the appropriated start position in current block
//       updateOffsetVal(pRuntimeEnv, &blockInfo);
//       break;
//     }
//   }
1751
//
L
Liu Jicong 已提交
1752 1753 1754 1755 1756 1757 1758 1759 1760
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
// }

// static TSKEY doSkipIntervalProcess(STaskRuntimeEnv* pRuntimeEnv, STimeWindow* win, SDataBlockInfo* pBlockInfo,
// STableQueryInfo* pTableQueryInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
1761
//
L
Liu Jicong 已提交
1762 1763 1764
//   assert(pQueryAttr->limit.offset == 0);
//   STimeWindow tw = *win;
//   getNextTimeWindow(pQueryAttr, &tw);
1765
//
L
Liu Jicong 已提交
1766 1767
//   if ((tw.skey <= pBlockInfo->window.ekey && QUERY_IS_ASC_QUERY(pQueryAttr)) ||
//       (tw.ekey >= pBlockInfo->window.skey && !QUERY_IS_ASC_QUERY(pQueryAttr))) {
1768
//
L
Liu Jicong 已提交
1769 1770 1771 1772
//     // load the data block and check data remaining in current data block
//     // TODO optimize performance
//     SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//     SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1773
//
L
Liu Jicong 已提交
1774 1775 1776 1777
//     tw = *win;
//     int32_t startPos =
//         getNextQualifiedWindow(pQueryAttr, &tw, pBlockInfo, pColInfoData->pData, binarySearchForKey, -1);
//     assert(startPos >= 0);
1778
//
L
Liu Jicong 已提交
1779 1780
//     // set the abort info
//     pQueryAttr->pos = startPos;
1781
//
L
Liu Jicong 已提交
1782 1783 1784 1785
//     // reset the query start timestamp
//     pTableQueryInfo->win.skey = ((TSKEY *)pColInfoData->pData)[startPos];
//     pQueryAttr->window.skey = pTableQueryInfo->win.skey;
//     TSKEY key = pTableQueryInfo->win.skey;
1786
//
L
Liu Jicong 已提交
1787 1788
//     pWindowResInfo->prevSKey = tw.skey;
//     int32_t index = pRuntimeEnv->resultRowInfo.curIndex;
1789
//
L
Liu Jicong 已提交
1790 1791
//     int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
//     pRuntimeEnv->resultRowInfo.curIndex = index;  // restore the window index
1792
//
L
Liu Jicong 已提交
1793 1794 1795 1796
//     //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numOfRows:%d, numOfRes:%d,
//     lastKey:%" PRId64,
//            GET_TASKID(pRuntimeEnv), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes,
//            pQueryAttr->current->lastKey);
1797
//
L
Liu Jicong 已提交
1798 1799 1800 1801 1802
//     return key;
//   } else {  // do nothing
//     pQueryAttr->window.skey      = tw.skey;
//     pWindowResInfo->prevSKey = tw.skey;
//     pTableQueryInfo->lastKey = tw.skey;
1803
//
L
Liu Jicong 已提交
1804 1805
//     return tw.skey;
//   }
1806
//
L
Liu Jicong 已提交
1807 1808 1809 1810 1811 1812 1813 1814 1815 1816
//   return true;
// }

// static bool skipTimeInterval(STaskRuntimeEnv *pRuntimeEnv, TSKEY* start) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     assert(*start <= pRuntimeEnv->current->lastKey);
//   } else {
//     assert(*start >= pRuntimeEnv->current->lastKey);
//   }
1817
//
L
Liu Jicong 已提交
1818 1819 1820 1821 1822
//   // if queried with value filter, do NOT forward query start position
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0 || pRuntimeEnv->pTsBuf != NULL ||
//   pRuntimeEnv->pFillInfo != NULL) {
//     return true;
//   }
1823
//
L
Liu Jicong 已提交
1824 1825 1826 1827 1828 1829 1830
//   /*
//    * 1. for interval without interpolation query we forward pQueryAttr->interval.interval at a time for
//    *    pQueryAttr->limit.offset times. Since hole exists, pQueryAttr->interval.interval*pQueryAttr->limit.offset
//    value is
//    *    not valid. otherwise, we only forward pQueryAttr->limit.offset number of points
//    */
//   assert(pRuntimeEnv->resultRowInfo.prevSKey == TSKEY_INITIAL_VAL);
1831
//
L
Liu Jicong 已提交
1832 1833
//   STimeWindow w = TSWINDOW_INITIALIZER;
//   bool ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1834
//
L
Liu Jicong 已提交
1835 1836
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
//   STableQueryInfo *pTableQueryInfo = pRuntimeEnv->current;
1837
//
L
Liu Jicong 已提交
1838 1839 1840
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pRuntimeEnv->pTsdbReadHandle)) {
//     tsdbRetrieveDataBlockInfo(pRuntimeEnv->pTsdbReadHandle, &blockInfo);
1841
//
L
Liu Jicong 已提交
1842 1843 1844 1845 1846 1847 1848 1849 1850
//     if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       if (pWindowResInfo->prevSKey == TSKEY_INITIAL_VAL) {
//         getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.skey, blockInfo.window.skey, pQueryAttr->window.ekey,
//         &w); pWindowResInfo->prevSKey = w.skey;
//       }
//     } else {
//       getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.ekey, pQueryAttr->window.ekey, blockInfo.window.ekey, &w);
//       pWindowResInfo->prevSKey = w.skey;
//     }
1851
//
L
Liu Jicong 已提交
1852 1853
//     // the first time window
//     STimeWindow win = getActiveTimeWindow(pWindowResInfo, pWindowResInfo->prevSKey, pQueryAttr);
1854
//
L
Liu Jicong 已提交
1855 1856
//     while (pQueryAttr->limit.offset > 0) {
//       STimeWindow tw = win;
1857
//
L
Liu Jicong 已提交
1858 1859 1860
//       if ((win.ekey <= blockInfo.window.ekey && ascQuery) || (win.ekey >= blockInfo.window.skey && !ascQuery)) {
//         pQueryAttr->limit.offset -= 1;
//         pWindowResInfo->prevSKey = win.skey;
1861
//
L
Liu Jicong 已提交
1862 1863 1864 1865 1866 1867
//         // current time window is aligned with blockInfo.window.ekey
//         // restart it from next data block by set prevSKey to be TSKEY_INITIAL_VAL;
//         if ((win.ekey == blockInfo.window.ekey && ascQuery) || (win.ekey == blockInfo.window.skey && !ascQuery)) {
//           pWindowResInfo->prevSKey = TSKEY_INITIAL_VAL;
//         }
//       }
1868
//
L
Liu Jicong 已提交
1869 1870 1871 1872
//       if (pQueryAttr->limit.offset == 0) {
//         *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//         return true;
//       }
1873
//
L
Liu Jicong 已提交
1874 1875
//       // current window does not ended in current data block, try next data block
//       getNextTimeWindow(pQueryAttr, &tw);
1876
//
L
Liu Jicong 已提交
1877 1878 1879 1880 1881 1882 1883 1884 1885
//       /*
//        * If the next time window still starts from current data block,
//        * load the primary timestamp column first, and then find the start position for the next queried time window.
//        * Note that only the primary timestamp column is required.
//        * TODO: Optimize for this cases. All data blocks are not needed to be loaded, only if the first actually
//        required
//        * time window resides in current data block.
//        */
//       if ((tw.skey <= blockInfo.window.ekey && ascQuery) || (tw.ekey >= blockInfo.window.skey && !ascQuery)) {
1886
//
L
Liu Jicong 已提交
1887 1888
//         SArray *pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//         SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1889
//
L
Liu Jicong 已提交
1890 1891 1892
//         if ((win.ekey > blockInfo.window.ekey && ascQuery) || (win.ekey < blockInfo.window.skey && !ascQuery)) {
//           pQueryAttr->limit.offset -= 1;
//         }
1893
//
L
Liu Jicong 已提交
1894 1895 1896 1897 1898 1899 1900 1901
//         if (pQueryAttr->limit.offset == 0) {
//           *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//           return true;
//         } else {
//           tw = win;
//           int32_t startPos =
//               getNextQualifiedWindow(pQueryAttr, &tw, &blockInfo, pColInfoData->pData, binarySearchForKey, -1);
//           assert(startPos >= 0);
1902
//
L
Liu Jicong 已提交
1903 1904 1905 1906 1907 1908 1909 1910 1911 1912 1913
//           // set the abort info
//           pQueryAttr->pos = startPos;
//           pTableQueryInfo->lastKey = ((TSKEY *)pColInfoData->pData)[startPos];
//           pWindowResInfo->prevSKey = tw.skey;
//           win = tw;
//         }
//       } else {
//         break;  // offset is not 0, and next time window begins or ends in the next block.
//       }
//     }
//   }
1914
//
L
Liu Jicong 已提交
1915 1916 1917 1918
//   // check for error
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
1919
//
L
Liu Jicong 已提交
1920 1921
//   return true;
// }
1922

1923
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num) {
H
Haojun Liao 已提交
1924
  if (p->pDownstream == NULL) {
H
Haojun Liao 已提交
1925
    assert(p->numOfDownstream == 0);
1926 1927
  }

wafwerar's avatar
wafwerar 已提交
1928
  p->pDownstream = taosMemoryCalloc(1, num * POINTER_BYTES);
1929 1930 1931 1932 1933 1934 1935
  if (p->pDownstream == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  memcpy(p->pDownstream, pDownstream, num * POINTER_BYTES);
  p->numOfDownstream = num;
  return TSDB_CODE_SUCCESS;
1936 1937
}

wmmhello's avatar
wmmhello 已提交
1938
static void doDestroyTableList(STableListInfo* pTableqinfoList);
1939

1940
static void doTableQueryInfoTimeWindowCheck(SExecTaskInfo* pTaskInfo, STableQueryInfo* pTableQueryInfo, int32_t order) {
H
Haojun Liao 已提交
1941 1942
#if 0
    if (order == TSDB_ORDER_ASC) {
1943 1944
    assert(
        (pTableQueryInfo->win.skey <= pTableQueryInfo->win.ekey) &&
H
Haojun Liao 已提交
1945 1946
        (pTableQueryInfo->lastKey >= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey >= pTaskInfo->window.skey && pTableQueryInfo->win.ekey <= pTaskInfo->window.ekey));
1947 1948 1949
  } else {
    assert(
        (pTableQueryInfo->win.skey >= pTableQueryInfo->win.ekey) &&
H
Haojun Liao 已提交
1950 1951
        (pTableQueryInfo->lastKey <= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey <= pTaskInfo->window.skey && pTableQueryInfo->win.ekey >= pTaskInfo->window.ekey));
1952
  }
H
Haojun Liao 已提交
1953
#endif
1954 1955
}

1956 1957 1958 1959
typedef struct SFetchRspHandleWrapper {
  uint32_t exchangeId;
  int32_t  sourceIndex;
} SFetchRspHandleWrapper;
1960

D
dapan1121 已提交
1961
int32_t loadRemoteDataCallback(void* param, SDataBuf* pMsg, int32_t code) {
X
Xiaoyu Wang 已提交
1962
  SFetchRspHandleWrapper* pWrapper = (SFetchRspHandleWrapper*)param;
1963 1964 1965 1966 1967 1968 1969

  SExchangeInfo* pExchangeInfo = taosAcquireRef(exchangeObjRefPool, pWrapper->exchangeId);
  if (pExchangeInfo == NULL) {
    qWarn("failed to acquire exchange operator, since it may have been released");
    return TSDB_CODE_SUCCESS;
  }

X
Xiaoyu Wang 已提交
1970
  int32_t          index = pWrapper->sourceIndex;
1971
  SSourceDataInfo* pSourceDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, index);
1972

H
Haojun Liao 已提交
1973 1974
  if (code == TSDB_CODE_SUCCESS) {
    pSourceDataInfo->pRsp = pMsg->pData;
1975

H
Haojun Liao 已提交
1976 1977
    SRetrieveTableRsp* pRsp = pSourceDataInfo->pRsp;
    pRsp->numOfRows = htonl(pRsp->numOfRows);
dengyihao's avatar
dengyihao 已提交
1978
    pRsp->compLen = htonl(pRsp->compLen);
1979
    pRsp->numOfCols = htonl(pRsp->numOfCols);
dengyihao's avatar
dengyihao 已提交
1980
    pRsp->useconds = htobe64(pRsp->useconds);
1981

1982
    ASSERT(pRsp != NULL);
1983
    qDebug("%s fetch rsp received, index:%d, rows:%d", pSourceDataInfo->taskId, index, pRsp->numOfRows);
H
Haojun Liao 已提交
1984 1985
  } else {
    pSourceDataInfo->code = code;
D
dapan1121 已提交
1986
    qDebug("%s fetch rsp received, index:%d, error:%d", pSourceDataInfo->taskId, index, tstrerror(code));
H
Haojun Liao 已提交
1987
  }
H
Haojun Liao 已提交
1988

H
Haojun Liao 已提交
1989
  pSourceDataInfo->status = EX_SOURCE_DATA_READY;
1990 1991 1992 1993 1994

  tsem_post(&pExchangeInfo->ready);
  taosReleaseRef(exchangeObjRefPool, pWrapper->exchangeId);

  taosMemoryFree(pWrapper);
wmmhello's avatar
wmmhello 已提交
1995
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
1996 1997 1998 1999
}

static void destroySendMsgInfo(SMsgSendInfo* pMsgBody) {
  assert(pMsgBody != NULL);
wafwerar's avatar
wafwerar 已提交
2000 2001
  taosMemoryFreeClear(pMsgBody->msgInfo.pData);
  taosMemoryFreeClear(pMsgBody);
H
Haojun Liao 已提交
2002 2003
}

D
dapan1121 已提交
2004
void qProcessRspMsg(void* parent, SRpcMsg* pMsg, SEpSet* pEpSet) {
S
Shengliang Guan 已提交
2005 2006
  SMsgSendInfo* pSendInfo = (SMsgSendInfo*)pMsg->info.ahandle;
  assert(pMsg->info.ahandle != NULL);
H
Haojun Liao 已提交
2007 2008 2009 2010

  SDataBuf buf = {.len = pMsg->contLen, .pData = NULL};

  if (pMsg->contLen > 0) {
wafwerar's avatar
wafwerar 已提交
2011
    buf.pData = taosMemoryCalloc(1, pMsg->contLen);
H
Haojun Liao 已提交
2012 2013 2014 2015 2016 2017 2018 2019 2020 2021 2022
    if (buf.pData == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      pMsg->code = TSDB_CODE_OUT_OF_MEMORY;
    } else {
      memcpy(buf.pData, pMsg->pCont, pMsg->contLen);
    }
  }

  pSendInfo->fp(pSendInfo->param, &buf, pMsg->code);
  rpcFreeCont(pMsg->pCont);
  destroySendMsgInfo(pSendInfo);
2023 2024
}

L
Liu Jicong 已提交
2025
static int32_t doSendFetchDataRequest(SExchangeInfo* pExchangeInfo, SExecTaskInfo* pTaskInfo, int32_t sourceIndex) {
2026
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2027

wafwerar's avatar
wafwerar 已提交
2028
  SResFetchReq* pMsg = taosMemoryCalloc(1, sizeof(SResFetchReq));
2029 2030 2031 2032
  if (NULL == pMsg) {
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }
2033

L
Liu Jicong 已提交
2034 2035
  SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, sourceIndex);
  SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, sourceIndex);
2036

2037 2038
  ASSERT(pDataInfo->status == EX_SOURCE_DATA_NOT_READY);

2039 2040 2041
  qDebug("%s build fetch msg and send to vgId:%d, ep:%s, taskId:0x%" PRIx64 ", execId:%d, %d/%" PRIzu,
         GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->addr.epSet.eps[0].fqdn, pSource->taskId, pSource->execId,
         sourceIndex, totalSources);
2042 2043 2044 2045 2046

  pMsg->header.vgId = htonl(pSource->addr.nodeId);
  pMsg->sId = htobe64(pSource->schedId);
  pMsg->taskId = htobe64(pSource->taskId);
  pMsg->queryId = htobe64(pTaskInfo->id.queryId);
D
dapan1121 已提交
2047
  pMsg->execId = htonl(pSource->execId);
2048 2049

  // send the fetch remote task result reques
wafwerar's avatar
wafwerar 已提交
2050
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
2051
  if (NULL == pMsgSendInfo) {
wafwerar's avatar
wafwerar 已提交
2052
    taosMemoryFreeClear(pMsg);
2053 2054 2055
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SMsgSendInfo));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
H
Haojun Liao 已提交
2056 2057
  }

2058
  SFetchRspHandleWrapper* pWrapper = taosMemoryCalloc(1, sizeof(SFetchRspHandleWrapper));
X
Xiaoyu Wang 已提交
2059
  pWrapper->exchangeId = pExchangeInfo->self;
2060 2061 2062
  pWrapper->sourceIndex = sourceIndex;

  pMsgSendInfo->param = pWrapper;
2063 2064
  pMsgSendInfo->msgInfo.pData = pMsg;
  pMsgSendInfo->msgInfo.len = sizeof(SResFetchReq);
L
Liu Jicong 已提交
2065
  pMsgSendInfo->msgType = pSource->fetchMsgType;
2066
  pMsgSendInfo->fp = loadRemoteDataCallback;
2067

2068
  int64_t transporterId = 0;
L
Liu Jicong 已提交
2069
  int32_t code = asyncSendMsgToServer(pExchangeInfo->pTransporter, &pSource->addr.epSet, &transporterId, pMsgSendInfo);
2070 2071 2072
  return TSDB_CODE_SUCCESS;
}

2073
int32_t extractDataBlockFromFetchRsp(SSDataBlock* pRes, SLoadRemoteDataInfo* pLoadInfo, int32_t numOfRows, char* pData,
L
Liu Jicong 已提交
2074 2075
                                     int32_t compLen, int32_t numOfOutput, int64_t startTs, uint64_t* total,
                                     SArray* pColList) {
H
Haojun Liao 已提交
2076
  if (pColList == NULL) {  // data from other sources
2077
    blockDataCleanup(pRes);
2078
    //    blockDataEnsureCapacity(pRes, numOfRows);
2079
    blockDecode(pRes, numOfOutput, numOfRows, pData);
H
Haojun Liao 已提交
2080
  } else {  // extract data according to pColList
2081
    ASSERT(numOfOutput == taosArrayGetSize(pColList));
2082 2083 2084 2085 2086
    char* pStart = pData;

    int32_t numOfCols = htonl(*(int32_t*)pStart);
    pStart += sizeof(int32_t);

2087
    // todo refactor:extract method
2088
    SSysTableSchema* pSchema = (SSysTableSchema*)pStart;
dengyihao's avatar
dengyihao 已提交
2089
    for (int32_t i = 0; i < numOfCols; ++i) {
2090 2091 2092 2093 2094 2095 2096
      SSysTableSchema* p = (SSysTableSchema*)pStart;

      p->colId = htons(p->colId);
      p->bytes = htonl(p->bytes);
      pStart += sizeof(SSysTableSchema);
    }

2097
    SSDataBlock* pBlock = createDataBlock();
dengyihao's avatar
dengyihao 已提交
2098
    for (int32_t i = 0; i < numOfCols; ++i) {
2099 2100
      SColumnInfoData idata = createColumnInfoData(pSchema[i].type, pSchema[i].bytes, pSchema[i].colId);
      blockDataAppendColInfo(pBlock, &idata);
2101 2102
    }

2103
    blockDecode(pBlock, numOfCols, numOfRows, pStart);
2104 2105
    blockDataEnsureCapacity(pRes, numOfRows);

H
Haojun Liao 已提交
2106
    // data from mnode
2107
    pRes->info.rows = numOfRows;
2108 2109
    relocateColumnData(pRes, pColList, pBlock->pDataBlock, false);
    blockDataDestroy(pBlock);
2110
  }
2111

2112 2113
  // todo move this to time window aggregator, since the primary timestamp may not be known by exchange operator.
  blockDataUpdateTsWindow(pRes, 0);
2114

2115
  int64_t el = taosGetTimestampUs() - startTs;
2116

H
Haojun Liao 已提交
2117 2118
  pLoadInfo->totalRows += numOfRows;
  pLoadInfo->totalSize += compLen;
2119

H
Haojun Liao 已提交
2120 2121 2122
  if (total != NULL) {
    *total += numOfRows;
  }
2123

H
Haojun Liao 已提交
2124
  pLoadInfo->totalElapsed += el;
2125 2126
  return TSDB_CODE_SUCCESS;
}
2127

L
Liu Jicong 已提交
2128 2129
static void* setAllSourcesCompleted(SOperatorInfo* pOperator, int64_t startTs) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
2130
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
H
Haojun Liao 已提交
2131

2132
  int64_t              el = taosGetTimestampUs() - startTs;
H
Haojun Liao 已提交
2133
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2134

H
Haojun Liao 已提交
2135
  pLoadInfo->totalElapsed += el;
H
Haojun Liao 已提交
2136

2137
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);
L
Liu Jicong 已提交
2138 2139 2140
  qDebug("%s all %" PRIzu " sources are exhausted, total rows: %" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
         GET_TASKID(pTaskInfo), totalSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
         pLoadInfo->totalElapsed / 1000.0);
2141 2142 2143 2144 2145

  doSetOperatorCompleted(pOperator);
  return NULL;
}

L
Liu Jicong 已提交
2146 2147
static SSDataBlock* concurrentlyLoadRemoteDataImpl(SOperatorInfo* pOperator, SExchangeInfo* pExchangeInfo,
                                                   SExecTaskInfo* pTaskInfo) {
2148 2149 2150 2151 2152 2153 2154 2155
  int32_t code = 0;
  int64_t startTs = taosGetTimestampUs();
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  while (1) {
    int32_t completed = 0;
    for (int32_t i = 0; i < totalSources; ++i) {
      SSourceDataInfo* pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, i);
2156
      if (pDataInfo->status == EX_SOURCE_DATA_EXHAUSTED) {
2157
        completed += 1;
H
Haojun Liao 已提交
2158 2159
        continue;
      }
2160

2161
      if (pDataInfo->status != EX_SOURCE_DATA_READY) {
2162 2163 2164
        continue;
      }

2165 2166 2167 2168 2169
      if (pDataInfo->code != TSDB_CODE_SUCCESS) {
        code = pDataInfo->code;
        goto _error;
      }

L
Liu Jicong 已提交
2170
      SRetrieveTableRsp*     pRsp = pDataInfo->pRsp;
X
Xiaoyu Wang 已提交
2171
      SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, i);
2172

L
Liu Jicong 已提交
2173
      SSDataBlock*         pRes = pExchangeInfo->pResult;
H
Haojun Liao 已提交
2174
      SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2175
      if (pRsp->numOfRows == 0) {
2176 2177
        qDebug("%s vgId:%d, taskId:0x%" PRIx64 " execId:%d index:%d completed, rowsOfSource:%" PRIu64
               ", totalRows:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
D
dapan1121 已提交
2178
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pDataInfo->totalRows,
2179
               pExchangeInfo->loadInfo.totalRows, completed + 1, i + 1, totalSources);
2180
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2181
        completed += 1;
D
dapan1121 已提交
2182
        taosMemoryFreeClear(pDataInfo->pRsp);
2183 2184
        continue;
      }
H
Haojun Liao 已提交
2185

H
Haojun Liao 已提交
2186
      SRetrieveTableRsp* pTableRsp = pDataInfo->pRsp;
L
Liu Jicong 已提交
2187 2188 2189
      code =
          extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pTableRsp->numOfRows, pTableRsp->data,
                                       pTableRsp->compLen, pTableRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
2190
      if (code != 0) {
2191
        taosMemoryFreeClear(pDataInfo->pRsp);
2192 2193 2194
        goto _error;
      }

2195
      if (pRsp->completed == 1) {
2196 2197
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d"
X
Xiaoyu Wang 已提交
2198 2199
               " index:%d completed, numOfRows:%d, rowsOfSource:%" PRIu64 ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64
               ", completed:%d try next %d/%" PRIzu,
2200 2201
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pRes->info.rows,
               pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, completed + 1, i + 1, totalSources);
2202
        completed += 1;
2203
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2204
      } else {
D
dapan1121 已提交
2205
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
dengyihao's avatar
dengyihao 已提交
2206
               ", totalBytes:%" PRIu64,
2207 2208
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
               pLoadInfo->totalRows, pLoadInfo->totalSize);
2209 2210
      }

2211 2212
      taosMemoryFreeClear(pDataInfo->pRsp);

2213 2214
      if (pDataInfo->status != EX_SOURCE_DATA_EXHAUSTED) {
        pDataInfo->status = EX_SOURCE_DATA_NOT_READY;
2215 2216
        code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
        if (code != TSDB_CODE_SUCCESS) {
2217
          taosMemoryFreeClear(pDataInfo->pRsp);
2218 2219 2220 2221 2222 2223 2224
          goto _error;
        }
      }

      return pExchangeInfo->pResult;
    }

2225
    if (completed == totalSources) {
2226 2227
      return setAllSourcesCompleted(pOperator, startTs);
    }
H
Haojun Liao 已提交
2228 2229

    sched_yield();
2230 2231 2232 2233 2234 2235 2236
  }

_error:
  pTaskInfo->code = code;
  return NULL;
}

L
Liu Jicong 已提交
2237 2238 2239
static int32_t prepareConcurrentlyLoad(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2240

L
Liu Jicong 已提交
2241
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2242 2243 2244
  int64_t startTs = taosGetTimestampUs();

  // Asynchronously send all fetch requests to all sources.
L
Liu Jicong 已提交
2245
  for (int32_t i = 0; i < totalSources; ++i) {
2246 2247
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
    if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
2248 2249
      pTaskInfo->code = code;
      return code;
2250 2251 2252 2253
    }
  }

  int64_t endTs = taosGetTimestampUs();
2254
  qDebug("%s send all fetch requests to %" PRIzu " sources completed, elapsed:%.2fms", GET_TASKID(pTaskInfo),
X
Xiaoyu Wang 已提交
2255
         totalSources, (endTs - startTs) / 1000.0);
2256

2257
  pOperator->status = OP_RES_TO_RETURN;
H
Haojun Liao 已提交
2258
  pOperator->cost.openCost = taosGetTimestampUs() - startTs;
2259

2260
  tsem_wait(&pExchangeInfo->ready);
H
Haojun Liao 已提交
2261
  return TSDB_CODE_SUCCESS;
2262 2263
}

L
Liu Jicong 已提交
2264 2265 2266
static SSDataBlock* seqLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2267

L
Liu Jicong 已提交
2268
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2269
  int64_t startTs = taosGetTimestampUs();
2270

L
Liu Jicong 已提交
2271
  while (1) {
2272 2273
    if (pExchangeInfo->current >= totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
2274
    }
2275

2276 2277 2278
    doSendFetchDataRequest(pExchangeInfo, pTaskInfo, pExchangeInfo->current);
    tsem_wait(&pExchangeInfo->ready);

dengyihao's avatar
dengyihao 已提交
2279
    SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, pExchangeInfo->current);
X
Xiaoyu Wang 已提交
2280
    SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, pExchangeInfo->current);
2281

H
Haojun Liao 已提交
2282
    if (pDataInfo->code != TSDB_CODE_SUCCESS) {
2283 2284
      qError("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d error happens, code:%s", GET_TASKID(pTaskInfo),
             pSource->addr.nodeId, pSource->taskId, pSource->execId, tstrerror(pDataInfo->code));
H
Haojun Liao 已提交
2285 2286 2287 2288
      pOperator->pTaskInfo->code = pDataInfo->code;
      return NULL;
    }

L
Liu Jicong 已提交
2289
    SRetrieveTableRsp*   pRsp = pDataInfo->pRsp;
H
Haojun Liao 已提交
2290
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2291
    if (pRsp->numOfRows == 0) {
2292 2293
      qDebug("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d %d of total completed, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 " try next",
D
dapan1121 已提交
2294
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pExchangeInfo->current + 1,
H
Haojun Liao 已提交
2295
             pDataInfo->totalRows, pLoadInfo->totalRows);
H
Haojun Liao 已提交
2296

2297
      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2298
      pExchangeInfo->current += 1;
D
dapan1121 已提交
2299
      taosMemoryFreeClear(pDataInfo->pRsp);
2300 2301
      continue;
    }
H
Haojun Liao 已提交
2302

L
Liu Jicong 已提交
2303
    SSDataBlock*       pRes = pExchangeInfo->pResult;
H
Haojun Liao 已提交
2304
    SRetrieveTableRsp* pTableRsp = pDataInfo->pRsp;
L
Liu Jicong 已提交
2305
    int32_t            code =
2306
        extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pTableRsp->numOfRows, pTableRsp->data,
L
Liu Jicong 已提交
2307
                                     pTableRsp->compLen, pTableRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
2308 2309

    if (pRsp->completed == 1) {
D
dapan1121 已提交
2310
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, rowsOfSource:%" PRIu64
L
Liu Jicong 已提交
2311
             ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64 " try next %d/%" PRIzu,
2312 2313 2314
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, pExchangeInfo->current + 1,
             totalSources);
2315

2316
      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2317 2318
      pExchangeInfo->current += 1;
    } else {
D
dapan1121 已提交
2319
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
L
Liu Jicong 已提交
2320
             ", totalBytes:%" PRIu64,
2321 2322
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pLoadInfo->totalRows, pLoadInfo->totalSize);
2323 2324
    }

2325
    pOperator->resultInfo.totalRows += pRes->info.rows;
2326
    taosMemoryFreeClear(pDataInfo->pRsp);
2327 2328
    return pExchangeInfo->pResult;
  }
2329 2330
}

L
Liu Jicong 已提交
2331
static int32_t prepareLoadRemoteData(SOperatorInfo* pOperator) {
2332
  if (OPTR_IS_OPENED(pOperator)) {
H
Haojun Liao 已提交
2333 2334 2335
    return TSDB_CODE_SUCCESS;
  }

2336 2337
  int64_t st = taosGetTimestampUs();

L
Liu Jicong 已提交
2338
  SExchangeInfo* pExchangeInfo = pOperator->info;
2339
  if (!pExchangeInfo->seqLoadData) {
H
Haojun Liao 已提交
2340 2341 2342 2343 2344 2345
    int32_t code = prepareConcurrentlyLoad(pOperator);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }
  }

2346
  OPTR_SET_OPENED(pOperator);
2347
  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
H
Haojun Liao 已提交
2348 2349 2350
  return TSDB_CODE_SUCCESS;
}

2351
static SSDataBlock* doLoadRemoteDataImpl(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
2352 2353
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2354

2355
  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
2356
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
2357 2358
    return NULL;
  }
2359

L
Liu Jicong 已提交
2360
  size_t               totalSources = taosArrayGetSize(pExchangeInfo->pSources);
H
Haojun Liao 已提交
2361
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
H
Haojun Liao 已提交
2362

2363
  if (pOperator->status == OP_EXEC_DONE) {
L
Liu Jicong 已提交
2364 2365 2366
    qDebug("%s all %" PRIzu " source(s) are exhausted, total rows:%" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
           GET_TASKID(pTaskInfo), totalSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
           pLoadInfo->totalElapsed / 1000.0);
2367 2368 2369 2370 2371 2372
    return NULL;
  }

  if (pExchangeInfo->seqLoadData) {
    return seqLoadRemoteData(pOperator);
  } else {
2373
    return concurrentlyLoadRemoteDataImpl(pOperator, pExchangeInfo, pTaskInfo);
2374
  }
H
Haojun Liao 已提交
2375
}
2376

2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414
static SSDataBlock* doLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  while(1) {
    SSDataBlock* pBlock = doLoadRemoteDataImpl(pOperator);
    if (pBlock == NULL) {
      return NULL;
    }

    ASSERT(pBlock == pExchangeInfo->pResult);

    SLimitInfo* pLimitInfo = &pExchangeInfo->limitInfo;
    if (hasLimitOffsetInfo(pLimitInfo)) {
      int32_t status = handleLimitOffset(pOperator, pLimitInfo, pExchangeInfo->pResult, false);
      if (status == PROJECT_RETRIEVE_CONTINUE) {
        continue;
      } else if (status == PROJECT_RETRIEVE_DONE) {
        size_t rows = pExchangeInfo->pResult->info.rows;
        pExchangeInfo->limitInfo.numOfOutputRows += rows;

        if (rows == 0) {
          doSetOperatorCompleted(pOperator);
          return NULL;
        } else {
          return pExchangeInfo->pResult;
        }
      }
    } else {
      return pExchangeInfo->pResult;
    }
  }
}

2415
static int32_t initDataSource(int32_t numOfSources, SExchangeInfo* pInfo, const char* id) {
2416
  pInfo->pSourceDataInfo = taosArrayInit(numOfSources, sizeof(SSourceDataInfo));
H
Haojun Liao 已提交
2417 2418
  if (pInfo->pSourceDataInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
2419 2420
  }

L
Liu Jicong 已提交
2421
  for (int32_t i = 0; i < numOfSources; ++i) {
2422
    SSourceDataInfo dataInfo = {0};
H
Haojun Liao 已提交
2423
    dataInfo.status = EX_SOURCE_DATA_NOT_READY;
2424
    dataInfo.taskId = id;
L
Liu Jicong 已提交
2425
    dataInfo.index = i;
X
Xiaoyu Wang 已提交
2426
    SSourceDataInfo* pDs = taosArrayPush(pInfo->pSourceDataInfo, &dataInfo);
2427
    if (pDs == NULL) {
H
Haojun Liao 已提交
2428 2429 2430 2431 2432 2433 2434 2435
      taosArrayDestroy(pInfo->pSourceDataInfo);
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
}

2436
static int32_t initExchangeOperator(SExchangePhysiNode* pExNode, SExchangeInfo* pInfo, const char* id) {
2437
  size_t numOfSources = LIST_LENGTH(pExNode->pSrcEndPoints);
H
Haojun Liao 已提交
2438

2439
  if (numOfSources == 0) {
X
Xiaoyu Wang 已提交
2440
    qError("%s invalid number: %d of sources in exchange operator", id, (int32_t)numOfSources);
2441 2442 2443
    return TSDB_CODE_INVALID_PARA;
  }

H
Haojun Liao 已提交
2444
  pInfo->pSources = taosArrayInit(numOfSources, sizeof(SDownstreamSourceNode));
wmmhello's avatar
wmmhello 已提交
2445
  if (pInfo->pSources == NULL) {
2446
    return TSDB_CODE_OUT_OF_MEMORY;
H
Haojun Liao 已提交
2447 2448
  }

L
Liu Jicong 已提交
2449
  for (int32_t i = 0; i < numOfSources; ++i) {
D
dapan1121 已提交
2450
    SDownstreamSourceNode* pNode = (SDownstreamSourceNode*)nodesListGetNode((SNodeList*)pExNode->pSrcEndPoints, i);
H
Haojun Liao 已提交
2451 2452
    taosArrayPush(pInfo->pSources, pNode);
  }
2453

2454
  initLimitInfo(pExNode->node.pLimit, pExNode->node.pSlimit, &pInfo->limitInfo);
2455 2456
  pInfo->self = taosAddRef(exchangeObjRefPool, pInfo);

2457
  return initDataSource(numOfSources, pInfo, id);
2458 2459 2460 2461 2462 2463
}

SOperatorInfo* createExchangeOperatorInfo(void* pTransporter, SExchangePhysiNode* pExNode, SExecTaskInfo* pTaskInfo) {
  SExchangeInfo* pInfo = taosMemoryCalloc(1, sizeof(SExchangeInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
H
Haojun Liao 已提交
2464
    goto _error;
2465
  }
H
Haojun Liao 已提交
2466

2467
  int32_t code = initExchangeOperator(pExNode, pInfo, GET_TASKID(pTaskInfo));
2468 2469 2470
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
2471 2472

  tsem_init(&pInfo->ready, 0, 0);
2473

2474
  pInfo->seqLoadData = false;
2475
  pInfo->pTransporter = pTransporter;
2476 2477
  pInfo->pResult = createResDataBlock(pExNode->node.pOutputDataBlockDesc);
  pOperator->name = "ExchangeOperator";
X
Xiaoyu Wang 已提交
2478
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_EXCHANGE;
X
Xiaoyu Wang 已提交
2479
  pOperator->blocking = false;
2480 2481
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
2482
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pResult->pDataBlock);
X
Xiaoyu Wang 已提交
2483
  pOperator->pTaskInfo = pTaskInfo;
2484

L
Liu Jicong 已提交
2485 2486
  pOperator->fpSet = createOperatorFpSet(prepareLoadRemoteData, doLoadRemoteData, NULL, NULL,
                                         destroyExchangeOperatorInfo, NULL, NULL, NULL);
2487
  return pOperator;
H
Haojun Liao 已提交
2488

L
Liu Jicong 已提交
2489
_error:
H
Haojun Liao 已提交
2490
  if (pInfo != NULL) {
2491
    doDestroyExchangeOperatorInfo(pInfo);
H
Haojun Liao 已提交
2492 2493
  }

wafwerar's avatar
wafwerar 已提交
2494
  taosMemoryFreeClear(pOperator);
2495
  pTaskInfo->code = code;
H
Haojun Liao 已提交
2496
  return NULL;
2497 2498
}

dengyihao's avatar
dengyihao 已提交
2499 2500
static int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                                const char* pKey);
2501

2502
static void destroySortedMergeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
2503
  SSortedMergeOperatorInfo* pInfo = (SSortedMergeOperatorInfo*)param;
H
Haojun Liao 已提交
2504
  taosArrayDestroy(pInfo->pSortInfo);
2505 2506 2507
  taosArrayDestroy(pInfo->groupInfo);

  if (pInfo->pSortHandle != NULL) {
H
Haojun Liao 已提交
2508
    tsortDestroySortHandle(pInfo->pSortHandle);
2509 2510
  }

H
Haojun Liao 已提交
2511
  blockDataDestroy(pInfo->binfo.pRes);
H
Haojun Liao 已提交
2512
  cleanupAggSup(&pInfo->aggSup);
L
Liu Jicong 已提交
2513

D
dapan1121 已提交
2514
  taosMemoryFreeClear(param);
2515
}
H
Haojun Liao 已提交
2516

L
Liu Jicong 已提交
2517
static bool needToMerge(SSDataBlock* pBlock, SArray* groupInfo, char** buf, int32_t rowIndex) {
2518 2519 2520 2521
  size_t size = taosArrayGetSize(groupInfo);
  if (size == 0) {
    return true;
  }
2522

2523 2524
  for (int32_t i = 0; i < size; ++i) {
    int32_t* index = taosArrayGet(groupInfo, i);
2525

2526
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
L
Liu Jicong 已提交
2527
    bool             isNull = colDataIsNull(pColInfo, rowIndex, pBlock->info.rows, NULL);
2528

2529 2530 2531
    if ((isNull && buf[i] != NULL) || (!isNull && buf[i] == NULL)) {
      return false;
    }
2532

2533 2534 2535 2536 2537 2538 2539 2540 2541 2542 2543 2544 2545
    char* pCell = colDataGetData(pColInfo, rowIndex);
    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      if (varDataLen(pCell) != varDataLen(buf[i])) {
        return false;
      } else {
        if (memcmp(varDataVal(pCell), varDataVal(buf[i]), varDataLen(pCell)) != 0) {
          return false;
        }
      }
    } else {
      if (memcmp(pCell, buf[i], pColInfo->info.bytes) != 0) {
        return false;
      }
2546 2547 2548
    }
  }

2549
  return 0;
2550 2551
}

L
Liu Jicong 已提交
2552 2553 2554
static void doMergeResultImpl(SSortedMergeOperatorInfo* pInfo, SqlFunctionCtx* pCtx, int32_t numOfExpr,
                              int32_t rowIndex) {
  for (int32_t j = 0; j < numOfExpr; ++j) {  // TODO set row index
X
Xiaoyu Wang 已提交
2555
                                             //    pCtx[j].startRow = rowIndex;
2556 2557
  }

2558 2559
  for (int32_t j = 0; j < numOfExpr; ++j) {
    int32_t functionId = pCtx[j].functionId;
L
Liu Jicong 已提交
2560 2561 2562 2563 2564 2565 2566 2567 2568
    //    pCtx[j].fpSet->addInput(&pCtx[j]);

    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_MERGE);
    //    } else {
    //      assert(!TSDB_FUNC_IS_SCALAR(functionId));
    //      aAggs[functionId].mergeFunc(&pCtx[j]);
    //    }
2569
  }
2570
}
2571

L
Liu Jicong 已提交
2572 2573
static void doFinalizeResultImpl(SqlFunctionCtx* pCtx, int32_t numOfExpr) {
  for (int32_t j = 0; j < numOfExpr; ++j) {
2574 2575 2576 2577
    int32_t functionId = pCtx[j].functionId;
    //    if (functionId == FUNC_TAG_DUMMY || functionId == FUNC_TS_DUMMY) {
    //      continue;
    //    }
2578

2579 2580 2581 2582
    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_FINALIZE);
    //    } else {
dengyihao's avatar
dengyihao 已提交
2583
    //    pCtx[j].fpSet.finalize(&pCtx[j]);
2584 2585
  }
}
2586

2587
static bool saveCurrentTuple(char** rowColData, SArray* pColumnList, SSDataBlock* pBlock, int32_t rowIndex) {
L
Liu Jicong 已提交
2588
  int32_t size = (int32_t)taosArrayGetSize(pColumnList);
2589

L
Liu Jicong 已提交
2590 2591
  for (int32_t i = 0; i < size; ++i) {
    int32_t*         index = taosArrayGet(pColumnList, i);
2592
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
H
Haojun Liao 已提交
2593

2594 2595 2596
    char* data = colDataGetData(pColInfo, rowIndex);
    memcpy(rowColData[i], data, colDataGetLength(pColInfo, rowIndex));
  }
2597

2598 2599
  return true;
}
2600

2601 2602
static void doMergeImpl(SOperatorInfo* pOperator, int32_t numOfExpr, SSDataBlock* pBlock) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
2603

2604
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
2605

L
Liu Jicong 已提交
2606
  for (int32_t i = 0; i < pBlock->info.rows; ++i) {
2607 2608 2609 2610 2611 2612 2613 2614 2615
    if (!pInfo->hasGroupVal) {
      ASSERT(i == 0);
      doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
      pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, i);
    } else {
      if (needToMerge(pBlock, pInfo->groupInfo, pInfo->groupVal, i)) {
        doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
      } else {
        doFinalizeResultImpl(pCtx, numOfExpr);
2616 2617
        int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
        //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);
2618

2619
        // TODO check for available buffer;
H
Haojun Liao 已提交
2620

2621 2622 2623 2624 2625
        // next group info data
        pInfo->binfo.pRes->info.rows += numOfRows;
        for (int32_t j = 0; j < numOfExpr; ++j) {
          if (pCtx[j].functionId < 0) {
            continue;
2626
          }
2627

H
Haojun Liao 已提交
2628
          pCtx[j].fpSet.process(&pCtx[j]);
2629
        }
2630 2631 2632

        doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
        pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, i);
H
Haojun Liao 已提交
2633
      }
2634 2635 2636 2637
    }
  }
}

2638 2639
static SSDataBlock* doMerge(SOperatorInfo* pOperator) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
L
Liu Jicong 已提交
2640
  SSortHandle*              pHandle = pInfo->pSortHandle;
2641

2642
  SSDataBlock* pDataBlock = createOneDataBlock(pInfo->binfo.pRes, false);
2643
  blockDataEnsureCapacity(pDataBlock, pOperator->resultInfo.capacity);
2644

L
Liu Jicong 已提交
2645
  while (1) {
2646
    blockDataCleanup(pDataBlock);
2647
    while (1) {
H
Haojun Liao 已提交
2648
      STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
2649 2650
      if (pTupleHandle == NULL) {
        break;
2651
      }
2652

2653 2654
      // build datablock for merge for one group
      appendOneRowToDataBlock(pDataBlock, pTupleHandle);
2655
      if (pDataBlock->info.rows >= pOperator->resultInfo.capacity) {
2656 2657
        break;
      }
2658
    }
2659

2660 2661 2662
    if (pDataBlock->info.rows == 0) {
      break;
    }
2663

2664
    setInputDataBlock(pOperator, pOperator->exprSupp.pCtx, pDataBlock, TSDB_ORDER_ASC, MAIN_SCAN, true);
L
Liu Jicong 已提交
2665 2666
    //  updateOutputBuf(&pInfo->binfo, &pAggInfo->bufCapacity, pBlock->info.rows * pAggInfo->resultRowFactor,
    //  pOperator->pRuntimeEnv, true);
2667
    doMergeImpl(pOperator, pOperator->exprSupp.numOfExprs, pDataBlock);
2668 2669
    // flush to tuple store, and after all data have been handled, return to upstream node or sink node
  }
2670

2671 2672 2673
  doFinalizeResultImpl(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs);
  int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
  //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);
2674

2675
  // TODO check for available buffer;
2676

2677 2678
  // next group info data
  pInfo->binfo.pRes->info.rows += numOfRows;
L
Liu Jicong 已提交
2679
  return (pInfo->binfo.pRes->info.rows > 0) ? pInfo->binfo.pRes : NULL;
2680
}
2681

L
Liu Jicong 已提交
2682 2683
SSDataBlock* getSortedMergeBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity,
                                     SArray* pColMatchInfo, SSortedMergeOperatorInfo* pInfo) {
2684 2685 2686 2687 2688 2689 2690 2691 2692 2693
  blockDataCleanup(pDataBlock);

  SSDataBlock* p = tsortGetSortedDataBlock(pHandle);
  if (p == NULL) {
    return NULL;
  }

  blockDataEnsureCapacity(p, capacity);

  while (1) {
2694
    STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
2695 2696 2697 2698
    if (pTupleHandle == NULL) {
      break;
    }

2699
    appendOneRowToDataBlock(p, pTupleHandle);
2700 2701 2702 2703 2704 2705 2706 2707 2708 2709 2710 2711 2712
    if (p->info.rows >= capacity) {
      break;
    }
  }

  if (p->info.rows > 0) {
    int32_t numOfCols = taosArrayGetSize(pColMatchInfo);
    for (int32_t i = 0; i < numOfCols; ++i) {
      SColMatchInfo* pmInfo = taosArrayGet(pColMatchInfo, i);
      ASSERT(pmInfo->matchType == COL_MATCH_FROM_SLOT_ID);

      SColumnInfoData* pSrc = taosArrayGet(p->pDataBlock, pmInfo->srcSlotId);
      SColumnInfoData* pDst = taosArrayGet(pDataBlock->pDataBlock, pmInfo->targetSlotId);
2713
      colDataAssign(pDst, pSrc, p->info.rows, &pDataBlock->info);
2714 2715 2716 2717 2718 2719 2720 2721 2722 2723
    }

    pDataBlock->info.rows = p->info.rows;
    pDataBlock->info.capacity = p->info.rows;
  }

  blockDataDestroy(p);
  return (pDataBlock->info.rows > 0) ? pDataBlock : NULL;
}

2724
static SSDataBlock* doSortedMerge(SOperatorInfo* pOperator) {
2725 2726
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
2727 2728
  }

L
Liu Jicong 已提交
2729
  SExecTaskInfo*            pTaskInfo = pOperator->pTaskInfo;
2730
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
H
Haojun Liao 已提交
2731
  if (pOperator->status == OP_RES_TO_RETURN) {
2732
    return getSortedMergeBlockData(pInfo->pSortHandle, pInfo->binfo.pRes, pOperator->resultInfo.capacity, NULL, pInfo);
2733 2734
  }

2735
  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
L
Liu Jicong 已提交
2736 2737
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->binfo.pRes, "GET_TASKID(pTaskInfo)");
H
Haojun Liao 已提交
2738

2739
  tsortSetFetchRawDataFp(pInfo->pSortHandle, loadNextDataBlock, NULL, NULL);
2740

L
Liu Jicong 已提交
2741
  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
wmmhello's avatar
wmmhello 已提交
2742
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
H
Haojun Liao 已提交
2743
    ps->param = pOperator->pDownstream[i];
H
Haojun Liao 已提交
2744
    tsortAddSource(pInfo->pSortHandle, ps);
2745 2746
  }

H
Haojun Liao 已提交
2747
  int32_t code = tsortOpen(pInfo->pSortHandle);
2748
  if (code != TSDB_CODE_SUCCESS) {
2749
    longjmp(pTaskInfo->env, terrno);
2750 2751
  }

H
Haojun Liao 已提交
2752
  pOperator->status = OP_RES_TO_RETURN;
2753
  return doMerge(pOperator);
2754
}
2755

L
Liu Jicong 已提交
2756 2757
static int32_t initGroupCol(SExprInfo* pExprInfo, int32_t numOfCols, SArray* pGroupInfo,
                            SSortedMergeOperatorInfo* pInfo) {
2758 2759
  if (pGroupInfo == NULL || taosArrayGetSize(pGroupInfo) == 0) {
    return 0;
H
Haojun Liao 已提交
2760 2761
  }

2762 2763 2764 2765 2766 2767 2768 2769
  int32_t len = 0;
  SArray* plist = taosArrayInit(3, sizeof(SColumn));
  pInfo->groupInfo = taosArrayInit(3, sizeof(int32_t));

  if (plist == NULL || pInfo->groupInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

L
Liu Jicong 已提交
2770 2771
  size_t numOfGroupCol = taosArrayGetSize(pInfo->groupInfo);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
2772
    SColumn* pCol = taosArrayGet(pGroupInfo, i);
L
Liu Jicong 已提交
2773
    for (int32_t j = 0; j < numOfCols; ++j) {
H
Haojun Liao 已提交
2774
      SExprInfo* pe = &pExprInfo[j];
2775
      if (pe->base.resSchema.slotId == pCol->colId) {
2776 2777
        taosArrayPush(plist, pCol);
        taosArrayPush(pInfo->groupInfo, &j);
H
Haojun Liao 已提交
2778
        len += pCol->bytes;
2779 2780
        break;
      }
H
Haojun Liao 已提交
2781 2782 2783
    }
  }

2784
  ASSERT(taosArrayGetSize(pGroupInfo) == taosArrayGetSize(plist));
H
Haojun Liao 已提交
2785

wafwerar's avatar
wafwerar 已提交
2786
  pInfo->groupVal = taosMemoryCalloc(1, (POINTER_BYTES * numOfGroupCol + len));
2787 2788 2789 2790
  if (pInfo->groupVal == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }
H
Haojun Liao 已提交
2791

2792
  int32_t offset = 0;
L
Liu Jicong 已提交
2793 2794
  char*   start = (char*)(pInfo->groupVal + (POINTER_BYTES * numOfGroupCol));
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
2795 2796
    pInfo->groupVal[i] = start + offset;
    SColumn* pCol = taosArrayGet(plist, i);
H
Haojun Liao 已提交
2797
    offset += pCol->bytes;
2798
  }
H
Haojun Liao 已提交
2799

2800
  taosArrayDestroy(plist);
H
Haojun Liao 已提交
2801

2802 2803
  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2804

L
Liu Jicong 已提交
2805 2806 2807
SOperatorInfo* createSortedMergeOperatorInfo(SOperatorInfo** downstream, int32_t numOfDownstream, SExprInfo* pExprInfo,
                                             int32_t num, SArray* pSortInfo, SArray* pGroupInfo,
                                             SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
2808
  SSortedMergeOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SSortedMergeOperatorInfo));
L
Liu Jicong 已提交
2809
  SOperatorInfo*            pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
2810
  if (pInfo == NULL || pOperator == NULL) {
2811
    goto _error;
2812
  }
H
Haojun Liao 已提交
2813

2814 2815 2816 2817 2818
  int32_t code = initExprSupp(&pOperator->exprSupp, pExprInfo, num);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

2819
  initResultRowInfo(&pInfo->binfo.resultRowInfo);
H
Haojun Liao 已提交
2820

2821
  if (pOperator->exprSupp.pCtx == NULL || pInfo->binfo.pRes == NULL) {
2822 2823
    goto _error;
  }
H
Haojun Liao 已提交
2824

2825
  size_t keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
2826
  code = doInitAggInfoSup(&pInfo->aggSup, pOperator->exprSupp.pCtx, num, keyBufSize, pTaskInfo->id.str);
2827 2828 2829
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
H
Haojun Liao 已提交
2830

2831
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, num);
H
Haojun Liao 已提交
2832
  code = initGroupCol(pExprInfo, num, pGroupInfo, pInfo);
2833 2834 2835
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
H
Haojun Liao 已提交
2836

L
Liu Jicong 已提交
2837 2838 2839 2840 2841
  //  pInfo->resultRowFactor = (int32_t)(getRowNumForMultioutput(pRuntimeEnv->pQueryAttr,
  //      pRuntimeEnv->pQueryAttr->topBotQuery, false));
  pInfo->sortBufSize = 1024 * 16;  // 1MB
  pInfo->bufPageSize = 1024;
  pInfo->pSortInfo = pSortInfo;
H
Haojun Liao 已提交
2842

2843
  pOperator->resultInfo.capacity = blockDataGetCapacityInRow(pInfo->binfo.pRes, pInfo->bufPageSize);
H
Haojun Liao 已提交
2844

L
Liu Jicong 已提交
2845
  pOperator->name = "SortedMerge";
X
Xiaoyu Wang 已提交
2846
  // pOperator->operatorType = OP_SortedMerge;
2847 2848 2849
  pOperator->blocking = true;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
L
Liu Jicong 已提交
2850
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
2851

2852 2853
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doSortedMerge, NULL, NULL, destroySortedMergeOperatorInfo,
                                         NULL, NULL, NULL);
2854 2855 2856
  code = appendDownstream(pOperator, downstream, numOfDownstream);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
2857
  }
H
Haojun Liao 已提交
2858

2859
  return pOperator;
H
Haojun Liao 已提交
2860

L
Liu Jicong 已提交
2861
_error:
2862
  if (pInfo != NULL) {
H
Haojun Liao 已提交
2863
    destroySortedMergeOperatorInfo(pInfo, num);
H
Haojun Liao 已提交
2864 2865
  }

wafwerar's avatar
wafwerar 已提交
2866 2867
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
2868 2869
  terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
  return NULL;
H
Haojun Liao 已提交
2870 2871
}

X
Xiaoyu Wang 已提交
2872
int32_t getTableScanInfo(SOperatorInfo* pOperator, int32_t* order, int32_t* scanFlag) {
2873
  // todo add more information about exchange operation
2874
  int32_t type = pOperator->operatorType;
X
Xiaoyu Wang 已提交
2875
  if (type == QUERY_NODE_PHYSICAL_PLAN_EXCHANGE || type == QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN ||
2876
      type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN ||
2877
      type == QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN) {
2878 2879 2880
    *order = TSDB_ORDER_ASC;
    *scanFlag = MAIN_SCAN;
    return TSDB_CODE_SUCCESS;
2881
  } else if (type == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
2882 2883 2884 2885 2886
    STableScanInfo* pTableScanInfo = pOperator->info;
    *order = pTableScanInfo->cond.order;
    *scanFlag = pTableScanInfo->scanFlag;
    return TSDB_CODE_SUCCESS;
  } else {
H
Haojun Liao 已提交
2887
    if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
2888
      return TSDB_CODE_INVALID_PARA;
H
Haojun Liao 已提交
2889
    } else {
2890
      return getTableScanInfo(pOperator->pDownstream[0], order, scanFlag);
2891 2892 2893
    }
  }
}
L
Liu Jicong 已提交
2894
#if 0
L
Liu Jicong 已提交
2895
int32_t doPrepareScan(SOperatorInfo* pOperator, uint64_t uid, int64_t ts) {
L
Liu Jicong 已提交
2896
  uint8_t type = pOperator->operatorType;
2897 2898 2899

  pOperator->status = OP_OPENED;

L
Liu Jicong 已提交
2900
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
2901
    SStreamScanInfo* pScanInfo = pOperator->info;
L
Liu Jicong 已提交
2902
    pScanInfo->blockType = STREAM_INPUT__TABLE_SCAN;
2903

2904
    pScanInfo->pTableScanOp->status = OP_OPENED;
2905

2906
    STableScanInfo* pInfo = pScanInfo->pTableScanOp->info;
2907 2908
    ASSERT(pInfo->scanMode == TABLE_SCAN__TABLE_ORDER);

L
Liu Jicong 已提交
2909 2910 2911 2912
    if (uid == 0) {
      pInfo->noTable = 1;
      return TSDB_CODE_SUCCESS;
    }
2913 2914 2915 2916 2917 2918

    /*if (pSnapShotScanInfo->dataReader == NULL) {*/
    /*pSnapShotScanInfo->dataReader = tsdbReaderOpen(pHandle->vnode, &pSTInfo->cond, tableList, 0, 0);*/
    /*pSnapShotScanInfo->scanMode = TABLE_SCAN__TABLE_ORDER;*/
    /*}*/

L
Liu Jicong 已提交
2919 2920
    pInfo->noTable = 0;

2921
    if (pInfo->lastStatus.uid != uid || pInfo->lastStatus.ts != ts) {
L
Liu Jicong 已提交
2922 2923 2924 2925 2926 2927 2928 2929 2930 2931 2932
      SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

      int32_t tableSz = taosArrayGetSize(pTaskInfo->tableqinfoList.pTableList);
      bool    found = false;
      for (int32_t i = 0; i < tableSz; i++) {
        STableKeyInfo* pTableInfo = taosArrayGet(pTaskInfo->tableqinfoList.pTableList, i);
        if (pTableInfo->uid == uid) {
          found = true;
          pInfo->currentTable = i;
        }
      }
2933
      // TODO after processing drop, found can be false
L
Liu Jicong 已提交
2934
      ASSERT(found);
2935 2936

      tsdbSetTableId(pInfo->dataReader, uid);
H
Haojun Liao 已提交
2937 2938 2939 2940
      int64_t oldSkey = pInfo->cond.twindows.skey;
      pInfo->cond.twindows.skey = ts + 1;
      tsdbReaderReset(pInfo->dataReader, &pInfo->cond);
      pInfo->cond.twindows.skey = oldSkey;
2941 2942
      pInfo->scanTimes = 0;

S
Shengliang Guan 已提交
2943
      qDebug("tsdb reader offset seek to uid %" PRId64 " ts %" PRId64 ", table cur set to %d , all table num %d", uid, ts,
L
Liu Jicong 已提交
2944
             pInfo->currentTable, tableSz);
L
Liu Jicong 已提交
2945
    }
L
Liu Jicong 已提交
2946

L
Liu Jicong 已提交
2947
    return TSDB_CODE_SUCCESS;
2948

L
Liu Jicong 已提交
2949
  } else {
2950 2951 2952 2953 2954
    if (pOperator->numOfDownstream == 1) {
      return doPrepareScan(pOperator->pDownstream[0], uid, ts);
    } else if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator to set the input data block");
      return TSDB_CODE_QRY_APP_ERROR;
L
Liu Jicong 已提交
2955
    } else {
2956 2957
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
L
Liu Jicong 已提交
2958 2959 2960 2961
    }
  }
}

2962 2963 2964
int32_t doGetScanStatus(SOperatorInfo* pOperator, uint64_t* uid, int64_t* ts) {
  int32_t type = pOperator->operatorType;
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
2965 2966
    SStreamScanInfo* pScanInfo = pOperator->info;
    STableScanInfo*  pSnapShotScanInfo = pScanInfo->pTableScanOp->info;
L
Liu Jicong 已提交
2967 2968
    *uid = pSnapShotScanInfo->lastStatus.uid;
    *ts = pSnapShotScanInfo->lastStatus.ts;
2969 2970 2971 2972 2973 2974 2975 2976 2977 2978
  } else {
    if (pOperator->pDownstream[0] == NULL) {
      return TSDB_CODE_INVALID_PARA;
    } else {
      doGetScanStatus(pOperator->pDownstream[0], uid, ts);
    }
  }

  return TSDB_CODE_SUCCESS;
}
L
Liu Jicong 已提交
2979
#endif
2980

2981
// this is a blocking operator
L
Liu Jicong 已提交
2982
static int32_t doOpenAggregateOptr(SOperatorInfo* pOperator) {
H
Haojun Liao 已提交
2983 2984
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
2985 2986
  }

H
Haojun Liao 已提交
2987
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
2988
  SAggOperatorInfo* pAggInfo = pOperator->info;
H
Haojun Liao 已提交
2989

2990 2991
  SExprSupp*     pSup = &pOperator->exprSupp;
  SOperatorInfo* downstream = pOperator->pDownstream[0];
2992

2993 2994
  int64_t st = taosGetTimestampUs();

2995 2996 2997
  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;

H
Haojun Liao 已提交
2998
  while (1) {
2999
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
3000 3001 3002 3003
    if (pBlock == NULL) {
      break;
    }

3004 3005 3006 3007
    int32_t code = getTableScanInfo(pOperator, &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
3008

3009
    // there is an scalar expression that needs to be calculated before apply the group aggregation.
3010 3011 3012
    if (pAggInfo->scalarExprSup.pExprInfo != NULL) {
      SExprSupp* pSup1 = &pAggInfo->scalarExprSup;
      code = projectApplyFunctions(pSup1->pExprInfo, pBlock, pBlock, pSup1->pCtx, pSup1->numOfExprs, NULL);
3013
      if (code != TSDB_CODE_SUCCESS) {
3014
        longjmp(pTaskInfo->env, code);
3015
      }
3016 3017
    }

3018
    // the pDataBlock are always the same one, no need to call this again
3019 3020
    setExecutionContext(pOperator, pOperator->exprSupp.numOfExprs, pBlock->info.groupId, pAggInfo);
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, true);
3021
    code = doAggregateImpl(pOperator, pSup->pCtx);
3022 3023 3024
    if (code != 0) {
      longjmp(pTaskInfo->env, code);
    }
3025 3026
  }

H
Haojun Liao 已提交
3027
  closeAllResultRows(&pAggInfo->binfo.resultRowInfo);
3028
  initGroupedResultInfo(&pAggInfo->groupResInfo, pAggInfo->aggSup.pResultRowHashTable, 0);
H
Haojun Liao 已提交
3029
  OPTR_SET_OPENED(pOperator);
3030

3031
  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
H
Haojun Liao 已提交
3032 3033 3034
  return TSDB_CODE_SUCCESS;
}

3035
static SSDataBlock* getAggregateResult(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
3036
  SAggOperatorInfo* pAggInfo = pOperator->info;
H
Haojun Liao 已提交
3037 3038 3039 3040 3041 3042
  SOptrBasicInfo*   pInfo = &pAggInfo->binfo;

  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

L
Liu Jicong 已提交
3043
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
3044
  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
H
Haojun Liao 已提交
3045
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
3046
    doSetOperatorCompleted(pOperator);
H
Haojun Liao 已提交
3047 3048 3049
    return NULL;
  }

H
Haojun Liao 已提交
3050
  blockDataEnsureCapacity(pInfo->pRes, pOperator->resultInfo.capacity);
S
slzhou 已提交
3051 3052 3053 3054 3055 3056 3057 3058
  while (1) {
    doBuildResultDatablock(pOperator, pInfo, &pAggInfo->groupResInfo, pAggInfo->aggSup.pResultBuf);
    doFilter(pAggInfo->pCondition, pInfo->pRes);

    if (!hasDataInGroupInfo(&pAggInfo->groupResInfo)) {
      doSetOperatorCompleted(pOperator);
      break;
    }
3059

S
slzhou 已提交
3060 3061 3062 3063
    if (pInfo->pRes->info.rows > 0) {
      break;
    }
  }
3064
  size_t rows = blockDataGetNumOfRows(pInfo->pRes);
3065 3066
  pOperator->resultInfo.totalRows += rows;

3067
  return (rows == 0) ? NULL : pInfo->pRes;
3068 3069
}

wmmhello's avatar
wmmhello 已提交
3070
int32_t aggEncodeResultRow(SOperatorInfo* pOperator, char** result, int32_t* length) {
3071
  if (result == NULL || length == NULL) {
wmmhello's avatar
wmmhello 已提交
3072 3073 3074
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
3075 3076 3077 3078 3079
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
  int32_t         size = taosHashGetSize(pSup->pResultRowHashTable);
  size_t          keyLen = sizeof(uint64_t) * 2;  // estimate the key length
  int32_t         totalSize =
      sizeof(int32_t) + sizeof(int32_t) + size * (sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize);
wmmhello's avatar
wmmhello 已提交
3080

C
Cary Xu 已提交
3081 3082 3083 3084 3085 3086
  // no result
  if (getTotalBufSize(pSup->pResultBuf) == 0) {
    *result = NULL;
    *length = 0;
    return TSDB_CODE_SUCCESS;
  }
3087

wmmhello's avatar
wmmhello 已提交
3088
  *result = (char*)taosMemoryCalloc(1, totalSize);
L
Liu Jicong 已提交
3089
  if (*result == NULL) {
wmmhello's avatar
wmmhello 已提交
3090
    return TSDB_CODE_OUT_OF_MEMORY;
wmmhello's avatar
wmmhello 已提交
3091
  }
wmmhello's avatar
wmmhello 已提交
3092

wmmhello's avatar
wmmhello 已提交
3093
  int32_t offset = sizeof(int32_t);
wmmhello's avatar
wmmhello 已提交
3094 3095
  *(int32_t*)(*result + offset) = size;
  offset += sizeof(int32_t);
3096 3097

  // prepare memory
3098
  SResultRowPosition* pos = &pInfo->resultRowInfo.cur;
dengyihao's avatar
dengyihao 已提交
3099 3100
  void*               pPage = getBufPage(pSup->pResultBuf, pos->pageId);
  SResultRow*         pRow = (SResultRow*)((char*)pPage + pos->offset);
3101 3102 3103
  setBufPageDirty(pPage, true);
  releaseBufPage(pSup->pResultBuf, pPage);

dengyihao's avatar
dengyihao 已提交
3104
  void* pIter = taosHashIterate(pSup->pResultRowHashTable, NULL);
wmmhello's avatar
wmmhello 已提交
3105
  while (pIter) {
dengyihao's avatar
dengyihao 已提交
3106
    void*               key = taosHashGetKey(pIter, &keyLen);
3107
    SResultRowPosition* p1 = (SResultRowPosition*)pIter;
3108

dengyihao's avatar
dengyihao 已提交
3109
    pPage = (SFilePage*)getBufPage(pSup->pResultBuf, p1->pageId);
3110
    pRow = (SResultRow*)((char*)pPage + p1->offset);
3111 3112
    setBufPageDirty(pPage, true);
    releaseBufPage(pSup->pResultBuf, pPage);
wmmhello's avatar
wmmhello 已提交
3113 3114 3115

    // recalculate the result size
    int32_t realTotalSize = offset + sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize;
L
Liu Jicong 已提交
3116
    if (realTotalSize > totalSize) {
wmmhello's avatar
wmmhello 已提交
3117
      char* tmp = (char*)taosMemoryRealloc(*result, realTotalSize);
L
Liu Jicong 已提交
3118
      if (tmp == NULL) {
wafwerar's avatar
wafwerar 已提交
3119
        taosMemoryFree(*result);
wmmhello's avatar
wmmhello 已提交
3120
        *result = NULL;
wmmhello's avatar
wmmhello 已提交
3121
        return TSDB_CODE_OUT_OF_MEMORY;
L
Liu Jicong 已提交
3122
      } else {
wmmhello's avatar
wmmhello 已提交
3123 3124 3125 3126 3127 3128 3129 3130 3131 3132 3133 3134
        *result = tmp;
      }
    }
    // save key
    *(int32_t*)(*result + offset) = keyLen;
    offset += sizeof(int32_t);
    memcpy(*result + offset, key, keyLen);
    offset += keyLen;

    // save value
    *(int32_t*)(*result + offset) = pSup->resultRowSize;
    offset += sizeof(int32_t);
3135
    memcpy(*result + offset, pRow, pSup->resultRowSize);
wmmhello's avatar
wmmhello 已提交
3136 3137 3138 3139 3140
    offset += pSup->resultRowSize;

    pIter = taosHashIterate(pSup->pResultRowHashTable, pIter);
  }

wmmhello's avatar
wmmhello 已提交
3141 3142 3143 3144
  *(int32_t*)(*result) = offset;
  *length = offset;

  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
3145 3146
}

3147
int32_t aggDecodeResultRow(SOperatorInfo* pOperator, char* result) {
3148
  if (result == NULL) {
wmmhello's avatar
wmmhello 已提交
3149
    return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3150
  }
wmmhello's avatar
wmmhello 已提交
3151
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
3152
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
wmmhello's avatar
wmmhello 已提交
3153 3154

  //  int32_t size = taosHashGetSize(pSup->pResultRowHashTable);
3155
  int32_t length = *(int32_t*)(result);
wmmhello's avatar
wmmhello 已提交
3156
  int32_t offset = sizeof(int32_t);
3157 3158 3159 3160

  int32_t count = *(int32_t*)(result + offset);
  offset += sizeof(int32_t);

L
Liu Jicong 已提交
3161
  while (count-- > 0 && length > offset) {
wmmhello's avatar
wmmhello 已提交
3162 3163 3164
    int32_t keyLen = *(int32_t*)(result + offset);
    offset += sizeof(int32_t);

L
Liu Jicong 已提交
3165
    uint64_t    tableGroupId = *(uint64_t*)(result + offset);
3166
    SResultRow* resultRow = getNewResultRow(pSup->pResultBuf, tableGroupId, pSup->resultRowSize);
L
Liu Jicong 已提交
3167
    if (!resultRow) {
wmmhello's avatar
wmmhello 已提交
3168
      return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3169
    }
3170

wmmhello's avatar
wmmhello 已提交
3171
    // add a new result set for a new group
3172 3173
    SResultRowPosition pos = {.pageId = resultRow->pageId, .offset = resultRow->offset};
    taosHashPut(pSup->pResultRowHashTable, result + offset, keyLen, &pos, sizeof(SResultRowPosition));
wmmhello's avatar
wmmhello 已提交
3174 3175 3176

    offset += keyLen;
    int32_t valueLen = *(int32_t*)(result + offset);
L
Liu Jicong 已提交
3177
    if (valueLen != pSup->resultRowSize) {
wmmhello's avatar
wmmhello 已提交
3178
      return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3179 3180 3181 3182 3183 3184 3185 3186 3187 3188
    }
    offset += sizeof(int32_t);
    int32_t pageId = resultRow->pageId;
    int32_t pOffset = resultRow->offset;
    memcpy(resultRow, result + offset, valueLen);
    resultRow->pageId = pageId;
    resultRow->offset = pOffset;
    offset += valueLen;

    initResultRow(resultRow);
dengyihao's avatar
dengyihao 已提交
3189
    pInfo->resultRowInfo.cur = (SResultRowPosition){.pageId = resultRow->pageId, .offset = resultRow->offset};
wmmhello's avatar
wmmhello 已提交
3190 3191
  }

L
Liu Jicong 已提交
3192
  if (offset != length) {
wmmhello's avatar
wmmhello 已提交
3193
    return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3194
  }
wmmhello's avatar
wmmhello 已提交
3195
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
3196 3197
}

3198 3199 3200 3201 3202
int32_t handleLimitOffset(SOperatorInfo* pOperator, SLimitInfo* pLimitInfo, SSDataBlock* pBlock, bool holdDataInBuf) {
  if (pLimitInfo->remainGroupOffset > 0) {
    if (pLimitInfo->currentGroupId == 0) {  // it is the first group
      pLimitInfo->currentGroupId = pBlock->info.groupId;
      blockDataCleanup(pBlock);
3203
      return PROJECT_RETRIEVE_CONTINUE;
3204 3205 3206
    } else if (pLimitInfo->currentGroupId != pBlock->info.groupId) {
      // now it is the data from a new group
      pLimitInfo->remainGroupOffset -= 1;
3207 3208

      // ignore data block in current group
3209 3210
      if (pLimitInfo->remainGroupOffset > 0) {
        blockDataCleanup(pBlock);
3211 3212 3213 3214 3215
        return PROJECT_RETRIEVE_CONTINUE;
      }
    }

    // set current group id of the project operator
3216
    pLimitInfo->currentGroupId = pBlock->info.groupId;
3217 3218
  }

3219 3220 3221
  if (pLimitInfo->currentGroupId != 0 && pLimitInfo->currentGroupId != pBlock->info.groupId) {
    pLimitInfo->numOfOutputGroups += 1;
    if ((pLimitInfo->slimit.limit > 0) && (pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups)) {
3222
      pOperator->status = OP_EXEC_DONE;
3223
      blockDataCleanup(pBlock);
3224 3225 3226 3227 3228

      return PROJECT_RETRIEVE_DONE;
    }

    // reset the value for a new group data
3229 3230
    pLimitInfo->numOfOutputRows = 0;
    pLimitInfo->remainOffset = pLimitInfo->limit.offset;
3231 3232 3233 3234 3235
  }

  // here we reach the start position, according to the limit/offset requirements.

  // set current group id
3236
  pLimitInfo->currentGroupId = pBlock->info.groupId;
3237

3238 3239 3240
  if (pLimitInfo->remainOffset >= pBlock->info.rows) {
    pLimitInfo->remainOffset -= pBlock->info.rows;
    blockDataCleanup(pBlock);
3241
    return PROJECT_RETRIEVE_CONTINUE;
3242 3243 3244
  } else if (pLimitInfo->remainOffset < pBlock->info.rows && pLimitInfo->remainOffset > 0) {
    blockDataTrimFirstNRows(pBlock, pLimitInfo->remainOffset);
    pLimitInfo->remainOffset = 0;
3245 3246
  }

3247
  // check for the limitation in each group
3248 3249 3250 3251
  if (pLimitInfo->limit.limit >= 0 && pLimitInfo->numOfOutputRows + pBlock->info.rows >= pLimitInfo->limit.limit) {
    int32_t keepRows = (int32_t)(pLimitInfo->limit.limit - pLimitInfo->numOfOutputRows);
    blockDataKeepFirstNRows(pBlock, keepRows);
    if (pLimitInfo->slimit.limit > 0 && pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups) {
3252 3253 3254
      pOperator->status = OP_EXEC_DONE;
    }

3255
    return PROJECT_RETRIEVE_DONE;
3256
  }
3257

3258
  // todo optimize performance
3259 3260
  // If there are slimit/soffset value exists, multi-round result can not be packed into one group, since the
  // they may not belong to the same group the limit/offset value is not valid in this case.
3261 3262
  if ((!holdDataInBuf) || (pBlock->info.rows >= pOperator->resultInfo.threshold) || pLimitInfo->slimit.offset != -1 ||
      pLimitInfo->slimit.limit != -1) {
3263
    return PROJECT_RETRIEVE_DONE;
L
Liu Jicong 已提交
3264
  } else {  // not full enough, continue to accumulate the output data in the buffer.
3265 3266 3267 3268
    return PROJECT_RETRIEVE_CONTINUE;
  }
}

3269
static SSDataBlock* doProjectOperation(SOperatorInfo* pOperator) {
3270
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
L
Liu Jicong 已提交
3271
  SOptrBasicInfo*       pInfo = &pProjectInfo->binfo;
3272

L
Liu Jicong 已提交
3273
  SExprSupp*   pSup = &pOperator->exprSupp;
3274
  SSDataBlock* pRes = pInfo->pRes;
3275
  blockDataCleanup(pRes);
3276

3277
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
3278
  if (pOperator->status == OP_EXEC_DONE) {
L
Liu Jicong 已提交
3279 3280 3281 3282
    if (pTaskInfo->execModel == OPTR_EXEC_MODEL_QUEUE) {
      pOperator->status = OP_OPENED;
      return NULL;
    }
3283 3284
    return NULL;
  }
dengyihao's avatar
dengyihao 已提交
3285

H
Haojun Liao 已提交
3286
#if 0
3287 3288 3289 3290 3291
  if (pProjectInfo->existDataBlock) {  // TODO refactor
    SSDataBlock* pBlock = pProjectInfo->existDataBlock;
    pProjectInfo->existDataBlock = NULL;

    // the pDataBlock are always the same one, no need to call this again
H
Haojun Liao 已提交
3292
    setInputDataBlock(pOperator, pInfo->pCtx, pBlock, TSDB_ORDER_ASC);
3293

H
Haojun Liao 已提交
3294
    blockDataEnsureCapacity(pInfo->pRes, pBlock->info.rows);
3295
    projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
L
Liu Jicong 已提交
3296
    if (pRes->info.rows >= pProjectInfo->binfo.capacity * 0.8) {
3297 3298
      copyTsColoum(pRes, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      resetResultRowEntryResult(pInfo->pCtx, pOperator->exprSupp.numOfExprs);
3299 3300 3301
      return pRes;
    }
  }
H
Haojun Liao 已提交
3302
#endif
3303

3304
  int64_t st = 0;
3305 3306 3307
  int32_t order = 0;
  int32_t scanFlag = 0;

3308 3309 3310 3311
  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

H
Haojun Liao 已提交
3312 3313
  SOperatorInfo* downstream = pOperator->pDownstream[0];

L
Liu Jicong 已提交
3314
  while (1) {
H
Haojun Liao 已提交
3315
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
L
Liu Jicong 已提交
3316
    qDebug("projection call next");
3317
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
3318
    if (pBlock == NULL) {
L
Liu Jicong 已提交
3319 3320 3321
      qDebug("projection get null");

      /*if (pTaskInfo->execModel == OPTR_EXEC_MODEL_BATCH) {*/
3322
      doSetOperatorCompleted(pOperator);
L
Liu Jicong 已提交
3323 3324
      /*} else if (pTaskInfo->execModel == OPTR_EXEC_MODEL_QUEUE) {*/
      /*pOperator->status = OP_RES_TO_RETURN;*/
L
Liu Jicong 已提交
3325
      /*}*/
3326 3327
      break;
    }
3328 3329 3330 3331
    if (pBlock->info.type == STREAM_RETRIEVE) {
      // for stream interval
      return pBlock;
    }
3332 3333

    // the pDataBlock are always the same one, no need to call this again
3334
    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &order, &scanFlag);
3335 3336 3337
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
3338

3339
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
3340 3341
    blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

3342
    code = projectApplyFunctions(pSup->pExprInfo, pInfo->pRes, pBlock, pSup->pCtx, pSup->numOfExprs,
X
Xiaoyu Wang 已提交
3343
                                 pProjectInfo->pPseudoColInfo);
3344 3345
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
3346 3347
    }

3348
    int32_t status = handleLimitOffset(pOperator, &pProjectInfo->limitInfo, pInfo->pRes, true);
3349 3350 3351 3352

    // filter shall be applied after apply functions and limit/offset on the result
    doFilter(pProjectInfo->pFilterNode, pInfo->pRes);

3353
    if (status == PROJECT_RETRIEVE_CONTINUE) {
H
Haojun Liao 已提交
3354
      continue;
L
Liu Jicong 已提交
3355
    } else if (status == PROJECT_RETRIEVE_DONE) {
3356 3357 3358
      break;
    }
  }
dengyihao's avatar
dengyihao 已提交
3359

3360
  size_t rows = pInfo->pRes->info.rows;
3361 3362
  pProjectInfo->limitInfo.numOfOutputRows += rows;

3363 3364 3365
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
3366
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
3367 3368
  }

3369
  return (rows > 0) ? pInfo->pRes : NULL;
3370 3371
}

H
Haojun Liao 已提交
3372
static void doHandleRemainBlockForNewGroupImpl(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo,
L
Liu Jicong 已提交
3373
                                               SExecTaskInfo* pTaskInfo) {
3374
  pInfo->totalInputRows = pInfo->existNewGroupBlock->info.rows;
H
Haojun Liao 已提交
3375

L
Liu Jicong 已提交
3376 3377
  int64_t ekey =
      Q_STATUS_EQUAL(pTaskInfo->status, TASK_COMPLETED) ? pInfo->win.ekey : pInfo->existNewGroupBlock->info.window.ekey;
3378 3379
  taosResetFillInfo(pInfo->pFillInfo, getFillInfoStart(pInfo->pFillInfo));

3380
  taosFillSetStartInfo(pInfo->pFillInfo, pInfo->existNewGroupBlock->info.rows, ekey);
3381 3382
  taosFillSetInputDataBlock(pInfo->pFillInfo, pInfo->existNewGroupBlock);

H
Haojun Liao 已提交
3383 3384 3385
  int32_t numOfResultRows = pResultInfo->capacity - pInfo->pRes->info.rows;
  taosFillResultDataBlock(pInfo->pFillInfo, pInfo->pRes, numOfResultRows);

3386
  pInfo->curGroupId = pInfo->existNewGroupBlock->info.groupId;
3387 3388 3389
  pInfo->existNewGroupBlock = NULL;
}

H
Haojun Liao 已提交
3390
static void doHandleRemainBlockFromNewGroup(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo,
L
Liu Jicong 已提交
3391
                                            SExecTaskInfo* pTaskInfo) {
3392
  if (taosFillHasMoreResults(pInfo->pFillInfo)) {
H
Haojun Liao 已提交
3393 3394 3395
    int32_t numOfResultRows = pResultInfo->capacity - pInfo->pRes->info.rows;
    taosFillResultDataBlock(pInfo->pFillInfo, pInfo->pRes, numOfResultRows);
    if (pInfo->pRes->info.rows > pResultInfo->threshold) {
3396 3397 3398 3399 3400 3401
      return;
    }
  }

  // handle the cached new group data block
  if (pInfo->existNewGroupBlock) {
H
Haojun Liao 已提交
3402
    doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, pTaskInfo);
3403 3404 3405
  }
}

S
slzhou 已提交
3406
static SSDataBlock* doFillImpl(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
3407 3408
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;
3409

H
Haojun Liao 已提交
3410
  SResultInfo* pResultInfo = &pOperator->resultInfo;
3411 3412 3413
  SSDataBlock* pResBlock = pInfo->pRes;

  blockDataCleanup(pResBlock);
3414

H
Haojun Liao 已提交
3415 3416
  doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, pTaskInfo);
  if (pResBlock->info.rows > pResultInfo->threshold || pResBlock->info.rows > 0) {
3417
    return pResBlock;
H
Haojun Liao 已提交
3418
  }
3419

H
Haojun Liao 已提交
3420
  SOperatorInfo* pDownstream = pOperator->pDownstream[0];
L
Liu Jicong 已提交
3421
  while (1) {
3422
    SSDataBlock* pBlock = pDownstream->fpSet.getNextFn(pDownstream);
3423 3424 3425 3426 3427
    if (pBlock == NULL) {
      if (pInfo->totalInputRows == 0) {
        pOperator->status = OP_EXEC_DONE;
        return NULL;
      }
3428

3429
      taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
3430
    } else {
3431 3432 3433 3434
      blockDataUpdateTsWindow(pBlock, pInfo->primaryTsCol);

      if (pInfo->curGroupId == 0 || pInfo->curGroupId == pBlock->info.groupId) {
        pInfo->curGroupId = pBlock->info.groupId;   // the first data block
3435 3436

        pInfo->totalInputRows += pBlock->info.rows;
3437

3438 3439
        taosFillSetStartInfo(pInfo->pFillInfo, pBlock->info.rows, pBlock->info.window.ekey);
        taosFillSetInputDataBlock(pInfo->pFillInfo, pBlock);
3440 3441 3442 3443 3444 3445
      } else if (pInfo->curGroupId != pBlock->info.groupId) { // the new group data block
        pInfo->existNewGroupBlock = pBlock;

        // Fill the previous group data block, before handle the data block of new group.
        // Close the fill operation for previous group data block
        taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
3446 3447 3448
      }
    }

3449
    blockDataEnsureCapacity(pResBlock, pOperator->resultInfo.capacity);
H
Haojun Liao 已提交
3450

3451 3452
    int32_t numOfResultRows = pOperator->resultInfo.capacity - pResBlock->info.rows;
    taosFillResultDataBlock(pInfo->pFillInfo, pResBlock, numOfResultRows);
3453 3454

    // current group has no more result to return
3455
    if (pResBlock->info.rows > 0) {
3456 3457
      // 1. The result in current group not reach the threshold of output result, continue
      // 2. If multiple group results existing in one SSDataBlock is not allowed, return immediately
3458
      if (pResBlock->info.rows > pResultInfo->threshold || pBlock == NULL || pInfo->existNewGroupBlock != NULL) {
3459
        return pResBlock;
3460 3461
      }

H
Haojun Liao 已提交
3462
      doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, pTaskInfo);
3463
      if (pResBlock->info.rows >= pOperator->resultInfo.threshold || pBlock == NULL) {
3464
        return pResBlock;
3465 3466 3467
      }
    } else if (pInfo->existNewGroupBlock) {  // try next group
      assert(pBlock != NULL);
H
Haojun Liao 已提交
3468
      doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, pTaskInfo);
3469 3470
      if (pResBlock->info.rows > pResultInfo->threshold) {
        return pResBlock;
3471 3472 3473 3474 3475 3476 3477
      }
    } else {
      return NULL;
    }
  }
}

S
slzhou 已提交
3478 3479 3480 3481 3482 3483 3484 3485
static SSDataBlock* doFill(SOperatorInfo* pOperator) {
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;

  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

S
slzhou 已提交
3486
  SSDataBlock* fillResult = NULL;
S
slzhou 已提交
3487
  while (true) {
S
slzhou 已提交
3488
    fillResult = doFillImpl(pOperator);
S
slzhou 已提交
3489 3490 3491 3492 3493 3494 3495 3496 3497 3498 3499 3500 3501 3502
    if (fillResult != NULL) {
      doFilter(pInfo->pCondition, fillResult);
    }

    if (fillResult == NULL) {
      doSetOperatorCompleted(pOperator);
      break;
    }

    if (fillResult->info.rows > 0) {
      break;
    }
  }

S
slzhou 已提交
3503 3504 3505 3506
  if (fillResult != NULL) {
    size_t rows = fillResult->info.rows;
    pOperator->resultInfo.totalRows += rows;
  }
S
slzhou 已提交
3507

S
slzhou 已提交
3508
  return fillResult;
S
slzhou 已提交
3509 3510
}

H
Haojun Liao 已提交
3511 3512 3513
static void destroyExprInfo(SExprInfo* pExpr, int32_t numOfExprs) {
  for (int32_t i = 0; i < numOfExprs; ++i) {
    SExprInfo* pExprInfo = &pExpr[i];
H
Haojun Liao 已提交
3514 3515 3516 3517
    for(int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
      if (pExprInfo->base.pParam[j].type == FUNC_PARAM_TYPE_COLUMN) {
        taosMemoryFreeClear(pExprInfo->base.pParam[j].pCol);
      }
H
Haojun Liao 已提交
3518
    }
H
Haojun Liao 已提交
3519

H
Haojun Liao 已提交
3520
    taosMemoryFree(pExprInfo->base.pParam);
H
Haojun Liao 已提交
3521 3522 3523 3524
    taosMemoryFree(pExprInfo->pExpr);
  }
}

3525 3526 3527 3528 3529
static void destroyOperatorInfo(SOperatorInfo* pOperator) {
  if (pOperator == NULL) {
    return;
  }

3530
  if (pOperator->fpSet.closeFn != NULL) {
3531
    pOperator->fpSet.closeFn(pOperator->info, pOperator->exprSupp.numOfExprs);
3532 3533
  }

H
Haojun Liao 已提交
3534
  if (pOperator->pDownstream != NULL) {
L
Liu Jicong 已提交
3535
    for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
H
Haojun Liao 已提交
3536
      destroyOperatorInfo(pOperator->pDownstream[i]);
3537 3538
    }

wafwerar's avatar
wafwerar 已提交
3539
    taosMemoryFreeClear(pOperator->pDownstream);
H
Haojun Liao 已提交
3540
    pOperator->numOfDownstream = 0;
3541 3542
  }

3543
  cleanupExprSupp(&pOperator->exprSupp);
wafwerar's avatar
wafwerar 已提交
3544
  taosMemoryFreeClear(pOperator);
3545 3546
}

3547 3548 3549 3550 3551 3552 3553 3554 3555 3556 3557 3558 3559 3560 3561
int32_t getBufferPgSize(int32_t rowSize, uint32_t* defaultPgsz, uint32_t* defaultBufsz) {
  *defaultPgsz = 4096;
  while (*defaultPgsz < rowSize * 4) {
    *defaultPgsz <<= 1u;
  }

  // at least four pages need to be in buffer
  *defaultBufsz = 4096 * 256;
  if ((*defaultBufsz) <= (*defaultPgsz)) {
    (*defaultBufsz) = (*defaultPgsz) * 4;
  }

  return 0;
}

dengyihao's avatar
dengyihao 已提交
3562 3563
int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                         const char* pKey) {
3564 3565
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);

dengyihao's avatar
dengyihao 已提交
3566 3567
  pAggSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pAggSup->keyBuf = taosMemoryCalloc(1, keyBufSize + POINTER_BYTES + sizeof(int64_t));
3568 3569
  pAggSup->pResultRowHashTable = taosHashInit(10, hashFn, true, HASH_NO_LOCK);

H
Haojun Liao 已提交
3570
  if (pAggSup->keyBuf == NULL || pAggSup->pResultRowHashTable == NULL) {
3571 3572 3573
    return TSDB_CODE_OUT_OF_MEMORY;
  }

dengyihao's avatar
dengyihao 已提交
3574
  uint32_t defaultPgsz = 0;
3575 3576
  uint32_t defaultBufsz = 0;
  getBufferPgSize(pAggSup->resultRowSize, &defaultPgsz, &defaultBufsz);
H
Haojun Liao 已提交
3577

3578
  int32_t code = createDiskbasedBuf(&pAggSup->pResultBuf, defaultPgsz, defaultBufsz, pKey, TD_TMP_DIR_PATH);
H
Haojun Liao 已提交
3579 3580 3581 3582
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

3583 3584 3585
  return TSDB_CODE_SUCCESS;
}

3586
void cleanupAggSup(SAggSupporter* pAggSup) {
wafwerar's avatar
wafwerar 已提交
3587
  taosMemoryFreeClear(pAggSup->keyBuf);
3588
  taosHashCleanup(pAggSup->pResultRowHashTable);
H
Haojun Liao 已提交
3589
  destroyDiskbasedBuf(pAggSup->pResultBuf);
3590 3591
}

L
Liu Jicong 已提交
3592 3593
int32_t initAggInfo(SExprSupp* pSup, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols, size_t keyBufSize,
                    const char* pkey) {
3594 3595 3596 3597 3598
  int32_t code = initExprSupp(pSup, pExprInfo, numOfCols);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

3599
  doInitAggInfoSup(pAggSup, pSup->pCtx, numOfCols, keyBufSize, pkey);
L
Liu Jicong 已提交
3600
  for (int32_t i = 0; i < numOfCols; ++i) {
3601
    pSup->pCtx[i].pBuf = pAggSup->pResultBuf;
3602 3603
  }

3604
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
3605 3606
}

3607
void initResultSizeInfo(SOperatorInfo* pOperator, int32_t numOfRows) {
wmmhello's avatar
wmmhello 已提交
3608
  ASSERT(numOfRows != 0);
3609 3610 3611 3612
  pOperator->resultInfo.capacity = numOfRows;
  pOperator->resultInfo.threshold = numOfRows * 0.75;

  if (pOperator->resultInfo.threshold == 0) {
wmmhello's avatar
wmmhello 已提交
3613
    pOperator->resultInfo.threshold = numOfRows;
3614 3615 3616
  }
}

3617 3618 3619 3620 3621
void initBasicInfo(SOptrBasicInfo* pInfo, SSDataBlock* pBlock) {
  pInfo->pRes = pBlock;
  initResultRowInfo(&pInfo->resultRowInfo);
}

3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634 3635 3636 3637 3638 3639 3640
static void* destroySqlFunctionCtx(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  if (pCtx == NULL) {
    return NULL;
  }

  for (int32_t i = 0; i < numOfOutput; ++i) {
    for (int32_t j = 0; j < pCtx[i].numOfParams; ++j) {
      taosVariantDestroy(&pCtx[i].param[j].param);
    }

    taosMemoryFreeClear(pCtx[i].subsidiaries.pCtx);
    taosMemoryFree(pCtx[i].input.pData);
    taosMemoryFree(pCtx[i].input.pColumnDataAgg);
  }

  taosMemoryFreeClear(pCtx);
  return NULL;
}

3641
int32_t initExprSupp(SExprSupp* pSup, SExprInfo* pExprInfo, int32_t numOfExpr) {
3642 3643 3644 3645
  pSup->pExprInfo = pExprInfo;
  pSup->numOfExprs = numOfExpr;
  if (pSup->pExprInfo != NULL) {
    pSup->pCtx = createSqlFunctionCtx(pExprInfo, numOfExpr, &pSup->rowEntryInfoOffset);
3646 3647 3648
    if (pSup->pCtx == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
3649
  }
3650 3651

  return TSDB_CODE_SUCCESS;
3652 3653
}

3654 3655 3656 3657 3658 3659 3660 3661 3662 3663
void cleanupExprSupp(SExprSupp* pSupp) {
  destroySqlFunctionCtx(pSupp->pCtx, pSupp->numOfExprs);
  if (pSupp->pExprInfo != NULL) {
    destroyExprInfo(pSupp->pExprInfo, pSupp->numOfExprs);
  }

  taosMemoryFreeClear(pSupp->pExprInfo);
  taosMemoryFree(pSupp->rowEntryInfoOffset);
}

L
Liu Jicong 已提交
3664
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
S
slzhou 已提交
3665
                                           SSDataBlock* pResultBlock, SNode* pCondition, SExprInfo* pScalarExprInfo,
wmmhello's avatar
wmmhello 已提交
3666
                                           int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3667
  SAggOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SAggOperatorInfo));
L
Liu Jicong 已提交
3668
  SOperatorInfo*    pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3669 3670 3671
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
H
Haojun Liao 已提交
3672

3673
  int32_t numOfRows = 1024;
dengyihao's avatar
dengyihao 已提交
3674
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3675 3676

  initResultSizeInfo(pOperator, numOfRows);
3677
  int32_t code = initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
L
Liu Jicong 已提交
3678
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3679 3680
    goto _error;
  }
H
Haojun Liao 已提交
3681

3682
  initBasicInfo(&pInfo->binfo, pResultBlock);
3683 3684 3685 3686
  code = initExprSupp(&pInfo->scalarExprSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3687

L
Liu Jicong 已提交
3688
  pInfo->groupId = INT32_MIN;
S
slzhou 已提交
3689
  pInfo->pCondition = pCondition;
dengyihao's avatar
dengyihao 已提交
3690
  pOperator->name = "TableAggregate";
3691
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_HASH_AGG;
3692
  pOperator->blocking = true;
dengyihao's avatar
dengyihao 已提交
3693 3694 3695
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3696

3697 3698
  pOperator->fpSet = createOperatorFpSet(doOpenAggregateOptr, getAggregateResult, NULL, NULL, destroyAggOperatorInfo,
                                         aggEncodeResultRow, aggDecodeResultRow, NULL);
H
Haojun Liao 已提交
3699 3700 3701 3702 3703

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3704 3705

  return pOperator;
L
Liu Jicong 已提交
3706
_error:
H
Haojun Liao 已提交
3707
  destroyAggOperatorInfo(pInfo, numOfCols);
wafwerar's avatar
wafwerar 已提交
3708 3709
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
H
Haojun Liao 已提交
3710 3711
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3712 3713
}

3714
void cleanupBasicInfo(SOptrBasicInfo* pInfo) {
3715 3716
  assert(pInfo != NULL);
  cleanupResultRowInfo(&pInfo->resultRowInfo);
H
Haojun Liao 已提交
3717
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
3718 3719
}

H
Haojun Liao 已提交
3720
void destroyBasicOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3721
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)param;
3722
  cleanupBasicInfo(pInfo);
L
Liu Jicong 已提交
3723

D
dapan1121 已提交
3724
  taosMemoryFreeClear(param);
3725
}
H
Haojun Liao 已提交
3726

H
Haojun Liao 已提交
3727 3728 3729 3730 3731 3732 3733 3734

static void freeItem(void* pItem) {
  void** p = pItem;
  if (*p != NULL) {
    taosMemoryFreeClear(*p);
  }
}

H
Haojun Liao 已提交
3735
void destroyAggOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3736
  SAggOperatorInfo* pInfo = (SAggOperatorInfo*)param;
L
Liu Jicong 已提交
3737 3738
  cleanupBasicInfo(&pInfo->binfo);

H
Haojun Liao 已提交
3739 3740
  cleanupAggSup(&pInfo->aggSup);
  taosArrayDestroyEx(pInfo->groupResInfo.pRows, freeItem);
D
dapan1121 已提交
3741
  taosMemoryFreeClear(param);
3742
}
3743

H
Haojun Liao 已提交
3744
void destroySFillOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3745
  SFillOperatorInfo* pInfo = (SFillOperatorInfo*)param;
3746
  pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
H
Haojun Liao 已提交
3747
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
wafwerar's avatar
wafwerar 已提交
3748
  taosMemoryFreeClear(pInfo->p);
L
Liu Jicong 已提交
3749

D
dapan1121 已提交
3750
  taosMemoryFreeClear(param);
3751 3752
}

H
Haojun Liao 已提交
3753
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput) {
D
fix bug  
dapan 已提交
3754 3755 3756
  if (NULL == param) {
    return;
  }
L
Liu Jicong 已提交
3757
  SProjectOperatorInfo* pInfo = (SProjectOperatorInfo*)param;
3758
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3759
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3760
  taosArrayDestroy(pInfo->pPseudoColInfo);
L
Liu Jicong 已提交
3761

D
dapan1121 已提交
3762
  taosMemoryFreeClear(param);
3763 3764
}

H
Haojun Liao 已提交
3765
static void destroyIndefinitOperatorInfo(void* param, int32_t numOfOutput) {
3766
  SIndefOperatorInfo* pInfo = (SIndefOperatorInfo*)param;
3767
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3768 3769 3770

  taosArrayDestroy(pInfo->pPseudoColInfo);
  cleanupAggSup(&pInfo->aggSup);
3771
  cleanupExprSupp(&pInfo->scalarSup);
L
Liu Jicong 已提交
3772

D
dapan1121 已提交
3773
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3774 3775
}

H
Haojun Liao 已提交
3776
void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3777
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3778 3779 3780 3781
  taosRemoveRef(exchangeObjRefPool, pExInfo->self);
}

void doDestroyExchangeOperatorInfo(void* param) {
X
Xiaoyu Wang 已提交
3782
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3783

H
Haojun Liao 已提交
3784 3785 3786
  taosArrayDestroy(pExInfo->pSources);
  taosArrayDestroy(pExInfo->pSourceDataInfo);
  if (pExInfo->pResult != NULL) {
H
Haojun Liao 已提交
3787
    pExInfo->pResult = blockDataDestroy(pExInfo->pResult);
H
Haojun Liao 已提交
3788 3789 3790
  }

  tsem_destroy(&pExInfo->ready);
L
Liu Jicong 已提交
3791

D
dapan1121 已提交
3792
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3793 3794
}

H
Haojun Liao 已提交
3795 3796
static SArray* setRowTsColumnOutputInfo(SqlFunctionCtx* pCtx, int32_t numOfCols) {
  SArray* pList = taosArrayInit(4, sizeof(int32_t));
dengyihao's avatar
dengyihao 已提交
3797
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
3798 3799 3800 3801 3802 3803 3804 3805
    if (fmIsPseudoColumnFunc(pCtx[i].functionId)) {
      taosArrayPush(pList, &i);
    }
  }

  return pList;
}

L
Liu Jicong 已提交
3806
SOperatorInfo* createProjectOperatorInfo(SOperatorInfo* downstream, SProjectPhysiNode* pProjPhyNode,
dengyihao's avatar
dengyihao 已提交
3807
                                         SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3808
  SProjectOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SProjectOperatorInfo));
L
Liu Jicong 已提交
3809
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3810 3811 3812
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
3813

L
Liu Jicong 已提交
3814
  int32_t    numOfCols = 0;
3815 3816 3817
  SExprInfo* pExprInfo = createExprInfo(pProjPhyNode->pProjections, NULL, &numOfCols);

  SSDataBlock* pResBlock = createResDataBlock(pProjPhyNode->node.pOutputDataBlockDesc);
3818
  initLimitInfo(pProjPhyNode->node.pLimit, pProjPhyNode->node.pSlimit, &pInfo->limitInfo);
3819

H
Haojun Liao 已提交
3820
  pInfo->binfo.pRes = pResBlock;
3821
  pInfo->pFilterNode = pProjPhyNode->node.pConditions;
H
Haojun Liao 已提交
3822 3823

  int32_t numOfRows = 4096;
dengyihao's avatar
dengyihao 已提交
3824
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3825

3826 3827 3828 3829 3830
  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
3831
  initResultSizeInfo(pOperator, numOfRows);
3832

3833 3834
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);
3835
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfCols);
3836

3837
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pOperator->exprSupp.pCtx, numOfCols);
X
Xiaoyu Wang 已提交
3838
  pOperator->name = "ProjectOperator";
H
Haojun Liao 已提交
3839
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
X
Xiaoyu Wang 已提交
3840 3841 3842 3843
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
3844

L
Liu Jicong 已提交
3845 3846
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doProjectOperation, NULL, NULL,
                                         destroyProjectOperatorInfo, NULL, NULL, NULL);
L
Liu Jicong 已提交
3847

3848
  int32_t code = appendDownstream(pOperator, &downstream, 1);
H
Haojun Liao 已提交
3849
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3850 3851
    goto _error;
  }
3852 3853

  return pOperator;
H
Haojun Liao 已提交
3854

L
Liu Jicong 已提交
3855
_error:
H
Haojun Liao 已提交
3856 3857
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3858 3859
}

3860 3861
static void doHandleDataBlock(SOperatorInfo* pOperator, SSDataBlock* pBlock, SOperatorInfo* downstream,
                              SExecTaskInfo* pTaskInfo) {
3862 3863 3864 3865 3866 3867 3868 3869 3870 3871 3872 3873 3874 3875 3876 3877 3878 3879 3880 3881 3882 3883 3884 3885 3886 3887 3888 3889 3890 3891 3892 3893 3894
  int32_t order = 0;
  int32_t scanFlag = 0;

  SIndefOperatorInfo* pIndefInfo = pOperator->info;
  SOptrBasicInfo*     pInfo = &pIndefInfo->binfo;
  SExprSupp*          pSup = &pOperator->exprSupp;

  // the pDataBlock are always the same one, no need to call this again
  int32_t code = getTableScanInfo(downstream, &order, &scanFlag);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }

  // there is an scalar expression that needs to be calculated before apply the group aggregation.
  SExprSupp* pScalarSup = &pIndefInfo->scalarSup;
  if (pScalarSup->pExprInfo != NULL) {
    code = projectApplyFunctions(pScalarSup->pExprInfo, pBlock, pBlock, pScalarSup->pCtx, pScalarSup->numOfExprs,
                                 pIndefInfo->pPseudoColInfo);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
  }

  setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
  blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

  code = projectApplyFunctions(pSup->pExprInfo, pInfo->pRes, pBlock, pSup->pCtx, pSup->numOfExprs,
                               pIndefInfo->pPseudoColInfo);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }
}

H
Haojun Liao 已提交
3895 3896
static SSDataBlock* doApplyIndefinitFunction(SOperatorInfo* pOperator) {
  SIndefOperatorInfo* pIndefInfo = pOperator->info;
3897
  SOptrBasicInfo*     pInfo = &pIndefInfo->binfo;
L
Liu Jicong 已提交
3898
  SExprSupp*          pSup = &pOperator->exprSupp;
H
Haojun Liao 已提交
3899 3900 3901 3902 3903 3904 3905 3906 3907 3908 3909 3910 3911 3912 3913 3914 3915

  SSDataBlock* pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  int64_t st = 0;

  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];

3916
  while (1) {
3917
    // here we need to handle the existsed group results
3918
    if (pIndefInfo->pNextGroupRes != NULL) {  // todo extract method
3919 3920
      for (int32_t k = 0; k < pSup->numOfExprs; ++k) {
        SqlFunctionCtx* pCtx = &pSup->pCtx[k];
H
Haojun Liao 已提交
3921

3922 3923 3924 3925 3926 3927 3928
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);
        pResInfo->initialized = false;
        pCtx->pOutput = NULL;
      }

      doHandleDataBlock(pOperator, pIndefInfo->pNextGroupRes, downstream, pTaskInfo);
      pIndefInfo->pNextGroupRes = NULL;
H
Haojun Liao 已提交
3929 3930
    }

3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941 3942 3943 3944 3945 3946 3947 3948 3949 3950 3951 3952 3953
    if (pInfo->pRes->info.rows < pOperator->resultInfo.threshold) {
      while (1) {
        // The downstream exec may change the value of the newgroup, so use a local variable instead.
        SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
        if (pBlock == NULL) {
          doSetOperatorCompleted(pOperator);
          break;
        }

        if (pIndefInfo->groupId == 0 && pBlock->info.groupId != 0) {
          pIndefInfo->groupId = pBlock->info.groupId;  // this is the initial group result
        } else {
          if (pIndefInfo->groupId != pBlock->info.groupId) {  // reset output buffer and computing status
            pIndefInfo->groupId = pBlock->info.groupId;
            pIndefInfo->pNextGroupRes = pBlock;
            break;
          }
        }

        doHandleDataBlock(pOperator, pBlock, downstream, pTaskInfo);
        if (pInfo->pRes->info.rows >= pOperator->resultInfo.threshold) {
          break;
        }
H
Haojun Liao 已提交
3954 3955 3956
      }
    }

3957 3958 3959 3960
    doFilter(pIndefInfo->pCondition, pInfo->pRes);
    size_t rows = pInfo->pRes->info.rows;
    if (rows >= 0) {
      break;
H
Haojun Liao 已提交
3961 3962 3963 3964 3965 3966 3967 3968 3969 3970 3971 3972 3973
    }
  }

  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
  }

  return (rows > 0) ? pInfo->pRes : NULL;
}

3974 3975
SOperatorInfo* createIndefinitOutputOperatorInfo(SOperatorInfo* downstream, SPhysiNode* pNode,
                                                 SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
3976
  SIndefOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SIndefOperatorInfo));
3977
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3978 3979 3980 3981
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

3982 3983
  SExprSupp* pSup = &pOperator->exprSupp;

H
Haojun Liao 已提交
3984 3985 3986
  SIndefRowsFuncPhysiNode* pPhyNode = (SIndefRowsFuncPhysiNode*)pNode;

  int32_t    numOfExpr = 0;
X
Xiaoyu Wang 已提交
3987
  SExprInfo* pExprInfo = createExprInfo(pPhyNode->pFuncs, NULL, &numOfExpr);
H
Haojun Liao 已提交
3988 3989

  if (pPhyNode->pExprs != NULL) {
3990
    int32_t    num = 0;
3991
    SExprInfo* pSExpr = createExprInfo(pPhyNode->pExprs, NULL, &num);
3992
    int32_t    code = initExprSupp(&pInfo->scalarSup, pSExpr, num);
3993 3994 3995
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
H
Haojun Liao 已提交
3996 3997
  }

3998
  SSDataBlock* pResBlock = createResDataBlock(pPhyNode->node.pOutputDataBlockDesc);
H
Haojun Liao 已提交
3999 4000 4001 4002 4003 4004 4005 4006 4007

  int32_t numOfRows = 4096;
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;

  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
4008

H
Haojun Liao 已提交
4009 4010
  initResultSizeInfo(pOperator, numOfRows);

4011
  initAggInfo(pSup, &pInfo->aggSup, pExprInfo, numOfExpr, keyBufSize, pTaskInfo->id.str);
4012 4013
  initBasicInfo(&pInfo->binfo, pResBlock);

4014
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfExpr);
H
Haojun Liao 已提交
4015

4016 4017 4018
  pInfo->binfo.pRes = pResBlock;
  pInfo->pCondition = pPhyNode->node.pConditions;
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pSup->pCtx, numOfExpr);
H
Haojun Liao 已提交
4019

4020
  pOperator->name = "IndefinitOperator";
4021
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC;
4022 4023 4024
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
4025
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
4026 4027 4028 4029 4030 4031 4032 4033 4034 4035 4036

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doApplyIndefinitFunction, NULL, NULL,
                                         destroyIndefinitOperatorInfo, NULL, NULL, NULL);

  int32_t code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

4037
_error:
H
Haojun Liao 已提交
4038 4039 4040 4041 4042 4043
  taosMemoryFree(pInfo);
  taosMemoryFree(pOperator);
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}

4044
static int32_t initFillInfo(SFillOperatorInfo* pInfo, SExprInfo* pExpr, int32_t numOfCols, SNodeListNode* pValNode,
L
Liu Jicong 已提交
4045
                            STimeWindow win, int32_t capacity, const char* id, SInterval* pInterval, int32_t fillType) {
4046
  SFillColInfo* pColInfo = createFillColInfo(pExpr, numOfCols, pValNode);
H
Haojun Liao 已提交
4047 4048

  STimeWindow w = TSWINDOW_INITIALIZER;
4049
  getAlignQueryTimeWindow(pInterval, pInterval->precision, win.skey, &w);
4050
  w = getFirstQualifiedTimeWindow(win.skey, &w, pInterval, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
4051 4052

  int32_t order = TSDB_ORDER_ASC;
4053 4054
  pInfo->pFillInfo = taosCreateFillInfo(order, w.skey, 0, capacity, numOfCols, pInterval,
      fillType, pColInfo, pInfo->primaryTsCol, id);
H
Haojun Liao 已提交
4055

4056
  pInfo->win = win;
L
Liu Jicong 已提交
4057
  pInfo->p = taosMemoryCalloc(numOfCols, POINTER_BYTES);
4058

H
Haojun Liao 已提交
4059
  if (pInfo->pFillInfo == NULL || pInfo->p == NULL) {
H
Haojun Liao 已提交
4060 4061
    taosMemoryFree(pInfo->pFillInfo);
    taosMemoryFree(pInfo->p);
H
Haojun Liao 已提交
4062 4063 4064 4065 4066 4067
    return TSDB_CODE_OUT_OF_MEMORY;
  } else {
    return TSDB_CODE_SUCCESS;
  }
}

H
Haojun Liao 已提交
4068
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SFillPhysiNode* pPhyFillNode, SExecTaskInfo* pTaskInfo) {
4069 4070 4071 4072 4073 4074
  SFillOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SFillOperatorInfo));
  SOperatorInfo*     pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

L
Liu Jicong 已提交
4075 4076 4077
  int32_t      num = 0;
  SSDataBlock* pResBlock = createResDataBlock(pPhyFillNode->node.pOutputDataBlockDesc);
  SExprInfo*   pExprInfo = createExprInfo(pPhyFillNode->pTargets, NULL, &num);
4078 4079 4080 4081
  SInterval*   pInterval =
      QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == downstream->operatorType
            ? &((SMergeAlignedIntervalAggOperatorInfo*)downstream->info)->intervalAggOperatorInfo->interval
            : &((SIntervalAggOperatorInfo*)downstream->info)->interval;
4082

4083
  int32_t type = convertFillType(pPhyFillNode->mode);
4084

H
Haojun Liao 已提交
4085
  SResultInfo* pResultInfo = &pOperator->resultInfo;
4086
  initResultSizeInfo(pOperator, 4096);
H
Haojun Liao 已提交
4087
  pInfo->primaryTsCol = ((SColumnNode*)pPhyFillNode->pWStartTs)->slotId;
4088

4089
  int32_t numOfOutputCols = 0;
4090 4091
  SArray* pColMatchColInfo = extractColMatchInfo(pPhyFillNode->pTargets, pPhyFillNode->node.pOutputDataBlockDesc,
                                                 &numOfOutputCols, COL_MATCH_FROM_SLOT_ID);
4092

4093 4094
  int32_t code = initFillInfo(pInfo, pExprInfo, num, (SNodeListNode*)pPhyFillNode->pValues, pPhyFillNode->timeRange,
                              pResultInfo->capacity, pTaskInfo->id.str, pInterval, type);
4095 4096 4097
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
4098

4099 4100 4101 4102 4103 4104 4105 4106
  pInfo->pRes = pResBlock;
  pInfo->pCondition = pPhyFillNode->node.pConditions;
  pInfo->pColMatchColInfo = pColMatchColInfo;
  pOperator->name = "FillOperator";
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_FILL;
  pOperator->exprSupp.pExprInfo = pExprInfo;
4107
  pOperator->exprSupp.numOfExprs = num;
4108 4109
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
4110

L
Liu Jicong 已提交
4111 4112
  pOperator->fpSet =
      createOperatorFpSet(operatorDummyOpenFn, doFill, NULL, NULL, destroySFillOperatorInfo, NULL, NULL, NULL);
4113

4114
  code = appendDownstream(pOperator, &downstream, 1);
4115
  return pOperator;
H
Haojun Liao 已提交
4116

L
Liu Jicong 已提交
4117
_error:
wafwerar's avatar
wafwerar 已提交
4118 4119
  taosMemoryFreeClear(pOperator);
  taosMemoryFreeClear(pInfo);
H
Haojun Liao 已提交
4120
  return NULL;
4121 4122
}

D
dapan1121 已提交
4123
static SExecTaskInfo* createExecTaskInfo(uint64_t queryId, uint64_t taskId, EOPTR_EXEC_MODEL model, char* dbFName) {
wafwerar's avatar
wafwerar 已提交
4124
  SExecTaskInfo* pTaskInfo = taosMemoryCalloc(1, sizeof(SExecTaskInfo));
4125
  setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);
H
Haojun Liao 已提交
4126

D
dapan1121 已提交
4127
  pTaskInfo->schemaVer.dbname = strdup(dbFName);
4128
  pTaskInfo->cost.created = taosGetTimestampMs();
H
Haojun Liao 已提交
4129
  pTaskInfo->id.queryId = queryId;
dengyihao's avatar
dengyihao 已提交
4130
  pTaskInfo->execModel = model;
H
Haojun Liao 已提交
4131

wafwerar's avatar
wafwerar 已提交
4132
  char* p = taosMemoryCalloc(1, 128);
L
Liu Jicong 已提交
4133
  snprintf(p, 128, "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, queryId);
H
Haojun Liao 已提交
4134
  pTaskInfo->id.str = p;
H
Haojun Liao 已提交
4135

4136 4137
  return pTaskInfo;
}
H
Haojun Liao 已提交
4138

H
Hongze Cheng 已提交
4139
static STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
H
Haojun Liao 已提交
4140
                                       STableListInfo* pTableListInfo, const char* idstr);
H
Haojun Liao 已提交
4141

H
Haojun Liao 已提交
4142
static SArray* extractColumnInfo(SNodeList* pNodeList);
4143

4144
int32_t extractTableSchemaInfo(SReadHandle* pHandle, uint64_t uid, SExecTaskInfo* pTaskInfo) {
4145 4146
  SMetaReader mr = {0};
  metaReaderInit(&mr, pHandle->meta, 0);
D
dapan1121 已提交
4147
  int32_t code = metaGetTableEntryByUid(&mr, uid);
4148
  if (code != TSDB_CODE_SUCCESS) {
D
dapan1121 已提交
4149
    metaReaderClear(&mr);
4150
    return terrno;
D
dapan1121 已提交
4151
  }
4152 4153 4154 4155

  pTaskInfo->schemaVer.tablename = strdup(mr.me.name);

  if (mr.me.type == TSDB_SUPER_TABLE) {
4156
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
4157
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
4158
  } else if (mr.me.type == TSDB_CHILD_TABLE) {
4159 4160
    tDecoderClear(&mr.coder);

4161 4162
    tb_uid_t suid = mr.me.ctbEntry.suid;
    metaGetTableEntryByUid(&mr, suid);
4163
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
4164
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
4165
  } else {
4166
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.ntbEntry.schemaRow);
4167
  }
4168 4169

  metaReaderClear(&mr);
D
dapan1121 已提交
4170
  return TSDB_CODE_SUCCESS;
4171 4172
}

4173 4174 4175 4176 4177 4178 4179 4180 4181 4182 4183
static void cleanupTableSchemaInfo(SExecTaskInfo* pTaskInfo) {
  taosMemoryFreeClear(pTaskInfo->schemaVer.dbname);
  if (pTaskInfo->schemaVer.sw == NULL) {
    return;
  }

  taosMemoryFree(pTaskInfo->schemaVer.sw->pSchema);
  taosMemoryFree(pTaskInfo->schemaVer.sw);
  taosMemoryFree(pTaskInfo->schemaVer.tablename);
}

4184
static int32_t sortTableGroup(STableListInfo* pTableListInfo, int32_t groupNum) {
wmmhello's avatar
wmmhello 已提交
4185
  taosArrayClear(pTableListInfo->pGroupList);
4186 4187
  SArray* sortSupport = taosArrayInit(groupNum, sizeof(uint64_t));
  if (sortSupport == NULL) return TSDB_CODE_OUT_OF_MEMORY;
wmmhello's avatar
wmmhello 已提交
4188 4189
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
4190
    uint64_t*      groupId = taosHashGet(pTableListInfo->map, &info->uid, sizeof(uint64_t));
wmmhello's avatar
wmmhello 已提交
4191 4192

    int32_t index = taosArraySearchIdx(sortSupport, groupId, compareUint64Val, TD_EQ);
4193 4194 4195 4196
    if (index == -1) {
      void*   p = taosArraySearch(sortSupport, groupId, compareUint64Val, TD_GT);
      SArray* tGroup = taosArrayInit(8, sizeof(STableKeyInfo));
      if (tGroup == NULL) {
wmmhello's avatar
wmmhello 已提交
4197 4198 4199
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
4200
      if (taosArrayPush(tGroup, info) == NULL) {
wmmhello's avatar
wmmhello 已提交
4201 4202 4203 4204
        qError("taos push info array error");
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }
4205
      if (p == NULL) {
wmmhello's avatar
wmmhello 已提交
4206
        if (taosArrayPush(sortSupport, groupId) == NULL) {
wmmhello's avatar
wmmhello 已提交
4207 4208 4209 4210
          qError("taos push support array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
wmmhello's avatar
wmmhello 已提交
4211
        if (taosArrayPush(pTableListInfo->pGroupList, &tGroup) == NULL) {
wmmhello's avatar
wmmhello 已提交
4212 4213 4214 4215
          qError("taos push group array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
4216
      } else {
wmmhello's avatar
wmmhello 已提交
4217
        int32_t pos = TARRAY_ELEM_IDX(sortSupport, p);
4218
        if (taosArrayInsert(sortSupport, pos, groupId) == NULL) {
wmmhello's avatar
wmmhello 已提交
4219 4220 4221 4222
          qError("taos insert support array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
4223
        if (taosArrayInsert(pTableListInfo->pGroupList, pos, &tGroup) == NULL) {
wmmhello's avatar
wmmhello 已提交
4224 4225 4226 4227 4228
          qError("taos insert group array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
      }
4229
    } else {
wmmhello's avatar
wmmhello 已提交
4230
      SArray* tGroup = (SArray*)taosArrayGetP(pTableListInfo->pGroupList, index);
4231
      if (taosArrayPush(tGroup, info) == NULL) {
wmmhello's avatar
wmmhello 已提交
4232 4233 4234 4235 4236 4237 4238 4239 4240 4241
        qError("taos push uid array error");
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }
    }
  }
  taosArrayDestroy(sortSupport);
  return TDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
4242 4243
int32_t generateGroupIdMap(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group) {
  if (group == NULL) {
wmmhello's avatar
wmmhello 已提交
4244 4245 4246 4247 4248 4249 4250 4251
    return TDB_CODE_SUCCESS;
  }

  pTableListInfo->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pTableListInfo->map == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  int32_t keyLen = 0;
X
Xiaoyu Wang 已提交
4252
  void*   keyBuf = NULL;
wmmhello's avatar
wmmhello 已提交
4253

4254
  SNode* node;
wmmhello's avatar
wmmhello 已提交
4255
  FOREACH(node, group) {
4256
    SExprNode* pExpr = (SExprNode*)node;
wmmhello's avatar
wmmhello 已提交
4257
    keyLen += pExpr->resType.bytes;
wmmhello's avatar
wmmhello 已提交
4258 4259
  }

wmmhello's avatar
wmmhello 已提交
4260
  int32_t nullFlagSize = sizeof(int8_t) * LIST_LENGTH(group);
wmmhello's avatar
wmmhello 已提交
4261 4262 4263 4264 4265 4266 4267
  keyLen += nullFlagSize;

  keyBuf = taosMemoryCalloc(1, keyLen);
  if (keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

4268
  int32_t groupNum = 0;
X
Xiaoyu Wang 已提交
4269 4270 4271
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    SMetaReader    mr = {0};
wmmhello's avatar
wmmhello 已提交
4272 4273 4274
    metaReaderInit(&mr, pHandle->meta, 0);
    metaGetTableEntryByUid(&mr, info->uid);

4275
    SNodeList* groupNew = nodesCloneList(group);
wmmhello's avatar
wmmhello 已提交
4276

wmmhello's avatar
wmmhello 已提交
4277
    nodesRewriteExprsPostOrder(groupNew, doTranslateTagExpr, &mr);
wmmhello's avatar
wmmhello 已提交
4278
    char* isNull = (char*)keyBuf;
wmmhello's avatar
wmmhello 已提交
4279 4280
    char* pStart = (char*)keyBuf + nullFlagSize;

4281
    SNode*  pNode;
wmmhello's avatar
wmmhello 已提交
4282
    int32_t index = 0;
4283
    FOREACH(pNode, groupNew) {
wmmhello's avatar
wmmhello 已提交
4284 4285 4286 4287
      SNode*  pNew = NULL;
      int32_t code = scalarCalculateConstants(pNode, &pNew);
      if (TSDB_CODE_SUCCESS == code) {
        REPLACE_NODE(pNew);
X
Xiaoyu Wang 已提交
4288
      } else {
4289
        taosMemoryFree(keyBuf);
wmmhello's avatar
wmmhello 已提交
4290
        nodesClearList(groupNew);
4291
        metaReaderClear(&mr);
wmmhello's avatar
wmmhello 已提交
4292
        return code;
wmmhello's avatar
wmmhello 已提交
4293
      }
4294

wmmhello's avatar
wmmhello 已提交
4295
      ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
4296
      SValueNode* pValue = (SValueNode*)pNew;
4297

wmmhello's avatar
wmmhello 已提交
4298
      if (pValue->node.resType.type == TSDB_DATA_TYPE_NULL || pValue->isNull) {
wmmhello's avatar
wmmhello 已提交
4299 4300 4301 4302
        isNull[index++] = 1;
        continue;
      } else {
        isNull[index++] = 0;
4303
        char* data = nodesGetValueFromNode(pValue);
L
Liu Jicong 已提交
4304 4305
        if (pValue->node.resType.type == TSDB_DATA_TYPE_JSON) {
          if (tTagIsJson(data)) {
wmmhello's avatar
wmmhello 已提交
4306 4307 4308
            terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
            taosMemoryFree(keyBuf);
            nodesClearList(groupNew);
4309
            metaReaderClear(&mr);
wmmhello's avatar
wmmhello 已提交
4310 4311
            return terrno;
          }
wmmhello's avatar
wmmhello 已提交
4312
          int32_t len = getJsonValueLen(data);
wmmhello's avatar
wmmhello 已提交
4313 4314 4315
          memcpy(pStart, data, len);
          pStart += len;
        } else if (IS_VAR_DATA_TYPE(pValue->node.resType.type)) {
wmmhello's avatar
wmmhello 已提交
4316 4317
          memcpy(pStart, data, varDataTLen(data));
          pStart += varDataTLen(data);
wmmhello's avatar
wmmhello 已提交
4318
        } else {
wmmhello's avatar
wmmhello 已提交
4319 4320
          memcpy(pStart, data, pValue->node.resType.bytes);
          pStart += pValue->node.resType.bytes;
wmmhello's avatar
wmmhello 已提交
4321 4322 4323
        }
      }
    }
4324

4325
    int32_t  len = (int32_t)(pStart - (char*)keyBuf);
4326 4327
    uint64_t groupId = calcGroupId(keyBuf, len);
    taosHashPut(pTableListInfo->map, &(info->uid), sizeof(uint64_t), &groupId, sizeof(uint64_t));
S
slzhou 已提交
4328
    info->groupId = groupId;
4329
    groupNum++;
wmmhello's avatar
wmmhello 已提交
4330

wmmhello's avatar
wmmhello 已提交
4331
    nodesClearList(groupNew);
wmmhello's avatar
wmmhello 已提交
4332 4333 4334
    metaReaderClear(&mr);
  }
  taosMemoryFree(keyBuf);
4335

4336
  if (pTableListInfo->needSortTableByGroupId) {
wmmhello's avatar
wmmhello 已提交
4337
    return sortTableGroup(pTableListInfo, groupNum);
4338 4339
  }

wmmhello's avatar
wmmhello 已提交
4340 4341 4342
  return TDB_CODE_SUCCESS;
}

4343 4344 4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364 4365 4366
static int32_t initTableblockDistQueryCond(uint64_t uid, SQueryTableDataCond* pCond) {
  memset(pCond, 0, sizeof(SQueryTableDataCond));

  pCond->order = TSDB_ORDER_ASC;
  pCond->numOfCols = 1;
  pCond->colList = taosMemoryCalloc(1, sizeof(SColumnInfo));
  if (pCond->colList == NULL) {
    terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return terrno;
  }

  pCond->colList->colId = 1;
  pCond->colList->type = TSDB_DATA_TYPE_TIMESTAMP;
  pCond->colList->bytes = sizeof(TSKEY);

  pCond->twindows = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};
  pCond->suid = uid;
  pCond->type = BLOCK_LOAD_OFFSET_ORDER;
  pCond->startVersion = -1;
  pCond->endVersion  =  -1;

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4367
SOperatorInfo* createOperatorTree(SPhysiNode* pPhyNode, SExecTaskInfo* pTaskInfo, SReadHandle* pHandle,
4368 4369
                                  uint64_t queryId, uint64_t taskId, STableListInfo* pTableListInfo,
                                  const char* pUser) {
4370 4371
  int32_t type = nodeType(pPhyNode);

X
Xiaoyu Wang 已提交
4372
  if (pPhyNode->pChildren == NULL || LIST_LENGTH(pPhyNode->pChildren) == 0) {
H
Haojun Liao 已提交
4373
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == type) {
dengyihao's avatar
dengyihao 已提交
4374
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4375

4376 4377
      int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
                                             pTableScanNode->groupSort, pHandle, pTableListInfo, queryId, taskId);
4378
      if (code) {
wmmhello's avatar
wmmhello 已提交
4379
        pTaskInfo->code = code;
D
dapan1121 已提交
4380 4381
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4382

4383
      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
S
slzhou 已提交
4384
      if (code) {
4385
        pTaskInfo->code = terrno;
wmmhello's avatar
wmmhello 已提交
4386 4387 4388
        return NULL;
      }

H
Haojun Liao 已提交
4389
      SOperatorInfo*  pOperator = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo);
4390 4391
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
S
slzhou 已提交
4392
      return pOperator;
L
Liu Jicong 已提交
4393

S
slzhou 已提交
4394 4395
    } else if (QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN == type) {
      STableMergeScanPhysiNode* pTableScanNode = (STableMergeScanPhysiNode*)pPhyNode;
4396 4397
      int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
                                             pTableScanNode->groupSort, pHandle, pTableListInfo, queryId, taskId);
L
Liu Jicong 已提交
4398
      if (code) {
wmmhello's avatar
wmmhello 已提交
4399
        pTaskInfo->code = code;
wmmhello's avatar
wmmhello 已提交
4400 4401
        return NULL;
      }
4402

4403
      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
wmmhello's avatar
wmmhello 已提交
4404 4405 4406 4407
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4408

4409 4410
      SOperatorInfo* pOperator =
          createTableMergeScanOperatorInfo(pTableScanNode, pTableListInfo, pHandle, pTaskInfo, queryId, taskId);
wmmhello's avatar
wmmhello 已提交
4411

4412 4413 4414
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
      return pOperator;
L
Liu Jicong 已提交
4415

H
Haojun Liao 已提交
4416
    } else if (QUERY_NODE_PHYSICAL_PLAN_EXCHANGE == type) {
4417
      return createExchangeOperatorInfo(pHandle->pMsgCb->clientRpc, (SExchangePhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4418
    } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN == type) {
5
54liuyao 已提交
4419
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
4420
      STimeWindowAggSupp   twSup = {
L
Liu Jicong 已提交
4421 4422 4423 4424
            .waterMark = pTableScanNode->watermark,
            .calTrigger = pTableScanNode->triggerType,
            .maxTs = INT64_MIN,
      };
L
Liu Jicong 已提交
4425
      if (pHandle) {
4426 4427
        int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
                                               pTableScanNode->groupSort, pHandle, pTableListInfo, queryId, taskId);
L
Liu Jicong 已提交
4428
        if (code) {
wmmhello's avatar
wmmhello 已提交
4429 4430 4431
          pTaskInfo->code = code;
          return NULL;
        }
5
54liuyao 已提交
4432
      }
4433

4434 4435
      SOperatorInfo* pOperator =
          createStreamScanOperatorInfo(pHandle, pTableScanNode, pTaskInfo, &twSup, queryId, taskId);
H
Haojun Liao 已提交
4436
      return pOperator;
L
Liu Jicong 已提交
4437

H
Haojun Liao 已提交
4438
    } else if (QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN == type) {
L
Liu Jicong 已提交
4439
      SSystemTableScanPhysiNode* pSysScanPhyNode = (SSystemTableScanPhysiNode*)pPhyNode;
4440
      return createSysTableScanOperatorInfo(pHandle, pSysScanPhyNode, pUser, pTaskInfo);
4441
    } else if (QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN == type) {
X
Xiaoyu Wang 已提交
4442
      STagScanPhysiNode* pScanPhyNode = (STagScanPhysiNode*)pPhyNode;
4443

4444
      int32_t code = getTableList(pHandle->meta, pHandle->vnode, pScanPhyNode, pTableListInfo);
4445
      if (code != TSDB_CODE_SUCCESS) {
4446
        pTaskInfo->code = terrno;
4447 4448 4449
        return NULL;
      }

4450
      return createTagScanOperatorInfo(pHandle, pScanPhyNode, pTableListInfo, pTaskInfo);
4451
    } else if (QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN == type) {
4452
      SBlockDistScanPhysiNode* pBlockNode = (SBlockDistScanPhysiNode*)pPhyNode;
4453 4454 4455
      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));

      if (pBlockNode->tableType == TSDB_SUPER_TABLE) {
4456
        int32_t code = vnodeGetAllTableList(pHandle->vnode, pBlockNode->uid, pTableListInfo->pTableList);
4457 4458 4459 4460 4461
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
S
slzhou 已提交
4462
        STableKeyInfo info = {.lastKey = 0, .uid = pBlockNode->uid, .groupId = 0};
4463 4464 4465 4466
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      SQueryTableDataCond cond = {0};
4467 4468 4469
      int32_t code = initTableblockDistQueryCond(pBlockNode->suid, &cond);
      if (code != TSDB_CODE_SUCCESS) {
        return NULL;
4470
      }
H
Haojun Liao 已提交
4471 4472 4473

      STsdbReader* pReader = NULL;
      tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, "");
4474 4475
      cleanupQueryTableDataCond(&cond);

4476
      return createDataBlockInfoScanOperator(pReader, pHandle, cond.suid, pBlockNode, pTaskInfo);
H
Haojun Liao 已提交
4477 4478 4479
    } else if (QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN == type) {
      SLastRowScanPhysiNode* pScanNode = (SLastRowScanPhysiNode*)pPhyNode;

4480 4481
      int32_t code = createScanTableListInfo(&pScanNode->scan, pScanNode->pGroupTags, true, pHandle, pTableListInfo,
                                             queryId, taskId);
4482 4483 4484 4485
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
      }
4486

4487 4488 4489 4490
      code = extractTableSchemaInfo(pHandle, pScanNode->scan.uid, pTaskInfo);
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
H
Haojun Liao 已提交
4491 4492
      }

4493
      return createLastrowScanOperator(pScanNode, pHandle, pTaskInfo);
H
Haojun Liao 已提交
4494 4495
    } else {
      ASSERT(0);
H
Haojun Liao 已提交
4496 4497 4498
    }
  }

4499 4500
  int32_t num = 0;
  size_t  size = LIST_LENGTH(pPhyNode->pChildren);
H
Haojun Liao 已提交
4501

4502
  SOperatorInfo** ops = taosMemoryCalloc(size, POINTER_BYTES);
dengyihao's avatar
dengyihao 已提交
4503
  for (int32_t i = 0; i < size; ++i) {
4504
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pPhyNode->pChildren, i);
4505
    ops[i] = createOperatorTree(pChildNode, pTaskInfo, pHandle, queryId, taskId, pTableListInfo, pUser);
4506 4507 4508
    if (ops[i] == NULL) {
      return NULL;
    }
4509
  }
H
Haojun Liao 已提交
4510

4511
  SOperatorInfo* pOptr = NULL;
H
Haojun Liao 已提交
4512
  if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
4513
    pOptr = createProjectOperatorInfo(ops[0], (SProjectPhysiNode*)pPhyNode, pTaskInfo);
4514
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_AGG == type) {
H
Haojun Liao 已提交
4515 4516
    SAggPhysiNode* pAggNode = (SAggPhysiNode*)pPhyNode;
    SExprInfo*     pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
4517
    SSDataBlock*   pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4518

dengyihao's avatar
dengyihao 已提交
4519
    int32_t    numOfScalarExpr = 0;
4520 4521 4522 4523 4524
    SExprInfo* pScalarExprInfo = NULL;
    if (pAggNode->pExprs != NULL) {
      pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
    }

H
Haojun Liao 已提交
4525 4526
    if (pAggNode->pGroupKeys != NULL) {
      SArray* pColList = extractColumnInfo(pAggNode->pGroupKeys);
dengyihao's avatar
dengyihao 已提交
4527
      pOptr = createGroupOperatorInfo(ops[0], pExprInfo, num, pResBlock, pColList, pAggNode->node.pConditions,
wmmhello's avatar
wmmhello 已提交
4528
                                      pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4529
    } else {
L
Liu Jicong 已提交
4530 4531
      pOptr = createAggregateOperatorInfo(ops[0], pExprInfo, num, pResBlock, pAggNode->node.pConditions,
                                          pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4532
    }
X
Xiaoyu Wang 已提交
4533
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_INTERVAL == type || QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type) {
H
Haojun Liao 已提交
4534
    SIntervalPhysiNode* pIntervalPhyNode = (SIntervalPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4535

H
Haojun Liao 已提交
4536
    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
4537
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4538

dengyihao's avatar
dengyihao 已提交
4539 4540 4541 4542 4543 4544
    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
H
Haojun Liao 已提交
4545

X
Xiaoyu Wang 已提交
4546 4547 4548 4549 4550
    STimeWindowAggSupp as = {
        .waterMark = pIntervalPhyNode->window.watermark,
        .calTrigger = pIntervalPhyNode->window.triggerType,
        .maxTs = INT64_MIN,
    };
4551
    ASSERT(as.calTrigger != STREAM_TRIGGER_MAX_DELAY);
4552

4553
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4554
    bool    isStream = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type);
4555 4556
    pOptr = createIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, &as, pIntervalPhyNode,
                                       pTaskInfo, isStream);
4557

4558 4559
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == type) {
    SMergeAlignedIntervalPhysiNode* pIntervalPhyNode = (SMergeAlignedIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4560 4561 4562 4563 4564 4565 4566 4567 4568 4569

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4570

S
shenglian zhou 已提交
4571
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4572 4573
    pOptr = createMergeAlignedIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId,
                                                   pPhyNode->pConditions, pTaskInfo);
S
shenglian zhou 已提交
4574
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_INTERVAL == type) {
X
Xiaoyu Wang 已提交
4575
    SMergeIntervalPhysiNode* pIntervalPhyNode = (SMergeIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4576 4577 4578 4579 4580 4581 4582 4583 4584 4585

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4586

S
shenglian zhou 已提交
4587 4588
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    pOptr = createMergeIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
5
54liuyao 已提交
4589
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL == type) {
4590
    int32_t children = 0;
5
54liuyao 已提交
4591 4592
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL == type) {
4593
    int32_t children = 1;
5
54liuyao 已提交
4594
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4595
  } else if (QUERY_NODE_PHYSICAL_PLAN_SORT == type) {
4596
    pOptr = createSortOperatorInfo(ops[0], (SSortPhysiNode*)pPhyNode, pTaskInfo);
S
shenglian zhou 已提交
4597 4598
  } else if (QUERY_NODE_PHYSICAL_PLAN_GROUP_SORT == type) {
    pOptr = createGroupSortOperatorInfo(ops[0], (SGroupSortPhysiNode*)pPhyNode, pTaskInfo);
X
Xiaoyu Wang 已提交
4599
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE == type) {
4600
    SMergePhysiNode* pMergePhyNode = (SMergePhysiNode*)pPhyNode;
4601
    pOptr = createMultiwayMergeOperatorInfo(ops, size, pMergePhyNode, pTaskInfo);
4602
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_SESSION == type) {
H
Haojun Liao 已提交
4603 4604
    SSessionWinodwPhysiNode* pSessionNode = (SSessionWinodwPhysiNode*)pPhyNode;

X
Xiaoyu Wang 已提交
4605 4606
    STimeWindowAggSupp as = {.waterMark = pSessionNode->window.watermark,
                             .calTrigger = pSessionNode->window.triggerType};
4607

H
Haojun Liao 已提交
4608
    SExprInfo*   pExprInfo = createExprInfo(pSessionNode->window.pFuncs, NULL, &num);
4609
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4610 4611
    int32_t      tsSlotId = ((SColumnNode*)pSessionNode->window.pTspk)->slotId;

L
Liu Jicong 已提交
4612 4613
    pOptr = createSessionAggOperatorInfo(ops[0], pExprInfo, num, pResBlock, pSessionNode->gap, tsSlotId, &as,
                                         pPhyNode->pConditions, pTaskInfo);
4614
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == type) {
4615 4616 4617 4618 4619 4620 4621
    pOptr = createStreamSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_SESSION == type) {
    int32_t children = 0;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_SESSION == type) {
    int32_t children = 1;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4622
  } else if (QUERY_NODE_PHYSICAL_PLAN_PARTITION == type) {
4623
    pOptr = createPartitionOperatorInfo(ops[0], (SPartitionPhysiNode*)pPhyNode, pTaskInfo);
4624
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_STATE == type) {
dengyihao's avatar
dengyihao 已提交
4625
    SStateWinodwPhysiNode* pStateNode = (SStateWinodwPhysiNode*)pPhyNode;
4626

4627 4628
    STimeWindowAggSupp as = {.waterMark = pStateNode->window.watermark, .calTrigger = pStateNode->window.triggerType};

dengyihao's avatar
dengyihao 已提交
4629
    SExprInfo*   pExprInfo = createExprInfo(pStateNode->window.pFuncs, NULL, &num);
4630
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4631 4632
    int32_t      tsSlotId = ((SColumnNode*)pStateNode->window.pTspk)->slotId;

4633
    SColumnNode* pColNode = (SColumnNode*)((STargetNode*)pStateNode->pStateKey)->pExpr;
X
Xiaoyu Wang 已提交
4634
    SColumn      col = extractColumnFromColumnNode(pColNode);
L
Liu Jicong 已提交
4635 4636
    pOptr = createStatewindowOperatorInfo(ops[0], pExprInfo, num, pResBlock, &as, tsSlotId, &col, pPhyNode->pConditions,
                                          pTaskInfo);
4637
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == type) {
5
54liuyao 已提交
4638
    pOptr = createStreamStateAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4639
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_JOIN == type) {
4640
    pOptr = createMergeJoinOperatorInfo(ops, size, (SJoinPhysiNode*)pPhyNode, pTaskInfo);
4641
  } else if (QUERY_NODE_PHYSICAL_PLAN_FILL == type) {
H
Haojun Liao 已提交
4642
    pOptr = createFillOperatorInfo(ops[0], (SFillPhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4643 4644
  } else if (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC == type) {
    pOptr = createIndefinitOutputOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4645 4646
  } else if (QUERY_NODE_PHYSICAL_PLAN_INTERP_FUNC == type) {
    pOptr = createTimeSliceOperatorInfo(ops[0], pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4647 4648
  } else {
    ASSERT(0);
H
Haojun Liao 已提交
4649
  }
4650 4651 4652

  taosMemoryFree(ops);
  return pOptr;
4653
}
H
Haojun Liao 已提交
4654

H
Haojun Liao 已提交
4655
SArray* extractColumnInfo(SNodeList* pNodeList) {
L
Liu Jicong 已提交
4656
  size_t  numOfCols = LIST_LENGTH(pNodeList);
H
Haojun Liao 已提交
4657 4658 4659 4660 4661 4662
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

L
Liu Jicong 已提交
4663 4664
  for (int32_t i = 0; i < numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);
H
Haojun Liao 已提交
4665

4666 4667 4668
    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

4669
      SColumn c = extractColumnFromColumnNode(pColNode);
4670 4671
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
L
Liu Jicong 已提交
4672 4673
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};
4674
      c.slotId = pNode->slotId;
L
Liu Jicong 已提交
4675 4676 4677 4678
      c.colId = pNode->slotId;
      c.type = pValNode->node.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
4679 4680 4681 4682
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
H
Haojun Liao 已提交
4683 4684 4685 4686 4687
  }

  return pList;
}

L
Liu Jicong 已提交
4688 4689
STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
                                STableListInfo* pTableListInfo, const char* idstr) {
4690
  int32_t code = getTableList(pHandle->meta, pHandle->vnode, &pTableScanNode->scan, pTableListInfo);
wmmhello's avatar
wmmhello 已提交
4691 4692 4693 4694 4695 4696
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  if (taosArrayGetSize(pTableListInfo->pTableList) == 0) {
    code = 0;
H
Haojun Liao 已提交
4697
    qDebug("no table qualified for query, %s", idstr);
wmmhello's avatar
wmmhello 已提交
4698 4699 4700
    goto _error;
  }

4701
  SQueryTableDataCond cond = {0};
wmmhello's avatar
wmmhello 已提交
4702
  code = initQueryTableDataCond(&cond, pTableScanNode);
4703
  if (code != TSDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4704
    goto _error;
X
Xiaoyu Wang 已提交
4705
  }
4706

H
Hongze Cheng 已提交
4707
  STsdbReader* pReader;
H
Haojun Liao 已提交
4708
  code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, idstr);
H
Haojun Liao 已提交
4709 4710 4711 4712
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

4713
  cleanupQueryTableDataCond(&cond);
H
Haojun Liao 已提交
4714 4715

  return pReader;
wmmhello's avatar
wmmhello 已提交
4716 4717 4718 4719

_error:
  terrno = code;
  return NULL;
H
Haojun Liao 已提交
4720 4721
}

L
Liu Jicong 已提交
4722 4723 4724 4725 4726 4727 4728 4729 4730 4731 4732 4733 4734
static int32_t extractTbscanInStreamOpTree(SOperatorInfo* pOperator, STableScanInfo** ppInfo) {
  if (pOperator->operatorType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    if (pOperator->numOfDownstream > 1) {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }
    return extractTbscanInStreamOpTree(pOperator->pDownstream[0], ppInfo);
  } else {
4735 4736 4737
    SStreamScanInfo* pInfo = pOperator->info;
    ASSERT(pInfo->pTableScanOp->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN);
    *ppInfo = pInfo->pTableScanOp->info;
L
Liu Jicong 已提交
4738 4739 4740 4741
    return 0;
  }
}

4742 4743 4744 4745 4746 4747 4748 4749 4750 4751 4752 4753 4754 4755 4756 4757 4758 4759 4760 4761 4762 4763
int32_t extractTableScanNode(SPhysiNode* pNode, STableScanPhysiNode** ppNode) {
  if (pNode->pChildren == NULL || LIST_LENGTH(pNode->pChildren) == 0) {
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == pNode->type) {
      *ppNode = (STableScanPhysiNode*)pNode;
      return 0;
    } else {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }
  } else {
    if (LIST_LENGTH(pNode->pChildren) != 1) {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pNode->pChildren, 0);
    return extractTableScanNode(pChildNode, ppNode);
  }
  return -1;
}

L
Liu Jicong 已提交
4764 4765 4766 4767 4768
int32_t rebuildReader(SOperatorInfo* pOperator, SSubplan* plan, SReadHandle* pHandle, int64_t uid, int64_t ts) {
  STableScanInfo* pTableScanInfo = NULL;
  if (extractTbscanInStreamOpTree(pOperator, &pTableScanInfo) < 0) {
    return -1;
  }
4769

L
Liu Jicong 已提交
4770 4771 4772 4773
  STableScanPhysiNode* pNode = NULL;
  if (extractTableScanNode(plan->pNode, &pNode) < 0) {
    ASSERT(0);
  }
4774

H
Haojun Liao 已提交
4775
  tsdbReaderClose(pTableScanInfo->dataReader);
4776

L
Liu Jicong 已提交
4777
  STableListInfo info = {0};
H
Haojun Liao 已提交
4778
  pTableScanInfo->dataReader = doCreateDataReader(pNode, pHandle, &info, NULL);
L
Liu Jicong 已提交
4779 4780 4781 4782
  if (pTableScanInfo->dataReader == NULL) {
    ASSERT(0);
    qError("failed to create data reader");
    return TSDB_CODE_QRY_APP_ERROR;
4783
  }
L
Liu Jicong 已提交
4784
  // TODO: set uid and ts to data reader
4785 4786 4787
  return 0;
}

C
Cary Xu 已提交
4788
int32_t encodeOperator(SOperatorInfo* ops, char** result, int32_t* length, int32_t* nOptrWithVal) {
wmmhello's avatar
wmmhello 已提交
4789
  int32_t code = TDB_CODE_SUCCESS;
4790
  char*   pCurrent = NULL;
wmmhello's avatar
wmmhello 已提交
4791
  int32_t currLength = 0;
4792
  if (ops->fpSet.encodeResultRow) {
C
Cary Xu 已提交
4793
    if (result == NULL || length == NULL || nOptrWithVal == NULL) {
wmmhello's avatar
wmmhello 已提交
4794 4795 4796
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    code = ops->fpSet.encodeResultRow(ops, &pCurrent, &currLength);
wmmhello's avatar
wmmhello 已提交
4797

4798 4799
    if (code != TDB_CODE_SUCCESS) {
      if (*result != NULL) {
wmmhello's avatar
wmmhello 已提交
4800 4801 4802 4803
        taosMemoryFree(*result);
        *result = NULL;
      }
      return code;
C
Cary Xu 已提交
4804 4805 4806
    } else if (currLength == 0) {
      ASSERT(!pCurrent);
      goto _downstream;
wmmhello's avatar
wmmhello 已提交
4807
    }
wmmhello's avatar
wmmhello 已提交
4808

C
Cary Xu 已提交
4809 4810
    ++(*nOptrWithVal);

C
Cary Xu 已提交
4811
    ASSERT(currLength >= 0);
wmmhello's avatar
wmmhello 已提交
4812

4813
    if (*result == NULL) {
wmmhello's avatar
wmmhello 已提交
4814
      *result = (char*)taosMemoryCalloc(1, currLength + sizeof(int32_t));
wmmhello's avatar
wmmhello 已提交
4815 4816 4817 4818 4819 4820
      if (*result == NULL) {
        taosMemoryFree(pCurrent);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      memcpy(*result + sizeof(int32_t), pCurrent, currLength);
      *(int32_t*)(*result) = currLength + sizeof(int32_t);
4821
    } else {
wmmhello's avatar
wmmhello 已提交
4822
      int32_t sizePre = *(int32_t*)(*result);
4823
      char*   tmp = (char*)taosMemoryRealloc(*result, sizePre + currLength);
wmmhello's avatar
wmmhello 已提交
4824 4825 4826 4827 4828 4829 4830 4831 4832 4833 4834 4835
      if (tmp == NULL) {
        taosMemoryFree(pCurrent);
        taosMemoryFree(*result);
        *result = NULL;
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      *result = tmp;
      memcpy(*result + sizePre, pCurrent, currLength);
      *(int32_t*)(*result) += currLength;
    }
    taosMemoryFree(pCurrent);
    *length = *(int32_t*)(*result);
wmmhello's avatar
wmmhello 已提交
4836 4837
  }

C
Cary Xu 已提交
4838
_downstream:
wmmhello's avatar
wmmhello 已提交
4839
  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
C
Cary Xu 已提交
4840
    code = encodeOperator(ops->pDownstream[i], result, length, nOptrWithVal);
4841
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4842
      return code;
wmmhello's avatar
wmmhello 已提交
4843 4844
    }
  }
wmmhello's avatar
wmmhello 已提交
4845
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
4846 4847
}

H
Haojun Liao 已提交
4848
int32_t decodeOperator(SOperatorInfo* ops, const char* result, int32_t length) {
wmmhello's avatar
wmmhello 已提交
4849
  int32_t code = TDB_CODE_SUCCESS;
4850 4851
  if (ops->fpSet.decodeResultRow) {
    if (result == NULL) {
wmmhello's avatar
wmmhello 已提交
4852 4853
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
H
Haojun Liao 已提交
4854

4855
    ASSERT(length == *(int32_t*)result);
H
Haojun Liao 已提交
4856 4857

    const char* data = result + sizeof(int32_t);
L
Liu Jicong 已提交
4858
    code = ops->fpSet.decodeResultRow(ops, (char*)data);
4859
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4860 4861
      return code;
    }
wmmhello's avatar
wmmhello 已提交
4862

wmmhello's avatar
wmmhello 已提交
4863
    int32_t totalLength = *(int32_t*)result;
4864 4865
    int32_t dataLength = *(int32_t*)data;

4866
    if (totalLength == dataLength + sizeof(int32_t)) {  // the last data
wmmhello's avatar
wmmhello 已提交
4867 4868
      result = NULL;
      length = 0;
4869
    } else {
wmmhello's avatar
wmmhello 已提交
4870 4871 4872 4873
      result += dataLength;
      *(int32_t*)(result) = totalLength - dataLength;
      length = totalLength - dataLength;
    }
wmmhello's avatar
wmmhello 已提交
4874 4875
  }

wmmhello's avatar
wmmhello 已提交
4876 4877
  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    code = decodeOperator(ops->pDownstream[i], result, length);
4878
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4879
      return code;
wmmhello's avatar
wmmhello 已提交
4880 4881
    }
  }
wmmhello's avatar
wmmhello 已提交
4882
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
4883 4884
}

D
dapan1121 已提交
4885
int32_t createDataSinkParam(SDataSinkNode* pNode, void** pParam, qTaskInfo_t* pTaskInfo, SReadHandle* readHandle) {
D
dapan1121 已提交
4886
  SExecTaskInfo* pTask = *(SExecTaskInfo**)pTaskInfo;
4887

D
dapan1121 已提交
4888
  switch (pNode->type) {
D
dapan1121 已提交
4889 4890 4891 4892 4893 4894
    case QUERY_NODE_PHYSICAL_PLAN_QUERY_INSERT: {
      SInserterParam* pInserterParam = taosMemoryCalloc(1, sizeof(SInserterParam));
      if (NULL == pInserterParam) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      pInserterParam->readHandle = readHandle;
L
Liu Jicong 已提交
4895

D
dapan1121 已提交
4896 4897 4898
      *pParam = pInserterParam;
      break;
    }
D
dapan1121 已提交
4899
    case QUERY_NODE_PHYSICAL_PLAN_DELETE: {
4900
      SDeleterParam* pDeleterParam = taosMemoryCalloc(1, sizeof(SDeleterParam));
D
dapan1121 已提交
4901 4902 4903 4904
      if (NULL == pDeleterParam) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      int32_t tbNum = taosArrayGetSize(pTask->tableqinfoList.pTableList);
D
dapan1121 已提交
4905
      pDeleterParam->suid = pTask->tableqinfoList.suid;
D
dapan1121 已提交
4906 4907 4908 4909 4910 4911
      pDeleterParam->pUidList = taosArrayInit(tbNum, sizeof(uint64_t));
      if (NULL == pDeleterParam->pUidList) {
        taosMemoryFree(pDeleterParam);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      for (int32_t i = 0; i < tbNum; ++i) {
4912
        STableKeyInfo* pTable = taosArrayGet(pTask->tableqinfoList.pTableList, i);
D
dapan1121 已提交
4913 4914 4915 4916 4917 4918 4919 4920 4921 4922 4923 4924 4925
        taosArrayPush(pDeleterParam->pUidList, &pTable->uid);
      }

      *pParam = pDeleterParam;
      break;
    }
    default:
      break;
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
4926
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
4927
                               const char* sql, EOPTR_EXEC_MODEL model) {
H
Haojun Liao 已提交
4928 4929
  uint64_t queryId = pPlan->id.queryId;

H
Haojun Liao 已提交
4930
  int32_t code = TSDB_CODE_SUCCESS;
D
dapan1121 已提交
4931
  *pTaskInfo = createExecTaskInfo(queryId, taskId, model, pPlan->dbFName);
H
Haojun Liao 已提交
4932 4933 4934 4935
  if (*pTaskInfo == NULL) {
    code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    goto _complete;
  }
H
Haojun Liao 已提交
4936

4937
  (*pTaskInfo)->sql = sql;
wmmhello's avatar
wmmhello 已提交
4938 4939
  (*pTaskInfo)->tableqinfoList.pTagCond = pPlan->pTagCond;
  (*pTaskInfo)->tableqinfoList.pTagIndexCond = pPlan->pTagIndexCond;
4940 4941
  (*pTaskInfo)->pRoot = createOperatorTree(pPlan->pNode, *pTaskInfo, pHandle, queryId, taskId,
                                           &(*pTaskInfo)->tableqinfoList, pPlan->user);
L
Liu Jicong 已提交
4942

D
dapan1121 已提交
4943
  if (NULL == (*pTaskInfo)->pRoot) {
4944
    code = (*pTaskInfo)->code;
D
dapan1121 已提交
4945
    goto _complete;
4946 4947
  }

H
Haojun Liao 已提交
4948 4949
  return code;

H
Haojun Liao 已提交
4950
_complete:
wafwerar's avatar
wafwerar 已提交
4951
  taosMemoryFreeClear(*pTaskInfo);
H
Haojun Liao 已提交
4952 4953
  terrno = code;
  return code;
H
Haojun Liao 已提交
4954 4955
}

wmmhello's avatar
wmmhello 已提交
4956 4957 4958
static void doDestroyTableList(STableListInfo* pTableqinfoList) {
  taosArrayDestroy(pTableqinfoList->pTableList);
  taosHashCleanup(pTableqinfoList->map);
4959 4960
  if (pTableqinfoList->needSortTableByGroupId) {
    for (int32_t i = 0; i < taosArrayGetSize(pTableqinfoList->pGroupList); i++) {
wmmhello's avatar
wmmhello 已提交
4961
      SArray* tmp = taosArrayGetP(pTableqinfoList->pGroupList, i);
4962 4963 4964
      if (tmp == pTableqinfoList->pTableList) {
        continue;
      }
wmmhello's avatar
wmmhello 已提交
4965 4966 4967 4968
      taosArrayDestroy(tmp);
    }
  }
  taosArrayDestroy(pTableqinfoList->pGroupList);
4969

wmmhello's avatar
wmmhello 已提交
4970 4971
  pTableqinfoList->pTableList = NULL;
  pTableqinfoList->map = NULL;
4972 4973
}

L
Liu Jicong 已提交
4974
void doDestroyTask(SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
4975 4976
  qDebug("%s execTask is freed", GET_TASKID(pTaskInfo));

wmmhello's avatar
wmmhello 已提交
4977
  doDestroyTableList(&pTaskInfo->tableqinfoList);
H
Haojun Liao 已提交
4978
  destroyOperatorInfo(pTaskInfo->pRoot);
4979
  cleanupTableSchemaInfo(pTaskInfo);
4980

wafwerar's avatar
wafwerar 已提交
4981 4982 4983
  taosMemoryFreeClear(pTaskInfo->sql);
  taosMemoryFreeClear(pTaskInfo->id.str);
  taosMemoryFreeClear(pTaskInfo);
4984 4985 4986 4987 4988 4989 4990 4991 4992 4993 4994 4995
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes) {
  if (val == NULL) {
    setNull(output, type, bytes);
    return;
  }

  if (IS_VAR_DATA_TYPE(type)) {
    // Binary data overflows for sort of unknown reasons. Let trim the overflow data
    if (varDataTLen(val) > bytes) {
      int32_t maxLen = bytes - VARSTR_HEADER_SIZE;
L
Liu Jicong 已提交
4996
      int32_t len = (varDataLen(val) > maxLen) ? maxLen : varDataLen(val);
4997 4998 4999 5000 5001 5002 5003 5004 5005 5006 5007 5008
      memcpy(varDataVal(output), varDataVal(val), len);
      varDataSetLen(output, len);
    } else {
      varDataCopy(output, val);
    }
  } else {
    memcpy(output, val, bytes);
  }
}

static int64_t getQuerySupportBufSize(size_t numOfTables) {
  size_t s1 = sizeof(STableQueryInfo);
L
Liu Jicong 已提交
5009 5010
  //  size_t s3 = sizeof(STableCheckInfo);  buffer consumption in tsdb
  return (int64_t)(s1 * 1.5 * numOfTables);
5011 5012 5013 5014 5015 5016 5017
}

int32_t checkForQueryBuf(size_t numOfTables) {
  int64_t t = getQuerySupportBufSize(numOfTables);
  if (tsQueryBufferSizeBytes < 0) {
    return TSDB_CODE_SUCCESS;
  } else if (tsQueryBufferSizeBytes > 0) {
L
Liu Jicong 已提交
5018
    while (1) {
5019 5020 5021 5022 5023 5024 5025 5026 5027 5028 5029 5030 5031 5032 5033 5034 5035 5036 5037 5038 5039 5040 5041 5042 5043 5044
      int64_t s = tsQueryBufferSizeBytes;
      int64_t remain = s - t;
      if (remain >= 0) {
        if (atomic_val_compare_exchange_64(&tsQueryBufferSizeBytes, s, remain) == s) {
          return TSDB_CODE_SUCCESS;
        }
      } else {
        return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
      }
    }
  }

  // disable query processing if the value of tsQueryBufferSize is zero.
  return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
}

void releaseQueryBuf(size_t numOfTables) {
  if (tsQueryBufferSizeBytes < 0) {
    return;
  }

  int64_t t = getQuerySupportBufSize(numOfTables);

  // restore value is not enough buffer available
  atomic_add_fetch_64(&tsQueryBufferSizeBytes, t);
}
D
dapan1121 已提交
5045

dengyihao's avatar
dengyihao 已提交
5046 5047
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SExplainExecInfo** pRes, int32_t* capacity,
                                   int32_t* resNum) {
D
dapan1121 已提交
5048 5049
  if (*resNum >= *capacity) {
    *capacity += 10;
dengyihao's avatar
dengyihao 已提交
5050

D
dapan1121 已提交
5051 5052
    *pRes = taosMemoryRealloc(*pRes, (*capacity) * sizeof(SExplainExecInfo));
    if (NULL == *pRes) {
D
dapan1121 已提交
5053
      qError("malloc %d failed", (*capacity) * (int32_t)sizeof(SExplainExecInfo));
D
dapan1121 已提交
5054 5055 5056 5057
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }
  }

5058 5059 5060 5061 5062
  SExplainExecInfo* pInfo = &(*pRes)[*resNum];

  pInfo->numOfRows = operatorInfo->resultInfo.totalRows;
  pInfo->startupCost = operatorInfo->cost.openCost;
  pInfo->totalCost = operatorInfo->cost.totalCost;
D
dapan1121 已提交
5063

5064
  if (operatorInfo->fpSet.getExplainFn) {
5065
    int32_t code = operatorInfo->fpSet.getExplainFn(operatorInfo, &pInfo->verboseInfo, &pInfo->verboseLen);
D
dapan1121 已提交
5066
    if (code) {
5067
      qError("%s operator getExplainFn failed, code:%s", GET_TASKID(operatorInfo->pTaskInfo), tstrerror(code));
D
dapan1121 已提交
5068 5069
      return code;
    }
5070 5071 5072
  } else {
    pInfo->verboseLen = 0;
    pInfo->verboseInfo = NULL;
D
dapan1121 已提交
5073
  }
dengyihao's avatar
dengyihao 已提交
5074

D
dapan1121 已提交
5075
  ++(*resNum);
dengyihao's avatar
dengyihao 已提交
5076

D
dapan1121 已提交
5077
  int32_t code = 0;
D
dapan1121 已提交
5078 5079
  for (int32_t i = 0; i < operatorInfo->numOfDownstream; ++i) {
    code = getOperatorExplainExecInfo(operatorInfo->pDownstream[i], pRes, capacity, resNum);
D
dapan1121 已提交
5080 5081 5082 5083 5084 5085 5086
    if (code) {
      taosMemoryFreeClear(*pRes);
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
D
dapan1121 已提交
5087
}
5
54liuyao 已提交
5088

L
Liu Jicong 已提交
5089
int32_t initStreamAggSupporter(SStreamAggSupporter* pSup, const char* pKey, SqlFunctionCtx* pCtx, int32_t numOfOutput,
5090
                               int32_t size) {
5091
  pSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
5
54liuyao 已提交
5092 5093
  pSup->keySize = sizeof(int64_t) + sizeof(TSKEY);
  pSup->pKeyBuf = taosMemoryCalloc(1, pSup->keySize);
5094 5095
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pSup->pResultRows = taosHashInit(1024, hashFn, false, HASH_NO_LOCK);
5
54liuyao 已提交
5096 5097 5098
  if (pSup->pKeyBuf == NULL || pSup->pResultRows == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
5099
  pSup->valueSize = size;
5
54liuyao 已提交
5100

5
54liuyao 已提交
5101 5102
  pSup->pScanWindow = taosArrayInit(4, sizeof(STimeWindow));

5
54liuyao 已提交
5103 5104 5105 5106 5107 5108 5109 5110 5111
  int32_t pageSize = 4096;
  while (pageSize < pSup->resultRowSize * 4) {
    pageSize <<= 1u;
  }
  // at least four pages need to be in buffer
  int32_t bufSize = 4096 * 256;
  if (bufSize <= pageSize) {
    bufSize = pageSize * 4;
  }
5112
  int32_t code = createDiskbasedBuf(&pSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
L
Liu Jicong 已提交
5113
  for (int32_t i = 0; i < numOfOutput; ++i) {
5114 5115 5116
    pCtx[i].pBuf = pSup->pResultBuf;
  }
  return code;
5
54liuyao 已提交
5117
}