executorimpl.c 180.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

16
#include <executorimpl.h>
H
Haojun Liao 已提交
17 18
#include "filter.h"
#include "function.h"
19 20
#include "functionMgt.h"
#include "os.h"
H
Haojun Liao 已提交
21
#include "querynodes.h"
22
#include "tfill.h"
dengyihao's avatar
dengyihao 已提交
23
#include "tname.h"
X
Xiaoyu Wang 已提交
24
#include "tref.h"
25

H
Haojun Liao 已提交
26
#include "tdatablock.h"
27
#include "tglobal.h"
H
Haojun Liao 已提交
28
#include "tmsg.h"
H
Haojun Liao 已提交
29
#include "tsort.h"
30
#include "ttime.h"
H
Haojun Liao 已提交
31

32
#include "executorimpl.h"
dengyihao's avatar
dengyihao 已提交
33
#include "index.h"
34
#include "query.h"
35 36
#include "tcompare.h"
#include "tcompression.h"
H
Haojun Liao 已提交
37
#include "thash.h"
38
#include "ttypes.h"
dengyihao's avatar
dengyihao 已提交
39
#include "vnode.h"
40

H
Haojun Liao 已提交
41
// evaluates to true when the runtime's scanFlag equals MAIN_SCAN
#define IS_MAIN_SCAN(runtime)          ((runtime)->scanFlag == MAIN_SCAN)
// assigns REVERSE_SCAN to the runtime's scanFlag
#define SET_REVERSE_SCAN_FLAG(runtime) ((runtime)->scanFlag = REVERSE_SCAN)

// maps a scan order to its step constant: QUERY_ASC_FORWARD_STEP for TSDB_ORDER_ASC, QUERY_DESC_FORWARD_STEP otherwise
#define GET_FORWARD_DIRECTION_FACTOR(ord) (((ord) == TSDB_ORDER_ASC) ? QUERY_ASC_FORWARD_STEP : QUERY_DESC_FORWARD_STEP)

#if 0
// Disabled allocation wrappers that fail at random. When enabled, the macros at the
// bottom redirect malloc/calloc/realloc to them.

// returns NULL when taosRand() is a multiple of 1000, otherwise forwards to taosMemoryMalloc
static UNUSED_FUNC void* u_malloc(size_t __size) {
  uint32_t r = taosRand();
  return (r % 1000 <= 0) ? NULL : taosMemoryMalloc(__size);
}

// returns NULL when taosRand() is a multiple of 1000, otherwise forwards to taosMemoryCalloc
static UNUSED_FUNC void* u_calloc(size_t num, size_t __size) {
  uint32_t r = taosRand();
  return (r % 1000 <= 0) ? NULL : taosMemoryCalloc(num, __size);
}

// returns NULL when taosRand() % 5 is 0 or 1, otherwise forwards to taosMemoryRealloc
static UNUSED_FUNC void* u_realloc(void* p, size_t __size) {
  uint32_t r = taosRand();
  return (r % 5 <= 1) ? NULL : taosMemoryRealloc(p, __size);
}

#define calloc  u_calloc
#define malloc  u_malloc
#define realloc u_realloc
#endif

X
Xiaoyu Wang 已提交
80
// clears the bits given by st in the status field of q
#define CLEAR_QUERY_STATUS(q, st)   ((q)->status &= (~(st)))
// true when the query's interval.interval field is positive
#define QUERY_IS_INTERVAL_QUERY(_q) ((_q)->interval.interval > 0)

L
Liu Jicong 已提交
83 84 85
// Returns twice the value of tsShellActivityTimer.
int32_t getMaximumIdleDurationSec() {
  const int32_t idleDuration = tsShellActivityTimer * 2;
  return idleDuration;
}

// Asserts that the expression is a non-NULL unary expression node; always returns 0.
static int32_t getExprFunctionId(SExprInfo* pExprInfo) {
  // a single combined assertion so that a failure reports the complete precondition
  assert(pExprInfo != NULL && pExprInfo->pExpr != NULL && pExprInfo->pExpr->nodeType == TEXPR_UNARYEXPR_NODE);

  return 0;
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes);

92
static void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExpr, SSDataBlock* pSDataBlock);
93

X
Xiaoyu Wang 已提交
94
static void releaseQueryBuf(size_t numOfTables);
95 96 97 98 99

static void destroySFillOperatorInfo(void* param, int32_t numOfOutput);
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput);
static void destroyOrderOperatorInfo(void* param, int32_t numOfOutput);
static void destroyAggOperatorInfo(void* param, int32_t numOfOutput);
X
Xiaoyu Wang 已提交
100

H
Haojun Liao 已提交
101
static void destroyIntervalOperatorInfo(void* param, int32_t numOfOutput);
H
Haojun Liao 已提交
102 103
static void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput);

104 105
static void destroyOperatorInfo(SOperatorInfo* pOperator);

106
/**
 * Mark the operator as finished (OP_EXEC_DONE).
 *
 * When the operator is attached to a task, the total cost is computed from the
 * task's start time and the task status is set to TASK_COMPLETED. When there is
 * no task (pTaskInfo == NULL) only the operator status is updated; the task
 * pointer is no longer dereferenced before it has been checked.
 */
void doSetOperatorCompleted(SOperatorInfo* pOperator) {
  pOperator->status = OP_EXEC_DONE;

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pTaskInfo == NULL) {
    return;
  }

  // cost.start is multiplied by 1000 to be compared with the microsecond timestamp
  pOperator->cost.totalCost = (taosGetTimestampUs() - pTaskInfo->cost.start * 1000) / 1000.0;
  setTaskStatus(pTaskInfo, TASK_COMPLETED);
}
114

H
Haojun Liao 已提交
115
// No-op open callback: flags the operator as opened, records a zero open cost and reports success.
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator) {
  OPTR_SET_OPENED(pOperator);

  // nothing is done on open, so there is no cost to account for
  pOperator->cost.openCost = 0;

  return TSDB_CODE_SUCCESS;
}

121
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
L
Liu Jicong 已提交
122
                                   __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
123
                                   __optr_decode_fn_t decode, __optr_explain_fn_t explain) {
124 125 126 127 128 129 130 131 132 133 134 135 136 137
  SOperatorFpSet fpSet = {
      ._openFn = openFn,
      .getNextFn = nextFn,
      .getStreamResFn = streamFn,
      .cleanupFn = cleanup,
      .closeFn = closeFn,
      .encodeResultRow = encode,
      .decodeResultRow = decode,
      .getExplainFn = explain,
  };

  return fpSet;
}

H
Haojun Liao 已提交
138
// No-op close callback: both arguments are ignored.
void operatorDummyCloseFn(void* param, int32_t numOfCols) {
}
H
Haojun Liao 已提交
139

X
Xiaoyu Wang 已提交
140 141 142
static int32_t doCopyToSDataBlock(SExecTaskInfo* taskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo,
                                  SDiskbasedBuf* pBuf, SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset,
                                  SqlFunctionCtx* pCtx, int32_t numOfExprs);
H
Haojun Liao 已提交
143

144
static void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size);
L
Liu Jicong 已提交
145 146
static void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                                     uint64_t groupId);
147

L
Liu Jicong 已提交
148 149
// setup the output buffer for each operator
// Tells whether the column may hold NULL values.
// Tag columns, user-defined columns and the primary timestamp column are reported as NULL-free;
// so is any other column whose statistics are available and record zero NULLs.
static bool hasNull(SColumn* pColumn, SColumnDataAgg* pStatis) {
  const bool nullFreeKind = TSDB_COL_IS_TAG(pColumn->flag) || TSDB_COL_IS_UD_COL(pColumn->flag) ||
                            pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID;
  if (nullFreeKind) {
    return false;
  }

  // without statistics nothing can be ruled out
  return (pStatis == NULL) || (pStatis->numOfNull != 0);
}

162
#if 0
// Disabled: checks whether a result row already exists for the given key.
static bool chkResultRowFromKey(STaskRuntimeEnv* pRuntimeEnv, SResultRowInfo* pResultRowInfo, char* pData,
                                int16_t bytes, bool masterscan, uint64_t uid) {
  SET_RES_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid);

  SResultRow** p1 =
      (SResultRow**)taosHashGet(pRuntimeEnv->pResultRowHashTable, pRuntimeEnv->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));

  // non-interval query, or repeat/reverse scan of an interval query: presence in the hash table decides
  // (p1 may be NULL in case of sliding+offset exists)
  if (!QUERY_IS_INTERVAL_QUERY(pRuntimeEnv->pQueryAttr) || !masterscan) {
    return p1 != NULL;
  }

  bool found = false;

  // with zero or one row in pResultRowInfo the answer stays false; otherwise look the
  // extended key up in the result row list set
  if (p1 != NULL && pResultRowInfo->size != 0 && pResultRowInfo->size != 1) {
    SET_RES_EXT_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid, pResultRowInfo);
    int64_t* index =
        taosHashGet(pRuntimeEnv->pResultRowListSet, pRuntimeEnv->keyBuf, GET_RES_EXT_WINDOW_KEY_LEN(bytes));
    found = (index != NULL);
  }

  return found;
}
#endif
200

201
/**
 * Reserve space for one result row in the paged result buffer of a table group.
 *
 * The row is placed in the last page registered for tableGroupId. A fresh page
 * is requested when the group has no page yet, or when the last page cannot
 * hold interBufSize more bytes.
 *
 * @param pResultBuf    paged buffer that owns the pages
 * @param tableGroupId  group whose page list is used
 * @param interBufSize  number of bytes reserved for the row
 * @return the reserved row with pageId/offset filled in, or NULL when no page
 *         could be obtained (every page pointer is checked before use)
 */
SResultRow* getNewResultRow(SDiskbasedBuf* pResultBuf, int64_t tableGroupId, int32_t interBufSize) {
  SFilePage* pData = NULL;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tableGroupId);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
    if (pData != NULL) {
      pData->num = sizeof(SFilePage);
    }
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    if (pData == NULL) {
      return NULL;
    }

    pageId = getPageId(pi);

    if (pData->num + interBufSize > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return NULL;
  }

  setBufPageDirty(pData, true);

  // the row starts at the current end of the used area of the page
  SResultRow* pResultRow = (SResultRow*)((char*)pData + pData->num);
  pResultRow->pageId = pageId;
  pResultRow->offset = (int32_t)pData->num;

  pData->num += interBufSize;

  return pResultRow;
}

243 244 245 246 247 248 249
/**
 * the struct of key in hash table
 * +----------+---------------+
 * | group id |   key data    |
 * | 8 bytes  | actual length |
 * +----------+---------------+
 */
250 251 252
/**
 * Look up, or create, the result row that belongs to (groupId, pData) and make
 * it the current row of pResultRowInfo.
 *
 * An existing row is reused when the key is found in pSup->pResultRowHashTable;
 * for interval queries this only happens during the master scan. Otherwise a new
 * row is reserved, initialised and registered in the hash table.
 *
 * Does not return on failure: it longjmp()s to pTaskInfo->env with
 * TSDB_CODE_OUT_OF_MEMORY when no buffer space can be obtained for a new row, and
 * with TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW when the hash table grows beyond
 * MAX_INTERVAL_TIME_WINDOW entries.
 *
 * @return the result row for the key (never NULL)
 */
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo, char* pData,
                                   int16_t bytes, bool masterscan, uint64_t groupId, SExecTaskInfo* pTaskInfo,
                                   bool isIntervalQuery, SAggSupporter* pSup) {
  SET_RES_WINDOW_KEY(pSup->keyBuf, pData, bytes, groupId);

  SResultRowPosition* p1 =
      (SResultRowPosition*)taosHashGet(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));

  SResultRow* pResult = NULL;

  // Interval query: an existing row is only picked up in the master scan (p1 may be NULL in case of
  // sliding+offset). Group-by column query: an existing row is always picked up.
  if (p1 != NULL && (!isIntervalQuery || masterscan)) {
    pResult = getResultRowByPos(pResultBuf, p1);
    ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
  }

  // 1. close current opened time window
  if (pResultRowInfo->cur.pageId != -1 && ((pResult == NULL) || (pResult->pageId != pResultRowInfo->cur.pageId))) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_1");
#endif
    SResultRowPosition pos = pResultRowInfo->cur;
    SFilePage*         pPage = getBufPage(pResultBuf, pos.pageId);
    releaseBufPage(pResultBuf, pPage);
  }

  // allocate a new buffer page
  if (pResult == NULL) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_2");
#endif
    ASSERT(pSup->resultRowSize > 0);
    pResult = getNewResultRow(pResultBuf, groupId, pSup->resultRowSize);
    if (pResult == NULL) {
      // getNewResultRow() yields NULL when no buffer page is available; abort the task
      // instead of initialising and dereferencing a NULL row
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    initResultRow(pResult);

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = pResult->pageId, .offset = pResult->offset};
    taosHashPut(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes), &pos,
                sizeof(SResultRowPosition));
  }

  // 2. set the new time window to be the new active time window
  pResultRowInfo->cur = (SResultRowPosition){.pageId = pResult->pageId, .offset = pResult->offset};

  // too many time window in query
  if (taosHashGetSize(pSup->pResultRowHashTable) > MAX_INTERVAL_TIME_WINDOW) {
    longjmp(pTaskInfo->env, TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW);
  }

  return pResult;
}

313
// a new buffer page for each table. Needs to opt this design
L
Liu Jicong 已提交
314
/**
 * Assign buffer space to a window result row that has none yet.
 *
 * Nothing is done when pWindowRes already has a page (pageId != -1). Otherwise
 * size bytes are reserved in the last page registered for tid, or in a fresh
 * page when there is none or the last one is too full.
 *
 * @return 0 on success (or when nothing had to be done), -1 when no page could
 *         be obtained (every page pointer is checked before use)
 */
static int32_t addNewWindowResultBuf(SResultRow* pWindowRes, SDiskbasedBuf* pResultBuf, int32_t tid, uint32_t size) {
  if (pWindowRes->pageId != -1) {
    return 0;
  }

  SFilePage* pData = NULL;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tid);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tid, &pageId);
    if (pData != NULL) {
      pData->num = sizeof(SFilePage);
    }
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    if (pData == NULL) {
      return -1;
    }

    pageId = getPageId(pi);

    if (pData->num + size > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tid, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return -1;
  }

  // pWindowRes->pageId is known to be -1 here (see the early return above), so the
  // row is always placed at the current end of the used area of the page
  pWindowRes->pageId = pageId;
  pWindowRes->offset = (int32_t)pData->num;

  pData->num += size;
  assert(pWindowRes->pageId >= 0);

  return 0;
}

360
//  query_range_start, query_range_end, window_duration, window_start, window_end
361
// Fills pColData with five timestamp rows, in this order:
// query start, query end, window duration (written as 0), window start, window end.
// Both the query range and the window range are taken from pQueryWindow.
void initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow) {
  pColData->info.type = TSDB_DATA_TYPE_TIMESTAMP;
  pColData->info.bytes = sizeof(int64_t);

  int64_t interval = 0;  // this value may be variable in case of 'n' and 'y'.

  int64_t* rowValues[] = {
      &pQueryWindow->skey, &pQueryWindow->ekey, &interval, &pQueryWindow->skey, &pQueryWindow->ekey,
  };
  const int32_t numOfRows = (int32_t)(sizeof(rowValues) / sizeof(rowValues[0]));

  colInfoDataEnsureCapacity(pColData, numOfRows);
  for (int32_t row = 0; row < numOfRows; ++row) {
    colDataAppendInt64(pColData, row, rowValues[row]);
  }
}

X
Xiaoyu Wang 已提交
375 376 377
// Runs every function context in pCtx[0..numOfOutput) over the row range
// [offset, offset + forwardStep) of its input.
//
// Window pseudo-column functions are evaluated through their scalar callback with
// pTimeWindowData as the only argument. All other functions go through fpSet.process
// when they need to execute. A failing function is logged, stored in taskInfo->code and
// raised with longjmp(taskInfo->env, code).
void doApplyFunctions(SExecTaskInfo* taskInfo, SqlFunctionCtx* pCtx, STimeWindow* pWin,
                      SColumnInfoData* pTimeWindowData, int32_t offset, int32_t forwardStep, TSKEY* tsCol,
                      int32_t numOfTotal, int32_t numOfOutput, int32_t order) {
  for (int32_t k = 0; k < numOfOutput; ++k) {
    SqlFunctionCtx*       pfCtx = &pCtx[k];
    SInputColumnInfoData* pInput = &pfCtx->input;

    // remember the input state so that it can be put back afterwards
    const bool    savedAggIsSet = pInput->colDataAggIsSet;
    const int32_t savedNumOfRows = pInput->numOfRows;
    const int32_t savedStartRow = pInput->startRowIndex;

    pInput->startRowIndex = offset;
    pInput->numOfRows = forwardStep;

    // not a whole block involved in query processing, statistics data can not be used
    if (pInput->colDataAggIsSet && forwardStep < numOfTotal) {
      pInput->colDataAggIsSet = false;
    }

    if (fmIsWindowPseudoColumnFunc(pfCtx->functionId)) {
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(pfCtx);

      // the scalar result is written straight into the row cell buffer of the entry
      SColumnInfoData cell = {0};
      cell.info.type = TSDB_DATA_TYPE_BIGINT;
      cell.info.bytes = tDataTypes[TSDB_DATA_TYPE_BIGINT].bytes;
      cell.pData = GET_ROWCELL_INTERBUF(pEntryInfo);

      SScalarParam result = {.columnData = &cell};
      SScalarParam window = {.numOfRows = 5, .columnData = pTimeWindowData};
      pfCtx->sfp.process(&window, 1, &result);

      pEntryInfo->numOfRes = 1;

      // NOTE(review): the saved input state is not restored on this path — confirm this is intended
      continue;
    }

    if (functionNeedToExecute(pfCtx) && pfCtx->fpSet.process != NULL) {
      int32_t code = pfCtx->fpSet.process(pfCtx);
      if (code != TSDB_CODE_SUCCESS) {
        qError("%s apply functions error, code: %s", GET_TASKID(taskInfo), tstrerror(code));
        taskInfo->code = code;
        longjmp(taskInfo->env, code);
      }
    }

    // restore it
    pInput->colDataAggIsSet = savedAggIsSet;
    pInput->startRowIndex = savedStartRow;
    pInput->numOfRows = savedNumOfRows;
  }
}

dengyihao's avatar
dengyihao 已提交
428
// forward declaration; the definition follows further down in this file
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                                   int32_t scanFlag, bool createDummyCol);
430

dengyihao's avatar
dengyihao 已提交
431 432
// For each expression of the operator: records the scan order and the block's row count in the
// matching function context, then lets setBlockStatisInfo() attach the block statistics.
static void doSetInputDataBlockInfo(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock,
                                    int32_t order) {
  const int32_t numOfExprs = pOperator->exprSupp.numOfExprs;
  SExprInfo*    pExprs = pOperator->exprSupp.pExprInfo;

  for (int32_t idx = 0; idx < numOfExprs; ++idx) {
    SqlFunctionCtx* pOneCtx = &pCtx[idx];

    pOneCtx->order = order;
    pOneCtx->input.numOfRows = pBlock->info.rows;
    setBlockStatisInfo(pOneCtx, &pExprs[idx], pBlock);
  }
}

X
Xiaoyu Wang 已提交
440 441
// Binds pBlock as the input of the operator's function contexts.
// A block that carries pre-computed aggregates (pBlockAgg) only gets its statistics attached;
// any other block has its column data wired in.
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                       int32_t scanFlag, bool createDummyCol) {
  if (pBlock->pBlockAgg == NULL) {
    doSetInputDataBlock(pOperator, pCtx, pBlock, order, scanFlag, createDummyCol);
    return;
  }

  doSetInputDataBlockInfo(pOperator, pCtx, pBlock, order);
}

L
Liu Jicong 已提交
449 450
/**
 * Materialise a constant function parameter as a column of numOfRows identical values.
 *
 * The column object in pInput->pData[paramIndex] is created on first use (type and
 * byte width are taken from the parameter) and reused afterwards. Values are written
 * for BIGINT/UBIGINT, DOUBLE and VARCHAR parameters; other types leave the rows
 * untouched.
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the column object or the
 *         temporary VARCHAR buffer cannot be allocated
 */
static int32_t doCreateConstantValColumnInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t paramIndex,
                                             int32_t numOfRows) {
  SColumnInfoData* pColInfo = NULL;
  if (pInput->pData[paramIndex] == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
    pColInfo->info.type = pFuncParam->param.nType;
    pColInfo->info.bytes = pFuncParam->param.nLen;

    pInput->pData[paramIndex] = pColInfo;
  } else {
    pColInfo = pInput->pData[paramIndex];
  }

  colInfoDataEnsureCapacity(pColInfo, numOfRows);

  int8_t type = pFuncParam->param.nType;
  if (type == TSDB_DATA_TYPE_BIGINT || type == TSDB_DATA_TYPE_UBIGINT) {
    int64_t v = pFuncParam->param.i;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendInt64(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendDouble(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_VARCHAR) {
    // scratch buffer holding the value in var-string layout (length header + payload)
    char* tmp = taosMemoryMalloc(pFuncParam->param.nLen + VARSTR_HEADER_SIZE);
    if (tmp == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    STR_WITH_SIZE_TO_VARSTR(tmp, pFuncParam->param.pz, pFuncParam->param.nLen);
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppend(pColInfo, i, tmp, false);
    }

    // colDataAppend() copies variable-length values into the column's own buffer,
    // so the scratch buffer must be released here to avoid leaking it on every call
    taosMemoryFree(tmp);
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
491
// Wires the columns of pBlock into the input of every function context of the operator.
//
// Column parameters are bound to the block column in their slot; for timeline functions the
// last column parameter is additionally recorded as the primary timestamp column (pPTS).
// A value parameter is expanded into a constant column only when createDummyCol is set and
// it is the sole parameter of the expression.
//
// Returns TSDB_CODE_SUCCESS, or the error reported while creating a constant column.
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                                   int32_t scanFlag, bool createDummyCol) {
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
    SqlFunctionCtx*       pOneCtx = &pCtx[i];
    SInputColumnInfoData* pInput = &pOneCtx->input;
    SExprInfo*            pOneExpr = &pOperator->exprSupp.pExprInfo[i];

    pOneCtx->order = order;
    pInput->numOfRows = pBlock->info.rows;

    pOneCtx->pSrcBlock = pBlock;
    pOneCtx->scanFlag = scanFlag;

    pInput->uid = pBlock->info.uid;
    pInput->colDataAggIsSet = false;

    for (int32_t j = 0; j < pOneExpr->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pOneExpr->base.pParam[j];

      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;

        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
        pInput->totalRows = pBlock->info.rows;
        pInput->numOfRows = pBlock->info.rows;
        pInput->startRowIndex = 0;

        // NOTE: the last parameter is the primary timestamp column
        const bool isLastParam = (j == pOneExpr->base.numOfParams - 1);
        if (fmIsTimelineFunc(pOneCtx->functionId) && isLastParam) {
          pInput->pPTS = pInput->pData[j];
        }

        ASSERT(pInput->pData[j] != NULL);
        continue;
      }

      if (pFuncParam->type != FUNC_PARAM_TYPE_VALUE) {
        continue;
      }

      // todo avoid case: top(k, 12), 12 is the value parameter.
      // sum(11), 11 is also the value parameter.
      if (!createDummyCol || pOneExpr->base.numOfParams != 1) {
        continue;
      }

      pInput->totalRows = pBlock->info.rows;
      pInput->numOfRows = pBlock->info.rows;
      pInput->startRowIndex = 0;

      int32_t code = doCreateConstantValColumnInfo(pInput, pFuncParam, j, pBlock->info.rows);
      if (code != TSDB_CODE_SUCCESS) {
        return code;
      }
    }
  }

  return TSDB_CODE_SUCCESS;
}

541
// Invokes the process callback of every function context that needs to execute.
// Contexts without a process callback are skipped. Stops at, logs and returns the first
// error code; returns TSDB_CODE_SUCCESS otherwise. startTs is not used.
static int32_t doAggregateImpl(SOperatorInfo* pOperator, TSKEY startTs, SqlFunctionCtx* pCtx) {
  const int32_t numOfExprs = pOperator->exprSupp.numOfExprs;

  for (int32_t idx = 0; idx < numOfExprs; ++idx) {
    SqlFunctionCtx* pOneCtx = &pCtx[idx];

    // todo add a dummy funtion to avoid process check
    if (!functionNeedToExecute(pOneCtx) || pOneCtx->fpSet.process == NULL) {
      continue;
    }

    int32_t code = pOneCtx->fpSet.process(pOneCtx);
    if (code != TSDB_CODE_SUCCESS) {
      qError("%s aggregate function error happens, code: %s", GET_TASKID(pOperator->pTaskInfo), tstrerror(code));
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
560
// Points the output of the first N function contexts at the first N columns of pResult,
// where N is the number of entries in pPseudoList (nothing is done for a NULL list).
// NOTE(review): contexts are addressed by loop position, not by the values stored in
// pPseudoList — confirm against the callers that this is the intended mapping.
static void setPseudoOutputColInfo(SSDataBlock* pResult, SqlFunctionCtx* pCtx, SArray* pPseudoList) {
  if (pPseudoList == NULL) {
    return;
  }

  size_t numOfPseudo = taosArrayGetSize(pPseudoList);
  for (int32_t col = 0; col < numOfPseudo; ++col) {
    pCtx[col].pOutput = taosArrayGet(pResult->pDataBlock, col);
  }
}

567
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
X
Xiaoyu Wang 已提交
568
                              int32_t numOfOutput, SArray* pPseudoList) {
H
Haojun Liao 已提交
569
  setPseudoOutputColInfo(pResult, pCtx, pPseudoList);
H
Haojun Liao 已提交
570
  pResult->info.groupId = pSrcBlock->info.groupId;
H
Haojun Liao 已提交
571

572 573
  // if the source equals to the destination, it is to create a new column as the result of scalar
  // function or some operators.
574 575
  bool createNewColModel = (pResult == pSrcBlock);

576 577
  int32_t numOfRows = 0;

578
  for (int32_t k = 0; k < numOfOutput; ++k) {
579 580
    int32_t               outputSlotId = pExpr[k].base.resSchema.slotId;
    SqlFunctionCtx*       pfCtx = &pCtx[k];
581
    SInputColumnInfoData* pInputData = &pfCtx->input;
582

L
Liu Jicong 已提交
583
    if (pExpr[k].pExpr->nodeType == QUERY_NODE_COLUMN) {  // it is a project query
584
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
585
      if (pResult->info.rows > 0 && !createNewColModel) {
586 587
        colDataMergeCol(pColInfoData, pResult->info.rows, &pResult->info.capacity, pInputData->pData[0],
                        pInputData->numOfRows);
588
      } else {
589
        colDataAssign(pColInfoData, pInputData->pData[0], pInputData->numOfRows, &pResult->info);
590
      }
591

592
      numOfRows = pInputData->numOfRows;
593
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE) {
594
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
595

dengyihao's avatar
dengyihao 已提交
596
      int32_t offset = createNewColModel ? 0 : pResult->info.rows;
597
      for (int32_t i = 0; i < pSrcBlock->info.rows; ++i) {
dengyihao's avatar
dengyihao 已提交
598 599 600
        colDataAppend(pColInfoData, i + offset,
                      taosVariantGet(&pExpr[k].base.pParam[0].param, pExpr[k].base.pParam[0].param.nType),
                      TSDB_DATA_TYPE_NULL == pExpr[k].base.pParam[0].param.nType);
601
      }
602 603

      numOfRows = pSrcBlock->info.rows;
H
Haojun Liao 已提交
604
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_OPERATOR) {
605 606 607
      SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
      taosArrayPush(pBlockList, &pSrcBlock);

608
      SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
609
      SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
610

611
      SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
612
      int32_t      code = scalarCalculate(pExpr[k].pExpr->_optrRoot.pRootNode, pBlockList, &dest);
613 614 615 616
      if (code != TSDB_CODE_SUCCESS) {
        taosArrayDestroy(pBlockList);
        return code;
      }
617

dengyihao's avatar
dengyihao 已提交
618
      int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
619
      ASSERT(pResult->info.capacity > 0);
620
      colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
621 622

      numOfRows = dest.numOfRows;
623 624
      taosArrayDestroy(pBlockList);
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_FUNCTION) {
625 626
      // _rowts/_c0, not tbname column
      if (fmIsPseudoColumnFunc(pfCtx->functionId) && (!fmIsScanPseudoColumnFunc(pfCtx->functionId))) {
H
Haojun Liao 已提交
627
        // do nothing
628
      } else if (fmIsIndefiniteRowsFunc(pfCtx->functionId)) {
629 630
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pfCtx);
        pfCtx->fpSet.init(pfCtx, pResInfo);
631 632 633 634 635 636 637 638 639 640 641

        pfCtx->pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
        pfCtx->offset = createNewColModel ? 0 : pResult->info.rows;  // set the start offset

        // set the timestamp(_rowts) output buffer
        if (taosArrayGetSize(pPseudoList) > 0) {
          int32_t* outputColIndex = taosArrayGet(pPseudoList, 0);
          pfCtx->pTsOutput = (SColumnInfoData*)pCtx[*outputColIndex].pOutput;
        }

        numOfRows = pfCtx->fpSet.process(pfCtx);
H
Haojun Liao 已提交
642
      } else if (fmIsAggFunc(pfCtx->functionId)) {
643 644
        // _group_key function for "partition by tbname" + csum(col_name) query
        SColumnInfoData* pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
645
        int32_t          slotId = pfCtx->param[0].pCol->slotId;
646 647 648

        // todo handle the json tag
        SColumnInfoData* pInput = taosArrayGet(pSrcBlock->pDataBlock, slotId);
649
        for (int32_t f = 0; f < pSrcBlock->info.rows; ++f) {
650 651 652 653 654 655 656 657 658
          bool isNull = colDataIsNull_s(pInput, f);
          if (isNull) {
            colDataAppendNULL(pOutput, pResult->info.rows + f);
          } else {
            char* data = colDataGetData(pInput, f);
            colDataAppend(pOutput, pResult->info.rows + f, data, isNull);
          }
        }

H
Haojun Liao 已提交
659 660 661
      } else {
        SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
        taosArrayPush(pBlockList, &pSrcBlock);
G
Ganlin Zhao 已提交
662

663
        SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
664
        SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
H
Haojun Liao 已提交
665

666
        SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
667
        int32_t      code = scalarCalculate((SNode*)pExpr[k].pExpr->_function.pFunctNode, pBlockList, &dest);
668 669 670 671
        if (code != TSDB_CODE_SUCCESS) {
          taosArrayDestroy(pBlockList);
          return code;
        }
672

dengyihao's avatar
dengyihao 已提交
673
        int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
674
        ASSERT(pResult->info.capacity > 0);
675
        colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
676 677

        numOfRows = dest.numOfRows;
H
Haojun Liao 已提交
678 679
        taosArrayDestroy(pBlockList);
      }
680
    } else {
681
      ASSERT(0);
682 683
    }
  }
684

685 686 687
  if (!createNewColModel) {
    pResult->info.rows += numOfRows;
  }
688 689

  return TSDB_CODE_SUCCESS;
690 691
}

5
54liuyao 已提交
692
// Decides whether the function bound to pCtx has to be evaluated:
//   - never when functionId is -1;
//   - during a repeat scan, only when fmIsRepeatScanFunc() says so;
//   - otherwise, as long as its result entry is not yet completed.
bool functionNeedToExecute(SqlFunctionCtx* pCtx) {
  struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);

  // in case of timestamp column, always generated results.
  if (pCtx->functionId == -1) {
    return false;
  }

  if (pCtx->scanFlag == REPEAT_SCAN) {
    return fmIsRepeatScanFunc(pCtx->functionId);
  }

  return isRowEntryCompleted(pResInfo) ? false : true;
}
712 713 714 715 716 717 718
// Builds the pre-aggregated statistics (null count, min, max, sum) that describe a constant
// parameter repeated numOfRows times.
//
// The column object and the statistics object of slot paramIndex are allocated on first use
// and reused afterwards. Variable-length types are rejected by assertion; TIMESTAMP leaves
// the statistics object as it is; any other unsupported type trips ASSERT(0).
//
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when an allocation fails.
static int32_t doCreateConstantValColumnAggInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t type,
                                                int32_t paramIndex, int32_t numOfRows) {
  if (pInput->pData[paramIndex] == NULL) {
    SColumnInfoData* pNewCol = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    pInput->pData[paramIndex] = pNewCol;
    if (pNewCol == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
    pNewCol->info.type = type;
    pNewCol->info.bytes = tDataTypes[type].bytes;
  }

  SColumnDataAgg* pAgg = pInput->pColumnDataAgg[paramIndex];
  if (pAgg == NULL) {
    pAgg = taosMemoryCalloc(1, sizeof(SColumnDataAgg));
    pInput->pColumnDataAgg[paramIndex] = pAgg;
    if (pAgg == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  ASSERT(!IS_VAR_DATA_TYPE(type));

  switch (type) {
    case TSDB_DATA_TYPE_BIGINT: {
      int64_t v = pFuncParam->param.i;
      *pAgg = (SColumnDataAgg){.numOfNull = 0, .min = v, .max = v, .sum = v * numOfRows};
      break;
    }

    case TSDB_DATA_TYPE_DOUBLE: {
      double v = pFuncParam->param.d;
      *pAgg = (SColumnDataAgg){.numOfNull = 0};

      // the double value is stored in place in the min/max/sum fields
      *(double*)&pAgg->min = v;
      *(double*)&pAgg->max = v;
      *(double*)&pAgg->sum = v * numOfRows;
      break;
    }

    case TSDB_DATA_TYPE_BOOL: {  // todo validate this data type
      bool v = pFuncParam->param.i;
      *pAgg = (SColumnDataAgg){.numOfNull = 0};

      // NOTE(review): min is written as 0 rather than v, unlike the BIGINT/DOUBLE cases — confirm
      *(bool*)&pAgg->min = 0;
      *(bool*)&pAgg->max = v;
      *(bool*)&pAgg->sum = v * numOfRows;
      break;
    }

    case TSDB_DATA_TYPE_TIMESTAMP:
      // do nothing
      break;

    default:
      ASSERT(0);
      break;
  }

  return TSDB_CODE_SUCCESS;
}
763 764 765 766 767 768 769 770 771 772 773

/*
 * Bind the block-level pre-aggregation data of pBlock to the input description of pCtx.
 *
 * The row counters of the input are always set from the block. When the block carries no
 * pre-aggregation array, colDataAggIsSet is cleared and nothing else is touched. Otherwise every
 * parameter of pExprInfo is visited:
 *   - column parameters take the aggregate and the column info of their slot; a missing (NULL)
 *     aggregate clears colDataAggIsSet
 *   - constant parameters get a synthesized aggregate from doCreateConstantValColumnAggInfo
 *
 * NOTE(review): the status returned by doCreateConstantValColumnAggInfo is discarded here, as in the
 * original code.
 */
void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, SSDataBlock* pBlock) {
  int32_t rows = pBlock->info.rows;

  SInputColumnInfoData* pInput = &pCtx->input;
  pInput->numOfRows = rows;
  pInput->totalRows = rows;

  if (pBlock->pBlockAgg == NULL) {
    pInput->colDataAggIsSet = false;
    return;
  }

  pInput->colDataAggIsSet = true;

  for (int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
    SFunctParam* pParam = &pExprInfo->base.pParam[j];

    if (pParam->type == FUNC_PARAM_TYPE_COLUMN) {
      int32_t slot = pParam->pCol->slotId;

      pInput->pColumnDataAgg[j] = pBlock->pBlockAgg[slot];
      if (pInput->pColumnDataAgg[j] == NULL) {
        pInput->colDataAggIsSet = false;
      }

      // The column info is attached because the data type of each column is required; the data held
      // by this SColumnInfoData is not meant to be used.
      pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slot);
      continue;
    }

    if (pParam->type == FUNC_PARAM_TYPE_VALUE) {
      doCreateConstantValColumnAggInfo(pInput, pParam, pParam->param.nType, j, pBlock->info.rows);
    }
  }

  // set the statistics data for primary time stamp column
  //  if (pCtx->functionId == FUNCTION_SPREAD && pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
  //    pCtx->isAggSet = true;
  //    pCtx->agg.min = pBlock->info.window.skey;
  //    pCtx->agg.max = pBlock->info.window.ekey;
  //  }
}

L
Liu Jicong 已提交
803
/*
 * Report whether the task should be treated as killed.
 *
 * The idle-timeout detection is currently disabled: when the task has an owner and has been running
 * longer than ten times the maximum idle duration, only an assertion on the recorded start time is
 * evaluated. The function therefore returns false in every case.
 */
bool isTaskKilled(SExecTaskInfo* pTaskInfo) {
  // a task without an owner is never checked against the idle timeout
  if (pTaskInfo->owner == 0) {
    return false;
  }

  // query has been executed more than tsShellActivityTimer, and the retrieve has not arrived
  if ((taosGetTimestampSec() - pTaskInfo->cost.start / 1000) > 10 * getMaximumIdleDurationSec()
      /*(!needBuildResAfterQueryComplete(pTaskInfo))*/) {
    assert(pTaskInfo->cost.start != 0);
    //    qDebug("QInfo:%" PRIu64 " retrieve not arrive beyond %d ms, abort current query execution, start:%" PRId64
    //           ", current:%d", pQInfo->qId, 1, pQInfo->startExecTs, taosGetTimestampSec());
    //    return true;
  }

  return false;
}

L
Liu Jicong 已提交
818
/* Mark the task as cancelled by storing TSDB_CODE_TSC_QUERY_CANCELLED as its result code. */
void setTaskKilled(SExecTaskInfo* pTaskInfo) {
  pTaskInfo->code = TSDB_CODE_TSC_QUERY_CANCELLED;
}
819 820

/////////////////////////////////////////////////////////////////////////////////////////////
L
Liu Jicong 已提交
821
// todo refactor : return window
822
/*
 * Compute the interval-aligned time window that contains `key`.
 *
 * win->skey receives `key` truncated by taosTimeTruncate for the given interval and precision.
 * win->ekey receives the key one interval later (taosTimeAdd) minus one, i.e. the last key of the window.
 */
void getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key, STimeWindow* win) {
  win->skey = taosTimeTruncate(key, pInterval, precision);
  win->ekey = taosTimeAdd(win->skey, pInterval->interval, pInterval->intervalUnit, precision) - 1;

  /*
   * An end key that is smaller than the start key means the start key lies within one interval of
   * INT64_MAX; the window is then closed at INT64_MAX and no further adjustment is needed.
   */
  const bool wrapped = (win->ekey < win->skey);
  if (wrapped) {
    win->ekey = INT64_MAX;
  }
}

835
#if 0
/*
 * Disabled code, kept for reference.
 *
 * Refines a block load status according to the functions of the query: DATA_LOAD and FILTEROUT are
 * returned unchanged; a NOT_LOAD status of a query with first/last functions becomes FILTEROUT when
 * no other function is present and DATA_LOAD otherwise. ts/tag functions are not taken into account.
 */
static int32_t updateBlockLoadStatus(STaskAttr* pQuery, int32_t status) {
  if (status == BLK_DATA_DATA_LOAD || status == BLK_DATA_FILTEROUT) {
    return status;
  }

  bool firstLastSeen = false;
  bool otherSeen = false;

  for (int32_t i = 0; i < pQuery->numOfOutput; ++i) {
    int32_t fid = getExprFunctionId(&pQuery->pExpr1[i]);

    if (fid == FUNCTION_TS || fid == FUNCTION_TS_DUMMY || fid == FUNCTION_TAG ||
        fid == FUNCTION_TAG_DUMMY) {
      continue;
    }

    if (fid == FUNCTION_FIRST_DST || fid == FUNCTION_LAST_DST) {
      firstLastSeen = true;
    } else {
      otherSeen = true;
    }
  }

  if (firstLastSeen && status == BLK_DATA_NOT_LOAD) {
    return otherSeen ? BLK_DATA_DATA_LOAD : BLK_DATA_FILTEROUT;
  }

  return status;
}

#endif

L
Liu Jicong 已提交
874 875
// static void updateDataCheckOrder(SQInfo *pQInfo, SQueryTableReq* pQueryMsg, bool stableQuery) {
//   STaskAttr* pQueryAttr = pQInfo->runtimeEnv.pQueryAttr;
H
Haojun Liao 已提交
876
//
L
Liu Jicong 已提交
877 878 879 880
//   // in case of point-interpolation query, use asc order scan
//   char msg[] = "QInfo:0x%"PRIx64" scan order changed for %s query, old:%d, new:%d, qrange exchanged, old qrange:%"
//   PRId64
//                "-%" PRId64 ", new qrange:%" PRId64 "-%" PRId64;
H
Haojun Liao 已提交
881
//
L
Liu Jicong 已提交
882 883 884 885 886
//   // todo handle the case the the order irrelevant query type mixed up with order critical query type
//   // descending order query for last_row query
//   if (isFirstLastRowQuery(pQueryAttr)) {
//     //qDebug("QInfo:0x%"PRIx64" scan order changed for last_row query, old:%d, new:%d", pQInfo->qId,
//     pQueryAttr->order.order, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
887
//
L
Liu Jicong 已提交
888 889
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
890
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
891
//     }
H
Haojun Liao 已提交
892
//
L
Liu Jicong 已提交
893 894 895
//     pQueryAttr->needReverseScan = false;
//     return;
//   }
H
Haojun Liao 已提交
896
//
L
Liu Jicong 已提交
897 898 899
//   if (pQueryAttr->groupbyColumn && pQueryAttr->order.order == TSDB_ORDER_DESC) {
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
900
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
901
//     }
H
Haojun Liao 已提交
902
//
L
Liu Jicong 已提交
903 904 905 906
//     pQueryAttr->needReverseScan = false;
//     doUpdateLastKey(pQueryAttr);
//     return;
//   }
H
Haojun Liao 已提交
907
//
L
Liu Jicong 已提交
908 909 910 911 912 913
//   if (pQueryAttr->pointInterpQuery && pQueryAttr->interval.interval == 0) {
//     if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       //qDebug(msg, pQInfo->qId, "interp", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey); TSWAP(pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, TSKEY);
//     }
H
Haojun Liao 已提交
914
//
L
Liu Jicong 已提交
915 916 917
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     return;
//   }
H
Haojun Liao 已提交
918
//
L
Liu Jicong 已提交
919 920 921 922
//   if (pQueryAttr->interval.interval == 0) {
//     if (onlyFirstQuery(pQueryAttr)) {
//       if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//         //qDebug(msg, pQInfo->qId, "only-first", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
H
Haojun Liao 已提交
923 924
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
925
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
926 927 928 929 930 931 932 933 934 935
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_ASC;
//      pQueryAttr->needReverseScan = false;
//    } else if (onlyLastQuery(pQueryAttr) && notContainSessionOrStateWindow(pQueryAttr)) {
//      if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//        //qDebug(msg, pQInfo->qId, "only-last", pQueryAttr->order.order, TSDB_ORDER_DESC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
936
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
937 938 939 940 941 942 943 944 945 946 947 948
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_DESC;
//      pQueryAttr->needReverseScan = false;
//    }
//
//  } else {  // interval query
//    if (stableQuery) {
//      if (onlyFirstQuery(pQueryAttr)) {
//        if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-first stable", pQueryAttr->order.order, TSDB_ORDER_ASC,
L
Liu Jicong 已提交
949 950
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
951
//
wafwerar's avatar
wafwerar 已提交
952
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
953 954 955 956 957 958 959 960
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_ASC;
//        pQueryAttr->needReverseScan = false;
//      } else if (onlyLastQuery(pQueryAttr)) {
//        if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-last stable", pQueryAttr->order.order, TSDB_ORDER_DESC,
L
Liu Jicong 已提交
961 962
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
963
//
wafwerar's avatar
wafwerar 已提交
964
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
965 966 967 968 969 970 971 972 973
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_DESC;
//        pQueryAttr->needReverseScan = false;
//      }
//    }
//  }
//}
974

L
Liu Jicong 已提交
975 976 977
// static FORCE_INLINE bool doFilterByBlockStatistics(STaskRuntimeEnv* pRuntimeEnv, SDataStatis *pDataStatis,
// SqlFunctionCtx *pCtx, int32_t numOfRows) {
//   STaskAttr* pQueryAttr = pRuntimeEnv->pQueryAttr;
978
//
L
Liu Jicong 已提交
979 980 981
//   if (pDataStatis == NULL || pQueryAttr->pFilters == NULL) {
//     return true;
//   }
982
//
L
Liu Jicong 已提交
983 984
//   return filterRangeExecute(pQueryAttr->pFilters, pDataStatis, pQueryAttr->numOfCols, numOfRows);
// }
985
#if 0
/*
 * Disabled code, kept for reference.
 *
 * Intended to tell whether the time range of a data block overlaps more than one query time window.
 * The calls that would position and advance the window (getAlignQueryTimeWindow / getNextTimeWindow)
 * are commented out, so the window stays zero-initialized in this state of the code.
 */
static bool overlapWithTimeWindow(STaskAttr* pQueryAttr, SDataBlockInfo* pBlockInfo) {
  STimeWindow win = {0};

  TSKEY sk = TMIN(pQueryAttr->window.skey, pQueryAttr->window.ekey);
  TSKEY ek = TMAX(pQueryAttr->window.skey, pQueryAttr->window.ekey);

  if (true) {
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.skey, sk, ek, &win);
    assert(win.ekey >= pBlockInfo->window.skey);

    if (win.ekey < pBlockInfo->window.ekey) {
      return true;
    }

    for (;;) {
      //      getNextTimeWindow(pQueryAttr, &win);
      if (win.skey > pBlockInfo->window.ekey) {
        break;
      }

      assert(win.ekey > pBlockInfo->window.ekey);
      if (win.skey <= pBlockInfo->window.ekey && win.skey > pBlockInfo->window.skey) {
        return true;
      }
    }
  } else {
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.ekey, sk, ek, &win);
    assert(win.skey <= pBlockInfo->window.ekey);

    if (win.skey > pBlockInfo->window.skey) {
      return true;
    }

    for (;;) {
      //      getNextTimeWindow(pQueryAttr, &win);
      if (win.ekey < pBlockInfo->window.skey) {
        break;
      }

      assert(win.skey < pBlockInfo->window.skey);
      if (win.ekey < pBlockInfo->window.ekey && win.ekey >= pBlockInfo->window.skey) {
        return true;
      }
    }
  }

  return false;
}
#endif
1035 1036

/*
 * Decide the load status of a block from the data requirement of each function.
 *
 * The implementation is compiled out; in the current build the function ignores both arguments and
 * returns 0.
 */
static uint32_t doFilterByBlockTimeWindow(STableScanInfo* pTableScanInfo, SSDataBlock* pBlock) {
#if 0
  SqlFunctionCtx* pCtx = pTableScanInfo->pCtx;
  uint32_t        status = BLK_DATA_NOT_LOAD;

  int32_t numOfOutput = 0;  // pTableScanInfo->numOfOutput;
  for (int32_t i = 0; i < numOfOutput; ++i) {
    int32_t functionId = pCtx[i].functionId;
    int32_t colId = pTableScanInfo->pExpr[i].base.pParam[0].pCol->colId;

    // group by + first/last should not apply the first/last block filter
    if (functionId < 0) {
      status |= BLK_DATA_DATA_LOAD;
      return status;
    } else {
      //      status |= aAggs[functionId].dataReqFunc(&pTableScanInfo->pCtx[i], &pBlock->info.window, colId);
      //      if ((status & BLK_DATA_DATA_LOAD) == BLK_DATA_DATA_LOAD) {
      //        return status;
      //      }
    }
  }

  return status;
#endif

  return 0;
}

L
Liu Jicong 已提交
1063 1064
/*
 * Decide whether (and how) a data block has to be loaded for the current scan.
 *
 * In the current build the decision logic is compiled out: *status is set to BLK_DATA_NOT_LOAD, the
 * data and pre-aggregation pointers of pBlock are reset to NULL and TSDB_CODE_SUCCESS is returned.
 * pTaskInfo and pTableScanInfo are only referenced by the disabled code.
 *
 * The disabled region below is the former implementation and is kept for reference; it refers to
 * identifiers (pQueryAttr, pRuntimeEnv, groupId, ascQuery) that are not declared in this function.
 */
int32_t loadDataBlockOnDemand(SExecTaskInfo* pTaskInfo, STableScanInfo* pTableScanInfo, SSDataBlock* pBlock,
                              uint32_t* status) {
  *status = BLK_DATA_NOT_LOAD;

  pBlock->pDataBlock = NULL;
  pBlock->pBlockAgg = NULL;

  //  int64_t groupId = pRuntimeEnv->current->groupIndex;
  //  bool    ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);

//  pCost->totalBlocks += 1;
//  pCost->totalRows += pBlock->info.rows;
#if 0
  // the cost counters are only updated by the disabled logic, so the pointer lives here as well
  STaskCostInfo* pCost = &pTaskInfo->cost;

  // Calculate all time windows that are overlapping or contain current data block.
  // If current data block is contained by all possible time window, do not load current data block.
  if (/*pQueryAttr->pFilters || */pQueryAttr->groupbyColumn || pQueryAttr->sw.gap > 0 ||
      (QUERY_IS_INTERVAL_QUERY(pQueryAttr) && overlapWithTimeWindow(pTaskInfo, &pBlock->info))) {
    (*status) = BLK_DATA_DATA_LOAD;
  }

  // check if this data block is required to load
  if ((*status) != BLK_DATA_DATA_LOAD) {
    bool needFilter = true;

    // the pCtx[i] result is belonged to previous time window since the outputBuf has not been set yet,
    // the filter result may be incorrect. So in case of interval query, we need to set the correct time output buffer
    if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
      SResultRow* pResult = NULL;

      bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
      TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

      STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
      if (pQueryAttr->pointInterpQuery) {
        needFilter = chkWindowOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
                                    pTableScanInfo->rowEntryInfoOffset);
      } else {
        if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
                                    pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
          longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
        }
      }
    } else if (pQueryAttr->stableQuery && (!pQueryAttr->tsCompQuery) && (!pQueryAttr->diffQuery)) { // stable aggregate, not interval aggregate or normal column aggregate
      doSetTableGroupOutputBuf(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pTableScanInfo->pCtx,
                               pTableScanInfo->rowEntryInfoOffset, pTableScanInfo->numOfOutput,
                               pRuntimeEnv->current->groupIndex);
    }

    if (needFilter) {
      (*status) = doFilterByBlockTimeWindow(pTableScanInfo, pBlock);
    } else {
      (*status) = BLK_DATA_DATA_LOAD;
    }
  }

  SDataBlockInfo* pBlockInfo = &pBlock->info;
//  *status = updateBlockLoadStatus(pRuntimeEnv->pQueryAttr, *status);

  if ((*status) == BLK_DATA_NOT_LOAD || (*status) == BLK_DATA_FILTEROUT) {
    //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//           pBlockInfo->window.ekey, pBlockInfo->rows);
    pCost->skipBlocks += 1;
  } else if ((*status) == BLK_DATA_SMA_LOAD) {
    // this function never returns error?
    pCost->loadBlockStatis += 1;
//    tsdbRetrieveDatablockSMA(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);

    if (pBlock->pBlockAgg == NULL) {  // data block statistics does not exist, load data block
//      pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
      pCost->totalCheckedRows += pBlock->info.rows;
    }
  } else {
    assert((*status) == BLK_DATA_DATA_LOAD);

    // load the data block statistics to perform further filter
    pCost->loadBlockStatis += 1;
//    tsdbRetrieveDatablockSMA(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);

    if (pQueryAttr->topBotQuery && pBlock->pBlockAgg != NULL) {
      { // set previous window
        if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
          SResultRow* pResult = NULL;

          bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
          TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

          STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
          if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                      pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
                                      pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
            longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
          }
        }
      }
      bool load = false;
      for (int32_t i = 0; i < pQueryAttr->numOfOutput; ++i) {
        int32_t functionId = pTableScanInfo->pCtx[i].functionId;
        if (functionId == FUNCTION_TOP || functionId == FUNCTION_BOTTOM) {
//          load = topbot_datablock_filter(&pTableScanInfo->pCtx[i], (char*)&(pBlock->pBlockAgg[i].min),
//                                         (char*)&(pBlock->pBlockAgg[i].max));
          if (!load) { // current block has been discard due to filter applied
            pCost->skipBlocks += 1;
            //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId,
//                   pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
            (*status) = BLK_DATA_FILTEROUT;
            return TSDB_CODE_SUCCESS;
          }
        }
      }
    }

    // current block has been discard due to filter applied
//    if (!doFilterByBlockStatistics(pRuntimeEnv, pBlock->pBlockAgg, pTableScanInfo->pCtx, pBlockInfo->rows)) {
//      pCost->skipBlocks += 1;
//      qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//             pBlockInfo->window.ekey, pBlockInfo->rows);
//      (*status) = BLK_DATA_FILTEROUT;
//      return TSDB_CODE_SUCCESS;
//    }

    pCost->totalCheckedRows += pBlockInfo->rows;
    pCost->loadBlocks += 1;
//    pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
//    if (pBlock->pDataBlock == NULL) {
//      return terrno;
//    }

//    if (pQueryAttr->pFilters != NULL) {
//      filterSetColFieldData(pQueryAttr->pFilters, taosArrayGetSize(pBlock->pDataBlock), pBlock->pDataBlock);
//    }

//    if (pQueryAttr->pFilters != NULL || pRuntimeEnv->pTsBuf != NULL) {
//      filterColRowsInDataBlock(pRuntimeEnv, pBlock, ascQuery);
//    }
  }
#endif
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1206
/*
 * Prepare the per-table query info for a reverse scan.
 *
 * Every state update is commented out, so the function currently has no effect on its argument;
 * a NULL argument is accepted.
 */
static void updateTableQueryInfoForReverseScan(STableQueryInfo* pTableQueryInfo) {
  if (!pTableQueryInfo) {
    return;
  }

  //  TSWAP(pTableQueryInfo->win.skey, pTableQueryInfo->win.ekey);
  //  pTableQueryInfo->lastKey = pTableQueryInfo->win.skey;

  //  SWITCH_ORDER(pTableQueryInfo->cur.order);
  //  pTableQueryInfo->cur.vgroupIndex = -1;

  // set the index to be the end slot of result rows array
  //  SResultRowInfo* pResultRowInfo = &pTableQueryInfo->resInfo;
  //  if (pResultRowInfo->size > 0) {
  //    pResultRowInfo->curPos = pResultRowInfo->size - 1;
  //  } else {
  //    pResultRowInfo->curPos = -1;
  //  }
}

H
Haojun Liao 已提交
1226
/*
 * Initialize a result row.
 *
 * The only statement of the body is commented out, so the function currently does nothing.
 */
void initResultRow(SResultRow* pResultRow) {
  //  pResultRow->pEntryInfo = (struct SResultRowEntryInfo*)((char*)pResultRow + sizeof(SResultRow));
}

/*
 * The start of each column's SResultRowEntryInfo is denoted by RowCellInfoOffset.
 * Note that in case of a top/bottom query, the multiple rows of the result are treated as only one row of results.
 * +------------+-----------------result column 1------------+------------------result column 2-----------+
 * | SResultRow | SResultRowEntryInfo | intermediate buffer1 | SResultRowEntryInfo | intermediate buffer 2|
 * +------------+--------------------------------------------+--------------------------------------------+
 *           offset[0]                                  offset[1]                                   offset[2]
 */
1238
// TODO refactor: some function move away
L
Liu Jicong 已提交
1239 1240 1241
/*
 * Bind the function contexts of an operator to a freshly prepared result row.
 *
 * The result row info of pInfo is re-initialized, a result row is obtained from the buffer of pSup
 * under an all-zero key with group id 0, and each of the first numOfExprs contexts is pointed at its
 * cleaned-up entry of that row and tagged with `stage` as scan flag. Finally the output buffers of
 * the contexts are initialized through initCtxOutputBuffer.
 */
void setFunctionResultOutput(SOperatorInfo* pOperator, SOptrBasicInfo* pInfo, SAggSupporter* pSup, int32_t stage,
                             int32_t numOfExprs) {
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;

  SResultRowInfo* pRowInfo = &pInfo->resultRowInfo;
  initResultRowInfo(pRowInfo);

  // the single result row is stored under a zero key / zero group id
  int64_t     key = 0;
  int64_t     gid = 0;
  SResultRow* pRow =
      doSetResultOutBufByKey(pSup->pResultBuf, pRowInfo, (char*)&key, sizeof(key), true, gid, pTaskInfo, false, pSup);

  for (int32_t i = 0; i < numOfExprs; ++i) {
    struct SResultRowEntryInfo* pEntryInfo = getResultEntryInfo(pRow, i, rowEntryInfoOffset);
    cleanupResultRowEntry(pEntryInfo);

    SqlFunctionCtx* pOne = &pCtx[i];
    pOne->resultInfo = pEntryInfo;
    pOne->scanFlag = stage;
  }

  initCtxOutputBuffer(pCtx, numOfExprs);
}

H
Haojun Liao 已提交
1264
/*
 * Run the init callback of every function context whose result entry still needs it.
 *
 * A context is left alone when its entry is already initialized, when its function is a pseudo
 * column function or a scalar function, or when its function id is -1.
 */
void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size) {
  for (int32_t idx = 0; idx < size; ++idx) {
    struct SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(&pCtx[idx]);

    // the checks run in the same order as before, so later ones are only reached when needed
    if (!isRowEntryInitialized(pEntryInfo) && !fmIsPseudoColumnFunc(pCtx[idx].functionId) &&
        pCtx[idx].functionId != -1 && !fmIsScalarFunc(pCtx[idx].functionId)) {
      pCtx[idx].fpSet.init(&pCtx[idx], pCtx[idx].resultInfo);
    }
  }
}

L
Liu Jicong 已提交
1276
/*
 * Update the status of a task.
 *
 * TASK_NOT_COMPLETED replaces the whole status. Any other value is OR-ed into the status after the
 * TASK_NOT_COMPLETED flag has been cleared, since that flag is not compatible with the other ones.
 */
void setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status) {
  if (status == TASK_NOT_COMPLETED) {
    pTaskInfo->status = status;
    return;
  }

  CLEAR_QUERY_STATUS(pTaskInfo, TASK_NOT_COMPLETED);
  pTaskInfo->status |= status;
}

L
Liu Jicong 已提交
1286
/*
 * Release the resources held by a table query info.
 *
 * Both cleanup calls are commented out, so the function currently has no effect; a NULL argument
 * is accepted.
 */
void destroyTableQueryInfoImpl(STableQueryInfo* pTableQueryInfo) {
  if (!pTableQueryInfo) {
    return;
  }

  //  taosVariantDestroy(&pTableQueryInfo->tag);
  //  cleanupResultRowInfo(&pTableQueryInfo->resInfo);
}

1295
/*
 * Point every function context at its entry inside pResult and initialize entries that need it.
 *
 * For each of the numOfOutput contexts the result entry is looked up through rowEntryInfoOffset and
 * stored in the context. Nothing more happens for an entry that is both completed and initialized,
 * for a window pseudo column function, or for an entry whose `initialized` flag is already set.
 * Otherwise the init callback of the function is invoked, except for function id -1 where the entry
 * is simply flagged as initialized.
 */
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowEntryInfoOffset) {
  for (int32_t idx = 0; idx < numOfOutput; ++idx) {
    pCtx[idx].resultInfo = getResultEntryInfo(pResult, idx, rowEntryInfoOffset);

    struct SResultRowEntryInfo* pEntryInfo = pCtx[idx].resultInfo;

    if ((isRowEntryCompleted(pEntryInfo) && isRowEntryInitialized(pEntryInfo)) ||
        fmIsWindowPseudoColumnFunc(pCtx[idx].functionId)) {
      continue;
    }

    if (pEntryInfo->initialized) {
      continue;
    }

    if (pCtx[idx].functionId == -1) {
      pEntryInfo->initialized = true;
    } else {
      pCtx[idx].fpSet.init(&pCtx[idx], pEntryInfo);
    }
  }
}

H
Haojun Liao 已提交
1318
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep);
1319

1320
/*
 * Apply a filter condition to a data block in place.
 *
 * A NULL filter node leaves the block untouched. Otherwise a filter is built from the node, bound to
 * the columns of the block and executed; rows are then compacted through
 * extractQualifiedTupleByFilterResult and the timestamp window of the block is refreshed. The filter
 * and the per-row result buffer are released before returning.
 *
 * NOTE(review): the status codes of filterInitFromNode and filterSetDataFromSlotId are not checked,
 * as in the original code; a failed initialization is presumably not survivable here - confirm.
 */
void doFilter(const SNode* pFilterNode, SSDataBlock* pBlock) {
  if (pFilterNode == NULL) {
    return;
  }

  // todo move to the initialization function
  SFilterInfo* pFilter = NULL;
  (void)filterInitFromNode((SNode*)pFilterNode, &pFilter, 0);

  size_t             colCount = taosArrayGetSize(pBlock->pDataBlock);
  SFilterColumnParam colParam = {.numOfCols = colCount, .pDataBlock = pBlock->pDataBlock};
  (void)filterSetDataFromSlotId(pFilter, &colParam);

  // todo the keep seems never to be True??
  int8_t* pRowFlags = NULL;
  bool    keepAll = filterExecute(pFilter, pBlock, &pRowFlags, NULL, colParam.numOfCols);
  filterFreeInfo(pFilter);

  extractQualifiedTupleByFilterResult(pBlock, pRowFlags, keepAll);
  blockDataUpdateTsWindow(pBlock, 0);

  taosMemoryFree(pRowFlags);
}

H
Haojun Liao 已提交
1346
/*
 * Compact a data block so that only the rows accepted by a filter remain.
 *
 *   keep == true     : the block is left unchanged
 *   rowRes == NULL   : the block is emptied (row count set to 0)
 *   otherwise        : rowRes[j] != 0 marks row j as accepted; every column that owns data is rebuilt
 *                      from a copy of the block with the accepted rows only, and the row count of the
 *                      block is set to the number of accepted rows
 */
void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep) {
  if (keep) {
    return;
  }

  if (rowRes == NULL) {
    pBlock->info.rows = 0;
    return;
  }

  int32_t      rowsBefore = pBlock->info.rows;
  SSDataBlock* pCopy = createOneDataBlock(pBlock, true);

  size_t colCount = taosArrayGetSize(pBlock->pDataBlock);
  for (int32_t c = 0; c < colCount; ++c) {
    SColumnInfoData* pFrom = taosArrayGet(pCopy->pDataBlock, c);
    SColumnInfoData* pTo = taosArrayGet(pBlock->pDataBlock, c);

    // it is a reserved column for scalar function, and no data in this column yet.
    if (pTo->pData == NULL || pFrom->pData == NULL) {
      continue;
    }

    colInfoDataCleanup(pTo, pBlock->info.rows);

    int32_t kept = 0;
    for (int32_t r = 0; r < rowsBefore; ++r) {
      if (rowRes[r] == 0) {
        continue;
      }

      if (colDataIsNull_s(pFrom, r)) {
        colDataAppendNULL(pTo, kept);
      } else {
        colDataAppend(pTo, kept, colDataGetData(pFrom, r), false);
      }

      kept += 1;
    }

    // the first rebuilt column fixes the new row count, the following ones have to agree with it
    if (pBlock->info.rows == rowsBefore) {
      pBlock->info.rows = kept;
    } else {
      ASSERT(pBlock->info.rows == kept);
    }
  }

  blockDataDestroy(pCopy);  // fix memory leak
}

L
Liu Jicong 已提交
1394 1395
/*
 * Bind the function contexts of an aggregate operator to the result row of a group.
 *
 * For a simple group by query without interval, all the tables belong to one group result. The
 * result row is looked up (or created) under the group id; when the row has no buffer page yet
 * (pageId == -1) a new window result buffer is attached to it. Afterwards the first numOfOutput
 * contexts are pointed at the entries of the row through setResultRowInitCtx.
 *
 * If the result buffer cannot be attached, the failure is logged and the task is aborted through
 * longjmp on pTaskInfo->env with the code returned by addNewWindowResultBuf. Previously the function
 * returned silently in that case and left the contexts unbound.
 */
void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                              uint64_t groupId) {
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SResultRowInfo* pResultRowInfo = &pAggInfo->binfo.resultRowInfo;
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;

  SResultRow* pResultRow = doSetResultOutBufByKey(pAggInfo->aggSup.pResultBuf, pResultRowInfo, (char*)&groupId,
                                                  sizeof(groupId), true, groupId, pTaskInfo, false, &pAggInfo->aggSup);
  assert(pResultRow != NULL);

  /*
   * not assign result buffer yet, add new result buffer
   * all group belong to one result set, and each group result has different group id so set the id to be one
   */
  if (pResultRow->pageId == -1) {
    int32_t ret =
        addNewWindowResultBuf(pResultRow, pAggInfo->aggSup.pResultBuf, groupId, pAggInfo->binfo.pRes->info.rowSize);
    if (ret != TSDB_CODE_SUCCESS) {
      // continuing would leave the contexts pointing at stale entries, so abort the task instead
      qError("%s failed to add result buffer for group, code %s", GET_TASKID(pTaskInfo), tstrerror(ret));
      longjmp(pTaskInfo->env, ret);
    }
  }

  setResultRowInitCtx(pResultRow, pCtx, numOfOutput, rowEntryInfoOffset);
}

1421
/*
 * Switch the aggregate operator to the output buffer of `groupId`.
 *
 * Nothing is done when the recorded group id of pAggInfo differs from INT32_MIN and already equals
 * `groupId`. Otherwise the contexts are rebound through doSetTableGroupOutputBuf and `groupId` is
 * recorded as the active group.
 */
void setExecutionContext(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId, SAggOperatorInfo* pAggInfo) {
  const bool alreadyActive = (pAggInfo->groupId != INT32_MIN && pAggInfo->groupId == groupId);
  if (alreadyActive) {
    return;
  }

#ifdef BUF_PAGE_DEBUG
  qDebug("page_setbuf, groupId:%" PRIu64, groupId);
#endif

  doSetTableGroupOutputBuf(pOperator, pAggInfo, numOfOutput, groupId);

  // remember which group the contexts are bound to
  pAggInfo->groupId = groupId;
}

1434 1435
/*
 * Raise pRow->numOfRows to the largest numOfRes found among the initialized result entries of the row.
 * Entries that are not initialized are ignored; numOfRows is never lowered.
 */
static void doUpdateNumOfRows(SResultRow* pRow, int32_t numOfExprs, const int32_t* rowCellOffset) {
  for (int32_t idx = 0; idx < numOfExprs; ++idx) {
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, idx, rowCellOffset);

    if (isRowEntryInitialized(pEntry) && pRow->numOfRows < pEntry->numOfRes) {
      pRow->numOfRows = pEntry->numOfRes;
    }
  }
}

1447
int32_t finalizeResultRowIntoResultDataBlock(SDiskbasedBuf* pBuf, SResultRowPosition* resultRowPosition,
S
shenglian zhou 已提交
1448 1449 1450
                                             SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, int32_t numOfExprs,
                                             const int32_t* rowCellOffset, SSDataBlock* pBlock,
                                             SExecTaskInfo* pTaskInfo) {
1451 1452 1453 1454 1455 1456 1457 1458 1459
  SFilePage*  page = getBufPage(pBuf, resultRowPosition->pageId);
  SResultRow* pRow = (SResultRow*)((char*)page + resultRowPosition->offset);

  doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
  if (pRow->numOfRows == 0) {
    releaseBufPage(pBuf, page);
    return 0;
  }

1460 1461 1462 1463 1464 1465 1466
  while (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
    int32_t code = blockDataEnsureCapacity(pBlock, pBlock->info.capacity * 1.25);
    if (TAOS_FAILED(code)) {
      releaseBufPage(pBuf, page);
      qError("%s ensure result data capacity failed, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
      longjmp(pTaskInfo->env, code);
    }
1467 1468 1469 1470 1471
  }

  for (int32_t j = 0; j < numOfExprs; ++j) {
    int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1472
    pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492
    if (pCtx[j].fpSet.finalize) {
      int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
      if (TAOS_FAILED(code)) {
        qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
        longjmp(pTaskInfo->env, code);
      }
    } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
      // do nothing, todo refactor
    } else {
      // expand the result into multiple rows. E.g., _wstartts, top(k, 20)
      // the _wstartts needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
      char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
      for (int32_t k = 0; k < pRow->numOfRows; ++k) {
        colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
      }
    }
  }

  releaseBufPage(pBuf, page);
1493
  pBlock->info.rows += pRow->numOfRows;
1494 1495 1496 1497

  return 0;
}

X
Xiaoyu Wang 已提交
1498 1499 1500
/*
 * Copy finalized group results into pBlock, starting at pGroupResInfo->index.
 *
 * Rows are consumed one by one until either all results are copied, the next row belongs to a different
 * group than the one already stored in pBlock, or the next row does not fit into the remaining capacity.
 * pGroupResInfo->index is advanced for every row that is consumed (including rows that produce no output).
 *
 * Returns 0. A failing finalize callback is reported with longjmp(pTaskInfo->env, code); the buffer page
 * of the row being processed is released before jumping.
 */
int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo, SDiskbasedBuf* pBuf,
                           SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset, SqlFunctionCtx* pCtx,
                           int32_t numOfExprs) {
  int32_t numOfRows = getNumOfTotalRes(pGroupResInfo);
  int32_t start = pGroupResInfo->index;

#ifdef BUF_PAGE_DEBUG
  qDebug("\npage_copytoblock rows:%d", numOfRows);
#endif

  for (int32_t i = start; i < numOfRows; i += 1) {
    SResKeyPos* pPos = taosArrayGetP(pGroupResInfo->pRows, i);
    SFilePage*  page = getBufPage(pBuf, pPos->pos.pageId);

#ifdef BUF_PAGE_DEBUG
    qDebug("page_copytoblock pos pageId:%d, offset:%d", pPos->pos.pageId, pPos->pos.offset);
#endif

    SResultRow* pRow = (SResultRow*)((char*)page + pPos->pos.offset);

    doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
    if (pRow->numOfRows == 0) {
      pGroupResInfo->index += 1;
      releaseBufPage(pBuf, page);
      continue;
    }

    if (pBlock->info.groupId == 0) {
      pBlock->info.groupId = pPos->groupId;
    } else {
      // current value belongs to different group, it can't be packed into one datablock
      if (pBlock->info.groupId != pPos->groupId) {
        releaseBufPage(pBuf, page);
        break;
      }
    }

    // the output block is full, the current row is handled by the next invocation
    if (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
      releaseBufPage(pBuf, page);
      break;
    }

    pGroupResInfo->index += 1;

    for (int32_t j = 0; j < numOfExprs; ++j) {
      int32_t slotId = pExprInfo[j].base.resSchema.slotId;

      pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
      if (pCtx[j].fpSet.finalize) {
#ifdef BUF_PAGE_DEBUG
        qDebug("\npage_finalize %d", numOfExprs);
#endif
        int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
        if (TAOS_FAILED(code)) {
          // do not leave the page pinned when unwinding through longjmp
          releaseBufPage(pBuf, page);
          qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
          longjmp(pTaskInfo->env, code);
        }
      } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
        // do nothing, todo refactor
      } else {
        // expand the result into multiple rows. E.g., _wstartts, top(k, 20)
        // the _wstartts needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
        SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
        char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
        if (pCtx[j].increase) {
          // every replicated row receives a value one larger than the previous one
          int64_t ts = *(int64_t*)in;
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, (const char*)&ts, pCtx[j].resultInfo->isNullRes);
            ts++;
          }
        } else {
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
          }
        }
      }
    }

    // pRow lives inside the page: read what is still needed before the page is handed back
    int32_t producedRows = pRow->numOfRows;
    releaseBufPage(pBuf, page);
    pBlock->info.rows += producedRows;
  }

  qDebug("%s result generated, rows:%d, groupId:%" PRIu64, GET_TASKID(pTaskInfo), pBlock->info.rows,
         pBlock->info.groupId);
  blockDataUpdateTsWindow(pBlock, 0);
  return 0;
}

X
Xiaoyu Wang 已提交
1585 1586
/*
 * Reset the result block of pbInfo and, when the group result info still holds data, refill it with the
 * next batch of results through doCopyToSDataBlock.
 */
void doBuildResultDatablock(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
                            SDiskbasedBuf* pBuf) {
  SSDataBlock* pOut = pbInfo->pRes;

  blockDataCleanup(pOut);
  if (hasDataInGroupInfo(pGroupResInfo)) {
    // clear the existed group id
    pOut->info.groupId = 0;
    doCopyToSDataBlock(pOperator->pTaskInfo, pOut, pOperator->exprSupp.pExprInfo, pBuf, pGroupResInfo,
                       pOperator->exprSupp.rowEntryInfoOffset, pOperator->exprSupp.pCtx,
                       pOperator->exprSupp.numOfExprs);
  }
}

L
Liu Jicong 已提交
1605
/*
 * Currently a no-op: the whole implementation is compiled out with "#if 0".
 * The disabled code updated the number of rows of each window result from its result entries.
 */
static void updateNumOfRowsInResultRows(SqlFunctionCtx* pCtx, int32_t numOfOutput, SResultRowInfo* pResultRowInfo,
                                        int32_t* rowEntryInfoOffset) {
#if 0
  // update the number of result for each, only update the number of rows for the corresponding window result.
  for (int32_t i = 0; i < pResultRowInfo->size; ++i) {
    SResultRow* pResult = pResultRowInfo->pResult[i];

    for (int32_t j = 0; j < numOfOutput; ++j) {
      int32_t functionId = pCtx[j].functionId;
      if (functionId == FUNCTION_TS || functionId == FUNCTION_TAG || functionId == FUNCTION_TAGPRJ) {
        continue;
      }

      SResultRowEntryInfo* pCell = getResultEntryInfo(pResult, j, rowEntryInfoOffset);
      pResult->numOfRows = (uint16_t)(TMAX(pResult->numOfRows, pCell->numOfRes));
    }
  }
#endif
}

L
Liu Jicong 已提交
1628
/*
 * Compress the data of one result column with the compression routine registered for its data type in
 * tDataTypes. The output buffer size handed to the routine is the raw column size plus COMP_OVERFLOW_BYTES.
 * Returns whatever the type specific compression routine returns.
 */
static int32_t compressQueryColData(SColumnInfoData* pColRes, int32_t numOfRows, char* data, int8_t compressed) {
  int32_t rawSize = pColRes->info.bytes * numOfRows;

  return tDataTypes[pColRes->info.type].compFunc(pColRes->pData, rawSize, numOfRows, data,
                                                 rawSize + COMP_OVERFLOW_BYTES, compressed, NULL, 0);
}

1634 1635 1636
/*
 * Let the fill module append rows to pBlock, limited to the room left below capacity, and account for
 * them in pBlock->info.rows. Returns the resulting number of rows in the block.
 */
int32_t doFillTimeIntervalGapsInResults(struct SFillInfo* pFillInfo, SSDataBlock* pBlock, int32_t capacity) {
  const int32_t filled = (int32_t)taosFillResultDataBlock(pFillInfo, pBlock, capacity - pBlock->info.rows);

  pBlock->info.rows += filled;
  return pBlock->info.rows;
}

L
Liu Jicong 已提交
1641 1642
/*
 * Fold the first stage merge time into the elapsed time of the task and, when a file block load recorder
 * is attached to the cost summary, write the summary to the debug log.
 */
void queryCostStatis(SExecTaskInfo* pTaskInfo) {
  STaskCostInfo* pCost = &pTaskInfo->cost;

  // add the merge time
  pCost->elapsedTime += pCost->firstStageMergeTime;

  SFileBlockLoadRecorder* pLoadRec = pCost->pRecoder;
  if (pLoadRec == NULL) {
    return;
  }

  qDebug("%s :cost summary: elapsed time:%" PRId64 " us, first merge:%" PRId64
         " us, total blocks:%d, "
         "load block statis:%d, load data block:%d, total rows:%" PRId64 ", check rows:%" PRId64,
         GET_TASKID(pTaskInfo), pCost->elapsedTime, pCost->firstStageMergeTime, pLoadRec->totalBlocks,
         pLoadRec->loadBlockStatis, pLoadRec->loadBlocks, pLoadRec->totalRows, pLoadRec->totalCheckedRows);
}

L
Liu Jicong 已提交
1675 1676 1677
// static void updateOffsetVal(STaskRuntimeEnv *pRuntimeEnv, SDataBlockInfo *pBlockInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
1678
//
L
Liu Jicong 已提交
1679
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1680
//
L
Liu Jicong 已提交
1681 1682 1683 1684
//   if (pQueryAttr->limit.offset == pBlockInfo->rows) {  // current block will ignore completed
//     pTableQueryInfo->lastKey = QUERY_IS_ASC_QUERY(pQueryAttr) ? pBlockInfo->window.ekey + step :
//     pBlockInfo->window.skey + step; pQueryAttr->limit.offset = 0; return;
//   }
1685
//
L
Liu Jicong 已提交
1686 1687 1688 1689 1690
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     pQueryAttr->pos = (int32_t)pQueryAttr->limit.offset;
//   } else {
//     pQueryAttr->pos = pBlockInfo->rows - (int32_t)pQueryAttr->limit.offset - 1;
//   }
1691
//
L
Liu Jicong 已提交
1692
//   assert(pQueryAttr->pos >= 0 && pQueryAttr->pos <= pBlockInfo->rows - 1);
1693
//
L
Liu Jicong 已提交
1694 1695
//   SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//   SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1696
//
L
Liu Jicong 已提交
1697 1698
//   // update the pQueryAttr->limit.offset value, and pQueryAttr->pos value
//   TSKEY *keys = (TSKEY *) pColInfoData->pData;
1699
//
L
Liu Jicong 已提交
1700 1701 1702
//   // update the offset value
//   pTableQueryInfo->lastKey = keys[pQueryAttr->pos];
//   pQueryAttr->limit.offset = 0;
1703
//
L
Liu Jicong 已提交
1704
//   int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
1705
//
L
Liu Jicong 已提交
1706 1707 1708 1709
//   //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numBlocksOfStep:%d, numOfRes:%d,
//   lastKey:%"PRId64, GET_TASKID(pRuntimeEnv),
//          pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes, pQuery->current->lastKey);
// }
1710

L
Liu Jicong 已提交
1711 1712
// void skipBlocks(STaskRuntimeEnv *pRuntimeEnv) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
1713
//
L
Liu Jicong 已提交
1714 1715 1716
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0) {
//     return;
//   }
1717
//
L
Liu Jicong 已提交
1718 1719
//   pQueryAttr->pos = 0;
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1720
//
L
Liu Jicong 已提交
1721 1722
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
//   TsdbQueryHandleT pTsdbReadHandle = pRuntimeEnv->pTsdbReadHandle;
1723
//
L
Liu Jicong 已提交
1724 1725 1726 1727 1728
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pTsdbReadHandle)) {
//     if (isTaskKilled(pRuntimeEnv->qinfo)) {
//       longjmp(pRuntimeEnv->env, TSDB_CODE_TSC_QUERY_CANCELLED);
//     }
1729
//
L
Liu Jicong 已提交
1730
//     tsdbRetrieveDataBlockInfo(pTsdbReadHandle, &blockInfo);
1731
//
L
Liu Jicong 已提交
1732 1733 1734 1735
//     if (pQueryAttr->limit.offset > blockInfo.rows) {
//       pQueryAttr->limit.offset -= blockInfo.rows;
//       pTableQueryInfo->lastKey = (QUERY_IS_ASC_QUERY(pQueryAttr)) ? blockInfo.window.ekey : blockInfo.window.skey;
//       pTableQueryInfo->lastKey += step;
1736
//
L
Liu Jicong 已提交
1737 1738 1739 1740 1741 1742 1743
//       //qDebug("QInfo:0x%"PRIx64" skip rows:%d, offset:%" PRId64, GET_TASKID(pRuntimeEnv), blockInfo.rows,
//              pQuery->limit.offset);
//     } else {  // find the appropriated start position in current block
//       updateOffsetVal(pRuntimeEnv, &blockInfo);
//       break;
//     }
//   }
1744
//
L
Liu Jicong 已提交
1745 1746 1747 1748 1749 1750 1751 1752 1753
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
// }

// static TSKEY doSkipIntervalProcess(STaskRuntimeEnv* pRuntimeEnv, STimeWindow* win, SDataBlockInfo* pBlockInfo,
// STableQueryInfo* pTableQueryInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
1754
//
L
Liu Jicong 已提交
1755 1756 1757
//   assert(pQueryAttr->limit.offset == 0);
//   STimeWindow tw = *win;
//   getNextTimeWindow(pQueryAttr, &tw);
1758
//
L
Liu Jicong 已提交
1759 1760
//   if ((tw.skey <= pBlockInfo->window.ekey && QUERY_IS_ASC_QUERY(pQueryAttr)) ||
//       (tw.ekey >= pBlockInfo->window.skey && !QUERY_IS_ASC_QUERY(pQueryAttr))) {
1761
//
L
Liu Jicong 已提交
1762 1763 1764 1765
//     // load the data block and check data remaining in current data block
//     // TODO optimize performance
//     SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//     SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1766
//
L
Liu Jicong 已提交
1767 1768 1769 1770
//     tw = *win;
//     int32_t startPos =
//         getNextQualifiedWindow(pQueryAttr, &tw, pBlockInfo, pColInfoData->pData, binarySearchForKey, -1);
//     assert(startPos >= 0);
1771
//
L
Liu Jicong 已提交
1772 1773
//     // set the abort info
//     pQueryAttr->pos = startPos;
1774
//
L
Liu Jicong 已提交
1775 1776 1777 1778
//     // reset the query start timestamp
//     pTableQueryInfo->win.skey = ((TSKEY *)pColInfoData->pData)[startPos];
//     pQueryAttr->window.skey = pTableQueryInfo->win.skey;
//     TSKEY key = pTableQueryInfo->win.skey;
1779
//
L
Liu Jicong 已提交
1780 1781
//     pWindowResInfo->prevSKey = tw.skey;
//     int32_t index = pRuntimeEnv->resultRowInfo.curIndex;
1782
//
L
Liu Jicong 已提交
1783 1784
//     int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
//     pRuntimeEnv->resultRowInfo.curIndex = index;  // restore the window index
1785
//
L
Liu Jicong 已提交
1786 1787 1788 1789
//     //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numOfRows:%d, numOfRes:%d,
//     lastKey:%" PRId64,
//            GET_TASKID(pRuntimeEnv), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes,
//            pQueryAttr->current->lastKey);
1790
//
L
Liu Jicong 已提交
1791 1792 1793 1794 1795
//     return key;
//   } else {  // do nothing
//     pQueryAttr->window.skey      = tw.skey;
//     pWindowResInfo->prevSKey = tw.skey;
//     pTableQueryInfo->lastKey = tw.skey;
1796
//
L
Liu Jicong 已提交
1797 1798
//     return tw.skey;
//   }
1799
//
L
Liu Jicong 已提交
1800 1801 1802 1803 1804 1805 1806 1807 1808 1809
//   return true;
// }

// static bool skipTimeInterval(STaskRuntimeEnv *pRuntimeEnv, TSKEY* start) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     assert(*start <= pRuntimeEnv->current->lastKey);
//   } else {
//     assert(*start >= pRuntimeEnv->current->lastKey);
//   }
1810
//
L
Liu Jicong 已提交
1811 1812 1813 1814 1815
//   // if queried with value filter, do NOT forward query start position
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0 || pRuntimeEnv->pTsBuf != NULL ||
//   pRuntimeEnv->pFillInfo != NULL) {
//     return true;
//   }
1816
//
L
Liu Jicong 已提交
1817 1818 1819 1820 1821 1822 1823
//   /*
//    * 1. for interval without interpolation query we forward pQueryAttr->interval.interval at a time for
//    *    pQueryAttr->limit.offset times. Since hole exists, pQueryAttr->interval.interval*pQueryAttr->limit.offset
//    value is
//    *    not valid. otherwise, we only forward pQueryAttr->limit.offset number of points
//    */
//   assert(pRuntimeEnv->resultRowInfo.prevSKey == TSKEY_INITIAL_VAL);
1824
//
L
Liu Jicong 已提交
1825 1826
//   STimeWindow w = TSWINDOW_INITIALIZER;
//   bool ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1827
//
L
Liu Jicong 已提交
1828 1829
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
//   STableQueryInfo *pTableQueryInfo = pRuntimeEnv->current;
1830
//
L
Liu Jicong 已提交
1831 1832 1833
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pRuntimeEnv->pTsdbReadHandle)) {
//     tsdbRetrieveDataBlockInfo(pRuntimeEnv->pTsdbReadHandle, &blockInfo);
1834
//
L
Liu Jicong 已提交
1835 1836 1837 1838 1839 1840 1841 1842 1843
//     if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       if (pWindowResInfo->prevSKey == TSKEY_INITIAL_VAL) {
//         getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.skey, blockInfo.window.skey, pQueryAttr->window.ekey,
//         &w); pWindowResInfo->prevSKey = w.skey;
//       }
//     } else {
//       getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.ekey, pQueryAttr->window.ekey, blockInfo.window.ekey, &w);
//       pWindowResInfo->prevSKey = w.skey;
//     }
1844
//
L
Liu Jicong 已提交
1845 1846
//     // the first time window
//     STimeWindow win = getActiveTimeWindow(pWindowResInfo, pWindowResInfo->prevSKey, pQueryAttr);
1847
//
L
Liu Jicong 已提交
1848 1849
//     while (pQueryAttr->limit.offset > 0) {
//       STimeWindow tw = win;
1850
//
L
Liu Jicong 已提交
1851 1852 1853
//       if ((win.ekey <= blockInfo.window.ekey && ascQuery) || (win.ekey >= blockInfo.window.skey && !ascQuery)) {
//         pQueryAttr->limit.offset -= 1;
//         pWindowResInfo->prevSKey = win.skey;
1854
//
L
Liu Jicong 已提交
1855 1856 1857 1858 1859 1860
//         // current time window is aligned with blockInfo.window.ekey
//         // restart it from next data block by set prevSKey to be TSKEY_INITIAL_VAL;
//         if ((win.ekey == blockInfo.window.ekey && ascQuery) || (win.ekey == blockInfo.window.skey && !ascQuery)) {
//           pWindowResInfo->prevSKey = TSKEY_INITIAL_VAL;
//         }
//       }
1861
//
L
Liu Jicong 已提交
1862 1863 1864 1865
//       if (pQueryAttr->limit.offset == 0) {
//         *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//         return true;
//       }
1866
//
L
Liu Jicong 已提交
1867 1868
//       // current window does not ended in current data block, try next data block
//       getNextTimeWindow(pQueryAttr, &tw);
1869
//
L
Liu Jicong 已提交
1870 1871 1872 1873 1874 1875 1876 1877 1878
//       /*
//        * If the next time window still starts from current data block,
//        * load the primary timestamp column first, and then find the start position for the next queried time window.
//        * Note that only the primary timestamp column is required.
//        * TODO: Optimize for this cases. All data blocks are not needed to be loaded, only if the first actually
//        required
//        * time window resides in current data block.
//        */
//       if ((tw.skey <= blockInfo.window.ekey && ascQuery) || (tw.ekey >= blockInfo.window.skey && !ascQuery)) {
1879
//
L
Liu Jicong 已提交
1880 1881
//         SArray *pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//         SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1882
//
L
Liu Jicong 已提交
1883 1884 1885
//         if ((win.ekey > blockInfo.window.ekey && ascQuery) || (win.ekey < blockInfo.window.skey && !ascQuery)) {
//           pQueryAttr->limit.offset -= 1;
//         }
1886
//
L
Liu Jicong 已提交
1887 1888 1889 1890 1891 1892 1893 1894
//         if (pQueryAttr->limit.offset == 0) {
//           *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//           return true;
//         } else {
//           tw = win;
//           int32_t startPos =
//               getNextQualifiedWindow(pQueryAttr, &tw, &blockInfo, pColInfoData->pData, binarySearchForKey, -1);
//           assert(startPos >= 0);
1895
//
L
Liu Jicong 已提交
1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906
//           // set the abort info
//           pQueryAttr->pos = startPos;
//           pTableQueryInfo->lastKey = ((TSKEY *)pColInfoData->pData)[startPos];
//           pWindowResInfo->prevSKey = tw.skey;
//           win = tw;
//         }
//       } else {
//         break;  // offset is not 0, and next time window begins or ends in the next block.
//       }
//     }
//   }
1907
//
L
Liu Jicong 已提交
1908 1909 1910 1911
//   // check for error
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
1912
//
L
Liu Jicong 已提交
1913 1914
//   return true;
// }
1915

1916
/*
 * Install pDownstream[0..num) as the downstream operator list of p.
 *
 * A private copy of the pointer array is made, so the caller keeps ownership of pDownstream itself.
 * A previously installed list is replaced (only the old pointer array is freed, not the operators it
 * referenced). On allocation failure p is left unchanged.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the copy cannot be allocated.
 */
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num) {
  if (p->pDownstream == NULL) {
    assert(p->numOfDownstream == 0);
  }

  // allocate into a temporary first so that a failure does not clobber the existing list
  void* pList = taosMemoryCalloc(1, num * POINTER_BYTES);
  if (pList == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // copy before freeing: pDownstream may alias the list that is about to be replaced
  memcpy(pList, pDownstream, num * POINTER_BYTES);

  if (p->pDownstream != NULL) {
    taosMemoryFree(p->pDownstream);
  }

  p->pDownstream = pList;
  p->numOfDownstream = num;
  return TSDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
1931
// Forward declaration; the definition is not visible in this part of the file.
static void doDestroyTableList(STableListInfo* pTableqinfoList);
1932

1933
/*
 * Currently a no-op: the sanity checks below are compiled out with "#if 0".
 * When enabled they assert that the table query window and lastKey are consistent with the task window
 * for the given scan order.
 */
static void doTableQueryInfoTimeWindowCheck(SExecTaskInfo* pTaskInfo, STableQueryInfo* pTableQueryInfo, int32_t order) {
#if 0
  if (order == TSDB_ORDER_ASC) {
    assert(
        (pTableQueryInfo->win.skey <= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey >= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey >= pTaskInfo->window.skey && pTableQueryInfo->win.ekey <= pTaskInfo->window.ekey));
  } else {
    assert(
        (pTableQueryInfo->win.skey >= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey <= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey <= pTaskInfo->window.skey && pTableQueryInfo->win.ekey >= pTaskInfo->window.ekey));
  }
#endif
}

1949 1950 1951 1952
// Callback parameter attached to one outstanding fetch request and consumed by loadRemoteDataCallback.
typedef struct SFetchRspHandleWrapper {
  uint32_t exchangeId;   // reference id used with taosAcquireRef(exchangeObjRefPool, ...) to look up the exchange info
  int32_t  sourceIndex;  // index into the pSourceDataInfo array of that exchange info
} SFetchRspHandleWrapper;
1953

D
dapan1121 已提交
1954
/*
 * Callback invoked with the response (or failure code) of a fetch request sent by the exchange operator.
 *
 * param is the SFetchRspHandleWrapper created when the request was sent; it is always freed here.
 * pMsg->pData is the response payload. On success its header fields are converted to host byte order and
 * the payload is handed over to the matching SSourceDataInfo (pRsp). In every other case the payload is
 * freed here, since nothing else will consume it.
 *
 * The source is marked EX_SOURCE_DATA_READY and the "ready" semaphore of the exchange info is posted so
 * that the waiting operator can pick up either the data or the error code.
 *
 * Always returns TSDB_CODE_SUCCESS.
 */
int32_t loadRemoteDataCallback(void* param, SDataBuf* pMsg, int32_t code) {
  SFetchRspHandleWrapper* pWrapper = (SFetchRspHandleWrapper*)param;

  SExchangeInfo* pExchangeInfo = taosAcquireRef(exchangeObjRefPool, pWrapper->exchangeId);
  if (pExchangeInfo == NULL) {
    qWarn("failed to acquire exchange operator, since it may have been released");

    // the consumer is gone: drop the payload and the wrapper instead of leaking them
    if (pMsg->pData != NULL) {
      taosMemoryFree(pMsg->pData);
      pMsg->pData = NULL;
    }
    taosMemoryFree(pWrapper);
    return TSDB_CODE_SUCCESS;
  }

  int32_t          index = pWrapper->sourceIndex;
  SSourceDataInfo* pSourceDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, index);

  if (code == TSDB_CODE_SUCCESS) {
    pSourceDataInfo->pRsp = pMsg->pData;

    SRetrieveTableRsp* pRsp = pSourceDataInfo->pRsp;
    // validate before the header is touched
    ASSERT(pRsp != NULL);

    pRsp->numOfRows = htonl(pRsp->numOfRows);
    pRsp->compLen = htonl(pRsp->compLen);
    pRsp->numOfCols = htonl(pRsp->numOfCols);
    pRsp->useconds = htobe64(pRsp->useconds);

    qDebug("%s fetch rsp received, index:%d, rows:%d", pSourceDataInfo->taskId, index, pRsp->numOfRows);
  } else {
    // the payload is not handed over on failure, release it here
    if (pMsg->pData != NULL) {
      taosMemoryFree(pMsg->pData);
      pMsg->pData = NULL;
    }
    pSourceDataInfo->code = code;
  }

  pSourceDataInfo->status = EX_SOURCE_DATA_READY;

  tsem_post(&pExchangeInfo->ready);
  taosReleaseRef(exchangeObjRefPool, pWrapper->exchangeId);

  taosMemoryFree(pWrapper);
  return TSDB_CODE_SUCCESS;
}

/*
 * Release a send-message descriptor together with the message payload stored in msgInfo.pData.
 * The "param" member is not touched here.
 */
static void destroySendMsgInfo(SMsgSendInfo* pMsgBody) {
  assert(NULL != pMsgBody);

  // payload first, then the descriptor that refers to it
  taosMemoryFreeClear(pMsgBody->msgInfo.pData);
  taosMemoryFreeClear(pMsgBody);
}

D
dapan1121 已提交
1996
/*
 * Dispatch an rpc response to the callback registered in the SMsgSendInfo carried by pMsg->info.ahandle.
 *
 * The response content is copied into a freshly allocated buffer that is passed to the callback; when the
 * copy cannot be allocated, terrno and pMsg->code are set to TSDB_CODE_OUT_OF_MEMORY and the callback is
 * invoked with a NULL payload. Afterwards the rpc content and the send info are released.
 */
void qProcessRspMsg(void* parent, SRpcMsg* pMsg, SEpSet* pEpSet) {
  assert(pMsg->info.ahandle != NULL);
  SMsgSendInfo* pSendInfo = (SMsgSendInfo*)pMsg->info.ahandle;

  SDataBuf buf = {.len = pMsg->contLen, .pData = NULL};

  if (pMsg->contLen > 0) {
    buf.pData = taosMemoryCalloc(1, pMsg->contLen);
    if (buf.pData != NULL) {
      memcpy(buf.pData, pMsg->pCont, pMsg->contLen);
    } else {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      pMsg->code = TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  pSendInfo->fp(pSendInfo->param, &buf, pMsg->code);

  rpcFreeCont(pMsg->pCont);
  destroySendMsgInfo(pSendInfo);
}

L
Liu Jicong 已提交
2017
/*
 * Build a fetch request for the source at sourceIndex and send it asynchronously.
 *
 * The request body (SResFetchReq, fields in network byte order), the send descriptor (SMsgSendInfo) and
 * the callback parameter (SFetchRspHandleWrapper) are allocated here; loadRemoteDataCallback is
 * registered as the response handler.
 *
 * Returns TSDB_CODE_QRY_OUT_OF_MEMORY (also stored in pTaskInfo->code) when one of the allocations fails;
 * everything allocated so far is released in that case. Otherwise TSDB_CODE_SUCCESS is returned; a failure
 * reported by asyncSendMsgToServer is only logged, the return value is kept as before.
 */
static int32_t doSendFetchDataRequest(SExchangeInfo* pExchangeInfo, SExecTaskInfo* pTaskInfo, int32_t sourceIndex) {
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  SResFetchReq* pMsg = taosMemoryCalloc(1, sizeof(SResFetchReq));
  if (NULL == pMsg) {
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, sourceIndex);
  SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, sourceIndex);

  ASSERT(pDataInfo->status == EX_SOURCE_DATA_NOT_READY);

  qDebug("%s build fetch msg and send to vgId:%d, ep:%s, taskId:0x%" PRIx64 ", execId:%d, %d/%" PRIzu,
         GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->addr.epSet.eps[0].fqdn, pSource->taskId, pSource->execId,
         sourceIndex, totalSources);

  pMsg->header.vgId = htonl(pSource->addr.nodeId);
  pMsg->sId = htobe64(pSource->schedId);
  pMsg->taskId = htobe64(pSource->taskId);
  pMsg->queryId = htobe64(pTaskInfo->id.queryId);
  pMsg->execId = htonl(pSource->execId);

  // send the fetch remote task result request
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (NULL == pMsgSendInfo) {
    taosMemoryFreeClear(pMsg);
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SMsgSendInfo));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SFetchRspHandleWrapper* pWrapper = taosMemoryCalloc(1, sizeof(SFetchRspHandleWrapper));
  if (NULL == pWrapper) {
    // the wrapper is dereferenced right below, bail out instead of crashing
    taosMemoryFreeClear(pMsg);
    taosMemoryFreeClear(pMsgSendInfo);
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SFetchRspHandleWrapper));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  pWrapper->exchangeId = pExchangeInfo->self;
  pWrapper->sourceIndex = sourceIndex;

  pMsgSendInfo->param = pWrapper;
  pMsgSendInfo->msgInfo.pData = pMsg;
  pMsgSendInfo->msgInfo.len = sizeof(SResFetchReq);
  pMsgSendInfo->msgType = pSource->fetchMsgType;
  pMsgSendInfo->fp = loadRemoteDataCallback;

  int64_t transporterId = 0;
  int32_t code = asyncSendMsgToServer(pExchangeInfo->pTransporter, &pSource->addr.epSet, &transporterId, pMsgSendInfo);
  if (code != TSDB_CODE_SUCCESS) {
    // NOTE(review): the send failure is not propagated to keep the existing contract with the callers;
    // confirm whether they should be told so they do not wait for a response that never arrives.
    qError("%s failed to send fetch request, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
  }

  return TSDB_CODE_SUCCESS;
}

2065
/*
 * Decode the payload of a fetch response into pRes and update the load statistics.
 *
 * Without a column list the payload is decoded straight into pRes. With a column list the payload starts
 * with a column count followed by that many SSysTableSchema entries (converted to host byte order in
 * place); the data is decoded into a temporary block and the requested columns are relocated into pRes.
 *
 * pLoadInfo accumulates rows, compLen bytes and the time elapsed since startTs; *total, when given, is
 * increased by numOfRows. Always returns TSDB_CODE_SUCCESS.
 */
int32_t extractDataBlockFromFetchRsp(SSDataBlock* pRes, SLoadRemoteDataInfo* pLoadInfo, int32_t numOfRows, char* pData,
                                     int32_t compLen, int32_t numOfOutput, int64_t startTs, uint64_t* total,
                                     SArray* pColList) {
  if (pColList != NULL) {
    // extract data according to pColList
    ASSERT(numOfOutput == taosArrayGetSize(pColList));

    char*   pCursor = pData;
    int32_t numOfCols = htonl(*(int32_t*)pCursor);
    pCursor += sizeof(int32_t);

    // todo refactor:extract method
    SSysTableSchema* pSchema = (SSysTableSchema*)pCursor;
    for (int32_t i = 0; i < numOfCols; ++i) {
      SSysTableSchema* pEntry = (SSysTableSchema*)pCursor;

      pEntry->colId = htons(pEntry->colId);
      pEntry->bytes = htonl(pEntry->bytes);
      pCursor += sizeof(SSysTableSchema);
    }

    // temporary block carrying every column described by the schema
    SSDataBlock* pTmpBlock = createDataBlock();
    for (int32_t i = 0; i < numOfCols; ++i) {
      SColumnInfoData colInfo = createColumnInfoData(pSchema[i].type, pSchema[i].bytes, pSchema[i].colId);
      blockDataAppendColInfo(pTmpBlock, &colInfo);
    }

    blockDecode(pTmpBlock, numOfCols, numOfRows, pCursor);
    blockDataEnsureCapacity(pRes, numOfRows);

    // data from mnode
    pRes->info.rows = numOfRows;
    relocateColumnData(pRes, pColList, pTmpBlock->pDataBlock, false);
    blockDataDestroy(pTmpBlock);
  } else {
    // data from other sources
    blockDataCleanup(pRes);
    blockDecode(pRes, numOfOutput, numOfRows, pData);
  }

  // todo move this to time window aggregator, since the primary timestamp may not be known by exchange operator.
  blockDataUpdateTsWindow(pRes, 0);

  int64_t elapsed = taosGetTimestampUs() - startTs;

  pLoadInfo->totalRows += numOfRows;
  pLoadInfo->totalSize += compLen;

  if (total != NULL) {
    *total += numOfRows;
  }

  pLoadInfo->totalElapsed += elapsed;
  return TSDB_CODE_SUCCESS;
}
2119

L
Liu Jicong 已提交
2120 2121
/*
 * Finish the exchange operator after every source has been drained.
 *
 * Adds the time elapsed since startTs (microseconds, as produced by
 * taosGetTimestampUs()) to the accumulated load statistics, logs a summary and
 * marks the operator as completed.
 *
 * Always returns NULL so that callers can write
 * `return setAllSourcesCompleted(...)` to signal "no more data".
 */
static void* setAllSourcesCompleted(SOperatorInfo* pOperator, int64_t startTs) {
  SExecTaskInfo*       pTask = pOperator->pTaskInfo;
  SExchangeInfo*       pExchange = pOperator->info;
  SLoadRemoteDataInfo* pStat = &pExchange->loadInfo;

  int64_t elapsedUs = taosGetTimestampUs() - startTs;
  pStat->totalElapsed += elapsedUs;

  size_t numOfSources = taosArrayGetSize(pExchange->pSources);
  qDebug("%s all %" PRIzu " sources are exhausted, total rows: %" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
         GET_TASKID(pTask), numOfSources, pStat->totalRows, pStat->totalSize, pStat->totalElapsed / 1000.0);

  doSetOperatorCompleted(pOperator);
  return NULL;
}

L
Liu Jicong 已提交
2138 2139
/*
 * Return the next result block when all sources are fetched concurrently.
 *
 * The source list is scanned repeatedly. Sources already exhausted are counted,
 * sources whose status is not EX_SOURCE_DATA_READY are skipped, and the first
 * ready source is consumed:
 *   - an empty response marks the source as exhausted and the scan continues;
 *   - otherwise the payload is decoded into pExchangeInfo->pResult, the response
 *     buffer is released, a new fetch request is issued unless the source
 *     reported completion, and the result block is returned.
 *
 * When a full scan finds every source exhausted, the operator is completed and
 * NULL is returned. On any error pTaskInfo->code is set and NULL is returned.
 *
 * NOTE: this function does not block between scans; it keeps re-scanning until
 * some source becomes ready or all of them are exhausted.
 */
static SSDataBlock* concurrentlyLoadRemoteDataImpl(SOperatorInfo* pOperator, SExchangeInfo* pExchangeInfo,
                                                   SExecTaskInfo* pTaskInfo) {
  int32_t code = 0;
  int64_t startTs = taosGetTimestampUs();
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  for (;;) {
    int32_t completed = 0;

    for (int32_t i = 0; i < totalSources; ++i) {
      SSourceDataInfo* pSrcData = taosArrayGet(pExchangeInfo->pSourceDataInfo, i);

      // the status is read in the same order as before; it is presumably updated by the response handler
      if (pSrcData->status == EX_SOURCE_DATA_EXHAUSTED) {
        completed += 1;
        continue;
      }

      if (pSrcData->status != EX_SOURCE_DATA_READY) {
        continue;
      }

      // the response for this source has arrived: check whether the remote side failed
      if (pSrcData->code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = pSrcData->code;
        return NULL;
      }

      SRetrieveTableRsp*     pRsp = pSrcData->pRsp;
      SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, i);
      SSDataBlock*           pRes = pExchangeInfo->pResult;
      SLoadRemoteDataInfo*   pLoadInfo = &pExchangeInfo->loadInfo;

      if (pRsp->numOfRows == 0) {  // nothing left in this source, try the next one
        qDebug("%s vgId:%d, taskId:0x%" PRIx64 " execId:%d index:%d completed, rowsOfSource:%" PRIu64
               ", totalRows:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pSrcData->totalRows,
               pExchangeInfo->loadInfo.totalRows, completed + 1, i + 1, totalSources);
        pSrcData->status = EX_SOURCE_DATA_EXHAUSTED;
        completed += 1;
        taosMemoryFreeClear(pSrcData->pRsp);
        continue;
      }

      code = extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pRsp->numOfRows, pRsp->data,
                                          pRsp->compLen, pRsp->numOfCols, startTs, &pSrcData->totalRows, NULL);
      if (code != 0) {
        taosMemoryFreeClear(pSrcData->pRsp);
        pTaskInfo->code = code;
        return NULL;
      }

      if (pRsp->completed == 1) {
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d"
               " index:%d completed, numOfRows:%d, rowsOfSource:%" PRIu64 ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64
               ", completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pRes->info.rows,
               pSrcData->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, completed + 1, i + 1, totalSources);
        completed += 1;
        pSrcData->status = EX_SOURCE_DATA_EXHAUSTED;
      } else {
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
               ", totalBytes:%" PRIu64,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
               pLoadInfo->totalRows, pLoadInfo->totalSize);
      }

      // the payload has been decoded into the result block, the raw response is no longer needed
      taosMemoryFreeClear(pSrcData->pRsp);

      if (pSrcData->status != EX_SOURCE_DATA_EXHAUSTED) {
        // more data is pending on this source: ask for the next batch right away
        pSrcData->status = EX_SOURCE_DATA_NOT_READY;
        code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
        if (code != TSDB_CODE_SUCCESS) {
          taosMemoryFreeClear(pSrcData->pRsp);
          pTaskInfo->code = code;
          return NULL;
        }
      }

      return pExchangeInfo->pResult;
    }

    if (completed == totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
    }
  }
}

L
Liu Jicong 已提交
2227 2228 2229
/*
 * Open step for the concurrent loading mode.
 *
 * Sends one fetch request to every source, stopping at the first request that
 * fails (the error is stored in pTaskInfo->code and returned). On success the
 * operator status becomes OP_RES_TO_RETURN, the open cost is recorded, and the
 * function waits once on the exchange "ready" semaphore before returning
 * TSDB_CODE_SUCCESS.
 */
static int32_t prepareConcurrentlyLoad(SOperatorInfo* pOperator) {
  SExecTaskInfo* pTask = pOperator->pTaskInfo;
  SExchangeInfo* pExchange = pOperator->info;

  size_t  numOfSources = taosArrayGetSize(pExchange->pSources);
  int64_t beginUs = taosGetTimestampUs();

  // fire the fetch requests for all sources without waiting for any response
  int32_t idx = 0;
  while (idx < numOfSources) {
    int32_t code = doSendFetchDataRequest(pExchange, pTask, idx);
    if (code != TSDB_CODE_SUCCESS) {
      pTask->code = code;
      return code;
    }

    ++idx;
  }

  int64_t sentUs = taosGetTimestampUs();
  qDebug("%s send all fetch requests to %" PRIzu " sources completed, elapsed:%.2fms", GET_TASKID(pTask),
         numOfSources, (sentUs - beginUs) / 1000.0);

  pOperator->status = OP_RES_TO_RETURN;
  pOperator->cost.openCost = taosGetTimestampUs() - beginUs;

  tsem_wait(&pExchange->ready);
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
2254 2255 2256
/*
 * Return the next result block when sources are fetched one after another.
 *
 * For the current source a fetch request is sent and the function waits on the
 * exchange "ready" semaphore for the response. An empty response marks the
 * source as exhausted and moves on to the next one; a non-empty response is
 * decoded into pExchangeInfo->pResult and returned. When pExchangeInfo->current
 * passes the last source, the operator is completed and NULL is returned.
 *
 * On failure the task error code is set and NULL is returned. This covers a
 * fetch request that could not be sent, an error reported for the source, and a
 * response that could not be decoded.
 */
static SSDataBlock* seqLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
  int64_t startTs = taosGetTimestampUs();

  while (1) {
    if (pExchangeInfo->current >= totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
    }

    // Same policy as the concurrent loader: a failed send is fatal. Waiting on the semaphore
    // after a request that was not issued could block forever.
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, pExchangeInfo->current);
    if (code != TSDB_CODE_SUCCESS) {
      pTaskInfo->code = code;
      return NULL;
    }

    tsem_wait(&pExchangeInfo->ready);

    SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, pExchangeInfo->current);
    SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, pExchangeInfo->current);

    if (pDataInfo->code != TSDB_CODE_SUCCESS) {
      qError("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d error happens, code:%s", GET_TASKID(pTaskInfo),
             pSource->addr.nodeId, pSource->taskId, pSource->execId, tstrerror(pDataInfo->code));
      pOperator->pTaskInfo->code = pDataInfo->code;
      return NULL;
    }

    SRetrieveTableRsp*   pRsp = pDataInfo->pRsp;
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
    if (pRsp->numOfRows == 0) {  // this source has nothing left, continue with the next one
      qDebug("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d %d of total completed, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 " try next",
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pExchangeInfo->current + 1,
             pDataInfo->totalRows, pLoadInfo->totalRows);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
      taosMemoryFreeClear(pDataInfo->pRsp);
      continue;
    }

    SSDataBlock* pRes = pExchangeInfo->pResult;
    code = extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pRsp->numOfRows, pRsp->data, pRsp->compLen,
                                        pRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
    if (code != TSDB_CODE_SUCCESS) {
      // do not hand a partially decoded block to the caller
      taosMemoryFreeClear(pDataInfo->pRsp);
      pTaskInfo->code = code;
      return NULL;
    }

    if (pRsp->completed == 1) {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64 " try next %d/%" PRIzu,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, pExchangeInfo->current + 1,
             totalSources);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
    } else {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
             ", totalBytes:%" PRIu64,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pLoadInfo->totalRows, pLoadInfo->totalSize);
    }

    pOperator->resultInfo.totalRows += pRes->info.rows;
    taosMemoryFreeClear(pDataInfo->pRsp);
    return pExchangeInfo->pResult;
  }
}

L
Liu Jicong 已提交
2321
/*
 * Open function of the exchange operator.
 *
 * Does nothing when the operator is already opened. Otherwise, in concurrent
 * mode (seqLoadData == false) the fetch requests are sent to all sources first;
 * a failure there is returned as is and the operator stays un-opened. On success
 * the operator is flagged as opened and the elapsed time divided by 1000.0 is
 * stored as the open cost.
 */
static int32_t prepareLoadRemoteData(SOperatorInfo* pOperator) {
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
  }

  int64_t        beginUs = taosGetTimestampUs();
  SExchangeInfo* pExchange = pOperator->info;

  int32_t code = TSDB_CODE_SUCCESS;
  if (!pExchange->seqLoadData) {
    code = prepareConcurrentlyLoad(pOperator);
  }

  if (code == TSDB_CODE_SUCCESS) {
    OPTR_SET_OPENED(pOperator);
    pOperator->cost.openCost = (taosGetTimestampUs() - beginUs) / 1000.0;
  }

  return code;
}

2341
/*
 * Fetch function of the exchange operator.
 *
 * Runs the operator's open function first and stores its result in the task
 * error code; NULL is returned if opening failed. NULL is also returned, after
 * logging the accumulated statistics, when the operator is already in the
 * OP_EXEC_DONE state. Otherwise the call is forwarded to the sequential or the
 * concurrent loader depending on seqLoadData.
 */
static SSDataBlock* doLoadRemoteData(SOperatorInfo* pOperator) {
  SExecTaskInfo* pTask = pOperator->pTaskInfo;
  SExchangeInfo* pExchange = pOperator->info;

  int32_t openCode = pOperator->fpSet._openFn(pOperator);
  pTask->code = openCode;
  if (openCode != TSDB_CODE_SUCCESS) {
    return NULL;
  }

  if (pOperator->status == OP_EXEC_DONE) {
    size_t               numOfSources = taosArrayGetSize(pExchange->pSources);
    SLoadRemoteDataInfo* pStat = &pExchange->loadInfo;

    qDebug("%s all %" PRIzu " source(s) are exhausted, total rows:%" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
           GET_TASKID(pTask), numOfSources, pStat->totalRows, pStat->totalSize, pStat->totalElapsed / 1000.0);
    return NULL;
  }

  return pExchange->seqLoadData ? seqLoadRemoteData(pOperator)
                                : concurrentlyLoadRemoteDataImpl(pOperator, pExchange, pTask);
}
2366

2367
/*
 * Create the per-source bookkeeping array of an exchange operator.
 *
 * One SSourceDataInfo entry is appended for each of the numOfSources sources,
 * initialised with status EX_SOURCE_DATA_NOT_READY, the given task id string
 * and its own index.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the array cannot
 * be created or extended. On failure pInfo->pSourceDataInfo is left NULL, so a
 * later cleanup of pInfo does not touch the released array again.
 */
static int32_t initDataSource(int32_t numOfSources, SExchangeInfo* pInfo, const char* id) {
  pInfo->pSourceDataInfo = taosArrayInit(numOfSources, sizeof(SSourceDataInfo));
  if (pInfo->pSourceDataInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  for (int32_t i = 0; i < numOfSources; ++i) {
    SSourceDataInfo dataInfo = {0};
    dataInfo.status = EX_SOURCE_DATA_NOT_READY;
    dataInfo.taskId = id;
    dataInfo.index = i;

    SSourceDataInfo* pDs = taosArrayPush(pInfo->pSourceDataInfo, &dataInfo);
    if (pDs == NULL) {
      taosArrayDestroy(pInfo->pSourceDataInfo);
      pInfo->pSourceDataInfo = NULL;  // avoid a dangling pointer: the caller's error path destroys pInfo
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
}

2388
/*
 * Initialise the source related members of an exchange operator.
 *
 * Copies every downstream source node listed in pExNode->pSrcEndPoints into
 * pInfo->pSources, registers pInfo in the exchange reference pool and creates
 * the per-source bookkeeping array.
 *
 * Returns TSDB_CODE_INVALID_PARA when the plan node has no source or a source
 * node cannot be retrieved, TSDB_CODE_OUT_OF_MEMORY on allocation failure,
 * otherwise the result of initDataSource(). Members that were already set up
 * are not released here; the caller is expected to destroy pInfo on failure.
 */
static int32_t initExchangeOperator(SExchangePhysiNode* pExNode, SExchangeInfo* pInfo, const char* id) {
  size_t numOfSources = LIST_LENGTH(pExNode->pSrcEndPoints);

  if (numOfSources == 0) {
    qError("%s invalid number: %d of sources in exchange operator", id, (int32_t)numOfSources);
    return TSDB_CODE_INVALID_PARA;
  }

  pInfo->pSources = taosArrayInit(numOfSources, sizeof(SDownstreamSourceNode));
  if (pInfo->pSources == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  for (int32_t i = 0; i < (int32_t)numOfSources; ++i) {
    SDownstreamSourceNode* pNode = (SDownstreamSourceNode*)nodesListGetNode((SNodeList*)pExNode->pSrcEndPoints, i);
    if (pNode == NULL) {  // never copy from a NULL element
      return TSDB_CODE_INVALID_PARA;
    }

    // a failed push must not be ignored: later code indexes pSources by source number
    if (taosArrayPush(pInfo->pSources, pNode) == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  pInfo->self = taosAddRef(exchangeObjRefPool, pInfo);

  return initDataSource(numOfSources, pInfo, id);
}

/*
 * Create an exchange operator for the given physical plan node.
 *
 * pTransporter is stored in the operator and pExNode supplies the list of
 * downstream sources and the output block description.
 *
 * Returns the new operator, or NULL on failure. On failure everything allocated
 * here is released and the reason is stored in pTaskInfo->code.
 */
SOperatorInfo* createExchangeOperatorInfo(void* pTransporter, SExchangePhysiNode* pExNode, SExecTaskInfo* pTaskInfo) {
  // initialised up front: the first "goto _error" below would otherwise skip the initialisation of
  // this variable and _error would publish an indeterminate value
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;

  SExchangeInfo* pInfo = taosMemoryCalloc(1, sizeof(SExchangeInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  code = initExchangeOperator(pExNode, pInfo, GET_TASKID(pTaskInfo));
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  tsem_init(&pInfo->ready, 0, 0);

  pInfo->seqLoadData = false;
  pInfo->pTransporter = pTransporter;
  pInfo->pResult = createResDataBlock(pExNode->node.pOutputDataBlockDesc);
  if (pInfo->pResult == NULL) {
    // pResult is dereferenced below; presumably NULL means the block could not be allocated
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pOperator->name = "ExchangeOperator";
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_EXCHANGE;
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pResult->pDataBlock);
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(prepareLoadRemoteData, doLoadRemoteData, NULL, NULL,
                                         destroyExchangeOperatorInfo, NULL, NULL, NULL);
  return pOperator;

_error:
  if (pInfo != NULL) {
    doDestroyExchangeOperatorInfo(pInfo);
  }

  taosMemoryFreeClear(pOperator);
  pTaskInfo->code = code;
  return NULL;
}

dengyihao's avatar
dengyihao 已提交
2450 2451
// Forward declaration: createSortedMergeOperatorInfo() below calls this function and treats any
// return value other than TSDB_CODE_SUCCESS as a failure.
static int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                                const char* pKey);
2452

2453
static void destroySortedMergeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
2454
  SSortedMergeOperatorInfo* pInfo = (SSortedMergeOperatorInfo*)param;
H
Haojun Liao 已提交
2455
  taosArrayDestroy(pInfo->pSortInfo);
2456 2457 2458
  taosArrayDestroy(pInfo->groupInfo);

  if (pInfo->pSortHandle != NULL) {
H
Haojun Liao 已提交
2459
    tsortDestroySortHandle(pInfo->pSortHandle);
2460 2461
  }

H
Haojun Liao 已提交
2462
  blockDataDestroy(pInfo->binfo.pRes);
H
Haojun Liao 已提交
2463
  cleanupAggSup(&pInfo->aggSup);
L
Liu Jicong 已提交
2464

D
dapan1121 已提交
2465
  taosMemoryFreeClear(param);
2466
}
H
Haojun Liao 已提交
2467

L
Liu Jicong 已提交
2468
/*
 * Tell whether row rowIndex of pBlock belongs to the group whose column values
 * are saved in buf.
 *
 * groupInfo holds the slot index (int32_t) of every group column and buf[i] is
 * the saved value of the i-th group column. Variable-length values are compared
 * by length and payload, fixed-length values over the column's byte width.
 *
 * Returns true when there is no group column at all or when every group column
 * matches the saved value, false as soon as one column differs.
 */
static bool needToMerge(SSDataBlock* pBlock, SArray* groupInfo, char** buf, int32_t rowIndex) {
  size_t size = taosArrayGetSize(groupInfo);
  if (size == 0) {
    return true;
  }

  for (int32_t i = 0; i < size; ++i) {
    int32_t* index = taosArrayGet(groupInfo, i);

    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
    bool             isNull = colDataIsNull(pColInfo, rowIndex, pBlock->info.rows, NULL);

    if ((isNull && buf[i] != NULL) || (!isNull && buf[i] == NULL)) {
      return false;
    }

    if (isNull) {
      // both the cell and the saved value are NULL: equal, and there is no payload to compare
      continue;
    }

    char* pCell = colDataGetData(pColInfo, rowIndex);
    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      if (varDataLen(pCell) != varDataLen(buf[i])) {
        return false;
      }

      if (memcmp(varDataVal(pCell), varDataVal(buf[i]), varDataLen(pCell)) != 0) {
        return false;
      }
    } else if (memcmp(pCell, buf[i], pColInfo->info.bytes) != 0) {
      return false;
    }
  }

  // every group column matched the saved tuple, so the row continues the current group
  return true;
}

L
Liu Jicong 已提交
2503 2504 2505
/*
 * Placeholder for merging one input row into the aggregate contexts of the
 * current group.
 *
 * The function currently has no effect.
 * TODO: set the row index on every context and invoke its merge function
 * (UDF merge for negative function ids, the built-in merge function otherwise).
 */
static void doMergeResultImpl(SSortedMergeOperatorInfo* pInfo, SqlFunctionCtx* pCtx, int32_t numOfExpr,
                              int32_t rowIndex) {
  (void)pInfo;
  (void)pCtx;
  (void)numOfExpr;
  (void)rowIndex;
}
2522

L
Liu Jicong 已提交
2523 2524
/*
 * Placeholder for finalizing the aggregate results of the current group.
 *
 * The function currently has no effect.
 * TODO: invoke the finalize function of every context (UDF finalize for
 * negative function ids), skipping tag/timestamp dummy functions.
 */
static void doFinalizeResultImpl(SqlFunctionCtx* pCtx, int32_t numOfExpr) {
  (void)pCtx;
  (void)numOfExpr;
}
2537

2538
/*
 * Remember the group column values of row rowIndex.
 *
 * pColumnList holds the slot index (int32_t) of every group column in pBlock;
 * the value of the i-th listed column is copied into rowColData[i], which must
 * already point to a buffer that is large enough.
 *
 * Always returns true.
 */
static bool saveCurrentTuple(char** rowColData, SArray* pColumnList, SSDataBlock* pBlock, int32_t rowIndex) {
  int32_t numOfCols = (int32_t)taosArrayGetSize(pColumnList);

  int32_t k = 0;
  while (k < numOfCols) {
    int32_t*         pSlot = taosArrayGet(pColumnList, k);
    SColumnInfoData* pColumn = taosArrayGet(pBlock->pDataBlock, *pSlot);

    char* pValue = colDataGetData(pColumn, rowIndex);
    memcpy(rowColData[k], pValue, colDataGetLength(pColumn, rowIndex));

    ++k;
  }

  return true;
}
2551

2552 2553
/*
 * Feed every row of pBlock into the group merge state of the operator.
 *
 * A row that continues the current group is merged into it. A row that starts a
 * new group first closes the current one: the results are finalized, their
 * count is added to the output block's row count, and the process function of
 * every context with a non-negative function id is invoked. After that, and
 * also for the very first row ever seen, the row is merged and its group column
 * values are saved as the new reference tuple.
 */
static void doMergeImpl(SOperatorInfo* pOperator, int32_t numOfExpr, SSDataBlock* pBlock) {
  SSortedMergeOperatorInfo* pMerge = pOperator->info;
  SqlFunctionCtx*           pCtx = pOperator->exprSupp.pCtx;

  for (int32_t row = 0; row < pBlock->info.rows; ++row) {
    if (pMerge->hasGroupVal) {
      if (needToMerge(pBlock, pMerge->groupInfo, pMerge->groupVal, row)) {
        // same group as the saved tuple
        doMergeResultImpl(pMerge, pCtx, numOfExpr, row);
        continue;
      }

      // group boundary: close the current group before starting the next one
      doFinalizeResultImpl(pCtx, numOfExpr);
      int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
      //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);

      // TODO check for available buffer;

      // next group info data
      pMerge->binfo.pRes->info.rows += numOfRows;
      for (int32_t k = 0; k < numOfExpr; ++k) {
        if (pCtx[k].functionId >= 0) {
          pCtx[k].fpSet.process(&pCtx[k]);
        }
      }
    } else {
      // no reference tuple yet: this can only be the first row of a block
      ASSERT(row == 0);
    }

    doMergeResultImpl(pMerge, pCtx, numOfExpr, row);
    pMerge->hasGroupVal = saveCurrentTuple(pMerge->groupVal, pMerge->groupInfo, pBlock, row);
  }
}

2589 2590
/*
 * Drain the sort handle and merge the sorted rows group by group.
 *
 * Rows are pulled from the sort handle into a scratch block, at most
 * resultInfo.capacity rows at a time, and each filled scratch block is passed
 * to doMergeImpl(). After the last row the final group is closed and its result
 * count is added to the output block.
 *
 * Returns the operator's output block when it holds at least one row, NULL
 * otherwise. NULL is also returned, with the task error code set to
 * TSDB_CODE_OUT_OF_MEMORY, when the scratch block cannot be created.
 */
static SSDataBlock* doMerge(SOperatorInfo* pOperator) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  SSortHandle*              pHandle = pInfo->pSortHandle;

  SSDataBlock* pDataBlock = createOneDataBlock(pInfo->binfo.pRes, false);
  if (pDataBlock == NULL) {
    pOperator->pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  blockDataEnsureCapacity(pDataBlock, pOperator->resultInfo.capacity);

  while (1) {
    blockDataCleanup(pDataBlock);
    while (1) {
      STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
      if (pTupleHandle == NULL) {
        break;
      }

      // build datablock for merge for one group
      appendOneRowToDataBlock(pDataBlock, pTupleHandle);
      if (pDataBlock->info.rows >= pOperator->resultInfo.capacity) {
        break;
      }
    }

    if (pDataBlock->info.rows == 0) {
      break;
    }

    setInputDataBlock(pOperator, pOperator->exprSupp.pCtx, pDataBlock, TSDB_ORDER_ASC, MAIN_SCAN, true);
    //  updateOutputBuf(&pInfo->binfo, &pAggInfo->bufCapacity, pBlock->info.rows * pAggInfo->resultRowFactor,
    //  pOperator->pRuntimeEnv, true);
    doMergeImpl(pOperator, pOperator->exprSupp.numOfExprs, pDataBlock);
    // flush to tuple store, and after all data have been handled, return to upstream node or sink node
  }

  doFinalizeResultImpl(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs);
  int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
  //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);

  // the scratch block is private to this function; release it once the contexts have been read
  blockDataDestroy(pDataBlock);

  // TODO check for available buffer;

  // next group info data
  pInfo->binfo.pRes->info.rows += numOfRows;
  return (pInfo->binfo.pRes->info.rows > 0) ? pInfo->binfo.pRes : NULL;
}
2632

L
Liu Jicong 已提交
2633 2634
/*
 * Pull the next batch of sorted rows from pHandle into pDataBlock.
 *
 * pDataBlock is cleaned first. Rows are appended to a temporary block obtained
 * from the sort handle until the handle has no more tuples or the temporary
 * block holds at least `capacity` rows. If any row was collected, the columns
 * listed in pColMatchInfo are copied from their source slot to their target
 * slot in pDataBlock and pDataBlock's row count and capacity are set to the
 * number of collected rows. The temporary block is destroyed before returning.
 *
 * Returns pDataBlock when it holds at least one row, NULL otherwise (including
 * when the sort handle provides no temporary block). pInfo is not used.
 */
SSDataBlock* getSortedMergeBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity,
                                     SArray* pColMatchInfo, SSortedMergeOperatorInfo* pInfo) {
  blockDataCleanup(pDataBlock);

  SSDataBlock* pSorted = tsortGetSortedDataBlock(pHandle);
  if (pSorted == NULL) {
    return NULL;
  }

  blockDataEnsureCapacity(pSorted, capacity);

  // at least one tuple is requested; stop when the handle is drained or the block is full
  do {
    STupleHandle* pTuple = tsortNextTuple(pHandle);
    if (pTuple == NULL) {
      break;
    }

    appendOneRowToDataBlock(pSorted, pTuple);
  } while (pSorted->info.rows < capacity);

  if (pSorted->info.rows > 0) {
    int32_t numOfCols = taosArrayGetSize(pColMatchInfo);

    int32_t k = 0;
    while (k < numOfCols) {
      SColMatchInfo* pMatch = taosArrayGet(pColMatchInfo, k);
      ASSERT(pMatch->matchType == COL_MATCH_FROM_SLOT_ID);

      SColumnInfoData* pFrom = taosArrayGet(pSorted->pDataBlock, pMatch->srcSlotId);
      SColumnInfoData* pTo = taosArrayGet(pDataBlock->pDataBlock, pMatch->targetSlotId);
      colDataAssign(pTo, pFrom, pSorted->info.rows, &pDataBlock->info);

      ++k;
    }

    pDataBlock->info.rows = pSorted->info.rows;
    pDataBlock->info.capacity = pSorted->info.rows;
  }

  blockDataDestroy(pSorted);

  if (pDataBlock->info.rows > 0) {
    return pDataBlock;
  }

  return NULL;
}

2675
/*
 * Fetch function of the sorted-merge operator.
 *
 * Returns NULL once the operator is done. When the operator is already in the
 * OP_RES_TO_RETURN state, the next batch is read from the existing sort handle.
 * Otherwise a multi-source merge sort handle is created, every downstream
 * operator is registered as a sort source, the handle is opened and the merge
 * is performed.
 *
 * Errors while setting up the sort are reported by longjmp() to
 * pTaskInfo->env.
 */
static SSDataBlock* doSortedMerge(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExecTaskInfo*            pTaskInfo = pOperator->pTaskInfo;
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  if (pOperator->status == OP_RES_TO_RETURN) {
    return getSortedMergeBlockData(pInfo->pSortHandle, pInfo->binfo.pRes, pOperator->resultInfo.capacity, NULL, pInfo);
  }

  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
  // pass the real task id: the macro used to be wrapped in quotes, which handed over its name as text
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->binfo.pRes, GET_TASKID(pTaskInfo));

  tsortSetFetchRawDataFp(pInfo->pSortHandle, loadNextDataBlock, NULL, NULL);

  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
    if (ps == NULL) {
      // same error channel as the tsortOpen() failure below
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    ps->param = pOperator->pDownstream[i];
    tsortAddSource(pInfo->pSortHandle, ps);
  }

  int32_t code = tsortOpen(pInfo->pSortHandle);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, terrno);
  }

  pOperator->status = OP_RES_TO_RETURN;
  return doMerge(pOperator);
}
2706

L
Liu Jicong 已提交
2707 2708
/*
 * Prepare the group-by bookkeeping of a sorted-merge operator.
 *
 * For every column in pGroupInfo (an array of SColumn) the expression whose
 * result slot id equals the column id is looked up in pExprInfo; its index is
 * appended to pInfo->groupInfo. pInfo->groupVal is then allocated as a single
 * buffer: a table of one pointer per matched group column, followed by the
 * value area the pointers refer to (pCol->bytes bytes per column).
 *
 * Returns 0 without touching pInfo when there is no group column,
 * TSDB_CODE_SUCCESS on success and TSDB_CODE_OUT_OF_MEMORY on allocation
 * failure. pInfo->groupInfo and pInfo->groupVal are owned by pInfo.
 */
static int32_t initGroupCol(SExprInfo* pExprInfo, int32_t numOfCols, SArray* pGroupInfo,
                            SSortedMergeOperatorInfo* pInfo) {
  if (pGroupInfo == NULL || taosArrayGetSize(pGroupInfo) == 0) {
    return 0;
  }

  int32_t len = 0;
  SArray* plist = taosArrayInit(3, sizeof(SColumn));
  pInfo->groupInfo = taosArrayInit(3, sizeof(int32_t));

  if (plist == NULL || pInfo->groupInfo == NULL) {
    if (plist != NULL) {
      taosArrayDestroy(plist);  // the temporary list is not reachable from pInfo
    }
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // iterate over the requested group columns, not over the (still empty) output list
  size_t numOfGroupCol = taosArrayGetSize(pGroupInfo);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    SColumn* pCol = taosArrayGet(pGroupInfo, i);
    for (int32_t j = 0; j < numOfCols; ++j) {
      SExprInfo* pe = &pExprInfo[j];
      if (pe->base.resSchema.slotId == pCol->colId) {
        if (taosArrayPush(plist, pCol) == NULL || taosArrayPush(pInfo->groupInfo, &j) == NULL) {
          taosArrayDestroy(plist);
          return TSDB_CODE_OUT_OF_MEMORY;
        }

        len += pCol->bytes;
        break;
      }
    }
  }

  ASSERT(taosArrayGetSize(pGroupInfo) == taosArrayGetSize(plist));

  // size everything by the columns that were actually matched, so that the pointer table, plist
  // and pInfo->groupInfo always have the same number of entries
  numOfGroupCol = taosArrayGetSize(plist);

  pInfo->groupVal = taosMemoryCalloc(1, (POINTER_BYTES * numOfGroupCol + len));
  if (pInfo->groupVal == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t offset = 0;
  // the value area starts right behind the pointer table; the offset is computed in bytes
  char* start = (char*)pInfo->groupVal + POINTER_BYTES * numOfGroupCol;
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    pInfo->groupVal[i] = start + offset;
    SColumn* pCol = taosArrayGet(plist, i);
    offset += pCol->bytes;
  }

  taosArrayDestroy(plist);

  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2755

L
Liu Jicong 已提交
2756 2757 2758
/*
 * Create a sorted-merge operator on top of the given downstream operators.
 *
 * pExprInfo/num describe the output expressions, pSortInfo the sort order and
 * pGroupInfo the optional group columns. pSortInfo is stored in the operator
 * info and destroyed together with it.
 *
 * Returns the new operator, or NULL on failure with terrno set to
 * TSDB_CODE_QRY_OUT_OF_MEMORY.
 */
SOperatorInfo* createSortedMergeOperatorInfo(SOperatorInfo** downstream, int32_t numOfDownstream, SExprInfo* pExprInfo,
                                             int32_t num, SArray* pSortInfo, SArray* pGroupInfo,
                                             SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_SUCCESS;

  SSortedMergeOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SSortedMergeOperatorInfo));
  SOperatorInfo*            pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  code = initExprSupp(&pOperator->exprSupp, pExprInfo, num);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initResultRowInfo(&pInfo->binfo.resultRowInfo);

  // NOTE(review): nothing visible in this function assigns pInfo->binfo.pRes before this check, so
  // it looks like the check always fails - confirm where the result block is meant to be created.
  if (pOperator->exprSupp.pCtx == NULL || pInfo->binfo.pRes == NULL) {
    goto _error;
  }

  size_t keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
  code = doInitAggInfoSup(&pInfo->aggSup, pOperator->exprSupp.pCtx, num, keyBufSize, pTaskInfo->id.str);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, num);
  code = initGroupCol(pExprInfo, num, pGroupInfo, pInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  //  pInfo->resultRowFactor = (int32_t)(getRowNumForMultioutput(pRuntimeEnv->pQueryAttr,
  //      pRuntimeEnv->pQueryAttr->topBotQuery, false));
  pInfo->sortBufSize = 1024 * 16;  // 16KB
  pInfo->bufPageSize = 1024;
  pInfo->pSortInfo = pSortInfo;

  pOperator->resultInfo.capacity = blockDataGetCapacityInRow(pInfo->binfo.pRes, pInfo->bufPageSize);

  pOperator->name = "SortedMerge";
  // pOperator->operatorType = OP_SortedMerge;
  pOperator->blocking = true;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doSortedMerge, NULL, NULL, destroySortedMergeOperatorInfo,
                                         NULL, NULL, NULL);
  code = appendDownstream(pOperator, downstream, numOfDownstream);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  if (pInfo != NULL) {
    // destroySortedMergeOperatorInfo() also frees pInfo itself, so it must not be freed again here
    destroySortedMergeOperatorInfo(pInfo, num);
    pInfo = NULL;
  }

  taosMemoryFreeClear(pOperator);
  terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
  return NULL;
}

X
Xiaoyu Wang 已提交
2823
/*
 * Report the scan order and scan flag that apply to an operator.
 *
 * Starting at pOperator, the first downstream operator is followed until a
 * known scan-like operator is reached:
 *   - exchange, system-table scan, stream scan, tag scan, block-dist scan and
 *     last-row scan operators report TSDB_ORDER_ASC / MAIN_SCAN;
 *   - a table scan operator reports the order of its query condition and its
 *     current scan flag.
 *
 * Returns TSDB_CODE_SUCCESS when *order and *scanFlag were set, or
 * TSDB_CODE_INVALID_PARA when the chain ends without such an operator.
 */
int32_t getTableScanInfo(SOperatorInfo* pOperator, int32_t* order, int32_t* scanFlag) {
  // todo add more information about exchange operation
  SOperatorInfo* pCur = pOperator;

  for (;;) {
    int32_t type = pCur->operatorType;

    bool fixedAscMainScan =
        (type == QUERY_NODE_PHYSICAL_PLAN_EXCHANGE || type == QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN ||
         type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN ||
         type == QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN);
    if (fixedAscMainScan) {
      *order = TSDB_ORDER_ASC;
      *scanFlag = MAIN_SCAN;
      return TSDB_CODE_SUCCESS;
    }

    if (type == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
      STableScanInfo* pScan = pCur->info;
      *order = pScan->cond.order;
      *scanFlag = pScan->scanFlag;
      return TSDB_CODE_SUCCESS;
    }

    // any other operator: the answer comes from its first downstream operator
    if (pCur->pDownstream == NULL || pCur->pDownstream[0] == NULL) {
      return TSDB_CODE_INVALID_PARA;
    }

    pCur = pCur->pDownstream[0];
  }
}
L
Liu Jicong 已提交
2845
#if 0
L
Liu Jicong 已提交
2846
/**
 * Position the table scan that feeds a stream scan operator at (uid, ts).
 *
 * Every operator visited is marked OP_OPENED. Operators that are not a stream scan forward the
 * request to their single downstream; zero or more than one downstream is reported as an error.
 * On the stream scan itself the nested table-scan reader is re-targeted at table `uid` and reset
 * so that reading resumes right after timestamp `ts`, unless the recorded last status already
 * equals (uid, ts). A uid of 0 only flags the scan as having no table.
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_APP_ERROR when no stream scan can be reached.
 */
int32_t doPrepareScan(SOperatorInfo* pOperator, uint64_t uid, int64_t ts) {
  uint8_t optrType = pOperator->operatorType;

  pOperator->status = OP_OPENED;

  if (optrType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    if (pOperator->numOfDownstream == 1) {
      return doPrepareScan(pOperator->pDownstream[0], uid, ts);
    }

    if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator to set the input data block");
    } else {
      qError("join not supported for stream block scan");
    }
    return TSDB_CODE_QRY_APP_ERROR;
  }

  SStreamScanInfo* pStreamInfo = pOperator->info;
  pStreamInfo->blockType = STREAM_INPUT__TABLE_SCAN;
  pStreamInfo->pTableScanOp->status = OP_OPENED;

  STableScanInfo* pScan = pStreamInfo->pTableScanOp->info;
  ASSERT(pScan->scanMode == TABLE_SCAN__TABLE_ORDER);

  if (uid == 0) {
    pScan->noTable = 1;
    return TSDB_CODE_SUCCESS;
  }

  /*if (pSnapShotScanInfo->dataReader == NULL) {*/
  /*pSnapShotScanInfo->dataReader = tsdbReaderOpen(pHandle->vnode, &pSTInfo->cond, tableList, 0, 0);*/
  /*pSnapShotScanInfo->scanMode = TABLE_SCAN__TABLE_ORDER;*/
  /*}*/

  pScan->noTable = 0;

  // the reader is already positioned at the requested status, nothing to do
  if (pScan->lastStatus.uid == uid && pScan->lastStatus.ts == ts) {
    return TSDB_CODE_SUCCESS;
  }

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  int32_t        tableSz = taosArrayGetSize(pTaskInfo->tableqinfoList.pTableList);

  // locate the table in the task's table list; the whole list is scanned, the last match wins
  bool found = false;
  for (int32_t idx = 0; idx < tableSz; idx++) {
    STableKeyInfo* pKeyInfo = taosArrayGet(pTaskInfo->tableqinfoList.pTableList, idx);
    if (pKeyInfo->uid == uid) {
      pScan->currentTable = idx;
      found = true;
    }
  }

  // TODO after processing drop, found can be false
  ASSERT(found);

  tsdbSetTableId(pScan->dataReader, uid);

  // reset the reader with a window starting right after ts, then restore the original start key
  int64_t savedSkey = pScan->cond.twindows.skey;
  pScan->cond.twindows.skey = ts + 1;
  tsdbReaderReset(pScan->dataReader, &pScan->cond);
  pScan->cond.twindows.skey = savedSkey;
  pScan->scanTimes = 0;

  qDebug("tsdb reader offset seek to uid %" PRId64 " ts %" PRId64 ", table cur set to %d , all table num %d", uid, ts,
         pScan->currentTable, tableSz);

  return TSDB_CODE_SUCCESS;
}

2913 2914 2915
/**
 * Fetch the last (uid, ts) status recorded by the table scan nested in a stream scan operator.
 *
 * Operators that are not a stream scan delegate to their first downstream.
 *
 * @param pOperator operator to start the lookup from
 * @param uid       [out] last table uid, written only on success
 * @param ts        [out] last timestamp, written only on success
 * @return TSDB_CODE_SUCCESS when a stream scan was found, TSDB_CODE_INVALID_PARA when the chain
 *         ends without one. The result of the downstream lookup is propagated to the caller
 *         instead of being dropped, so a failed lookup is no longer reported as success.
 */
int32_t doGetScanStatus(SOperatorInfo* pOperator, uint64_t* uid, int64_t* ts) {
  int32_t type = pOperator->operatorType;
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamScanInfo* pScanInfo = pOperator->info;
    STableScanInfo*  pSnapShotScanInfo = pScanInfo->pTableScanOp->info;
    *uid = pSnapShotScanInfo->lastStatus.uid;
    *ts = pSnapShotScanInfo->lastStatus.ts;
    return TSDB_CODE_SUCCESS;
  }

  // same guard as getTableScanInfo(): the downstream array itself may be missing
  if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  return doGetScanStatus(pOperator->pDownstream[0], uid, ts);
}
L
Liu Jicong 已提交
2930
#endif
2931

2932
// this is a blocking operator
L
Liu Jicong 已提交
2933
/**
 * Open function of the aggregate operator.
 *
 * Pulls blocks from the first downstream until it returns NULL. For every block the optional
 * scalar expressions are applied in place, then the block is fed to doAggregateImpl(). Any failure
 * inside the loop leaves via longjmp on the task's jump buffer. Once the input is exhausted the
 * result rows are closed, the grouped result info is initialised, the operator is marked opened
 * and the elapsed time is stored in cost.openCost.
 *
 * @return TSDB_CODE_SUCCESS (also returned immediately when the operator is already opened).
 */
static int32_t doOpenAggregateOptr(SOperatorInfo* pOperator) {
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
  }

  SAggOperatorInfo* pAggInfo = pOperator->info;
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
  SExprSupp*        pAggExprSup = &pOperator->exprSupp;
  SOperatorInfo*    downstream = pOperator->pDownstream[0];

  int64_t startUs = taosGetTimestampUs();

  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;

  SSDataBlock* pBlock = NULL;
  while ((pBlock = downstream->fpSet.getNextFn(downstream)) != NULL) {
    int32_t code = getTableScanInfo(pOperator, &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    // there is an scalar expression that needs to be calculated before apply the group aggregation.
    SExprSupp* pScalarSup = &pAggInfo->scalarExprSup;
    if (pScalarSup->pExprInfo != NULL) {
      code = projectApplyFunctions(pScalarSup->pExprInfo, pBlock, pBlock, pScalarSup->pCtx, pScalarSup->numOfExprs,
                                   NULL);
      if (code != TSDB_CODE_SUCCESS) {
        longjmp(pTaskInfo->env, code);
      }
    }

    // the pDataBlock are always the same one, no need to call this again
    setExecutionContext(pOperator, pOperator->exprSupp.numOfExprs, pBlock->info.groupId, pAggInfo);
    setInputDataBlock(pOperator, pAggExprSup->pCtx, pBlock, order, scanFlag, true);

    code = doAggregateImpl(pOperator, 0, pAggExprSup->pCtx);
    if (code != 0) {
      longjmp(pTaskInfo->env, code);
    }

#if 0  // test for encode/decode result info
    if(pOperator->fpSet.encodeResultRow){
      char *result = NULL;
      int32_t length = 0;
      pOperator->fpSet.encodeResultRow(pOperator, &result, &length);
      SAggSupporter* pSup = &pAggInfo->aggSup;
      taosHashClear(pSup->pResultRowHashTable);
      pInfo->resultRowInfo.size = 0;
      pOperator->fpSet.decodeResultRow(pOperator, result);
      if(result){
        taosMemoryFree(result);
      }
    }
#endif
  }

  closeAllResultRows(&pAggInfo->binfo.resultRowInfo);
  initGroupedResultInfo(&pAggInfo->groupResInfo, pAggInfo->aggSup.pResultRowHashTable, 0);
  OPTR_SET_OPENED(pOperator);

  // microseconds -> milliseconds
  pOperator->cost.openCost = (taosGetTimestampUs() - startUs) / 1000.0;
  return TSDB_CODE_SUCCESS;
}

3001
/**
 * Produce the next result block of the aggregate operator.
 *
 * The operator's _openFn is invoked first and its return code stored in the task; a failure
 * completes the operator and yields NULL. Afterwards result blocks are built and filtered with
 * the operator's condition until either a block with rows is available or the grouped result
 * info has no more data (in which case the operator is completed).
 *
 * @return the result block when it holds at least one row, NULL otherwise.
 */
static SSDataBlock* getAggregateResult(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SAggOperatorInfo* pAggInfo = pOperator->info;
  SOptrBasicInfo*   pBasic = &pAggInfo->binfo;
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;

  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
    doSetOperatorCompleted(pOperator);
    return NULL;
  }

  blockDataEnsureCapacity(pBasic->pRes, pOperator->resultInfo.capacity);

  // keep building blocks while the filter leaves them empty and more group data is pending
  do {
    doBuildResultDatablock(pOperator, pBasic, &pAggInfo->groupResInfo, pAggInfo->aggSup.pResultBuf);
    doFilter(pAggInfo->pCondition, pBasic->pRes);

    if (!hasDataInGroupInfo(&pAggInfo->groupResInfo)) {
      doSetOperatorCompleted(pOperator);
      break;
    }
  } while (!(pBasic->pRes->info.rows > 0));

  size_t numOfRows = blockDataGetNumOfRows(pBasic->pRes);
  pOperator->resultInfo.totalRows += numOfRows;

  if (numOfRows == 0) {
    return NULL;
  }
  return pBasic->pRes;
}

wmmhello's avatar
wmmhello 已提交
3036
/**
 * Serialise all result rows of an aggregate-style operator into one heap buffer.
 *
 * Layout of the produced buffer (all integers are int32_t in host byte order):
 *   [total length][number of hash entries]
 *   then, per entry of the result-row hash table:
 *   [key length][key bytes][row size][row bytes]
 *
 * pOperator->info is expected to start with an SOptrBasicInfo immediately followed by an
 * SAggSupporter (that is how both are located here).
 *
 * @param pOperator operator whose result rows are encoded
 * @param result    [out] newly allocated buffer, or NULL when there is nothing to encode; the
 *                  caller releases it with taosMemoryFree()
 * @param length    [out] number of valid bytes in *result
 * @return TSDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT for NULL output parameters, or
 *         TSDB_CODE_OUT_OF_MEMORY (in which case *result is NULL).
 */
int32_t aggEncodeResultRow(SOperatorInfo* pOperator, char** result, int32_t* length) {
  if (result == NULL || length == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }

  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
  int32_t         size = taosHashGetSize(pSup->pResultRowHashTable);
  size_t          keyLen = sizeof(uint64_t) * 2;  // estimate the key length
  int32_t         totalSize =
      sizeof(int32_t) + sizeof(int32_t) + size * (sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize);

  // no result
  if (getTotalBufSize(pSup->pResultBuf) == 0) {
    *result = NULL;
    *length = 0;
    return TSDB_CODE_SUCCESS;
  }

  *result = taosMemoryCalloc(1, totalSize);
  if (*result == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // slot 0 (total length) is filled in at the end; slot 1 holds the entry count
  int32_t offset = sizeof(int32_t);
  memcpy(*result + offset, &size, sizeof(int32_t));
  offset += sizeof(int32_t);

  // prepare memory
  SResultRowPosition* pos = &pInfo->resultRowInfo.cur;
  void*               pPage = getBufPage(pSup->pResultBuf, pos->pageId);
  setBufPageDirty(pPage, true);
  releaseBufPage(pSup->pResultBuf, pPage);

  void* pIter = taosHashIterate(pSup->pResultRowHashTable, NULL);
  while (pIter) {
    void*               key = taosHashGetKey(pIter, &keyLen);
    SResultRowPosition* p1 = (SResultRowPosition*)pIter;

    // The initial size was computed from an estimated key length; grow the buffer when the
    // real key needs more room. The capacity is tracked so later entries do not re-grow needlessly.
    int32_t realTotalSize = offset + sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize;
    if (realTotalSize > totalSize) {
      char* tmp = (char*)taosMemoryRealloc(*result, realTotalSize);
      if (tmp == NULL) {
        taosMemoryFree(*result);
        *result = NULL;
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      *result = tmp;
      totalSize = realTotalSize;
    }

    // save key; memcpy is used for the integers because offset is not guaranteed to stay
    // 4-byte aligned once a key of arbitrary length has been written
    int32_t encodedKeyLen = (int32_t)keyLen;
    memcpy(*result + offset, &encodedKeyLen, sizeof(int32_t));
    offset += sizeof(int32_t);
    memcpy(*result + offset, key, keyLen);
    offset += keyLen;

    // save value; the row is copied before the page is released so that the page cannot be
    // recycled while it is still being read
    int32_t rowSize = pSup->resultRowSize;
    memcpy(*result + offset, &rowSize, sizeof(int32_t));
    offset += sizeof(int32_t);

    pPage = (SFilePage*)getBufPage(pSup->pResultBuf, p1->pageId);
    SResultRow* pRow = (SResultRow*)((char*)pPage + p1->offset);
    memcpy(*result + offset, pRow, pSup->resultRowSize);
    setBufPageDirty(pPage, true);
    releaseBufPage(pSup->pResultBuf, pPage);
    offset += pSup->resultRowSize;

    pIter = taosHashIterate(pSup->pResultRowHashTable, pIter);
  }

  memcpy(*result, &offset, sizeof(int32_t));
  *length = offset;

  return TSDB_CODE_SUCCESS;
}

3113
/**
 * Rebuild the result rows of an aggregate-style operator from a buffer produced by
 * aggEncodeResultRow().
 *
 * Expected layout (all integers are int32_t in host byte order):
 *   [total length][number of entries] then per entry [key length][key bytes][row size][row bytes]
 * The first 8 bytes at the key position are read as the table group id of the new result row.
 *
 * Every field is checked against the encoded total length before it is read, so a truncated or
 * corrupted buffer is rejected instead of being read past its end.
 *
 * pOperator->info is expected to start with an SOptrBasicInfo immediately followed by an
 * SAggSupporter (that is how both are located here).
 *
 * @param pOperator operator receiving the decoded rows
 * @param result    encoded buffer
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_TSC_INVALID_INPUT when the buffer is NULL, malformed,
 *         or a new result row cannot be obtained.
 */
int32_t aggDecodeResultRow(SOperatorInfo* pOperator, char* result) {
  if (result == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }

  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));

  //  int32_t size = taosHashGetSize(pSup->pResultRowHashTable);
  int32_t length = 0;
  memcpy(&length, result, sizeof(int32_t));
  int32_t offset = sizeof(int32_t);

  // the header (length + count) alone takes two int32_t slots
  if (length < (int32_t)(2 * sizeof(int32_t))) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }

  int32_t count = 0;
  memcpy(&count, result + offset, sizeof(int32_t));
  offset += sizeof(int32_t);

  const int64_t total = length;  // 64-bit so the bound computations below cannot overflow

  while (count-- > 0 && length > offset) {
    if ((int64_t)offset + (int64_t)sizeof(int32_t) > total) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // memcpy instead of pointer casts: fields behind a variable-length key may be unaligned
    int32_t keyLen = 0;
    memcpy(&keyLen, result + offset, sizeof(int32_t));
    offset += sizeof(int32_t);

    // the key, the group id read from its start, and the value-length field must all be in range
    if (keyLen < 0 || (int64_t)offset + keyLen + (int64_t)sizeof(int32_t) > total ||
        (int64_t)offset + (int64_t)sizeof(uint64_t) > total) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    uint64_t tableGroupId = 0;
    memcpy(&tableGroupId, result + offset, sizeof(uint64_t));

    SResultRow* resultRow = getNewResultRow(pSup->pResultBuf, tableGroupId, pSup->resultRowSize);
    if (!resultRow) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = resultRow->pageId, .offset = resultRow->offset};
    taosHashPut(pSup->pResultRowHashTable, result + offset, keyLen, &pos, sizeof(SResultRowPosition));

    offset += keyLen;
    int32_t valueLen = 0;
    memcpy(&valueLen, result + offset, sizeof(int32_t));
    if (valueLen != pSup->resultRowSize) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    offset += sizeof(int32_t);

    if (valueLen < 0 || (int64_t)offset + valueLen > total) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // the copied row carries the page position it had when encoded; keep the new one
    int32_t pageId = resultRow->pageId;
    int32_t pOffset = resultRow->offset;
    memcpy(resultRow, result + offset, valueLen);
    resultRow->pageId = pageId;
    resultRow->offset = pOffset;
    offset += valueLen;

    initResultRow(resultRow);
    pInfo->resultRowInfo.cur = (SResultRowPosition){.pageId = resultRow->pageId, .offset = resultRow->offset};
  }

  // all encoded bytes must have been consumed
  if (offset != length) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  return TSDB_CODE_SUCCESS;
}

3164 3165
// Return values of handleLimitOffset(), consumed by doProjectOperation().
enum {
  PROJECT_RETRIEVE_CONTINUE = 0x1,  // keep pulling blocks from the downstream operator
  PROJECT_RETRIEVE_DONE = 0x2,      // stop pulling and hand the current result block to the caller
};

/**
 * Apply SOFFSET / SLIMIT (per group) and OFFSET / LIMIT (per row) to the project operator's
 * current result block after the input block pBlock has been projected into it.
 *
 * The bookkeeping lives in SProjectOperatorInfo: curSOffset, groupId, curGroupOutput, curOffset
 * and curOutput. The result block may be emptied, trimmed at the front or truncated here.
 *
 * @param pOperator project operator
 * @param pBlock    input block that was just projected (only its group id is used)
 * @return PROJECT_RETRIEVE_CONTINUE when more input should be pulled, PROJECT_RETRIEVE_DONE when
 *         the result block should be returned now.
 */
static int32_t handleLimitOffset(SOperatorInfo* pOperator, SSDataBlock* pBlock) {
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
  SSDataBlock*          pRes = pProjectInfo->binfo.pRes;

  // 1. group offset: drop blocks until enough groups have been skipped
  if (pProjectInfo->curSOffset > 0) {
    bool dropBlock = false;

    if (pProjectInfo->groupId == 0) {  // it is the first group
      pProjectInfo->groupId = pBlock->info.groupId;
      dropBlock = true;
    } else if (pProjectInfo->groupId != pBlock->info.groupId) {
      pProjectInfo->curSOffset -= 1;

      // ignore data block in current group
      dropBlock = (pProjectInfo->curSOffset > 0);
    }

    if (dropBlock) {
      blockDataCleanup(pRes);
      return PROJECT_RETRIEVE_CONTINUE;
    }

    // set current group id of the project operator
    pProjectInfo->groupId = pBlock->info.groupId;
  }

  // 2. a new group starts: account for the finished one and check the group limit
  if (pProjectInfo->groupId != 0 && pProjectInfo->groupId != pBlock->info.groupId) {
    pProjectInfo->curGroupOutput += 1;

    bool groupLimitReached =
        (pProjectInfo->slimit.limit > 0) && (pProjectInfo->slimit.limit <= pProjectInfo->curGroupOutput);
    if (groupLimitReached) {
      pOperator->status = OP_EXEC_DONE;
      blockDataCleanup(pRes);
      return PROJECT_RETRIEVE_DONE;
    }

    // reset the value for a new group data
    pProjectInfo->curOffset = 0;
    pProjectInfo->curOutput = 0;
  }

  // here we reach the start position, according to the limit/offset requirements.

  // set current group id
  pProjectInfo->groupId = pBlock->info.groupId;

  // 3. row offset: the whole block is skipped, or only its leading rows
  if (pProjectInfo->curOffset >= pRes->info.rows) {
    pProjectInfo->curOffset -= pRes->info.rows;
    blockDataCleanup(pRes);
    return PROJECT_RETRIEVE_CONTINUE;
  }

  if (pProjectInfo->curOffset > 0) {
    blockDataTrimFirstNRows(pRes, pProjectInfo->curOffset);
    pProjectInfo->curOffset = 0;
  }

  // 4. check for the limitation in each group
  if (pProjectInfo->limit.limit >= 0 && pProjectInfo->curOutput + pRes->info.rows >= pProjectInfo->limit.limit) {
    int32_t keepRows = (int32_t)(pProjectInfo->limit.limit - pProjectInfo->curOutput);
    blockDataKeepFirstNRows(pRes, keepRows);

    if (pProjectInfo->slimit.limit > 0 && pProjectInfo->slimit.limit <= pProjectInfo->curGroupOutput) {
      pOperator->status = OP_EXEC_DONE;
    }

    return PROJECT_RETRIEVE_DONE;
  }

  // todo optimize performance
  // If there are slimit/soffset value exists, multi-round result can not be packed into one group, since the
  // they may not belong to the same group the limit/offset value is not valid in this case.
  bool flushNow = pRes->info.rows >= pOperator->resultInfo.threshold || pProjectInfo->slimit.offset != -1 ||
                  pProjectInfo->slimit.limit != -1;

  // when not full enough, continue to accumulate the output data in the buffer.
  return flushNow ? PROJECT_RETRIEVE_DONE : PROJECT_RETRIEVE_CONTINUE;
}

3243
/**
 * getNext function of the project operator.
 *
 * The result block is cleared, then blocks are pulled from the first downstream. Each block is
 * projected into the result block, passed through handleLimitOffset() and finally filtered with
 * the operator's filter node. Pulling stops when handleLimitOffset() reports
 * PROJECT_RETRIEVE_DONE or the downstream is exhausted (the operator is then completed).
 * Blocks of type STREAM_RETRIEVE are returned to the caller untouched. Failures inside the loop
 * leave via longjmp on the task's jump buffer.
 *
 * @return the result block when it holds rows, a STREAM_RETRIEVE input block, or NULL.
 */
static SSDataBlock* doProjectOperation(SOperatorInfo* pOperator) {
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
  SOptrBasicInfo*       pInfo = &pProjectInfo->binfo;
  SExprSupp*            pExprSup = &pOperator->exprSupp;
  SSDataBlock*          pRes = pInfo->pRes;

  blockDataCleanup(pRes);

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

#if 0
  if (pProjectInfo->existDataBlock) {  // TODO refactor
    SSDataBlock* pBlock = pProjectInfo->existDataBlock;
    pProjectInfo->existDataBlock = NULL;

    // the pDataBlock are always the same one, no need to call this again
    setInputDataBlock(pOperator, pInfo->pCtx, pBlock, TSDB_ORDER_ASC);

    blockDataEnsureCapacity(pInfo->pRes, pBlock->info.rows);
    projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
    if (pRes->info.rows >= pProjectInfo->binfo.capacity * 0.8) {
      copyTsColoum(pRes, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      resetResultRowEntryResult(pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      return pRes;
    }
  }
#endif

  int32_t order = 0;
  int32_t scanFlag = 0;

  // the open cost is only measured while it is still unset
  int64_t startUs = 0;
  if (pOperator->cost.openCost == 0) {
    startUs = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];

  for (;;) {
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
    if (pBlock == NULL) {
      // TODO optimize
      /*if (pTaskInfo->execModel != OPTR_EXEC_MODEL_STREAM) {*/
      doSetOperatorCompleted(pOperator);
      /*}*/
      break;
    }

    if (pBlock->info.type == STREAM_RETRIEVE) {
      // for stream interval
      return pBlock;
    }

    // the pDataBlock are always the same one, no need to call this again
    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    setInputDataBlock(pOperator, pExprSup->pCtx, pBlock, order, scanFlag, false);
    blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

    code = projectApplyFunctions(pExprSup->pExprInfo, pInfo->pRes, pBlock, pExprSup->pCtx, pExprSup->numOfExprs,
                                 pProjectInfo->pPseudoColInfo);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    int32_t status = handleLimitOffset(pOperator, pBlock);

    // filter shall be applied after apply functions and limit/offset on the result
    doFilter(pProjectInfo->pFilterNode, pInfo->pRes);

    if (status == PROJECT_RETRIEVE_DONE) {
      break;
    }
    // any other status: pull the next block
  }

  pProjectInfo->curOutput += pInfo->pRes->info.rows;

  size_t numOfRows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += numOfRows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - startUs) / 1000.0;
  }

  if (numOfRows > 0) {
    return pInfo->pRes;
  }
  return NULL;
}

L
Liu Jicong 已提交
3338 3339
/**
 * Start filling the cached first block of a new group (pInfo->existNewGroupBlock).
 *
 * The fill state is reset, the cached block becomes the fill input and one round of gap filling
 * is written to pInfo->pRes. The end key is the operator window's end key when the task is
 * completed, otherwise the end key of the cached block's window. Afterwards the cached block
 * pointer is cleared and *newgroup is set to true.
 */
static void doHandleRemainBlockForNewGroupImpl(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo, bool* newgroup,
                                               SExecTaskInfo* pTaskInfo) {
  SSDataBlock* pCached = pInfo->existNewGroupBlock;

  pInfo->totalInputRows = pCached->info.rows;

  int64_t ekey;
  if (Q_STATUS_EQUAL(pTaskInfo->status, TASK_COMPLETED)) {
    ekey = pInfo->win.ekey;
  } else {
    ekey = pCached->info.window.ekey;
  }

  taosResetFillInfo(pInfo->pFillInfo, getFillInfoStart(pInfo->pFillInfo));

  taosFillSetStartInfo(pInfo->pFillInfo, pCached->info.rows, ekey);
  taosFillSetInputDataBlock(pInfo->pFillInfo, pCached);

  doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pInfo->pRes, pResultInfo->capacity);

  pInfo->existNewGroupBlock = NULL;
  *newgroup = true;
}

L
Liu Jicong 已提交
3354 3355
/**
 * Emit fill results that are still pending before any new input is pulled.
 *
 * If the fill state has more results for the current group, one round is written to pInfo->pRes
 * and *newgroup is cleared; the function then returns when the result exceeds the threshold or
 * multi-group results are not allowed. Otherwise (or afterwards) a cached block of the next group,
 * if any, is started through doHandleRemainBlockForNewGroupImpl().
 */
static void doHandleRemainBlockFromNewGroup(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo, bool* newgroup,
                                            SExecTaskInfo* pTaskInfo) {
  if (taosFillHasMoreResults(pInfo->pFillInfo)) {
    *newgroup = false;
    doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pInfo->pRes, (int32_t)pResultInfo->capacity);

    bool overThreshold = pInfo->pRes->info.rows > pResultInfo->threshold;
    if (overThreshold || !pInfo->multigroupResult) {
      return;
    }
  }

  // handle the cached new group data block
  if (pInfo->existNewGroupBlock) {
    doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, newgroup, pTaskInfo);
  }
}

S
slzhou 已提交
3370
/**
 * One round of the fill operator: produce the next (unfiltered) filled block.
 *
 * Pending results of the current group and a cached block of the next group are handled first.
 * After that blocks are pulled from the first downstream and handed to the fill state until the
 * result block is ready to be returned.
 *
 * @return the operator's result block, or NULL when there is nothing more to output (the
 *         operator status is set to OP_EXEC_DONE when no input rows were ever seen).
 */
static SSDataBlock* doFillImpl(SOperatorInfo* pOperator) {
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;
  SResultInfo*       pResultInfo = &pOperator->resultInfo;
  SSDataBlock*       pResBlock = pInfo->pRes;

  blockDataCleanup(pResBlock);

  // todo handle different group data interpolation
  bool newgroup = false;
  doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, &newgroup, pTaskInfo);
  if (pResBlock->info.rows > pResultInfo->threshold || (!pInfo->multigroupResult && pResBlock->info.rows > 0)) {
    return pResBlock;
  }

  SOperatorInfo* pDownstream = pOperator->pDownstream[0];
  for (;;) {
    SSDataBlock* pBlock = pDownstream->fpSet.getNextFn(pDownstream);
    if (newgroup) {
      assert(pBlock != NULL);
    }

    blockDataUpdateTsWindow(pBlock, pInfo->primaryTsCol);

    if (newgroup && pInfo->totalInputRows > 0) {  // there are already processed current group data block
      pInfo->existNewGroupBlock = pBlock;
      newgroup = false;

      // Fill the previous group data block, before handle the data block of new group.
      // Close the fill operation for previous group data block
      taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
    } else if (pBlock == NULL) {
      // input exhausted: either nothing was ever read, or the last group has to be closed
      if (pInfo->totalInputRows == 0) {
        pOperator->status = OP_EXEC_DONE;
        return NULL;
      }

      taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
    } else {
      pInfo->totalInputRows += pBlock->info.rows;
      taosFillSetStartInfo(pInfo->pFillInfo, pBlock->info.rows, pBlock->info.window.ekey);
      taosFillSetInputDataBlock(pInfo->pFillInfo, pBlock);
    }

    blockDataEnsureCapacity(pResBlock, pOperator->resultInfo.capacity);
    doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pResBlock, pOperator->resultInfo.capacity);

    // current group has no more result to return
    if (pResBlock->info.rows > 0) {
      // 1. The result in current group not reach the threshold of output result, continue
      // 2. If multiple group results existing in one SSDataBlock is not allowed, return immediately
      if (pResBlock->info.rows > pResultInfo->threshold || pBlock == NULL || (!pInfo->multigroupResult)) {
        return pResBlock;
      }

      doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, &newgroup, pTaskInfo);
      if (pResBlock->info.rows > pOperator->resultInfo.threshold || pBlock == NULL) {
        return pResBlock;
      }
    } else if (pInfo->existNewGroupBlock) {  // try next group
      assert(pBlock != NULL);
      doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, &newgroup, pTaskInfo);
      if (pResBlock->info.rows > pResultInfo->threshold) {
        return pResBlock;
      }
    } else {
      return NULL;
    }
  }
}

S
slzhou 已提交
3445 3446 3447 3448 3449 3450 3451 3452
/**
 * getNext function of the fill operator.
 *
 * Repeats doFillImpl() + doFilter() until a block that still has rows after filtering is
 * available. When doFillImpl() yields NULL the operator is completed.
 *
 * @return a filled and filtered block with at least one row, or NULL when the operator is done.
 */
static SSDataBlock* doFill(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SFillOperatorInfo* pInfo = pOperator->info;

  for (;;) {
    SSDataBlock* pFilled = doFillImpl(pOperator);
    if (pFilled == NULL) {
      doSetOperatorCompleted(pOperator);
      return NULL;
    }

    doFilter(pInfo->pCondition, pFilled);

    if (pFilled->info.rows > 0) {
      size_t numOfRows = pFilled->info.rows;
      pOperator->resultInfo.totalRows += numOfRows;
      return pFilled;
    }
    // everything was filtered out, try the next round
  }
}

H
Haojun Liao 已提交
3478 3479 3480 3481 3482 3483 3484 3485 3486 3487 3488
/**
 * Release the memory owned by each element of an expression-info array.
 *
 * For every entry the parameter array and the expression node are freed; for column expressions
 * the column object of the first parameter is freed as well. The array itself is not freed here.
 *
 * @param pExpr      array of expression infos
 * @param numOfExprs number of entries in pExpr
 */
static void destroyExprInfo(SExprInfo* pExpr, int32_t numOfExprs) {
  for (int32_t idx = 0; idx < numOfExprs; ++idx) {
    SExprInfo* pOne = pExpr + idx;

    bool isColumn = (pOne->pExpr->nodeType == QUERY_NODE_COLUMN);
    if (isColumn) {
      taosMemoryFree(pOne->base.pParam[0].pCol);
    }

    taosMemoryFree(pOne->base.pParam);
    taosMemoryFree(pOne->pExpr);
  }
}

3489 3490 3491 3492 3493
/**
 * Destroy an operator together with its whole downstream tree.
 *
 * Order of work: the operator's closeFn (if set) is called with its info and expression count,
 * every downstream operator is destroyed recursively, the downstream array is freed, the
 * expression support is cleaned up and finally the operator itself is freed.
 * A NULL operator is ignored.
 */
static void destroyOperatorInfo(SOperatorInfo* pOperator) {
  if (pOperator == NULL) {
    return;
  }

  if (pOperator->fpSet.closeFn != NULL) {
    pOperator->fpSet.closeFn(pOperator->info, pOperator->exprSupp.numOfExprs);
  }

  if (pOperator->pDownstream != NULL) {
    int32_t idx = 0;
    while (idx < pOperator->numOfDownstream) {
      destroyOperatorInfo(pOperator->pDownstream[idx]);
      ++idx;
    }

    taosMemoryFreeClear(pOperator->pDownstream);
    pOperator->numOfDownstream = 0;
  }

  cleanupExprSupp(&pOperator->exprSupp);
  taosMemoryFreeClear(pOperator);
}

3511 3512 3513 3514 3515 3516 3517 3518 3519 3520 3521 3522 3523 3524 3525
/**
 * Choose the page size and total size of the paged result buffer for rows of rowSize bytes.
 *
 * The page size is the smallest power-of-two multiple of 4096 that holds at least four rows.
 * The buffer size is 4096 * 256 bytes, unless that is not larger than one page, in which case
 * the buffer is sized to four pages.
 *
 * @param rowSize       size of one result row in bytes, must not be negative
 * @param defaultPgsz   [out] page size in bytes
 * @param defaultBufsz  [out] buffer size in bytes
 * @return 0 on success; -1 when rowSize is negative or so large that the page or buffer size
 *         would not fit in 32 bits. In the failure case both outputs hold the minimum sizes
 *         (4096 and 4096 * 256). Previously such input made the sizing loop spin forever or
 *         wrapped the buffer size to 0.
 */
int32_t getBufferPgSize(int32_t rowSize, uint32_t* defaultPgsz, uint32_t* defaultBufsz) {
  const uint32_t minPageSize = 4096;
  const uint32_t minBufSize = 4096 * 256;
  const uint32_t maxPageSize = 1u << 29;  // largest page for which four pages still fit in uint32_t

  *defaultPgsz = minPageSize;
  *defaultBufsz = minBufSize;

  if (rowSize < 0) {
    return -1;
  }

  // 64-bit arithmetic: rowSize * 4 may not fit in int32_t
  uint64_t required = (uint64_t)rowSize * 4;
  if (required > maxPageSize) {
    return -1;
  }

  uint32_t pgsz = minPageSize;
  while (pgsz < required) {
    pgsz <<= 1u;
  }
  *defaultPgsz = pgsz;

  // the default buffer must be larger than a single page, otherwise make room for four pages
  if (minBufSize <= pgsz) {
    *defaultBufsz = pgsz * 4;
  }

  return 0;
}

dengyihao's avatar
dengyihao 已提交
3526 3527
/**
 * Initialise the aggregate supporter: result row size, key buffer, result-row hash table and the
 * disk-based result buffer.
 *
 * @param pAggSup     supporter to initialise
 * @param pCtx        function contexts used to compute the result row size
 * @param numOfOutput number of entries in pCtx
 * @param keyBufSize  payload size of the key buffer (room for a pointer and an int64_t is added)
 * @param pKey        key passed to createDiskbasedBuf()
 * @return TSDB_CODE_OUT_OF_MEMORY when the key buffer or hash table cannot be created, otherwise
 *         the result of createDiskbasedBuf().
 */
int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                         const char* pKey) {
  pAggSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pAggSup->keyBuf = taosMemoryCalloc(1, keyBufSize + POINTER_BYTES + sizeof(int64_t));

  _hash_fn_t binaryHashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pAggSup->pResultRowHashTable = taosHashInit(10, binaryHashFn, true, HASH_NO_LOCK);

  if (pAggSup->keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  if (pAggSup->pResultRowHashTable == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  uint32_t pageSize = 0;
  uint32_t bufSize = 0;
  getBufferPgSize(pAggSup->resultRowSize, &pageSize, &bufSize);

  return createDiskbasedBuf(&pAggSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
}

3550
/**
 * Release what the aggregate supporter holds: the key buffer (the pointer is cleared), the
 * result-row hash table and the disk-based result buffer.
 */
void cleanupAggSup(SAggSupporter* pAggSup) {
  // key buffer
  taosMemoryFreeClear(pAggSup->keyBuf);

  // result row positions, then the pages they point into
  taosHashCleanup(pAggSup->pResultRowHashTable);
  destroyDiskbasedBuf(pAggSup->pResultBuf);
}

L
Liu Jicong 已提交
3556 3557
/**
 * Initialise the expression support and the aggregate supporter of an aggregate-style operator
 * and attach the supporter's result buffer to every function context.
 *
 * @param pSup       expression support to initialise from pExprInfo
 * @param pAggSup    aggregate supporter to initialise
 * @param pExprInfo  expression array
 * @param numOfCols  number of expressions in pExprInfo
 * @param keyBufSize payload size of the supporter's key buffer
 * @param pkey       key handed to the disk-based result buffer
 * @return TSDB_CODE_SUCCESS, or the error reported by initExprSupp() / doInitAggInfoSup().
 *         A failure of doInitAggInfoSup() is now reported instead of being ignored, so the
 *         function contexts are never wired to a result buffer that was not created.
 */
int32_t initAggInfo(SExprSupp* pSup, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols, size_t keyBufSize,
                    const char* pkey) {
  int32_t code = initExprSupp(pSup, pExprInfo, numOfCols);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  code = doInitAggInfoSup(pAggSup, pSup->pCtx, numOfCols, keyBufSize, pkey);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    pSup->pCtx[i].pBuf = pAggSup->pResultBuf;
  }

  return TSDB_CODE_SUCCESS;
}

3571
/**
 * Set the result capacity of an operator to numOfRows and its output threshold to 75% of that.
 * When the 75% value ends up as 0, the threshold falls back to numOfRows.
 * numOfRows must not be 0 (asserted).
 */
void initResultSizeInfo(SOperatorInfo* pOperator, int32_t numOfRows) {
  ASSERT(numOfRows != 0);

  SResultInfo* pResInfo = &pOperator->resultInfo;
  pResInfo->capacity = numOfRows;
  pResInfo->threshold = numOfRows * 0.75;

  if (pResInfo->threshold == 0) {
    pResInfo->threshold = numOfRows;
  }
}

3581 3582 3583 3584 3585
/**
 * Prepare the basic operator info: initialise its result-row info and attach pBlock as the
 * result block.
 */
void initBasicInfo(SOptrBasicInfo* pInfo, SSDataBlock* pBlock) {
  initResultRowInfo(&pInfo->resultRowInfo);
  pInfo->pRes = pBlock;
}

3586 3587 3588 3589 3590 3591 3592 3593 3594 3595 3596 3597 3598 3599 3600 3601 3602 3603 3604
// Destroy an array of numOfOutput function contexts: the variant parameters, the subsidiary context array and the
// input buffers of every entry are released before the array itself. Accepts NULL. Always returns NULL.
static void* destroySqlFunctionCtx(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  if (pCtx != NULL) {
    for (int32_t i = 0; i < numOfOutput; ++i) {
      SqlFunctionCtx* pOne = &pCtx[i];

      for (int32_t j = 0; j < pOne->numOfParams; ++j) {
        taosVariantDestroy(&pOne->param[j].param);
      }

      taosMemoryFreeClear(pOne->subsidiaries.pCtx);
      taosMemoryFree(pOne->input.pData);
      taosMemoryFree(pOne->input.pColumnDataAgg);
    }

    taosMemoryFreeClear(pCtx);
  }

  return NULL;
}

3605
// Record the expression list in pSup and, when a list is given, create the matching function contexts.
// Returns TSDB_CODE_OUT_OF_MEMORY if the contexts cannot be created, TSDB_CODE_SUCCESS otherwise.
int32_t initExprSupp(SExprSupp* pSup, SExprInfo* pExprInfo, int32_t numOfExpr) {
  pSup->pExprInfo = pExprInfo;
  pSup->numOfExprs = numOfExpr;

  // nothing to evaluate: no function context is required
  if (pSup->pExprInfo == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  pSup->pCtx = createSqlFunctionCtx(pExprInfo, numOfExpr, &pSup->rowEntryInfoOffset);
  return (pSup->pCtx == NULL) ? TSDB_CODE_OUT_OF_MEMORY : TSDB_CODE_SUCCESS;
}

3618 3619 3620 3621 3622 3623 3624 3625 3626 3627
// Release the function contexts, the expression list and the row-entry offset array held by an expression
// supporter. The SExprSupp object itself is not freed.
void cleanupExprSupp(SExprSupp* pSupp) {
  destroySqlFunctionCtx(pSupp->pCtx, pSupp->numOfExprs);

  if (pSupp->pExprInfo != NULL) {
    destroyExprInfo(pSupp->pExprInfo, pSupp->numOfExprs);
    taosMemoryFreeClear(pSupp->pExprInfo);
  }

  taosMemoryFree(pSupp->rowEntryInfoOffset);
}

L
Liu Jicong 已提交
3628
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
S
slzhou 已提交
3629
                                           SSDataBlock* pResultBlock, SNode* pCondition, SExprInfo* pScalarExprInfo,
wmmhello's avatar
wmmhello 已提交
3630
                                           int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3631
  SAggOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SAggOperatorInfo));
L
Liu Jicong 已提交
3632
  SOperatorInfo*    pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3633 3634 3635
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
H
Haojun Liao 已提交
3636

3637
  int32_t numOfRows = 1024;
dengyihao's avatar
dengyihao 已提交
3638
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3639 3640

  initResultSizeInfo(pOperator, numOfRows);
3641
  int32_t code = initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
L
Liu Jicong 已提交
3642
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3643 3644
    goto _error;
  }
H
Haojun Liao 已提交
3645

3646
  initBasicInfo(&pInfo->binfo, pResultBlock);
3647 3648 3649 3650
  code = initExprSupp(&pInfo->scalarExprSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3651

L
Liu Jicong 已提交
3652
  pInfo->groupId = INT32_MIN;
S
slzhou 已提交
3653
  pInfo->pCondition = pCondition;
dengyihao's avatar
dengyihao 已提交
3654
  pOperator->name = "TableAggregate";
3655
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_HASH_AGG;
3656
  pOperator->blocking = true;
dengyihao's avatar
dengyihao 已提交
3657 3658 3659
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3660

3661 3662
  pOperator->fpSet = createOperatorFpSet(doOpenAggregateOptr, getAggregateResult, NULL, NULL, destroyAggOperatorInfo,
                                         aggEncodeResultRow, aggDecodeResultRow, NULL);
H
Haojun Liao 已提交
3663 3664 3665 3666 3667

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3668 3669

  return pOperator;
L
Liu Jicong 已提交
3670
_error:
H
Haojun Liao 已提交
3671
  destroyAggOperatorInfo(pInfo, numOfCols);
wafwerar's avatar
wafwerar 已提交
3672 3673
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
H
Haojun Liao 已提交
3674 3675
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3676 3677
}

3678
// Release the result-row bookkeeping and the result block of a basic operator info. pInfo must not be NULL.
void cleanupBasicInfo(SOptrBasicInfo* pInfo) {
  assert(pInfo != NULL);

  cleanupResultRowInfo(&pInfo->resultRowInfo);

  // the value returned by blockDataDestroy replaces the pointer to the destroyed block
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
}

H
Haojun Liao 已提交
3684
void destroyBasicOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3685
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)param;
3686
  cleanupBasicInfo(pInfo);
L
Liu Jicong 已提交
3687

D
dapan1121 已提交
3688
  taosMemoryFreeClear(param);
3689
}
H
Haojun Liao 已提交
3690 3691

void destroyAggOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3692
  SAggOperatorInfo* pInfo = (SAggOperatorInfo*)param;
L
Liu Jicong 已提交
3693 3694
  cleanupBasicInfo(&pInfo->binfo);

D
dapan1121 已提交
3695
  taosMemoryFreeClear(param);
3696
}
3697

H
Haojun Liao 已提交
3698
void destroySFillOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3699
  SFillOperatorInfo* pInfo = (SFillOperatorInfo*)param;
3700
  pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
H
Haojun Liao 已提交
3701
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
wafwerar's avatar
wafwerar 已提交
3702
  taosMemoryFreeClear(pInfo->p);
L
Liu Jicong 已提交
3703

D
dapan1121 已提交
3704
  taosMemoryFreeClear(param);
3705 3706
}

H
Haojun Liao 已提交
3707
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput) {
D
fix bug  
dapan 已提交
3708 3709 3710
  if (NULL == param) {
    return;
  }
L
Liu Jicong 已提交
3711
  SProjectOperatorInfo* pInfo = (SProjectOperatorInfo*)param;
3712
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3713
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3714
  taosArrayDestroy(pInfo->pPseudoColInfo);
L
Liu Jicong 已提交
3715

D
dapan1121 已提交
3716
  taosMemoryFreeClear(param);
3717 3718
}

H
Haojun Liao 已提交
3719
static void destroyIndefinitOperatorInfo(void* param, int32_t numOfOutput) {
3720
  SIndefOperatorInfo* pInfo = (SIndefOperatorInfo*)param;
3721
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3722 3723 3724

  taosArrayDestroy(pInfo->pPseudoColInfo);
  cleanupAggSup(&pInfo->aggSup);
3725
  cleanupExprSupp(&pInfo->scalarSup);
L
Liu Jicong 已提交
3726

D
dapan1121 已提交
3727
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3728 3729
}

H
Haojun Liao 已提交
3730
void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3731
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3732 3733 3734 3735
  taosRemoveRef(exchangeObjRefPool, pExInfo->self);
}

void doDestroyExchangeOperatorInfo(void* param) {
X
Xiaoyu Wang 已提交
3736
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3737

H
Haojun Liao 已提交
3738 3739 3740 3741 3742 3743 3744
  taosArrayDestroy(pExInfo->pSources);
  taosArrayDestroy(pExInfo->pSourceDataInfo);
  if (pExInfo->pResult != NULL) {
    blockDataDestroy(pExInfo->pResult);
  }

  tsem_destroy(&pExInfo->ready);
L
Liu Jicong 已提交
3745

D
dapan1121 已提交
3746
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3747 3748
}

H
Haojun Liao 已提交
3749 3750
// Build the list of indexes (int32_t) of those function contexts whose function is a pseudo column function
// according to fmIsPseudoColumnFunc. The caller owns the returned array.
static SArray* setRowTsColumnOutputInfo(SqlFunctionCtx* pCtx, int32_t numOfCols) {
  SArray* pPseudoIdx = taosArrayInit(4, sizeof(int32_t));

  int32_t i = 0;
  while (i < numOfCols) {
    if (fmIsPseudoColumnFunc(pCtx[i].functionId)) {
      taosArrayPush(pPseudoIdx, &i);
    }
    ++i;
  }

  return pPseudoIdx;
}

3760 3761 3762 3763
// Return the limit stored in a limit node, or -1 when no limit node is given.
static int64_t getLimit(SNode* pLimit) {
  if (pLimit == NULL) {
    return -1;
  }

  return ((SLimitNode*)pLimit)->limit;
}

// Return the offset stored in a limit node, or -1 when no limit node is given.
static int64_t getOffset(SNode* pLimit) {
  if (pLimit == NULL) {
    return -1;
  }

  return ((SLimitNode*)pLimit)->offset;
}

L
Liu Jicong 已提交
3764
SOperatorInfo* createProjectOperatorInfo(SOperatorInfo* downstream, SProjectPhysiNode* pProjPhyNode,
dengyihao's avatar
dengyihao 已提交
3765
                                         SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3766
  SProjectOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SProjectOperatorInfo));
L
Liu Jicong 已提交
3767
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3768 3769 3770
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
3771

L
Liu Jicong 已提交
3772
  int32_t    numOfCols = 0;
3773 3774 3775
  SExprInfo* pExprInfo = createExprInfo(pProjPhyNode->pProjections, NULL, &numOfCols);

  SSDataBlock* pResBlock = createResDataBlock(pProjPhyNode->node.pOutputDataBlockDesc);
3776 3777
  SLimit       limit = {.limit = getLimit(pProjPhyNode->node.pLimit), .offset = getOffset(pProjPhyNode->node.pLimit)};
  SLimit slimit = {.limit = getLimit(pProjPhyNode->node.pSlimit), .offset = getOffset(pProjPhyNode->node.pSlimit)};
3778

L
Liu Jicong 已提交
3779 3780 3781 3782
  pInfo->limit = limit;
  pInfo->slimit = slimit;
  pInfo->curOffset = limit.offset;
  pInfo->curSOffset = slimit.offset;
H
Haojun Liao 已提交
3783
  pInfo->binfo.pRes = pResBlock;
3784
  pInfo->pFilterNode = pProjPhyNode->node.pConditions;
H
Haojun Liao 已提交
3785 3786

  int32_t numOfRows = 4096;
dengyihao's avatar
dengyihao 已提交
3787
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3788

3789 3790 3791 3792 3793
  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
3794
  initResultSizeInfo(pOperator, numOfRows);
3795

3796 3797
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);
3798
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfCols);
3799

3800
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pOperator->exprSupp.pCtx, numOfCols);
X
Xiaoyu Wang 已提交
3801
  pOperator->name = "ProjectOperator";
H
Haojun Liao 已提交
3802
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
X
Xiaoyu Wang 已提交
3803 3804 3805 3806
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
3807

L
Liu Jicong 已提交
3808 3809
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doProjectOperation, NULL, NULL,
                                         destroyProjectOperatorInfo, NULL, NULL, NULL);
L
Liu Jicong 已提交
3810

3811
  int32_t code = appendDownstream(pOperator, &downstream, 1);
H
Haojun Liao 已提交
3812
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3813 3814
    goto _error;
  }
3815 3816

  return pOperator;
H
Haojun Liao 已提交
3817

L
Liu Jicong 已提交
3818
_error:
H
Haojun Liao 已提交
3819 3820
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3821 3822
}

3823 3824
// Apply the operator's functions to one input block and append the output to the operator's result block.
// If scalar expressions are configured, they are evaluated first, with pBlock as both output and input.
// Any failure is reported through longjmp(pTaskInfo->env, code).
static void doHandleDataBlock(SOperatorInfo* pOperator, SSDataBlock* pBlock, SOperatorInfo* downstream,
                              SExecTaskInfo* pTaskInfo) {
  SIndefOperatorInfo* pIndef = pOperator->info;
  SOptrBasicInfo*     pBasic = &pIndef->binfo;
  SExprSupp*          pFuncSup = &pOperator->exprSupp;
  SExprSupp*          pScalar = &pIndef->scalarSup;

  int32_t order = 0;
  int32_t scanFlag = 0;

  // the pDataBlock are always the same one, no need to call this again
  int32_t code = getTableScanInfo(downstream, &order, &scanFlag);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }

  // scalar expressions, if any, have to be calculated before the functions are applied
  if (pScalar->pExprInfo != NULL) {
    code = projectApplyFunctions(pScalar->pExprInfo, pBlock, pBlock, pScalar->pCtx, pScalar->numOfExprs,
                                 pIndef->pPseudoColInfo);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
  }

  setInputDataBlock(pOperator, pFuncSup->pCtx, pBlock, order, scanFlag, false);

  // make room for the rows this block may add to the existing output
  blockDataEnsureCapacity(pBasic->pRes, pBasic->pRes->info.rows + pBlock->info.rows);

  code = projectApplyFunctions(pFuncSup->pExprInfo, pBasic->pRes, pBlock, pFuncSup->pCtx, pFuncSup->numOfExprs,
                               pIndef->pPseudoColInfo);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }
}

H
Haojun Liao 已提交
3858 3859
// getNext function of the indefinite-rows function operator.
//
// Input blocks are pulled from the first downstream operator and processed by doHandleDataBlock until the result
// block reaches the operator's threshold, the group id of the input changes, or the downstream is exhausted.
// A block that belongs to the next group is parked in pNextGroupRes and handled at the start of the next round.
// The result is filtered with the operator's condition before it is returned.
//
// Returns the result block, or NULL when there is nothing (more) to return.
static SSDataBlock* doApplyIndefinitFunction(SOperatorInfo* pOperator) {
  SIndefOperatorInfo* pIndefInfo = pOperator->info;
  SOptrBasicInfo*     pInfo = &pIndefInfo->binfo;
  SExprSupp*          pSup = &pOperator->exprSupp;

  SSDataBlock* pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  int64_t st = 0;

  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];

  while (1) {
    // here we need to handle the existing group results
    if (pIndefInfo->pNextGroupRes != NULL) {  // todo extract method
      for (int32_t k = 0; k < pSup->numOfExprs; ++k) {
        SqlFunctionCtx* pCtx = &pSup->pCtx[k];

        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);
        pResInfo->initialized = false;
        pCtx->pOutput = NULL;
      }

      doHandleDataBlock(pOperator, pIndefInfo->pNextGroupRes, downstream, pTaskInfo);
      pIndefInfo->pNextGroupRes = NULL;
    }

    if (pInfo->pRes->info.rows < pOperator->resultInfo.threshold) {
      while (1) {
        // The downstream exec may change the value of the newgroup, so use a local variable instead.
        SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
        if (pBlock == NULL) {
          doSetOperatorCompleted(pOperator);
          break;
        }

        if (pIndefInfo->groupId == 0 && pBlock->info.groupId != 0) {
          pIndefInfo->groupId = pBlock->info.groupId;  // this is the initial group result
        } else {
          if (pIndefInfo->groupId != pBlock->info.groupId) {  // reset output buffer and computing status
            pIndefInfo->groupId = pBlock->info.groupId;
            pIndefInfo->pNextGroupRes = pBlock;
            break;
          }
        }

        doHandleDataBlock(pOperator, pBlock, downstream, pTaskInfo);
        if (pInfo->pRes->info.rows >= pOperator->resultInfo.threshold) {
          break;
        }
      }
    }

    doFilter(pIndefInfo->pCondition, pInfo->pRes);

    // "rows >= 0" is always true for an unsigned value, which ended the stream as soon as one batch was filtered
    // out completely. Stop only when there is output or the input is exhausted.
    // NOTE(review): relies on doSetOperatorCompleted moving the operator to OP_EXEC_DONE - confirm.
    size_t rows = pInfo->pRes->info.rows;
    if (rows > 0 || pOperator->status == OP_EXEC_DONE) {
      break;
    }

    // every row was filtered out and more input is available: start over with an empty result block
    blockDataCleanup(pInfo->pRes);
  }

  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
  }

  return (rows > 0) ? pInfo->pRes : NULL;
}

3937 3938
// Create the non-blocking "IndefinitOperator" (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC).
//
// pNode is treated as an SIndefRowsFuncPhysiNode: pFuncs provides the functions, pExprs (optional) the scalar
// expressions evaluated beforehand. The output capacity is 4096 rows, reduced so that a result block does not
// exceed 2MB.
//
// Returns the new operator, or NULL on failure with pTaskInfo->code set to TSDB_CODE_OUT_OF_MEMORY.
SOperatorInfo* createIndefinitOutputOperatorInfo(SOperatorInfo* downstream, SPhysiNode* pNode,
                                                 SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_SUCCESS;

  SIndefOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SIndefOperatorInfo));
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  SExprSupp* pSup = &pOperator->exprSupp;

  SIndefRowsFuncPhysiNode* pPhyNode = (SIndefRowsFuncPhysiNode*)pNode;

  int32_t    numOfExpr = 0;
  SExprInfo* pExprInfo = createExprInfo(pPhyNode->pFuncs, NULL, &numOfExpr);

  if (pPhyNode->pExprs != NULL) {
    int32_t    num = 0;
    SExprInfo* pSExpr = createExprInfo(pPhyNode->pExprs, NULL, &num);
    code = initExprSupp(&pInfo->scalarSup, pSExpr, num);
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
  }

  SSDataBlock* pResBlock = createResDataBlock(pPhyNode->node.pOutputDataBlockDesc);

  int32_t numOfRows = 4096;
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;

  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }

  initResultSizeInfo(pOperator, numOfRows);

  // a failed initialization must not be silently ignored
  code = initAggInfo(pSup, &pInfo->aggSup, pExprInfo, numOfExpr, keyBufSize, pTaskInfo->id.str);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initBasicInfo(&pInfo->binfo, pResBlock);

  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfExpr);

  pInfo->binfo.pRes = pResBlock;
  pInfo->pCondition = pPhyNode->node.pConditions;
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pSup->pCtx, numOfExpr);

  pOperator->name = "IndefinitOperator";
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC;
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doApplyIndefinitFunction, NULL, NULL,
                                         destroyIndefinitOperatorInfo, NULL, NULL, NULL);

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  taosMemoryFree(pInfo);
  taosMemoryFree(pOperator);
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}

4007
static int32_t initFillInfo(SFillOperatorInfo* pInfo, SExprInfo* pExpr, int32_t numOfCols, SNodeListNode* pValNode,
L
Liu Jicong 已提交
4008
                            STimeWindow win, int32_t capacity, const char* id, SInterval* pInterval, int32_t fillType) {
4009
  SFillColInfo* pColInfo = createFillColInfo(pExpr, numOfCols, pValNode);
H
Haojun Liao 已提交
4010 4011

  STimeWindow w = TSWINDOW_INITIALIZER;
4012
  getAlignQueryTimeWindow(pInterval, pInterval->precision, win.skey, &w);
4013
  w = getFirstQualifiedTimeWindow(win.skey, &w, pInterval, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
4014 4015

  int32_t order = TSDB_ORDER_ASC;
4016
  pInfo->pFillInfo = taosCreateFillInfo(order, w.skey, 0, capacity, numOfCols, pInterval, fillType, pColInfo, id);
H
Haojun Liao 已提交
4017

4018
  pInfo->win = win;
L
Liu Jicong 已提交
4019
  pInfo->p = taosMemoryCalloc(numOfCols, POINTER_BYTES);
H
Haojun Liao 已提交
4020
  if (pInfo->pFillInfo == NULL || pInfo->p == NULL) {
H
Haojun Liao 已提交
4021 4022
    taosMemoryFree(pInfo->pFillInfo);
    taosMemoryFree(pInfo->p);
H
Haojun Liao 已提交
4023 4024 4025 4026 4027 4028
    return TSDB_CODE_OUT_OF_MEMORY;
  } else {
    return TSDB_CODE_SUCCESS;
  }
}

4029 4030 4031 4032 4033 4034 4035 4036
// Create the non-blocking "FillOperator" (QUERY_NODE_PHYSICAL_PLAN_FILL).
//
// The interval is read from the info structure of the downstream operator, which is interpreted as a merge-aligned
// interval operator or as a plain interval operator depending on downstream->operatorType.
//
// Returns the new operator, or NULL on failure with pTaskInfo->code set to TSDB_CODE_OUT_OF_MEMORY.
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SFillPhysiNode* pPhyFillNode, bool multigroupResult,
                                      SExecTaskInfo* pTaskInfo) {
  SFillOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SFillOperatorInfo));
  SOperatorInfo*     pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  int32_t      num = 0;
  SSDataBlock* pResBlock = createResDataBlock(pPhyFillNode->node.pOutputDataBlockDesc);
  SExprInfo*   pExprInfo = createExprInfo(pPhyFillNode->pTargets, NULL, &num);
  SInterval*   pInterval =
      QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == downstream->operatorType
            ? &((SMergeAlignedIntervalAggOperatorInfo*)downstream->info)->intervalAggOperatorInfo->interval
            : &((SIntervalAggOperatorInfo*)downstream->info)->interval;

  int32_t type = convertFillType(pPhyFillNode->mode);

  SResultInfo* pResultInfo = &pOperator->resultInfo;
  initResultSizeInfo(pOperator, 4096);
  pInfo->primaryTsCol = ((SColumnNode*)pPhyFillNode->pWStartTs)->slotId;

  int32_t numOfOutputCols = 0;
  SArray* pColMatchColInfo = extractColMatchInfo(pPhyFillNode->pTargets, pPhyFillNode->node.pOutputDataBlockDesc,
                                                 &numOfOutputCols, COL_MATCH_FROM_SLOT_ID);

  int32_t code = initFillInfo(pInfo, pExprInfo, num, (SNodeListNode*)pPhyFillNode->pValues, pPhyFillNode->timeRange,
                              pResultInfo->capacity, pTaskInfo->id.str, pInterval, type);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  pInfo->pRes = pResBlock;
  pInfo->multigroupResult = multigroupResult;
  pInfo->pCondition = pPhyFillNode->node.pConditions;
  pInfo->pColMatchColInfo = pColMatchColInfo;
  pOperator->name = "FillOperator";
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_FILL;
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->exprSupp.numOfExprs = num;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet =
      createOperatorFpSet(operatorDummyOpenFn, doFill, NULL, NULL, destroySFillOperatorInfo, NULL, NULL, NULL);

  // an operator whose downstream could not be attached must not be handed out
  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  taosMemoryFreeClear(pOperator);
  taosMemoryFreeClear(pInfo);
  // report the failure in the same way as the other operator constructors of this file
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}

D
dapan1121 已提交
4086
// Allocate and initialize an execution task info object.
//
// queryId/taskId : both are formatted into the id string "TID:0x<taskId> QID:0x<queryId>"; queryId is also stored
// model          : execution model stored in the task info
// dbFName        : database name, duplicated into schemaVer.dbname
//
// Returns the new task info, or NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY if an allocation fails.
static SExecTaskInfo* createExecTaskInfo(uint64_t queryId, uint64_t taskId, EOPTR_EXEC_MODEL model, char* dbFName) {
  SExecTaskInfo* pTaskInfo = taosMemoryCalloc(1, sizeof(SExecTaskInfo));
  if (pTaskInfo == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // allocate the id string first, so that a failure leaves nothing but pTaskInfo to release
  char* p = taosMemoryCalloc(1, 128);
  if (p == NULL) {
    taosMemoryFree(pTaskInfo);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  snprintf(p, 128, "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, queryId);
  pTaskInfo->id.str = p;

  setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);

  pTaskInfo->schemaVer.dbname = strdup(dbFName);
  pTaskInfo->cost.created = taosGetTimestampMs();
  pTaskInfo->id.queryId = queryId;
  pTaskInfo->execModel = model;

  return pTaskInfo;
}
H
Haojun Liao 已提交
4101

H
Hongze Cheng 已提交
4102
static STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
H
Haojun Liao 已提交
4103
                                       STableListInfo* pTableListInfo, const char* idstr);
H
Haojun Liao 已提交
4104

H
Haojun Liao 已提交
4105
static SArray* extractColumnInfo(SNodeList* pNodeList);
4106

4107
// Look up the table identified by uid and store its name and a copy of its schema in pTaskInfo->schemaVer.
// For a child table the schema and the tag version are taken from its super table; for a super table they are
// taken from the table itself; otherwise the schema of the normal-table entry is cloned.
//
// Returns TSDB_CODE_SUCCESS, or terrno if one of the meta lookups fails.
int32_t extractTableSchemaInfo(SReadHandle* pHandle, uint64_t uid, SExecTaskInfo* pTaskInfo) {
  SMetaReader mr = {0};
  metaReaderInit(&mr, pHandle->meta, 0);
  int32_t code = metaGetTableEntryByUid(&mr, uid);
  if (code != TSDB_CODE_SUCCESS) {
    metaReaderClear(&mr);
    return terrno;
  }

  pTaskInfo->schemaVer.tablename = strdup(mr.me.name);

  if (mr.me.type == TSDB_SUPER_TABLE) {
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
  } else if (mr.me.type == TSDB_CHILD_TABLE) {
    tDecoderClear(&mr.coder);

    tb_uid_t suid = mr.me.ctbEntry.suid;

    // the super table entry is read below, so a failed lookup must not go unnoticed
    code = metaGetTableEntryByUid(&mr, suid);
    if (code != TSDB_CODE_SUCCESS) {
      taosMemoryFreeClear(pTaskInfo->schemaVer.tablename);
      metaReaderClear(&mr);
      return terrno;
    }

    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
  } else {
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.ntbEntry.schemaRow);
  }

  metaReaderClear(&mr);
  return TSDB_CODE_SUCCESS;
}

4136 4137 4138 4139 4140 4141 4142 4143 4144 4145 4146
// Release the database name, the table name and the schema wrapper stored in pTaskInfo->schemaVer.
static void cleanupTableSchemaInfo(SExecTaskInfo* pTaskInfo) {
  taosMemoryFreeClear(pTaskInfo->schemaVer.dbname);

  // the table name is assigned before the schema wrapper, so it has to be released even if the wrapper is NULL
  taosMemoryFreeClear(pTaskInfo->schemaVer.tablename);

  if (pTaskInfo->schemaVer.sw == NULL) {
    return;
  }

  taosMemoryFree(pTaskInfo->schemaVer.sw->pSchema);
  taosMemoryFreeClear(pTaskInfo->schemaVer.sw);
}

4147
// Rebuild pTableListInfo->pGroupList so that it holds one array of STableKeyInfo per group id.
//
// The group id of every table is looked up in pTableListInfo->map. sortSupport holds the group ids seen so far;
// a new id is inserted in front of the first larger id, or appended if there is none, and the new group is placed
// at the same position in pGroupList so that both arrays stay aligned.
//
// groupNum is the initial capacity of sortSupport.
// Returns TDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY or TSDB_CODE_QRY_APP_ERROR.
static int32_t sortTableGroup(STableListInfo* pTableListInfo, int32_t groupNum) {
  taosArrayClear(pTableListInfo->pGroupList);
  SArray* sortSupport = taosArrayInit(groupNum, sizeof(uint64_t));
  if (sortSupport == NULL) return TSDB_CODE_OUT_OF_MEMORY;

  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    uint64_t*      groupId = taosHashGet(pTableListInfo->map, &info->uid, sizeof(uint64_t));
    if (groupId == NULL) {
      // the group id is handed to the search/insert calls below, which need a valid pointer
      qError("taos get group id error");
      taosArrayDestroy(sortSupport);
      return TSDB_CODE_QRY_APP_ERROR;
    }

    int32_t index = taosArraySearchIdx(sortSupport, groupId, compareUint64Val, TD_EQ);
    if (index == -1) {
      void*   p = taosArraySearch(sortSupport, groupId, compareUint64Val, TD_GT);
      SArray* tGroup = taosArrayInit(8, sizeof(STableKeyInfo));
      if (tGroup == NULL) {
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      // until tGroup has been stored in pGroupList, it must be destroyed on every failure path
      if (taosArrayPush(tGroup, info) == NULL) {
        qError("taos push info array error");
        taosArrayDestroy(tGroup);
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }

      if (p == NULL) {
        if (taosArrayPush(sortSupport, groupId) == NULL) {
          qError("taos push support array error");
          taosArrayDestroy(tGroup);
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }

        if (taosArrayPush(pTableListInfo->pGroupList, &tGroup) == NULL) {
          qError("taos push group array error");
          taosArrayDestroy(tGroup);
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
      } else {
        int32_t pos = TARRAY_ELEM_IDX(sortSupport, p);
        if (taosArrayInsert(sortSupport, pos, groupId) == NULL) {
          qError("taos insert support array error");
          taosArrayDestroy(tGroup);
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }

        if (taosArrayInsert(pTableListInfo->pGroupList, pos, &tGroup) == NULL) {
          qError("taos insert group array error");
          taosArrayDestroy(tGroup);
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
      }
    } else {
      SArray* tGroup = (SArray*)taosArrayGetP(pTableListInfo->pGroupList, index);
      if (taosArrayPush(tGroup, info) == NULL) {
        qError("taos push uid array error");
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }
    }
  }

  taosArrayDestroy(sortSupport);
  return TDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
4205 4206
// Compute the group id of every table in pTableListInfo->pTableList from the group-by expressions in `group`.
//
// For each table the expressions are cloned, rewritten with doTranslateTagExpr using the table's meta entry and
// reduced to constant values. The key buffer starts with one null flag per expression, followed by the values of
// the non-null expressions; calcGroupId turns the used part of the buffer into the group id. The id is stored in
// pTableListInfo->map (uid -> group id) and in the table's STableKeyInfo.
//
// If needSortTableByGroupId is set, the tables are additionally arranged into groups by sortTableGroup.
// Nothing is done when `group` is NULL.
//
// Returns TDB_CODE_SUCCESS or an error code.
int32_t generateGroupIdMap(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group) {
  if (group == NULL) {
    return TDB_CODE_SUCCESS;
  }

  pTableListInfo->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pTableListInfo->map == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  int32_t keyLen = 0;
  void*   keyBuf = NULL;

  SNode* node;
  FOREACH(node, group) {
    SExprNode* pExpr = (SExprNode*)node;
    keyLen += pExpr->resType.bytes;
  }

  int32_t nullFlagSize = sizeof(int8_t) * LIST_LENGTH(group);
  keyLen += nullFlagSize;

  keyBuf = taosMemoryCalloc(1, keyLen);
  if (keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t groupNum = 0;
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    SMetaReader    mr = {0};
    metaReaderInit(&mr, pHandle->meta, 0);

    // the expressions below are evaluated against this meta entry, so the lookup has to succeed
    int32_t code = metaGetTableEntryByUid(&mr, info->uid);
    if (code != TSDB_CODE_SUCCESS) {
      taosMemoryFree(keyBuf);
      metaReaderClear(&mr);
      return terrno;
    }

    SNodeList* groupNew = nodesCloneList(group);

    nodesRewriteExprsPostOrder(groupNew, doTranslateTagExpr, &mr);
    char* isNull = (char*)keyBuf;
    char* pStart = (char*)keyBuf + nullFlagSize;

    SNode*  pNode;
    int32_t index = 0;
    FOREACH(pNode, groupNew) {
      SNode* pNew = NULL;
      code = scalarCalculateConstants(pNode, &pNew);
      if (TSDB_CODE_SUCCESS == code) {
        REPLACE_NODE(pNew);
      } else {
        taosMemoryFree(keyBuf);
        nodesClearList(groupNew);
        metaReaderClear(&mr);
        return code;
      }

      ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
      SValueNode* pValue = (SValueNode*)pNew;

      if (pValue->node.resType.type == TSDB_DATA_TYPE_NULL || pValue->isNull) {
        isNull[index++] = 1;
        continue;
      } else {
        isNull[index++] = 0;
        char* data = nodesGetValueFromNode(pValue);
        if (pValue->node.resType.type == TSDB_DATA_TYPE_JSON) {
          if (tTagIsJson(data)) {
            terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
            taosMemoryFree(keyBuf);
            nodesClearList(groupNew);
            metaReaderClear(&mr);
            return terrno;
          }
          int32_t len = getJsonValueLen(data);
          memcpy(pStart, data, len);
          pStart += len;
        } else if (IS_VAR_DATA_TYPE(pValue->node.resType.type)) {
          memcpy(pStart, data, varDataTLen(data));
          pStart += varDataTLen(data);
        } else {
          memcpy(pStart, data, pValue->node.resType.bytes);
          pStart += pValue->node.resType.bytes;
        }
      }
    }

    // only the part of the key buffer that was actually written takes part in the group id
    int32_t  len = (int32_t)(pStart - (char*)keyBuf);
    uint64_t groupId = calcGroupId(keyBuf, len);
    taosHashPut(pTableListInfo->map, &(info->uid), sizeof(uint64_t), &groupId, sizeof(uint64_t));
    info->groupId = groupId;
    groupNum++;

    nodesClearList(groupNew);
    metaReaderClear(&mr);
  }
  taosMemoryFree(keyBuf);

  if (pTableListInfo->needSortTableByGroupId) {
    return sortTableGroup(pTableListInfo, groupNum);
  }

  return TDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4305
/*
 * Recursively build the operator tree for the physical plan node `pPhyNode`.
 *
 * A node without children is turned directly into a scan/exchange operator. For every other
 * node the operators of all children are created first (by recursion) and are then handed to
 * the operator constructor that matches the node type.
 *
 * @param pPhyNode        physical plan node to translate
 * @param pTaskInfo       task the operators belong to; pTaskInfo->code receives the error code
 *                        on the failure paths handled in this function
 * @param pHandle         read handle passed through to the scan operators
 * @param queryId/taskId  identifiers passed through to the operator constructors
 * @param pTableListInfo  table list that is filled by the scan branches
 * @param pUser           user name, only used by the system table scan
 * @return the operator for `pPhyNode`, or NULL on failure
 */
SOperatorInfo* createOperatorTree(SPhysiNode* pPhyNode, SExecTaskInfo* pTaskInfo, SReadHandle* pHandle,
                                  uint64_t queryId, uint64_t taskId, STableListInfo* pTableListInfo,
                                  const char* pUser) {
  int32_t type = nodeType(pPhyNode);

  if (pPhyNode->pChildren == NULL || LIST_LENGTH(pPhyNode->pChildren) == 0) {
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == type) {
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;

      int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
      if (code) {
        pTaskInfo->code = code;
        return NULL;
      }

      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }

      SOperatorInfo* pOperator = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo);
      if (pOperator == NULL) {
        // do not dereference a failed operator; keep an error code that was already recorded
        if (pTaskInfo->code == TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
        }
        return NULL;
      }

      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
      return pOperator;

    } else if (QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN == type) {
      STableMergeScanPhysiNode* pTableScanNode = (STableMergeScanPhysiNode*)pPhyNode;

      int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
      if (code) {
        pTaskInfo->code = code;
        return NULL;
      }

      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }

      SOperatorInfo* pOperator =
          createTableMergeScanOperatorInfo(pTableScanNode, pTableListInfo, pHandle, pTaskInfo, queryId, taskId);
      if (pOperator == NULL) {
        if (pTaskInfo->code == TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
        }
        return NULL;
      }

      // NOTE(review): the info of the merge scan operator is accessed through STableScanInfo here;
      // confirm that readRecorder is valid for the info type created by the merge scan constructor.
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
      return pOperator;

    } else if (QUERY_NODE_PHYSICAL_PLAN_EXCHANGE == type) {
      return createExchangeOperatorInfo(pHandle->pMsgCb->clientRpc, (SExchangePhysiNode*)pPhyNode, pTaskInfo);

    } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN == type) {
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
      STimeWindowAggSupp   twSup = {
            .waterMark = pTableScanNode->watermark,
            .calTrigger = pTableScanNode->triggerType,
            .maxTs = INT64_MIN,
      };

      // the table list is only built when a read handle is available
      if (pHandle) {
        int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
        if (code) {
          pTaskInfo->code = code;
          return NULL;
        }
      }

      SOperatorInfo* pOperator =
          createStreamScanOperatorInfo(pHandle, pTableScanNode, pTaskInfo, &twSup, queryId, taskId);
      return pOperator;

    } else if (QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN == type) {
      SSystemTableScanPhysiNode* pSysScanPhyNode = (SSystemTableScanPhysiNode*)pPhyNode;
      return createSysTableScanOperatorInfo(pHandle, pSysScanPhyNode, pUser, pTaskInfo);

    } else if (QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN == type) {
      STagScanPhysiNode* pScanPhyNode = (STagScanPhysiNode*)pPhyNode;

      int32_t code = getTableList(pHandle->meta, pHandle->vnode, pScanPhyNode, pTableListInfo);
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = terrno;
        return NULL;
      }

      return createTagScanOperatorInfo(pHandle, pScanPhyNode, pTableListInfo, pTaskInfo);

    } else if (QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN == type) {
      SBlockDistScanPhysiNode* pBlockNode = (SBlockDistScanPhysiNode*)pPhyNode;
      int32_t                  code = TSDB_CODE_SUCCESS;

      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));
      if (pTableListInfo->pTableList == NULL) {
        pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
        return NULL;
      }

      if (pBlockNode->tableType == TSDB_SUPER_TABLE) {
        code = vnodeGetAllTableList(pHandle->vnode, pBlockNode->uid, pTableListInfo->pTableList);
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
        STableKeyInfo info = {.lastKey = 0, .uid = pBlockNode->uid, .groupId = 0};
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      // query condition: a single timestamp column (colId 1) over the whole time range
      SQueryTableDataCond cond = {0};
      cond.order = TSDB_ORDER_ASC;
      cond.numOfCols = 1;
      cond.colList = taosMemoryCalloc(1, sizeof(SColumnInfo));
      if (cond.colList == NULL) {
        terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
        // the caller reads the failure reason from pTaskInfo->code, not from terrno
        pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
        return NULL;
      }

      cond.colList->colId = 1;
      cond.colList->type = TSDB_DATA_TYPE_TIMESTAMP;
      cond.colList->bytes = sizeof(TSKEY);

      cond.twindows = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};
      cond.suid = pBlockNode->suid;
      cond.type = BLOCK_LOAD_OFFSET_ORDER;

      STsdbReader* pReader = NULL;
      code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, "");
      cleanupQueryTableDataCond(&cond);
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
      }

      // cond.suid is a plain value and is still readable after the condition has been cleaned up
      return createDataBlockInfoScanOperator(pReader, pHandle, cond.suid, pBlockNode, pTaskInfo);

    } else if (QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN == type) {
      SLastRowScanPhysiNode* pScanNode = (SLastRowScanPhysiNode*)pPhyNode;

      int32_t code = extractTableSchemaInfo(pHandle, pScanNode->uid, pTaskInfo);
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
      }

      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));
      if (pTableListInfo->pTableList == NULL) {
        pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
        return NULL;
      }

      if (pScanNode->tableType == TSDB_SUPER_TABLE) {
        code = vnodeGetAllTableList(pHandle->vnode, pScanNode->uid, pTableListInfo->pTableList);
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
        STableKeyInfo info = {.lastKey = 0, .uid = pScanNode->uid, .groupId = 0};
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      return createLastrowScanOperator(pScanNode, pHandle, pTableListInfo->pTableList, pTaskInfo);

    } else {
      // unsupported leaf node; must not continue into the code below, which reads ops[0]
      ASSERT(0);
      pTaskInfo->code = TSDB_CODE_QRY_APP_ERROR;
      return NULL;
    }
  }

  int32_t num = 0;
  size_t  size = LIST_LENGTH(pPhyNode->pChildren);

  SOperatorInfo** ops = taosMemoryCalloc(size, POINTER_BYTES);
  if (ops == NULL) {
    pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  for (int32_t i = 0; i < (int32_t)size; ++i) {
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pPhyNode->pChildren, i);
    ops[i] = createOperatorTree(pChildNode, pTaskInfo, pHandle, queryId, taskId, pTableListInfo, pUser);
    if (ops[i] == NULL) {
      // NOTE(review): operators created for earlier siblings are not released here.
      taosMemoryFree(ops);
      return NULL;
    }
  }

  SOperatorInfo* pOptr = NULL;
  if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
    pOptr = createProjectOperatorInfo(ops[0], (SProjectPhysiNode*)pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_AGG == type) {
    SAggPhysiNode* pAggNode = (SAggPhysiNode*)pPhyNode;
    SExprInfo*     pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
    SSDataBlock*   pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    int32_t    numOfScalarExpr = 0;
    SExprInfo* pScalarExprInfo = NULL;
    if (pAggNode->pExprs != NULL) {
      pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
    }

    // group keys present -> group-by operator, otherwise a plain aggregate operator
    if (pAggNode->pGroupKeys != NULL) {
      SArray* pColList = extractColumnInfo(pAggNode->pGroupKeys);
      pOptr = createGroupOperatorInfo(ops[0], pExprInfo, num, pResBlock, pColList, pAggNode->node.pConditions,
                                      pScalarExprInfo, numOfScalarExpr, pTaskInfo);
    } else {
      pOptr = createAggregateOperatorInfo(ops[0], pExprInfo, num, pResBlock, pAggNode->node.pConditions,
                                          pScalarExprInfo, numOfScalarExpr, pTaskInfo);
    }
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_INTERVAL == type || QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type) {
    SIntervalPhysiNode* pIntervalPhyNode = (SIntervalPhysiNode*)pPhyNode;

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};

    STimeWindowAggSupp as = {
        .waterMark = pIntervalPhyNode->window.watermark,
        .calTrigger = pIntervalPhyNode->window.triggerType,
        .maxTs = INT64_MIN,
    };
    ASSERT(as.calTrigger != STREAM_TRIGGER_MAX_DELAY);

    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    bool    isStream = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type);
    pOptr = createIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, &as, pIntervalPhyNode,
                                       pTaskInfo, isStream);

  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == type) {
    SMergeAlignedIntervalPhysiNode* pIntervalPhyNode = (SMergeAlignedIntervalPhysiNode*)pPhyNode;

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};

    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    pOptr = createMergeAlignedIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId,
                                                   pPhyNode->pConditions, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_INTERVAL == type) {
    SMergeIntervalPhysiNode* pIntervalPhyNode = (SMergeIntervalPhysiNode*)pPhyNode;

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};

    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    pOptr = createMergeIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL == type) {
    int32_t children = 0;
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL == type) {
    int32_t children = 1;
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_SORT == type) {
    pOptr = createSortOperatorInfo(ops[0], (SSortPhysiNode*)pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_GROUP_SORT == type) {
    pOptr = createGroupSortOperatorInfo(ops[0], (SGroupSortPhysiNode*)pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE == type) {
    SMergePhysiNode* pMergePhyNode = (SMergePhysiNode*)pPhyNode;
    pOptr = createMultiwayMergeOperatorInfo(ops, size, pMergePhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_SESSION == type) {
    SSessionWinodwPhysiNode* pSessionNode = (SSessionWinodwPhysiNode*)pPhyNode;

    STimeWindowAggSupp as = {.waterMark = pSessionNode->window.watermark,
                             .calTrigger = pSessionNode->window.triggerType};

    SExprInfo*   pExprInfo = createExprInfo(pSessionNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
    int32_t      tsSlotId = ((SColumnNode*)pSessionNode->window.pTspk)->slotId;

    pOptr = createSessionAggOperatorInfo(ops[0], pExprInfo, num, pResBlock, pSessionNode->gap, tsSlotId, &as,
                                         pPhyNode->pConditions, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == type) {
    pOptr = createStreamSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_SESSION == type) {
    int32_t children = 0;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_SESSION == type) {
    int32_t children = 1;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_PARTITION == type) {
    pOptr = createPartitionOperatorInfo(ops[0], (SPartitionPhysiNode*)pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_STATE == type) {
    SStateWinodwPhysiNode* pStateNode = (SStateWinodwPhysiNode*)pPhyNode;

    STimeWindowAggSupp as = {.waterMark = pStateNode->window.watermark, .calTrigger = pStateNode->window.triggerType};

    SExprInfo*   pExprInfo = createExprInfo(pStateNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
    int32_t      tsSlotId = ((SColumnNode*)pStateNode->window.pTspk)->slotId;

    SColumnNode* pColNode = (SColumnNode*)((STargetNode*)pStateNode->pStateKey)->pExpr;
    SColumn      col = extractColumnFromColumnNode(pColNode);
    pOptr = createStatewindowOperatorInfo(ops[0], pExprInfo, num, pResBlock, &as, tsSlotId, &col, pPhyNode->pConditions,
                                          pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == type) {
    pOptr = createStreamStateAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_JOIN == type) {
    pOptr = createMergeJoinOperatorInfo(ops, size, (SJoinPhysiNode*)pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_FILL == type) {
    pOptr = createFillOperatorInfo(ops[0], (SFillPhysiNode*)pPhyNode, false, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC == type) {
    pOptr = createIndefinitOutputOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_INTERP_FUNC == type) {
    pOptr = createTimeSliceOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else {
    // unsupported node type: report it instead of returning NULL with a success code
    ASSERT(0);
    pTaskInfo->code = TSDB_CODE_QRY_APP_ERROR;
  }

  // only the pointer array is released here; the child operators are passed to the new operator
  taosMemoryFree(ops);
  return pOptr;
}
H
Haojun Liao 已提交
4614

H
Haojun Liao 已提交
4615
/*
 * Build an array of SColumn descriptors from a list of target nodes.
 *
 * Targets whose expression is a column node are converted with extractColumnFromColumnNode().
 * Targets whose expression is a value node get a descriptor built from the target slot id and
 * the result type of the value. Targets with any other expression type are skipped.
 *
 * @param pNodeList  list of STargetNode entries
 * @return a newly created array owned by the caller, or NULL (terrno set) if it cannot be created
 */
SArray* extractColumnInfo(SNodeList* pNodeList) {
  size_t  numOfCols = LIST_LENGTH(pNodeList);
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  for (int32_t i = 0; i < (int32_t)numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);

    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

      SColumn c = extractColumnFromColumnNode(pColNode);
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};
      c.slotId = pNode->slotId;
      c.colId = pNode->slotId;
      // the data type lives in resType, like bytes/scale/precision below;
      // node.type is the node kind (QUERY_NODE_VALUE), not a data type
      c.type = pValNode->node.resType.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
  }

  return pList;
}

L
Liu Jicong 已提交
4648 4649
/*
 * Collect the tables addressed by a table scan node and open a tsdb reader on them.
 *
 * @param pTableScanNode  table scan plan node that supplies the scan description
 * @param pHandle         read handle (meta and vnode are used)
 * @param pTableListInfo  receives the table list produced by getTableList()
 * @param idstr           identifier passed to tsdbReaderOpen() and used in the log; may be NULL
 * @return the opened reader, or NULL. On NULL, terrno holds the failure code; it is 0 when the
 *         only reason is that no table qualified for the query.
 */
STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
                                STableListInfo* pTableListInfo, const char* idstr) {
  SQueryTableDataCond cond = {0};
  STsdbReader*        pReader = NULL;

  int32_t code = getTableList(pHandle->meta, pHandle->vnode, &pTableScanNode->scan, pTableListInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  if (taosArrayGetSize(pTableListInfo->pTableList) == 0) {
    code = 0;
    // passing NULL for a %s conversion is undefined, so log an empty string instead
    qDebug("no table qualified for query, %s", (idstr != NULL) ? idstr : "");
    goto _error;
  }

  code = initQueryTableDataCond(&cond, pTableScanNode);
  if (code != TSDB_CODE_SUCCESS) {
    // NOTE(review): cond is not cleaned up here; confirm initQueryTableDataCond releases
    // whatever it allocated when it fails.
    goto _error;
  }

  code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, idstr);

  // the condition is only needed to open the reader; release it on success and on failure
  cleanupQueryTableDataCond(&cond);

  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pReader;

_error:
  terrno = code;
  return NULL;
}

L
Liu Jicong 已提交
4682 4683 4684 4685 4686 4687 4688 4689 4690 4691 4692 4693 4694
/*
 * Walk down a single-child operator chain until the stream scan operator is found and return
 * the info of the table scan operator embedded in it through `ppInfo`.
 *
 * @return 0 on success, TSDB_CODE_QRY_APP_ERROR if the chain ends without a stream scan
 *         operator or an operator with more than one downstream is met
 */
static int32_t extractTbscanInStreamOpTree(SOperatorInfo* pOperator, STableScanInfo** ppInfo) {
  SOperatorInfo* pCur = pOperator;

  while (pCur->operatorType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    int32_t numOfChildren = pCur->numOfDownstream;

    if (numOfChildren == 0) {
      qError("failed to find stream scan operator");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    if (numOfChildren > 1) {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    // exactly one downstream operator: descend into it
    pCur = pCur->pDownstream[0];
  }

  SStreamScanInfo* pStreamInfo = pCur->info;
  ASSERT(pStreamInfo->pTableScanOp->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN);
  *ppInfo = pStreamInfo->pTableScanOp->info;
  return 0;
}

4702 4703 4704 4705 4706 4707 4708 4709 4710 4711 4712 4713 4714 4715 4716 4717 4718 4719 4720 4721 4722 4723
/*
 * Follow a chain of single-child plan nodes down to its leaf and return the leaf through
 * `ppNode` if it is a table scan node.
 *
 * @return 0 on success; -1 with terrno set to TSDB_CODE_QRY_APP_ERROR if a node on the way has
 *         more than one child or the leaf is not a table scan node
 */
int32_t extractTableScanNode(SPhysiNode* pNode, STableScanPhysiNode** ppNode) {
  SPhysiNode* pCur = pNode;

  // descend while the current node still has children
  while (pCur->pChildren != NULL && LIST_LENGTH(pCur->pChildren) != 0) {
    if (LIST_LENGTH(pCur->pChildren) != 1) {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }

    pCur = (SPhysiNode*)nodesListGetNode(pCur->pChildren, 0);
  }

  if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN != pCur->type) {
    ASSERT(0);
    terrno = TSDB_CODE_QRY_APP_ERROR;
    return -1;
  }

  *ppNode = (STableScanPhysiNode*)pCur;
  return 0;
}

L
Liu Jicong 已提交
4724 4725 4726 4727 4728
/*
 * Replace the data reader of the table scan that sits below the stream scan of `pOperator`.
 *
 * The table scan info is located in the operator tree, the table scan plan node is located in
 * `plan`, the current reader is closed and a new one is created with doCreateDataReader().
 *
 * @param uid, ts  currently unused (see the TODO below)
 * @return 0 on success, -1 if the table scan info or the table scan plan node cannot be found,
 *         TSDB_CODE_QRY_APP_ERROR if the new reader cannot be created
 */
int32_t rebuildReader(SOperatorInfo* pOperator, SSubplan* plan, SReadHandle* pHandle, int64_t uid, int64_t ts) {
  STableScanInfo* pTableScanInfo = NULL;
  if (extractTbscanInStreamOpTree(pOperator, &pTableScanInfo) < 0) {
    return -1;
  }

  STableScanPhysiNode* pNode = NULL;
  if (extractTableScanNode(plan->pNode, &pNode) < 0) {
    ASSERT(0);
    // without a plan node there is nothing to build the reader from; do not continue with NULL
    return -1;
  }

  tsdbReaderClose(pTableScanInfo->dataReader);

  // NOTE(review): the table list collected into `info` is never released in this function;
  // confirm whether the reader keeps a reference to it before freeing it here.
  STableListInfo info = {0};
  pTableScanInfo->dataReader = doCreateDataReader(pNode, pHandle, &info, NULL);
  if (pTableScanInfo->dataReader == NULL) {
    ASSERT(0);
    qError("failed to create data reader");
    return TSDB_CODE_QRY_APP_ERROR;
  }
  // TODO: set uid and ts to data reader
  return 0;
}

C
Cary Xu 已提交
4748
/*
 * Serialize the result rows of `ops` and of all its downstream operators into one buffer.
 *
 * Buffer layout: the first int32_t of *result holds the total number of bytes in the buffer
 * (including that int32_t itself); the encoded data of every operator is appended after it.
 * Operators without an encodeResultRow callback, or whose callback produced no data, add
 * nothing to the buffer.
 *
 * @param result        in/out buffer; allocated on first use and grown afterwards. It is freed
 *                      and reset to NULL when the encode callback or the reallocation fails.
 * @param length        receives the total buffer size after every append
 * @param nOptrWithVal  incremented once for every operator that contributed data
 * @return TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT for a NULL output argument,
 *         TSDB_CODE_OUT_OF_MEMORY, or the error reported by an encode callback
 */
int32_t encodeOperator(SOperatorInfo* ops, char** result, int32_t* length, int32_t* nOptrWithVal) {
  if (ops->fpSet.encodeResultRow) {
    if (NULL == result || NULL == length || NULL == nOptrWithVal) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    char*   pEncoded = NULL;
    int32_t encodedLen = 0;
    int32_t rc = ops->fpSet.encodeResultRow(ops, &pEncoded, &encodedLen);
    if (rc != TDB_CODE_SUCCESS) {
      if (*result != NULL) {
        taosMemoryFree(*result);
        *result = NULL;
      }
      return rc;
    }

    if (encodedLen == 0) {
      // nothing produced by this operator; continue with the downstream operators
      ASSERT(!pEncoded);
    } else {
      ++(*nOptrWithVal);

      ASSERT(encodedLen >= 0);

      if (*result != NULL) {
        // append to the existing buffer and bump the size stored in its header
        int32_t usedBytes = *(int32_t*)(*result);
        char*   pGrown = (char*)taosMemoryRealloc(*result, usedBytes + encodedLen);
        if (pGrown == NULL) {
          taosMemoryFree(pEncoded);
          taosMemoryFree(*result);
          *result = NULL;
          return TSDB_CODE_OUT_OF_MEMORY;
        }
        *result = pGrown;
        memcpy(*result + usedBytes, pEncoded, encodedLen);
        *(int32_t*)(*result) += encodedLen;
      } else {
        // first contribution: reserve room for the size header in front of the data
        *result = (char*)taosMemoryCalloc(1, encodedLen + sizeof(int32_t));
        if (*result == NULL) {
          taosMemoryFree(pEncoded);
          return TSDB_CODE_OUT_OF_MEMORY;
        }
        memcpy(*result + sizeof(int32_t), pEncoded, encodedLen);
        *(int32_t*)(*result) = encodedLen + sizeof(int32_t);
      }

      taosMemoryFree(pEncoded);
      *length = *(int32_t*)(*result);
    }
  }

  for (int32_t idx = 0; idx < ops->numOfDownstream; ++idx) {
    int32_t rc = encodeOperator(ops->pDownstream[idx], result, length, nOptrWithVal);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }
  }

  return TDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4808
/*
 * Restore the result rows of `ops` and of its downstream operators from an encoded buffer.
 *
 * `result` starts with an int32_t holding the total size, followed by the data of the current
 * operator, whose first int32_t is read as the size of that data. After the operator has been
 * decoded the buffer position is advanced by that size and the remaining size is written at the
 * new position (the buffer is modified in place), so the next operator sees the same layout.
 *
 * @return TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT if an operator needs data but `result`
 *         is NULL, or the error reported by a decode callback
 */
int32_t decodeOperator(SOperatorInfo* ops, const char* result, int32_t length) {
  if (ops->fpSet.decodeResultRow) {
    if (NULL == result) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    ASSERT(length == *(int32_t*)result);

    const char* payload = result + sizeof(int32_t);
    int32_t     rc = ops->fpSet.decodeResultRow(ops, (char*)payload);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }

    int32_t total = *(int32_t*)result;
    int32_t consumed = *(int32_t*)payload;

    if (total != consumed + sizeof(int32_t)) {
      // more data follows: move on and store the remaining size in front of it
      int32_t remaining = total - consumed;
      result += consumed;
      *(int32_t*)(result) = remaining;
      length = remaining;
    } else {  // the last data
      result = NULL;
      length = 0;
    }
  }

  for (int32_t idx = 0; idx < ops->numOfDownstream; ++idx) {
    int32_t rc = decodeOperator(ops->pDownstream[idx], result, length);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }
  }

  return TDB_CODE_SUCCESS;
}

D
dapan1121 已提交
4845
/*
 * Create the parameter object required by the data sink described by `pNode`.
 *
 *  - query-insert sink: an SInserterParam that carries `readHandle`
 *  - delete sink:       an SDeleterParam with the suid and the uids of all tables in the
 *                       table list of the task
 *  - any other sink:    nothing is created and *pParam is left untouched
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY if an allocation fails
 */
int32_t createDataSinkParam(SDataSinkNode* pNode, void** pParam, qTaskInfo_t* pTaskInfo, SReadHandle* readHandle) {
  SExecTaskInfo* pTask = *(SExecTaskInfo**)pTaskInfo;

  if (QUERY_NODE_PHYSICAL_PLAN_QUERY_INSERT == pNode->type) {
    SInserterParam* pInserter = taosMemoryCalloc(1, sizeof(SInserterParam));
    if (pInserter == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pInserter->readHandle = readHandle;
    *pParam = pInserter;
    return TSDB_CODE_SUCCESS;
  }

  if (QUERY_NODE_PHYSICAL_PLAN_DELETE == pNode->type) {
    SDeleterParam* pDeleter = taosMemoryCalloc(1, sizeof(SDeleterParam));
    if (pDeleter == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    int32_t numOfTables = taosArrayGetSize(pTask->tableqinfoList.pTableList);
    pDeleter->suid = pTask->tableqinfoList.suid;
    pDeleter->pUidList = taosArrayInit(numOfTables, sizeof(uint64_t));
    if (pDeleter->pUidList == NULL) {
      taosMemoryFree(pDeleter);
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // copy the uid of every table of the task into the deleter parameter
    for (int32_t idx = 0; idx < numOfTables; ++idx) {
      STableKeyInfo* pKeyInfo = taosArrayGet(pTask->tableqinfoList.pTableList, idx);
      taosArrayPush(pDeleter->pUidList, &pKeyInfo->uid);
    }

    *pParam = pDeleter;
    return TSDB_CODE_SUCCESS;
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
4886
/*
 * Create the execution task for a sub plan and build its operator tree.
 *
 * On success *pTaskInfo points to the new task. On failure the task object is freed,
 * *pTaskInfo is reset to NULL, and the returned code is also stored in terrno.
 *
 * @return TSDB_CODE_SUCCESS, TSDB_CODE_QRY_OUT_OF_MEMORY if the task cannot be allocated, or
 *         the code recorded in the task when the operator tree cannot be built
 */
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
                               const char* sql, EOPTR_EXEC_MODEL model) {
  uint64_t queryId = pPlan->id.queryId;
  int32_t  code = TSDB_CODE_SUCCESS;

  *pTaskInfo = createExecTaskInfo(queryId, taskId, model, pPlan->dbFName);
  if (NULL == *pTaskInfo) {
    code = TSDB_CODE_QRY_OUT_OF_MEMORY;
  } else {
    SExecTaskInfo* pTask = *pTaskInfo;

    pTask->sql = sql;
    pTask->tableqinfoList.pTagCond = pPlan->pTagCond;
    pTask->tableqinfoList.pTagIndexCond = pPlan->pTagIndexCond;
    pTask->pRoot =
        createOperatorTree(pPlan->pNode, pTask, pHandle, queryId, taskId, &pTask->tableqinfoList, pPlan->user);

    if (pTask->pRoot != NULL) {
      return code;
    }

    // the operator tree could not be built: report whatever was recorded in the task
    code = pTask->code;
  }

  taosMemoryFreeClear(*pTaskInfo);
  terrno = code;
  return code;
}

wmmhello's avatar
wmmhello 已提交
4916 4917 4918
/**
 * Release every container owned by a table list and reset the owning pointers.
 *
 * When needSortTableByGroupId is set, each element of pGroupList is itself an array and is
 * destroyed before pGroupList. All three pointers are cleared afterwards so that no dangling
 * pointer is left behind in the structure.
 *
 * @param pTableqinfoList table list whose members are released; the structure itself is not freed
 */
static void doDestroyTableList(STableListInfo* pTableqinfoList) {
  taosArrayDestroy(pTableqinfoList->pTableList);
  taosHashCleanup(pTableqinfoList->map);

  if (pTableqinfoList->needSortTableByGroupId) {
    // the group count does not change while the groups are being destroyed, so read it once
    int32_t numOfGroups = (int32_t)taosArrayGetSize(pTableqinfoList->pGroupList);
    for (int32_t i = 0; i < numOfGroups; i++) {
      SArray* pGroup = taosArrayGetP(pTableqinfoList->pGroupList, i);
      taosArrayDestroy(pGroup);
    }
  }
  taosArrayDestroy(pTableqinfoList->pGroupList);

  pTableqinfoList->pTableList = NULL;
  pTableqinfoList->map = NULL;
  pTableqinfoList->pGroupList = NULL;
}

L
Liu Jicong 已提交
4931
/**
 * Destroy an execution task: its table list, operator tree, table schema info, the stored SQL
 * text, the task id string and finally the task structure itself.
 *
 * @param pTaskInfo task to destroy; NULL is accepted and ignored
 */
void doDestroyTask(SExecTaskInfo* pTaskInfo) {
  if (pTaskInfo == NULL) {
    // nothing to release; also keeps the debug log below from dereferencing NULL
    return;
  }

  qDebug("%s execTask is freed", GET_TASKID(pTaskInfo));

  doDestroyTableList(&pTaskInfo->tableqinfoList);
  destroyOperatorInfo(pTaskInfo->pRoot);
  cleanupTableSchemaInfo(pTaskInfo);

  taosMemoryFreeClear(pTaskInfo->sql);
  taosMemoryFreeClear(pTaskInfo->id.str);
  taosMemoryFreeClear(pTaskInfo);
}

/**
 * Copy one tag value into a result buffer.
 *
 * @param output destination buffer
 * @param val    source value; NULL writes the type's null representation instead
 * @param type   data type of the value
 * @param bytes  number of bytes available for the value in the destination
 */
static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes) {
  if (NULL == val) {
    setNull(output, type, bytes);
    return;
  }

  // fixed-length types are copied verbatim
  if (!IS_VAR_DATA_TYPE(type)) {
    memcpy(output, val, bytes);
    return;
  }

  // variable-length value that fits: copy header and payload together
  if (varDataTLen(val) <= bytes) {
    varDataCopy(output, val);
    return;
  }

  // The value is longer than the destination allows; keep only the part of the payload that fits.
  int32_t maxLen = bytes - VARSTR_HEADER_SIZE;
  int32_t len = (varDataLen(val) > maxLen) ? maxLen : varDataLen(val);
  memcpy(varDataVal(output), varDataVal(val), len);
  varDataSetLen(output, len);
}

/**
 * Estimate the query buffer needed for a number of tables: 1.5 times the size of one
 * STableQueryInfo per table.
 *
 * @param numOfTables number of tables involved in the query
 * @return estimated size in bytes
 */
static int64_t getQuerySupportBufSize(size_t numOfTables) {
  const size_t perTableSize = sizeof(STableQueryInfo);
  // buffer consumed inside tsdb (STableCheckInfo) is not accounted for here
  const double estimated = perTableSize * 1.5 * numOfTables;
  return (int64_t)estimated;
}

/**
 * Reserve query buffer for the given number of tables from tsQueryBufferSizeBytes.
 *
 * A negative tsQueryBufferSizeBytes always succeeds without reserving anything; zero always
 * fails. Otherwise the estimated size is subtracted with a compare-and-swap that is retried
 * until it either succeeds or the remaining amount would become negative.
 *
 * @param numOfTables number of tables involved in the query
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_NOT_ENOUGH_BUFFER when the reservation is refused
 */
int32_t checkForQueryBuf(size_t numOfTables) {
  int64_t required = getQuerySupportBufSize(numOfTables);

  if (tsQueryBufferSizeBytes < 0) {
    return TSDB_CODE_SUCCESS;
  }

  // disable query processing if the value of tsQueryBufferSize is zero.
  if (tsQueryBufferSizeBytes <= 0) {
    return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
  }

  for (;;) {
    int64_t current = tsQueryBufferSizeBytes;
    int64_t remain = current - required;
    if (remain < 0) {
      return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
    }

    // the swap returns the previous value; it equals `current` only when the swap took place
    if (atomic_val_compare_exchange_64(&tsQueryBufferSizeBytes, current, remain) == current) {
      return TSDB_CODE_SUCCESS;
    }
  }
}

/**
 * Add the estimated buffer size for the given number of tables back to tsQueryBufferSizeBytes.
 * Nothing is done while tsQueryBufferSizeBytes is negative.
 *
 * @param numOfTables number of tables whose estimated buffer size is returned
 */
void releaseQueryBuf(size_t numOfTables) {
  if (tsQueryBufferSizeBytes >= 0) {
    int64_t released = getQuerySupportBufSize(numOfTables);

    // atomically add the estimate back to the available amount
    atomic_add_fetch_64(&tsQueryBufferSizeBytes, released);
  }
}
D
dapan1121 已提交
5002

dengyihao's avatar
dengyihao 已提交
5003 5004
/**
 * Append the explain/execution statistics of an operator, followed by those of all its
 * downstream operators (visited recursively, in order), to a growable result array.
 *
 * @param operatorInfo operator to collect from
 * @param pRes         in/out: result array; grown in steps of 10 entries when full
 * @param capacity     in/out: number of entries *pRes can currently hold
 * @param resNum       in/out: number of entries already filled in *pRes
 * @return TSDB_CODE_SUCCESS, or an error code. On every failure path *pRes is freed and set to
 *         NULL; *capacity and *resNum are not reset.
 */
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SExplainExecInfo** pRes, int32_t* capacity,
                                   int32_t* resNum) {
  if (*resNum >= *capacity) {
    int32_t newCapacity = *capacity + 10;

    // Reallocate through a temporary so the current buffer is not lost when the call fails
    // (assumes taosMemoryRealloc keeps the original allocation on failure, like realloc).
    SExplainExecInfo* pNew = taosMemoryRealloc(*pRes, newCapacity * sizeof(SExplainExecInfo));
    if (NULL == pNew) {
      qError("malloc %d failed", newCapacity * (int32_t)sizeof(SExplainExecInfo));
      taosMemoryFreeClear(*pRes);
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }

    *pRes = pNew;
    *capacity = newCapacity;
  }

  SExplainExecInfo* pInfo = &(*pRes)[*resNum];

  pInfo->numOfRows = operatorInfo->resultInfo.totalRows;
  pInfo->startupCost = operatorInfo->cost.openCost;
  pInfo->totalCost = operatorInfo->cost.totalCost;

  if (operatorInfo->fpSet.getExplainFn) {
    int32_t code = operatorInfo->fpSet.getExplainFn(operatorInfo, &pInfo->verboseInfo, &pInfo->verboseLen);
    if (code) {
      qError("%s operator getExplainFn failed, code:%s", GET_TASKID(operatorInfo->pTaskInfo), tstrerror(code));
      // release the array here as well, so every failure path leaves *pRes == NULL
      taosMemoryFreeClear(*pRes);
      return code;
    }
  } else {
    pInfo->verboseLen = 0;
    pInfo->verboseInfo = NULL;
  }

  ++(*resNum);

  // pInfo must not be used past this point: the recursion below may reallocate *pRes
  for (int32_t i = 0; i < operatorInfo->numOfDownstream; ++i) {
    int32_t code = getOperatorExplainExecInfo(operatorInfo->pDownstream[i], pRes, capacity, resNum);
    if (code) {
      taosMemoryFreeClear(*pRes);
      // report the real failure instead of masking it as out-of-memory
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}
5
54liuyao 已提交
5045

L
Liu Jicong 已提交
5046
/**
 * Initialise a stream aggregate supporter: key buffer, result-row hash table, scan-window array
 * and the disk-based result buffer, then point every function context at that result buffer.
 *
 * @param pSup        supporter to initialise
 * @param pKey        key passed to createDiskbasedBuf()
 * @param pCtx        array of function contexts; each pBuf is set to the created result buffer
 * @param numOfOutput number of entries in pCtx
 * @param size        stored as pSup->valueSize
 * @return TSDB_CODE_OUT_OF_MEMORY when an allocation fails, otherwise the result of
 *         createDiskbasedBuf(). Members allocated before a failure are left in pSup and are not
 *         released here. NOTE(review): presumably the caller destroys pSup on failure - confirm.
 */
int32_t initStreamAggSupporter(SStreamAggSupporter* pSup, const char* pKey, SqlFunctionCtx* pCtx, int32_t numOfOutput,
                               int32_t size) {
  pSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pSup->keySize = sizeof(int64_t) + sizeof(TSKEY);
  pSup->pKeyBuf = taosMemoryCalloc(1, pSup->keySize);

  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pSup->pResultRows = taosHashInit(1024, hashFn, false, HASH_NO_LOCK);
  if (pSup->pKeyBuf == NULL || pSup->pResultRows == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  pSup->valueSize = size;

  pSup->pScanWindow = taosArrayInit(4, sizeof(STimeWindow));
  if (pSup->pScanWindow == NULL) {
    // checked like the other allocations so a failed init is reported instead of carried forward
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // grow the page size (power of two, starting at 4096) until it is at least 4 * resultRowSize
  int32_t pageSize = 4096;
  while (pageSize < pSup->resultRowSize * 4) {
    pageSize <<= 1u;
  }

  // at least four pages need to be in buffer
  int32_t bufSize = 4096 * 256;
  if (bufSize <= pageSize) {
    bufSize = pageSize * 4;
  }

  int32_t code = createDiskbasedBuf(&pSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);

  // the contexts are wired to pSup->pResultBuf regardless of `code`; callers must check the result
  for (int32_t i = 0; i < numOfOutput; ++i) {
    pCtx[i].pBuf = pSup->pResultBuf;
  }
  return code;
}