executorimpl.c 181.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

H
Haojun Liao 已提交
16 17
#include "filter.h"
#include "function.h"
18 19
#include "functionMgt.h"
#include "os.h"
H
Haojun Liao 已提交
20
#include "querynodes.h"
21
#include "tfill.h"
dengyihao's avatar
dengyihao 已提交
22
#include "tname.h"
X
Xiaoyu Wang 已提交
23
#include "tref.h"
24

H
Haojun Liao 已提交
25
#include "tdatablock.h"
26
#include "tglobal.h"
H
Haojun Liao 已提交
27
#include "tmsg.h"
H
Haojun Liao 已提交
28
#include "tsort.h"
29
#include "ttime.h"
H
Haojun Liao 已提交
30

31
#include "executorimpl.h"
dengyihao's avatar
dengyihao 已提交
32
#include "index.h"
33
#include "query.h"
34 35
#include "tcompare.h"
#include "tcompression.h"
H
Haojun Liao 已提交
36
#include "thash.h"
37
#include "ttypes.h"
dengyihao's avatar
dengyihao 已提交
38
#include "vnode.h"
39

H
Haojun Liao 已提交
40
// Scan-state helpers; both expect a pointer to a structure exposing a `scanFlag` member.
#define IS_MAIN_SCAN(runtime)          ((runtime)->scanFlag == MAIN_SCAN)
#define SET_REVERSE_SCAN_FLAG(runtime) ((runtime)->scanFlag = REVERSE_SCAN)

// Selects the forward step for a scan order: QUERY_ASC_FORWARD_STEP for TSDB_ORDER_ASC, QUERY_DESC_FORWARD_STEP
// for any other order value.
#define GET_FORWARD_DIRECTION_FACTOR(ord) (((ord) == TSDB_ORDER_ASC) ? QUERY_ASC_FORWARD_STEP : QUERY_DESC_FORWARD_STEP)

45 46 47 48 49
// Bit flags describing the retrieval state of a projection.
enum {
  PROJECT_RETRIEVE_CONTINUE = (1 << 0),
  PROJECT_RETRIEVE_DONE = (1 << 1),
};

50 51
#if 0
// Fault-injection allocators (compiled out). Each wrapper returns NULL for some values of taosRand() and
// otherwise forwards to the matching taosMemory* routine; the macros at the bottom route the plain
// malloc/calloc/realloc names to these wrappers.

// Returns NULL when taosRand() is a multiple of 1000, otherwise forwards to taosMemoryMalloc.
static UNUSED_FUNC void* u_malloc(size_t __size) {
  uint32_t v = taosRand();

  if (v % 1000 == 0) {
    return NULL;
  } else {
    return taosMemoryMalloc(__size);
  }
}

// Returns NULL when taosRand() is a multiple of 1000, otherwise forwards to taosMemoryCalloc.
static UNUSED_FUNC void* u_calloc(size_t num, size_t __size) {
  uint32_t v = taosRand();
  if (v % 1000 == 0) {
    return NULL;
  } else {
    return taosMemoryCalloc(num, __size);
  }
}

// Returns NULL when taosRand() % 5 is 0 or 1, otherwise forwards to taosMemoryRealloc.
static UNUSED_FUNC void* u_realloc(void* p, size_t __size) {
  uint32_t v = taosRand();
  if (v % 5 <= 1) {
    return NULL;
  } else {
    return taosMemoryRealloc(p, __size);
  }
}

#define calloc  u_calloc
#define malloc  u_malloc
#define realloc u_realloc
#endif

X
Xiaoyu Wang 已提交
84
// Clears the bits given by `st` in the `status` member of `q`.
#define CLEAR_QUERY_STATUS(q, st)   ((q)->status &= (~(st)))
// True when the `interval.interval` member of `_q` is positive.
#define QUERY_IS_INTERVAL_QUERY(_q) ((_q)->interval.interval > 0)

L
Liu Jicong 已提交
87 88 89
// Returns twice the value of tsShellActivityTimer.
int32_t getMaximumIdleDurationSec() {
  const int32_t idleDuration = tsShellActivityTimer * 2;
  return idleDuration;
}

/**
 * Placeholder lookup of the function id of an expression.
 *
 * Asserts that the expression info and its expression tree are present and that the tree root is a
 * TEXPR_UNARYEXPR_NODE. The returned id is currently always 0.
 */
static int32_t getExprFunctionId(SExprInfo* pExprInfo) {
  assert(pExprInfo != NULL && pExprInfo->pExpr != NULL && pExprInfo->pExpr->nodeType == TEXPR_UNARYEXPR_NODE);

  const int32_t functionId = 0;
  return functionId;
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes);

96
static void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExpr, SSDataBlock* pSDataBlock);
97

X
Xiaoyu Wang 已提交
98
static void releaseQueryBuf(size_t numOfTables);
99 100 101 102 103

static void destroySFillOperatorInfo(void* param, int32_t numOfOutput);
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput);
static void destroyOrderOperatorInfo(void* param, int32_t numOfOutput);
static void destroyAggOperatorInfo(void* param, int32_t numOfOutput);
X
Xiaoyu Wang 已提交
104

H
Haojun Liao 已提交
105
static void destroyIntervalOperatorInfo(void* param, int32_t numOfOutput);
H
Haojun Liao 已提交
106 107
static void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput);

108 109
static void destroyOperatorInfo(SOperatorInfo* pOperator);

110
/**
 * Marks an operator as finished.
 *
 * Always sets the operator status to OP_EXEC_DONE. When the operator is attached to a task, it additionally
 * records the operator's total cost relative to the task's start stamp and sets the task status to
 * TASK_COMPLETED.
 *
 * @param pOperator operator to finish; must not be NULL.
 */
void doSetOperatorCompleted(SOperatorInfo* pOperator) {
  pOperator->status = OP_EXEC_DONE;

  // The task pointer used to be dereferenced for the cost computation before it was NULL-checked; every use
  // of it now stays behind the check.
  if (pOperator->pTaskInfo == NULL) {
    return;
  }

  // cost.start is scaled by 1000 before being subtracted from the microsecond clock
  // (presumably milliseconds -> microseconds; TODO confirm), and the difference is divided by 1000.0.
  pOperator->cost.totalCost = (taosGetTimestampUs() - pOperator->pTaskInfo->cost.start * 1000) / 1000.0;
  setTaskStatus(pOperator->pTaskInfo, TASK_COMPLETED);
}
118

H
Haojun Liao 已提交
119
/**
 * Default "open" callback: flags the operator as opened via OPTR_SET_OPENED and records a zero open cost.
 *
 * @return always TSDB_CODE_SUCCESS.
 */
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator) {
  const int32_t code = TSDB_CODE_SUCCESS;

  OPTR_SET_OPENED(pOperator);
  pOperator->cost.openCost = 0;

  return code;
}

125
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
L
Liu Jicong 已提交
126
                                   __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
127
                                   __optr_decode_fn_t decode, __optr_explain_fn_t explain) {
128 129 130 131 132 133 134 135 136 137 138 139 140 141
  SOperatorFpSet fpSet = {
      ._openFn = openFn,
      .getNextFn = nextFn,
      .getStreamResFn = streamFn,
      .cleanupFn = cleanup,
      .closeFn = closeFn,
      .encodeResultRow = encode,
      .decodeResultRow = decode,
      .getExplainFn = explain,
  };

  return fpSet;
}

H
Haojun Liao 已提交
142
// No-op close callback: both arguments are ignored.
void operatorDummyCloseFn(void* param, int32_t numOfCols) {
  (void)param;
  (void)numOfCols;
}
H
Haojun Liao 已提交
143

X
Xiaoyu Wang 已提交
144 145 146
static int32_t doCopyToSDataBlock(SExecTaskInfo* taskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo,
                                  SDiskbasedBuf* pBuf, SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset,
                                  SqlFunctionCtx* pCtx, int32_t numOfExprs);
H
Haojun Liao 已提交
147

148
static void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size);
L
Liu Jicong 已提交
149 150
static void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                                     uint64_t groupId);
151

L
Liu Jicong 已提交
152 153
// setup the output buffer for each operator
/**
 * Tells whether a column may contain NULL values.
 *
 * @param pColumn column descriptor; its flag and colId are inspected.
 * @param pStatis optional pre-computed statistics for the column, may be NULL.
 * @return false for columns matching TSDB_COL_IS_TAG / TSDB_COL_IS_UD_COL or carrying the primary timestamp
 *         column id, and false when statistics are present and report zero NULLs; true otherwise.
 */
static bool hasNull(SColumn* pColumn, SColumnDataAgg* pStatis) {
  const bool exemptColumn = TSDB_COL_IS_TAG(pColumn->flag) || TSDB_COL_IS_UD_COL(pColumn->flag) ||
                            pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID;
  if (exemptColumn) {
    return false;
  }

  // without statistics nothing rules NULLs out, so report true
  const bool provenNullFree = (pStatis != NULL) && (pStatis->numOfNull == 0);
  return !provenNullFree;
}

166
#if 0
// Compiled out. Looks up the (uid, key) pair in the runtime environment's result-row hash table and reports
// whether a matching result row is considered to exist for the current pResultRowInfo.
static bool chkResultRowFromKey(STaskRuntimeEnv* pRuntimeEnv, SResultRowInfo* pResultRowInfo, char* pData,
                                int16_t bytes, bool masterscan, uint64_t uid) {
  bool existed = false;
  SET_RES_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid);

  SResultRow** p1 =
      (SResultRow**)taosHashGet(pRuntimeEnv->pResultRowHashTable, pRuntimeEnv->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));

  // in case of repeat scan/reverse scan, no new time window added.
  if (QUERY_IS_INTERVAL_QUERY(pRuntimeEnv->pQueryAttr)) {
    if (!masterscan) {  // the *p1 may be NULL in case of sliding+offset exists.
      return p1 != NULL;
    }

    if (p1 != NULL) {
      if (pResultRowInfo->size == 0) {
        existed = false;
      } else if (pResultRowInfo->size == 1) {
        //        existed = (pResultRowInfo->pResult[0] == (*p1));
      } else {  // check if current pResultRowInfo contains the existed pResultRow
        SET_RES_EXT_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid, pResultRowInfo);
        int64_t* index =
            taosHashGet(pRuntimeEnv->pResultRowListSet, pRuntimeEnv->keyBuf, GET_RES_EXT_WINDOW_KEY_LEN(bytes));
        existed = (index != NULL);
      }
    }

    return existed;
  }

  return p1 != NULL;
}
#endif
204

205
/**
 * Reserves interBufSize bytes for a new result row inside the disk-based buffer of a table group.
 *
 * The row is placed at the current end of the group's last page when it fits; otherwise (or when the group has
 * no page yet) a fresh page is requested. The chosen page is marked dirty and its used-size counter (`num`) is
 * advanced by interBufSize.
 *
 * @param pResultBuf   disk-based buffer that owns the pages.
 * @param tableGroupId group whose page list is used.
 * @param interBufSize number of bytes to reserve for the row.
 * @return pointer to the reserved row with pageId/offset filled in, or NULL when no page could be obtained.
 */
SResultRow* getNewResultRow(SDiskbasedBuf* pResultBuf, int64_t tableGroupId, int32_t interBufSize) {
  SFilePage* pData = NULL;
  bool       isNewPage = false;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tableGroupId);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
    isNewPage = true;
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

    if (pData != NULL && pData->num + interBufSize > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
      isNewPage = true;
    }
  }

  // Both page sources may fail; the first-page path used to dereference the result unconditionally.
  if (pData == NULL) {
    return NULL;
  }

  if (isNewPage) {
    // a fresh page starts right after its SFilePage header
    pData->num = sizeof(SFilePage);
  }

  setBufPageDirty(pData, true);

  // set the number of rows in current disk page
  SResultRow* pResultRow = (SResultRow*)((char*)pData + pData->num);
  pResultRow->pageId = pageId;
  pResultRow->offset = (int32_t)pData->num;

  pData->num += interBufSize;

  return pResultRow;
}

247 248 249 250 251 252 253
/**
 * the struct of key in hash table
 * +----------+---------------+
 * | group id |   key data    |
 * | 8 bytes  | actual length |
 * +----------+---------------+
 */
254 255 256
/**
 * Finds, or creates, the result row for the (groupId, pData) key and makes it the active row of pResultRowInfo.
 *
 * An existing row is reused when the key is present in pSup->pResultRowHashTable and either the query is not an
 * interval query or this is the main scan. In every other case a new row of pSup->resultRowSize bytes is
 * reserved, initialized, and its position is stored in the hash table under the key.
 *
 * Error handling is non-local: the function longjmp()s to pTaskInfo->env with TSDB_CODE_OUT_OF_MEMORY when no
 * row can be reserved, and with TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW when the hash table holds more than
 * MAX_INTERVAL_TIME_WINDOW entries.
 *
 * @return the result row that is now recorded in pResultRowInfo->cur.
 */
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo, char* pData,
                                   int16_t bytes, bool masterscan, uint64_t groupId, SExecTaskInfo* pTaskInfo,
                                   bool isIntervalQuery, SAggSupporter* pSup) {
  SET_RES_WINDOW_KEY(pSup->keyBuf, pData, bytes, groupId);

  SResultRowPosition* p1 =
      (SResultRowPosition*)taosHashGet(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));

  SResultRow* pResult = NULL;

  // Interval queries only reuse an existing row during the main scan (p1 may be NULL when sliding+offset
  // exists); for group-by-column queries an existing row is always reused.
  bool reuseExisting = (p1 != NULL) && (!isIntervalQuery || masterscan);
  if (reuseExisting) {
    pResult = getResultRowByPos(pResultBuf, p1);
    ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
  }

  // 1. close current opened time window
  if (pResultRowInfo->cur.pageId != -1 && ((pResult == NULL) || (pResult->pageId != pResultRowInfo->cur.pageId))) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_1");
#endif
    // the active row lives on another page: fetch that page and release it
    SResultRowPosition pos = pResultRowInfo->cur;
    SFilePage*         pPage = getBufPage(pResultBuf, pos.pageId);
    releaseBufPage(pResultBuf, pPage);
  }

  // allocate a new buffer page
  if (pResult == NULL) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_2");
#endif
    ASSERT(pSup->resultRowSize > 0);
    pResult = getNewResultRow(pResultBuf, groupId, pSup->resultRowSize);
    if (pResult == NULL) {
      // getNewResultRow() reports buffer exhaustion with NULL; bail out instead of dereferencing it below
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    initResultRow(pResult);

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = pResult->pageId, .offset = pResult->offset};
    taosHashPut(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes), &pos,
                sizeof(SResultRowPosition));
  }

  // 2. set the new time window to be the new active time window
  pResultRowInfo->cur = (SResultRowPosition){.pageId = pResult->pageId, .offset = pResult->offset};

  // too many time window in query
  if (taosHashGetSize(pSup->pResultRowHashTable) > MAX_INTERVAL_TIME_WINDOW) {
    longjmp(pTaskInfo->env, TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW);
  }

  return pResult;
}

317
// Allocates a new buffer page for each table. TODO: this design needs to be optimized.
L
Liu Jicong 已提交
318
/**
 * Reserves `size` bytes in the disk-based buffer for a window result row that has no page assigned yet.
 *
 * Rows whose pageId is already set (not -1) are left untouched. Otherwise the space is taken from the last page
 * of group `tid` when it fits, or from a freshly requested page; the row's pageId/offset are filled in and the
 * page's used-size counter is advanced.
 *
 * @return 0 on success (including the already-assigned case), -1 when no page could be obtained.
 */
static int32_t addNewWindowResultBuf(SResultRow* pWindowRes, SDiskbasedBuf* pResultBuf, int32_t tid, uint32_t size) {
  if (pWindowRes->pageId != -1) {
    return 0;
  }

  SFilePage* pData = NULL;
  bool       isNewPage = false;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tid);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tid, &pageId);
    isNewPage = true;
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

    if (pData != NULL && pData->num + size > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tid, &pageId);
      isNewPage = true;
    }
  }

  // Both page sources may fail; the first-page path used to dereference the result unconditionally.
  if (pData == NULL) {
    return -1;
  }

  if (isNewPage) {
    // a fresh page starts right after its SFilePage header
    pData->num = sizeof(SFilePage);
  }

  // The row is known to be unassigned here (see the early return above), so claim the space directly.
  pWindowRes->pageId = pageId;
  pWindowRes->offset = (int32_t)pData->num;

  pData->num += size;
  assert(pWindowRes->pageId >= 0);

  return 0;
}

364
// Row layout of the time-window column (rows 0..4): query_range_start, query_range_end, window_duration,
// window_start, window_end
365
/**
 * Prepares a five-row timestamp column describing a query window.
 *
 * Rows 0/1 and rows 3/4 are both filled with the window's skey/ekey; row 2 is written as 0.
 *
 * @param pColData     column to configure and fill.
 * @param pQueryWindow window whose skey/ekey are copied into the column.
 */
void initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow) {
  pColData->info.type = TSDB_DATA_TYPE_TIMESTAMP;
  pColData->info.bytes = sizeof(int64_t);
  colInfoDataEnsureCapacity(pColData, 5);

  int32_t row = 0;
  colDataAppendInt64(pColData, row++, &pQueryWindow->skey);
  colDataAppendInt64(pColData, row++, &pQueryWindow->ekey);

  // this value may be variable in case of 'n' and 'y'.
  int64_t duration = 0;
  colDataAppendInt64(pColData, row++, &duration);

  colDataAppendInt64(pColData, row++, &pQueryWindow->skey);
  colDataAppendInt64(pColData, row++, &pQueryWindow->ekey);
}

H
Haojun Liao 已提交
379 380 381 382
// Counterpart of initExecTimeWindowInfo(): hands the column to colDataDestroy().
void cleanupExecTimeWindowInfo(SColumnInfoData* pColData) {
  SColumnInfoData* pTimeWindowCol = pColData;
  colDataDestroy(pTimeWindowCol);
}

X
Xiaoyu Wang 已提交
383 384 385
/**
 * Applies every function context in pCtx[0..numOfOutput) to the row range [offset, offset + forwardStep).
 *
 * For each context the input range is temporarily narrowed to that range, and the pre-computed block
 * statistics are disabled when the range does not cover the whole block (forwardStep < numOfTotal).
 *  - Window pseudo-column functions are evaluated through their scalar `sfp.process` callback against
 *    pTimeWindowData, writing into the context's result-entry buffer; the narrowed input is NOT restored on
 *    this path.
 *  - All other functions run through `fpSet.process` when functionNeedToExecute() allows it; afterwards the
 *    original input range and statistics flag are restored.
 *
 * On a processing error the code is stored in taskInfo->code and control leaves via longjmp(taskInfo->env).
 * pWin, tsCol and order are not used by this function.
 */
void doApplyFunctions(SExecTaskInfo* taskInfo, SqlFunctionCtx* pCtx, STimeWindow* pWin,
                      SColumnInfoData* pTimeWindowData, int32_t offset, int32_t forwardStep, TSKEY* tsCol,
                      int32_t numOfTotal, int32_t numOfOutput, int32_t order) {
  for (int32_t k = 0; k < numOfOutput; ++k) {
    SqlFunctionCtx* pFunc = &pCtx[k];

    // remember the caller-visible input state
    // todo no need this??
    bool    savedAggIsSet = pFunc->input.colDataAggIsSet;
    int32_t savedNumOfRows = pFunc->input.numOfRows;
    int32_t savedStartRow = pFunc->input.startRowIndex;

    pFunc->input.startRowIndex = offset;
    pFunc->input.numOfRows = forwardStep;

    // not a whole block involved in query processing, statistics data can not be used
    // NOTE: the original value of isSet have been changed here
    if (pFunc->input.colDataAggIsSet && forwardStep < numOfTotal) {
      pFunc->input.colDataAggIsSet = false;
    }

    if (fmIsWindowPseudoColumnFunc(pFunc->functionId)) {
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(pFunc);

      // the pseudo column value is written straight into the entry's intermediate buffer
      SColumnInfoData idata = {0};
      idata.info.type = TSDB_DATA_TYPE_BIGINT;
      idata.info.bytes = tDataTypes[TSDB_DATA_TYPE_BIGINT].bytes;
      idata.pData = GET_ROWCELL_INTERBUF(pEntryInfo);

      SScalarParam out = {.columnData = &idata};
      SScalarParam tw = {.numOfRows = 5, .columnData = pTimeWindowData};
      pFunc->sfp.process(&tw, 1, &out);
      pEntryInfo->numOfRes = 1;
      continue;
    }

    if (functionNeedToExecute(pFunc) && pFunc->fpSet.process != NULL) {
      int32_t code = pFunc->fpSet.process(pFunc);
      if (code != TSDB_CODE_SUCCESS) {
        qError("%s apply functions error, code: %s", GET_TASKID(taskInfo), tstrerror(code));
        taskInfo->code = code;
        longjmp(taskInfo->env, code);
      }
    }

    // restore it
    pFunc->input.colDataAggIsSet = savedAggIsSet;
    pFunc->input.startRowIndex = savedStartRow;
    pFunc->input.numOfRows = savedNumOfRows;
  }
}

dengyihao's avatar
dengyihao 已提交
436
// Forward declaration; the definition follows doCreateConstantValColumnInfo().
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                                   int32_t scanFlag, bool createDummyCol);
438

dengyihao's avatar
dengyihao 已提交
439 440
/**
 * Binds a block to the operator's function contexts using the block's statistics.
 *
 * For every expression of the operator this records the scan order and the block's row count in the matching
 * context and passes the context, expression and block to setBlockStatisInfo().
 */
static void doSetInputDataBlockInfo(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock,
                                    int32_t order) {
  for (int32_t idx = 0; idx < pOperator->exprSupp.numOfExprs; ++idx) {
    SqlFunctionCtx* pOne = &pCtx[idx];

    pOne->order = order;
    pOne->input.numOfRows = pBlock->info.rows;

    setBlockStatisInfo(pOne, &pOperator->exprSupp.pExprInfo[idx], pBlock);
  }
}

X
Xiaoyu Wang 已提交
448 449
/**
 * Binds an input block to the operator's function contexts.
 *
 * Blocks that carry pre-computed aggregates (pBlockAgg != NULL) are bound through doSetInputDataBlockInfo();
 * all other blocks go through doSetInputDataBlock(), whose return code is not propagated.
 */
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                       int32_t scanFlag, bool createDummyCol) {
  if (pBlock->pBlockAgg == NULL) {
    doSetInputDataBlock(pOperator, pCtx, pBlock, order, scanFlag, createDummyCol);
    return;
  }

  doSetInputDataBlockInfo(pOperator, pCtx, pBlock, order);
}

L
Liu Jicong 已提交
457 458
/**
 * Materializes a constant function parameter as a column of numOfRows identical values.
 *
 * The column stored at pInput->pData[paramIndex] is created on first use (type and byte width taken from the
 * parameter) and reused afterwards. Values are appended for BIGINT/UBIGINT, DOUBLE and VARCHAR parameters;
 * other parameter types leave the column content untouched.
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the column descriptor or the temporary VARCHAR
 *         buffer cannot be allocated.
 */
static int32_t doCreateConstantValColumnInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t paramIndex,
                                             int32_t numOfRows) {
  SColumnInfoData* pColInfo = NULL;
  if (pInput->pData[paramIndex] == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
    pColInfo->info.type = pFuncParam->param.nType;
    pColInfo->info.bytes = pFuncParam->param.nLen;

    pInput->pData[paramIndex] = pColInfo;
  } else {
    pColInfo = pInput->pData[paramIndex];
  }

  colInfoDataEnsureCapacity(pColInfo, numOfRows);

  int8_t type = pFuncParam->param.nType;
  if (type == TSDB_DATA_TYPE_BIGINT || type == TSDB_DATA_TYPE_UBIGINT) {
    int64_t v = pFuncParam->param.i;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendInt64(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendDouble(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_VARCHAR) {
    // scratch buffer holding the value in var-string layout (header + payload)
    char* tmp = taosMemoryMalloc(pFuncParam->param.nLen + VARSTR_HEADER_SIZE);
    if (tmp == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    STR_WITH_SIZE_TO_VARSTR(tmp, pFuncParam->param.pz, pFuncParam->param.nLen);
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppend(pColInfo, i, tmp, false);
    }

    // The same buffer is appended for every row and colDataAppend() is fed borrowed pointers elsewhere in this
    // file, so the column is assumed to copy the bytes; the scratch buffer was previously leaked on every call.
    taosMemoryFree(tmp);
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
499
/**
 * Binds the columns of pBlock to the input slots of every function context of the operator.
 *
 * Per expression, the context receives the scan order, scan flag, source block, row count and block uid, and
 * its statistics flag is cleared. Then each parameter is bound:
 *  - column parameters point pInput->pData[j] at the block column with the parameter's slot id; for timeline
 *    functions the last parameter is additionally recorded as the primary-timestamp input (pPTS);
 *  - value parameters are materialized as a constant column only when createDummyCol is set and the
 *    expression has exactly one parameter.
 *
 * @return TSDB_CODE_SUCCESS, or the error returned by doCreateConstantValColumnInfo().
 */
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                                   int32_t scanFlag, bool createDummyCol) {
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
    SqlFunctionCtx*       pOne = &pCtx[i];
    SInputColumnInfoData* pInput = &pOne->input;

    pOne->order = order;
    pInput->numOfRows = pBlock->info.rows;

    pOne->pSrcBlock = pBlock;
    pOne->scanFlag = scanFlag;

    pInput->uid = pBlock->info.uid;
    pInput->colDataAggIsSet = false;

    SExprInfo* pOneExpr = &pOperator->exprSupp.pExprInfo[i];
    for (int32_t j = 0; j < pOneExpr->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pOneExpr->base.pParam[j];

      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
        pInput->totalRows = pBlock->info.rows;
        pInput->numOfRows = pBlock->info.rows;
        pInput->startRowIndex = 0;

        // NOTE: the last parameter is the primary timestamp column
        // todo: refactor this
        bool isLastParam = (j == pOneExpr->base.numOfParams - 1);
        if (fmIsTimelineFunc(pOne->functionId) && isLastParam) {
          // in case of merge function, this is not always the ts column data.
          pInput->pPTS = pInput->pData[j];
        }

        ASSERT(pInput->pData[j] != NULL);
        continue;
      }

      if (pFuncParam->type != FUNC_PARAM_TYPE_VALUE) {
        continue;
      }

      // todo avoid case: top(k, 12), 12 is the value parameter.
      // sum(11), 11 is also the value parameter.
      if (!createDummyCol || pOneExpr->base.numOfParams != 1) {
        continue;
      }

      pInput->totalRows = pBlock->info.rows;
      pInput->numOfRows = pBlock->info.rows;
      pInput->startRowIndex = 0;

      int32_t code = doCreateConstantValColumnInfo(pInput, pFuncParam, j, pBlock->info.rows);
      if (code != TSDB_CODE_SUCCESS) {
        return code;
      }
    }
  }

  return TSDB_CODE_SUCCESS;
}

551
/**
 * Runs the `process` callback of every function context of the operator that still needs to execute.
 *
 * Contexts rejected by functionNeedToExecute() and contexts without a `process` callback are skipped.
 *
 * @return TSDB_CODE_SUCCESS, or the first non-success code returned by a callback (also logged via qError).
 */
static int32_t doAggregateImpl(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx) {
  for (int32_t k = 0; k < pOperator->exprSupp.numOfExprs; ++k) {
    SqlFunctionCtx* pOne = &pCtx[k];

    if (!functionNeedToExecute(pOne)) {
      continue;
    }

    // todo add a dummy funtion to avoid process check
    if (pOne->fpSet.process == NULL) {
      continue;
    }

    int32_t code = pOne->fpSet.process(pOne);
    if (code == TSDB_CODE_SUCCESS) {
      continue;
    }

    qError("%s aggregate function error happens, code: %s", GET_TASKID(pOperator->pTaskInfo), tstrerror(code));
    return code;
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
570
/**
 * Points the output of the first N function contexts at the first N columns of pResult, where N is the number
 * of entries in pPseudoList (0 when the list is NULL). Only the list's size is used, not its content.
 */
static void setPseudoOutputColInfo(SSDataBlock* pResult, SqlFunctionCtx* pCtx, SArray* pPseudoList) {
  size_t numOfPseudo = 0;
  if (pPseudoList != NULL) {
    numOfPseudo = taosArrayGetSize(pPseudoList);
  }

  for (int32_t col = 0; col < numOfPseudo; ++col) {
    pCtx[col].pOutput = taosArrayGet(pResult->pDataBlock, col);
  }
}

577
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
X
Xiaoyu Wang 已提交
578
                              int32_t numOfOutput, SArray* pPseudoList) {
H
Haojun Liao 已提交
579
  setPseudoOutputColInfo(pResult, pCtx, pPseudoList);
H
Haojun Liao 已提交
580
  pResult->info.groupId = pSrcBlock->info.groupId;
H
Haojun Liao 已提交
581

582 583
  // if the source equals to the destination, it is to create a new column as the result of scalar
  // function or some operators.
584 585
  bool createNewColModel = (pResult == pSrcBlock);

586 587
  int32_t numOfRows = 0;

588
  for (int32_t k = 0; k < numOfOutput; ++k) {
589 590
    int32_t               outputSlotId = pExpr[k].base.resSchema.slotId;
    SqlFunctionCtx*       pfCtx = &pCtx[k];
591
    SInputColumnInfoData* pInputData = &pfCtx->input;
592

L
Liu Jicong 已提交
593
    if (pExpr[k].pExpr->nodeType == QUERY_NODE_COLUMN) {  // it is a project query
594
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
595
      if (pResult->info.rows > 0 && !createNewColModel) {
596 597
        colDataMergeCol(pColInfoData, pResult->info.rows, &pResult->info.capacity, pInputData->pData[0],
                        pInputData->numOfRows);
598
      } else {
599
        colDataAssign(pColInfoData, pInputData->pData[0], pInputData->numOfRows, &pResult->info);
600
      }
601

602
      numOfRows = pInputData->numOfRows;
603
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE) {
604
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
605

dengyihao's avatar
dengyihao 已提交
606
      int32_t offset = createNewColModel ? 0 : pResult->info.rows;
607 608 609 610 611 612 613 614

      int32_t type = pExpr[k].base.pParam[0].param.nType;
      if (TSDB_DATA_TYPE_NULL == type) {
        colDataAppendNNULL(pColInfoData, offset, pSrcBlock->info.rows);
      } else {
        for (int32_t i = 0; i < pSrcBlock->info.rows; ++i) {
          colDataAppend(pColInfoData, i + offset, taosVariantGet(&pExpr[k].base.pParam[0].param, type), false);
        }
615
      }
616 617

      numOfRows = pSrcBlock->info.rows;
H
Haojun Liao 已提交
618
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_OPERATOR) {
619 620 621
      SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
      taosArrayPush(pBlockList, &pSrcBlock);

622
      SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
623
      SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
624

625
      SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
626
      int32_t      code = scalarCalculate(pExpr[k].pExpr->_optrRoot.pRootNode, pBlockList, &dest);
627 628 629 630
      if (code != TSDB_CODE_SUCCESS) {
        taosArrayDestroy(pBlockList);
        return code;
      }
631

dengyihao's avatar
dengyihao 已提交
632
      int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
633
      ASSERT(pResult->info.capacity > 0);
634
      colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
635 636
      colDataDestroy(&idata);
      
637
      numOfRows = dest.numOfRows;
638 639
      taosArrayDestroy(pBlockList);
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_FUNCTION) {
640 641
      // _rowts/_c0, not tbname column
      if (fmIsPseudoColumnFunc(pfCtx->functionId) && (!fmIsScanPseudoColumnFunc(pfCtx->functionId))) {
H
Haojun Liao 已提交
642
        // do nothing
643
      } else if (fmIsIndefiniteRowsFunc(pfCtx->functionId)) {
644 645
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pfCtx);
        pfCtx->fpSet.init(pfCtx, pResInfo);
646 647 648 649 650 651 652 653 654 655 656

        pfCtx->pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
        pfCtx->offset = createNewColModel ? 0 : pResult->info.rows;  // set the start offset

        // set the timestamp(_rowts) output buffer
        if (taosArrayGetSize(pPseudoList) > 0) {
          int32_t* outputColIndex = taosArrayGet(pPseudoList, 0);
          pfCtx->pTsOutput = (SColumnInfoData*)pCtx[*outputColIndex].pOutput;
        }

        numOfRows = pfCtx->fpSet.process(pfCtx);
H
Haojun Liao 已提交
657
      } else if (fmIsAggFunc(pfCtx->functionId)) {
658 659
        // _group_key function for "partition by tbname" + csum(col_name) query
        SColumnInfoData* pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
660
        int32_t          slotId = pfCtx->param[0].pCol->slotId;
661 662 663

        // todo handle the json tag
        SColumnInfoData* pInput = taosArrayGet(pSrcBlock->pDataBlock, slotId);
664
        for (int32_t f = 0; f < pSrcBlock->info.rows; ++f) {
665 666 667 668 669 670 671 672 673
          bool isNull = colDataIsNull_s(pInput, f);
          if (isNull) {
            colDataAppendNULL(pOutput, pResult->info.rows + f);
          } else {
            char* data = colDataGetData(pInput, f);
            colDataAppend(pOutput, pResult->info.rows + f, data, isNull);
          }
        }

H
Haojun Liao 已提交
674 675 676
      } else {
        SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
        taosArrayPush(pBlockList, &pSrcBlock);
G
Ganlin Zhao 已提交
677

678
        SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
679
        SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
H
Haojun Liao 已提交
680

681
        SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
682
        int32_t      code = scalarCalculate((SNode*)pExpr[k].pExpr->_function.pFunctNode, pBlockList, &dest);
683 684 685 686
        if (code != TSDB_CODE_SUCCESS) {
          taosArrayDestroy(pBlockList);
          return code;
        }
687

dengyihao's avatar
dengyihao 已提交
688
        int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
689
        ASSERT(pResult->info.capacity > 0);
690
        colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
691
        colDataDestroy(&idata);
692 693

        numOfRows = dest.numOfRows;
H
Haojun Liao 已提交
694 695
        taosArrayDestroy(pBlockList);
      }
696
    } else {
697
      ASSERT(0);
698 699
    }
  }
700

701 702 703
  if (!createNewColModel) {
    pResult->info.rows += numOfRows;
  }
704 705

  return TSDB_CODE_SUCCESS;
706 707
}

5
54liuyao 已提交
708
/**
 * Decides whether the function bound to pCtx has to be evaluated for the current input.
 *
 * @return false when the context has no function (functionId == -1); during a REPEAT_SCAN the answer of
 *         fmIsRepeatScanFunc(); otherwise true unless the context's result entry is already completed.
 */
bool functionNeedToExecute(SqlFunctionCtx* pCtx) {
  struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);

  // in case of timestamp column, always generated results.
  if (pCtx->functionId == -1) {
    return false;
  }

  if (pCtx->scanFlag == REPEAT_SCAN) {
    return fmIsRepeatScanFunc(pCtx->functionId);
  }

  return isRowEntryCompleted(pResInfo) ? false : true;
}

728 729 730 731 732 733 734
/*
 * Build synthetic block statistics for a constant-value function parameter.
 *
 * Lazily allocates pInput->pData[paramIndex] (only the type and byte width of the column info are set) and
 * pInput->pColumnDataAgg[paramIndex], then fills the aggregate as if the constant were a column holding the
 * same value in each of the numOfRows rows.
 *
 * type must not be a variable-length type. BIGINT, DOUBLE and BOOL are filled in, TIMESTAMP leaves the
 * aggregate untouched, and any other type trips ASSERT(0).
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when an allocation fails.
 */
static int32_t doCreateConstantValColumnAggInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t type,
                                                int32_t paramIndex, int32_t numOfRows) {
  if (pInput->pData[paramIndex] == NULL) {
    pInput->pData[paramIndex] = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pInput->pData[paramIndex] == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
    pInput->pData[paramIndex]->info.type = type;
    pInput->pData[paramIndex]->info.bytes = tDataTypes[type].bytes;
  }

  SColumnDataAgg* da = pInput->pColumnDataAgg[paramIndex];
  if (da == NULL) {
    da = taosMemoryCalloc(1, sizeof(SColumnDataAgg));
    pInput->pColumnDataAgg[paramIndex] = da;
    if (da == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  ASSERT(!IS_VAR_DATA_TYPE(type));

  if (type == TSDB_DATA_TYPE_BIGINT) {
    int64_t v = pFuncParam->param.i;
    *da = (SColumnDataAgg){.numOfNull = 0, .min = v, .max = v, .sum = v * numOfRows};
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
    *da = (SColumnDataAgg){.numOfNull = 0};

    // the double value is stored in place inside the aggregate fields
    *(double*)&da->min = v;
    *(double*)&da->max = v;
    *(double*)&da->sum = v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_BOOL) {  // todo validate this data type
    bool v = pFuncParam->param.i;

    *da = (SColumnDataAgg){.numOfNull = 0};
    // every row holds the same constant, so min and max are both v
    *(bool*)&da->min = v;
    *(bool*)&da->max = v;
    // keep the full row count in the sum instead of collapsing it to a single bool
    da->sum = (int64_t)v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_TIMESTAMP) {
    // do nothing
  } else {
    ASSERT(0);
  }

  return TSDB_CODE_SUCCESS;
}
779 780 781 782 783 784 785 786 787 788 789

/*
 * Attach the pre-computed block statistics of pBlock to the input descriptor of pCtx.
 *
 * The row counters of pCtx->input are always refreshed from pBlock->info.rows. When the block carries
 * statistics (pBlock->pBlockAgg != NULL), each function parameter is wired up:
 *   - column parameters take the aggregate of their slot and the matching column info;
 *   - constant parameters get a synthetic aggregate from doCreateConstantValColumnAggInfo().
 * colDataAggIsSet ends up false when the block has no statistics, when a column has no aggregate, or when
 * the synthetic aggregate for a constant could not be created.
 */
void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, SSDataBlock* pBlock) {
  int32_t numOfRows = pBlock->info.rows;

  SInputColumnInfoData* pInput = &pCtx->input;
  pInput->numOfRows = numOfRows;
  pInput->totalRows = numOfRows;

  if (pBlock->pBlockAgg != NULL) {
    pInput->colDataAggIsSet = true;

    for (int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pExprInfo->base.pParam[j];

      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
        pInput->pColumnDataAgg[j] = pBlock->pBlockAgg[slotId];
        if (pInput->pColumnDataAgg[j] == NULL) {
          pInput->colDataAggIsSet = false;
        }

        // Here we set the column info data since the data type for each column data is required, but
        // the data in the corresponding SColumnInfoData will not be used.
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
      } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
        int32_t code = doCreateConstantValColumnAggInfo(pInput, pFuncParam, pFuncParam->param.nType, j, numOfRows);
        if (code != TSDB_CODE_SUCCESS) {
          // no usable aggregate for this parameter: do not advertise the statistics as available
          pInput->colDataAggIsSet = false;
        }
      }
    }
  } else {
    pInput->colDataAggIsSet = false;
  }

  // set the statistics data for primary time stamp column
  //  if (pCtx->functionId == FUNCTION_SPREAD && pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
  //    pCtx->isAggSet = true;
  //    pCtx->agg.min = pBlock->info.window.skey;
  //    pCtx->agg.max = pBlock->info.window.ekey;
  //  }
}

L
Liu Jicong 已提交
819
/*
 * Report whether the task has been cancelled.
 *
 * A task counts as killed once its result code equals TSDB_CODE_TSC_QUERY_CANCELLED, which is the value
 * setTaskKilled() stores. The idle-timeout check is kept for its sanity assert only; aborting on timeout
 * is still disabled (the return statement inside it remains commented out).
 */
bool isTaskKilled(SExecTaskInfo* pTaskInfo) {
  // an explicit cancellation request always wins
  if (pTaskInfo->code == TSDB_CODE_TSC_QUERY_CANCELLED) {
    return true;
  }

  // query has been executed more than tsShellActivityTimer, and the retrieve has not arrived
  // abort current query execution.
  if (pTaskInfo->owner != 0 &&
      ((taosGetTimestampSec() - pTaskInfo->cost.start / 1000) > 10 * getMaximumIdleDurationSec())
      /*(!needBuildResAfterQueryComplete(pTaskInfo))*/) {
    assert(pTaskInfo->cost.start != 0);
    //    qDebug("QInfo:%" PRIu64 " retrieve not arrive beyond %d ms, abort current query execution, start:%" PRId64
    //           ", current:%d", pQInfo->qId, 1, pQInfo->startExecTs, taosGetTimestampSec());
    //    return true;
  }

  return false;
}

L
Liu Jicong 已提交
834
/* Mark the task as cancelled by storing TSDB_CODE_TSC_QUERY_CANCELLED in its result code. */
void setTaskKilled(SExecTaskInfo* pTaskInfo) {
  pTaskInfo->code = TSDB_CODE_TSC_QUERY_CANCELLED;
}
835 836

/////////////////////////////////////////////////////////////////////////////////////////////
L
Liu Jicong 已提交
837
// todo refactor : return window
838
void getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key, STimeWindow* win) {
H
Haojun Liao 已提交
839
  win->skey = taosTimeTruncate(key, pInterval, precision);
840 841

  /*
H
Haojun Liao 已提交
842
   * if the realSkey > INT64_MAX - pInterval->interval, the query duration between
843 844
   * realSkey and realEkey must be less than one interval.Therefore, no need to adjust the query ranges.
   */
845 846
  win->ekey = taosTimeAdd(win->skey, pInterval->interval, pInterval->intervalUnit, precision) - 1;
  if (win->ekey < win->skey) {
847 848 849 850
    win->ekey = INT64_MAX;
  }
}

851
#if 0
/*
 * (disabled) Refine a block load decision from the set of output functions.
 *
 * BLK_DATA_DATA_LOAD and BLK_DATA_FILTEROUT are returned unchanged. A BLK_DATA_NOT_LOAD status is upgraded
 * when a FIRST_DST/LAST_DST function is present: to BLK_DATA_FILTEROUT if those are the only relevant
 * functions, otherwise to BLK_DATA_DATA_LOAD. TS/TAG (and their dummy variants) are ignored.
 */
static int32_t updateBlockLoadStatus(STaskAttr* pQuery, int32_t status) {
  if (status == BLK_DATA_DATA_LOAD || status == BLK_DATA_FILTEROUT) {
    return status;
  }

  bool seenFirstLast = false;
  bool seenOther = false;

  for (int32_t idx = 0; idx < pQuery->numOfOutput; ++idx) {
    int32_t fid = getExprFunctionId(&pQuery->pExpr1[idx]);

    bool isTsOrTag = (fid == FUNCTION_TS || fid == FUNCTION_TS_DUMMY || fid == FUNCTION_TAG ||
                      fid == FUNCTION_TAG_DUMMY);
    if (isTsOrTag) {
      continue;
    }

    if (fid == FUNCTION_FIRST_DST || fid == FUNCTION_LAST_DST) {
      seenFirstLast = true;
    } else {
      seenOther = true;
    }
  }

  if (!seenFirstLast || status != BLK_DATA_NOT_LOAD) {
    return status;
  }

  return seenOther ? BLK_DATA_DATA_LOAD : BLK_DATA_FILTEROUT;
}

#endif

L
Liu Jicong 已提交
890 891
// static void updateDataCheckOrder(SQInfo *pQInfo, SQueryTableReq* pQueryMsg, bool stableQuery) {
//   STaskAttr* pQueryAttr = pQInfo->runtimeEnv.pQueryAttr;
//
//   // in case of point-interpolation query, use asc order scan
//   char msg[] = "QInfo:0x%"PRIx64" scan order changed for %s query, old:%d, new:%d, qrange exchanged, old qrange:%"
//   PRId64
//                "-%" PRId64 ", new qrange:%" PRId64 "-%" PRId64;
//
//   // todo handle the case where the order irrelevant query type is mixed up with order critical query type
//   // descending order query for last_row query
//   if (isFirstLastRowQuery(pQueryAttr)) {
//     //qDebug("QInfo:0x%"PRIx64" scan order changed for last_row query, old:%d, new:%d", pQInfo->qId,
//     pQueryAttr->order.order, TSDB_ORDER_ASC);
//
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
//     }
//
//     pQueryAttr->needReverseScan = false;
//     return;
//   }
//
//   if (pQueryAttr->groupbyColumn && pQueryAttr->order.order == TSDB_ORDER_DESC) {
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
//     }
//
//     pQueryAttr->needReverseScan = false;
//     doUpdateLastKey(pQueryAttr);
//     return;
//   }
//
//   if (pQueryAttr->pointInterpQuery && pQueryAttr->interval.interval == 0) {
//     if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       //qDebug(msg, pQInfo->qId, "interp", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey); TSWAP(pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, TSKEY);
//     }
//
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     return;
//   }
//
//   if (pQueryAttr->interval.interval == 0) {
//     if (onlyFirstQuery(pQueryAttr)) {
//       if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//         //qDebug(msg, pQInfo->qId, "only-first", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_ASC;
//      pQueryAttr->needReverseScan = false;
//    } else if (onlyLastQuery(pQueryAttr) && notContainSessionOrStateWindow(pQueryAttr)) {
//      if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//        //qDebug(msg, pQInfo->qId, "only-last", pQueryAttr->order.order, TSDB_ORDER_DESC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_DESC;
//      pQueryAttr->needReverseScan = false;
//    }
//
//  } else {  // interval query
//    if (stableQuery) {
//      if (onlyFirstQuery(pQueryAttr)) {
//        if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-first stable", pQueryAttr->order.order, TSDB_ORDER_ASC,
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
//
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_ASC;
//        pQueryAttr->needReverseScan = false;
//      } else if (onlyLastQuery(pQueryAttr)) {
//        if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-last stable", pQueryAttr->order.order, TSDB_ORDER_DESC,
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
//
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_DESC;
//        pQueryAttr->needReverseScan = false;
//      }
//    }
//  }
//}
990

L
Liu Jicong 已提交
991 992 993
// static FORCE_INLINE bool doFilterByBlockStatistics(STaskRuntimeEnv* pRuntimeEnv, SDataStatis *pDataStatis,
// SqlFunctionCtx *pCtx, int32_t numOfRows) {
//   STaskAttr* pQueryAttr = pRuntimeEnv->pQueryAttr;
//
//   if (pDataStatis == NULL || pQueryAttr->pFilters == NULL) {
//     return true;
//   }
//
//   return filterRangeExecute(pQueryAttr->pFilters, pDataStatis, pQueryAttr->numOfCols, numOfRows);
// }
1001
#if 0
/*
 * (disabled) Check whether a data block overlaps a boundary of the query time windows.
 *
 * The calls that position and advance the window (getAlignQueryTimeWindow / getNextTimeWindow) are
 * commented out, so `win` is never moved from its zero initial value in this version.
 */
static bool overlapWithTimeWindow(STaskAttr* pQueryAttr, SDataBlockInfo* pBlockInfo) {
  STimeWindow win = {0};

  TSKEY sk = TMIN(pQueryAttr->window.skey, pQueryAttr->window.ekey);
  TSKEY ek = TMAX(pQueryAttr->window.skey, pQueryAttr->window.ekey);

  if (true) {
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.skey, sk, ek, &w);
    assert(win.ekey >= pBlockInfo->window.skey);

    if (win.ekey < pBlockInfo->window.ekey) {
      return true;
    }

    for (;;) {
      //      getNextTimeWindow(pQueryAttr, &w);
      if (win.skey > pBlockInfo->window.ekey) {
        break;
      }

      assert(win.ekey > pBlockInfo->window.ekey);
      if (win.skey <= pBlockInfo->window.ekey && win.skey > pBlockInfo->window.skey) {
        return true;
      }
    }
  } else {
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.ekey, sk, ek, &w);
    assert(win.skey <= pBlockInfo->window.ekey);

    if (win.skey > pBlockInfo->window.skey) {
      return true;
    }

    for (;;) {
      //      getNextTimeWindow(pQueryAttr, &w);
      if (win.ekey < pBlockInfo->window.skey) {
        break;
      }

      assert(win.skey < pBlockInfo->window.skey);
      if (win.ekey < pBlockInfo->window.ekey && win.ekey >= pBlockInfo->window.skey) {
        return true;
      }
    }
  }

  return false;
}
#endif
1051 1052

/*
 * Block-level load decision based on the time window of the block.
 *
 * The real implementation is compiled out; the function currently always returns 0.
 */
static uint32_t doFilterByBlockTimeWindow(STableScanInfo* pTableScanInfo, SSDataBlock* pBlock) {
#if 0
  SqlFunctionCtx* pCtx = pTableScanInfo->pCtx;
  uint32_t        loadStatus = BLK_DATA_NOT_LOAD;

  int32_t numOfOutput = 0;  // pTableScanInfo->numOfOutput;
  for (int32_t idx = 0; idx < numOfOutput; ++idx) {
    int32_t functionId = pCtx[idx].functionId;
    int32_t colId = pTableScanInfo->pExpr[idx].base.pParam[0].pCol->colId;

    // group by + first/last should not apply the first/last block filter
    if (functionId < 0) {
      return loadStatus | BLK_DATA_DATA_LOAD;
    }

    //      status |= aAggs[functionId].dataReqFunc(&pTableScanInfo->pCtx[i], &pBlock->info.window, colId);
    //      if ((status & BLK_DATA_DATA_LOAD) == BLK_DATA_DATA_LOAD) {
    //        return status;
    //      }
  }

  return loadStatus;
#endif
  return 0;
}

L
Liu Jicong 已提交
1079 1080
/*
 * Decide how much of a data block has to be loaded for the current scan.
 *
 * The decision logic is compiled out (see the #if 0 region). In its current form the function only
 *   - sets *status to BLK_DATA_NOT_LOAD,
 *   - overwrites pBlock->pDataBlock and pBlock->pBlockAgg with NULL (the previous pointers are not freed here),
 *   - returns TSDB_CODE_SUCCESS.
 * pTaskInfo and pTableScanInfo are only referenced by the disabled code.
 */
int32_t loadDataBlockOnDemand(SExecTaskInfo* pTaskInfo, STableScanInfo* pTableScanInfo, SSDataBlock* pBlock,
                              uint32_t* status) {
  *status = BLK_DATA_NOT_LOAD;

  pBlock->pDataBlock = NULL;
  pBlock->pBlockAgg = NULL;

  //  int64_t groupId = pRuntimeEnv->current->groupIndex;
  //  bool    ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);

//  pCost->totalBlocks += 1;
//  pCost->totalRows += pBlock->info.rows;
#if 0
  // only the disabled logic below updates the cost counters
  STaskCostInfo* pCost = &pTaskInfo->cost;

  // Calculate all time windows that are overlapping or contain current data block.
  // If current data block is contained by all possible time window, do not load current data block.
  if (/*pQueryAttr->pFilters || */pQueryAttr->groupbyColumn || pQueryAttr->sw.gap > 0 ||
      (QUERY_IS_INTERVAL_QUERY(pQueryAttr) && overlapWithTimeWindow(pTaskInfo, &pBlock->info))) {
    (*status) = BLK_DATA_DATA_LOAD;
  }

  // check if this data block is required to load
  if ((*status) != BLK_DATA_DATA_LOAD) {
    bool needFilter = true;

    // the pCtx[i] result is belonged to previous time window since the outputBuf has not been set yet,
    // the filter result may be incorrect. So in case of interval query, we need to set the correct time output buffer
    if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
      SResultRow* pResult = NULL;

      bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
      TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

      STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
      if (pQueryAttr->pointInterpQuery) {
        needFilter = chkWindowOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
                                    pTableScanInfo->rowEntryInfoOffset);
      } else {
        if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
                                    pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
          longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
        }
      }
    } else if (pQueryAttr->stableQuery && (!pQueryAttr->tsCompQuery) && (!pQueryAttr->diffQuery)) { // stable aggregate, not interval aggregate or normal column aggregate
      doSetTableGroupOutputBuf(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pTableScanInfo->pCtx,
                               pTableScanInfo->rowEntryInfoOffset, pTableScanInfo->numOfOutput,
                               pRuntimeEnv->current->groupIndex);
    }

    if (needFilter) {
      (*status) = doFilterByBlockTimeWindow(pTableScanInfo, pBlock);
    } else {
      (*status) = BLK_DATA_DATA_LOAD;
    }
  }

  SDataBlockInfo* pBlockInfo = &pBlock->info;
//  *status = updateBlockLoadStatus(pRuntimeEnv->pQueryAttr, *status);

  if ((*status) == BLK_DATA_NOT_LOAD || (*status) == BLK_DATA_FILTEROUT) {
    //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//           pBlockInfo->window.ekey, pBlockInfo->rows);
    pCost->skipBlocks += 1;
  } else if ((*status) == BLK_DATA_SMA_LOAD) {
    // this function never returns error?
    pCost->loadBlockStatis += 1;
//    tsdbRetrieveDatablockSMA(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);

    if (pBlock->pBlockAgg == NULL) {  // data block statistics does not exist, load data block
//      pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
      pCost->totalCheckedRows += pBlock->info.rows;
    }
  } else {
    assert((*status) == BLK_DATA_DATA_LOAD);

    // load the data block statistics to perform further filter
    pCost->loadBlockStatis += 1;
//    tsdbRetrieveDatablockSMA(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);

    if (pQueryAttr->topBotQuery && pBlock->pBlockAgg != NULL) {
      { // set previous window
        if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
          SResultRow* pResult = NULL;

          bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
          TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

          STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
          if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                      pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
                                      pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
            longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
          }
        }
      }
      bool load = false;
      for (int32_t i = 0; i < pQueryAttr->numOfOutput; ++i) {
        int32_t functionId = pTableScanInfo->pCtx[i].functionId;
        if (functionId == FUNCTION_TOP || functionId == FUNCTION_BOTTOM) {
//          load = topbot_datablock_filter(&pTableScanInfo->pCtx[i], (char*)&(pBlock->pBlockAgg[i].min),
//                                         (char*)&(pBlock->pBlockAgg[i].max));
          if (!load) { // current block has been discard due to filter applied
            pCost->skipBlocks += 1;
            //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId,
//                   pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
            (*status) = BLK_DATA_FILTEROUT;
            return TSDB_CODE_SUCCESS;
          }
        }
      }
    }

    // current block has been discard due to filter applied
//    if (!doFilterByBlockStatistics(pRuntimeEnv, pBlock->pBlockAgg, pTableScanInfo->pCtx, pBlockInfo->rows)) {
//      pCost->skipBlocks += 1;
//      qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//             pBlockInfo->window.ekey, pBlockInfo->rows);
//      (*status) = BLK_DATA_FILTEROUT;
//      return TSDB_CODE_SUCCESS;
//    }

    pCost->totalCheckedRows += pBlockInfo->rows;
    pCost->loadBlocks += 1;
//    pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
//    if (pBlock->pDataBlock == NULL) {
//      return terrno;
//    }

//    if (pQueryAttr->pFilters != NULL) {
//      filterSetColFieldData(pQueryAttr->pFilters, taosArrayGetSize(pBlock->pDataBlock), pBlock->pDataBlock);
//    }

//    if (pQueryAttr->pFilters != NULL || pRuntimeEnv->pTsBuf != NULL) {
//      filterColRowsInDataBlock(pRuntimeEnv, pBlock, ascQuery);
//    }
  }
#endif
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1222
/*
 * Currently a no-op: the former body is kept below as comments only.
 * A NULL pTableQueryInfo is accepted.
 */
static void updateTableQueryInfoForReverseScan(STableQueryInfo* pTableQueryInfo) {
  if (!pTableQueryInfo) {
    return;
  }

  //  TSWAP(pTableQueryInfo->win.skey, pTableQueryInfo->win.ekey);
  //  pTableQueryInfo->lastKey = pTableQueryInfo->win.skey;

  //  SWITCH_ORDER(pTableQueryInfo->cur.order);
  //  pTableQueryInfo->cur.vgroupIndex = -1;

  // set the index to be the end slot of result rows array
  //  SResultRowInfo* pResultRowInfo = &pTableQueryInfo->resInfo;
  //  if (pResultRowInfo->size > 0) {
  //    pResultRowInfo->curPos = pResultRowInfo->size - 1;
  //  } else {
  //    pResultRowInfo->curPos = -1;
  //  }
}

H
Haojun Liao 已提交
1242
/* Currently a no-op: the only statement of the body is commented out. */
void initResultRow(SResultRow* pResultRow) {
  (void)pResultRow;
  //  pResultRow->pEntryInfo = (struct SResultRowEntryInfo*)((char*)pResultRow + sizeof(SResultRow));
}

/*
 * The start of each column's SResultRowEntryInfo is denoted by RowCellInfoOffset.
 * Note that in case of a top/bottom query, the multiple rows of the result are treated as a single result row.
 * +------------+-----------------result column 1------------+------------------result column 2-----------+
 * | SResultRow | SResultRowEntryInfo | intermediate buffer1 | SResultRowEntryInfo | intermediate buffer 2|
 * +------------+--------------------------------------------+--------------------------------------------+
 *           offset[0]                                  offset[1]                                   offset[2]
 */
1254
// TODO refactor: some function move away
L
Liu Jicong 已提交
1255 1256 1257
void setFunctionResultOutput(SOperatorInfo* pOperator, SOptrBasicInfo* pInfo, SAggSupporter* pSup, int32_t stage,
                             int32_t numOfExprs) {
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
1258 1259
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;
H
Haojun Liao 已提交
1260

H
Haojun Liao 已提交
1261
  SResultRowInfo* pResultRowInfo = &pInfo->resultRowInfo;
1262
  initResultRowInfo(pResultRowInfo);
H
Haojun Liao 已提交
1263

L
Liu Jicong 已提交
1264 1265
  int64_t     tid = 0;
  int64_t     groupId = 0;
1266 1267
  SResultRow* pRow = doSetResultOutBufByKey(pSup->pResultBuf, pResultRowInfo, (char*)&tid, sizeof(tid), true, groupId,
                                            pTaskInfo, false, pSup);
H
Haojun Liao 已提交
1268

1269
  for (int32_t i = 0; i < numOfExprs; ++i) {
1270
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, i, rowEntryInfoOffset);
H
Haojun Liao 已提交
1271 1272
    cleanupResultRowEntry(pEntry);

L
Liu Jicong 已提交
1273
    pCtx[i].resultInfo = pEntry;
1274
    pCtx[i].scanFlag = stage;
H
Haojun Liao 已提交
1275 1276
  }

1277
  initCtxOutputBuffer(pCtx, numOfExprs);
H
Haojun Liao 已提交
1278 1279
}

H
Haojun Liao 已提交
1280
/*
 * Run the init callback of every function context that still needs it.
 *
 * A context is skipped when its result entry is already initialized, when its function is a pseudo-column
 * or scalar function, or when its function id is -1.
 */
void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size) {
  for (int32_t idx = 0; idx < size; ++idx) {
    SqlFunctionCtx* pOne = &pCtx[idx];

    if (isRowEntryInitialized(GET_RES_INFO(pOne))) {
      continue;
    }

    if (fmIsPseudoColumnFunc(pOne->functionId) || pOne->functionId == -1 || fmIsScalarFunc(pOne->functionId)) {
      continue;
    }

    pOne->fpSet.init(pOne, pOne->resultInfo);
  }
}

L
Liu Jicong 已提交
1292
/*
 * Update the status flags of a task.
 *
 * TASK_NOT_COMPLETED replaces the whole status. Any other value is OR-ed into the status after the
 * TASK_NOT_COMPLETED flag has been cleared.
 */
void setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status) {
  if (status != TASK_NOT_COMPLETED) {
    // TASK_NOT_COMPLETED is not compatible with any other status, so clear it before adding the new one
    CLEAR_QUERY_STATUS(pTaskInfo, TASK_NOT_COMPLETED);
    pTaskInfo->status |= status;
    return;
  }

  pTaskInfo->status = status;
}

L
Liu Jicong 已提交
1302
/*
 * Currently a no-op: both cleanup calls are commented out.
 * A NULL pTableQueryInfo is accepted.
 */
void destroyTableQueryInfoImpl(STableQueryInfo* pTableQueryInfo) {
  if (!pTableQueryInfo) {
    return;
  }

  //  taosVariantDestroy(&pTableQueryInfo->tag);
  //  cleanupResultRowInfo(&pTableQueryInfo->resInfo);
}

1311
/*
 * Point every function context at its entry inside pResult and initialize entries that need it.
 *
 * An entry is left alone when it is both completed and initialized, when the function is a window
 * pseudo-column function, or when the entry is already flagged as initialized. Otherwise the init callback
 * of the function runs, except for function id -1 where the entry is only flagged as initialized.
 */
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowEntryInfoOffset) {
  for (int32_t idx = 0; idx < numOfOutput; ++idx) {
    SqlFunctionCtx* pOne = &pCtx[idx];
    pOne->resultInfo = getResultEntryInfo(pResult, idx, rowEntryInfoOffset);

    struct SResultRowEntryInfo* pEntry = pOne->resultInfo;

    bool alreadyDone = isRowEntryCompleted(pEntry) && isRowEntryInitialized(pEntry);
    if (alreadyDone || fmIsWindowPseudoColumnFunc(pOne->functionId) || pEntry->initialized) {
      continue;
    }

    if (pOne->functionId == -1) {
      pEntry->initialized = true;
    } else {
      pOne->fpSet.init(pOne, pEntry);
    }
  }
}

H
Haojun Liao 已提交
1334
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep);
1335

1336
/*
 * Apply the filter condition pFilterNode to pBlock in place.
 *
 * A NULL filter node leaves the block untouched. Otherwise a filter is built from the node, bound to the
 * columns of the block and executed; the per-row result is handed to extractQualifiedTupleByFilterResult(),
 * after which the timestamp window of the block is refreshed and the row-result buffer is released.
 */
void doFilter(const SNode* pFilterNode, SSDataBlock* pBlock) {
  if (pFilterNode == NULL) {
    return;
  }

  // todo move to the initialization function
  // NOTE(review): the status codes returned by the two setup calls below are not checked.
  SFilterInfo* pFilterInfo = NULL;
  (void)filterInitFromNode((SNode*)pFilterNode, &pFilterInfo, 0);

  size_t             colCount = taosArrayGetSize(pBlock->pDataBlock);
  SFilterColumnParam colParam = {.numOfCols = colCount, .pDataBlock = pBlock->pDataBlock};
  (void)filterSetDataFromSlotId(pFilterInfo, &colParam);

  // todo the keep seems never to be True??
  int8_t* pRowFlags = NULL;
  bool    keepAll = filterExecute(pFilterInfo, pBlock, &pRowFlags, NULL, colParam.numOfCols);
  filterFreeInfo(pFilterInfo);

  extractQualifiedTupleByFilterResult(pBlock, pRowFlags, keepAll);
  blockDataUpdateTsWindow(pBlock, 0);

  taosMemoryFree(pRowFlags);
}

H
Haojun Liao 已提交
1362
/*
 * Compact pBlock so that only the rows accepted by a filter remain.
 *
 *   keep   - when true the block is left untouched.
 *   rowRes - one flag per row of the block; rows whose flag is 0 are dropped. When rowRes is NULL (and keep
 *            is false) the block is emptied by setting its row count to 0.
 *
 * The surviving rows are copied column by column from a temporary copy of the block. Columns without a
 * data buffer (reserved for scalar functions) are skipped. pBlock->info.rows is set to the number of
 * surviving rows, and every processed column is asserted to yield the same count.
 */
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep) {
  if (keep) {
    return;
  }

  if (rowRes == NULL) {
    // no per-row result available: nothing qualifies
    pBlock->info.rows = 0;
    return;
  }

  int32_t      totalRows = pBlock->info.rows;
  SSDataBlock* px = createOneDataBlock(pBlock, true);

  int32_t numOfCols = (int32_t)taosArrayGetSize(pBlock->pDataBlock);
  for (int32_t i = 0; i < numOfCols; ++i) {
    SColumnInfoData* pSrc = taosArrayGet(px->pDataBlock, i);
    SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, i);
    // it is a reserved column for scalar function, and no data in this column yet.
    if (pDst->pData == NULL || pSrc->pData == NULL) {
      continue;
    }

    // reset the column over the original row range; pBlock->info.rows may already have been shrunk
    // by a previously processed column
    colInfoDataCleanup(pDst, totalRows);

    int32_t numOfRows = 0;
    for (int32_t j = 0; j < totalRows; ++j) {
      if (rowRes[j] == 0) {
        continue;
      }

      if (colDataIsNull_s(pSrc, j)) {
        colDataAppendNULL(pDst, numOfRows);
      } else {
        colDataAppend(pDst, numOfRows, colDataGetData(pSrc, j), false);
      }
      numOfRows += 1;
    }

    // the first processed column fixes the new row count, the others must agree with it
    if (pBlock->info.rows == totalRows) {
      pBlock->info.rows = numOfRows;
    } else {
      ASSERT(pBlock->info.rows == numOfRows);
    }
  }

  blockDataDestroy(px);  // fix memory leak
}

L
Liu Jicong 已提交
1410 1411
/*
 * Select the result row of groupId as the output target of the operator's function contexts.
 *
 * For a simple group-by query without interval, all the tables belong to one group result. The row is
 * looked up in the aggregate result buffer keyed by groupId; if it has no page yet (pageId == -1) a new
 * window result buffer is added first. When that fails the function returns without touching the contexts.
 */
void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                              uint64_t groupId) {
  SExecTaskInfo*  pTask = pOperator->pTaskInfo;
  SqlFunctionCtx* pCtxList = pOperator->exprSupp.pCtx;
  int32_t*        pEntryOffsets = pOperator->exprSupp.rowEntryInfoOffset;
  SAggSupporter*  pSup = &pAggInfo->aggSup;

  SResultRow* pRow = doSetResultOutBufByKey(pSup->pResultBuf, &pAggInfo->binfo.resultRowInfo, (char*)&groupId,
                                            sizeof(groupId), true, groupId, pTask, false, pSup);
  assert(pRow != NULL);

  /*
   * not assign result buffer yet, add new result buffer
   * all group belong to one result set, and each group result has different group id so set the id to be one
   */
  if (pRow->pageId == -1 &&
      addNewWindowResultBuf(pRow, pSup->pResultBuf, groupId, pAggInfo->binfo.pRes->info.rowSize) !=
          TSDB_CODE_SUCCESS) {
    return;
  }

  setResultRowInitCtx(pRow, pCtxList, numOfOutput, pEntryOffsets);
}

1437
/*
 * Switch the aggregate operator to the output buffer of the given group.
 * Nothing happens when groupId is already the recorded active group.
 */
void setExecutionContext(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId, SAggOperatorInfo* pAggInfo) {
  bool alreadyActive = (pAggInfo->groupId != INT32_MIN) && (pAggInfo->groupId == groupId);
  if (!alreadyActive) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_setbuf, groupId:%" PRIu64, groupId);
#endif
    doSetTableGroupOutputBuf(pOperator, pAggInfo, numOfOutput, groupId);

    // remember which group the contexts are bound to now
    pAggInfo->groupId = groupId;
  }
}

1450 1451
/*
 * Raise pRow->numOfRows to the largest numOfRes found among the initialized
 * result entries of the row. Entries that are not initialized are ignored.
 */
static void doUpdateNumOfRows(SResultRow* pRow, int32_t numOfExprs, const int32_t* rowCellOffset) {
  for (int32_t idx = 0; idx != numOfExprs && idx < numOfExprs; ++idx) {
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, idx, rowCellOffset);

    if (isRowEntryInitialized(pEntry) && pEntry->numOfRes > pRow->numOfRows) {
      pRow->numOfRows = pEntry->numOfRes;
    }
  }
}

1463
int32_t finalizeResultRowIntoResultDataBlock(SDiskbasedBuf* pBuf, SResultRowPosition* resultRowPosition,
S
shenglian zhou 已提交
1464 1465 1466
                                             SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, int32_t numOfExprs,
                                             const int32_t* rowCellOffset, SSDataBlock* pBlock,
                                             SExecTaskInfo* pTaskInfo) {
1467 1468 1469 1470 1471 1472 1473 1474 1475
  SFilePage*  page = getBufPage(pBuf, resultRowPosition->pageId);
  SResultRow* pRow = (SResultRow*)((char*)page + resultRowPosition->offset);

  doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
  if (pRow->numOfRows == 0) {
    releaseBufPage(pBuf, page);
    return 0;
  }

1476 1477 1478 1479 1480 1481 1482
  while (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
    int32_t code = blockDataEnsureCapacity(pBlock, pBlock->info.capacity * 1.25);
    if (TAOS_FAILED(code)) {
      releaseBufPage(pBuf, page);
      qError("%s ensure result data capacity failed, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
      longjmp(pTaskInfo->env, code);
    }
1483 1484 1485 1486 1487
  }

  for (int32_t j = 0; j < numOfExprs; ++j) {
    int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1488
    pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1489 1490 1491 1492 1493 1494 1495 1496 1497
    if (pCtx[j].fpSet.finalize) {
      int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
      if (TAOS_FAILED(code)) {
        qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
        longjmp(pTaskInfo->env, code);
      }
    } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
      // do nothing, todo refactor
    } else {
1498 1499
      // expand the result into multiple rows. E.g., _wstart, top(k, 20)
      // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
1500 1501 1502 1503 1504 1505 1506 1507 1508
      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
      char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
      for (int32_t k = 0; k < pRow->numOfRows; ++k) {
        colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
      }
    }
  }

  releaseBufPage(pBuf, page);
1509
  pBlock->info.rows += pRow->numOfRows;
1510 1511 1512 1513

  return 0;
}

X
Xiaoyu Wang 已提交
1514 1515 1516
/*
 * Copy finalized result rows from the group result list into pBlock, starting at
 * pGroupResInfo->index and advancing that index for every row consumed or skipped.
 *
 * Copying stops when the list is exhausted, when the next row belongs to a different group
 * than the one already in pBlock, or when the next row would not fit into pBlock's capacity.
 * A failing finalize callback releases the buffer page and raises the error through
 * longjmp(pTaskInfo->env, code). Otherwise the function returns 0.
 */
int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo, SDiskbasedBuf* pBuf,
                           SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset, SqlFunctionCtx* pCtx,
                           int32_t numOfExprs) {
  int32_t numOfRows = getNumOfTotalRes(pGroupResInfo);
  int32_t start = pGroupResInfo->index;

  for (int32_t i = start; i < numOfRows; i += 1) {
    SResKeyPos* pPos = taosArrayGetP(pGroupResInfo->pRows, i);
    SFilePage*  page = getBufPage(pBuf, pPos->pos.pageId);
    SResultRow* pRow = (SResultRow*)((char*)page + pPos->pos.offset);

    doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
    if (pRow->numOfRows == 0) {
      // nothing to output for this row, skip it
      pGroupResInfo->index += 1;
      releaseBufPage(pBuf, page);
      continue;
    }

    if (pBlock->info.groupId == 0) {
      pBlock->info.groupId = pPos->groupId;
    } else if (pBlock->info.groupId != pPos->groupId) {
      // current value belongs to different group, it can't be packed into one datablock
      releaseBufPage(pBuf, page);
      break;
    }

    if (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
      releaseBufPage(pBuf, page);
      break;
    }

    pGroupResInfo->index += 1;

    for (int32_t j = 0; j < numOfExprs; ++j) {
      pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);

      if (pCtx[j].fpSet.finalize) {
#ifdef BUF_PAGE_DEBUG
        qDebug("\npage_finalize %d", numOfExprs);
#endif
        int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
        if (TAOS_FAILED(code)) {
          // do not leave the page pinned when bailing out
          releaseBufPage(pBuf, page);
          qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
          longjmp(pTaskInfo->env, code);
        }
      } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
        // do nothing, todo refactor
      } else {
        // expand the result into multiple rows. E.g., _wstart, top(k, 20)
        // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
        int32_t          slotId = pExprInfo[j].base.resSchema.slotId;
        SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
        char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
        if (pCtx[j].increase) {
          // each expanded row gets a value one larger than the previous one
          int64_t ts = *(int64_t*)in;
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, (const char*)&ts, pCtx[j].resultInfo->isNullRes);
            ts++;
          }
        } else {
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
          }
        }
      }
    }

    // pRow lives inside the page, so consume its row count before the page is handed back
    pBlock->info.rows += pRow->numOfRows;
    releaseBufPage(pBuf, page);
  }

  qDebug("%s result generated, rows:%d, groupId:%" PRIu64, GET_TASKID(pTaskInfo), pBlock->info.rows,
         pBlock->info.groupId);
  blockDataUpdateTsWindow(pBlock, 0);
  return 0;
}

X
Xiaoyu Wang 已提交
1597 1598
/*
 * Reset the operator's result block and, if the group result info still holds data,
 * refill the block from it via doCopyToSDataBlock.
 */
void doBuildResultDatablock(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
                            SDiskbasedBuf* pBuf) {
  SExecTaskInfo*  pTask = pOperator->pTaskInfo;
  SExprInfo*      pExprs = pOperator->exprSupp.pExprInfo;
  SqlFunctionCtx* pFuncCtx = pOperator->exprSupp.pCtx;
  int32_t*        pCellOffset = pOperator->exprSupp.rowEntryInfoOffset;
  int32_t         exprCount = pOperator->exprSupp.numOfExprs;
  SSDataBlock*    pResBlock = pbInfo->pRes;

  blockDataCleanup(pResBlock);

  if (hasDataInGroupInfo(pGroupResInfo)) {
    // forget the group id of the previous batch before copying the next one
    pResBlock->info.groupId = 0;
    doCopyToSDataBlock(pTask, pResBlock, pExprs, pBuf, pGroupResInfo, pCellOffset, pFuncCtx, exprCount);
  }
}

L
Liu Jicong 已提交
1617
/*
 * Currently a no-op: the whole implementation is compiled out with "#if 0".
 * The disabled code raised each result row's numOfRows to the maximum numOfRes of its
 * cells, skipping the timestamp and tag functions.
 */
static void updateNumOfRowsInResultRows(SqlFunctionCtx* pCtx, int32_t numOfOutput, SResultRowInfo* pResultRowInfo,
                                        int32_t* rowEntryInfoOffset) {
#if 0
  for (int32_t i = 0; i < pResultRowInfo->size; ++i) {
    SResultRow* pResult = pResultRowInfo->pResult[i];

    for (int32_t j = 0; j < numOfOutput; ++j) {
      int32_t functionId = pCtx[j].functionId;
      if (functionId == FUNCTION_TS || functionId == FUNCTION_TAG || functionId == FUNCTION_TAGPRJ) {
        continue;
      }

      SResultRowEntryInfo* pCell = getResultEntryInfo(pResult, j, rowEntryInfoOffset);
      pResult->numOfRows = (uint16_t)(TMAX(pResult->numOfRows, pCell->numOfRes));
    }
  }
#endif
}

L
Liu Jicong 已提交
1640
/*
 * Compress the data of one result column into `data` using the compression routine
 * registered in tDataTypes for the column's type, and return that routine's result.
 * The output size handed to the routine is the raw column size plus COMP_OVERFLOW_BYTES.
 */
static int32_t compressQueryColData(SColumnInfoData* pColRes, int32_t numOfRows, char* data, int8_t compressed) {
  const int32_t rawBytes = pColRes->info.bytes * numOfRows;

  return tDataTypes[pColRes->info.type].compFunc(pColRes->pData, rawBytes, numOfRows, data,
                                                 rawBytes + COMP_OVERFLOW_BYTES, compressed, NULL, 0);
}

1646 1647 1648
/*
 * Run the fill routine on pBlock with the room that is left (capacity minus the rows
 * already present) and return pBlock->info.rows afterwards.
 *
 * The value returned by taosFillResultDataBlock is intentionally not used; the caller
 * gets the block's own row counter.
 * NOTE(review): this presumes taosFillResultDataBlock updates pBlock->info.rows - confirm.
 */
int32_t doFillTimeIntervalGapsInResults(struct SFillInfo* pFillInfo, SSDataBlock* pBlock, int32_t capacity) {
  (void)taosFillResultDataBlock(pFillInfo, pBlock, capacity - pBlock->info.rows);
  return pBlock->info.rows;
}

L
Liu Jicong 已提交
1651 1652
/*
 * Finish the cost summary of a task: add the first-stage merge time to the elapsed
 * time and, when a block-load recorder is attached, log the collected figures.
 * Hash-table and result-row-pool memory statistics are not collected here.
 */
void queryCostStatis(SExecTaskInfo* pTaskInfo) {
  STaskCostInfo* pCost = &pTaskInfo->cost;

  // add the merge time
  pCost->elapsedTime += pCost->firstStageMergeTime;

  SFileBlockLoadRecorder* pRec = pCost->pRecoder;
  if (pRec == NULL) {
    return;
  }

  qDebug("%s :cost summary: elapsed time:%" PRId64 " us, first merge:%" PRId64
         " us, total blocks:%d, "
         "load block statis:%d, load data block:%d, total rows:%" PRId64 ", check rows:%" PRId64,
         GET_TASKID(pTaskInfo), pCost->elapsedTime, pCost->firstStageMergeTime, pRec->totalBlocks,
         pRec->loadBlockStatis, pRec->loadBlocks, pRec->totalRows, pRec->totalCheckedRows);
}

L
Liu Jicong 已提交
1685 1686 1687
// static void updateOffsetVal(STaskRuntimeEnv *pRuntimeEnv, SDataBlockInfo *pBlockInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
1688
//
L
Liu Jicong 已提交
1689
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1690
//
L
Liu Jicong 已提交
1691 1692 1693 1694
//   if (pQueryAttr->limit.offset == pBlockInfo->rows) {  // current block will ignore completed
//     pTableQueryInfo->lastKey = QUERY_IS_ASC_QUERY(pQueryAttr) ? pBlockInfo->window.ekey + step :
//     pBlockInfo->window.skey + step; pQueryAttr->limit.offset = 0; return;
//   }
1695
//
L
Liu Jicong 已提交
1696 1697 1698 1699 1700
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     pQueryAttr->pos = (int32_t)pQueryAttr->limit.offset;
//   } else {
//     pQueryAttr->pos = pBlockInfo->rows - (int32_t)pQueryAttr->limit.offset - 1;
//   }
1701
//
L
Liu Jicong 已提交
1702
//   assert(pQueryAttr->pos >= 0 && pQueryAttr->pos <= pBlockInfo->rows - 1);
1703
//
L
Liu Jicong 已提交
1704 1705
//   SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//   SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1706
//
L
Liu Jicong 已提交
1707 1708
//   // update the pQueryAttr->limit.offset value, and pQueryAttr->pos value
//   TSKEY *keys = (TSKEY *) pColInfoData->pData;
1709
//
L
Liu Jicong 已提交
1710 1711 1712
//   // update the offset value
//   pTableQueryInfo->lastKey = keys[pQueryAttr->pos];
//   pQueryAttr->limit.offset = 0;
1713
//
L
Liu Jicong 已提交
1714
//   int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
1715
//
L
Liu Jicong 已提交
1716 1717 1718 1719
//   //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numBlocksOfStep:%d, numOfRes:%d,
//   lastKey:%"PRId64, GET_TASKID(pRuntimeEnv),
//          pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes, pQuery->current->lastKey);
// }
1720

L
Liu Jicong 已提交
1721 1722
// void skipBlocks(STaskRuntimeEnv *pRuntimeEnv) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
1723
//
L
Liu Jicong 已提交
1724 1725 1726
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0) {
//     return;
//   }
1727
//
L
Liu Jicong 已提交
1728 1729
//   pQueryAttr->pos = 0;
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1730
//
L
Liu Jicong 已提交
1731 1732
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
//   TsdbQueryHandleT pTsdbReadHandle = pRuntimeEnv->pTsdbReadHandle;
1733
//
L
Liu Jicong 已提交
1734 1735 1736 1737 1738
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pTsdbReadHandle)) {
//     if (isTaskKilled(pRuntimeEnv->qinfo)) {
//       longjmp(pRuntimeEnv->env, TSDB_CODE_TSC_QUERY_CANCELLED);
//     }
1739
//
L
Liu Jicong 已提交
1740
//     tsdbRetrieveDataBlockInfo(pTsdbReadHandle, &blockInfo);
1741
//
L
Liu Jicong 已提交
1742 1743 1744 1745
//     if (pQueryAttr->limit.offset > blockInfo.rows) {
//       pQueryAttr->limit.offset -= blockInfo.rows;
//       pTableQueryInfo->lastKey = (QUERY_IS_ASC_QUERY(pQueryAttr)) ? blockInfo.window.ekey : blockInfo.window.skey;
//       pTableQueryInfo->lastKey += step;
1746
//
L
Liu Jicong 已提交
1747 1748 1749 1750 1751 1752 1753
//       //qDebug("QInfo:0x%"PRIx64" skip rows:%d, offset:%" PRId64, GET_TASKID(pRuntimeEnv), blockInfo.rows,
//              pQuery->limit.offset);
//     } else {  // find the appropriated start position in current block
//       updateOffsetVal(pRuntimeEnv, &blockInfo);
//       break;
//     }
//   }
1754
//
L
Liu Jicong 已提交
1755 1756 1757 1758 1759 1760 1761 1762 1763
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
// }

// static TSKEY doSkipIntervalProcess(STaskRuntimeEnv* pRuntimeEnv, STimeWindow* win, SDataBlockInfo* pBlockInfo,
// STableQueryInfo* pTableQueryInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
1764
//
L
Liu Jicong 已提交
1765 1766 1767
//   assert(pQueryAttr->limit.offset == 0);
//   STimeWindow tw = *win;
//   getNextTimeWindow(pQueryAttr, &tw);
1768
//
L
Liu Jicong 已提交
1769 1770
//   if ((tw.skey <= pBlockInfo->window.ekey && QUERY_IS_ASC_QUERY(pQueryAttr)) ||
//       (tw.ekey >= pBlockInfo->window.skey && !QUERY_IS_ASC_QUERY(pQueryAttr))) {
1771
//
L
Liu Jicong 已提交
1772 1773 1774 1775
//     // load the data block and check data remaining in current data block
//     // TODO optimize performance
//     SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//     SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1776
//
L
Liu Jicong 已提交
1777 1778 1779 1780
//     tw = *win;
//     int32_t startPos =
//         getNextQualifiedWindow(pQueryAttr, &tw, pBlockInfo, pColInfoData->pData, binarySearchForKey, -1);
//     assert(startPos >= 0);
1781
//
L
Liu Jicong 已提交
1782 1783
//     // set the abort info
//     pQueryAttr->pos = startPos;
1784
//
L
Liu Jicong 已提交
1785 1786 1787 1788
//     // reset the query start timestamp
//     pTableQueryInfo->win.skey = ((TSKEY *)pColInfoData->pData)[startPos];
//     pQueryAttr->window.skey = pTableQueryInfo->win.skey;
//     TSKEY key = pTableQueryInfo->win.skey;
1789
//
L
Liu Jicong 已提交
1790 1791
//     pWindowResInfo->prevSKey = tw.skey;
//     int32_t index = pRuntimeEnv->resultRowInfo.curIndex;
1792
//
L
Liu Jicong 已提交
1793 1794
//     int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
//     pRuntimeEnv->resultRowInfo.curIndex = index;  // restore the window index
1795
//
L
Liu Jicong 已提交
1796 1797 1798 1799
//     //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numOfRows:%d, numOfRes:%d,
//     lastKey:%" PRId64,
//            GET_TASKID(pRuntimeEnv), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes,
//            pQueryAttr->current->lastKey);
1800
//
L
Liu Jicong 已提交
1801 1802 1803 1804 1805
//     return key;
//   } else {  // do nothing
//     pQueryAttr->window.skey      = tw.skey;
//     pWindowResInfo->prevSKey = tw.skey;
//     pTableQueryInfo->lastKey = tw.skey;
1806
//
L
Liu Jicong 已提交
1807 1808
//     return tw.skey;
//   }
1809
//
L
Liu Jicong 已提交
1810 1811 1812 1813 1814 1815 1816 1817 1818 1819
//   return true;
// }

// static bool skipTimeInterval(STaskRuntimeEnv *pRuntimeEnv, TSKEY* start) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     assert(*start <= pRuntimeEnv->current->lastKey);
//   } else {
//     assert(*start >= pRuntimeEnv->current->lastKey);
//   }
1820
//
L
Liu Jicong 已提交
1821 1822 1823 1824 1825
//   // if queried with value filter, do NOT forward query start position
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0 || pRuntimeEnv->pTsBuf != NULL ||
//   pRuntimeEnv->pFillInfo != NULL) {
//     return true;
//   }
1826
//
L
Liu Jicong 已提交
1827 1828 1829 1830 1831 1832 1833
//   /*
//    * 1. for interval without interpolation query we forward pQueryAttr->interval.interval at a time for
//    *    pQueryAttr->limit.offset times. Since hole exists, pQueryAttr->interval.interval*pQueryAttr->limit.offset
//    value is
//    *    not valid. otherwise, we only forward pQueryAttr->limit.offset number of points
//    */
//   assert(pRuntimeEnv->resultRowInfo.prevSKey == TSKEY_INITIAL_VAL);
1834
//
L
Liu Jicong 已提交
1835 1836
//   STimeWindow w = TSWINDOW_INITIALIZER;
//   bool ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1837
//
L
Liu Jicong 已提交
1838 1839
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
//   STableQueryInfo *pTableQueryInfo = pRuntimeEnv->current;
1840
//
L
Liu Jicong 已提交
1841 1842 1843
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pRuntimeEnv->pTsdbReadHandle)) {
//     tsdbRetrieveDataBlockInfo(pRuntimeEnv->pTsdbReadHandle, &blockInfo);
1844
//
L
Liu Jicong 已提交
1845 1846 1847 1848 1849 1850 1851 1852 1853
//     if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       if (pWindowResInfo->prevSKey == TSKEY_INITIAL_VAL) {
//         getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.skey, blockInfo.window.skey, pQueryAttr->window.ekey,
//         &w); pWindowResInfo->prevSKey = w.skey;
//       }
//     } else {
//       getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.ekey, pQueryAttr->window.ekey, blockInfo.window.ekey, &w);
//       pWindowResInfo->prevSKey = w.skey;
//     }
1854
//
L
Liu Jicong 已提交
1855 1856
//     // the first time window
//     STimeWindow win = getActiveTimeWindow(pWindowResInfo, pWindowResInfo->prevSKey, pQueryAttr);
1857
//
L
Liu Jicong 已提交
1858 1859
//     while (pQueryAttr->limit.offset > 0) {
//       STimeWindow tw = win;
1860
//
L
Liu Jicong 已提交
1861 1862 1863
//       if ((win.ekey <= blockInfo.window.ekey && ascQuery) || (win.ekey >= blockInfo.window.skey && !ascQuery)) {
//         pQueryAttr->limit.offset -= 1;
//         pWindowResInfo->prevSKey = win.skey;
1864
//
L
Liu Jicong 已提交
1865 1866 1867 1868 1869 1870
//         // current time window is aligned with blockInfo.window.ekey
//         // restart it from next data block by set prevSKey to be TSKEY_INITIAL_VAL;
//         if ((win.ekey == blockInfo.window.ekey && ascQuery) || (win.ekey == blockInfo.window.skey && !ascQuery)) {
//           pWindowResInfo->prevSKey = TSKEY_INITIAL_VAL;
//         }
//       }
1871
//
L
Liu Jicong 已提交
1872 1873 1874 1875
//       if (pQueryAttr->limit.offset == 0) {
//         *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//         return true;
//       }
1876
//
L
Liu Jicong 已提交
1877 1878
//       // current window does not ended in current data block, try next data block
//       getNextTimeWindow(pQueryAttr, &tw);
1879
//
L
Liu Jicong 已提交
1880 1881 1882 1883 1884 1885 1886 1887 1888
//       /*
//        * If the next time window still starts from current data block,
//        * load the primary timestamp column first, and then find the start position for the next queried time window.
//        * Note that only the primary timestamp column is required.
//        * TODO: Optimize for this cases. All data blocks are not needed to be loaded, only if the first actually
//        required
//        * time window resides in current data block.
//        */
//       if ((tw.skey <= blockInfo.window.ekey && ascQuery) || (tw.ekey >= blockInfo.window.skey && !ascQuery)) {
1889
//
L
Liu Jicong 已提交
1890 1891
//         SArray *pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//         SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1892
//
L
Liu Jicong 已提交
1893 1894 1895
//         if ((win.ekey > blockInfo.window.ekey && ascQuery) || (win.ekey < blockInfo.window.skey && !ascQuery)) {
//           pQueryAttr->limit.offset -= 1;
//         }
1896
//
L
Liu Jicong 已提交
1897 1898 1899 1900 1901 1902 1903 1904
//         if (pQueryAttr->limit.offset == 0) {
//           *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//           return true;
//         } else {
//           tw = win;
//           int32_t startPos =
//               getNextQualifiedWindow(pQueryAttr, &tw, &blockInfo, pColInfoData->pData, binarySearchForKey, -1);
//           assert(startPos >= 0);
1905
//
L
Liu Jicong 已提交
1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916
//           // set the abort info
//           pQueryAttr->pos = startPos;
//           pTableQueryInfo->lastKey = ((TSKEY *)pColInfoData->pData)[startPos];
//           pWindowResInfo->prevSKey = tw.skey;
//           win = tw;
//         }
//       } else {
//         break;  // offset is not 0, and next time window begins or ends in the next block.
//       }
//     }
//   }
1917
//
L
Liu Jicong 已提交
1918 1919 1920 1921
//   // check for error
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
1922
//
L
Liu Jicong 已提交
1923 1924
//   return true;
// }
1925

1926
/*
 * Install `num` downstream operators, copied from pDownstream, as the downstream list of p.
 *
 * The new list is built in a temporary first, so a failed allocation leaves p untouched
 * (pointer and counter stay consistent). A list installed earlier is freed once the new
 * one is in place instead of being leaked.
 * NOTE(review): freeing assumes a previously installed list was allocated by this function - confirm.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the list cannot be allocated.
 */
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num) {
  if (p->pDownstream == NULL) {
    assert(p->numOfDownstream == 0);
  }

  void* pList = taosMemoryCalloc(1, num * POINTER_BYTES);
  if (pList == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // copy before releasing the old list, in case the caller passed that very list
  memcpy(pList, pDownstream, num * POINTER_BYTES);

  if (p->pDownstream != NULL) {
    taosMemoryFree(p->pDownstream);
  }

  p->pDownstream = pList;
  p->numOfDownstream = num;
  return TSDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
1941
// Forward declaration; being static, the function is defined elsewhere in this translation unit.
static void doDestroyTableList(STableListInfo* pTableqinfoList);
1942

1943
/*
 * Currently a no-op: the sanity checks below are compiled out with "#if 0".
 * When enabled they assert that a table's query window and last key are consistent
 * with the task's window for the given scan order.
 */
static void doTableQueryInfoTimeWindowCheck(SExecTaskInfo* pTaskInfo, STableQueryInfo* pTableQueryInfo, int32_t order) {
#if 0
  if (order == TSDB_ORDER_ASC) {
    assert(
        (pTableQueryInfo->win.skey <= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey >= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey >= pTaskInfo->window.skey && pTableQueryInfo->win.ekey <= pTaskInfo->window.ekey));
  } else {
    assert(
        (pTableQueryInfo->win.skey >= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey <= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey <= pTaskInfo->window.skey && pTableQueryInfo->win.ekey >= pTaskInfo->window.ekey));
  }
#endif
}

1959 1960 1961 1962
// Callback parameter attached to a fetch request; loadRemoteDataCallback uses it to find
// the exchange operator and the data source the response belongs to.
typedef struct SFetchRspHandleWrapper {
  uint32_t exchangeId;   // reference id looked up in exchangeObjRefPool to obtain the SExchangeInfo
  int32_t  sourceIndex;  // index of the source entry in SExchangeInfo.pSourceDataInfo
} SFetchRspHandleWrapper;
1963

D
dapan1121 已提交
1964
/*
 * Response callback for a fetch request sent by the exchange operator.
 *
 * param : SFetchRspHandleWrapper identifying the exchange operator and the source index
 * pMsg  : response buffer; on success pMsg->pData is kept as the source's pRsp
 * code  : result code of the request
 *
 * On success the header fields of the response are converted to host byte order and stored
 * with the source. On failure the code is recorded with the source. In both cases the source
 * is marked EX_SOURCE_DATA_READY and the exchange operator's `ready` semaphore is posted.
 * The payload is freed here whenever it is not handed over to the source (operator already
 * released, or error response), so it does not leak.
 *
 * Always returns TSDB_CODE_SUCCESS.
 */
int32_t loadRemoteDataCallback(void* param, SDataBuf* pMsg, int32_t code) {
  SFetchRspHandleWrapper* pWrapper = (SFetchRspHandleWrapper*)param;

  SExchangeInfo* pExchangeInfo = taosAcquireRef(exchangeObjRefPool, pWrapper->exchangeId);
  if (pExchangeInfo == NULL) {
    qWarn("failed to acquire exchange operator, since it may have been released");
    taosMemoryFreeClear(pMsg->pData);  // nobody is left to consume the payload
    return TSDB_CODE_SUCCESS;
  }

  int32_t          index = pWrapper->sourceIndex;
  SSourceDataInfo* pSourceDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, index);

  if (code == TSDB_CODE_SUCCESS) {
    SRetrieveTableRsp* pRsp = pMsg->pData;
    ASSERT(pRsp != NULL);  // must hold before any field of the response is touched

    pSourceDataInfo->pRsp = pRsp;

    // header fields arrive in network byte order
    pRsp->numOfRows = htonl(pRsp->numOfRows);
    pRsp->compLen = htonl(pRsp->compLen);
    pRsp->numOfCols = htonl(pRsp->numOfCols);
    pRsp->useconds = htobe64(pRsp->useconds);

    qDebug("%s fetch rsp received, index:%d, rows:%d", pSourceDataInfo->taskId, index, pRsp->numOfRows);
  } else {
    taosMemoryFreeClear(pMsg->pData);  // an error response carries no usable payload
    pSourceDataInfo->code = code;
    qDebug("%s fetch rsp received, index:%d, error:%s", pSourceDataInfo->taskId, index, tstrerror(code));
  }

  pSourceDataInfo->status = EX_SOURCE_DATA_READY;

  tsem_post(&pExchangeInfo->ready);
  taosReleaseRef(exchangeObjRefPool, pWrapper->exchangeId);

  return TSDB_CODE_SUCCESS;
}

D
dapan1121 已提交
2000
/*
 * Deliver an RPC response to the callback registered in the message's send info.
 *
 * The response content is copied into a freshly allocated buffer that is passed to the
 * callback; if that allocation fails, terrno and the message code are set to
 * TSDB_CODE_OUT_OF_MEMORY and the callback receives a NULL data pointer.
 * Afterwards the RPC content and the send info are released.
 */
void qProcessRspMsg(void* parent, SRpcMsg* pMsg, SEpSet* pEpSet) {
  assert(pMsg->info.ahandle != NULL);
  SMsgSendInfo* pInfo = (SMsgSendInfo*)pMsg->info.ahandle;

  SDataBuf rspBuf = {.len = pMsg->contLen, .pData = NULL};

  if (pMsg->contLen > 0) {
    rspBuf.pData = taosMemoryCalloc(1, pMsg->contLen);
    if (rspBuf.pData != NULL) {
      memcpy(rspBuf.pData, pMsg->pCont, pMsg->contLen);
    } else {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      pMsg->code = TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  pInfo->fp(pInfo->param, &rspBuf, pMsg->code);

  rpcFreeCont(pMsg->pCont);
  destroySendMsgInfo(pInfo);
}

L
Liu Jicong 已提交
2021
/*
 * Build a fetch request for the source at sourceIndex and send it asynchronously.
 * The response is delivered to loadRemoteDataCallback.
 *
 * Returns TSDB_CODE_SUCCESS when the request was handed to the transport. If one of the
 * request objects cannot be allocated, everything allocated so far is freed, pTaskInfo->code
 * is set to TSDB_CODE_QRY_OUT_OF_MEMORY and that code is returned. A failure reported by
 * asyncSendMsgToServer is logged and returned to the caller.
 */
static int32_t doSendFetchDataRequest(SExchangeInfo* pExchangeInfo, SExecTaskInfo* pTaskInfo, int32_t sourceIndex) {
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  SResFetchReq* pMsg = taosMemoryCalloc(1, sizeof(SResFetchReq));
  if (NULL == pMsg) {
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, sourceIndex);
  SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, sourceIndex);

  ASSERT(pDataInfo->status == EX_SOURCE_DATA_NOT_READY);

  qDebug("%s build fetch msg and send to vgId:%d, ep:%s, taskId:0x%" PRIx64 ", execId:%d, %d/%" PRIzu,
         GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->addr.epSet.eps[0].fqdn, pSource->taskId, pSource->execId,
         sourceIndex, totalSources);

  // request fields travel in network byte order
  pMsg->header.vgId = htonl(pSource->addr.nodeId);
  pMsg->sId = htobe64(pSource->schedId);
  pMsg->taskId = htobe64(pSource->taskId);
  pMsg->queryId = htobe64(pTaskInfo->id.queryId);
  pMsg->execId = htonl(pSource->execId);

  // send the fetch remote task result request
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (NULL == pMsgSendInfo) {
    taosMemoryFreeClear(pMsg);
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SMsgSendInfo));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SFetchRspHandleWrapper* pWrapper = taosMemoryCalloc(1, sizeof(SFetchRspHandleWrapper));
  if (NULL == pWrapper) {
    taosMemoryFreeClear(pMsg);
    taosMemoryFreeClear(pMsgSendInfo);
    qError("%s prepare fetch rsp wrapper %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SFetchRspHandleWrapper));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  pWrapper->exchangeId = pExchangeInfo->self;
  pWrapper->sourceIndex = sourceIndex;

  pMsgSendInfo->param = pWrapper;
  pMsgSendInfo->paramFreeFp = taosMemoryFree;
  pMsgSendInfo->msgInfo.pData = pMsg;
  pMsgSendInfo->msgInfo.len = sizeof(SResFetchReq);
  pMsgSendInfo->msgType = pSource->fetchMsgType;
  pMsgSendInfo->fp = loadRemoteDataCallback;

  int64_t transporterId = 0;
  int32_t code = asyncSendMsgToServer(pExchangeInfo->pTransporter, &pSource->addr.epSet, &transporterId, pMsgSendInfo);
  if (code != TSDB_CODE_SUCCESS) {
    // NOTE(review): ownership of pMsgSendInfo after a failed send is not visible here, so it
    // is not freed at this point - confirm against asyncSendMsgToServer.
    qError("%s failed to send fetch msg to vgId:%d, code %s", GET_TASKID(pTaskInfo), pSource->addr.nodeId,
           tstrerror(code));
    return code;
  }

  return TSDB_CODE_SUCCESS;
}

2070
/*
 * Decode the payload of a fetch response into pRes and update the load statistics.
 *
 * pColList == NULL : the payload is decoded straight into pRes.
 * pColList != NULL : the payload starts with a column count and a schema array in network
 *                    byte order; the data is decoded into a temporary block and the columns
 *                    named by pColList are then relocated into pRes.
 *
 * pLoadInfo receives the row count, compLen and the time elapsed since startTs; *total, when
 * given, is increased by numOfRows.
 *
 * Returns TSDB_CODE_SUCCESS. If the temporary block cannot be created, TSDB_CODE_OUT_OF_MEMORY
 * is returned; if pRes cannot be grown, the code from blockDataEnsureCapacity is returned.
 * In both failure cases the statistics are left untouched.
 */
int32_t extractDataBlockFromFetchRsp(SSDataBlock* pRes, SLoadRemoteDataInfo* pLoadInfo, int32_t numOfRows, char* pData,
                                     int32_t compLen, int32_t numOfOutput, int64_t startTs, uint64_t* total,
                                     SArray* pColList) {
  if (pColList == NULL) {  // data from other sources
    blockDataCleanup(pRes);
    blockDecode(pRes, numOfOutput, numOfRows, pData);
  } else {  // extract data according to pColList
    ASSERT(numOfOutput == taosArrayGetSize(pColList));
    char* pStart = pData;

    int32_t numOfCols = htonl(*(int32_t*)pStart);
    pStart += sizeof(int32_t);

    // todo refactor:extract method
    // convert the schema entries to host byte order in place
    SSysTableSchema* pSchema = (SSysTableSchema*)pStart;
    for (int32_t i = 0; i < numOfCols; ++i) {
      SSysTableSchema* p = (SSysTableSchema*)pStart;

      p->colId = htons(p->colId);
      p->bytes = htonl(p->bytes);
      pStart += sizeof(SSysTableSchema);
    }

    SSDataBlock* pBlock = createDataBlock();
    if (pBlock == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    for (int32_t i = 0; i < numOfCols; ++i) {
      SColumnInfoData idata = createColumnInfoData(pSchema[i].type, pSchema[i].bytes, pSchema[i].colId);
      blockDataAppendColInfo(pBlock, &idata);
    }

    blockDecode(pBlock, numOfCols, numOfRows, pStart);

    int32_t code = blockDataEnsureCapacity(pRes, numOfRows);
    if (TAOS_FAILED(code)) {
      blockDataDestroy(pBlock);
      return code;
    }

    // data from mnode
    pRes->info.rows = numOfRows;
    relocateColumnData(pRes, pColList, pBlock->pDataBlock, false);
    blockDataDestroy(pBlock);
  }

  // todo move this to time window aggregator, since the primary timestamp may not be known by exchange operator.
  blockDataUpdateTsWindow(pRes, 0);

  int64_t el = taosGetTimestampUs() - startTs;

  pLoadInfo->totalRows += numOfRows;
  pLoadInfo->totalSize += compLen;

  if (total != NULL) {
    *total += numOfRows;
  }

  pLoadInfo->totalElapsed += el;
  return TSDB_CODE_SUCCESS;
}
2124

L
Liu Jicong 已提交
2125 2126
/*
 * Finish the exchange operator after all of its sources have been consumed.
 *
 * The time elapsed since startTs (microseconds) is added to the accumulated load
 * statistics, a summary line is written to the debug log and the operator is
 * flagged as completed via doSetOperatorCompleted().
 *
 * Always returns NULL, so callers can `return setAllSourcesCompleted(...)` directly.
 */
static void* setAllSourcesCompleted(SOperatorInfo* pOperator, int64_t startTs) {
  SExchangeInfo*       pExchangeInfo = pOperator->info;
  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;

  // account for the time spent in the current fetch round
  pLoadInfo->totalElapsed += taosGetTimestampUs() - startTs;

  size_t numOfSources = taosArrayGetSize(pExchangeInfo->pSources);
  qDebug("%s all %" PRIzu " sources are exhausted, total rows: %" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
         GET_TASKID(pTaskInfo), numOfSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
         pLoadInfo->totalElapsed / 1000.0);

  doSetOperatorCompleted(pOperator);
  return NULL;
}

L
Liu Jicong 已提交
2143 2144
/*
 * Return the next data block when all sources are fetched concurrently.
 *
 * The per-source status array is polled repeatedly:
 *   - exhausted sources are only counted;
 *   - sources whose status is not EX_SOURCE_DATA_READY are skipped;
 *   - the first ready source has its response decoded into pExchangeInfo->pResult,
 *     and, unless the response is flagged as completed, a new fetch request is sent
 *     to that source before the block is returned.
 * When a full pass yields nothing, the thread yields the CPU and polls again.
 *
 * Returns pExchangeInfo->pResult when data is available. Returns NULL either when
 * every source is exhausted (the operator is then marked completed) or on failure,
 * in which case the error code is stored in pTaskInfo->code.
 */
static SSDataBlock* concurrentlyLoadRemoteDataImpl(SOperatorInfo* pOperator, SExchangeInfo* pExchangeInfo,
                                                   SExecTaskInfo* pTaskInfo) {
  int32_t code = 0;
  int64_t startTs = taosGetTimestampUs();
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  for (;;) {
    int32_t completed = 0;

    for (int32_t i = 0; i < totalSources; ++i) {
      SSourceDataInfo* pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, i);

      if (pDataInfo->status == EX_SOURCE_DATA_EXHAUSTED) {
        completed += 1;
        continue;
      }

      // nothing has arrived from this source yet
      if (pDataInfo->status != EX_SOURCE_DATA_READY) {
        continue;
      }

      if (pDataInfo->code != TSDB_CODE_SUCCESS) {
        code = pDataInfo->code;
        goto _error;
      }

      SRetrieveTableRsp*     pRsp = pDataInfo->pRsp;
      SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, i);
      SSDataBlock*           pRes = pExchangeInfo->pResult;
      SLoadRemoteDataInfo*   pLoadInfo = &pExchangeInfo->loadInfo;

      // an empty response means this source has no more data
      if (pRsp->numOfRows == 0) {
        qDebug("%s vgId:%d, taskId:0x%" PRIx64 " execId:%d index:%d completed, rowsOfSource:%" PRIu64
               ", totalRows:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pDataInfo->totalRows,
               pExchangeInfo->loadInfo.totalRows, completed + 1, i + 1, totalSources);
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
        completed += 1;
        taosMemoryFreeClear(pDataInfo->pRsp);
        continue;
      }

      code = extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pRsp->numOfRows, pRsp->data,
                                          pRsp->compLen, pRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
      if (code != 0) {
        taosMemoryFreeClear(pDataInfo->pRsp);
        goto _error;
      }

      if (pRsp->completed == 1) {
        // last batch of this source
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d index:%d completed, numOfRows:%d, rowsOfSource:%" PRIu64 ", totalRows:%" PRIu64
               ", totalBytes:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pRes->info.rows,
               pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, completed + 1, i + 1, totalSources);
        completed += 1;
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      } else {
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
               ", totalBytes:%" PRIu64,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
               pLoadInfo->totalRows, pLoadInfo->totalSize);
      }

      // the payload has been decoded into the result block; the raw response is no longer needed
      taosMemoryFreeClear(pDataInfo->pRsp);

      // more data is pending on this source: ask for the next batch before handing out the block
      if (pDataInfo->status != EX_SOURCE_DATA_EXHAUSTED) {
        pDataInfo->status = EX_SOURCE_DATA_NOT_READY;
        code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
        if (code != TSDB_CODE_SUCCESS) {
          taosMemoryFreeClear(pDataInfo->pRsp);
          goto _error;
        }
      }

      return pExchangeInfo->pResult;
    }

    if (completed == totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
    }

    // nothing ready in this pass; give other threads a chance to run before polling again
    sched_yield();
  }

_error:
  pTaskInfo->code = code;
  return NULL;
}

L
Liu Jicong 已提交
2234 2235 2236
/*
 * Open step of the concurrent loading mode: send one fetch request to every source.
 *
 * On the first failing request the error code is stored in pTaskInfo->code and returned.
 * Otherwise the operator status becomes OP_RES_TO_RETURN, the open cost is recorded and
 * the function waits on the exchange `ready` semaphore before returning
 * TSDB_CODE_SUCCESS.
 */
static int32_t prepareConcurrentlyLoad(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  size_t  numOfSources = taosArrayGetSize(pExchangeInfo->pSources);
  int64_t beginUs = taosGetTimestampUs();

  // Asynchronously send all fetch requests to all sources.
  int32_t idx = 0;
  while (idx < numOfSources) {
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, idx);
    if (code != TSDB_CODE_SUCCESS) {
      pTaskInfo->code = code;
      return code;
    }

    idx += 1;
  }

  int64_t sentUs = taosGetTimestampUs();
  qDebug("%s send all fetch requests to %" PRIzu " sources completed, elapsed:%.2fms", GET_TASKID(pTaskInfo),
         numOfSources, (sentUs - beginUs) / 1000.0);

  pOperator->status = OP_RES_TO_RETURN;
  pOperator->cost.openCost = taosGetTimestampUs() - beginUs;

  // NOTE(review): presumably posted by the fetch response handler once data arrives - confirm
  tsem_wait(&pExchangeInfo->ready);
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
2261 2262 2263
/*
 * Return the next data block when the sources are drained one after another.
 *
 * For the source at index pExchangeInfo->current a fetch request is sent and the
 * function waits on the `ready` semaphore. An empty response marks that source as
 * exhausted and moves on to the next one; a non-empty response is decoded into
 * pExchangeInfo->pResult and returned.
 *
 * Returns pExchangeInfo->pResult when data is available. Returns NULL when all sources
 * are exhausted (the operator is then marked completed) or on failure, in which case
 * the error code is stored in pTaskInfo->code.
 */
static SSDataBlock* seqLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
  int64_t startTs = taosGetTimestampUs();

  while (1) {
    if (pExchangeInfo->current >= totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
    }

    // Do not wait on the semaphore if the request could not be sent; same check as the
    // concurrent loading path performs.
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, pExchangeInfo->current);
    if (code != TSDB_CODE_SUCCESS) {
      pTaskInfo->code = code;
      return NULL;
    }

    tsem_wait(&pExchangeInfo->ready);

    SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, pExchangeInfo->current);
    SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, pExchangeInfo->current);

    if (pDataInfo->code != TSDB_CODE_SUCCESS) {
      qError("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d error happens, code:%s", GET_TASKID(pTaskInfo),
             pSource->addr.nodeId, pSource->taskId, pSource->execId, tstrerror(pDataInfo->code));
      pOperator->pTaskInfo->code = pDataInfo->code;
      return NULL;
    }

    SRetrieveTableRsp*   pRsp = pDataInfo->pRsp;
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;

    // an empty response means the current source has no more data: advance to the next one
    if (pRsp->numOfRows == 0) {
      qDebug("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d %d of total completed, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 " try next",
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pExchangeInfo->current + 1,
             pDataInfo->totalRows, pLoadInfo->totalRows);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
      taosMemoryFreeClear(pDataInfo->pRsp);
      continue;
    }

    SSDataBlock* pRes = pExchangeInfo->pResult;
    code = extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pRsp->numOfRows, pRsp->data, pRsp->compLen,
                                        pRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
    if (code != TSDB_CODE_SUCCESS) {
      // decoding failed: release the response and report the error instead of returning a bogus block
      taosMemoryFreeClear(pDataInfo->pRsp);
      pTaskInfo->code = code;
      return NULL;
    }

    if (pRsp->completed == 1) {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64 " try next %d/%" PRIzu,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, pExchangeInfo->current + 1,
             totalSources);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
    } else {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
             ", totalBytes:%" PRIu64,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pLoadInfo->totalRows, pLoadInfo->totalSize);
    }

    pOperator->resultInfo.totalRows += pRes->info.rows;
    taosMemoryFreeClear(pDataInfo->pRsp);
    return pExchangeInfo->pResult;
  }
}

L
Liu Jicong 已提交
2328
/*
 * Open function of the exchange operator.
 *
 * Does nothing when the operator is already opened. In concurrent mode
 * (seqLoadData == false) the fetch requests are dispatched through
 * prepareConcurrentlyLoad(); a failure there is returned unchanged and the operator is
 * left un-opened. On success the operator is flagged as opened and the open cost is
 * recorded.
 */
static int32_t prepareLoadRemoteData(SOperatorInfo* pOperator) {
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
  }

  int64_t        openStartUs = taosGetTimestampUs();
  SExchangeInfo* pExchangeInfo = pOperator->info;

  int32_t code = TSDB_CODE_SUCCESS;
  if (!pExchangeInfo->seqLoadData) {
    code = prepareConcurrentlyLoad(pOperator);
  }

  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  OPTR_SET_OPENED(pOperator);
  pOperator->cost.openCost = (taosGetTimestampUs() - openStartUs) / 1000.0;
  return TSDB_CODE_SUCCESS;
}

2348
/*
 * Fetch one block from the remote sources without applying limit/offset.
 *
 * The operator's open function is invoked first and its result is stored in
 * pTaskInfo->code; NULL is returned when opening fails. NULL is also returned when the
 * operator has already finished. Otherwise the call is dispatched to the sequential or
 * the concurrent loader depending on seqLoadData.
 */
static SSDataBlock* doLoadRemoteDataImpl(SOperatorInfo* pOperator) {
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  SExchangeInfo* pExchangeInfo = pOperator->info;

  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
    return NULL;
  }

  if (pOperator->status == OP_EXEC_DONE) {
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
    size_t               numOfSources = taosArrayGetSize(pExchangeInfo->pSources);

    qDebug("%s all %" PRIzu " source(s) are exhausted, total rows:%" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
           GET_TASKID(pTaskInfo), numOfSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
           pLoadInfo->totalElapsed / 1000.0);
    return NULL;
  }

  return pExchangeInfo->seqLoadData ? seqLoadRemoteData(pOperator)
                                    : concurrentlyLoadRemoteDataImpl(pOperator, pExchangeInfo, pTaskInfo);
}
2373

2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411
/*
 * Get-next function of the exchange operator.
 *
 * Blocks are pulled with doLoadRemoteDataImpl(). When no limit/offset is configured the
 * block is returned as is. Otherwise handleLimitOffset() is applied to it: unless it
 * reports PROJECT_RETRIEVE_DONE another block is fetched; when it does, the remaining
 * rows are added to limitInfo.numOfOutputRows and the block is returned, or, if no row
 * is left, the operator is marked completed and NULL is returned.
 */
static SSDataBlock* doLoadRemoteData(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExchangeInfo* pExchangeInfo = pOperator->info;

  for (;;) {
    SSDataBlock* pBlock = doLoadRemoteDataImpl(pOperator);
    if (pBlock == NULL) {
      return NULL;
    }

    ASSERT(pBlock == pExchangeInfo->pResult);

    SLimitInfo* pLimitInfo = &pExchangeInfo->limitInfo;
    if (!hasLimitOffsetInfo(pLimitInfo)) {
      return pExchangeInfo->pResult;
    }

    int32_t status = handleLimitOffset(pOperator, pLimitInfo, pExchangeInfo->pResult, false);
    if (status != PROJECT_RETRIEVE_DONE) {
      // PROJECT_RETRIEVE_CONTINUE (or any other status): fetch the next block
      continue;
    }

    size_t rows = pExchangeInfo->pResult->info.rows;
    pExchangeInfo->limitInfo.numOfOutputRows += rows;

    if (rows == 0) {
      doSetOperatorCompleted(pOperator);
      return NULL;
    }

    return pExchangeInfo->pResult;
  }
}

2412
/*
 * Create pInfo->pSourceDataInfo with one SSourceDataInfo entry per source.
 *
 * Every entry starts with status EX_SOURCE_DATA_NOT_READY, carries the task id string
 * `id` and its own index in the array.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the array cannot be created
 * or extended. On failure pInfo->pSourceDataInfo is left as NULL so that a later cleanup
 * of pInfo cannot release the array a second time.
 */
static int32_t initDataSource(int32_t numOfSources, SExchangeInfo* pInfo, const char* id) {
  pInfo->pSourceDataInfo = taosArrayInit(numOfSources, sizeof(SSourceDataInfo));
  if (pInfo->pSourceDataInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  for (int32_t i = 0; i < numOfSources; ++i) {
    SSourceDataInfo dataInfo = {0};
    dataInfo.status = EX_SOURCE_DATA_NOT_READY;
    dataInfo.taskId = id;
    dataInfo.index = i;

    if (taosArrayPush(pInfo->pSourceDataInfo, &dataInfo) == NULL) {
      taosArrayDestroy(pInfo->pSourceDataInfo);
      pInfo->pSourceDataInfo = NULL;  // do not leave a dangling pointer behind for the caller's cleanup path
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
}

2433
/*
 * Fill the exchange runtime info from the physical plan node.
 *
 * Copies every downstream source node of pExNode->pSrcEndPoints into pInfo->pSources,
 * initializes the limit info, registers pInfo in exchangeObjRefPool (the reference id is
 * kept in pInfo->self) and finally builds the per-source state via initDataSource().
 *
 * Returns TSDB_CODE_INVALID_PARA when the plan node has no source,
 * TSDB_CODE_OUT_OF_MEMORY when the source array cannot be created, otherwise the result
 * of initDataSource().
 */
static int32_t initExchangeOperator(SExchangePhysiNode* pExNode, SExchangeInfo* pInfo, const char* id) {
  size_t numOfSources = LIST_LENGTH(pExNode->pSrcEndPoints);
  if (numOfSources == 0) {
    qError("%s invalid number: %d of sources in exchange operator", id, (int32_t)numOfSources);
    return TSDB_CODE_INVALID_PARA;
  }

  pInfo->pSources = taosArrayInit(numOfSources, sizeof(SDownstreamSourceNode));
  if (pInfo->pSources == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t idx = 0;
  while (idx < numOfSources) {
    SDownstreamSourceNode* pSrcNode =
        (SDownstreamSourceNode*)nodesListGetNode((SNodeList*)pExNode->pSrcEndPoints, idx);
    taosArrayPush(pInfo->pSources, pSrcNode);
    idx += 1;
  }

  initLimitInfo(pExNode->node.pLimit, pExNode->node.pSlimit, &pInfo->limitInfo);
  pInfo->self = taosAddRef(exchangeObjRefPool, pInfo);

  return initDataSource(numOfSources, pInfo, id);
}

/*
 * Create the exchange operator described by pExNode.
 *
 * pTransporter is stored in the operator info for later use by the fetch requests.
 * The operator is created in concurrent loading mode (seqLoadData == false), with
 * prepareLoadRemoteData as open function and doLoadRemoteData as get-next function.
 *
 * Returns the new operator. On failure everything allocated here is released,
 * pTaskInfo->code is set to the error code and NULL is returned.
 */
SOperatorInfo* createExchangeOperatorInfo(void* pTransporter, SExchangePhysiNode* pExNode, SExecTaskInfo* pTaskInfo) {
  // Declared before the first `goto _error` so that the error path never reads an
  // uninitialized value; the only failure before the first assignment is an allocation failure.
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;

  SExchangeInfo* pInfo = taosMemoryCalloc(1, sizeof(SExchangeInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  code = initExchangeOperator(pExNode, pInfo, GET_TASKID(pTaskInfo));
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  tsem_init(&pInfo->ready, 0, 0);

  pInfo->seqLoadData = false;
  pInfo->pTransporter = pTransporter;
  pInfo->pResult = createResDataBlock(pExNode->node.pOutputDataBlockDesc);
  if (pInfo->pResult == NULL) {
    // the result block is dereferenced right below; fail cleanly instead
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pOperator->name = "ExchangeOperator";
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_EXCHANGE;
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pResult->pDataBlock);
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(prepareLoadRemoteData, doLoadRemoteData, NULL, NULL,
                                         destroyExchangeOperatorInfo, NULL, NULL, NULL);
  return pOperator;

_error:
  if (pInfo != NULL) {
    doDestroyExchangeOperatorInfo(pInfo);
  }

  taosMemoryFreeClear(pOperator);
  pTaskInfo->code = code;
  return NULL;
}

dengyihao's avatar
dengyihao 已提交
2496 2497
// Forward declaration; the function is called by createSortedMergeOperatorInfo further down in this file.
static int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                                const char* pKey);
2498

2499
static void destroySortedMergeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
2500
  SSortedMergeOperatorInfo* pInfo = (SSortedMergeOperatorInfo*)param;
H
Haojun Liao 已提交
2501
  taosArrayDestroy(pInfo->pSortInfo);
2502 2503 2504
  taosArrayDestroy(pInfo->groupInfo);

  if (pInfo->pSortHandle != NULL) {
H
Haojun Liao 已提交
2505
    tsortDestroySortHandle(pInfo->pSortHandle);
2506 2507
  }

H
Haojun Liao 已提交
2508
  blockDataDestroy(pInfo->binfo.pRes);
H
Haojun Liao 已提交
2509
  cleanupAggSup(&pInfo->aggSup);
L
Liu Jicong 已提交
2510

D
dapan1121 已提交
2511
  taosMemoryFreeClear(param);
2512
}
H
Haojun Liao 已提交
2513

L
Liu Jicong 已提交
2514
/*
 * Check whether row `rowIndex` of pBlock belongs to the group whose values are saved in buf.
 *
 * groupInfo holds the column indexes (int32_t) of the group-by columns inside pBlock;
 * buf[i] is the saved value for the i-th group-by column, or NULL for a NULL value.
 *
 * Returns true when there is no group-by column or when every group-by column of the
 * row equals the saved value, i.e. the row has to be merged into the current group;
 * false as soon as one column differs.
 */
static bool needToMerge(SSDataBlock* pBlock, SArray* groupInfo, char** buf, int32_t rowIndex) {
  size_t size = taosArrayGetSize(groupInfo);
  if (size == 0) {
    return true;
  }

  for (int32_t i = 0; i < size; ++i) {
    int32_t* index = taosArrayGet(groupInfo, i);

    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
    bool             isNull = colDataIsNull(pColInfo, rowIndex, pBlock->info.rows, NULL);
    bool             savedIsNull = (buf[i] == NULL);

    // exactly one side is NULL: different group
    if (isNull != savedIsNull) {
      return false;
    }

    // both sides are NULL: equal, and there is nothing to compare (buf[i] must not be dereferenced)
    if (isNull) {
      continue;
    }

    char* pCell = colDataGetData(pColInfo, rowIndex);
    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      if (varDataLen(pCell) != varDataLen(buf[i])) {
        return false;
      }

      if (memcmp(varDataVal(pCell), varDataVal(buf[i]), varDataLen(pCell)) != 0) {
        return false;
      }
    } else if (memcmp(pCell, buf[i], pColInfo->info.bytes) != 0) {
      return false;
    }
  }

  // every group-by column matches the saved tuple
  return true;
}

L
Liu Jicong 已提交
2549 2550 2551
/*
 * Merge row `rowIndex` of the current input block into the running result of every
 * expression.
 *
 * Placeholder: the merge step is not implemented, so this function currently does
 * nothing.
 *
 * TODO: set the row index on every context and invoke the merge function of each
 *       expression (user defined functions, identified by a negative functionId,
 *       need their own merge call).
 */
static void doMergeResultImpl(SSortedMergeOperatorInfo* pInfo, SqlFunctionCtx* pCtx, int32_t numOfExpr,
                              int32_t rowIndex) {
  (void)pInfo;
  (void)pCtx;
  (void)numOfExpr;
  (void)rowIndex;
}
2568

L
Liu Jicong 已提交
2569 2570
/*
 * Finalize the running result of every expression of the current group.
 *
 * Placeholder: the finalize step is not implemented, so this function currently does
 * nothing.
 *
 * TODO: invoke the finalize function of each expression (user defined functions,
 *       identified by a negative functionId, need their own finalize call).
 */
static void doFinalizeResultImpl(SqlFunctionCtx* pCtx, int32_t numOfExpr) {
  (void)pCtx;
  (void)numOfExpr;
}
2583

2584
/*
 * Copy the values of the listed columns of row `rowIndex` into the buffers of rowColData.
 *
 * pColumnList holds the column indexes (int32_t) inside pBlock; rowColData[i] receives
 * the cell of the i-th listed column and must be large enough for it.
 *
 * Always returns true.
 */
static bool saveCurrentTuple(char** rowColData, SArray* pColumnList, SSDataBlock* pBlock, int32_t rowIndex) {
  int32_t numOfCols = (int32_t)taosArrayGetSize(pColumnList);

  int32_t k = 0;
  while (k < numOfCols) {
    int32_t*         pSlot = taosArrayGet(pColumnList, k);
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *pSlot);

    char* pCell = colDataGetData(pColInfo, rowIndex);
    memcpy(rowColData[k], pCell, colDataGetLength(pColInfo, rowIndex));

    k += 1;
  }

  return true;
}
2597

2598 2599
/*
 * Feed every row of pBlock into the group-wise merge.
 *
 * The first row ever seen opens a group and its group-by values are saved. Each
 * following row is either merged into the current group (needToMerge() is true) or
 * closes it: the group is finalized, its result rows are added to the output block,
 * the process function of every non-negative functionId is invoked, and the row opens
 * a new group.
 */
static void doMergeImpl(SOperatorInfo* pOperator, int32_t numOfExpr, SSDataBlock* pBlock) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  SqlFunctionCtx*           pCtx = pOperator->exprSupp.pCtx;

  for (int32_t row = 0; row < pBlock->info.rows; ++row) {
    // no group has been opened yet
    if (!pInfo->hasGroupVal) {
      ASSERT(row == 0);
      doMergeResultImpl(pInfo, pCtx, numOfExpr, row);
      pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, row);
      continue;
    }

    // same group as the saved tuple
    if (needToMerge(pBlock, pInfo->groupInfo, pInfo->groupVal, row)) {
      doMergeResultImpl(pInfo, pCtx, numOfExpr, row);
      continue;
    }

    // the group changes: close the current one
    doFinalizeResultImpl(pCtx, numOfExpr);
    int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);

    // TODO check for available buffer;

    // next group info data
    pInfo->binfo.pRes->info.rows += numOfRows;
    for (int32_t j = 0; j < numOfExpr; ++j) {
      if (pCtx[j].functionId >= 0) {
        pCtx[j].fpSet.process(&pCtx[j]);
      }
    }

    // ... and open the next one with this row
    doMergeResultImpl(pInfo, pCtx, numOfExpr, row);
    pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, row);
  }
}

2635 2636
/*
 * Drain the sort handle and merge all sorted tuples group by group.
 *
 * Tuples are collected into a scratch block of at most resultInfo.capacity rows, which
 * is then handed to doMergeImpl(); this repeats until the sort handle is empty. The last
 * open group is finalized at the end.
 *
 * Returns the operator's result block when it holds at least one row, otherwise NULL.
 * NULL is also returned, with pTaskInfo->code set to TSDB_CODE_OUT_OF_MEMORY, when the
 * scratch block cannot be created.
 */
static SSDataBlock* doMerge(SOperatorInfo* pOperator) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  SSortHandle*              pHandle = pInfo->pSortHandle;

  SSDataBlock* pDataBlock = createOneDataBlock(pInfo->binfo.pRes, false);
  if (pDataBlock == NULL) {
    pOperator->pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  blockDataEnsureCapacity(pDataBlock, pOperator->resultInfo.capacity);

  while (1) {
    blockDataCleanup(pDataBlock);
    while (1) {
      STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
      if (pTupleHandle == NULL) {
        break;
      }

      // build datablock for merge for one group
      appendOneRowToDataBlock(pDataBlock, pTupleHandle);
      if (pDataBlock->info.rows >= pOperator->resultInfo.capacity) {
        break;
      }
    }

    // the sort handle has no more tuples
    if (pDataBlock->info.rows == 0) {
      break;
    }

    setInputDataBlock(pOperator, pOperator->exprSupp.pCtx, pDataBlock, TSDB_ORDER_ASC, MAIN_SCAN, true);
    doMergeImpl(pOperator, pOperator->exprSupp.numOfExprs, pDataBlock);
    // flush to tuple store, and after all data have been handled, return to upstream node or sink node
  }

  // close the last group
  doFinalizeResultImpl(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs);
  int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);

  // TODO check for available buffer;

  // next group info data
  pInfo->binfo.pRes->info.rows += numOfRows;

  // the scratch block is owned by this function and is not needed any more
  blockDataDestroy(pDataBlock);

  return (pInfo->binfo.pRes->info.rows > 0) ? pInfo->binfo.pRes : NULL;
}
2678

L
Liu Jicong 已提交
2679 2680
/*
 * Fill pDataBlock with up to `capacity` sorted rows taken from the sort handle.
 *
 * The rows are first collected in a temporary block obtained from
 * tsortGetSortedDataBlock(), then the columns listed in pColMatchInfo are copied from
 * their source slot in that block to their target slot in pDataBlock. The temporary
 * block is destroyed before returning.
 *
 * pInfo is not used.
 *
 * Returns pDataBlock when it holds at least one row, otherwise NULL (also when no
 * temporary block could be obtained).
 */
SSDataBlock* getSortedMergeBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity,
                                     SArray* pColMatchInfo, SSortedMergeOperatorInfo* pInfo) {
  blockDataCleanup(pDataBlock);

  SSDataBlock* pSorted = tsortGetSortedDataBlock(pHandle);
  if (pSorted == NULL) {
    return NULL;
  }

  blockDataEnsureCapacity(pSorted, capacity);

  // collect tuples until the handle is drained or the block is full
  STupleHandle* pTuple = NULL;
  while ((pTuple = tsortNextTuple(pHandle)) != NULL) {
    appendOneRowToDataBlock(pSorted, pTuple);
    if (pSorted->info.rows >= capacity) {
      break;
    }
  }

  if (pSorted->info.rows > 0) {
    int32_t numOfCols = taosArrayGetSize(pColMatchInfo);

    int32_t c = 0;
    while (c < numOfCols) {
      SColMatchInfo* pMatch = taosArrayGet(pColMatchInfo, c);
      ASSERT(pMatch->matchType == COL_MATCH_FROM_SLOT_ID);

      SColumnInfoData* pFrom = taosArrayGet(pSorted->pDataBlock, pMatch->srcSlotId);
      SColumnInfoData* pTo = taosArrayGet(pDataBlock->pDataBlock, pMatch->targetSlotId);
      colDataAssign(pTo, pFrom, pSorted->info.rows, &pDataBlock->info);

      c += 1;
    }

    pDataBlock->info.rows = pSorted->info.rows;
    pDataBlock->info.capacity = pSorted->info.rows;
  }

  blockDataDestroy(pSorted);
  return (pDataBlock->info.rows > 0) ? pDataBlock : NULL;
}

2721
/*
 * Get-next function of the sorted-merge operator.
 *
 * On the first call a multi-source merge sort handle is created over all downstream
 * operators, opened, and the merged result is produced by doMerge(); the operator status
 * then becomes OP_RES_TO_RETURN. Subsequent calls return the remaining sorted data
 * through getSortedMergeBlockData().
 *
 * Returns NULL when the operator is done or no data is left. Failures while preparing
 * the sort handle are reported with longjmp() to pTaskInfo->env.
 */
static SSDataBlock* doSortedMerge(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExecTaskInfo*            pTaskInfo = pOperator->pTaskInfo;
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  if (pOperator->status == OP_RES_TO_RETURN) {
    return getSortedMergeBlockData(pInfo->pSortHandle, pInfo->binfo.pRes, pOperator->resultInfo.capacity, NULL, pInfo);
  }

  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
  // pass the real task id string, not the macro name as a literal
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->binfo.pRes, GET_TASKID(pTaskInfo));

  tsortSetFetchRawDataFp(pInfo->pSortHandle, loadNextDataBlock, NULL, NULL);

  // every downstream operator is one input of the merge sort
  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
    if (ps == NULL) {
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    ps->param = pOperator->pDownstream[i];
    tsortAddSource(pInfo->pSortHandle, ps);
  }

  int32_t code = tsortOpen(pInfo->pSortHandle);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, terrno);
  }

  pOperator->status = OP_RES_TO_RETURN;
  return doMerge(pOperator);
}
2752

L
Liu Jicong 已提交
2753 2754
/*
 * Prepare the group-by bookkeeping of the sorted-merge operator.
 *
 * For every column of pGroupInfo (SColumn entries) the expression whose result slot id
 * equals the column id is looked up in pExprInfo; its index is appended to
 * pInfo->groupInfo. pInfo->groupVal is then allocated as a single buffer made of one
 * pointer per group-by column followed by the value area, and each pointer is set to
 * the start of its column's value inside that area.
 *
 * Returns 0 (nothing to do) when pGroupInfo is NULL or empty, TSDB_CODE_SUCCESS on
 * success and TSDB_CODE_OUT_OF_MEMORY on allocation failure.
 */
static int32_t initGroupCol(SExprInfo* pExprInfo, int32_t numOfCols, SArray* pGroupInfo,
                            SSortedMergeOperatorInfo* pInfo) {
  if (pGroupInfo == NULL || taosArrayGetSize(pGroupInfo) == 0) {
    return 0;
  }

  int32_t len = 0;
  SArray* plist = taosArrayInit(3, sizeof(SColumn));
  pInfo->groupInfo = taosArrayInit(3, sizeof(int32_t));

  if (plist == NULL || pInfo->groupInfo == NULL) {
    // plist is local to this function and must not leak; pInfo->groupInfo stays with pInfo
    if (plist != NULL) {
      taosArrayDestroy(plist);
    }
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // iterate over the requested group-by columns (pInfo->groupInfo is still empty at this point)
  size_t numOfGroupCol = taosArrayGetSize(pGroupInfo);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    SColumn* pCol = taosArrayGet(pGroupInfo, i);
    for (int32_t j = 0; j < numOfCols; ++j) {
      SExprInfo* pe = &pExprInfo[j];
      if (pe->base.resSchema.slotId == pCol->colId) {
        taosArrayPush(plist, pCol);
        taosArrayPush(pInfo->groupInfo, &j);
        len += pCol->bytes;
        break;
      }
    }
  }

  ASSERT(taosArrayGetSize(pGroupInfo) == taosArrayGetSize(plist));

  pInfo->groupVal = taosMemoryCalloc(1, (POINTER_BYTES * numOfGroupCol + len));
  if (pInfo->groupVal == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // The value area starts right after the pointer table. The offset is computed in bytes,
  // hence the cast to char* before the addition.
  int32_t offset = 0;
  char*   start = (char*)pInfo->groupVal + POINTER_BYTES * numOfGroupCol;
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    pInfo->groupVal[i] = start + offset;
    SColumn* pCol = taosArrayGet(plist, i);
    offset += pCol->bytes;
  }

  taosArrayDestroy(plist);

  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2801

L
Liu Jicong 已提交
2802 2803 2804
/*
 * Create a sorted-merge operator on top of `numOfDownstream` downstream operators.
 *
 * pExprInfo/num describe the output expressions, pSortInfo the sort order and
 * pGroupInfo the optional group-by columns. pSortInfo is stored in the operator info
 * and released together with it.
 *
 * Returns the new operator, or NULL on failure with terrno set to
 * TSDB_CODE_QRY_OUT_OF_MEMORY.
 *
 * NOTE(review): pInfo->binfo.pRes is checked for NULL below but is not assigned in
 * this function - confirm that one of the helpers called before the check creates it.
 */
SOperatorInfo* createSortedMergeOperatorInfo(SOperatorInfo** downstream, int32_t numOfDownstream, SExprInfo* pExprInfo,
                                             int32_t num, SArray* pSortInfo, SArray* pGroupInfo,
                                             SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_SUCCESS;

  SSortedMergeOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SSortedMergeOperatorInfo));
  SOperatorInfo*            pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  code = initExprSupp(&pOperator->exprSupp, pExprInfo, num);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initResultRowInfo(&pInfo->binfo.resultRowInfo);

  if (pOperator->exprSupp.pCtx == NULL || pInfo->binfo.pRes == NULL) {
    goto _error;
  }

  size_t keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
  code = doInitAggInfoSup(&pInfo->aggSup, pOperator->exprSupp.pCtx, num, keyBufSize, pTaskInfo->id.str);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, num);
  code = initGroupCol(pExprInfo, num, pGroupInfo, pInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  pInfo->sortBufSize = 1024 * 16;  // 16KB
  pInfo->bufPageSize = 1024;
  pInfo->pSortInfo = pSortInfo;

  pOperator->resultInfo.capacity = blockDataGetCapacityInRow(pInfo->binfo.pRes, pInfo->bufPageSize);

  pOperator->name = "SortedMerge";
  // pOperator->operatorType = OP_SortedMerge;
  pOperator->blocking = true;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doSortedMerge, NULL, NULL, destroySortedMergeOperatorInfo,
                                         NULL, NULL, NULL);
  code = appendDownstream(pOperator, downstream, numOfDownstream);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  if (pInfo != NULL) {
    // destroySortedMergeOperatorInfo() also frees pInfo itself, so it must not be freed again here
    destroySortedMergeOperatorInfo(pInfo, num);
    pInfo = NULL;
  }

  taosMemoryFreeClear(pOperator);
  terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
  return NULL;
}

X
Xiaoyu Wang 已提交
2869
/*
 * Find the scan order and scan flag that apply to an operator tree.
 *
 * Starting at pOperator, the first downstream operator is followed until an operator
 * that determines the scan is reached:
 *   - exchange, system table scan, stream scan, tag scan, block distribution scan and
 *     last row scan report TSDB_ORDER_ASC / MAIN_SCAN;
 *   - a table scan reports the order of its scan condition and its current scan flag.
 *
 * Returns TSDB_CODE_SUCCESS with *order and *scanFlag set, or TSDB_CODE_INVALID_PARA
 * when the chain ends without reaching such an operator.
 */
int32_t getTableScanInfo(SOperatorInfo* pOperator, int32_t* order, int32_t* scanFlag) {
  // todo add more information about exchange operation
  SOperatorInfo* pCur = pOperator;

  for (;;) {
    int32_t type = pCur->operatorType;

    bool fixedOrder =
        (type == QUERY_NODE_PHYSICAL_PLAN_EXCHANGE || type == QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN ||
         type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN ||
         type == QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN);
    if (fixedOrder) {
      *order = TSDB_ORDER_ASC;
      *scanFlag = MAIN_SCAN;
      return TSDB_CODE_SUCCESS;
    }

    if (type == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
      STableScanInfo* pTableScanInfo = pCur->info;
      *order = pTableScanInfo->cond.order;
      *scanFlag = pTableScanInfo->scanFlag;
      return TSDB_CODE_SUCCESS;
    }

    // any other operator: the answer comes from its first downstream operator
    if (pCur->pDownstream == NULL || pCur->pDownstream[0] == NULL) {
      return TSDB_CODE_INVALID_PARA;
    }

    pCur = pCur->pDownstream[0];
  }
}
L
Liu Jicong 已提交
2891
#if 0
L
Liu Jicong 已提交
2892
// Locate the stream scan operator below pOperator and position its embedded table scan at (uid, ts).
// Every operator visited on the way down is marked OP_OPENED.
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_APP_ERROR when no stream scan is reachable through a
// single-downstream chain.
int32_t doPrepareScan(SOperatorInfo* pOperator, uint64_t uid, int64_t ts) {
  // keep the operator type at full width, as getTableScanInfo()/doGetScanStatus() do; narrowing it to
  // uint8_t could truncate the value before the comparison below
  int32_t type = pOperator->operatorType;

  pOperator->status = OP_OPENED;

  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamScanInfo* pScanInfo = pOperator->info;
    pScanInfo->blockType = STREAM_INPUT__TABLE_SCAN;

    pScanInfo->pTableScanOp->status = OP_OPENED;

    STableScanInfo* pInfo = pScanInfo->pTableScanOp->info;
    ASSERT(pInfo->scanMode == TABLE_SCAN__TABLE_ORDER);

    // uid 0 means there is no table to scan
    if (uid == 0) {
      pInfo->noTable = 1;
      return TSDB_CODE_SUCCESS;
    }

    /*if (pSnapShotScanInfo->dataReader == NULL) {*/
    /*pSnapShotScanInfo->dataReader = tsdbReaderOpen(pHandle->vnode, &pSTInfo->cond, tableList, 0, 0);*/
    /*pSnapShotScanInfo->scanMode = TABLE_SCAN__TABLE_ORDER;*/
    /*}*/

    pInfo->noTable = 0;

    // only re-seek the reader when the requested position differs from the last reported one
    if (pInfo->lastStatus.uid != uid || pInfo->lastStatus.ts != ts) {
      SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

      int32_t tableSz = taosArrayGetSize(pTaskInfo->tableqinfoList.pTableList);
      bool    found = false;
      for (int32_t i = 0; i < tableSz; i++) {
        STableKeyInfo* pTableInfo = taosArrayGet(pTaskInfo->tableqinfoList.pTableList, i);
        if (pTableInfo->uid == uid) {
          found = true;
          pInfo->currentTable = i;
        }
      }
      // TODO after processing drop, found can be false
      ASSERT(found);

      tsdbSetTableId(pInfo->dataReader, uid);

      // reset the reader with a window starting right after ts, then restore the original start key
      int64_t oldSkey = pInfo->cond.twindows.skey;
      pInfo->cond.twindows.skey = ts + 1;
      tsdbReaderReset(pInfo->dataReader, &pInfo->cond);
      pInfo->cond.twindows.skey = oldSkey;
      pInfo->scanTimes = 0;

      qDebug("tsdb reader offset seek to uid %" PRId64 " ts %" PRId64 ", table cur set to %d , all table num %d", uid, ts,
             pInfo->currentTable, tableSz);
    }

    return TSDB_CODE_SUCCESS;

  } else {
    if (pOperator->numOfDownstream == 1) {
      return doPrepareScan(pOperator->pDownstream[0], uid, ts);
    } else if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator to set the input data block");
      return TSDB_CODE_QRY_APP_ERROR;
    } else {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }
  }
}

2959 2960 2961
// Report the last (uid, ts) position recorded by the table scan embedded in the stream scan operator
// found below pOperator.
// Returns TSDB_CODE_SUCCESS when a stream scan was found, TSDB_CODE_INVALID_PARA when the chain ends
// without one; *uid and *ts are only written on success.
int32_t doGetScanStatus(SOperatorInfo* pOperator, uint64_t* uid, int64_t* ts) {
  int32_t type = pOperator->operatorType;
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamScanInfo* pScanInfo = pOperator->info;
    STableScanInfo*  pSnapShotScanInfo = pScanInfo->pTableScanOp->info;
    *uid = pSnapShotScanInfo->lastStatus.uid;
    *ts = pSnapShotScanInfo->lastStatus.ts;
    return TSDB_CODE_SUCCESS;
  }

  // leaf operators have no downstream array at all, so check the array before its first slot
  if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  // propagate a failure from further down instead of reporting success with untouched outputs
  return doGetScanStatus(pOperator->pDownstream[0], uid, ts);
}
L
Liu Jicong 已提交
2976
#endif
2977

2978
// this is a blocking operator
L
Liu Jicong 已提交
2979
// Open step of the aggregate operator: drains the downstream operator completely and feeds every
// block into the aggregate functions. Errors abort the task through longjmp(pTaskInfo->env, code).
static int32_t doOpenAggregateOptr(SOperatorInfo* pOperator) {
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
  }

  SAggOperatorInfo* pAggInfo = pOperator->info;
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
  SExprSupp*        pAggExprSup = &pOperator->exprSupp;
  SExprSupp*        pScalarSup = &pAggInfo->scalarExprSup;
  SOperatorInfo*    pChild = pOperator->pDownstream[0];

  int64_t startUs = taosGetTimestampUs();
  int32_t scanOrder = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;

  SSDataBlock* pBlock = NULL;
  while ((pBlock = pChild->fpSet.getNextFn(pChild)) != NULL) {
    int32_t code = getTableScanInfo(pOperator, &scanOrder, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    // scalar expressions, when present, are evaluated in place on the block before the aggregation
    if (pScalarSup->pExprInfo != NULL) {
      code = projectApplyFunctions(pScalarSup->pExprInfo, pBlock, pBlock, pScalarSup->pCtx, pScalarSup->numOfExprs,
                                   NULL);
      if (code != TSDB_CODE_SUCCESS) {
        longjmp(pTaskInfo->env, code);
      }
    }

    // bind the result row of the block's group, attach the block as input, then aggregate
    setExecutionContext(pOperator, pAggExprSup->numOfExprs, pBlock->info.groupId, pAggInfo);
    setInputDataBlock(pOperator, pAggExprSup->pCtx, pBlock, scanOrder, scanFlag, true);

    code = doAggregateImpl(pOperator, pAggExprSup->pCtx);
    if (code != 0) {
      longjmp(pTaskInfo->env, code);
    }
  }

  // all input consumed: close the result rows and prepare the grouped results for retrieval
  closeAllResultRows(&pAggInfo->binfo.resultRowInfo);
  initGroupedResultInfo(&pAggInfo->groupResInfo, pAggInfo->aggSup.pResultRowHashTable, 0);
  OPTR_SET_OPENED(pOperator);

  pOperator->cost.openCost = (taosGetTimestampUs() - startUs) / 1000.0;
  return TSDB_CODE_SUCCESS;
}

3032
// Return the next non-empty block of aggregate results, or NULL once the operator is exhausted or
// its open step failed (the failure code is left in pTaskInfo->code).
static SSDataBlock* getAggregateResult(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SAggOperatorInfo* pAggInfo = pOperator->info;
  SOptrBasicInfo*   pBasic = &pAggInfo->binfo;
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;

  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
    doSetOperatorCompleted(pOperator);
    return NULL;
  }

  blockDataEnsureCapacity(pBasic->pRes, pOperator->resultInfo.capacity);

  // keep building result blocks until one survives the filter or the grouped results run out
  do {
    doBuildResultDatablock(pOperator, pBasic, &pAggInfo->groupResInfo, pAggInfo->aggSup.pResultBuf);
    doFilter(pAggInfo->pCondition, pBasic->pRes);

    if (!hasDataInGroupInfo(&pAggInfo->groupResInfo)) {
      doSetOperatorCompleted(pOperator);
      break;
    }
  } while (pBasic->pRes->info.rows <= 0);

  size_t numOfRows = blockDataGetNumOfRows(pBasic->pRes);
  pOperator->resultInfo.totalRows += numOfRows;

  if (numOfRows == 0) {
    return NULL;
  }
  return pBasic->pRes;
}

wmmhello's avatar
wmmhello 已提交
3067
// Serialize every result row referenced by the aggregate hash table into one heap buffer.
//
// Layout: [int32 total length][int32 row count] then, per row,
//         [int32 key length][key bytes][int32 value length][value bytes].
//
// On success *result owns the buffer (the caller frees it) and *length is its used size; when the
// result buffer is empty, *result is NULL and *length is 0. On allocation failure *result is NULL
// and TSDB_CODE_OUT_OF_MEMORY is returned.
int32_t aggEncodeResultRow(SOperatorInfo* pOperator, char** result, int32_t* length) {
  if (result == NULL || length == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
  int32_t         size = taosHashGetSize(pSup->pResultRowHashTable);
  size_t          keyLen = sizeof(uint64_t) * 2;  // estimate the key length
  int32_t         totalSize =
      sizeof(int32_t) + sizeof(int32_t) + size * (sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize);

  // no result
  if (getTotalBufSize(pSup->pResultBuf) == 0) {
    *result = NULL;
    *length = 0;
    return TSDB_CODE_SUCCESS;
  }

  *result = (char*)taosMemoryCalloc(1, totalSize);
  if (*result == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // the first int32 (total length) is filled in at the end; the row count follows it.
  // Fields are stored with memcpy because key lengths are arbitrary, so later offsets need not be
  // aligned for int32_t.
  int32_t offset = sizeof(int32_t);
  memcpy(*result + offset, &size, sizeof(int32_t));
  offset += sizeof(int32_t);

  // prepare memory: mark the page of the current result row dirty
  SResultRowPosition* pos = &pInfo->resultRowInfo.cur;
  void*               pPage = getBufPage(pSup->pResultBuf, pos->pageId);
  setBufPageDirty(pPage, true);
  releaseBufPage(pSup->pResultBuf, pPage);

  void* pIter = taosHashIterate(pSup->pResultRowHashTable, NULL);
  while (pIter) {
    void*               key = taosHashGetKey(pIter, &keyLen);
    SResultRowPosition* p1 = (SResultRowPosition*)pIter;

    pPage = (SFilePage*)getBufPage(pSup->pResultBuf, p1->pageId);
    SResultRow* pRow = (SResultRow*)((char*)pPage + p1->offset);
    setBufPageDirty(pPage, true);
    releaseBufPage(pSup->pResultBuf, pPage);

    // recalculate the result size: the real key may be longer than the estimate
    int32_t realTotalSize = offset + sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize;
    if (realTotalSize > totalSize) {
      char* tmp = (char*)taosMemoryRealloc(*result, realTotalSize);
      if (tmp == NULL) {
        taosMemoryFree(*result);
        *result = NULL;
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      *result = tmp;
      totalSize = realTotalSize;  // remember the new capacity so later rows compare against it
    }

    // save key
    int32_t keyLen32 = (int32_t)keyLen;
    memcpy(*result + offset, &keyLen32, sizeof(int32_t));
    offset += sizeof(int32_t);
    memcpy(*result + offset, key, keyLen);
    offset += keyLen;

    // save value
    int32_t valueLen = pSup->resultRowSize;
    memcpy(*result + offset, &valueLen, sizeof(int32_t));
    offset += sizeof(int32_t);
    memcpy(*result + offset, pRow, pSup->resultRowSize);
    offset += pSup->resultRowSize;

    pIter = taosHashIterate(pSup->pResultRowHashTable, pIter);
  }

  // total length header
  memcpy(*result, &offset, sizeof(int32_t));
  *length = offset;

  return TSDB_CODE_SUCCESS;
}

3144
// Rebuild the aggregate result rows from a buffer laid out as
//   [int32 total length][int32 row count] then, per row,
//   [int32 key length][key bytes][int32 value length][value bytes].
// The first 8 bytes of each key are read as the group id of the row.
//
// Every field is checked against the total length stored in the buffer header before it is read;
// the header itself is trusted, since the real allocation size is not passed in.
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_TSC_INVALID_INPUT when the buffer is NULL or inconsistent,
// or when a new result row cannot be obtained.
int32_t aggDecodeResultRow(SOperatorInfo* pOperator, char* result) {
  if (result == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));

  const int32_t intLen = (int32_t)sizeof(int32_t);

  // fields are loaded with memcpy: after a key of arbitrary length they need not be aligned
  int32_t length = 0;
  memcpy(&length, result, sizeof(int32_t));
  int32_t offset = intLen;
  if (length < 2 * intLen) {  // the header alone takes two int32 fields
    return TSDB_CODE_TSC_INVALID_INPUT;
  }

  int32_t count = 0;
  memcpy(&count, result + offset, sizeof(int32_t));
  offset += intLen;

  while (count-- > 0 && length > offset) {
    if (length - offset < intLen) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    int32_t keyLen = 0;
    memcpy(&keyLen, result + offset, sizeof(int32_t));
    offset += intLen;

    // the key, the value-length field behind it and the 8-byte group id read must all be in range
    if (keyLen < 0 || keyLen > length - offset - intLen || length - offset < (int32_t)sizeof(uint64_t)) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    uint64_t tableGroupId = 0;
    memcpy(&tableGroupId, result + offset, sizeof(uint64_t));
    SResultRow* resultRow = getNewResultRow(pSup->pResultBuf, tableGroupId, pSup->resultRowSize);
    if (!resultRow) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = resultRow->pageId, .offset = resultRow->offset};
    taosHashPut(pSup->pResultRowHashTable, result + offset, keyLen, &pos, sizeof(SResultRowPosition));

    offset += keyLen;
    int32_t valueLen = 0;
    memcpy(&valueLen, result + offset, sizeof(int32_t));
    if (valueLen != pSup->resultRowSize) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    offset += intLen;
    if (valueLen > length - offset) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // the copy overwrites the whole row, so keep the location assigned to the freshly created row
    int32_t pageId = resultRow->pageId;
    int32_t pOffset = resultRow->offset;
    memcpy(resultRow, result + offset, valueLen);
    resultRow->pageId = pageId;
    resultRow->offset = pOffset;
    offset += valueLen;

    initResultRow(resultRow);
    pInfo->resultRowInfo.cur = (SResultRowPosition){.pageId = resultRow->pageId, .offset = resultRow->offset};
  }

  // trailing or missing bytes mean the buffer does not match its own header
  if (offset != length) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  return TSDB_CODE_SUCCESS;
}

3195 3196 3197 3198 3199
// Apply the group offset/limit (slimit) and the per-group row offset/limit (limit) to pBlock.
//
// Rows that must not be returned are removed from pBlock in place. Returns
// PROJECT_RETRIEVE_CONTINUE when the caller should fetch more input before returning data, and
// PROJECT_RETRIEVE_DONE when pBlock should be handed to the caller now. pOperator->status is set to
// OP_EXEC_DONE once the group limit has been reached.
int32_t handleLimitOffset(SOperatorInfo* pOperator, SLimitInfo* pLimitInfo, SSDataBlock* pBlock, bool holdDataInBuf) {
  if (pLimitInfo->remainGroupOffset > 0) {
    // Still skipping groups. The first group, and every further block of the group that is being
    // skipped, is dropped without consuming another unit of the group offset.
    if (pLimitInfo->currentGroupId == 0 || pLimitInfo->currentGroupId == pBlock->info.groupId) {
      pLimitInfo->currentGroupId = pBlock->info.groupId;
      blockDataCleanup(pBlock);
      return PROJECT_RETRIEVE_CONTINUE;
    }

    // now it is the data from a new group: count it once, and remember it so that its following
    // blocks are not counted again
    pLimitInfo->remainGroupOffset -= 1;
    pLimitInfo->currentGroupId = pBlock->info.groupId;

    // ignore data block in current group
    if (pLimitInfo->remainGroupOffset > 0) {
      blockDataCleanup(pBlock);
      return PROJECT_RETRIEVE_CONTINUE;
    }
  }

  if (pLimitInfo->currentGroupId != 0 && pLimitInfo->currentGroupId != pBlock->info.groupId) {
    pLimitInfo->numOfOutputGroups += 1;
    if ((pLimitInfo->slimit.limit > 0) && (pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups)) {
      pOperator->status = OP_EXEC_DONE;
      blockDataCleanup(pBlock);

      return PROJECT_RETRIEVE_DONE;
    }

    // reset the value for a new group data
    pLimitInfo->numOfOutputRows = 0;
    pLimitInfo->remainOffset = pLimitInfo->limit.offset;
  }

  // here we reach the start position, according to the limit/offset requirements.

  // set current group id
  pLimitInfo->currentGroupId = pBlock->info.groupId;

  if (pLimitInfo->remainOffset >= pBlock->info.rows) {
    // the whole block is still inside the row offset
    pLimitInfo->remainOffset -= pBlock->info.rows;
    blockDataCleanup(pBlock);
    return PROJECT_RETRIEVE_CONTINUE;
  } else if (pLimitInfo->remainOffset > 0) {
    // the offset ends inside this block: drop the leading rows only
    blockDataTrimFirstNRows(pBlock, pLimitInfo->remainOffset);
    pLimitInfo->remainOffset = 0;
  }

  // check for the limitation in each group
  if (pLimitInfo->limit.limit >= 0 && pLimitInfo->numOfOutputRows + pBlock->info.rows >= pLimitInfo->limit.limit) {
    int32_t keepRows = (int32_t)(pLimitInfo->limit.limit - pLimitInfo->numOfOutputRows);
    blockDataKeepFirstNRows(pBlock, keepRows);
    if (pLimitInfo->slimit.limit > 0 && pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups) {
      pOperator->status = OP_EXEC_DONE;
    }

    return PROJECT_RETRIEVE_DONE;
  }

  // todo optimize performance
  // If slimit/soffset values exist, results of several rounds can not be packed into one block, since
  // they may not belong to the same group and the limit/offset value is not valid in this case.
  if ((!holdDataInBuf) || (pBlock->info.rows >= pOperator->resultInfo.threshold) || pLimitInfo->slimit.offset != -1 ||
      pLimitInfo->slimit.limit != -1) {
    return PROJECT_RETRIEVE_DONE;
  } else {  // not full enough, continue to accumulate the output data in the buffer.
    return PROJECT_RETRIEVE_CONTINUE;
  }
}

3266
// Pull blocks from the downstream operator, evaluate the projection expressions into the operator's
// result block, apply limit/offset and the filter, and return the result block once it holds rows.
// Returns NULL when nothing is left to return. STREAM_RETRIEVE blocks are passed through untouched.
static SSDataBlock* doProjectOperation(SOperatorInfo* pOperator) {
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
  SOptrBasicInfo*       pBasic = &pProjectInfo->binfo;
  SExecTaskInfo*        pTaskInfo = pOperator->pTaskInfo;
  SExprSupp*            pExprSup = &pOperator->exprSupp;
  SSDataBlock*          pResBlock = pBasic->pRes;

  blockDataCleanup(pResBlock);

  if (pOperator->status == OP_EXEC_DONE) {
    // in queue mode the operator is re-armed for the next round of input
    if (pTaskInfo->execModel == OPTR_EXEC_MODEL_QUEUE) {
      pOperator->status = OP_OPENED;
    }
    return NULL;
  }

#if 0
  if (pProjectInfo->existDataBlock) {  // TODO refactor
    SSDataBlock* pBlock = pProjectInfo->existDataBlock;
    pProjectInfo->existDataBlock = NULL;

    // the pDataBlock are always the same one, no need to call this again
    setInputDataBlock(pOperator, pInfo->pCtx, pBlock, TSDB_ORDER_ASC);

    blockDataEnsureCapacity(pInfo->pRes, pBlock->info.rows);
    projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
    if (pRes->info.rows >= pProjectInfo->binfo.capacity * 0.8) {
      copyTsColoum(pRes, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      resetResultRowEntryResult(pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      return pRes;
    }
  }
#endif

  int32_t scanOrder = 0;
  int32_t scanFlag = 0;

  // the elapsed time is recorded only while no open cost has been stored yet
  int64_t startUs = 0;
  if (pOperator->cost.openCost == 0) {
    startUs = taosGetTimestampUs();
  }

  SOperatorInfo* pChild = pOperator->pDownstream[0];

  for (;;) {
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
    qDebug("projection call next");
    SSDataBlock* pBlock = pChild->fpSet.getNextFn(pChild);
    if (pBlock == NULL) {
      qDebug("projection get null");
      // the operator is completed here regardless of the exec model
      doSetOperatorCompleted(pOperator);
      break;
    }

    // for stream interval
    if (pBlock->info.type == STREAM_RETRIEVE) {
      return pBlock;
    }

    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &scanOrder, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    setInputDataBlock(pOperator, pExprSup->pCtx, pBlock, scanOrder, scanFlag, false);
    blockDataEnsureCapacity(pBasic->pRes, pBasic->pRes->info.rows + pBlock->info.rows);

    code = projectApplyFunctions(pExprSup->pExprInfo, pBasic->pRes, pBlock, pExprSup->pCtx, pExprSup->numOfExprs,
                                 pProjectInfo->pPseudoColInfo);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    int32_t status = handleLimitOffset(pOperator, &pProjectInfo->limitInfo, pBasic->pRes, true);

    // filter shall be applied after apply functions and limit/offset on the result
    doFilter(pProjectInfo->pFilterNode, pBasic->pRes);

    if (status == PROJECT_RETRIEVE_DONE) {
      break;
    }
  }

  size_t numOfRows = pBasic->pRes->info.rows;
  pProjectInfo->limitInfo.numOfOutputRows += numOfRows;
  pOperator->resultInfo.totalRows += numOfRows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - startUs) / 1000.0;
  }

  if (numOfRows > 0) {
    return pBasic->pRes;
  }
  return NULL;
}

H
Haojun Liao 已提交
3369
static void doHandleRemainBlockForNewGroupImpl(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo,
L
Liu Jicong 已提交
3370
                                               SExecTaskInfo* pTaskInfo) {
3371
  pInfo->totalInputRows = pInfo->existNewGroupBlock->info.rows;
H
Haojun Liao 已提交
3372

L
Liu Jicong 已提交
3373 3374
  int64_t ekey =
      Q_STATUS_EQUAL(pTaskInfo->status, TASK_COMPLETED) ? pInfo->win.ekey : pInfo->existNewGroupBlock->info.window.ekey;
3375 3376
  taosResetFillInfo(pInfo->pFillInfo, getFillInfoStart(pInfo->pFillInfo));

3377
  taosFillSetStartInfo(pInfo->pFillInfo, pInfo->existNewGroupBlock->info.rows, ekey);
3378 3379
  taosFillSetInputDataBlock(pInfo->pFillInfo, pInfo->existNewGroupBlock);

H
Haojun Liao 已提交
3380 3381 3382
  int32_t numOfResultRows = pResultInfo->capacity - pInfo->pRes->info.rows;
  taosFillResultDataBlock(pInfo->pFillInfo, pInfo->pRes, numOfResultRows);

3383
  pInfo->curGroupId = pInfo->existNewGroupBlock->info.groupId;
3384 3385 3386
  pInfo->existNewGroupBlock = NULL;
}

H
Haojun Liao 已提交
3387
static void doHandleRemainBlockFromNewGroup(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo,
L
Liu Jicong 已提交
3388
                                            SExecTaskInfo* pTaskInfo) {
3389
  if (taosFillHasMoreResults(pInfo->pFillInfo)) {
H
Haojun Liao 已提交
3390 3391 3392
    int32_t numOfResultRows = pResultInfo->capacity - pInfo->pRes->info.rows;
    taosFillResultDataBlock(pInfo->pFillInfo, pInfo->pRes, numOfResultRows);
    if (pInfo->pRes->info.rows > pResultInfo->threshold) {
3393 3394 3395 3396 3397 3398
      return;
    }
  }

  // handle the cached new group data block
  if (pInfo->existNewGroupBlock) {
H
Haojun Liao 已提交
3399
    doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, pTaskInfo);
3400 3401 3402
  }
}

S
slzhou 已提交
3403
// Produce the next block of filled rows, or NULL when there is nothing more to emit.
// Input blocks are consumed group by group: the first block of a new group is cached in
// pInfo->existNewGroupBlock until the fill of the previous group has been closed.
static SSDataBlock* doFillImpl(SOperatorInfo* pOperator) {
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;
  SResultInfo*       pResultInfo = &pOperator->resultInfo;
  SSDataBlock*       pResBlock = pInfo->pRes;

  blockDataCleanup(pResBlock);

  // results left over from the previous call are returned before new input is read
  doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, pTaskInfo);
  if (pResBlock->info.rows > pResultInfo->threshold || pResBlock->info.rows > 0) {
    return pResBlock;
  }

  SOperatorInfo* pChild = pOperator->pDownstream[0];
  for (;;) {
    SSDataBlock* pBlock = pChild->fpSet.getNextFn(pChild);

    if (pBlock == NULL) {
      // no input at all: nothing to fill
      if (pInfo->totalInputRows == 0) {
        pOperator->status = OP_EXEC_DONE;
        return NULL;
      }

      // input exhausted: close the fill at the end of the query window
      taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
    } else {
      blockDataUpdateTsWindow(pBlock, pInfo->primaryTsCol);

      bool sameGroup = (pInfo->curGroupId == 0 || pInfo->curGroupId == pBlock->info.groupId);
      if (sameGroup) {
        pInfo->curGroupId = pBlock->info.groupId;  // the first data block

        pInfo->totalInputRows += pBlock->info.rows;

        taosFillSetStartInfo(pInfo->pFillInfo, pBlock->info.rows, pBlock->info.window.ekey);
        taosFillSetInputDataBlock(pInfo->pFillInfo, pBlock);
      } else {  // the new group data block
        pInfo->existNewGroupBlock = pBlock;

        // Fill the previous group data block, before handle the data block of new group.
        // Close the fill operation for previous group data block
        taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
      }
    }

    blockDataEnsureCapacity(pResBlock, pOperator->resultInfo.capacity);

    int32_t freeRows = pOperator->resultInfo.capacity - pResBlock->info.rows;
    taosFillResultDataBlock(pInfo->pFillInfo, pResBlock, freeRows);

    if (pResBlock->info.rows > 0) {
      // 1. The result in current group not reach the threshold of output result, continue
      // 2. If multiple group results existing in one SSDataBlock is not allowed, return immediately
      if (pResBlock->info.rows > pResultInfo->threshold || pBlock == NULL || pInfo->existNewGroupBlock != NULL) {
        return pResBlock;
      }

      doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, pTaskInfo);
      if (pResBlock->info.rows >= pOperator->resultInfo.threshold || pBlock == NULL) {
        return pResBlock;
      }
      continue;
    }

    // current group has no more result to return
    if (!pInfo->existNewGroupBlock) {
      return NULL;
    }

    // try next group
    assert(pBlock != NULL);
    doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, pTaskInfo);
    if (pResBlock->info.rows > pResultInfo->threshold) {
      return pResBlock;
    }
  }
}

S
slzhou 已提交
3475 3476 3477 3478 3479 3480 3481 3482
// Return the next filled block that still has rows after the operator condition was applied, or
// NULL (and mark the operator completed) when doFillImpl() has nothing more to produce.
static SSDataBlock* doFill(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SFillOperatorInfo* pInfo = pOperator->info;

  for (;;) {
    SSDataBlock* pFilled = doFillImpl(pOperator);
    if (pFilled == NULL) {
      doSetOperatorCompleted(pOperator);
      return NULL;
    }

    doFilter(pInfo->pCondition, pFilled);

    // blocks emptied by the filter are skipped
    if (pFilled->info.rows > 0) {
      size_t numOfRows = pFilled->info.rows;
      pOperator->resultInfo.totalRows += numOfRows;
      return pFilled;
    }
  }
}

H
Haojun Liao 已提交
3508 3509 3510
// Release what each of the numOfExprs expressions owns: the column descriptors of column-typed
// parameters, the parameter array and the expression node. The pExpr array itself is not freed here.
static void destroyExprInfo(SExprInfo* pExpr, int32_t numOfExprs) {
  for (int32_t exprIdx = 0; exprIdx < numOfExprs; ++exprIdx) {
    SExprInfo* pOne = pExpr + exprIdx;

    for (int32_t paramIdx = 0; paramIdx < pOne->base.numOfParams; ++paramIdx) {
      // only column parameters have a column descriptor released here
      if (pOne->base.pParam[paramIdx].type != FUNC_PARAM_TYPE_COLUMN) {
        continue;
      }
      taosMemoryFreeClear(pOne->base.pParam[paramIdx].pCol);
    }

    taosMemoryFree(pOne->base.pParam);
    taosMemoryFree(pOne->pExpr);
  }
}

3522 3523 3524 3525 3526
// Destroy an operator together with its whole downstream tree. NULL is accepted and ignored.
static void destroyOperatorInfo(SOperatorInfo* pOperator) {
  if (pOperator == NULL) {
    return;
  }

  // operator specific state is released through the close callback, when one is installed
  if (pOperator->fpSet.closeFn != NULL) {
    pOperator->fpSet.closeFn(pOperator->info, pOperator->exprSupp.numOfExprs);
  }

  if (pOperator->pDownstream != NULL) {
    int32_t numOfChildren = pOperator->numOfDownstream;
    for (int32_t child = 0; child < numOfChildren; ++child) {
      destroyOperatorInfo(pOperator->pDownstream[child]);
    }

    taosMemoryFreeClear(pOperator->pDownstream);
    pOperator->numOfDownstream = 0;
  }

  cleanupExprSupp(&pOperator->exprSupp);
  taosMemoryFreeClear(pOperator);
}

3544 3545 3546 3547 3548 3549 3550 3551 3552 3553 3554 3555 3556 3557 3558
// Choose the page size and total size of the paged result buffer for rows of rowSize bytes.
//
// The page size is the smallest power of two >= 4096 that holds four rows; the buffer size is 1 MiB,
// enlarged when necessary so that at least four pages fit.
//
// Non-positive row sizes yield the minimum sizes. Returns 0 on success. Returns -1 when four rows
// do not fit into the largest supported page (2^29 bytes, so that four pages still fit into
// uint32_t); the outputs are then set to that largest page and its four-page buffer.
int32_t getBufferPgSize(int32_t rowSize, uint32_t* defaultPgsz, uint32_t* defaultBufsz) {
  const uint32_t minPageSize = 4096;
  const uint32_t maxPageSize = 1u << 29;
  const uint32_t minBufSize = 4096 * 256;

  int32_t code = 0;

  // widen before multiplying: rowSize * 4 may overflow int32_t, and a negative value must not be
  // converted to a huge unsigned bound
  uint64_t required = (rowSize > 0) ? ((uint64_t)rowSize * 4) : 0;
  if (required > maxPageSize) {
    required = maxPageSize;
    code = -1;
  }

  uint32_t pgsz = minPageSize;
  while (pgsz < required) {
    pgsz <<= 1u;
  }

  // at least four pages need to be in buffer
  uint32_t bufsz = minBufSize;
  if (bufsz < pgsz * 4) {
    bufsz = pgsz * 4;
  }

  *defaultPgsz = pgsz;
  *defaultBufsz = bufsz;
  return code;
}

dengyihao's avatar
dengyihao 已提交
3559 3560
// Set up the aggregate supporter: result row size, key buffer, result-row hash table and the paged
// result buffer. Returns TSDB_CODE_OUT_OF_MEMORY when the key buffer or hash table cannot be
// created, otherwise the code reported by createDiskbasedBuf().
int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                         const char* pKey) {
  pAggSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);

  // NOTE(review): the extra POINTER_BYTES + sizeof(int64_t) presumably leaves room for a key prefix; confirm
  pAggSup->keyBuf = taosMemoryCalloc(1, keyBufSize + POINTER_BYTES + sizeof(int64_t));
  pAggSup->pResultRowHashTable =
      taosHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), true, HASH_NO_LOCK);

  if (pAggSup->keyBuf == NULL || pAggSup->pResultRowHashTable == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // page and buffer sizes depend on the size of one result row
  uint32_t pageSize = 0;
  uint32_t bufSize = 0;
  getBufferPgSize(pAggSup->resultRowSize, &pageSize, &bufSize);

  return createDiskbasedBuf(&pAggSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
}

3583
// Release everything owned by the aggregate supporter: key buffer, result-row hash table and paged
// result buffer. The structure itself is not freed.
void cleanupAggSup(SAggSupporter* pAggSup) {
  taosMemoryFreeClear(pAggSup->keyBuf);

  // reset the handles like keyBuf above, so no stale pointer to released state is left behind
  taosHashCleanup(pAggSup->pResultRowHashTable);
  pAggSup->pResultRowHashTable = NULL;

  destroyDiskbasedBuf(pAggSup->pResultBuf);
  pAggSup->pResultBuf = NULL;
}

L
Liu Jicong 已提交
3589 3590
// Initialize the expression support and the aggregate supporter of an operator, then point every
// function context at the shared paged result buffer.
// Returns TSDB_CODE_SUCCESS, or the first error reported by initExprSupp()/doInitAggInfoSup().
int32_t initAggInfo(SExprSupp* pSup, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols, size_t keyBufSize,
                    const char* pkey) {
  int32_t code = initExprSupp(pSup, pExprInfo, numOfCols);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  // a failure here must not be reported as success with a half-initialized supporter
  code = doInitAggInfoSup(pAggSup, pSup->pCtx, numOfCols, keyBufSize, pkey);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    pSup->pCtx[i].pBuf = pAggSup->pResultBuf;
  }

  return TSDB_CODE_SUCCESS;
}

3604
// Set the capacity of the operator's result block to numOfRows and the threshold to 75% of it;
// when that comes out as zero, the threshold falls back to numOfRows. numOfRows must not be zero.
void initResultSizeInfo(SOperatorInfo* pOperator, int32_t numOfRows) {
  ASSERT(numOfRows != 0);

  SResultInfo* pResInfo = &pOperator->resultInfo;

  pResInfo->capacity = numOfRows;
  pResInfo->threshold = numOfRows * 0.75;
  if (pResInfo->threshold == 0) {
    pResInfo->threshold = numOfRows;
  }
}

3614 3615 3616 3617 3618
// Attach pBlock as the result block of pInfo and initialize its result row info.
void initBasicInfo(SOptrBasicInfo* pInfo, SSDataBlock* pBlock) {
  pInfo->pRes = pBlock;
  initResultRowInfo(&pInfo->resultRowInfo);
}

3619 3620 3621 3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634 3635 3636 3637
// Destroy an array of numOfOutput function contexts: the parameter variants, the subsidiary context list and the
// input buffers of every entry, then the array itself. Always returns NULL so the caller can reset its pointer.
static void* destroySqlFunctionCtx(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  if (pCtx != NULL) {
    for (int32_t i = 0; i < numOfOutput; ++i) {
      SqlFunctionCtx* pOne = &pCtx[i];

      for (int32_t j = 0; j < pOne->numOfParams; ++j) {
        taosVariantDestroy(&pOne->param[j].param);
      }

      taosMemoryFreeClear(pOne->subsidiaries.pCtx);
      taosMemoryFree(pOne->input.pData);
      taosMemoryFree(pOne->input.pColumnDataAgg);
    }

    taosMemoryFreeClear(pCtx);
  }

  return NULL;
}

3638
// Record the expression array in pSup and, when expressions are present, build the matching function contexts.
// Returns TSDB_CODE_OUT_OF_MEMORY if the contexts cannot be created, TSDB_CODE_SUCCESS otherwise.
int32_t initExprSupp(SExprSupp* pSup, SExprInfo* pExprInfo, int32_t numOfExpr) {
  pSup->pExprInfo = pExprInfo;
  pSup->numOfExprs = numOfExpr;

  // nothing to build when no expression is supplied
  if (pExprInfo == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  pSup->pCtx = createSqlFunctionCtx(pExprInfo, numOfExpr, &pSup->rowEntryInfoOffset);
  return (pSup->pCtx == NULL) ? TSDB_CODE_OUT_OF_MEMORY : TSDB_CODE_SUCCESS;
}

3651 3652 3653 3654 3655 3656 3657 3658 3659 3660
// Release everything owned by an expression support: the function contexts, the expression array and the
// row-entry offset table. The SExprSupp structure itself is not freed.
// All released pointers are reset to NULL so that a second cleanup of the same structure is harmless.
void cleanupExprSupp(SExprSupp* pSupp) {
  // destroySqlFunctionCtx() always returns NULL; store it instead of keeping a dangling pCtx
  pSupp->pCtx = destroySqlFunctionCtx(pSupp->pCtx, pSupp->numOfExprs);

  if (pSupp->pExprInfo != NULL) {
    destroyExprInfo(pSupp->pExprInfo, pSupp->numOfExprs);
  }

  taosMemoryFreeClear(pSupp->pExprInfo);
  taosMemoryFreeClear(pSupp->rowEntryInfoOffset);
}

L
Liu Jicong 已提交
3661
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
S
slzhou 已提交
3662
                                           SSDataBlock* pResultBlock, SNode* pCondition, SExprInfo* pScalarExprInfo,
wmmhello's avatar
wmmhello 已提交
3663
                                           int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3664
  SAggOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SAggOperatorInfo));
L
Liu Jicong 已提交
3665
  SOperatorInfo*    pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3666 3667 3668
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
H
Haojun Liao 已提交
3669

3670
  int32_t numOfRows = 1024;
dengyihao's avatar
dengyihao 已提交
3671
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3672 3673

  initResultSizeInfo(pOperator, numOfRows);
3674
  int32_t code = initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
L
Liu Jicong 已提交
3675
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3676 3677
    goto _error;
  }
H
Haojun Liao 已提交
3678

3679
  initBasicInfo(&pInfo->binfo, pResultBlock);
3680 3681 3682 3683
  code = initExprSupp(&pInfo->scalarExprSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3684

L
Liu Jicong 已提交
3685
  pInfo->groupId = INT32_MIN;
S
slzhou 已提交
3686
  pInfo->pCondition = pCondition;
dengyihao's avatar
dengyihao 已提交
3687
  pOperator->name = "TableAggregate";
3688
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_HASH_AGG;
3689
  pOperator->blocking = true;
dengyihao's avatar
dengyihao 已提交
3690 3691 3692
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3693

3694 3695
  pOperator->fpSet = createOperatorFpSet(doOpenAggregateOptr, getAggregateResult, NULL, NULL, destroyAggOperatorInfo,
                                         aggEncodeResultRow, aggDecodeResultRow, NULL);
H
Haojun Liao 已提交
3696 3697 3698 3699 3700

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3701 3702

  return pOperator;
L
Liu Jicong 已提交
3703
_error:
H
Haojun Liao 已提交
3704
  destroyAggOperatorInfo(pInfo, numOfCols);
wafwerar's avatar
wafwerar 已提交
3705 3706
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
H
Haojun Liao 已提交
3707 3708
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3709 3710
}

3711
// Clean up the result-row info of a basic operator info and destroy its output block.
// pInfo->pRes is replaced by the value returned from blockDataDestroy().
void cleanupBasicInfo(SOptrBasicInfo* pInfo) {
  assert(pInfo != NULL);

  cleanupResultRowInfo(&pInfo->resultRowInfo);

  SSDataBlock* pBlock = pInfo->pRes;
  pInfo->pRes = blockDataDestroy(pBlock);
}

H
Haojun Liao 已提交
3717
void destroyBasicOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3718
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)param;
3719
  cleanupBasicInfo(pInfo);
L
Liu Jicong 已提交
3720

D
dapan1121 已提交
3721
  taosMemoryFreeClear(param);
3722
}
H
Haojun Liao 已提交
3723

H
Haojun Liao 已提交
3724 3725 3726 3727 3728 3729 3730 3731

// Free the allocation referenced by a pointer slot; pItem is the address of that slot.
// Empty slots are left untouched.
static void freeItem(void* pItem) {
  void** ppSlot = pItem;
  if (*ppSlot == NULL) {
    return;
  }

  taosMemoryFreeClear(*ppSlot);
}

H
Haojun Liao 已提交
3732
void destroyAggOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3733
  SAggOperatorInfo* pInfo = (SAggOperatorInfo*)param;
L
Liu Jicong 已提交
3734 3735
  cleanupBasicInfo(&pInfo->binfo);

H
Haojun Liao 已提交
3736
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3737
  cleanupGroupResInfo(&pInfo->groupResInfo);
D
dapan1121 已提交
3738
  taosMemoryFreeClear(param);
3739
}
3740

H
Haojun Liao 已提交
3741
void destroySFillOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3742
  SFillOperatorInfo* pInfo = (SFillOperatorInfo*)param;
3743
  pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
H
Haojun Liao 已提交
3744
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
wafwerar's avatar
wafwerar 已提交
3745
  taosMemoryFreeClear(pInfo->p);
L
Liu Jicong 已提交
3746

D
dapan1121 已提交
3747
  taosMemoryFreeClear(param);
3748 3749
}

H
Haojun Liao 已提交
3750
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput) {
D
fix bug  
dapan 已提交
3751 3752 3753
  if (NULL == param) {
    return;
  }
L
Liu Jicong 已提交
3754
  SProjectOperatorInfo* pInfo = (SProjectOperatorInfo*)param;
3755
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3756
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3757
  taosArrayDestroy(pInfo->pPseudoColInfo);
L
Liu Jicong 已提交
3758

D
dapan1121 已提交
3759
  taosMemoryFreeClear(param);
3760 3761
}

H
Haojun Liao 已提交
3762
static void destroyIndefinitOperatorInfo(void* param, int32_t numOfOutput) {
3763
  SIndefOperatorInfo* pInfo = (SIndefOperatorInfo*)param;
3764
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3765 3766 3767

  taosArrayDestroy(pInfo->pPseudoColInfo);
  cleanupAggSup(&pInfo->aggSup);
3768
  cleanupExprSupp(&pInfo->scalarSup);
L
Liu Jicong 已提交
3769

D
dapan1121 已提交
3770
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3771 3772
}

H
Haojun Liao 已提交
3773
void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3774
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3775 3776 3777 3778
  taosRemoveRef(exchangeObjRefPool, pExInfo->self);
}

void doDestroyExchangeOperatorInfo(void* param) {
X
Xiaoyu Wang 已提交
3779
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3780

H
Haojun Liao 已提交
3781 3782 3783
  taosArrayDestroy(pExInfo->pSources);
  taosArrayDestroy(pExInfo->pSourceDataInfo);
  if (pExInfo->pResult != NULL) {
H
Haojun Liao 已提交
3784
    pExInfo->pResult = blockDataDestroy(pExInfo->pResult);
H
Haojun Liao 已提交
3785 3786 3787
  }

  tsem_destroy(&pExInfo->ready);
L
Liu Jicong 已提交
3788

D
dapan1121 已提交
3789
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3790 3791
}

H
Haojun Liao 已提交
3792 3793
// Collect the indexes (int32_t) of all function contexts whose function is a pseudo-column function.
// Returns the new list, which the caller owns, or NULL when the list cannot be allocated.
static SArray* setRowTsColumnOutputInfo(SqlFunctionCtx* pCtx, int32_t numOfCols) {
  SArray* pList = taosArrayInit(4, sizeof(int32_t));
  if (pList == NULL) {
    // do not push into a list that was never created
    return NULL;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    if (fmIsPseudoColumnFunc(pCtx[i].functionId)) {
      taosArrayPush(pList, &i);
    }
  }

  return pList;
}

L
Liu Jicong 已提交
3803
SOperatorInfo* createProjectOperatorInfo(SOperatorInfo* downstream, SProjectPhysiNode* pProjPhyNode,
dengyihao's avatar
dengyihao 已提交
3804
                                         SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3805
  SProjectOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SProjectOperatorInfo));
L
Liu Jicong 已提交
3806
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3807 3808 3809
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
3810

L
Liu Jicong 已提交
3811
  int32_t    numOfCols = 0;
3812 3813 3814
  SExprInfo* pExprInfo = createExprInfo(pProjPhyNode->pProjections, NULL, &numOfCols);

  SSDataBlock* pResBlock = createResDataBlock(pProjPhyNode->node.pOutputDataBlockDesc);
3815
  initLimitInfo(pProjPhyNode->node.pLimit, pProjPhyNode->node.pSlimit, &pInfo->limitInfo);
3816

H
Haojun Liao 已提交
3817
  pInfo->binfo.pRes = pResBlock;
3818
  pInfo->pFilterNode = pProjPhyNode->node.pConditions;
H
Haojun Liao 已提交
3819 3820

  int32_t numOfRows = 4096;
dengyihao's avatar
dengyihao 已提交
3821
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3822

3823 3824 3825 3826 3827
  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
3828
  initResultSizeInfo(pOperator, numOfRows);
3829

3830 3831
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);
3832
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfCols);
3833

3834
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pOperator->exprSupp.pCtx, numOfCols);
X
Xiaoyu Wang 已提交
3835
  pOperator->name = "ProjectOperator";
H
Haojun Liao 已提交
3836
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
X
Xiaoyu Wang 已提交
3837 3838 3839 3840
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
3841

L
Liu Jicong 已提交
3842 3843
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doProjectOperation, NULL, NULL,
                                         destroyProjectOperatorInfo, NULL, NULL, NULL);
L
Liu Jicong 已提交
3844

3845
  int32_t code = appendDownstream(pOperator, &downstream, 1);
H
Haojun Liao 已提交
3846
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3847 3848
    goto _error;
  }
3849 3850

  return pOperator;
H
Haojun Liao 已提交
3851

L
Liu Jicong 已提交
3852
_error:
H
Haojun Liao 已提交
3853 3854
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3855 3856
}

3857 3858
// Feed one input block through the indefinite-rows function operator.
//
// Steps: query the scan order/flag from the downstream, evaluate the optional scalar expressions in place on
// pBlock, bind pBlock as function input, grow the output block for the incoming rows and apply the functions.
// Any failing step leaves via longjmp(pTaskInfo->env, code).
static void doHandleDataBlock(SOperatorInfo* pOperator, SSDataBlock* pBlock, SOperatorInfo* downstream,
                              SExecTaskInfo* pTaskInfo) {
  SIndefOperatorInfo* pIndef = pOperator->info;
  SOptrBasicInfo*     pBasic = &pIndef->binfo;

  int32_t scanOrder = 0;
  int32_t flag = 0;

  // the pDataBlock are always the same one, no need to call this again
  int32_t code = getTableScanInfo(downstream, &scanOrder, &flag);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }

  // scalar expressions, when present, are calculated before the functions are applied
  if (pIndef->scalarSup.pExprInfo != NULL) {
    SExprSupp* pScalar = &pIndef->scalarSup;

    code = projectApplyFunctions(pScalar->pExprInfo, pBlock, pBlock, pScalar->pCtx, pScalar->numOfExprs,
                                 pIndef->pPseudoColInfo);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
  }

  SExprSupp* pExprSup = &pOperator->exprSupp;
  setInputDataBlock(pOperator, pExprSup->pCtx, pBlock, scanOrder, flag, false);
  blockDataEnsureCapacity(pBasic->pRes, pBasic->pRes->info.rows + pBlock->info.rows);

  code = projectApplyFunctions(pExprSup->pExprInfo, pBasic->pRes, pBlock, pExprSup->pCtx, pExprSup->numOfExprs,
                               pIndef->pPseudoColInfo);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }
}

H
Haojun Liao 已提交
3892 3893
// getNext function of the indefinite-rows function operator.
//
// Pulls blocks from the downstream, applies the functions per group and filters the result with the operator's
// condition. A block that belongs to a new group is parked in pNextGroupRes and processed on the next round.
//
// Returns the output block when it holds at least one row, NULL otherwise. NULL is only returned once the
// downstream is exhausted: a batch that the filter empties completely makes the operator fetch more input
// instead of reporting end-of-data early (the former `rows >= 0` test on a size_t was always true).
static SSDataBlock* doApplyIndefinitFunction(SOperatorInfo* pOperator) {
  SIndefOperatorInfo* pIndefInfo = pOperator->info;
  SOptrBasicInfo*     pInfo = &pIndefInfo->binfo;
  SExprSupp*          pSup = &pOperator->exprSupp;

  SSDataBlock* pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  int64_t st = 0;

  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];

  // set once the downstream has returned NULL, i.e. no further input will arrive
  bool exhausted = false;

  while (1) {
    // here we need to handle the existed group results
    if (pIndefInfo->pNextGroupRes != NULL) {  // todo extract method
      for (int32_t k = 0; k < pSup->numOfExprs; ++k) {
        SqlFunctionCtx* pCtx = &pSup->pCtx[k];

        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);
        pResInfo->initialized = false;
        pCtx->pOutput = NULL;
      }

      doHandleDataBlock(pOperator, pIndefInfo->pNextGroupRes, downstream, pTaskInfo);
      pIndefInfo->pNextGroupRes = NULL;
    }

    if (pInfo->pRes->info.rows < pOperator->resultInfo.threshold) {
      while (1) {
        // The downstream exec may change the value of the newgroup, so use a local variable instead.
        SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
        if (pBlock == NULL) {
          doSetOperatorCompleted(pOperator);
          exhausted = true;
          break;
        }

        if (pIndefInfo->groupId == 0 && pBlock->info.groupId != 0) {
          pIndefInfo->groupId = pBlock->info.groupId;  // this is the initial group result
        } else {
          if (pIndefInfo->groupId != pBlock->info.groupId) {  // reset output buffer and computing status
            pIndefInfo->groupId = pBlock->info.groupId;
            pIndefInfo->pNextGroupRes = pBlock;
            break;
          }
        }

        doHandleDataBlock(pOperator, pBlock, downstream, pTaskInfo);
        if (pInfo->pRes->info.rows >= pOperator->resultInfo.threshold) {
          break;
        }
      }
    }

    doFilter(pIndefInfo->pCondition, pInfo->pRes);
    if (pInfo->pRes->info.rows > 0 || exhausted) {
      break;
    }

    // every row was filtered out but more input is available: start over with a clean output block
    blockDataCleanup(pInfo->pRes);
  }

  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
  }

  return (rows > 0) ? pInfo->pRes : NULL;
}

3971 3972
// Create the indefinite-rows function operator described by pNode (an SIndefRowsFuncPhysiNode) on top of
// `downstream`.
//
// Optional scalar expressions of the node are initialized into pInfo->scalarSup. The row capacity starts at 4096
// and is reduced so that the output block stays within 2MB.
//
// Returns the new operator, or NULL on failure; in that case pTaskInfo->code carries the error code and all
// partially built state is released.
SOperatorInfo* createIndefinitOutputOperatorInfo(SOperatorInfo* downstream, SPhysiNode* pNode,
                                                 SExecTaskInfo* pTaskInfo) {
  // declared before the first goto so that the error path always sees defined values
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;
  int32_t numOfExpr = 0;

  SIndefOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SIndefOperatorInfo));
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  SExprSupp* pSup = &pOperator->exprSupp;

  SIndefRowsFuncPhysiNode* pPhyNode = (SIndefRowsFuncPhysiNode*)pNode;

  if (pPhyNode->pExprs != NULL) {
    int32_t    num = 0;
    SExprInfo* pSExpr = createExprInfo(pPhyNode->pExprs, NULL, &num);
    code = initExprSupp(&pInfo->scalarSup, pSExpr, num);
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
  }

  // Created after the scalar setup so that no error exit lies between its creation and initAggInfo(), which
  // hands ownership to pSup; the two expression lists are independent of each other.
  SExprInfo* pExprInfo = createExprInfo(pPhyNode->pFuncs, NULL, &numOfExpr);

  SSDataBlock* pResBlock = createResDataBlock(pPhyNode->node.pOutputDataBlockDesc);

  int32_t numOfRows = 4096;
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;

  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }

  initResultSizeInfo(pOperator, numOfRows);

  // attach the block first so that the error path releases it together with pInfo
  pInfo->binfo.pRes = pResBlock;

  code = initAggInfo(pSup, &pInfo->aggSup, pExprInfo, numOfExpr, keyBufSize, pTaskInfo->id.str);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initBasicInfo(&pInfo->binfo, pResBlock);

  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfExpr);

  pInfo->binfo.pRes = pResBlock;
  pInfo->pCondition = pPhyNode->node.pConditions;
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pSup->pCtx, numOfExpr);

  pOperator->name = "IndefinitOperator";
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC;
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doApplyIndefinitFunction, NULL, NULL,
                                         destroyIndefinitOperatorInfo, NULL, NULL, NULL);

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  // destroyIndefinitOperatorInfo() frees pInfo together with the scalar support, block and agg supporter
  if (pInfo != NULL) {
    destroyIndefinitOperatorInfo(pInfo, numOfExpr);
  }

  if (pOperator != NULL) {
    cleanupExprSupp(&pOperator->exprSupp);
    taosMemoryFree(pOperator);
  }

  pTaskInfo->code = code;
  return NULL;
}

4041
static int32_t initFillInfo(SFillOperatorInfo* pInfo, SExprInfo* pExpr, int32_t numOfCols, SNodeListNode* pValNode,
L
Liu Jicong 已提交
4042
                            STimeWindow win, int32_t capacity, const char* id, SInterval* pInterval, int32_t fillType) {
4043
  SFillColInfo* pColInfo = createFillColInfo(pExpr, numOfCols, pValNode);
H
Haojun Liao 已提交
4044 4045

  STimeWindow w = TSWINDOW_INITIALIZER;
4046
  getAlignQueryTimeWindow(pInterval, pInterval->precision, win.skey, &w);
4047
  w = getFirstQualifiedTimeWindow(win.skey, &w, pInterval, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
4048 4049

  int32_t order = TSDB_ORDER_ASC;
4050 4051
  pInfo->pFillInfo = taosCreateFillInfo(order, w.skey, 0, capacity, numOfCols, pInterval,
      fillType, pColInfo, pInfo->primaryTsCol, id);
H
Haojun Liao 已提交
4052

4053
  pInfo->win = win;
L
Liu Jicong 已提交
4054
  pInfo->p = taosMemoryCalloc(numOfCols, POINTER_BYTES);
4055

H
Haojun Liao 已提交
4056
  if (pInfo->pFillInfo == NULL || pInfo->p == NULL) {
H
Haojun Liao 已提交
4057 4058
    taosMemoryFree(pInfo->pFillInfo);
    taosMemoryFree(pInfo->p);
H
Haojun Liao 已提交
4059 4060 4061 4062 4063 4064
    return TSDB_CODE_OUT_OF_MEMORY;
  } else {
    return TSDB_CODE_SUCCESS;
  }
}

H
Haojun Liao 已提交
4065
// Create the fill operator described by pPhyFillNode on top of `downstream`.
//
// The interval is read from the downstream operator's info: from the wrapped interval info when the downstream is
// a merge-aligned interval operator, from SIntervalAggOperatorInfo otherwise.
//
// Returns the new operator, or NULL on failure; in that case pTaskInfo->code carries the error code and the
// objects created here are released.
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SFillPhysiNode* pPhyFillNode, SExecTaskInfo* pTaskInfo) {
  // declared before the first goto so that the error path always sees defined values
  int32_t      code = TSDB_CODE_OUT_OF_MEMORY;
  int32_t      num = 0;
  bool         fillInfoReady = false;
  SSDataBlock* pResBlock = NULL;
  SExprInfo*   pExprInfo = NULL;
  SArray*      pColMatchColInfo = NULL;

  SFillOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SFillOperatorInfo));
  SOperatorInfo*     pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  pResBlock = createResDataBlock(pPhyFillNode->node.pOutputDataBlockDesc);
  pExprInfo = createExprInfo(pPhyFillNode->pTargets, NULL, &num);
  SInterval* pInterval =
      QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == downstream->operatorType
            ? &((SMergeAlignedIntervalAggOperatorInfo*)downstream->info)->intervalAggOperatorInfo->interval
            : &((SIntervalAggOperatorInfo*)downstream->info)->interval;

  int32_t type = convertFillType(pPhyFillNode->mode);

  SResultInfo* pResultInfo = &pOperator->resultInfo;
  initResultSizeInfo(pOperator, 4096);
  pInfo->primaryTsCol = ((SColumnNode*)pPhyFillNode->pWStartTs)->slotId;

  int32_t numOfOutputCols = 0;
  pColMatchColInfo = extractColMatchInfo(pPhyFillNode->pTargets, pPhyFillNode->node.pOutputDataBlockDesc,
                                         &numOfOutputCols, COL_MATCH_FROM_SLOT_ID);

  code = initFillInfo(pInfo, pExprInfo, num, (SNodeListNode*)pPhyFillNode->pValues, pPhyFillNode->timeRange,
                      pResultInfo->capacity, pTaskInfo->id.str, pInterval, type);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
  fillInfoReady = true;

  pInfo->pRes = pResBlock;
  pInfo->pCondition = pPhyFillNode->node.pConditions;
  pInfo->pColMatchColInfo = pColMatchColInfo;
  pOperator->name = "FillOperator";
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_FILL;
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->exprSupp.numOfExprs = num;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet =
      createOperatorFpSet(operatorDummyOpenFn, doFill, NULL, NULL, destroySFillOperatorInfo, NULL, NULL, NULL);

  // an operator without its downstream is unusable, so a failure here must not be ignored
  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  // The fill state is only touched when initFillInfo() succeeded; on its own failure it has already released
  // what it allocated.
  if (pInfo != NULL && fillInfoReady) {
    pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
    taosMemoryFreeClear(pInfo->p);
  }

  if (pExprInfo != NULL) {
    destroyExprInfo(pExprInfo, num);
    taosMemoryFree(pExprInfo);
  }

  if (pColMatchColInfo != NULL) {
    taosArrayDestroy(pColMatchColInfo);
  }

  if (pResBlock != NULL) {
    blockDataDestroy(pResBlock);
  }

  taosMemoryFreeClear(pOperator);
  taosMemoryFreeClear(pInfo);
  pTaskInfo->code = code;
  return NULL;
}

D
dapan1121 已提交
4120
// Allocate and initialize a task info object.
//
// The task starts in TASK_NOT_COMPLETED state; its id string has the form "TID:0x<taskId> QID:0x<queryId>" and the
// database name is duplicated from dbFName (left NULL when dbFName is NULL).
//
// Returns the new task info, or NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY when an allocation fails.
static SExecTaskInfo* createExecTaskInfo(uint64_t queryId, uint64_t taskId, EOPTR_EXEC_MODEL model, char* dbFName) {
  SExecTaskInfo* pTaskInfo = taosMemoryCalloc(1, sizeof(SExecTaskInfo));
  if (pTaskInfo == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // allocate the id string up front so that a failure leaves nothing half-initialized behind
  char* p = taosMemoryCalloc(1, 128);
  if (p == NULL) {
    taosMemoryFree(pTaskInfo);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  snprintf(p, 128, "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, queryId);
  pTaskInfo->id.str = p;

  setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);

  pTaskInfo->schemaVer.dbname = (dbFName != NULL) ? strdup(dbFName) : NULL;
  pTaskInfo->cost.created = taosGetTimestampMs();
  pTaskInfo->id.queryId = queryId;
  pTaskInfo->execModel = model;

  return pTaskInfo;
}
H
Haojun Liao 已提交
4135

H
Hongze Cheng 已提交
4136
static STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
H
Haojun Liao 已提交
4137
                                       STableListInfo* pTableListInfo, const char* idstr);
H
Haojun Liao 已提交
4138

H
Haojun Liao 已提交
4139
static SArray* extractColumnInfo(SNodeList* pNodeList);
4140

4141
// Load the name and schema of table `uid` into pTaskInfo->schemaVer.
//
// For a super table the row schema and the tag schema version are taken from the entry itself; for a child table
// they are taken from its super table, which is looked up by suid; for any other table type only the row schema
// of the table is cloned.
//
// Returns TSDB_CODE_SUCCESS, or terrno when a meta lookup fails.
int32_t extractTableSchemaInfo(SReadHandle* pHandle, uint64_t uid, SExecTaskInfo* pTaskInfo) {
  SMetaReader mr = {0};
  metaReaderInit(&mr, pHandle->meta, 0);
  int32_t code = metaGetTableEntryByUid(&mr, uid);
  if (code != TSDB_CODE_SUCCESS) {
    metaReaderClear(&mr);
    return terrno;
  }

  pTaskInfo->schemaVer.tablename = strdup(mr.me.name);

  if (mr.me.type == TSDB_SUPER_TABLE) {
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
  } else if (mr.me.type == TSDB_CHILD_TABLE) {
    tDecoderClear(&mr.coder);

    tb_uid_t suid = mr.me.ctbEntry.suid;

    // the super-table entry is read below, so a failed lookup must not be ignored
    code = metaGetTableEntryByUid(&mr, suid);
    if (code != TSDB_CODE_SUCCESS) {
      taosMemoryFreeClear(pTaskInfo->schemaVer.tablename);
      metaReaderClear(&mr);
      return terrno;
    }

    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
  } else {
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.ntbEntry.schemaRow);
  }

  metaReaderClear(&mr);
  return TSDB_CODE_SUCCESS;
}

4170 4171 4172 4173 4174 4175 4176 4177 4178 4179 4180
// Release the schema information stored in pTaskInfo->schemaVer: database name, table name and, when present,
// the schema wrapper with its schema array.
static void cleanupTableSchemaInfo(SExecTaskInfo* pTaskInfo) {
  taosMemoryFreeClear(pTaskInfo->schemaVer.dbname);

  // the table name is allocated independently of the schema wrapper, so it is released even when sw is NULL
  taosMemoryFreeClear(pTaskInfo->schemaVer.tablename);

  if (pTaskInfo->schemaVer.sw == NULL) {
    return;
  }

  taosMemoryFree(pTaskInfo->schemaVer.sw->pSchema);
  taosMemoryFreeClear(pTaskInfo->schemaVer.sw);
}

4181
// Rebuild pTableListInfo->pGroupList so that the tables are bucketed by group id.
//
// `sortSupport` keeps the group ids seen so far; pGroupList holds, at the same index, the SArray of STableKeyInfo
// belonging to that group id. A new group is inserted in front of the first entry that the TD_GT search returns,
// or appended when there is none.
//
// Returns TSDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY when an array cannot be created, or TSDB_CODE_QRY_APP_ERROR
// when an array operation fails or a table has no group id in the map. A group array that could not be linked
// into pGroupList is destroyed before returning.
static int32_t sortTableGroup(STableListInfo* pTableListInfo, int32_t groupNum) {
  taosArrayClear(pTableListInfo->pGroupList);
  SArray* sortSupport = taosArrayInit(groupNum, sizeof(uint64_t));
  if (sortSupport == NULL) return TSDB_CODE_OUT_OF_MEMORY;

  int32_t code = TSDB_CODE_SUCCESS;

  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    uint64_t*      groupId = taosHashGet(pTableListInfo->map, &info->uid, sizeof(uint64_t));
    if (groupId == NULL) {
      // the search below hands groupId to the comparator, so a missing map entry cannot be tolerated
      qError("group id of table not found in map");
      code = TSDB_CODE_QRY_APP_ERROR;
      break;
    }

    int32_t index = taosArraySearchIdx(sortSupport, groupId, compareUint64Val, TD_EQ);
    if (index != -1) {
      // known group: append the table to the existing bucket
      SArray* tGroup = (SArray*)taosArrayGetP(pTableListInfo->pGroupList, index);
      if (taosArrayPush(tGroup, info) == NULL) {
        qError("taos push uid array error");
        code = TSDB_CODE_QRY_APP_ERROR;
        break;
      }
      continue;
    }

    // new group: create its bucket and link it in at the matching position of both arrays
    void*   p = taosArraySearch(sortSupport, groupId, compareUint64Val, TD_GT);
    SArray* tGroup = taosArrayInit(8, sizeof(STableKeyInfo));
    if (tGroup == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      break;
    }

    if (taosArrayPush(tGroup, info) == NULL) {
      qError("taos push info array error");
      code = TSDB_CODE_QRY_APP_ERROR;
    } else if (p == NULL) {
      if (taosArrayPush(sortSupport, groupId) == NULL) {
        qError("taos push support array error");
        code = TSDB_CODE_QRY_APP_ERROR;
      } else if (taosArrayPush(pTableListInfo->pGroupList, &tGroup) == NULL) {
        qError("taos push group array error");
        code = TSDB_CODE_QRY_APP_ERROR;
      }
    } else {
      int32_t pos = TARRAY_ELEM_IDX(sortSupport, p);
      if (taosArrayInsert(sortSupport, pos, groupId) == NULL) {
        qError("taos insert support array error");
        code = TSDB_CODE_QRY_APP_ERROR;
      } else if (taosArrayInsert(pTableListInfo->pGroupList, pos, &tGroup) == NULL) {
        qError("taos insert group array error");
        code = TSDB_CODE_QRY_APP_ERROR;
      }
    }

    if (code != TSDB_CODE_SUCCESS) {
      // the bucket never made it into pGroupList, so nobody else will release it
      taosArrayDestroy(tGroup);
      break;
    }
  }

  taosArrayDestroy(sortSupport);
  return code;
}

wmmhello's avatar
wmmhello 已提交
4239 4240
// Compute a group id for every table in pTableListInfo->pTableList from the group expressions in `group`.
//
// For each table the group expressions are cloned, rewritten by doTranslateTagExpr with the table's meta entry
// and folded to constants. The key buffer starts with one null flag per expression, followed by the bytes of
// the non-null values; calcGroupId() of that key is stored in the uid -> groupId map and in the table entry.
// When needSortTableByGroupId is set, the tables are bucketed by group id afterwards.
//
// Returns TSDB_CODE_SUCCESS (also when `group` is NULL, in which case nothing is done) or an error code.
int32_t generateGroupIdMap(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group) {
  if (group == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  pTableListInfo->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pTableListInfo->map == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  int32_t keyLen = 0;
  void*   keyBuf = NULL;

  SNode* node;
  FOREACH(node, group) {
    SExprNode* pExpr = (SExprNode*)node;
    keyLen += pExpr->resType.bytes;
  }

  // one null-flag byte per group expression precedes the value bytes
  int32_t nullFlagSize = sizeof(int8_t) * LIST_LENGTH(group);
  keyLen += nullFlagSize;

  keyBuf = taosMemoryCalloc(1, keyLen);
  if (keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t groupNum = 0;
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    SMetaReader    mr = {0};
    metaReaderInit(&mr, pHandle->meta, 0);

    // the entry read here is consumed by the expression rewrite below, so a failed lookup must stop the work
    int32_t metaCode = metaGetTableEntryByUid(&mr, info->uid);
    if (metaCode != TSDB_CODE_SUCCESS) {
      taosMemoryFree(keyBuf);
      metaReaderClear(&mr);
      return terrno;
    }

    SNodeList* groupNew = nodesCloneList(group);

    nodesRewriteExprsPostOrder(groupNew, doTranslateTagExpr, &mr);
    char* isNull = (char*)keyBuf;
    char* pStart = (char*)keyBuf + nullFlagSize;

    SNode*  pNode;
    int32_t index = 0;
    FOREACH(pNode, groupNew) {
      SNode*  pNew = NULL;
      int32_t code = scalarCalculateConstants(pNode, &pNew);
      if (TSDB_CODE_SUCCESS == code) {
        REPLACE_NODE(pNew);
      } else {
        taosMemoryFree(keyBuf);
        nodesClearList(groupNew);
        metaReaderClear(&mr);
        return code;
      }

      ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
      SValueNode* pValue = (SValueNode*)pNew;

      if (pValue->node.resType.type == TSDB_DATA_TYPE_NULL || pValue->isNull) {
        isNull[index++] = 1;
        continue;
      } else {
        isNull[index++] = 0;
        char* data = nodesGetValueFromNode(pValue);
        if (pValue->node.resType.type == TSDB_DATA_TYPE_JSON) {
          if (tTagIsJson(data)) {
            terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
            taosMemoryFree(keyBuf);
            nodesClearList(groupNew);
            metaReaderClear(&mr);
            return terrno;
          }
          int32_t len = getJsonValueLen(data);
          memcpy(pStart, data, len);
          pStart += len;
        } else if (IS_VAR_DATA_TYPE(pValue->node.resType.type)) {
          memcpy(pStart, data, varDataTLen(data));
          pStart += varDataTLen(data);
        } else {
          memcpy(pStart, data, pValue->node.resType.bytes);
          pStart += pValue->node.resType.bytes;
        }
      }
    }

    int32_t  len = (int32_t)(pStart - (char*)keyBuf);
    uint64_t groupId = calcGroupId(keyBuf, len);

    // sortTableGroup() looks every table up in this map, so a lost entry must be reported
    if (taosHashPut(pTableListInfo->map, &(info->uid), sizeof(uint64_t), &groupId, sizeof(uint64_t)) != 0) {
      taosMemoryFree(keyBuf);
      nodesClearList(groupNew);
      metaReaderClear(&mr);
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    info->groupId = groupId;
    groupNum++;

    nodesClearList(groupNew);
    metaReaderClear(&mr);
  }
  taosMemoryFree(keyBuf);

  if (pTableListInfo->needSortTableByGroupId) {
    return sortTableGroup(pTableListInfo, groupNum);
  }

  return TSDB_CODE_SUCCESS;
}

4340 4341 4342 4343 4344 4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363
/*
 * Prepare the query condition used by the block-distribution scan.
 *
 * The condition is reset to zero and then filled so that it reads a single
 * timestamp column (column id 1) over the whole time range, in ascending
 * order, with both version bounds set to -1.
 *
 * @param uid    stored into pCond->suid
 * @param pCond  condition to initialise; its previous content is discarded
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_OUT_OF_MEMORY (also stored in
 *         terrno) when the column list cannot be allocated
 */
static int32_t initTableblockDistQueryCond(uint64_t uid, SQueryTableDataCond* pCond) {
  memset(pCond, 0, sizeof(SQueryTableDataCond));
  pCond->order = TSDB_ORDER_ASC;
  pCond->numOfCols = 1;

  pCond->colList = taosMemoryCalloc(1, sizeof(SColumnInfo));
  if (NULL == pCond->colList) {
    terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return terrno;
  }

  // the only column requested is the timestamp column
  pCond->colList[0].colId = 1;
  pCond->colList[0].type = TSDB_DATA_TYPE_TIMESTAMP;
  pCond->colList[0].bytes = sizeof(TSKEY);

  pCond->suid = uid;
  pCond->type = BLOCK_LOAD_OFFSET_ORDER;
  pCond->startVersion = -1;
  pCond->endVersion = -1;
  pCond->twindows = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4364
SOperatorInfo* createOperatorTree(SPhysiNode* pPhyNode, SExecTaskInfo* pTaskInfo, SReadHandle* pHandle,
4365
                                  STableListInfo* pTableListInfo, SNode* pTagCond, SNode* pTagIndexCond, const char* pUser) {
4366 4367
  int32_t type = nodeType(pPhyNode);

X
Xiaoyu Wang 已提交
4368
  if (pPhyNode->pChildren == NULL || LIST_LENGTH(pPhyNode->pChildren) == 0) {
H
Haojun Liao 已提交
4369
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == type) {
dengyihao's avatar
dengyihao 已提交
4370
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4371

4372
      int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
4373
                                             pTableScanNode->groupSort, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
4374
      if (code) {
wmmhello's avatar
wmmhello 已提交
4375
        pTaskInfo->code = code;
D
dapan1121 已提交
4376 4377
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4378

4379
      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
S
slzhou 已提交
4380
      if (code) {
4381
        pTaskInfo->code = terrno;
wmmhello's avatar
wmmhello 已提交
4382 4383 4384
        return NULL;
      }

H
Haojun Liao 已提交
4385
      SOperatorInfo*  pOperator = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo);
4386 4387
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
S
slzhou 已提交
4388
      return pOperator;
L
Liu Jicong 已提交
4389

S
slzhou 已提交
4390 4391
    } else if (QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN == type) {
      STableMergeScanPhysiNode* pTableScanNode = (STableMergeScanPhysiNode*)pPhyNode;
4392
      int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
4393
                                             pTableScanNode->groupSort, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
L
Liu Jicong 已提交
4394
      if (code) {
wmmhello's avatar
wmmhello 已提交
4395
        pTaskInfo->code = code;
wmmhello's avatar
wmmhello 已提交
4396 4397
        return NULL;
      }
4398

4399
      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
wmmhello's avatar
wmmhello 已提交
4400 4401 4402 4403
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4404

4405
      SOperatorInfo* pOperator =
4406
          createTableMergeScanOperatorInfo(pTableScanNode, pTableListInfo, pHandle, pTaskInfo);
wmmhello's avatar
wmmhello 已提交
4407

4408 4409 4410
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
      return pOperator;
L
Liu Jicong 已提交
4411

H
Haojun Liao 已提交
4412
    } else if (QUERY_NODE_PHYSICAL_PLAN_EXCHANGE == type) {
4413
      return createExchangeOperatorInfo(pHandle->pMsgCb->clientRpc, (SExchangePhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4414
    } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN == type) {
5
54liuyao 已提交
4415
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
4416
      STimeWindowAggSupp   twSup = {
L
Liu Jicong 已提交
4417 4418 4419 4420
            .waterMark = pTableScanNode->watermark,
            .calTrigger = pTableScanNode->triggerType,
            .maxTs = INT64_MIN,
      };
5
54liuyao 已提交
4421
      if (pHandle->vnode) {
4422
        int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
4423
                                               pTableScanNode->groupSort, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
L
Liu Jicong 已提交
4424
        if (code) {
wmmhello's avatar
wmmhello 已提交
4425 4426 4427
          pTaskInfo->code = code;
          return NULL;
        }
5
54liuyao 已提交
4428
      }
4429

4430
      SOperatorInfo* pOperator = createStreamScanOperatorInfo(pHandle, pTableScanNode, pTagCond, pTaskInfo, &twSup);
H
Haojun Liao 已提交
4431
      return pOperator;
L
Liu Jicong 已提交
4432

H
Haojun Liao 已提交
4433
    } else if (QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN == type) {
L
Liu Jicong 已提交
4434
      SSystemTableScanPhysiNode* pSysScanPhyNode = (SSystemTableScanPhysiNode*)pPhyNode;
4435
      return createSysTableScanOperatorInfo(pHandle, pSysScanPhyNode, pUser, pTaskInfo);
4436
    } else if (QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN == type) {
X
Xiaoyu Wang 已提交
4437
      STagScanPhysiNode* pScanPhyNode = (STagScanPhysiNode*)pPhyNode;
4438

4439
      int32_t code = getTableList(pHandle->meta, pHandle->vnode, pScanPhyNode, pTagCond, pTagIndexCond, pTableListInfo);
4440
      if (code != TSDB_CODE_SUCCESS) {
4441
        pTaskInfo->code = terrno;
4442 4443 4444
        return NULL;
      }

4445
      return createTagScanOperatorInfo(pHandle, pScanPhyNode, pTableListInfo, pTaskInfo);
4446
    } else if (QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN == type) {
4447
      SBlockDistScanPhysiNode* pBlockNode = (SBlockDistScanPhysiNode*)pPhyNode;
4448 4449 4450
      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));

      if (pBlockNode->tableType == TSDB_SUPER_TABLE) {
4451
        int32_t code = vnodeGetAllTableList(pHandle->vnode, pBlockNode->uid, pTableListInfo->pTableList);
4452 4453 4454 4455 4456
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
S
slzhou 已提交
4457
        STableKeyInfo info = {.lastKey = 0, .uid = pBlockNode->uid, .groupId = 0};
4458 4459 4460 4461
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      SQueryTableDataCond cond = {0};
4462 4463 4464
      int32_t code = initTableblockDistQueryCond(pBlockNode->suid, &cond);
      if (code != TSDB_CODE_SUCCESS) {
        return NULL;
4465
      }
H
Haojun Liao 已提交
4466 4467 4468

      STsdbReader* pReader = NULL;
      tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, "");
4469 4470
      cleanupQueryTableDataCond(&cond);

4471
      return createDataBlockInfoScanOperator(pReader, pHandle, cond.suid, pBlockNode, pTaskInfo);
H
Haojun Liao 已提交
4472 4473 4474
    } else if (QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN == type) {
      SLastRowScanPhysiNode* pScanNode = (SLastRowScanPhysiNode*)pPhyNode;

4475
      int32_t code = createScanTableListInfo(&pScanNode->scan, pScanNode->pGroupTags, true, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
4476 4477 4478 4479
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
      }
4480

4481 4482 4483 4484
      code = extractTableSchemaInfo(pHandle, pScanNode->scan.uid, pTaskInfo);
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
H
Haojun Liao 已提交
4485 4486
      }

4487
      return createLastrowScanOperator(pScanNode, pHandle, pTaskInfo);
H
Haojun Liao 已提交
4488 4489
    } else {
      ASSERT(0);
H
Haojun Liao 已提交
4490 4491 4492
    }
  }

4493 4494
  int32_t num = 0;
  size_t  size = LIST_LENGTH(pPhyNode->pChildren);
H
Haojun Liao 已提交
4495

4496
  SOperatorInfo** ops = taosMemoryCalloc(size, POINTER_BYTES);
dengyihao's avatar
dengyihao 已提交
4497
  for (int32_t i = 0; i < size; ++i) {
4498
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pPhyNode->pChildren, i);
4499
    ops[i] = createOperatorTree(pChildNode, pTaskInfo, pHandle, pTableListInfo, pTagCond, pTagIndexCond, pUser);
4500 4501 4502
    if (ops[i] == NULL) {
      return NULL;
    }
4503
  }
H
Haojun Liao 已提交
4504

4505
  SOperatorInfo* pOptr = NULL;
H
Haojun Liao 已提交
4506
  if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
4507
    pOptr = createProjectOperatorInfo(ops[0], (SProjectPhysiNode*)pPhyNode, pTaskInfo);
4508
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_AGG == type) {
H
Haojun Liao 已提交
4509 4510
    SAggPhysiNode* pAggNode = (SAggPhysiNode*)pPhyNode;
    SExprInfo*     pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
4511
    SSDataBlock*   pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4512

dengyihao's avatar
dengyihao 已提交
4513
    int32_t    numOfScalarExpr = 0;
4514 4515 4516 4517 4518
    SExprInfo* pScalarExprInfo = NULL;
    if (pAggNode->pExprs != NULL) {
      pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
    }

H
Haojun Liao 已提交
4519 4520
    if (pAggNode->pGroupKeys != NULL) {
      SArray* pColList = extractColumnInfo(pAggNode->pGroupKeys);
dengyihao's avatar
dengyihao 已提交
4521
      pOptr = createGroupOperatorInfo(ops[0], pExprInfo, num, pResBlock, pColList, pAggNode->node.pConditions,
wmmhello's avatar
wmmhello 已提交
4522
                                      pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4523
    } else {
L
Liu Jicong 已提交
4524 4525
      pOptr = createAggregateOperatorInfo(ops[0], pExprInfo, num, pResBlock, pAggNode->node.pConditions,
                                          pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4526
    }
X
Xiaoyu Wang 已提交
4527
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_INTERVAL == type || QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type) {
H
Haojun Liao 已提交
4528
    SIntervalPhysiNode* pIntervalPhyNode = (SIntervalPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4529

H
Haojun Liao 已提交
4530
    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
4531
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4532

dengyihao's avatar
dengyihao 已提交
4533 4534 4535 4536 4537 4538
    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
H
Haojun Liao 已提交
4539

X
Xiaoyu Wang 已提交
4540 4541 4542 4543 4544
    STimeWindowAggSupp as = {
        .waterMark = pIntervalPhyNode->window.watermark,
        .calTrigger = pIntervalPhyNode->window.triggerType,
        .maxTs = INT64_MIN,
    };
4545
    ASSERT(as.calTrigger != STREAM_TRIGGER_MAX_DELAY);
4546

4547
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4548
    bool    isStream = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type);
4549 4550
    pOptr = createIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, &as, pIntervalPhyNode,
                                       pTaskInfo, isStream);
4551

4552 4553
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == type) {
    SMergeAlignedIntervalPhysiNode* pIntervalPhyNode = (SMergeAlignedIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4554 4555 4556 4557 4558 4559 4560 4561 4562 4563

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4564

S
shenglian zhou 已提交
4565
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4566 4567
    pOptr = createMergeAlignedIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId,
                                                   pPhyNode->pConditions, pTaskInfo);
S
shenglian zhou 已提交
4568
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_INTERVAL == type) {
X
Xiaoyu Wang 已提交
4569
    SMergeIntervalPhysiNode* pIntervalPhyNode = (SMergeIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4570 4571 4572 4573 4574 4575 4576 4577 4578 4579

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4580

S
shenglian zhou 已提交
4581 4582
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    pOptr = createMergeIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
5
54liuyao 已提交
4583
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL == type) {
4584
    int32_t children = 0;
5
54liuyao 已提交
4585 4586
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL == type) {
5
54liuyao 已提交
4587
    int32_t children = pHandle->numOfVgroups;
5
54liuyao 已提交
4588
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4589
  } else if (QUERY_NODE_PHYSICAL_PLAN_SORT == type) {
4590
    pOptr = createSortOperatorInfo(ops[0], (SSortPhysiNode*)pPhyNode, pTaskInfo);
S
shenglian zhou 已提交
4591 4592
  } else if (QUERY_NODE_PHYSICAL_PLAN_GROUP_SORT == type) {
    pOptr = createGroupSortOperatorInfo(ops[0], (SGroupSortPhysiNode*)pPhyNode, pTaskInfo);
X
Xiaoyu Wang 已提交
4593
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE == type) {
4594
    SMergePhysiNode* pMergePhyNode = (SMergePhysiNode*)pPhyNode;
4595
    pOptr = createMultiwayMergeOperatorInfo(ops, size, pMergePhyNode, pTaskInfo);
4596
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_SESSION == type) {
H
Haojun Liao 已提交
4597 4598
    SSessionWinodwPhysiNode* pSessionNode = (SSessionWinodwPhysiNode*)pPhyNode;

X
Xiaoyu Wang 已提交
4599 4600
    STimeWindowAggSupp as = {.waterMark = pSessionNode->window.watermark,
                             .calTrigger = pSessionNode->window.triggerType};
4601

H
Haojun Liao 已提交
4602
    SExprInfo*   pExprInfo = createExprInfo(pSessionNode->window.pFuncs, NULL, &num);
4603
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4604 4605
    int32_t      tsSlotId = ((SColumnNode*)pSessionNode->window.pTspk)->slotId;

L
Liu Jicong 已提交
4606 4607
    pOptr = createSessionAggOperatorInfo(ops[0], pExprInfo, num, pResBlock, pSessionNode->gap, tsSlotId, &as,
                                         pPhyNode->pConditions, pTaskInfo);
4608
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == type) {
4609 4610 4611 4612 4613 4614 4615
    pOptr = createStreamSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_SESSION == type) {
    int32_t children = 0;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_SESSION == type) {
    int32_t children = 1;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4616
  } else if (QUERY_NODE_PHYSICAL_PLAN_PARTITION == type) {
4617
    pOptr = createPartitionOperatorInfo(ops[0], (SPartitionPhysiNode*)pPhyNode, pTaskInfo);
4618
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_STATE == type) {
dengyihao's avatar
dengyihao 已提交
4619
    SStateWinodwPhysiNode* pStateNode = (SStateWinodwPhysiNode*)pPhyNode;
4620

4621 4622
    STimeWindowAggSupp as = {.waterMark = pStateNode->window.watermark, .calTrigger = pStateNode->window.triggerType};

dengyihao's avatar
dengyihao 已提交
4623
    SExprInfo*   pExprInfo = createExprInfo(pStateNode->window.pFuncs, NULL, &num);
4624
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4625 4626
    int32_t      tsSlotId = ((SColumnNode*)pStateNode->window.pTspk)->slotId;

4627
    SColumnNode* pColNode = (SColumnNode*)((STargetNode*)pStateNode->pStateKey)->pExpr;
X
Xiaoyu Wang 已提交
4628
    SColumn      col = extractColumnFromColumnNode(pColNode);
L
Liu Jicong 已提交
4629 4630
    pOptr = createStatewindowOperatorInfo(ops[0], pExprInfo, num, pResBlock, &as, tsSlotId, &col, pPhyNode->pConditions,
                                          pTaskInfo);
4631
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == type) {
5
54liuyao 已提交
4632
    pOptr = createStreamStateAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4633
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_JOIN == type) {
4634
    pOptr = createMergeJoinOperatorInfo(ops, size, (SJoinPhysiNode*)pPhyNode, pTaskInfo);
4635
  } else if (QUERY_NODE_PHYSICAL_PLAN_FILL == type) {
H
Haojun Liao 已提交
4636
    pOptr = createFillOperatorInfo(ops[0], (SFillPhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4637 4638
  } else if (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC == type) {
    pOptr = createIndefinitOutputOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4639 4640
  } else if (QUERY_NODE_PHYSICAL_PLAN_INTERP_FUNC == type) {
    pOptr = createTimeSliceOperatorInfo(ops[0], pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4641 4642
  } else {
    ASSERT(0);
H
Haojun Liao 已提交
4643
  }
4644 4645 4646

  taosMemoryFree(ops);
  return pOptr;
4647
}
H
Haojun Liao 已提交
4648

H
Haojun Liao 已提交
4649
/*
 * Build an array of SColumn descriptors from a list of target nodes.
 *
 * Targets whose expression is a column node are converted with
 * extractColumnFromColumnNode(); targets whose expression is a value node get
 * a descriptor whose slot id and column id are both the target's slot id.
 * Targets with any other expression kind are skipped.
 *
 * @param pNodeList  list of STargetNode entries
 * @return a new SArray of SColumn, or NULL (terrno = TSDB_CODE_OUT_OF_MEMORY)
 *         when the array cannot be allocated
 */
SArray* extractColumnInfo(SNodeList* pNodeList) {
  size_t  numOfCols = LIST_LENGTH(pNodeList);
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  for (int32_t i = 0; i < (int32_t)numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);

    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

      SColumn c = extractColumnFromColumnNode(pColNode);
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};
      c.slotId = pNode->slotId;
      c.colId = pNode->slotId;
      // the column's data type lives in resType; node.type is the node kind (QUERY_NODE_VALUE)
      c.type = pValNode->node.resType.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
  }

  return pList;
}

4682
#if 0
// Disabled code: opens a tsdb reader for the tables selected by a table scan node.
// Returns the reader, or NULL with terrno set to the failure code. terrno is set to 0
// when no table qualifies for the query.
// NOTE(review): getTableList() is called here with four arguments, while the tag-scan
// branch of createOperatorTree() passes six; update the call before re-enabling.
STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
                                STableListInfo* pTableListInfo, const char* idstr) {
  int32_t code = getTableList(pHandle->meta, pHandle->vnode, &pTableScanNode->scan, pTableListInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  if (taosArrayGetSize(pTableListInfo->pTableList) == 0) {
    code = 0;
    qDebug("no table qualified for query, %s", idstr);
    goto _error;
  }

  SQueryTableDataCond cond = {0};
  code = initQueryTableDataCond(&cond, pTableScanNode);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  STsdbReader* pReader = NULL;
  code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, idstr);

  // release the condition on both the success and the failure path
  cleanupQueryTableDataCond(&cond);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pReader;

_error:
  terrno = code;
  return NULL;
}
#endif
H
Haojun Liao 已提交
4717

L
Liu Jicong 已提交
4718 4719 4720 4721 4722 4723 4724 4725 4726 4727 4728 4729 4730
/*
 * Walk down a single-child operator chain until the stream scan operator is
 * reached and hand back the info of the table scan operator embedded in it.
 *
 * @param pOperator  operator to start from
 * @param ppInfo     receives the table scan info on success
 * @return 0 on success; TSDB_CODE_QRY_APP_ERROR when the chain ends without a
 *         stream scan or an operator has more than one downstream
 */
static int32_t extractTbscanInStreamOpTree(SOperatorInfo* pOperator, STableScanInfo** ppInfo) {
  SOperatorInfo* pCur = pOperator;

  while (pCur->operatorType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    if (pCur->numOfDownstream == 0) {
      qError("failed to find stream scan operator");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    if (pCur->numOfDownstream > 1) {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    pCur = pCur->pDownstream[0];
  }

  SStreamScanInfo* pStreamInfo = pCur->info;
  ASSERT(pStreamInfo->pTableScanOp->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN);
  *ppInfo = pStreamInfo->pTableScanOp->info;
  return 0;
}

4738 4739 4740 4741 4742 4743 4744 4745 4746 4747 4748 4749 4750 4751 4752 4753 4754 4755 4756 4757 4758 4759
/*
 * Follow a chain of single-child physical plan nodes down to its leaf and
 * return that leaf as a table scan node.
 *
 * @param pNode   plan node to start from
 * @param ppNode  receives the table scan node on success
 * @return 0 on success; -1 with terrno = TSDB_CODE_QRY_APP_ERROR when a node
 *         has more than one child or the leaf is not a table scan
 */
int32_t extractTableScanNode(SPhysiNode* pNode, STableScanPhysiNode** ppNode) {
  SPhysiNode* pCur = pNode;

  // descend while the current node still has children
  while (pCur->pChildren != NULL && LIST_LENGTH(pCur->pChildren) != 0) {
    if (LIST_LENGTH(pCur->pChildren) != 1) {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }

    pCur = (SPhysiNode*)nodesListGetNode(pCur->pChildren, 0);
  }

  if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN != pCur->type) {
    ASSERT(0);
    terrno = TSDB_CODE_QRY_APP_ERROR;
    return -1;
  }

  *ppNode = (STableScanPhysiNode*)pCur;
  return 0;
}

4760
#if 0
// Disabled code: closes the data reader of the table scan found below a stream scan
// operator and replaces it with a freshly created one.
// Returns 0 on success, -1 when the table scan info cannot be located, and
// TSDB_CODE_QRY_APP_ERROR when the new reader cannot be created.
int32_t rebuildReader(SOperatorInfo* pOperator, SSubplan* plan, SReadHandle* pHandle, int64_t uid, int64_t ts) {
  STableScanInfo* pScanInfo = NULL;
  int32_t         rc = extractTbscanInStreamOpTree(pOperator, &pScanInfo);
  if (rc < 0) {
    return -1;
  }

  STableScanPhysiNode* pScanNode = NULL;
  rc = extractTableScanNode(plan->pNode, &pScanNode);
  if (rc < 0) {
    ASSERT(0);
  }

  tsdbReaderClose(pScanInfo->dataReader);

  STableListInfo tableList = {0};
  pScanInfo->dataReader = doCreateDataReader(pScanNode, pHandle, &tableList, NULL);
  if (NULL == pScanInfo->dataReader) {
    ASSERT(0);
    qError("failed to create data reader");
    return TSDB_CODE_QRY_APP_ERROR;
  }

  // TODO: set uid and ts to data reader
  return 0;
}
#endif
4785

C
Cary Xu 已提交
4786
/*
 * Serialise the result rows of an operator tree into one heap buffer.
 *
 * The buffer starts with an int32 holding its total size (that header included),
 * followed by the payloads produced by every operator that has an
 * encodeResultRow callback, in pre-order (an operator first, then each of its
 * downstream operators). Operators whose callback yields a zero-length payload
 * contribute nothing.
 *
 * @param ops           root of the (sub)tree to encode
 * @param result        in/out buffer pointer; allocated on first use, grown afterwards,
 *                      freed and reset to NULL on failure
 * @param length        receives the total buffer size after each appended payload
 * @param nOptrWithVal  incremented once per operator that contributed a payload
 * @return TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT for a NULL out-parameter,
 *         TSDB_CODE_OUT_OF_MEMORY, or the error returned by a callback
 */
int32_t encodeOperator(SOperatorInfo* ops, char** result, int32_t* length, int32_t* nOptrWithVal) {
  if (ops->fpSet.encodeResultRow) {
    if (NULL == result || NULL == length || NULL == nOptrWithVal) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    char*   pPayload = NULL;
    int32_t payloadLen = 0;
    int32_t rc = ops->fpSet.encodeResultRow(ops, &pPayload, &payloadLen);
    if (rc != TDB_CODE_SUCCESS) {
      if (*result != NULL) {
        taosMemoryFree(*result);
        *result = NULL;
      }
      return rc;
    }

    if (payloadLen == 0) {
      // nothing to append for this operator, continue with its downstream
      ASSERT(!pPayload);
    } else {
      ++(*nOptrWithVal);

      ASSERT(payloadLen >= 0);

      if (*result != NULL) {
        // append to the existing buffer; the header already holds the used size
        int32_t usedLen = *(int32_t*)(*result);
        char*   pGrown = (char*)taosMemoryRealloc(*result, usedLen + payloadLen);
        if (pGrown == NULL) {
          taosMemoryFree(pPayload);
          taosMemoryFree(*result);
          *result = NULL;
          return TSDB_CODE_OUT_OF_MEMORY;
        }
        *result = pGrown;
        memcpy(*result + usedLen, pPayload, payloadLen);
        *(int32_t*)(*result) += payloadLen;
      } else {
        // first payload: reserve room for the length header in front of it
        *result = (char*)taosMemoryCalloc(1, payloadLen + sizeof(int32_t));
        if (*result == NULL) {
          taosMemoryFree(pPayload);
          return TSDB_CODE_OUT_OF_MEMORY;
        }
        memcpy(*result + sizeof(int32_t), pPayload, payloadLen);
        *(int32_t*)(*result) = payloadLen + sizeof(int32_t);
      }

      taosMemoryFree(pPayload);
      *length = *(int32_t*)(*result);
    }
  }

  for (int32_t idx = 0; idx < ops->numOfDownstream; ++idx) {
    int32_t rc = encodeOperator(ops->pDownstream[idx], result, length, nOptrWithVal);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }
  }

  return TDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4846
/*
 * Worker for decodeOperator(): decode one operator and its downstream operators
 * while advancing a cursor that is shared by the whole tree.
 *
 * @param ops      operator to decode
 * @param ppBlob   in/out: start of the next undecoded payload, NULL once every
 *                 payload has been consumed (or when no buffer was supplied)
 * @param pRemain  in/out: bytes left in the buffer, counted like the buffer's
 *                 length header (i.e. including sizeof(int32_t))
 */
static int32_t decodeOperatorImpl(SOperatorInfo* ops, const char** ppBlob, int32_t* pRemain) {
  int32_t code = TDB_CODE_SUCCESS;

  if (ops->fpSet.decodeResultRow) {
    const char* pBlob = *ppBlob;
    if (pBlob == NULL) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    code = ops->fpSet.decodeResultRow(ops, (char*)pBlob);
    if (code != TDB_CODE_SUCCESS) {
      return code;
    }

    // every payload starts with its own int32 length; read it without assuming alignment
    int32_t blobLen = 0;
    memcpy(&blobLen, pBlob, sizeof(blobLen));

    if (*pRemain == blobLen + (int32_t)sizeof(int32_t)) {  // the last data
      *ppBlob = NULL;
      *pRemain = 0;
    } else {
      *ppBlob = pBlob + blobLen;
      *pRemain -= blobLen;
    }
  }

  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    code = decodeOperatorImpl(ops->pDownstream[i], ppBlob, pRemain);
    if (code != TDB_CODE_SUCCESS) {
      return code;
    }
  }

  return TDB_CODE_SUCCESS;
}

/*
 * Restore the result rows of an operator tree from a buffer produced by
 * encodeOperator().
 *
 * The buffer starts with an int32 total size followed by the payloads in
 * pre-order. Each operator that has a decodeResultRow callback consumes the
 * next payload. The position is carried across sibling downstream operators,
 * so payloads are consumed in the same order in which encodeOperator() appends
 * them, and the caller's buffer is never written to.
 *
 * @param ops     root of the operator tree
 * @param result  encoded buffer; may be NULL only if no operator needs decoding
 * @param length  total size of the buffer, expected to equal its leading int32
 * @return TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT when an operator needs a
 *         payload but none is left, or the error returned by a callback
 */
int32_t decodeOperator(SOperatorInfo* ops, const char* result, int32_t length) {
  const char* pBlob = NULL;
  int32_t     remain = 0;

  if (result != NULL) {
    if (length >= (int32_t)sizeof(int32_t)) {
      int32_t header = 0;
      memcpy(&header, result, sizeof(header));
      ASSERT(length == header);
    }

    pBlob = result + sizeof(int32_t);  // skip the total-size header
    remain = length;
  }

  return decodeOperatorImpl(ops, &pBlob, &remain);
}

D
dapan1121 已提交
4883
/*
 * Allocate the parameter object that matches the kind of data sink node.
 *
 *  - query-insert sink: an SInserterParam carrying the read handle
 *  - delete sink:       an SDeleterParam carrying the task's suid and the uid
 *                       of every table in the task's table list
 *  - any other sink:    nothing is allocated and *pParam is left untouched
 *
 * @param pNode       data sink plan node
 * @param pParam      receives the allocated parameter object
 * @param pTaskInfo   pointer to the task handle
 * @param readHandle  read handle stored in the inserter parameter
 * @return TSDB_CODE_SUCCESS or TSDB_CODE_OUT_OF_MEMORY
 */
int32_t createDataSinkParam(SDataSinkNode* pNode, void** pParam, qTaskInfo_t* pTaskInfo, SReadHandle* readHandle) {
  SExecTaskInfo* pTask = *(SExecTaskInfo**)pTaskInfo;

  if (QUERY_NODE_PHYSICAL_PLAN_QUERY_INSERT == pNode->type) {
    SInserterParam* pInserter = taosMemoryCalloc(1, sizeof(SInserterParam));
    if (pInserter == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pInserter->readHandle = readHandle;
    *pParam = pInserter;
    return TSDB_CODE_SUCCESS;
  }

  if (QUERY_NODE_PHYSICAL_PLAN_DELETE == pNode->type) {
    SDeleterParam* pDeleter = taosMemoryCalloc(1, sizeof(SDeleterParam));
    if (pDeleter == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    int32_t tbNum = taosArrayGetSize(pTask->tableqinfoList.pTableList);
    pDeleter->suid = pTask->tableqinfoList.suid;
    pDeleter->pUidList = taosArrayInit(tbNum, sizeof(uint64_t));
    if (pDeleter->pUidList == NULL) {
      taosMemoryFree(pDeleter);
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // copy the uid of every table known to the task
    for (int32_t idx = 0; idx < tbNum; ++idx) {
      STableKeyInfo* pKeyInfo = taosArrayGet(pTask->tableqinfoList.pTableList, idx);
      taosArrayPush(pDeleter->pUidList, &pKeyInfo->uid);
    }

    *pParam = pDeleter;
    return TSDB_CODE_SUCCESS;
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
4924
/*
 * Create an execution task for a sub-plan and build its operator tree.
 *
 * @param pPlan      sub-plan to execute
 * @param pTaskInfo  receives the new task; reset to NULL on failure
 * @param pHandle    read handle forwarded to the operator tree
 * @param taskId     id of the task
 * @param sql        sql text stored in the task (the pointer is stored, not copied)
 * @param model      execution model of the task
 * @return TSDB_CODE_SUCCESS, or the failure code (also stored in terrno)
 */
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
                               const char* sql, EOPTR_EXEC_MODEL model) {
  uint64_t queryId = pPlan->id.queryId;
  int32_t  code = TSDB_CODE_SUCCESS;

  *pTaskInfo = createExecTaskInfo(queryId, taskId, model, pPlan->dbFName);
  if (*pTaskInfo != NULL) {
    (*pTaskInfo)->sql = sql;
    (*pTaskInfo)->pRoot = createOperatorTree(pPlan->pNode, *pTaskInfo, pHandle, &(*pTaskInfo)->tableqinfoList, pPlan->pTagCond, pPlan->pTagIndexCond, pPlan->user);

    if ((*pTaskInfo)->pRoot != NULL) {
      return code;
    }

    // the operator tree reports its failure reason through the task
    code = (*pTaskInfo)->code;
  } else {
    code = TSDB_CODE_QRY_OUT_OF_MEMORY;
  }

  // NOTE(review): only the task struct itself is released here; anything the task
  // already owns at this point (e.g. its table list) is presumably leaked - confirm.
  taosMemoryFreeClear(*pTaskInfo);
  terrno = code;
  return code;
}

wmmhello's avatar
wmmhello 已提交
4951 4952 4953
/*
 * Release everything owned by a table list: the per-group arrays, the group
 * list, the table array and the uid -> group id map. All released pointers are
 * reset to NULL afterwards.
 *
 * @param pTableqinfoList  table list to tear down
 */
static void doDestroyTableList(STableListInfo* pTableqinfoList) {
  // Walk the groups while pTableList is still alive: a group entry may alias it and
  // must then be skipped, so the comparison has to happen before pTableList is freed.
  if (pTableqinfoList->needSortTableByGroupId) {
    size_t numOfGroups = taosArrayGetSize(pTableqinfoList->pGroupList);
    for (size_t i = 0; i < numOfGroups; i++) {
      SArray* tmp = taosArrayGetP(pTableqinfoList->pGroupList, i);
      if (tmp == pTableqinfoList->pTableList) {
        continue;
      }
      taosArrayDestroy(tmp);
    }
  }
  taosArrayDestroy(pTableqinfoList->pGroupList);

  taosArrayDestroy(pTableqinfoList->pTableList);
  taosHashCleanup(pTableqinfoList->map);

  // leave no dangling pointer behind
  pTableqinfoList->pGroupList = NULL;
  pTableqinfoList->pTableList = NULL;
  pTableqinfoList->map = NULL;
}

L
Liu Jicong 已提交
4969
/**
 * Destroy an execution task: its table list, operator tree, schema info,
 * the sql and id strings, and finally the task structure itself.
 *
 * @param pTaskInfo  task to destroy; NULL is accepted and ignored
 */
void doDestroyTask(SExecTaskInfo* pTaskInfo) {
  // behave like free(NULL) instead of dereferencing a NULL task in the log line below
  if (pTaskInfo == NULL) {
    return;
  }

  qDebug("%s execTask is freed", GET_TASKID(pTaskInfo));

  doDestroyTableList(&pTaskInfo->tableqinfoList);
  destroyOperatorInfo(pTaskInfo->pRoot);
  cleanupTableSchemaInfo(pTaskInfo);

  taosMemoryFreeClear(pTaskInfo->sql);
  taosMemoryFreeClear(pTaskInfo->id.str);
  taosMemoryFreeClear(pTaskInfo);
}

/**
 * Write one tag value into a result buffer.
 *
 * @param output  destination buffer
 * @param val     source value; NULL writes the type's null representation via setNull()
 * @param type    data type of the value
 * @param bytes   number of bytes available for the value in the destination
 */
static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes) {
  if (val == NULL) {
    setNull(output, type, bytes);
    return;
  }

  // fixed-length types are copied verbatim
  if (!IS_VAR_DATA_TYPE(type)) {
    memcpy(output, val, bytes);
    return;
  }

  // variable-length value that fits, header included
  if (varDataTLen(val) <= bytes) {
    varDataCopy(output, val);
    return;
  }

  // the value is longer than the destination: keep only the payload that fits
  int32_t capacity = bytes - VARSTR_HEADER_SIZE;
  int32_t copyLen;
  if (varDataLen(val) > capacity) {
    copyLen = capacity;
  } else {
    copyLen = varDataLen(val);
  }

  memcpy(varDataVal(output), varDataVal(val), copyLen);
  varDataSetLen(output, copyLen);
}

/**
 * Estimate the query buffer size for a number of tables:
 * 1.5 * sizeof(STableQueryInfo) per table, truncated to int64_t.
 * sizeof(STableCheckInfo), the buffer consumption in tsdb, is not counted.
 *
 * @param numOfTables  number of tables
 * @return estimated buffer size in bytes
 */
static int64_t getQuerySupportBufSize(size_t numOfTables) {
  const size_t perTable = sizeof(STableQueryInfo);
  double       estimate = perTable * 1.5 * numOfTables;
  return (int64_t)estimate;
}

/**
 * Reserve query buffer for the given number of tables from tsQueryBufferSizeBytes.
 *
 * A negative tsQueryBufferSizeBytes always succeeds without reserving anything;
 * a value of zero disables query processing.
 *
 * @param numOfTables  number of tables
 * @return TSDB_CODE_SUCCESS when the reservation succeeds (or none is needed),
 *         TSDB_CODE_QRY_NOT_ENOUGH_BUFFER otherwise
 */
int32_t checkForQueryBuf(size_t numOfTables) {
  int64_t required = getQuerySupportBufSize(numOfTables);

  if (tsQueryBufferSizeBytes < 0) {
    return TSDB_CODE_SUCCESS;
  }

  // disable query processing if the value of tsQueryBufferSize is zero.
  if (tsQueryBufferSizeBytes <= 0) {
    return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
  }

  // retry the compare-and-swap until the deduction lands or the budget is too small
  for (;;) {
    int64_t available = tsQueryBufferSizeBytes;
    int64_t left = available - required;
    if (left < 0) {
      return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
    }

    if (atomic_val_compare_exchange_64(&tsQueryBufferSizeBytes, available, left) == available) {
      return TSDB_CODE_SUCCESS;
    }
  }
}

/**
 * Return the query buffer estimated for the given number of tables to
 * tsQueryBufferSizeBytes. Nothing is done when tsQueryBufferSizeBytes is negative.
 *
 * @param numOfTables  number of tables
 */
void releaseQueryBuf(size_t numOfTables) {
  if (tsQueryBufferSizeBytes >= 0) {
    int64_t reserved = getQuerySupportBufSize(numOfTables);

    // add the estimated size back to the available budget
    atomic_add_fetch_64(&tsQueryBufferSizeBytes, reserved);
  }
}
D
dapan1121 已提交
5040

dengyihao's avatar
dengyihao 已提交
5041 5042
/**
 * Collect explain/execution statistics for an operator and, recursively, for all of
 * its downstream operators. The operator's own entry is stored before its children's.
 *
 * @param operatorInfo  operator to report on
 * @param pRes          [in/out] result array; grown by 10 entries whenever it is full
 * @param capacity      [in/out] number of entries *pRes can hold
 * @param resNum        [in/out] number of entries already filled
 * @return TSDB_CODE_SUCCESS on success; TSDB_CODE_QRY_OUT_OF_MEMORY when the array cannot
 *         be grown; otherwise the error code reported by getExplainFn or a downstream call.
 *         *pRes is freed and set to NULL when growing fails or a downstream call fails.
 */
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SExplainExecInfo** pRes, int32_t* capacity,
                                   int32_t* resNum) {
  if (*resNum >= *capacity) {
    *capacity += 10;

    // reallocate through a temporary so the old buffer is not lost when realloc fails
    SExplainExecInfo* pNew = taosMemoryRealloc(*pRes, (*capacity) * sizeof(SExplainExecInfo));
    if (NULL == pNew) {
      qError("malloc %d failed", (*capacity) * (int32_t)sizeof(SExplainExecInfo));
      // callers still observe *pRes == NULL on this path, but the old buffer is now released
      taosMemoryFreeClear(*pRes);
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }
    *pRes = pNew;
  }

  SExplainExecInfo* pInfo = &(*pRes)[*resNum];

  pInfo->numOfRows = operatorInfo->resultInfo.totalRows;
  pInfo->startupCost = operatorInfo->cost.openCost;
  pInfo->totalCost = operatorInfo->cost.totalCost;

  if (operatorInfo->fpSet.getExplainFn) {
    int32_t code = operatorInfo->fpSet.getExplainFn(operatorInfo, &pInfo->verboseInfo, &pInfo->verboseLen);
    if (code) {
      qError("%s operator getExplainFn failed, code:%s", GET_TASKID(operatorInfo->pTaskInfo), tstrerror(code));
      return code;
    }
  } else {
    pInfo->verboseLen = 0;
    pInfo->verboseInfo = NULL;
  }

  ++(*resNum);

  for (int32_t i = 0; i < operatorInfo->numOfDownstream; ++i) {
    int32_t code = getOperatorExplainExecInfo(operatorInfo->pDownstream[i], pRes, capacity, resNum);
    if (code) {
      taosMemoryFreeClear(*pRes);
      // propagate the real failure reason instead of always reporting out-of-memory
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}
5
54liuyao 已提交
5083

L
Liu Jicong 已提交
5084
/**
 * Initialise a stream aggregate supporter: key buffer, result-row hash table, scan-window
 * array and the disk-based result buffer, which is then attached to every function context.
 *
 * @param pSup         supporter to initialise
 * @param pKey         key forwarded to createDiskbasedBuf()
 * @param pCtx         array of function contexts; each pBuf is set to the new result buffer
 * @param numOfOutput  number of entries in pCtx
 * @param size         stored as pSup->valueSize
 * @return TSDB_CODE_OUT_OF_MEMORY when the key buffer, hash table or scan-window array cannot
 *         be allocated; otherwise the return code of createDiskbasedBuf()
 *
 * NOTE(review): on failure, members that were already allocated stay in pSup; presumably the
 * caller's teardown releases them - confirm.
 */
int32_t initStreamAggSupporter(SStreamAggSupporter* pSup, const char* pKey, SqlFunctionCtx* pCtx, int32_t numOfOutput,
                               int32_t size) {
  pSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pSup->keySize = sizeof(int64_t) + sizeof(TSKEY);
  pSup->pKeyBuf = taosMemoryCalloc(1, pSup->keySize);

  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pSup->pResultRows = taosHashInit(1024, hashFn, false, HASH_NO_LOCK);
  if (pSup->pKeyBuf == NULL || pSup->pResultRows == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  pSup->valueSize = size;

  pSup->pScanWindow = taosArrayInit(4, sizeof(STimeWindow));
  if (pSup->pScanWindow == NULL) {
    // report the failed allocation here instead of leaving a NULL array for later use
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // grow the page size (starting at 4096) until one page holds at least four result rows
  int32_t pageSize = 4096;
  while (pageSize < pSup->resultRowSize * 4) {
    pageSize <<= 1u;
  }

  // default buffer is 4096 * 256 bytes; if a single page is at least that large,
  // size the buffer to four pages instead
  int32_t bufSize = 4096 * 256;
  if (bufSize <= pageSize) {
    bufSize = pageSize * 4;
  }

  int32_t code = createDiskbasedBuf(&pSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
  for (int32_t i = 0; i < numOfOutput; ++i) {
    pCtx[i].pBuf = pSup->pResultBuf;
  }

  return code;
}