executorimpl.c 177.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

H
Haojun Liao 已提交
16 17
#include "filter.h"
#include "function.h"
18 19
#include "functionMgt.h"
#include "os.h"
H
Haojun Liao 已提交
20
#include "querynodes.h"
21
#include "tfill.h"
dengyihao's avatar
dengyihao 已提交
22
#include "tname.h"
X
Xiaoyu Wang 已提交
23
#include "tref.h"
24

H
Haojun Liao 已提交
25
#include "tdatablock.h"
26
#include "tglobal.h"
H
Haojun Liao 已提交
27
#include "tmsg.h"
H
Haojun Liao 已提交
28
#include "tsort.h"
29
#include "ttime.h"
H
Haojun Liao 已提交
30

31
#include "executorimpl.h"
dengyihao's avatar
dengyihao 已提交
32
#include "index.h"
33
#include "query.h"
34 35
#include "tcompare.h"
#include "tcompression.h"
H
Haojun Liao 已提交
36
#include "thash.h"
37
#include "ttypes.h"
dengyihao's avatar
dengyihao 已提交
38
#include "vnode.h"
39

H
Haojun Liao 已提交
40
#define IS_MAIN_SCAN(runtime)          ((runtime)->scanFlag == MAIN_SCAN)
41 42 43 44 45 46
#define SET_REVERSE_SCAN_FLAG(runtime) ((runtime)->scanFlag = REVERSE_SCAN)

#define GET_FORWARD_DIRECTION_FACTOR(ord) (((ord) == TSDB_ORDER_ASC) ? QUERY_ASC_FORWARD_STEP : QUERY_DESC_FORWARD_STEP)

#if 0
static UNUSED_FUNC void *u_malloc (size_t __size) {
wafwerar's avatar
wafwerar 已提交
47
  uint32_t v = taosRand();
48 49 50 51

  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
52
    return taosMemoryMalloc(__size);
53 54 55 56
  }
}

static UNUSED_FUNC void* u_calloc(size_t num, size_t __size) {
wafwerar's avatar
wafwerar 已提交
57
  uint32_t v = taosRand();
58 59 60
  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
61
    return taosMemoryCalloc(num, __size);
62 63 64 65
  }
}

static UNUSED_FUNC void* u_realloc(void* p, size_t __size) {
wafwerar's avatar
wafwerar 已提交
66
  uint32_t v = taosRand();
67 68 69
  if (v % 5 <= 1) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
70
    return taosMemoryRealloc(p, __size);
71 72 73 74 75 76 77 78
  }
}

#define calloc  u_calloc
#define malloc  u_malloc
#define realloc u_realloc
#endif

X
Xiaoyu Wang 已提交
79
#define CLEAR_QUERY_STATUS(q, st)   ((q)->status &= (~(st)))
80 81
#define QUERY_IS_INTERVAL_QUERY(_q) ((_q)->interval.interval > 0)

L
Liu Jicong 已提交
82 83 84
int32_t getMaximumIdleDurationSec() { return tsShellActivityTimer * 2; }

static int32_t getExprFunctionId(SExprInfo* pExprInfo) {
85
  assert(pExprInfo != NULL && pExprInfo->pExpr != NULL && pExprInfo->pExpr->nodeType == TEXPR_UNARYEXPR_NODE);
86
  return 0;
87 88 89 90
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes);

91
static void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExpr, SSDataBlock* pSDataBlock);
92

X
Xiaoyu Wang 已提交
93
static void releaseQueryBuf(size_t numOfTables);
94 95 96 97 98

static void destroySFillOperatorInfo(void* param, int32_t numOfOutput);
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput);
static void destroyOrderOperatorInfo(void* param, int32_t numOfOutput);
static void destroyAggOperatorInfo(void* param, int32_t numOfOutput);
X
Xiaoyu Wang 已提交
99

H
Haojun Liao 已提交
100
static void destroyIntervalOperatorInfo(void* param, int32_t numOfOutput);
H
Haojun Liao 已提交
101 102
static void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput);

103 104
static void destroyOperatorInfo(SOperatorInfo* pOperator);

105
void doSetOperatorCompleted(SOperatorInfo* pOperator) {
106
  pOperator->status = OP_EXEC_DONE;
107

108
  pOperator->cost.totalCost = (taosGetTimestampUs() - pOperator->pTaskInfo->cost.start * 1000) / 1000.0;
H
Haojun Liao 已提交
109
  if (pOperator->pTaskInfo != NULL) {
110
    setTaskStatus(pOperator->pTaskInfo, TASK_COMPLETED);
111 112
  }
}
113

H
Haojun Liao 已提交
114
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator) {
115
  OPTR_SET_OPENED(pOperator);
116
  pOperator->cost.openCost = 0;
H
Haojun Liao 已提交
117
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
118 119
}

120
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
L
Liu Jicong 已提交
121
                                   __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
122
                                   __optr_decode_fn_t decode, __optr_explain_fn_t explain) {
123 124 125 126 127 128 129 130 131 132 133 134 135 136
  SOperatorFpSet fpSet = {
      ._openFn = openFn,
      .getNextFn = nextFn,
      .getStreamResFn = streamFn,
      .cleanupFn = cleanup,
      .closeFn = closeFn,
      .encodeResultRow = encode,
      .decodeResultRow = decode,
      .getExplainFn = explain,
  };

  return fpSet;
}

H
Haojun Liao 已提交
137
void operatorDummyCloseFn(void* param, int32_t numOfCols) {}
H
Haojun Liao 已提交
138

X
Xiaoyu Wang 已提交
139 140 141
static int32_t doCopyToSDataBlock(SExecTaskInfo* taskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo,
                                  SDiskbasedBuf* pBuf, SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset,
                                  SqlFunctionCtx* pCtx, int32_t numOfExprs);
H
Haojun Liao 已提交
142

143
static void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size);
L
Liu Jicong 已提交
144 145
static void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                                     uint64_t groupId);
146

L
Liu Jicong 已提交
147 148
// setup the output buffer for each operator
static bool hasNull(SColumn* pColumn, SColumnDataAgg* pStatis) {
dengyihao's avatar
dengyihao 已提交
149 150
  if (TSDB_COL_IS_TAG(pColumn->flag) || TSDB_COL_IS_UD_COL(pColumn->flag) ||
      pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
151 152 153 154 155 156 157 158 159 160
    return false;
  }

  if (pStatis != NULL && pStatis->numOfNull == 0) {
    return false;
  }

  return true;
}

161
#if 0
L
Liu Jicong 已提交
162 163
static bool chkResultRowFromKey(STaskRuntimeEnv* pRuntimeEnv, SResultRowInfo* pResultRowInfo, char* pData,
                                int16_t bytes, bool masterscan, uint64_t uid) {
164 165 166
  bool existed = false;
  SET_RES_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid);

L
Liu Jicong 已提交
167 168
  SResultRow** p1 =
      (SResultRow**)taosHashGet(pRuntimeEnv->pResultRowHashTable, pRuntimeEnv->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
169 170 171 172 173 174 175 176 177 178 179

  // in case of repeat scan/reverse scan, no new time window added.
  if (QUERY_IS_INTERVAL_QUERY(pRuntimeEnv->pQueryAttr)) {
    if (!masterscan) {  // the *p1 may be NULL in case of sliding+offset exists.
      return p1 != NULL;
    }

    if (p1 != NULL) {
      if (pResultRowInfo->size == 0) {
        existed = false;
      } else if (pResultRowInfo->size == 1) {
dengyihao's avatar
dengyihao 已提交
180
        //        existed = (pResultRowInfo->pResult[0] == (*p1));
181 182
      } else {  // check if current pResultRowInfo contains the existed pResultRow
        SET_RES_EXT_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid, pResultRowInfo);
L
Liu Jicong 已提交
183 184
        int64_t* index =
            taosHashGet(pRuntimeEnv->pResultRowListSet, pRuntimeEnv->keyBuf, GET_RES_EXT_WINDOW_KEY_LEN(bytes));
185 186 187 188 189 190 191 192 193 194 195 196 197
        if (index != NULL) {
          existed = true;
        } else {
          existed = false;
        }
      }
    }

    return existed;
  }

  return p1 != NULL;
}
198
#endif
199

200
SResultRow* getNewResultRow(SDiskbasedBuf* pResultBuf, int64_t tableGroupId, int32_t interBufSize) {
L
Liu Jicong 已提交
201
  SFilePage* pData = NULL;
202 203 204 205 206 207 208 209 210 211 212 213 214

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tableGroupId);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
    pData->num = sizeof(SFilePage);
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

wmmhello's avatar
wmmhello 已提交
215
    if (pData->num + interBufSize > getBufPageSize(pResultBuf)) {
216 217 218 219 220 221 222 223 224 225 226 227 228 229
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return NULL;
  }

230 231
  setBufPageDirty(pData, true);

232 233 234 235 236
  // set the number of rows in current disk page
  SResultRow* pResultRow = (SResultRow*)((char*)pData + pData->num);
  pResultRow->pageId = pageId;
  pResultRow->offset = (int32_t)pData->num;

wmmhello's avatar
wmmhello 已提交
237
  pData->num += interBufSize;
238 239 240 241

  return pResultRow;
}

242 243 244 245 246 247 248
/**
 * the struct of key in hash table
 * +----------+---------------+
 * | group id |   key data    |
 * | 8 bytes  | actual length |
 * +----------+---------------+
 */
249 250 251
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo, char* pData,
                                   int16_t bytes, bool masterscan, uint64_t groupId, SExecTaskInfo* pTaskInfo,
                                   bool isIntervalQuery, SAggSupporter* pSup) {
252
  SET_RES_WINDOW_KEY(pSup->keyBuf, pData, bytes, groupId);
H
Haojun Liao 已提交
253

dengyihao's avatar
dengyihao 已提交
254 255
  SResultRowPosition* p1 =
      (SResultRowPosition*)taosHashGet(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
H
Haojun Liao 已提交
256

257 258
  SResultRow* pResult = NULL;

H
Haojun Liao 已提交
259 260
  // in case of repeat scan/reverse scan, no new time window added.
  if (isIntervalQuery) {
261 262
    if (masterscan && p1 != NULL) {  // the *p1 may be NULL in case of sliding+offset exists.
      pResult = getResultRowByPos(pResultBuf, p1);
263
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
H
Haojun Liao 已提交
264 265
    }
  } else {
dengyihao's avatar
dengyihao 已提交
266 267
    // In case of group by column query, the required SResultRow object must be existInCurrentResusltRowInfo in the
    // pResultRowInfo object.
H
Haojun Liao 已提交
268
    if (p1 != NULL) {
269
      // todo
270
      pResult = getResultRowByPos(pResultBuf, p1);
271
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
H
Haojun Liao 已提交
272 273 274
    }
  }

L
Liu Jicong 已提交
275
  // 1. close current opened time window
276
  if (pResultRowInfo->cur.pageId != -1 && ((pResult == NULL) || (pResult->pageId != pResultRowInfo->cur.pageId))) {
277
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
278
    qDebug("page_1");
279
#endif
280
    SResultRowPosition pos = pResultRowInfo->cur;
X
Xiaoyu Wang 已提交
281
    SFilePage*         pPage = getBufPage(pResultBuf, pos.pageId);
282 283 284 285 286
    releaseBufPage(pResultBuf, pPage);
  }

  // allocate a new buffer page
  if (pResult == NULL) {
287
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
288
    qDebug("page_2");
289
#endif
H
Haojun Liao 已提交
290
    ASSERT(pSup->resultRowSize > 0);
291 292
    pResult = getNewResultRow(pResultBuf, groupId, pSup->resultRowSize);

293
    initResultRow(pResult);
H
Haojun Liao 已提交
294

295 296
    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = pResult->pageId, .offset = pResult->offset};
X
Xiaoyu Wang 已提交
297 298
    taosHashPut(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes), &pos,
                sizeof(SResultRowPosition));
H
Haojun Liao 已提交
299 300
  }

301 302 303
  // 2. set the new time window to be the new active time window
  pResultRowInfo->cur = (SResultRowPosition){.pageId = pResult->pageId, .offset = pResult->offset};

H
Haojun Liao 已提交
304
  // too many time window in query
305
  if (taosHashGetSize(pSup->pResultRowHashTable) > MAX_INTERVAL_TIME_WINDOW) {
H
Haojun Liao 已提交
306 307 308
    longjmp(pTaskInfo->env, TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW);
  }

H
Haojun Liao 已提交
309
  return pResult;
H
Haojun Liao 已提交
310 311
}

312
// a new buffer page for each table. Needs to opt this design
L
Liu Jicong 已提交
313
static int32_t addNewWindowResultBuf(SResultRow* pWindowRes, SDiskbasedBuf* pResultBuf, int32_t tid, uint32_t size) {
314 315 316 317
  if (pWindowRes->pageId != -1) {
    return 0;
  }

L
Liu Jicong 已提交
318
  SFilePage* pData = NULL;
319 320 321 322 323 324

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tid);

  if (taosArrayGetSize(list) == 0) {
H
Haojun Liao 已提交
325
    pData = getNewBufPage(pResultBuf, tid, &pageId);
326
    pData->num = sizeof(SFilePage);
327 328
  } else {
    SPageInfo* pi = getLastPageInfo(list);
329
    pData = getBufPage(pResultBuf, getPageId(pi));
330
    pageId = getPageId(pi);
331

332
    if (pData->num + size > getBufPageSize(pResultBuf)) {
333
      // release current page first, and prepare the next one
334
      releaseBufPageInfo(pResultBuf, pi);
335

H
Haojun Liao 已提交
336
      pData = getNewBufPage(pResultBuf, tid, &pageId);
337
      if (pData != NULL) {
338
        pData->num = sizeof(SFilePage);
339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358
      }
    }
  }

  if (pData == NULL) {
    return -1;
  }

  // set the number of rows in current disk page
  if (pWindowRes->pageId == -1) {  // not allocated yet, allocate new buffer
    pWindowRes->pageId = pageId;
    pWindowRes->offset = (int32_t)pData->num;

    pData->num += size;
    assert(pWindowRes->pageId >= 0);
  }

  return 0;
}

359
//  query_range_start, query_range_end, window_duration, window_start, window_end
360
void initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow) {
361 362 363
  pColData->info.type = TSDB_DATA_TYPE_TIMESTAMP;
  pColData->info.bytes = sizeof(int64_t);

364
  colInfoDataEnsureCapacity(pColData, 5);
365 366 367 368 369 370 371 372 373
  colDataAppendInt64(pColData, 0, &pQueryWindow->skey);
  colDataAppendInt64(pColData, 1, &pQueryWindow->ekey);

  int64_t interval = 0;
  colDataAppendInt64(pColData, 2, &interval);  // this value may be variable in case of 'n' and 'y'.
  colDataAppendInt64(pColData, 3, &pQueryWindow->skey);
  colDataAppendInt64(pColData, 4, &pQueryWindow->ekey);
}

X
Xiaoyu Wang 已提交
374 375 376
void doApplyFunctions(SExecTaskInfo* taskInfo, SqlFunctionCtx* pCtx, STimeWindow* pWin,
                      SColumnInfoData* pTimeWindowData, int32_t offset, int32_t forwardStep, TSKEY* tsCol,
                      int32_t numOfTotal, int32_t numOfOutput, int32_t order) {
377
  for (int32_t k = 0; k < numOfOutput; ++k) {
H
Haojun Liao 已提交
378
    // keep it temporarily
379
    // todo no need this??
dengyihao's avatar
dengyihao 已提交
380 381
    bool    hasAgg = pCtx[k].input.colDataAggIsSet;
    int32_t numOfRows = pCtx[k].input.numOfRows;
H
Haojun Liao 已提交
382
    int32_t startOffset = pCtx[k].input.startRowIndex;
383

384
    pCtx[k].input.startRowIndex = offset;
385
    pCtx[k].input.numOfRows = forwardStep;
386 387 388

    // not a whole block involved in query processing, statistics data can not be used
    // NOTE: the original value of isSet have been changed here
389 390
    if (pCtx[k].input.colDataAggIsSet && forwardStep < numOfTotal) {
      pCtx[k].input.colDataAggIsSet = false;
391 392
    }

393 394
    if (fmIsWindowPseudoColumnFunc(pCtx[k].functionId)) {
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(&pCtx[k]);
395 396

      char* p = GET_ROWCELL_INTERBUF(pEntryInfo);
397

398
      SColumnInfoData idata = {0};
dengyihao's avatar
dengyihao 已提交
399
      idata.info.type = TSDB_DATA_TYPE_BIGINT;
400
      idata.info.bytes = tDataTypes[TSDB_DATA_TYPE_BIGINT].bytes;
dengyihao's avatar
dengyihao 已提交
401
      idata.pData = p;
402 403 404 405

      SScalarParam out = {.columnData = &idata};
      SScalarParam tw = {.numOfRows = 5, .columnData = pTimeWindowData};
      pCtx[k].sfp.process(&tw, 1, &out);
406
      pEntryInfo->numOfRes = 1;
407 408 409 410 411 412 413 414 415 416
    } else {
      int32_t code = TSDB_CODE_SUCCESS;
      if (functionNeedToExecute(&pCtx[k]) && pCtx[k].fpSet.process != NULL) {
        code = pCtx[k].fpSet.process(&pCtx[k]);

        if (code != TSDB_CODE_SUCCESS) {
          qError("%s apply functions error, code: %s", GET_TASKID(taskInfo), tstrerror(code));
          taskInfo->code = code;
          longjmp(taskInfo->env, code);
        }
417
      }
418

419 420 421 422 423
      // restore it
      pCtx[k].input.colDataAggIsSet = hasAgg;
      pCtx[k].input.startRowIndex = startOffset;
      pCtx[k].input.numOfRows = numOfRows;
    }
424 425 426
  }
}

dengyihao's avatar
dengyihao 已提交
427
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
428
                                   int32_t scanFlag, bool createDummyCol);
429

dengyihao's avatar
dengyihao 已提交
430 431
static void doSetInputDataBlockInfo(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock,
                                    int32_t order) {
432
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
433
    pCtx[i].order = order;
434
    pCtx[i].input.numOfRows = pBlock->info.rows;
435
    setBlockStatisInfo(&pCtx[i], &pOperator->exprSupp.pExprInfo[i], pBlock);
436 437 438
  }
}

X
Xiaoyu Wang 已提交
439 440
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                       int32_t scanFlag, bool createDummyCol) {
441
  if (pBlock->pBlockAgg != NULL) {
H
Haojun Liao 已提交
442
    doSetInputDataBlockInfo(pOperator, pCtx, pBlock, order);
443
  } else {
444
    doSetInputDataBlock(pOperator, pCtx, pBlock, order, scanFlag, createDummyCol);
H
Haojun Liao 已提交
445
  }
446 447
}

L
Liu Jicong 已提交
448 449
static int32_t doCreateConstantValColumnInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t paramIndex,
                                             int32_t numOfRows) {
450 451 452 453 454 455 456 457
  SColumnInfoData* pColInfo = NULL;
  if (pInput->pData[paramIndex] == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
458 459
    pColInfo->info.type = pFuncParam->param.nType;
    pColInfo->info.bytes = pFuncParam->param.nLen;
460 461

    pInput->pData[paramIndex] = pColInfo;
462 463
  } else {
    pColInfo = pInput->pData[paramIndex];
464 465
  }

466
  colInfoDataEnsureCapacity(pColInfo, numOfRows);
467

468
  int8_t type = pFuncParam->param.nType;
469 470
  if (type == TSDB_DATA_TYPE_BIGINT || type == TSDB_DATA_TYPE_UBIGINT) {
    int64_t v = pFuncParam->param.i;
dengyihao's avatar
dengyihao 已提交
471
    for (int32_t i = 0; i < numOfRows; ++i) {
472 473 474 475
      colDataAppendInt64(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
dengyihao's avatar
dengyihao 已提交
476
    for (int32_t i = 0; i < numOfRows; ++i) {
477 478
      colDataAppendDouble(pColInfo, i, &v);
    }
479
  } else if (type == TSDB_DATA_TYPE_VARCHAR) {
L
Liu Jicong 已提交
480
    char* tmp = taosMemoryMalloc(pFuncParam->param.nLen + VARSTR_HEADER_SIZE);
481
    STR_WITH_SIZE_TO_VARSTR(tmp, pFuncParam->param.pz, pFuncParam->param.nLen);
L
Liu Jicong 已提交
482
    for (int32_t i = 0; i < numOfRows; ++i) {
483 484
      colDataAppend(pColInfo, i, tmp, false);
    }
485 486 487 488 489
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
490
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
X
Xiaoyu Wang 已提交
491
                                   int32_t scanFlag, bool createDummyCol) {
492 493
  int32_t code = TSDB_CODE_SUCCESS;

494
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
L
Liu Jicong 已提交
495
    pCtx[i].order = order;
496 497
    pCtx[i].input.numOfRows = pBlock->info.rows;

L
Liu Jicong 已提交
498
    pCtx[i].pSrcBlock = pBlock;
X
Xiaoyu Wang 已提交
499
    pCtx[i].scanFlag = scanFlag;
H
Haojun Liao 已提交
500

501
    SInputColumnInfoData* pInput = &pCtx[i].input;
502
    pInput->uid = pBlock->info.uid;
C
Cary Xu 已提交
503
    pInput->colDataAggIsSet = false;
504

505
    SExprInfo* pOneExpr = &pOperator->exprSupp.pExprInfo[i];
506
    for (int32_t j = 0; j < pOneExpr->base.numOfParams; ++j) {
dengyihao's avatar
dengyihao 已提交
507
      SFunctParam* pFuncParam = &pOneExpr->base.pParam[j];
G
Ganlin Zhao 已提交
508 509
      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
dengyihao's avatar
dengyihao 已提交
510
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
511 512 513
        pInput->totalRows = pBlock->info.rows;
        pInput->numOfRows = pBlock->info.rows;
        pInput->startRowIndex = 0;
514

515
        // NOTE: the last parameter is the primary timestamp column
516 517 518
        if (fmIsTimelineFunc(pCtx[i].functionId) && (j == pOneExpr->base.numOfParams - 1)) {
          pInput->pPTS = pInput->pData[j];
        }
519 520
        ASSERT(pInput->pData[j] != NULL);
      } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
521 522 523
        // todo avoid case: top(k, 12), 12 is the value parameter.
        // sum(11), 11 is also the value parameter.
        if (createDummyCol && pOneExpr->base.numOfParams == 1) {
524 525 526 527
          pInput->totalRows = pBlock->info.rows;
          pInput->numOfRows = pBlock->info.rows;
          pInput->startRowIndex = 0;

528
          code = doCreateConstantValColumnInfo(pInput, pFuncParam, j, pBlock->info.rows);
529 530 531
          if (code != TSDB_CODE_SUCCESS) {
            return code;
          }
532
        }
G
Ganlin Zhao 已提交
533 534
      }
    }
H
Haojun Liao 已提交
535
  }
536 537

  return code;
H
Haojun Liao 已提交
538 539
}

540
static int32_t doAggregateImpl(SOperatorInfo* pOperator, TSKEY startTs, SqlFunctionCtx* pCtx) {
541
  for (int32_t k = 0; k < pOperator->exprSupp.numOfExprs; ++k) {
H
Haojun Liao 已提交
542
    if (functionNeedToExecute(&pCtx[k])) {
543
      // todo add a dummy funtion to avoid process check
544 545 546
      if (pCtx[k].fpSet.process == NULL) {
        continue;
      }
547
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
548
      qDebug("page_process");
549
#endif
550 551 552 553
      int32_t code = pCtx[k].fpSet.process(&pCtx[k]);
      if (code != TSDB_CODE_SUCCESS) {
        qError("%s aggregate function error happens, code: %s", GET_TASKID(pOperator->pTaskInfo), tstrerror(code));
        return code;
554
      }
555 556
    }
  }
557 558

  return TSDB_CODE_SUCCESS;
559 560
}

H
Haojun Liao 已提交
561
static void setPseudoOutputColInfo(SSDataBlock* pResult, SqlFunctionCtx* pCtx, SArray* pPseudoList) {
dengyihao's avatar
dengyihao 已提交
562
  size_t num = (pPseudoList != NULL) ? taosArrayGetSize(pPseudoList) : 0;
H
Haojun Liao 已提交
563 564 565 566 567
  for (int32_t i = 0; i < num; ++i) {
    pCtx[i].pOutput = taosArrayGet(pResult->pDataBlock, i);
  }
}

568
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
X
Xiaoyu Wang 已提交
569
                              int32_t numOfOutput, SArray* pPseudoList) {
H
Haojun Liao 已提交
570
  setPseudoOutputColInfo(pResult, pCtx, pPseudoList);
H
Haojun Liao 已提交
571
  pResult->info.groupId = pSrcBlock->info.groupId;
H
Haojun Liao 已提交
572

dengyihao's avatar
dengyihao 已提交
573 574
  // if the source equals to the destination, it is to create a new column as the result of scalar function or some
  // operators.
575 576
  bool createNewColModel = (pResult == pSrcBlock);

577 578
  int32_t numOfRows = 0;

579
  for (int32_t k = 0; k < numOfOutput; ++k) {
dengyihao's avatar
dengyihao 已提交
580
    int32_t         outputSlotId = pExpr[k].base.resSchema.slotId;
581 582
    SqlFunctionCtx* pfCtx = &pCtx[k];

L
Liu Jicong 已提交
583
    if (pExpr[k].pExpr->nodeType == QUERY_NODE_COLUMN) {  // it is a project query
584
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
585
      if (pResult->info.rows > 0 && !createNewColModel) {
X
Xiaoyu Wang 已提交
586 587
        colDataMergeCol(pColInfoData, pResult->info.rows, &pResult->info.capacity, pfCtx->input.pData[0],
                        pfCtx->input.numOfRows);
588
      } else {
589
        colDataAssign(pColInfoData, pfCtx->input.pData[0], pfCtx->input.numOfRows, &pResult->info);
590
      }
591

592
      numOfRows = pfCtx->input.numOfRows;
593
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE) {
594
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
595

dengyihao's avatar
dengyihao 已提交
596
      int32_t offset = createNewColModel ? 0 : pResult->info.rows;
597
      for (int32_t i = 0; i < pSrcBlock->info.rows; ++i) {
dengyihao's avatar
dengyihao 已提交
598 599 600
        colDataAppend(pColInfoData, i + offset,
                      taosVariantGet(&pExpr[k].base.pParam[0].param, pExpr[k].base.pParam[0].param.nType),
                      TSDB_DATA_TYPE_NULL == pExpr[k].base.pParam[0].param.nType);
601
      }
602 603

      numOfRows = pSrcBlock->info.rows;
H
Haojun Liao 已提交
604
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_OPERATOR) {
605 606 607
      SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
      taosArrayPush(pBlockList, &pSrcBlock);

608
      SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
609
      SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
610

611
      SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
612
      int32_t      code = scalarCalculate(pExpr[k].pExpr->_optrRoot.pRootNode, pBlockList, &dest);
613 614 615 616
      if (code != TSDB_CODE_SUCCESS) {
        taosArrayDestroy(pBlockList);
        return code;
      }
617

dengyihao's avatar
dengyihao 已提交
618
      int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
619
      ASSERT(pResult->info.capacity > 0);
620
      colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
621 622

      numOfRows = dest.numOfRows;
623 624
      taosArrayDestroy(pBlockList);
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_FUNCTION) {
625
      ASSERT(!fmIsAggFunc(pfCtx->functionId));
626

627 628
      // _rowts/_c0, not tbname column
      if (fmIsPseudoColumnFunc(pfCtx->functionId) && (!fmIsScanPseudoColumnFunc(pfCtx->functionId))) {
H
Haojun Liao 已提交
629
        // do nothing
630 631 632 633 634 635 636 637 638 639 640 641 642 643
      } else if (fmIsIndefiniteRowsFunc(pfCtx->functionId)) {
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(&pCtx[k]);
        pfCtx->fpSet.init(&pCtx[k], pResInfo);

        pfCtx->pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
        pfCtx->offset = createNewColModel ? 0 : pResult->info.rows;  // set the start offset

        // set the timestamp(_rowts) output buffer
        if (taosArrayGetSize(pPseudoList) > 0) {
          int32_t* outputColIndex = taosArrayGet(pPseudoList, 0);
          pfCtx->pTsOutput = (SColumnInfoData*)pCtx[*outputColIndex].pOutput;
        }

        numOfRows = pfCtx->fpSet.process(pfCtx);
H
Haojun Liao 已提交
644 645 646
      } else {
        SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
        taosArrayPush(pBlockList, &pSrcBlock);
G
Ganlin Zhao 已提交
647

648
        SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
649
        SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
H
Haojun Liao 已提交
650

651
        SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
652
        int32_t      code = scalarCalculate((SNode*)pExpr[k].pExpr->_function.pFunctNode, pBlockList, &dest);
653 654 655 656
        if (code != TSDB_CODE_SUCCESS) {
          taosArrayDestroy(pBlockList);
          return code;
        }
657

dengyihao's avatar
dengyihao 已提交
658
        int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
659
        ASSERT(pResult->info.capacity > 0);
660
        colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
661 662

        numOfRows = dest.numOfRows;
H
Haojun Liao 已提交
663 664
        taosArrayDestroy(pBlockList);
      }
665
    } else {
666
      ASSERT(0);
667 668
    }
  }
669

670 671 672
  if (!createNewColModel) {
    pResult->info.rows += numOfRows;
  }
673 674

  return TSDB_CODE_SUCCESS;
675 676
}

677 678 679
static void setResultRowKey(SResultRow* pResultRow, char* pData, int16_t type) {
  if (IS_VAR_DATA_TYPE(type)) {
    // todo disable this
680

681 682 683 684 685 686 687 688 689
    //    if (pResultRow->key == NULL) {
    //      pResultRow->key = taosMemoryMalloc(varDataTLen(pData));
    //      varDataCopy(pResultRow->key, pData);
    //    } else {
    //      ASSERT(memcmp(pResultRow->key, pData, varDataTLen(pData)) == 0);
    //    }
  } else {
    int64_t v = -1;
    GET_TYPED_DATA(v, int64_t, type, pData);
690

691 692
    pResultRow->win.skey = v;
    pResultRow->win.ekey = v;
693 694 695
  }
}

5
54liuyao 已提交
696
bool functionNeedToExecute(SqlFunctionCtx* pCtx) {
697
  struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);
698

699 700 701 702 703
  // in case of timestamp column, always generated results.
  int32_t functionId = pCtx->functionId;
  if (functionId == -1) {
    return false;
  }
704

705 706
  if (pCtx->scanFlag == REPEAT_SCAN) {
    return fmIsRepeatScanFunc(pCtx->functionId);
707 708
  }

709 710
  if (isRowEntryCompleted(pResInfo)) {
    return false;
711 712
  }

713 714 715
  return true;
}

716 717 718 719 720 721 722
static int32_t doCreateConstantValColumnAggInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t type,
                                                int32_t paramIndex, int32_t numOfRows) {
  if (pInput->pData[paramIndex] == NULL) {
    pInput->pData[paramIndex] = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pInput->pData[paramIndex] == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
723

724 725 726
    // Set the correct column info (data type and bytes)
    pInput->pData[paramIndex]->info.type = type;
    pInput->pData[paramIndex]->info.bytes = tDataTypes[type].bytes;
727
  }
H
Haojun Liao 已提交
728

729 730 731 732 733 734
  SColumnDataAgg* da = NULL;
  if (pInput->pColumnDataAgg[paramIndex] == NULL) {
    da = taosMemoryCalloc(1, sizeof(SColumnDataAgg));
    pInput->pColumnDataAgg[paramIndex] = da;
    if (da == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
735 736
    }
  } else {
737
    da = pInput->pColumnDataAgg[paramIndex];
738 739
  }

740
  ASSERT(!IS_VAR_DATA_TYPE(type));
741

742 743 744 745 746 747
  if (type == TSDB_DATA_TYPE_BIGINT) {
    int64_t v = pFuncParam->param.i;
    *da = (SColumnDataAgg){.numOfNull = 0, .min = v, .max = v, .maxIndex = 0, .minIndex = 0, .sum = v * numOfRows};
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
    *da = (SColumnDataAgg){.numOfNull = 0, .maxIndex = 0, .minIndex = 0};
748

749 750 751 752 753 754 755 756 757 758 759 760
    *(double*)&da->min = v;
    *(double*)&da->max = v;
    *(double*)&da->sum = v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_BOOL) {  // todo validate this data type
    bool v = pFuncParam->param.i;

    *da = (SColumnDataAgg){.numOfNull = 0, .maxIndex = 0, .minIndex = 0};
    *(bool*)&da->min = 0;
    *(bool*)&da->max = v;
    *(bool*)&da->sum = v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_TIMESTAMP) {
    // do nothing
761
  } else {
762
    ASSERT(0);
763 764
  }

765 766
  return TSDB_CODE_SUCCESS;
}
767 768 769 770 771 772 773 774 775 776 777

void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, SSDataBlock* pBlock) {
  int32_t numOfRows = pBlock->info.rows;

  SInputColumnInfoData* pInput = &pCtx->input;
  pInput->numOfRows = numOfRows;
  pInput->totalRows = numOfRows;

  if (pBlock->pBlockAgg != NULL) {
    pInput->colDataAggIsSet = true;

778 779
    for (int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pExprInfo->base.pParam[j];
780

781 782
      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
783 784 785 786
        pInput->pColumnDataAgg[j] = pBlock->pBlockAgg[slotId];
        if (pInput->pColumnDataAgg[j] == NULL) {
          pInput->colDataAggIsSet = false;
        }
787 788 789 790

        // Here we set the column info data since the data type for each column data is required, but
        // the data in the corresponding SColumnInfoData will not be used.
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
791 792
      } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
        doCreateConstantValColumnAggInfo(pInput, pFuncParam, pFuncParam->param.nType, j, pBlock->info.rows);
793 794
      }
    }
795
  } else {
796
    pInput->colDataAggIsSet = false;
797 798 799
  }

  // set the statistics data for primary time stamp column
800 801 802 803 804
  //  if (pCtx->functionId == FUNCTION_SPREAD && pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
  //    pCtx->isAggSet = true;
  //    pCtx->agg.min = pBlock->info.window.skey;
  //    pCtx->agg.max = pBlock->info.window.ekey;
  //  }
805 806
}

L
Liu Jicong 已提交
807
bool isTaskKilled(SExecTaskInfo* pTaskInfo) {
808 809
  // query has been executed more than tsShellActivityTimer, and the retrieve has not arrived
  // abort current query execution.
L
Liu Jicong 已提交
810 811
  if (pTaskInfo->owner != 0 &&
      ((taosGetTimestampSec() - pTaskInfo->cost.start / 1000) > 10 * getMaximumIdleDurationSec())
812 813
      /*(!needBuildResAfterQueryComplete(pTaskInfo))*/) {
    assert(pTaskInfo->cost.start != 0);
L
Liu Jicong 已提交
814 815 816
    //    qDebug("QInfo:%" PRIu64 " retrieve not arrive beyond %d ms, abort current query execution, start:%" PRId64
    //           ", current:%d", pQInfo->qId, 1, pQInfo->startExecTs, taosGetTimestampSec());
    //    return true;
817 818 819 820 821
  }

  return false;
}

L
Liu Jicong 已提交
822
void setTaskKilled(SExecTaskInfo* pTaskInfo) { pTaskInfo->code = TSDB_CODE_TSC_QUERY_CANCELLED; }
823 824

/////////////////////////////////////////////////////////////////////////////////////////////
L
Liu Jicong 已提交
825
// todo refactor : return window
826
void getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key, STimeWindow* win) {
H
Haojun Liao 已提交
827
  win->skey = taosTimeTruncate(key, pInterval, precision);
828 829

  /*
H
Haojun Liao 已提交
830
   * if the realSkey > INT64_MAX - pInterval->interval, the query duration between
831 832
   * realSkey and realEkey must be less than one interval.Therefore, no need to adjust the query ranges.
   */
833 834
  win->ekey = taosTimeAdd(win->skey, pInterval->interval, pInterval->intervalUnit, precision) - 1;
  if (win->ekey < win->skey) {
835 836 837 838
    win->ekey = INT64_MAX;
  }
}

839
#if 0
L
Liu Jicong 已提交
840
static int32_t updateBlockLoadStatus(STaskAttr* pQuery, int32_t status) {
841

842 843 844
  bool hasFirstLastFunc = false;
  bool hasOtherFunc = false;

845
  if (status == BLK_DATA_DATA_LOAD || status == BLK_DATA_FILTEROUT) {
846 847 848 849 850
    return status;
  }

  for (int32_t i = 0; i < pQuery->numOfOutput; ++i) {
    int32_t functionId = getExprFunctionId(&pQuery->pExpr1[i]);
851

852 853 854 855 856 857 858 859 860 861
    if (functionId == FUNCTION_TS || functionId == FUNCTION_TS_DUMMY || functionId == FUNCTION_TAG ||
        functionId == FUNCTION_TAG_DUMMY) {
      continue;
    }

    if (functionId == FUNCTION_FIRST_DST || functionId == FUNCTION_LAST_DST) {
      hasFirstLastFunc = true;
    } else {
      hasOtherFunc = true;
    }
862

863 864
  }

865
  if (hasFirstLastFunc && status == BLK_DATA_NOT_LOAD) {
L
Liu Jicong 已提交
866
    if (!hasOtherFunc) {
867
      return BLK_DATA_FILTEROUT;
868
    } else {
869
      return BLK_DATA_DATA_LOAD;
870 871 872 873 874 875
    }
  }

  return status;
}

876 877
#endif

L
Liu Jicong 已提交
878 879
// static void updateDataCheckOrder(SQInfo *pQInfo, SQueryTableReq* pQueryMsg, bool stableQuery) {
//   STaskAttr* pQueryAttr = pQInfo->runtimeEnv.pQueryAttr;
H
Haojun Liao 已提交
880
//
L
Liu Jicong 已提交
881 882 883 884
//   // in case of point-interpolation query, use asc order scan
//   char msg[] = "QInfo:0x%"PRIx64" scan order changed for %s query, old:%d, new:%d, qrange exchanged, old qrange:%"
//   PRId64
//                "-%" PRId64 ", new qrange:%" PRId64 "-%" PRId64;
H
Haojun Liao 已提交
885
//
L
Liu Jicong 已提交
886 887 888 889 890
//   // todo handle the case the the order irrelevant query type mixed up with order critical query type
//   // descending order query for last_row query
//   if (isFirstLastRowQuery(pQueryAttr)) {
//     //qDebug("QInfo:0x%"PRIx64" scan order changed for last_row query, old:%d, new:%d", pQInfo->qId,
//     pQueryAttr->order.order, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
891
//
L
Liu Jicong 已提交
892 893
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
894
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
895
//     }
H
Haojun Liao 已提交
896
//
L
Liu Jicong 已提交
897 898 899
//     pQueryAttr->needReverseScan = false;
//     return;
//   }
H
Haojun Liao 已提交
900
//
L
Liu Jicong 已提交
901 902 903
//   if (pQueryAttr->groupbyColumn && pQueryAttr->order.order == TSDB_ORDER_DESC) {
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
904
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
905
//     }
H
Haojun Liao 已提交
906
//
L
Liu Jicong 已提交
907 908 909 910
//     pQueryAttr->needReverseScan = false;
//     doUpdateLastKey(pQueryAttr);
//     return;
//   }
H
Haojun Liao 已提交
911
//
L
Liu Jicong 已提交
912 913 914 915 916 917
//   if (pQueryAttr->pointInterpQuery && pQueryAttr->interval.interval == 0) {
//     if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       //qDebug(msg, pQInfo->qId, "interp", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey); TSWAP(pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, TSKEY);
//     }
H
Haojun Liao 已提交
918
//
L
Liu Jicong 已提交
919 920 921
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     return;
//   }
H
Haojun Liao 已提交
922
//
L
Liu Jicong 已提交
923 924 925 926
//   if (pQueryAttr->interval.interval == 0) {
//     if (onlyFirstQuery(pQueryAttr)) {
//       if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//         //qDebug(msg, pQInfo->qId, "only-first", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
H
Haojun Liao 已提交
927 928
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
929
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
930 931 932 933 934 935 936 937 938 939
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_ASC;
//      pQueryAttr->needReverseScan = false;
//    } else if (onlyLastQuery(pQueryAttr) && notContainSessionOrStateWindow(pQueryAttr)) {
//      if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//        //qDebug(msg, pQInfo->qId, "only-last", pQueryAttr->order.order, TSDB_ORDER_DESC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
940
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
941 942 943 944 945 946 947 948 949 950 951 952
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_DESC;
//      pQueryAttr->needReverseScan = false;
//    }
//
//  } else {  // interval query
//    if (stableQuery) {
//      if (onlyFirstQuery(pQueryAttr)) {
//        if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-first stable", pQueryAttr->order.order, TSDB_ORDER_ASC,
L
Liu Jicong 已提交
953 954
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
955
//
wafwerar's avatar
wafwerar 已提交
956
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
957 958 959 960 961 962 963 964
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_ASC;
//        pQueryAttr->needReverseScan = false;
//      } else if (onlyLastQuery(pQueryAttr)) {
//        if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-last stable", pQueryAttr->order.order, TSDB_ORDER_DESC,
L
Liu Jicong 已提交
965 966
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
967
//
wafwerar's avatar
wafwerar 已提交
968
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
969 970 971 972 973 974 975 976 977
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_DESC;
//        pQueryAttr->needReverseScan = false;
//      }
//    }
//  }
//}
978

L
Liu Jicong 已提交
979 980 981
// static FORCE_INLINE bool doFilterByBlockStatistics(STaskRuntimeEnv* pRuntimeEnv, SDataStatis *pDataStatis,
// SqlFunctionCtx *pCtx, int32_t numOfRows) {
//   STaskAttr* pQueryAttr = pRuntimeEnv->pQueryAttr;
982
//
L
Liu Jicong 已提交
983 984 985
//   if (pDataStatis == NULL || pQueryAttr->pFilters == NULL) {
//     return true;
//   }
986
//
L
Liu Jicong 已提交
987 988
//   return filterRangeExecute(pQueryAttr->pFilters, pDataStatis, pQueryAttr->numOfCols, numOfRows);
// }
989
#if 0
H
Haojun Liao 已提交
990
static bool overlapWithTimeWindow(STaskAttr* pQueryAttr, SDataBlockInfo* pBlockInfo) {
991 992
  STimeWindow w = {0};

dengyihao's avatar
dengyihao 已提交
993 994
  TSKEY sk = TMIN(pQueryAttr->window.skey, pQueryAttr->window.ekey);
  TSKEY ek = TMAX(pQueryAttr->window.skey, pQueryAttr->window.ekey);
995

996
  if (true) {
L
Liu Jicong 已提交
997
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.skey, sk, ek, &w);
998 999 1000 1001 1002 1003
    assert(w.ekey >= pBlockInfo->window.skey);

    if (w.ekey < pBlockInfo->window.ekey) {
      return true;
    }

L
Liu Jicong 已提交
1004 1005
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1006 1007 1008 1009 1010 1011 1012 1013 1014 1015
      if (w.skey > pBlockInfo->window.ekey) {
        break;
      }

      assert(w.ekey > pBlockInfo->window.ekey);
      if (w.skey <= pBlockInfo->window.ekey && w.skey > pBlockInfo->window.skey) {
        return true;
      }
    }
  } else {
L
Liu Jicong 已提交
1016
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.ekey, sk, ek, &w);
1017 1018 1019 1020 1021 1022
    assert(w.skey <= pBlockInfo->window.ekey);

    if (w.skey > pBlockInfo->window.skey) {
      return true;
    }

L
Liu Jicong 已提交
1023 1024
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037
      if (w.ekey < pBlockInfo->window.skey) {
        break;
      }

      assert(w.skey < pBlockInfo->window.skey);
      if (w.ekey < pBlockInfo->window.ekey && w.ekey >= pBlockInfo->window.skey) {
        return true;
      }
    }
  }

  return false;
}
1038
#endif
1039 1040

static uint32_t doFilterByBlockTimeWindow(STableScanInfo* pTableScanInfo, SSDataBlock* pBlock) {
H
Haojun Liao 已提交
1041
  SqlFunctionCtx* pCtx = pTableScanInfo->pCtx;
1042
  uint32_t        status = BLK_DATA_NOT_LOAD;
1043

L
Liu Jicong 已提交
1044
  int32_t numOfOutput = 0;  // pTableScanInfo->numOfOutput;
1045 1046
  for (int32_t i = 0; i < numOfOutput; ++i) {
    int32_t functionId = pCtx[i].functionId;
H
Haojun Liao 已提交
1047
    int32_t colId = pTableScanInfo->pExpr[i].base.pParam[0].pCol->colId;
1048 1049 1050

    // group by + first/last should not apply the first/last block filter
    if (functionId < 0) {
1051
      status |= BLK_DATA_DATA_LOAD;
1052 1053
      return status;
    } else {
L
Liu Jicong 已提交
1054
      //      status |= aAggs[functionId].dataReqFunc(&pTableScanInfo->pCtx[i], &pBlock->info.window, colId);
1055
      //      if ((status & BLK_DATA_DATA_LOAD) == BLK_DATA_DATA_LOAD) {
L
Liu Jicong 已提交
1056 1057
      //        return status;
      //      }
1058 1059 1060 1061 1062 1063
    }
  }

  return status;
}

L
Liu Jicong 已提交
1064 1065
int32_t loadDataBlockOnDemand(SExecTaskInfo* pTaskInfo, STableScanInfo* pTableScanInfo, SSDataBlock* pBlock,
                              uint32_t* status) {
1066
  *status = BLK_DATA_NOT_LOAD;
1067

H
Haojun Liao 已提交
1068
  pBlock->pDataBlock = NULL;
L
Liu Jicong 已提交
1069
  pBlock->pBlockAgg = NULL;
H
Haojun Liao 已提交
1070

L
Liu Jicong 已提交
1071 1072
  //  int64_t groupId = pRuntimeEnv->current->groupIndex;
  //  bool    ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1073

H
Haojun Liao 已提交
1074
  STaskCostInfo* pCost = &pTaskInfo->cost;
1075

1076 1077
//  pCost->totalBlocks += 1;
//  pCost->totalRows += pBlock->info.rows;
H
Haojun Liao 已提交
1078
#if 0
1079 1080 1081
  // Calculate all time windows that are overlapping or contain current data block.
  // If current data block is contained by all possible time window, do not load current data block.
  if (/*pQueryAttr->pFilters || */pQueryAttr->groupbyColumn || pQueryAttr->sw.gap > 0 ||
H
Haojun Liao 已提交
1082
      (QUERY_IS_INTERVAL_QUERY(pQueryAttr) && overlapWithTimeWindow(pTaskInfo, &pBlock->info))) {
1083
    (*status) = BLK_DATA_DATA_LOAD;
1084 1085 1086
  }

  // check if this data block is required to load
1087
  if ((*status) != BLK_DATA_DATA_LOAD) {
1088 1089 1090 1091 1092 1093 1094
    bool needFilter = true;

    // the pCtx[i] result is belonged to previous time window since the outputBuf has not been set yet,
    // the filter result may be incorrect. So in case of interval query, we need to set the correct time output buffer
    if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
      SResultRow* pResult = NULL;

H
Haojun Liao 已提交
1095
      bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
1096 1097 1098 1099 1100 1101
      TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

      STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
      if (pQueryAttr->pointInterpQuery) {
        needFilter = chkWindowOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1102
                                    pTableScanInfo->rowEntryInfoOffset);
1103 1104 1105
      } else {
        if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1106
                                    pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
1107 1108 1109 1110 1111
          longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
        }
      }
    } else if (pQueryAttr->stableQuery && (!pQueryAttr->tsCompQuery) && (!pQueryAttr->diffQuery)) { // stable aggregate, not interval aggregate or normal column aggregate
      doSetTableGroupOutputBuf(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pTableScanInfo->pCtx,
1112
                               pTableScanInfo->rowEntryInfoOffset, pTableScanInfo->numOfOutput,
1113 1114 1115 1116 1117 1118
                               pRuntimeEnv->current->groupIndex);
    }

    if (needFilter) {
      (*status) = doFilterByBlockTimeWindow(pTableScanInfo, pBlock);
    } else {
1119
      (*status) = BLK_DATA_DATA_LOAD;
1120 1121 1122 1123
    }
  }

  SDataBlockInfo* pBlockInfo = &pBlock->info;
H
Haojun Liao 已提交
1124
//  *status = updateBlockLoadStatus(pRuntimeEnv->pQueryAttr, *status);
1125

1126
  if ((*status) == BLK_DATA_NOT_LOAD || (*status) == BLK_DATA_FILTEROUT) {
1127 1128
    //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//           pBlockInfo->window.ekey, pBlockInfo->rows);
1129
    pCost->skipBlocks += 1;
1130
  } else if ((*status) == BLK_DATA_SMA_LOAD) {
1131 1132
    // this function never returns error?
    pCost->loadBlockStatis += 1;
1133
//    tsdbRetrieveDataBlockStatisInfo(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);
1134 1135

    if (pBlock->pBlockAgg == NULL) {  // data block statistics does not exist, load data block
1136
//      pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
1137 1138 1139
      pCost->totalCheckedRows += pBlock->info.rows;
    }
  } else {
1140
    assert((*status) == BLK_DATA_DATA_LOAD);
1141 1142 1143

    // load the data block statistics to perform further filter
    pCost->loadBlockStatis += 1;
1144
//    tsdbRetrieveDataBlockStatisInfo(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);
1145 1146 1147 1148 1149 1150

    if (pQueryAttr->topBotQuery && pBlock->pBlockAgg != NULL) {
      { // set previous window
        if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
          SResultRow* pResult = NULL;

H
Haojun Liao 已提交
1151
          bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
1152 1153 1154 1155 1156
          TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

          STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
          if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                      pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1157
                                      pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168
            longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
          }
        }
      }
      bool load = false;
      for (int32_t i = 0; i < pQueryAttr->numOfOutput; ++i) {
        int32_t functionId = pTableScanInfo->pCtx[i].functionId;
        if (functionId == FUNCTION_TOP || functionId == FUNCTION_BOTTOM) {
//          load = topbot_datablock_filter(&pTableScanInfo->pCtx[i], (char*)&(pBlock->pBlockAgg[i].min),
//                                         (char*)&(pBlock->pBlockAgg[i].max));
          if (!load) { // current block has been discard due to filter applied
1169
            pCost->skipBlocks += 1;
1170 1171
            //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId,
//                   pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
1172
            (*status) = BLK_DATA_FILTEROUT;
1173 1174 1175 1176 1177 1178 1179 1180
            return TSDB_CODE_SUCCESS;
          }
        }
      }
    }

    // current block has been discard due to filter applied
//    if (!doFilterByBlockStatistics(pRuntimeEnv, pBlock->pBlockAgg, pTableScanInfo->pCtx, pBlockInfo->rows)) {
1181
//      pCost->skipBlocks += 1;
1182 1183
//      qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//             pBlockInfo->window.ekey, pBlockInfo->rows);
1184
//      (*status) = BLK_DATA_FILTEROUT;
1185 1186 1187 1188 1189
//      return TSDB_CODE_SUCCESS;
//    }

    pCost->totalCheckedRows += pBlockInfo->rows;
    pCost->loadBlocks += 1;
1190
//    pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
1191 1192 1193 1194 1195
//    if (pBlock->pDataBlock == NULL) {
//      return terrno;
//    }

//    if (pQueryAttr->pFilters != NULL) {
1196
//      filterSetColFieldData(pQueryAttr->pFilters, taosArrayGetSize(pBlock->pDataBlock), pBlock->pDataBlock);
1197
//    }
1198

1199 1200 1201 1202
//    if (pQueryAttr->pFilters != NULL || pRuntimeEnv->pTsBuf != NULL) {
//      filterColRowsInDataBlock(pRuntimeEnv, pBlock, ascQuery);
//    }
  }
H
Haojun Liao 已提交
1203
#endif
1204 1205 1206
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1207
static void updateTableQueryInfoForReverseScan(STableQueryInfo* pTableQueryInfo) {
1208 1209 1210 1211
  if (pTableQueryInfo == NULL) {
    return;
  }

wafwerar's avatar
wafwerar 已提交
1212
  //  TSWAP(pTableQueryInfo->win.skey, pTableQueryInfo->win.ekey);
L
Liu Jicong 已提交
1213
  //  pTableQueryInfo->lastKey = pTableQueryInfo->win.skey;
1214

L
Liu Jicong 已提交
1215 1216
  //  SWITCH_ORDER(pTableQueryInfo->cur.order);
  //  pTableQueryInfo->cur.vgroupIndex = -1;
1217 1218

  // set the index to be the end slot of result rows array
dengyihao's avatar
dengyihao 已提交
1219 1220 1221 1222 1223 1224
  //  SResultRowInfo* pResultRowInfo = &pTableQueryInfo->resInfo;
  //  if (pResultRowInfo->size > 0) {
  //    pResultRowInfo->curPos = pResultRowInfo->size - 1;
  //  } else {
  //    pResultRowInfo->curPos = -1;
  //  }
1225 1226
}

H
Haojun Liao 已提交
1227
void initResultRow(SResultRow* pResultRow) {
X
Xiaoyu Wang 已提交
1228
  //  pResultRow->pEntryInfo = (struct SResultRowEntryInfo*)((char*)pResultRow + sizeof(SResultRow));
1229 1230 1231 1232 1233
}

/*
 * The start of each column SResultRowEntryInfo is denote by RowCellInfoOffset.
 * Note that in case of top/bottom query, the whole multiple rows of result is treated as only one row of results.
H
Haojun Liao 已提交
1234 1235 1236
 * +------------+-----------------result column 1------------+------------------result column 2-----------+
 * | SResultRow | SResultRowEntryInfo | intermediate buffer1 | SResultRowEntryInfo | intermediate buffer 2|
 * +------------+--------------------------------------------+--------------------------------------------+
1237 1238
 *           offset[0]                                  offset[1]                                   offset[2]
 */
1239
// TODO refactor: some function move away
L
Liu Jicong 已提交
1240 1241 1242
void setFunctionResultOutput(SOperatorInfo* pOperator, SOptrBasicInfo* pInfo, SAggSupporter* pSup, int32_t stage,
                             int32_t numOfExprs) {
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
1243 1244
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;
H
Haojun Liao 已提交
1245

H
Haojun Liao 已提交
1246
  SResultRowInfo* pResultRowInfo = &pInfo->resultRowInfo;
1247
  initResultRowInfo(pResultRowInfo);
H
Haojun Liao 已提交
1248

L
Liu Jicong 已提交
1249 1250
  int64_t     tid = 0;
  int64_t     groupId = 0;
1251 1252
  SResultRow* pRow = doSetResultOutBufByKey(pSup->pResultBuf, pResultRowInfo, (char*)&tid, sizeof(tid), true, groupId,
                                            pTaskInfo, false, pSup);
H
Haojun Liao 已提交
1253

1254
  for (int32_t i = 0; i < numOfExprs; ++i) {
1255
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, i, rowEntryInfoOffset);
H
Haojun Liao 已提交
1256 1257
    cleanupResultRowEntry(pEntry);

L
Liu Jicong 已提交
1258
    pCtx[i].resultInfo = pEntry;
1259
    pCtx[i].scanFlag = stage;
H
Haojun Liao 已提交
1260 1261
  }

1262
  initCtxOutputBuffer(pCtx, numOfExprs);
H
Haojun Liao 已提交
1263 1264
}

H
Haojun Liao 已提交
1265
void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size) {
1266 1267
  for (int32_t j = 0; j < size; ++j) {
    struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(&pCtx[j]);
dengyihao's avatar
dengyihao 已提交
1268 1269
    if (isRowEntryInitialized(pResInfo) || fmIsPseudoColumnFunc(pCtx[j].functionId) || pCtx[j].functionId == -1 ||
        fmIsScalarFunc(pCtx[j].functionId)) {
1270 1271 1272
      continue;
    }

H
Haojun Liao 已提交
1273
    pCtx[j].fpSet.init(&pCtx[j], pCtx[j].resultInfo);
1274 1275 1276
  }
}

L
Liu Jicong 已提交
1277
void setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status) {
1278
  if (status == TASK_NOT_COMPLETED) {
H
Haojun Liao 已提交
1279
    pTaskInfo->status = status;
1280 1281
  } else {
    // QUERY_NOT_COMPLETED is not compatible with any other status, so clear its position first
1282
    CLEAR_QUERY_STATUS(pTaskInfo, TASK_NOT_COMPLETED);
H
Haojun Liao 已提交
1283
    pTaskInfo->status |= status;
1284 1285 1286
  }
}

L
Liu Jicong 已提交
1287
void destroyTableQueryInfoImpl(STableQueryInfo* pTableQueryInfo) {
1288 1289 1290 1291
  if (pTableQueryInfo == NULL) {
    return;
  }

L
Liu Jicong 已提交
1292
  //  taosVariantDestroy(&pTableQueryInfo->tag);
dengyihao's avatar
dengyihao 已提交
1293
  //  cleanupResultRowInfo(&pTableQueryInfo->resInfo);
1294 1295
}

1296
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowEntryInfoOffset) {
1297
  for (int32_t i = 0; i < numOfOutput; ++i) {
1298
    pCtx[i].resultInfo = getResultEntryInfo(pResult, i, rowEntryInfoOffset);
1299 1300 1301 1302 1303

    struct SResultRowEntryInfo* pResInfo = pCtx[i].resultInfo;
    if (isRowEntryCompleted(pResInfo) && isRowEntryInitialized(pResInfo)) {
      continue;
    }
1304 1305 1306 1307 1308

    if (fmIsWindowPseudoColumnFunc(pCtx[i].functionId)) {
      continue;
    }

1309 1310 1311 1312 1313 1314
    if (!pResInfo->initialized) {
      if (pCtx[i].functionId != -1) {
        pCtx[i].fpSet.init(&pCtx[i], pResInfo);
      } else {
        pResInfo->initialized = true;
      }
1315 1316 1317 1318
    }
  }
}

H
Haojun Liao 已提交
1319
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep);
1320

1321
void doFilter(const SNode* pFilterNode, SSDataBlock* pBlock) {
1322 1323 1324 1325 1326
  if (pFilterNode == NULL) {
    return;
  }

  SFilterInfo* filter = NULL;
H
Haojun Liao 已提交
1327

H
Haojun Liao 已提交
1328
  // todo move to the initialization function
H
Haojun Liao 已提交
1329
  int32_t code = filterInitFromNode((SNode*)pFilterNode, &filter, 0);
1330

1331
  size_t             numOfCols = taosArrayGetSize(pBlock->pDataBlock);
1332
  SFilterColumnParam param1 = {.numOfCols = numOfCols, .pDataBlock = pBlock->pDataBlock};
1333 1334 1335
  code = filterSetDataFromSlotId(filter, &param1);

  int8_t* rowRes = NULL;
1336

1337
  // todo the keep seems never to be True??
1338
  bool keep = filterExecute(filter, pBlock, &rowRes, NULL, param1.numOfCols);
D
dapan1121 已提交
1339
  filterFreeInfo(filter);
1340

H
Haojun Liao 已提交
1341
  extractQualifiedTupleByFilterResult(pBlock, rowRes, keep);
1342
  blockDataUpdateTsWindow(pBlock, 0);
1343 1344
}

H
Haojun Liao 已提交
1345
void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep) {
1346 1347 1348 1349 1350
  if (keep) {
    return;
  }

  if (rowRes != NULL) {
L
Liu Jicong 已提交
1351
    int32_t      totalRows = pBlock->info.rows;
1352
    SSDataBlock* px = createOneDataBlock(pBlock, true);
1353

1354 1355
    size_t numOfCols = taosArrayGetSize(pBlock->pDataBlock);
    for (int32_t i = 0; i < numOfCols; ++i) {
1356 1357
      SColumnInfoData* pSrc = taosArrayGet(px->pDataBlock, i);
      SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, i);
1358
      // it is a reserved column for scalar function, and no data in this column yet.
1359
      if (pDst->pData == NULL || pSrc->pData == NULL) {
1360 1361 1362
        continue;
      }

1363 1364
      colInfoDataCleanup(pDst, pBlock->info.rows);

1365
      int32_t numOfRows = 0;
1366
      for (int32_t j = 0; j < totalRows; ++j) {
D
dapan1121 已提交
1367 1368 1369
        if (rowRes[j] == 0) {
          continue;
        }
1370

D
dapan1121 已提交
1371
        if (colDataIsNull_s(pSrc, j)) {
1372
          colDataAppendNULL(pDst, numOfRows);
D
dapan1121 已提交
1373
        } else {
1374
          colDataAppend(pDst, numOfRows, colDataGetData(pSrc, j), false);
D
dapan1121 已提交
1375
        }
1376
        numOfRows += 1;
H
Haojun Liao 已提交
1377
      }
1378

1379 1380 1381 1382 1383
      if (pBlock->info.rows == totalRows) {
        pBlock->info.rows = numOfRows;
      } else {
        ASSERT(pBlock->info.rows == numOfRows);
      }
1384
    }
1385

dengyihao's avatar
dengyihao 已提交
1386
    blockDataDestroy(px);  // fix memory leak
1387 1388 1389
  } else {
    // do nothing
    pBlock->info.rows = 0;
1390 1391 1392
  }
}

L
Liu Jicong 已提交
1393 1394
void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                              uint64_t groupId) {
1395
  // for simple group by query without interval, all the tables belong to one group result.
L
Liu Jicong 已提交
1396
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
1397
  SResultRowInfo* pResultRowInfo = &pAggInfo->binfo.resultRowInfo;
1398 1399
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;
1400

1401
  SResultRow* pResultRow = doSetResultOutBufByKey(pAggInfo->aggSup.pResultBuf, pResultRowInfo, (char*)&groupId,
L
Liu Jicong 已提交
1402
                                                  sizeof(groupId), true, groupId, pTaskInfo, false, &pAggInfo->aggSup);
L
Liu Jicong 已提交
1403
  assert(pResultRow != NULL);
1404 1405 1406 1407 1408 1409

  /*
   * not assign result buffer yet, add new result buffer
   * all group belong to one result set, and each group result has different group id so set the id to be one
   */
  if (pResultRow->pageId == -1) {
dengyihao's avatar
dengyihao 已提交
1410 1411
    int32_t ret =
        addNewWindowResultBuf(pResultRow, pAggInfo->aggSup.pResultBuf, groupId, pAggInfo->binfo.pRes->info.rowSize);
1412 1413 1414 1415 1416
    if (ret != TSDB_CODE_SUCCESS) {
      return;
    }
  }

1417
  setResultRowInitCtx(pResultRow, pCtx, numOfOutput, rowEntryInfoOffset);
1418 1419
}

1420
void setExecutionContext(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId, SAggOperatorInfo* pAggInfo) {
H
Haojun Liao 已提交
1421
  if (pAggInfo->groupId != INT32_MIN && pAggInfo->groupId == groupId) {
1422 1423
    return;
  }
1424
#ifdef BUF_PAGE_DEBUG
L
Liu Jicong 已提交
1425
  qDebug("page_setbuf, groupId:%" PRIu64, groupId);
1426
#endif
1427
  doSetTableGroupOutputBuf(pOperator, pAggInfo, numOfOutput, groupId);
1428 1429

  // record the current active group id
H
Haojun Liao 已提交
1430
  pAggInfo->groupId = groupId;
1431 1432
}

1433 1434
static void doUpdateNumOfRows(SResultRow* pRow, int32_t numOfExprs, const int32_t* rowCellOffset) {
  for (int32_t j = 0; j < numOfExprs; ++j) {
1435
    struct SResultRowEntryInfo* pResInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1436 1437 1438 1439 1440 1441 1442 1443 1444 1445
    if (!isRowEntryInitialized(pResInfo)) {
      continue;
    }

    if (pRow->numOfRows < pResInfo->numOfRes) {
      pRow->numOfRows = pResInfo->numOfRes;
    }
  }
}

1446
int32_t finalizeResultRowIntoResultDataBlock(SDiskbasedBuf* pBuf, SResultRowPosition* resultRowPosition,
S
shenglian zhou 已提交
1447 1448 1449
                                             SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, int32_t numOfExprs,
                                             const int32_t* rowCellOffset, SSDataBlock* pBlock,
                                             SExecTaskInfo* pTaskInfo) {
1450 1451 1452 1453 1454 1455 1456 1457 1458
  SFilePage*  page = getBufPage(pBuf, resultRowPosition->pageId);
  SResultRow* pRow = (SResultRow*)((char*)page + resultRowPosition->offset);

  doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
  if (pRow->numOfRows == 0) {
    releaseBufPage(pBuf, page);
    return 0;
  }

1459 1460 1461 1462 1463 1464 1465
  while (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
    int32_t code = blockDataEnsureCapacity(pBlock, pBlock->info.capacity * 1.25);
    if (TAOS_FAILED(code)) {
      releaseBufPage(pBuf, page);
      qError("%s ensure result data capacity failed, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
      longjmp(pTaskInfo->env, code);
    }
1466 1467 1468 1469 1470
  }

  for (int32_t j = 0; j < numOfExprs; ++j) {
    int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1471
    pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491
    if (pCtx[j].fpSet.finalize) {
      int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
      if (TAOS_FAILED(code)) {
        qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
        longjmp(pTaskInfo->env, code);
      }
    } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
      // do nothing, todo refactor
    } else {
      // expand the result into multiple rows. E.g., _wstartts, top(k, 20)
      // the _wstartts needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
      char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
      for (int32_t k = 0; k < pRow->numOfRows; ++k) {
        colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
      }
    }
  }

  releaseBufPage(pBuf, page);
1492
  pBlock->info.rows += pRow->numOfRows;
1493 1494 1495 1496

  return 0;
}

X
Xiaoyu Wang 已提交
1497 1498 1499
int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo, SDiskbasedBuf* pBuf,
                           SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset, SqlFunctionCtx* pCtx,
                           int32_t numOfExprs) {
1500
  int32_t numOfRows = getNumOfTotalRes(pGroupResInfo);
1501
  int32_t start = pGroupResInfo->index;
1502
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
1503
  qDebug("\npage_copytoblock rows:%d", numOfRows);
1504
#endif
1505
  for (int32_t i = start; i < numOfRows; i += 1) {
L
Liu Jicong 已提交
1506 1507
    SResKeyPos* pPos = taosArrayGetP(pGroupResInfo->pRows, i);
    SFilePage*  page = getBufPage(pBuf, pPos->pos.pageId);
1508
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
1509
    qDebug("page_copytoblock pos pageId:%d, offset:%d", pPos->pos.pageId, pPos->pos.offset);
1510
#endif
1511
    SResultRow* pRow = (SResultRow*)((char*)page + pPos->pos.offset);
1512 1513

    doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
1514 1515
    if (pRow->numOfRows == 0) {
      pGroupResInfo->index += 1;
1516
      releaseBufPage(pBuf, page);
1517 1518 1519
      continue;
    }

1520 1521 1522 1523 1524
    if (pBlock->info.groupId == 0) {
      pBlock->info.groupId = pPos->groupId;
    } else {
      // current value belongs to different group, it can't be packed into one datablock
      if (pBlock->info.groupId != pPos->groupId) {
1525
        releaseBufPage(pBuf, page);
1526 1527 1528 1529
        break;
      }
    }

1530
    if (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
1531
      releaseBufPage(pBuf, page);
1532 1533 1534 1535 1536
      break;
    }

    pGroupResInfo->index += 1;

1537
    for (int32_t j = 0; j < numOfExprs; ++j) {
1538 1539
      int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1540
      pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1541
      if (pCtx[j].fpSet.finalize) {
1542
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
1543
        qDebug("\npage_finalize %d", numOfExprs);
1544
#endif
1545
        int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
1546
        if (TAOS_FAILED(code)) {
1547 1548
          qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
          longjmp(pTaskInfo->env, code);
1549
        }
1550 1551
      } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
        // do nothing, todo refactor
1552
      } else {
1553 1554
        // expand the result into multiple rows. E.g., _wstartts, top(k, 20)
        // the _wstartts needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
X
Xiaoyu Wang 已提交
1555 1556
        SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
        char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
1557
        if (pCtx[j].increase) {
L
Liu Jicong 已提交
1558
          int64_t ts = *(int64_t*)in;
1559
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
L
Liu Jicong 已提交
1560
            colDataAppend(pColInfoData, pBlock->info.rows + k, (const char*)&ts, pCtx[j].resultInfo->isNullRes);
1561 1562 1563 1564 1565 1566
            ts++;
          }
        } else {
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
          }
X
Xiaoyu Wang 已提交
1567
        }
1568
      }
1569 1570
    }

1571
    releaseBufPage(pBuf, page);
1572
    pBlock->info.rows += pRow->numOfRows;
L
Liu Jicong 已提交
1573 1574 1575
    //    if (pBlock->info.rows >= pBlock->info.capacity) {  // output buffer is full
    //      break;
    //    }
1576 1577
  }

X
Xiaoyu Wang 已提交
1578 1579
  qDebug("%s result generated, rows:%d, groupId:%" PRIu64, GET_TASKID(pTaskInfo), pBlock->info.rows,
         pBlock->info.groupId);
1580
  blockDataUpdateTsWindow(pBlock, 0);
1581 1582 1583
  return 0;
}

X
Xiaoyu Wang 已提交
1584 1585
void doBuildResultDatablock(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
                            SDiskbasedBuf* pBuf) {
1586 1587
  SExprInfo*     pExprInfo = pOperator->exprSupp.pExprInfo;
  int32_t        numOfExprs = pOperator->exprSupp.numOfExprs;
1588 1589
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

1590
  int32_t*        rowCellOffset = pOperator->exprSupp.rowEntryInfoOffset;
X
Xiaoyu Wang 已提交
1591
  SSDataBlock*    pBlock = pbInfo->pRes;
1592
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
1593

1594
  blockDataCleanup(pBlock);
1595
  if (!hasDataInGroupInfo(pGroupResInfo)) {
1596 1597 1598
    return;
  }

1599 1600
  // clear the existed group id
  pBlock->info.groupId = 0;
1601
  doCopyToSDataBlock(pTaskInfo, pBlock, pExprInfo, pBuf, pGroupResInfo, rowCellOffset, pCtx, numOfExprs);
1602 1603
}

L
Liu Jicong 已提交
1604
static void updateNumOfRowsInResultRows(SqlFunctionCtx* pCtx, int32_t numOfOutput, SResultRowInfo* pResultRowInfo,
1605
                                        int32_t* rowEntryInfoOffset) {
1606
  // update the number of result for each, only update the number of rows for the corresponding window result.
L
Liu Jicong 已提交
1607 1608 1609
  //  if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
  //    return;
  //  }
H
Haojun Liao 已提交
1610
#if 0
1611
  for (int32_t i = 0; i < pResultRowInfo->size; ++i) {
L
Liu Jicong 已提交
1612
    SResultRow* pResult = pResultRowInfo->pResult[i];
1613 1614 1615 1616 1617 1618 1619

    for (int32_t j = 0; j < numOfOutput; ++j) {
      int32_t functionId = pCtx[j].functionId;
      if (functionId == FUNCTION_TS || functionId == FUNCTION_TAG || functionId == FUNCTION_TAGPRJ) {
        continue;
      }

1620
      SResultRowEntryInfo* pCell = getResultEntryInfo(pResult, j, rowEntryInfoOffset);
1621
      pResult->numOfRows = (uint16_t)(TMAX(pResult->numOfRows, pCell->numOfRes));
1622 1623
    }
  }
H
Haojun Liao 已提交
1624
#endif
1625 1626
}

L
Liu Jicong 已提交
1627
static int32_t compressQueryColData(SColumnInfoData* pColRes, int32_t numOfRows, char* data, int8_t compressed) {
1628 1629
  int32_t colSize = pColRes->info.bytes * numOfRows;
  return (*(tDataTypes[pColRes->info.type].compFunc))(pColRes->pData, colSize, numOfRows, data,
L
Liu Jicong 已提交
1630
                                                      colSize + COMP_OVERFLOW_BYTES, compressed, NULL, 0);
1631 1632
}

1633 1634 1635
int32_t doFillTimeIntervalGapsInResults(struct SFillInfo* pFillInfo, SSDataBlock* pBlock, int32_t capacity) {
  int32_t numOfRows = (int32_t)taosFillResultDataBlock(pFillInfo, pBlock, capacity - pBlock->info.rows);
  pBlock->info.rows += numOfRows;
1636

1637
  return pBlock->info.rows;
1638 1639
}

L
Liu Jicong 已提交
1640 1641
void queryCostStatis(SExecTaskInfo* pTaskInfo) {
  STaskCostInfo* pSummary = &pTaskInfo->cost;
1642

L
Liu Jicong 已提交
1643 1644 1645
  //  uint64_t hashSize = taosHashGetMemSize(pQInfo->runtimeEnv.pResultRowHashTable);
  //  hashSize += taosHashGetMemSize(pRuntimeEnv->tableqinfoGroupInfo.map);
  //  pSummary->hashSize = hashSize;
1646 1647 1648 1649

  // add the merge time
  pSummary->elapsedTime += pSummary->firstStageMergeTime;

L
Liu Jicong 已提交
1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660
  //  SResultRowPool* p = pTaskInfo->pool;
  //  if (p != NULL) {
  //    pSummary->winInfoSize = getResultRowPoolMemSize(p);
  //    pSummary->numOfTimeWindows = getNumOfAllocatedResultRows(p);
  //  } else {
  //    pSummary->winInfoSize = 0;
  //    pSummary->numOfTimeWindows = 0;
  //  }
  //
  //  calculateOperatorProfResults(pQInfo);

1661 1662
  SFileBlockLoadRecorder* pRecorder = pSummary->pRecoder;
  if (pSummary->pRecoder != NULL) {
X
Xiaoyu Wang 已提交
1663 1664
    qDebug("%s :cost summary: elapsed time:%" PRId64 " us, first merge:%" PRId64
           " us, total blocks:%d, "
1665 1666 1667 1668
           "load block statis:%d, load data block:%d, total rows:%" PRId64 ", check rows:%" PRId64,
           GET_TASKID(pTaskInfo), pSummary->elapsedTime, pSummary->firstStageMergeTime, pRecorder->totalBlocks,
           pRecorder->loadBlockStatis, pRecorder->loadBlocks, pRecorder->totalRows, pRecorder->totalCheckedRows);
  }
L
Liu Jicong 已提交
1669 1670 1671
  // qDebug("QInfo:0x%"PRIx64" :cost summary: winResPool size:%.2f Kb, numOfWin:%"PRId64", tableInfoSize:%.2f Kb,
  // hashTable:%.2f Kb", pQInfo->qId, pSummary->winInfoSize/1024.0,
  //      pSummary->numOfTimeWindows, pSummary->tableInfoSize/1024.0, pSummary->hashSize/1024.0);
1672 1673
}

L
Liu Jicong 已提交
1674 1675 1676
// static void updateOffsetVal(STaskRuntimeEnv *pRuntimeEnv, SDataBlockInfo *pBlockInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
1677
//
L
Liu Jicong 已提交
1678
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1679
//
L
Liu Jicong 已提交
1680 1681 1682 1683
//   if (pQueryAttr->limit.offset == pBlockInfo->rows) {  // current block will ignore completed
//     pTableQueryInfo->lastKey = QUERY_IS_ASC_QUERY(pQueryAttr) ? pBlockInfo->window.ekey + step :
//     pBlockInfo->window.skey + step; pQueryAttr->limit.offset = 0; return;
//   }
1684
//
L
Liu Jicong 已提交
1685 1686 1687 1688 1689
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     pQueryAttr->pos = (int32_t)pQueryAttr->limit.offset;
//   } else {
//     pQueryAttr->pos = pBlockInfo->rows - (int32_t)pQueryAttr->limit.offset - 1;
//   }
1690
//
L
Liu Jicong 已提交
1691
//   assert(pQueryAttr->pos >= 0 && pQueryAttr->pos <= pBlockInfo->rows - 1);
1692
//
L
Liu Jicong 已提交
1693 1694
//   SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//   SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1695
//
L
Liu Jicong 已提交
1696 1697
//   // update the pQueryAttr->limit.offset value, and pQueryAttr->pos value
//   TSKEY *keys = (TSKEY *) pColInfoData->pData;
1698
//
L
Liu Jicong 已提交
1699 1700 1701
//   // update the offset value
//   pTableQueryInfo->lastKey = keys[pQueryAttr->pos];
//   pQueryAttr->limit.offset = 0;
1702
//
L
Liu Jicong 已提交
1703
//   int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
1704
//
L
Liu Jicong 已提交
1705 1706 1707 1708
//   //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numBlocksOfStep:%d, numOfRes:%d,
//   lastKey:%"PRId64, GET_TASKID(pRuntimeEnv),
//          pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes, pQuery->current->lastKey);
// }
1709

L
Liu Jicong 已提交
1710 1711
// void skipBlocks(STaskRuntimeEnv *pRuntimeEnv) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
1712
//
L
Liu Jicong 已提交
1713 1714 1715
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0) {
//     return;
//   }
1716
//
L
Liu Jicong 已提交
1717 1718
//   pQueryAttr->pos = 0;
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1719
//
L
Liu Jicong 已提交
1720 1721
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
//   TsdbQueryHandleT pTsdbReadHandle = pRuntimeEnv->pTsdbReadHandle;
1722
//
L
Liu Jicong 已提交
1723 1724 1725 1726 1727
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pTsdbReadHandle)) {
//     if (isTaskKilled(pRuntimeEnv->qinfo)) {
//       longjmp(pRuntimeEnv->env, TSDB_CODE_TSC_QUERY_CANCELLED);
//     }
1728
//
L
Liu Jicong 已提交
1729
//     tsdbRetrieveDataBlockInfo(pTsdbReadHandle, &blockInfo);
1730
//
L
Liu Jicong 已提交
1731 1732 1733 1734
//     if (pQueryAttr->limit.offset > blockInfo.rows) {
//       pQueryAttr->limit.offset -= blockInfo.rows;
//       pTableQueryInfo->lastKey = (QUERY_IS_ASC_QUERY(pQueryAttr)) ? blockInfo.window.ekey : blockInfo.window.skey;
//       pTableQueryInfo->lastKey += step;
1735
//
L
Liu Jicong 已提交
1736 1737 1738 1739 1740 1741 1742
//       //qDebug("QInfo:0x%"PRIx64" skip rows:%d, offset:%" PRId64, GET_TASKID(pRuntimeEnv), blockInfo.rows,
//              pQuery->limit.offset);
//     } else {  // find the appropriated start position in current block
//       updateOffsetVal(pRuntimeEnv, &blockInfo);
//       break;
//     }
//   }
1743
//
L
Liu Jicong 已提交
1744 1745 1746 1747 1748 1749 1750 1751 1752
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
// }

// static TSKEY doSkipIntervalProcess(STaskRuntimeEnv* pRuntimeEnv, STimeWindow* win, SDataBlockInfo* pBlockInfo,
// STableQueryInfo* pTableQueryInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
1753
//
L
Liu Jicong 已提交
1754 1755 1756
//   assert(pQueryAttr->limit.offset == 0);
//   STimeWindow tw = *win;
//   getNextTimeWindow(pQueryAttr, &tw);
1757
//
L
Liu Jicong 已提交
1758 1759
//   if ((tw.skey <= pBlockInfo->window.ekey && QUERY_IS_ASC_QUERY(pQueryAttr)) ||
//       (tw.ekey >= pBlockInfo->window.skey && !QUERY_IS_ASC_QUERY(pQueryAttr))) {
1760
//
L
Liu Jicong 已提交
1761 1762 1763 1764
//     // load the data block and check data remaining in current data block
//     // TODO optimize performance
//     SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//     SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1765
//
L
Liu Jicong 已提交
1766 1767 1768 1769
//     tw = *win;
//     int32_t startPos =
//         getNextQualifiedWindow(pQueryAttr, &tw, pBlockInfo, pColInfoData->pData, binarySearchForKey, -1);
//     assert(startPos >= 0);
1770
//
L
Liu Jicong 已提交
1771 1772
//     // set the abort info
//     pQueryAttr->pos = startPos;
1773
//
L
Liu Jicong 已提交
1774 1775 1776 1777
//     // reset the query start timestamp
//     pTableQueryInfo->win.skey = ((TSKEY *)pColInfoData->pData)[startPos];
//     pQueryAttr->window.skey = pTableQueryInfo->win.skey;
//     TSKEY key = pTableQueryInfo->win.skey;
1778
//
L
Liu Jicong 已提交
1779 1780
//     pWindowResInfo->prevSKey = tw.skey;
//     int32_t index = pRuntimeEnv->resultRowInfo.curIndex;
1781
//
L
Liu Jicong 已提交
1782 1783
//     int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
//     pRuntimeEnv->resultRowInfo.curIndex = index;  // restore the window index
1784
//
L
Liu Jicong 已提交
1785 1786 1787 1788
//     //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numOfRows:%d, numOfRes:%d,
//     lastKey:%" PRId64,
//            GET_TASKID(pRuntimeEnv), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes,
//            pQueryAttr->current->lastKey);
1789
//
L
Liu Jicong 已提交
1790 1791 1792 1793 1794
//     return key;
//   } else {  // do nothing
//     pQueryAttr->window.skey      = tw.skey;
//     pWindowResInfo->prevSKey = tw.skey;
//     pTableQueryInfo->lastKey = tw.skey;
1795
//
L
Liu Jicong 已提交
1796 1797
//     return tw.skey;
//   }
1798
//
L
Liu Jicong 已提交
1799 1800 1801 1802 1803 1804 1805 1806 1807 1808
//   return true;
// }

// static bool skipTimeInterval(STaskRuntimeEnv *pRuntimeEnv, TSKEY* start) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     assert(*start <= pRuntimeEnv->current->lastKey);
//   } else {
//     assert(*start >= pRuntimeEnv->current->lastKey);
//   }
1809
//
L
Liu Jicong 已提交
1810 1811 1812 1813 1814
//   // if queried with value filter, do NOT forward query start position
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0 || pRuntimeEnv->pTsBuf != NULL ||
//   pRuntimeEnv->pFillInfo != NULL) {
//     return true;
//   }
1815
//
L
Liu Jicong 已提交
1816 1817 1818 1819 1820 1821 1822
//   /*
//    * 1. for interval without interpolation query we forward pQueryAttr->interval.interval at a time for
//    *    pQueryAttr->limit.offset times. Since hole exists, pQueryAttr->interval.interval*pQueryAttr->limit.offset
//    value is
//    *    not valid. otherwise, we only forward pQueryAttr->limit.offset number of points
//    */
//   assert(pRuntimeEnv->resultRowInfo.prevSKey == TSKEY_INITIAL_VAL);
1823
//
L
Liu Jicong 已提交
1824 1825
//   STimeWindow w = TSWINDOW_INITIALIZER;
//   bool ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1826
//
L
Liu Jicong 已提交
1827 1828
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
//   STableQueryInfo *pTableQueryInfo = pRuntimeEnv->current;
1829
//
L
Liu Jicong 已提交
1830 1831 1832
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pRuntimeEnv->pTsdbReadHandle)) {
//     tsdbRetrieveDataBlockInfo(pRuntimeEnv->pTsdbReadHandle, &blockInfo);
1833
//
L
Liu Jicong 已提交
1834 1835 1836 1837 1838 1839 1840 1841 1842
//     if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       if (pWindowResInfo->prevSKey == TSKEY_INITIAL_VAL) {
//         getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.skey, blockInfo.window.skey, pQueryAttr->window.ekey,
//         &w); pWindowResInfo->prevSKey = w.skey;
//       }
//     } else {
//       getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.ekey, pQueryAttr->window.ekey, blockInfo.window.ekey, &w);
//       pWindowResInfo->prevSKey = w.skey;
//     }
1843
//
L
Liu Jicong 已提交
1844 1845
//     // the first time window
//     STimeWindow win = getActiveTimeWindow(pWindowResInfo, pWindowResInfo->prevSKey, pQueryAttr);
1846
//
L
Liu Jicong 已提交
1847 1848
//     while (pQueryAttr->limit.offset > 0) {
//       STimeWindow tw = win;
1849
//
L
Liu Jicong 已提交
1850 1851 1852
//       if ((win.ekey <= blockInfo.window.ekey && ascQuery) || (win.ekey >= blockInfo.window.skey && !ascQuery)) {
//         pQueryAttr->limit.offset -= 1;
//         pWindowResInfo->prevSKey = win.skey;
1853
//
L
Liu Jicong 已提交
1854 1855 1856 1857 1858 1859
//         // current time window is aligned with blockInfo.window.ekey
//         // restart it from next data block by set prevSKey to be TSKEY_INITIAL_VAL;
//         if ((win.ekey == blockInfo.window.ekey && ascQuery) || (win.ekey == blockInfo.window.skey && !ascQuery)) {
//           pWindowResInfo->prevSKey = TSKEY_INITIAL_VAL;
//         }
//       }
1860
//
L
Liu Jicong 已提交
1861 1862 1863 1864
//       if (pQueryAttr->limit.offset == 0) {
//         *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//         return true;
//       }
1865
//
L
Liu Jicong 已提交
1866 1867
//       // current window does not ended in current data block, try next data block
//       getNextTimeWindow(pQueryAttr, &tw);
1868
//
L
Liu Jicong 已提交
1869 1870 1871 1872 1873 1874 1875 1876 1877
//       /*
//        * If the next time window still starts from current data block,
//        * load the primary timestamp column first, and then find the start position for the next queried time window.
//        * Note that only the primary timestamp column is required.
//        * TODO: Optimize for this cases. All data blocks are not needed to be loaded, only if the first actually
//        required
//        * time window resides in current data block.
//        */
//       if ((tw.skey <= blockInfo.window.ekey && ascQuery) || (tw.ekey >= blockInfo.window.skey && !ascQuery)) {
1878
//
L
Liu Jicong 已提交
1879 1880
//         SArray *pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//         SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1881
//
L
Liu Jicong 已提交
1882 1883 1884
//         if ((win.ekey > blockInfo.window.ekey && ascQuery) || (win.ekey < blockInfo.window.skey && !ascQuery)) {
//           pQueryAttr->limit.offset -= 1;
//         }
1885
//
L
Liu Jicong 已提交
1886 1887 1888 1889 1890 1891 1892 1893
//         if (pQueryAttr->limit.offset == 0) {
//           *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//           return true;
//         } else {
//           tw = win;
//           int32_t startPos =
//               getNextQualifiedWindow(pQueryAttr, &tw, &blockInfo, pColInfoData->pData, binarySearchForKey, -1);
//           assert(startPos >= 0);
1894
//
L
Liu Jicong 已提交
1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905
//           // set the abort info
//           pQueryAttr->pos = startPos;
//           pTableQueryInfo->lastKey = ((TSKEY *)pColInfoData->pData)[startPos];
//           pWindowResInfo->prevSKey = tw.skey;
//           win = tw;
//         }
//       } else {
//         break;  // offset is not 0, and next time window begins or ends in the next block.
//       }
//     }
//   }
1906
//
L
Liu Jicong 已提交
1907 1908 1909 1910
//   // check for error
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
1911
//
L
Liu Jicong 已提交
1912 1913
//   return true;
// }
1914

1915
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num) {
H
Haojun Liao 已提交
1916
  if (p->pDownstream == NULL) {
H
Haojun Liao 已提交
1917
    assert(p->numOfDownstream == 0);
1918 1919
  }

wafwerar's avatar
wafwerar 已提交
1920
  p->pDownstream = taosMemoryCalloc(1, num * POINTER_BYTES);
1921 1922 1923 1924 1925 1926 1927
  if (p->pDownstream == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  memcpy(p->pDownstream, pDownstream, num * POINTER_BYTES);
  p->numOfDownstream = num;
  return TSDB_CODE_SUCCESS;
1928 1929
}

wmmhello's avatar
wmmhello 已提交
1930
static void doDestroyTableList(STableListInfo* pTableqinfoList);
1931

1932
static void doTableQueryInfoTimeWindowCheck(SExecTaskInfo* pTaskInfo, STableQueryInfo* pTableQueryInfo, int32_t order) {
H
Haojun Liao 已提交
1933 1934
#if 0
    if (order == TSDB_ORDER_ASC) {
1935 1936
    assert(
        (pTableQueryInfo->win.skey <= pTableQueryInfo->win.ekey) &&
H
Haojun Liao 已提交
1937 1938
        (pTableQueryInfo->lastKey >= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey >= pTaskInfo->window.skey && pTableQueryInfo->win.ekey <= pTaskInfo->window.ekey));
1939 1940 1941
  } else {
    assert(
        (pTableQueryInfo->win.skey >= pTableQueryInfo->win.ekey) &&
H
Haojun Liao 已提交
1942 1943
        (pTableQueryInfo->lastKey <= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey <= pTaskInfo->window.skey && pTableQueryInfo->win.ekey >= pTaskInfo->window.ekey));
1944
  }
H
Haojun Liao 已提交
1945
#endif
1946 1947
}

1948 1949 1950 1951
typedef struct SFetchRspHandleWrapper {
  uint32_t exchangeId;
  int32_t  sourceIndex;
} SFetchRspHandleWrapper;
1952

D
dapan1121 已提交
1953
int32_t loadRemoteDataCallback(void* param, SDataBuf* pMsg, int32_t code) {
X
Xiaoyu Wang 已提交
1954
  SFetchRspHandleWrapper* pWrapper = (SFetchRspHandleWrapper*)param;
1955 1956 1957 1958 1959 1960 1961

  SExchangeInfo* pExchangeInfo = taosAcquireRef(exchangeObjRefPool, pWrapper->exchangeId);
  if (pExchangeInfo == NULL) {
    qWarn("failed to acquire exchange operator, since it may have been released");
    return TSDB_CODE_SUCCESS;
  }

X
Xiaoyu Wang 已提交
1962
  int32_t          index = pWrapper->sourceIndex;
1963
  SSourceDataInfo* pSourceDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, index);
1964

H
Haojun Liao 已提交
1965 1966
  if (code == TSDB_CODE_SUCCESS) {
    pSourceDataInfo->pRsp = pMsg->pData;
1967

H
Haojun Liao 已提交
1968 1969
    SRetrieveTableRsp* pRsp = pSourceDataInfo->pRsp;
    pRsp->numOfRows = htonl(pRsp->numOfRows);
dengyihao's avatar
dengyihao 已提交
1970
    pRsp->compLen = htonl(pRsp->compLen);
1971
    pRsp->numOfCols = htonl(pRsp->numOfCols);
dengyihao's avatar
dengyihao 已提交
1972
    pRsp->useconds = htobe64(pRsp->useconds);
1973

1974
    ASSERT(pRsp != NULL);
1975
    qDebug("%s fetch rsp received, index:%d, rows:%d", pSourceDataInfo->taskId, index, pRsp->numOfRows);
H
Haojun Liao 已提交
1976 1977 1978
  } else {
    pSourceDataInfo->code = code;
  }
H
Haojun Liao 已提交
1979

H
Haojun Liao 已提交
1980
  pSourceDataInfo->status = EX_SOURCE_DATA_READY;
1981 1982 1983 1984 1985

  tsem_post(&pExchangeInfo->ready);
  taosReleaseRef(exchangeObjRefPool, pWrapper->exchangeId);

  taosMemoryFree(pWrapper);
wmmhello's avatar
wmmhello 已提交
1986
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
1987 1988 1989 1990
}

static void destroySendMsgInfo(SMsgSendInfo* pMsgBody) {
  assert(pMsgBody != NULL);
wafwerar's avatar
wafwerar 已提交
1991 1992
  taosMemoryFreeClear(pMsgBody->msgInfo.pData);
  taosMemoryFreeClear(pMsgBody);
H
Haojun Liao 已提交
1993 1994
}

S
Shengliang Guan 已提交
1995
void qProcessFetchRsp(void* parent, SRpcMsg* pMsg, SEpSet* pEpSet) {
S
Shengliang Guan 已提交
1996 1997
  SMsgSendInfo* pSendInfo = (SMsgSendInfo*)pMsg->info.ahandle;
  assert(pMsg->info.ahandle != NULL);
H
Haojun Liao 已提交
1998 1999 2000 2001

  SDataBuf buf = {.len = pMsg->contLen, .pData = NULL};

  if (pMsg->contLen > 0) {
wafwerar's avatar
wafwerar 已提交
2002
    buf.pData = taosMemoryCalloc(1, pMsg->contLen);
H
Haojun Liao 已提交
2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013
    if (buf.pData == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      pMsg->code = TSDB_CODE_OUT_OF_MEMORY;
    } else {
      memcpy(buf.pData, pMsg->pCont, pMsg->contLen);
    }
  }

  pSendInfo->fp(pSendInfo->param, &buf, pMsg->code);
  rpcFreeCont(pMsg->pCont);
  destroySendMsgInfo(pSendInfo);
2014 2015
}

L
Liu Jicong 已提交
2016
static int32_t doSendFetchDataRequest(SExchangeInfo* pExchangeInfo, SExecTaskInfo* pTaskInfo, int32_t sourceIndex) {
2017
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2018

wafwerar's avatar
wafwerar 已提交
2019
  SResFetchReq* pMsg = taosMemoryCalloc(1, sizeof(SResFetchReq));
2020 2021 2022 2023
  if (NULL == pMsg) {
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }
2024

L
Liu Jicong 已提交
2025 2026
  SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, sourceIndex);
  SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, sourceIndex);
2027

2028 2029
  ASSERT(pDataInfo->status == EX_SOURCE_DATA_NOT_READY);

2030 2031 2032
  qDebug("%s build fetch msg and send to vgId:%d, ep:%s, taskId:0x%" PRIx64 ", execId:%d, %d/%" PRIzu,
         GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->addr.epSet.eps[0].fqdn, pSource->taskId, pSource->execId,
         sourceIndex, totalSources);
2033 2034 2035 2036 2037

  pMsg->header.vgId = htonl(pSource->addr.nodeId);
  pMsg->sId = htobe64(pSource->schedId);
  pMsg->taskId = htobe64(pSource->taskId);
  pMsg->queryId = htobe64(pTaskInfo->id.queryId);
D
dapan1121 已提交
2038
  pMsg->execId = htonl(pSource->execId);
2039 2040

  // send the fetch remote task result reques
wafwerar's avatar
wafwerar 已提交
2041
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
2042
  if (NULL == pMsgSendInfo) {
wafwerar's avatar
wafwerar 已提交
2043
    taosMemoryFreeClear(pMsg);
2044 2045 2046
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SMsgSendInfo));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
H
Haojun Liao 已提交
2047 2048
  }

2049
  SFetchRspHandleWrapper* pWrapper = taosMemoryCalloc(1, sizeof(SFetchRspHandleWrapper));
X
Xiaoyu Wang 已提交
2050
  pWrapper->exchangeId = pExchangeInfo->self;
2051 2052 2053
  pWrapper->sourceIndex = sourceIndex;

  pMsgSendInfo->param = pWrapper;
2054 2055
  pMsgSendInfo->msgInfo.pData = pMsg;
  pMsgSendInfo->msgInfo.len = sizeof(SResFetchReq);
L
Liu Jicong 已提交
2056
  pMsgSendInfo->msgType = pSource->fetchMsgType;
2057
  pMsgSendInfo->fp = loadRemoteDataCallback;
2058

2059
  int64_t transporterId = 0;
L
Liu Jicong 已提交
2060
  int32_t code = asyncSendMsgToServer(pExchangeInfo->pTransporter, &pSource->addr.epSet, &transporterId, pMsgSendInfo);
2061 2062 2063
  return TSDB_CODE_SUCCESS;
}

2064
int32_t extractDataBlockFromFetchRsp(SSDataBlock* pRes, SLoadRemoteDataInfo* pLoadInfo, int32_t numOfRows, char* pData,
L
Liu Jicong 已提交
2065 2066
                                     int32_t compLen, int32_t numOfOutput, int64_t startTs, uint64_t* total,
                                     SArray* pColList) {
H
Haojun Liao 已提交
2067
  if (pColList == NULL) {  // data from other sources
2068
    blockDataCleanup(pRes);
2069
    //    blockDataEnsureCapacity(pRes, numOfRows);
2070
    blockDecode(pRes, numOfOutput, numOfRows, pData);
H
Haojun Liao 已提交
2071
  } else {  // extract data according to pColList
2072
    ASSERT(numOfOutput == taosArrayGetSize(pColList));
2073 2074 2075 2076 2077
    char* pStart = pData;

    int32_t numOfCols = htonl(*(int32_t*)pStart);
    pStart += sizeof(int32_t);

2078
    // todo refactor:extract method
2079
    SSysTableSchema* pSchema = (SSysTableSchema*)pStart;
dengyihao's avatar
dengyihao 已提交
2080
    for (int32_t i = 0; i < numOfCols; ++i) {
2081 2082 2083 2084 2085 2086 2087
      SSysTableSchema* p = (SSysTableSchema*)pStart;

      p->colId = htons(p->colId);
      p->bytes = htonl(p->bytes);
      pStart += sizeof(SSysTableSchema);
    }

2088
    SSDataBlock* pBlock = createDataBlock();
dengyihao's avatar
dengyihao 已提交
2089
    for (int32_t i = 0; i < numOfCols; ++i) {
2090 2091
      SColumnInfoData idata = createColumnInfoData(pSchema[i].type, pSchema[i].bytes, pSchema[i].colId);
      blockDataAppendColInfo(pBlock, &idata);
2092 2093
    }

2094
    blockDecode(pBlock, numOfCols, numOfRows, pStart);
2095 2096
    blockDataEnsureCapacity(pRes, numOfRows);

H
Haojun Liao 已提交
2097
    // data from mnode
2098
    pRes->info.rows = numOfRows;
2099 2100
    relocateColumnData(pRes, pColList, pBlock->pDataBlock, false);
    blockDataDestroy(pBlock);
2101
  }
2102

2103 2104
  // todo move this to time window aggregator, since the primary timestamp may not be known by exchange operator.
  blockDataUpdateTsWindow(pRes, 0);
2105

2106
  int64_t el = taosGetTimestampUs() - startTs;
2107

H
Haojun Liao 已提交
2108 2109
  pLoadInfo->totalRows += numOfRows;
  pLoadInfo->totalSize += compLen;
2110

H
Haojun Liao 已提交
2111 2112 2113
  if (total != NULL) {
    *total += numOfRows;
  }
2114

H
Haojun Liao 已提交
2115
  pLoadInfo->totalElapsed += el;
2116 2117
  return TSDB_CODE_SUCCESS;
}
2118

L
Liu Jicong 已提交
2119 2120
static void* setAllSourcesCompleted(SOperatorInfo* pOperator, int64_t startTs) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
2121
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
H
Haojun Liao 已提交
2122

2123
  int64_t              el = taosGetTimestampUs() - startTs;
H
Haojun Liao 已提交
2124
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2125

H
Haojun Liao 已提交
2126
  pLoadInfo->totalElapsed += el;
H
Haojun Liao 已提交
2127

2128
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);
L
Liu Jicong 已提交
2129 2130 2131
  qDebug("%s all %" PRIzu " sources are exhausted, total rows: %" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
         GET_TASKID(pTaskInfo), totalSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
         pLoadInfo->totalElapsed / 1000.0);
2132 2133 2134 2135 2136

  doSetOperatorCompleted(pOperator);
  return NULL;
}

L
Liu Jicong 已提交
2137 2138
static SSDataBlock* concurrentlyLoadRemoteDataImpl(SOperatorInfo* pOperator, SExchangeInfo* pExchangeInfo,
                                                   SExecTaskInfo* pTaskInfo) {
2139 2140 2141 2142 2143 2144 2145 2146
  int32_t code = 0;
  int64_t startTs = taosGetTimestampUs();
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  while (1) {
    int32_t completed = 0;
    for (int32_t i = 0; i < totalSources; ++i) {
      SSourceDataInfo* pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, i);
2147
      if (pDataInfo->status == EX_SOURCE_DATA_EXHAUSTED) {
2148
        completed += 1;
H
Haojun Liao 已提交
2149 2150
        continue;
      }
2151

2152
      if (pDataInfo->status != EX_SOURCE_DATA_READY) {
2153 2154 2155
        continue;
      }

2156 2157 2158 2159 2160
      if (pDataInfo->code != TSDB_CODE_SUCCESS) {
        code = pDataInfo->code;
        goto _error;
      }

L
Liu Jicong 已提交
2161
      SRetrieveTableRsp*     pRsp = pDataInfo->pRsp;
X
Xiaoyu Wang 已提交
2162
      SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, i);
2163

L
Liu Jicong 已提交
2164
      SSDataBlock*         pRes = pExchangeInfo->pResult;
H
Haojun Liao 已提交
2165
      SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2166
      if (pRsp->numOfRows == 0) {
2167 2168
        qDebug("%s vgId:%d, taskId:0x%" PRIx64 " execId:%d index:%d completed, rowsOfSource:%" PRIu64
               ", totalRows:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
D
dapan1121 已提交
2169
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pDataInfo->totalRows,
2170
               pExchangeInfo->loadInfo.totalRows, completed + 1, i + 1, totalSources);
2171
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2172
        completed += 1;
D
dapan1121 已提交
2173
        taosMemoryFreeClear(pDataInfo->pRsp);
2174 2175
        continue;
      }
H
Haojun Liao 已提交
2176

H
Haojun Liao 已提交
2177
      SRetrieveTableRsp* pTableRsp = pDataInfo->pRsp;
L
Liu Jicong 已提交
2178 2179 2180
      code =
          extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pTableRsp->numOfRows, pTableRsp->data,
                                       pTableRsp->compLen, pTableRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
2181
      if (code != 0) {
2182
        taosMemoryFreeClear(pDataInfo->pRsp);
2183 2184 2185
        goto _error;
      }

2186
      if (pRsp->completed == 1) {
2187 2188
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d"
X
Xiaoyu Wang 已提交
2189 2190
               " index:%d completed, numOfRows:%d, rowsOfSource:%" PRIu64 ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64
               ", completed:%d try next %d/%" PRIzu,
2191 2192
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pRes->info.rows,
               pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, completed + 1, i + 1, totalSources);
2193
        completed += 1;
2194
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2195
      } else {
D
dapan1121 已提交
2196
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
dengyihao's avatar
dengyihao 已提交
2197
               ", totalBytes:%" PRIu64,
2198 2199
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
               pLoadInfo->totalRows, pLoadInfo->totalSize);
2200 2201
      }

2202 2203
      taosMemoryFreeClear(pDataInfo->pRsp);

2204 2205
      if (pDataInfo->status != EX_SOURCE_DATA_EXHAUSTED) {
        pDataInfo->status = EX_SOURCE_DATA_NOT_READY;
2206 2207
        code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
        if (code != TSDB_CODE_SUCCESS) {
2208
          taosMemoryFreeClear(pDataInfo->pRsp);
2209 2210 2211 2212 2213 2214 2215
          goto _error;
        }
      }

      return pExchangeInfo->pResult;
    }

2216
    if (completed == totalSources) {
2217 2218 2219 2220 2221 2222 2223 2224 2225
      return setAllSourcesCompleted(pOperator, startTs);
    }
  }

_error:
  pTaskInfo->code = code;
  return NULL;
}

L
Liu Jicong 已提交
2226 2227 2228
static int32_t prepareConcurrentlyLoad(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2229

L
Liu Jicong 已提交
2230
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2231 2232 2233
  int64_t startTs = taosGetTimestampUs();

  // Asynchronously send all fetch requests to all sources.
L
Liu Jicong 已提交
2234
  for (int32_t i = 0; i < totalSources; ++i) {
2235 2236
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
    if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
2237 2238
      pTaskInfo->code = code;
      return code;
2239 2240 2241 2242
    }
  }

  int64_t endTs = taosGetTimestampUs();
2243
  qDebug("%s send all fetch requests to %" PRIzu " sources completed, elapsed:%.2fms", GET_TASKID(pTaskInfo),
X
Xiaoyu Wang 已提交
2244
         totalSources, (endTs - startTs) / 1000.0);
2245

2246
  pOperator->status = OP_RES_TO_RETURN;
H
Haojun Liao 已提交
2247
  pOperator->cost.openCost = taosGetTimestampUs() - startTs;
2248

2249
  tsem_wait(&pExchangeInfo->ready);
H
Haojun Liao 已提交
2250
  return TSDB_CODE_SUCCESS;
2251 2252
}

L
Liu Jicong 已提交
2253 2254 2255
static SSDataBlock* seqLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2256

L
Liu Jicong 已提交
2257
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2258
  int64_t startTs = taosGetTimestampUs();
2259

L
Liu Jicong 已提交
2260
  while (1) {
2261 2262
    if (pExchangeInfo->current >= totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
2263
    }
2264

2265 2266 2267
    doSendFetchDataRequest(pExchangeInfo, pTaskInfo, pExchangeInfo->current);
    tsem_wait(&pExchangeInfo->ready);

dengyihao's avatar
dengyihao 已提交
2268
    SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, pExchangeInfo->current);
X
Xiaoyu Wang 已提交
2269
    SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, pExchangeInfo->current);
2270

H
Haojun Liao 已提交
2271
    if (pDataInfo->code != TSDB_CODE_SUCCESS) {
2272 2273
      qError("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d error happens, code:%s", GET_TASKID(pTaskInfo),
             pSource->addr.nodeId, pSource->taskId, pSource->execId, tstrerror(pDataInfo->code));
H
Haojun Liao 已提交
2274 2275 2276 2277
      pOperator->pTaskInfo->code = pDataInfo->code;
      return NULL;
    }

L
Liu Jicong 已提交
2278
    SRetrieveTableRsp*   pRsp = pDataInfo->pRsp;
H
Haojun Liao 已提交
2279
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2280
    if (pRsp->numOfRows == 0) {
2281 2282
      qDebug("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d %d of total completed, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 " try next",
D
dapan1121 已提交
2283
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pExchangeInfo->current + 1,
H
Haojun Liao 已提交
2284
             pDataInfo->totalRows, pLoadInfo->totalRows);
H
Haojun Liao 已提交
2285

2286
      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2287
      pExchangeInfo->current += 1;
D
dapan1121 已提交
2288
      taosMemoryFreeClear(pDataInfo->pRsp);
2289 2290
      continue;
    }
H
Haojun Liao 已提交
2291

L
Liu Jicong 已提交
2292
    SSDataBlock*       pRes = pExchangeInfo->pResult;
H
Haojun Liao 已提交
2293
    SRetrieveTableRsp* pTableRsp = pDataInfo->pRsp;
L
Liu Jicong 已提交
2294
    int32_t            code =
2295
        extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pTableRsp->numOfRows, pTableRsp->data,
L
Liu Jicong 已提交
2296
                                     pTableRsp->compLen, pTableRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
2297 2298

    if (pRsp->completed == 1) {
D
dapan1121 已提交
2299
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, rowsOfSource:%" PRIu64
L
Liu Jicong 已提交
2300
             ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64 " try next %d/%" PRIzu,
2301 2302 2303
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, pExchangeInfo->current + 1,
             totalSources);
2304

2305
      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2306 2307
      pExchangeInfo->current += 1;
    } else {
D
dapan1121 已提交
2308
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
L
Liu Jicong 已提交
2309
             ", totalBytes:%" PRIu64,
2310 2311
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pLoadInfo->totalRows, pLoadInfo->totalSize);
2312 2313
    }

2314
    pOperator->resultInfo.totalRows += pRes->info.rows;
2315
    taosMemoryFreeClear(pDataInfo->pRsp);
2316 2317
    return pExchangeInfo->pResult;
  }
2318 2319
}

L
Liu Jicong 已提交
2320
static int32_t prepareLoadRemoteData(SOperatorInfo* pOperator) {
2321
  if (OPTR_IS_OPENED(pOperator)) {
H
Haojun Liao 已提交
2322 2323 2324
    return TSDB_CODE_SUCCESS;
  }

2325 2326
  int64_t st = taosGetTimestampUs();

L
Liu Jicong 已提交
2327
  SExchangeInfo* pExchangeInfo = pOperator->info;
2328
  if (!pExchangeInfo->seqLoadData) {
H
Haojun Liao 已提交
2329 2330 2331 2332 2333 2334
    int32_t code = prepareConcurrentlyLoad(pOperator);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }
  }

2335
  OPTR_SET_OPENED(pOperator);
2336
  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
H
Haojun Liao 已提交
2337 2338 2339
  return TSDB_CODE_SUCCESS;
}

2340
static SSDataBlock* doLoadRemoteData(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
2341 2342
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2343

2344
  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
2345
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
2346 2347
    return NULL;
  }
2348

L
Liu Jicong 已提交
2349
  size_t               totalSources = taosArrayGetSize(pExchangeInfo->pSources);
H
Haojun Liao 已提交
2350
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
H
Haojun Liao 已提交
2351

2352
  if (pOperator->status == OP_EXEC_DONE) {
L
Liu Jicong 已提交
2353 2354 2355
    qDebug("%s all %" PRIzu " source(s) are exhausted, total rows:%" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
           GET_TASKID(pTaskInfo), totalSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
           pLoadInfo->totalElapsed / 1000.0);
2356 2357 2358 2359 2360 2361
    return NULL;
  }

  if (pExchangeInfo->seqLoadData) {
    return seqLoadRemoteData(pOperator);
  } else {
2362
    return concurrentlyLoadRemoteDataImpl(pOperator, pExchangeInfo, pTaskInfo);
2363
  }
H
Haojun Liao 已提交
2364
}
2365

2366
static int32_t initDataSource(int32_t numOfSources, SExchangeInfo* pInfo, const char* id) {
2367
  pInfo->pSourceDataInfo = taosArrayInit(numOfSources, sizeof(SSourceDataInfo));
H
Haojun Liao 已提交
2368 2369
  if (pInfo->pSourceDataInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
2370 2371
  }

L
Liu Jicong 已提交
2372
  for (int32_t i = 0; i < numOfSources; ++i) {
2373
    SSourceDataInfo dataInfo = {0};
H
Haojun Liao 已提交
2374
    dataInfo.status = EX_SOURCE_DATA_NOT_READY;
2375
    dataInfo.taskId = id;
L
Liu Jicong 已提交
2376
    dataInfo.index = i;
X
Xiaoyu Wang 已提交
2377
    SSourceDataInfo* pDs = taosArrayPush(pInfo->pSourceDataInfo, &dataInfo);
2378
    if (pDs == NULL) {
H
Haojun Liao 已提交
2379 2380 2381 2382 2383 2384 2385 2386
      taosArrayDestroy(pInfo->pSourceDataInfo);
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
}

2387
static int32_t initExchangeOperator(SExchangePhysiNode* pExNode, SExchangeInfo* pInfo, const char* id) {
2388
  size_t numOfSources = LIST_LENGTH(pExNode->pSrcEndPoints);
H
Haojun Liao 已提交
2389

2390
  if (numOfSources == 0) {
X
Xiaoyu Wang 已提交
2391
    qError("%s invalid number: %d of sources in exchange operator", id, (int32_t)numOfSources);
2392 2393 2394
    return TSDB_CODE_INVALID_PARA;
  }

H
Haojun Liao 已提交
2395
  pInfo->pSources = taosArrayInit(numOfSources, sizeof(SDownstreamSourceNode));
wmmhello's avatar
wmmhello 已提交
2396
  if (pInfo->pSources == NULL) {
2397
    return TSDB_CODE_OUT_OF_MEMORY;
H
Haojun Liao 已提交
2398 2399
  }

L
Liu Jicong 已提交
2400
  for (int32_t i = 0; i < numOfSources; ++i) {
D
dapan1121 已提交
2401
    SDownstreamSourceNode* pNode = (SDownstreamSourceNode*)nodesListGetNode((SNodeList*)pExNode->pSrcEndPoints, i);
H
Haojun Liao 已提交
2402 2403
    taosArrayPush(pInfo->pSources, pNode);
  }
2404

2405 2406
  pInfo->self = taosAddRef(exchangeObjRefPool, pInfo);

2407
  return initDataSource(numOfSources, pInfo, id);
2408 2409 2410 2411 2412 2413
}

SOperatorInfo* createExchangeOperatorInfo(void* pTransporter, SExchangePhysiNode* pExNode, SExecTaskInfo* pTaskInfo) {
  SExchangeInfo* pInfo = taosMemoryCalloc(1, sizeof(SExchangeInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
H
Haojun Liao 已提交
2414
    goto _error;
2415
  }
H
Haojun Liao 已提交
2416

2417
  int32_t code = initExchangeOperator(pExNode, pInfo, GET_TASKID(pTaskInfo));
2418 2419 2420
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
2421 2422

  tsem_init(&pInfo->ready, 0, 0);
2423

2424
  pInfo->seqLoadData = false;
2425
  pInfo->pTransporter = pTransporter;
2426 2427
  pInfo->pResult = createResDataBlock(pExNode->node.pOutputDataBlockDesc);
  pOperator->name = "ExchangeOperator";
X
Xiaoyu Wang 已提交
2428
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_EXCHANGE;
X
Xiaoyu Wang 已提交
2429
  pOperator->blocking = false;
2430 2431
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
2432
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pResult->pDataBlock);
X
Xiaoyu Wang 已提交
2433
  pOperator->pTaskInfo = pTaskInfo;
2434

L
Liu Jicong 已提交
2435 2436
  pOperator->fpSet = createOperatorFpSet(prepareLoadRemoteData, doLoadRemoteData, NULL, NULL,
                                         destroyExchangeOperatorInfo, NULL, NULL, NULL);
2437
  return pOperator;
H
Haojun Liao 已提交
2438

L
Liu Jicong 已提交
2439
_error:
H
Haojun Liao 已提交
2440
  if (pInfo != NULL) {
2441
    doDestroyExchangeOperatorInfo(pInfo);
H
Haojun Liao 已提交
2442 2443
  }

wafwerar's avatar
wafwerar 已提交
2444 2445
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
2446
  pTaskInfo->code = code;
H
Haojun Liao 已提交
2447
  return NULL;
2448 2449
}

dengyihao's avatar
dengyihao 已提交
2450 2451
static int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                                const char* pKey);
2452

2453
static void destroySortedMergeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
2454
  SSortedMergeOperatorInfo* pInfo = (SSortedMergeOperatorInfo*)param;
H
Haojun Liao 已提交
2455
  taosArrayDestroy(pInfo->pSortInfo);
2456 2457 2458
  taosArrayDestroy(pInfo->groupInfo);

  if (pInfo->pSortHandle != NULL) {
H
Haojun Liao 已提交
2459
    tsortDestroySortHandle(pInfo->pSortHandle);
2460 2461
  }

H
Haojun Liao 已提交
2462
  blockDataDestroy(pInfo->binfo.pRes);
H
Haojun Liao 已提交
2463
  cleanupAggSup(&pInfo->aggSup);
2464
}
H
Haojun Liao 已提交
2465

L
Liu Jicong 已提交
2466
static bool needToMerge(SSDataBlock* pBlock, SArray* groupInfo, char** buf, int32_t rowIndex) {
2467 2468 2469 2470
  size_t size = taosArrayGetSize(groupInfo);
  if (size == 0) {
    return true;
  }
2471

2472 2473
  for (int32_t i = 0; i < size; ++i) {
    int32_t* index = taosArrayGet(groupInfo, i);
2474

2475
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
L
Liu Jicong 已提交
2476
    bool             isNull = colDataIsNull(pColInfo, rowIndex, pBlock->info.rows, NULL);
2477

2478 2479 2480
    if ((isNull && buf[i] != NULL) || (!isNull && buf[i] == NULL)) {
      return false;
    }
2481

2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494
    char* pCell = colDataGetData(pColInfo, rowIndex);
    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      if (varDataLen(pCell) != varDataLen(buf[i])) {
        return false;
      } else {
        if (memcmp(varDataVal(pCell), varDataVal(buf[i]), varDataLen(pCell)) != 0) {
          return false;
        }
      }
    } else {
      if (memcmp(pCell, buf[i], pColInfo->info.bytes) != 0) {
        return false;
      }
2495 2496 2497
    }
  }

2498
  return 0;
2499 2500
}

L
Liu Jicong 已提交
2501 2502 2503
static void doMergeResultImpl(SSortedMergeOperatorInfo* pInfo, SqlFunctionCtx* pCtx, int32_t numOfExpr,
                              int32_t rowIndex) {
  for (int32_t j = 0; j < numOfExpr; ++j) {  // TODO set row index
X
Xiaoyu Wang 已提交
2504
                                             //    pCtx[j].startRow = rowIndex;
2505 2506
  }

2507 2508
  for (int32_t j = 0; j < numOfExpr; ++j) {
    int32_t functionId = pCtx[j].functionId;
L
Liu Jicong 已提交
2509 2510 2511 2512 2513 2514 2515 2516 2517
    //    pCtx[j].fpSet->addInput(&pCtx[j]);

    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_MERGE);
    //    } else {
    //      assert(!TSDB_FUNC_IS_SCALAR(functionId));
    //      aAggs[functionId].mergeFunc(&pCtx[j]);
    //    }
2518
  }
2519
}
2520

L
Liu Jicong 已提交
2521 2522
static void doFinalizeResultImpl(SqlFunctionCtx* pCtx, int32_t numOfExpr) {
  for (int32_t j = 0; j < numOfExpr; ++j) {
2523 2524 2525 2526
    int32_t functionId = pCtx[j].functionId;
    //    if (functionId == FUNC_TAG_DUMMY || functionId == FUNC_TS_DUMMY) {
    //      continue;
    //    }
2527

2528 2529 2530 2531
    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_FINALIZE);
    //    } else {
dengyihao's avatar
dengyihao 已提交
2532
    //    pCtx[j].fpSet.finalize(&pCtx[j]);
2533 2534
  }
}
2535

2536
static bool saveCurrentTuple(char** rowColData, SArray* pColumnList, SSDataBlock* pBlock, int32_t rowIndex) {
L
Liu Jicong 已提交
2537
  int32_t size = (int32_t)taosArrayGetSize(pColumnList);
2538

L
Liu Jicong 已提交
2539 2540
  for (int32_t i = 0; i < size; ++i) {
    int32_t*         index = taosArrayGet(pColumnList, i);
2541
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
H
Haojun Liao 已提交
2542

2543 2544 2545
    char* data = colDataGetData(pColInfo, rowIndex);
    memcpy(rowColData[i], data, colDataGetLength(pColInfo, rowIndex));
  }
2546

2547 2548
  return true;
}
2549

2550 2551
static void doMergeImpl(SOperatorInfo* pOperator, int32_t numOfExpr, SSDataBlock* pBlock) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
2552

2553
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
2554

L
Liu Jicong 已提交
2555
  for (int32_t i = 0; i < pBlock->info.rows; ++i) {
2556 2557 2558 2559 2560 2561 2562 2563 2564
    if (!pInfo->hasGroupVal) {
      ASSERT(i == 0);
      doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
      pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, i);
    } else {
      if (needToMerge(pBlock, pInfo->groupInfo, pInfo->groupVal, i)) {
        doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
      } else {
        doFinalizeResultImpl(pCtx, numOfExpr);
2565 2566
        int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
        //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);
2567

2568
        // TODO check for available buffer;
H
Haojun Liao 已提交
2569

2570 2571 2572 2573 2574
        // next group info data
        pInfo->binfo.pRes->info.rows += numOfRows;
        for (int32_t j = 0; j < numOfExpr; ++j) {
          if (pCtx[j].functionId < 0) {
            continue;
2575
          }
2576

H
Haojun Liao 已提交
2577
          pCtx[j].fpSet.process(&pCtx[j]);
2578
        }
2579 2580 2581

        doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
        pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, i);
H
Haojun Liao 已提交
2582
      }
2583 2584 2585 2586
    }
  }
}

2587 2588
static SSDataBlock* doMerge(SOperatorInfo* pOperator) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
L
Liu Jicong 已提交
2589
  SSortHandle*              pHandle = pInfo->pSortHandle;
2590

2591
  SSDataBlock* pDataBlock = createOneDataBlock(pInfo->binfo.pRes, false);
2592
  blockDataEnsureCapacity(pDataBlock, pOperator->resultInfo.capacity);
2593

L
Liu Jicong 已提交
2594
  while (1) {
2595
    blockDataCleanup(pDataBlock);
2596
    while (1) {
H
Haojun Liao 已提交
2597
      STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
2598 2599
      if (pTupleHandle == NULL) {
        break;
2600
      }
2601

2602 2603
      // build datablock for merge for one group
      appendOneRowToDataBlock(pDataBlock, pTupleHandle);
2604
      if (pDataBlock->info.rows >= pOperator->resultInfo.capacity) {
2605 2606
        break;
      }
2607
    }
2608

2609 2610 2611
    if (pDataBlock->info.rows == 0) {
      break;
    }
2612

2613
    setInputDataBlock(pOperator, pOperator->exprSupp.pCtx, pDataBlock, TSDB_ORDER_ASC, MAIN_SCAN, true);
L
Liu Jicong 已提交
2614 2615
    //  updateOutputBuf(&pInfo->binfo, &pAggInfo->bufCapacity, pBlock->info.rows * pAggInfo->resultRowFactor,
    //  pOperator->pRuntimeEnv, true);
2616
    doMergeImpl(pOperator, pOperator->exprSupp.numOfExprs, pDataBlock);
2617 2618
    // flush to tuple store, and after all data have been handled, return to upstream node or sink node
  }
2619

2620 2621 2622
  doFinalizeResultImpl(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs);
  int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
  //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);
2623

2624
  // TODO check for available buffer;
2625

2626 2627
  // next group info data
  pInfo->binfo.pRes->info.rows += numOfRows;
L
Liu Jicong 已提交
2628
  return (pInfo->binfo.pRes->info.rows > 0) ? pInfo->binfo.pRes : NULL;
2629
}
2630

L
Liu Jicong 已提交
2631 2632
SSDataBlock* getSortedMergeBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity,
                                     SArray* pColMatchInfo, SSortedMergeOperatorInfo* pInfo) {
2633 2634 2635 2636 2637 2638 2639 2640 2641 2642
  blockDataCleanup(pDataBlock);

  SSDataBlock* p = tsortGetSortedDataBlock(pHandle);
  if (p == NULL) {
    return NULL;
  }

  blockDataEnsureCapacity(p, capacity);

  while (1) {
2643
    STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
2644 2645 2646 2647
    if (pTupleHandle == NULL) {
      break;
    }

2648
    appendOneRowToDataBlock(p, pTupleHandle);
2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661
    if (p->info.rows >= capacity) {
      break;
    }
  }

  if (p->info.rows > 0) {
    int32_t numOfCols = taosArrayGetSize(pColMatchInfo);
    for (int32_t i = 0; i < numOfCols; ++i) {
      SColMatchInfo* pmInfo = taosArrayGet(pColMatchInfo, i);
      ASSERT(pmInfo->matchType == COL_MATCH_FROM_SLOT_ID);

      SColumnInfoData* pSrc = taosArrayGet(p->pDataBlock, pmInfo->srcSlotId);
      SColumnInfoData* pDst = taosArrayGet(pDataBlock->pDataBlock, pmInfo->targetSlotId);
2662
      colDataAssign(pDst, pSrc, p->info.rows, &pDataBlock->info);
2663 2664 2665 2666 2667 2668 2669 2670 2671 2672
    }

    pDataBlock->info.rows = p->info.rows;
    pDataBlock->info.capacity = p->info.rows;
  }

  blockDataDestroy(p);
  return (pDataBlock->info.rows > 0) ? pDataBlock : NULL;
}

2673
static SSDataBlock* doSortedMerge(SOperatorInfo* pOperator) {
2674 2675
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
2676 2677
  }

L
Liu Jicong 已提交
2678
  SExecTaskInfo*            pTaskInfo = pOperator->pTaskInfo;
2679
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
H
Haojun Liao 已提交
2680
  if (pOperator->status == OP_RES_TO_RETURN) {
2681
    return getSortedMergeBlockData(pInfo->pSortHandle, pInfo->binfo.pRes, pOperator->resultInfo.capacity, NULL, pInfo);
2682 2683
  }

2684
  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
L
Liu Jicong 已提交
2685 2686
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->binfo.pRes, "GET_TASKID(pTaskInfo)");
H
Haojun Liao 已提交
2687

2688
  tsortSetFetchRawDataFp(pInfo->pSortHandle, loadNextDataBlock, NULL, NULL);
2689

L
Liu Jicong 已提交
2690
  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
wmmhello's avatar
wmmhello 已提交
2691
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
H
Haojun Liao 已提交
2692
    ps->param = pOperator->pDownstream[i];
H
Haojun Liao 已提交
2693
    tsortAddSource(pInfo->pSortHandle, ps);
2694 2695
  }

H
Haojun Liao 已提交
2696
  int32_t code = tsortOpen(pInfo->pSortHandle);
2697
  if (code != TSDB_CODE_SUCCESS) {
2698
    longjmp(pTaskInfo->env, terrno);
2699 2700
  }

H
Haojun Liao 已提交
2701
  pOperator->status = OP_RES_TO_RETURN;
2702
  return doMerge(pOperator);
2703
}
2704

L
Liu Jicong 已提交
2705 2706
static int32_t initGroupCol(SExprInfo* pExprInfo, int32_t numOfCols, SArray* pGroupInfo,
                            SSortedMergeOperatorInfo* pInfo) {
2707 2708
  if (pGroupInfo == NULL || taosArrayGetSize(pGroupInfo) == 0) {
    return 0;
H
Haojun Liao 已提交
2709 2710
  }

2711 2712 2713 2714 2715 2716 2717 2718
  int32_t len = 0;
  SArray* plist = taosArrayInit(3, sizeof(SColumn));
  pInfo->groupInfo = taosArrayInit(3, sizeof(int32_t));

  if (plist == NULL || pInfo->groupInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

L
Liu Jicong 已提交
2719 2720
  size_t numOfGroupCol = taosArrayGetSize(pInfo->groupInfo);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
2721
    SColumn* pCol = taosArrayGet(pGroupInfo, i);
L
Liu Jicong 已提交
2722
    for (int32_t j = 0; j < numOfCols; ++j) {
H
Haojun Liao 已提交
2723
      SExprInfo* pe = &pExprInfo[j];
2724
      if (pe->base.resSchema.slotId == pCol->colId) {
2725 2726
        taosArrayPush(plist, pCol);
        taosArrayPush(pInfo->groupInfo, &j);
H
Haojun Liao 已提交
2727
        len += pCol->bytes;
2728 2729
        break;
      }
H
Haojun Liao 已提交
2730 2731 2732
    }
  }

2733
  ASSERT(taosArrayGetSize(pGroupInfo) == taosArrayGetSize(plist));
H
Haojun Liao 已提交
2734

wafwerar's avatar
wafwerar 已提交
2735
  pInfo->groupVal = taosMemoryCalloc(1, (POINTER_BYTES * numOfGroupCol + len));
2736 2737 2738 2739
  if (pInfo->groupVal == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }
H
Haojun Liao 已提交
2740

2741
  int32_t offset = 0;
L
Liu Jicong 已提交
2742 2743
  char*   start = (char*)(pInfo->groupVal + (POINTER_BYTES * numOfGroupCol));
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
2744 2745
    pInfo->groupVal[i] = start + offset;
    SColumn* pCol = taosArrayGet(plist, i);
H
Haojun Liao 已提交
2746
    offset += pCol->bytes;
2747
  }
H
Haojun Liao 已提交
2748

2749
  taosArrayDestroy(plist);
H
Haojun Liao 已提交
2750

2751 2752
  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2753

L
Liu Jicong 已提交
2754 2755 2756
SOperatorInfo* createSortedMergeOperatorInfo(SOperatorInfo** downstream, int32_t numOfDownstream, SExprInfo* pExprInfo,
                                             int32_t num, SArray* pSortInfo, SArray* pGroupInfo,
                                             SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
2757
  SSortedMergeOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SSortedMergeOperatorInfo));
L
Liu Jicong 已提交
2758
  SOperatorInfo*            pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
2759
  if (pInfo == NULL || pOperator == NULL) {
2760
    goto _error;
2761
  }
H
Haojun Liao 已提交
2762

2763 2764 2765 2766 2767
  int32_t code = initExprSupp(&pOperator->exprSupp, pExprInfo, num);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

2768
  initResultRowInfo(&pInfo->binfo.resultRowInfo);
H
Haojun Liao 已提交
2769

2770
  if (pOperator->exprSupp.pCtx == NULL || pInfo->binfo.pRes == NULL) {
2771 2772
    goto _error;
  }
H
Haojun Liao 已提交
2773

2774
  size_t keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
2775
  code = doInitAggInfoSup(&pInfo->aggSup, pOperator->exprSupp.pCtx, num, keyBufSize, pTaskInfo->id.str);
2776 2777 2778
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
H
Haojun Liao 已提交
2779

2780
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, num);
H
Haojun Liao 已提交
2781
  code = initGroupCol(pExprInfo, num, pGroupInfo, pInfo);
2782 2783 2784
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
H
Haojun Liao 已提交
2785

L
Liu Jicong 已提交
2786 2787 2788 2789 2790
  //  pInfo->resultRowFactor = (int32_t)(getRowNumForMultioutput(pRuntimeEnv->pQueryAttr,
  //      pRuntimeEnv->pQueryAttr->topBotQuery, false));
  pInfo->sortBufSize = 1024 * 16;  // 1MB
  pInfo->bufPageSize = 1024;
  pInfo->pSortInfo = pSortInfo;
H
Haojun Liao 已提交
2791

2792
  pOperator->resultInfo.capacity = blockDataGetCapacityInRow(pInfo->binfo.pRes, pInfo->bufPageSize);
H
Haojun Liao 已提交
2793

L
Liu Jicong 已提交
2794
  pOperator->name = "SortedMerge";
X
Xiaoyu Wang 已提交
2795
  // pOperator->operatorType = OP_SortedMerge;
2796 2797 2798
  pOperator->blocking = true;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
L
Liu Jicong 已提交
2799
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
2800

2801 2802
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doSortedMerge, NULL, NULL, destroySortedMergeOperatorInfo,
                                         NULL, NULL, NULL);
2803 2804 2805
  code = appendDownstream(pOperator, downstream, numOfDownstream);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
2806
  }
H
Haojun Liao 已提交
2807

2808
  return pOperator;
H
Haojun Liao 已提交
2809

L
Liu Jicong 已提交
2810
_error:
2811
  if (pInfo != NULL) {
H
Haojun Liao 已提交
2812
    destroySortedMergeOperatorInfo(pInfo, num);
H
Haojun Liao 已提交
2813 2814
  }

wafwerar's avatar
wafwerar 已提交
2815 2816
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
2817 2818
  terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
  return NULL;
H
Haojun Liao 已提交
2819 2820
}

X
Xiaoyu Wang 已提交
2821
int32_t getTableScanInfo(SOperatorInfo* pOperator, int32_t* order, int32_t* scanFlag) {
2822
  // todo add more information about exchange operation
2823
  int32_t type = pOperator->operatorType;
X
Xiaoyu Wang 已提交
2824
  if (type == QUERY_NODE_PHYSICAL_PLAN_EXCHANGE || type == QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN ||
2825
      type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN ||
2826
      type == QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN) {
2827 2828 2829
    *order = TSDB_ORDER_ASC;
    *scanFlag = MAIN_SCAN;
    return TSDB_CODE_SUCCESS;
2830
  } else if (type == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
2831 2832 2833 2834 2835
    STableScanInfo* pTableScanInfo = pOperator->info;
    *order = pTableScanInfo->cond.order;
    *scanFlag = pTableScanInfo->scanFlag;
    return TSDB_CODE_SUCCESS;
  } else {
H
Haojun Liao 已提交
2836
    if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
2837
      return TSDB_CODE_INVALID_PARA;
H
Haojun Liao 已提交
2838
    } else {
2839
      return getTableScanInfo(pOperator->pDownstream[0], order, scanFlag);
2840 2841 2842
    }
  }
}
2843

L
Liu Jicong 已提交
2844
int32_t doPrepareScan(SOperatorInfo* pOperator, uint64_t uid, int64_t ts) {
L
Liu Jicong 已提交
2845
  uint8_t type = pOperator->operatorType;
2846 2847 2848

  pOperator->status = OP_OPENED;

L
Liu Jicong 已提交
2849
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
2850
    SStreamScanInfo* pScanInfo = pOperator->info;
L
Liu Jicong 已提交
2851
    pScanInfo->blockType = STREAM_INPUT__TABLE_SCAN;
2852

2853
    pScanInfo->pTableScanOp->status = OP_OPENED;
2854

2855
    STableScanInfo* pInfo = pScanInfo->pTableScanOp->info;
2856 2857
    ASSERT(pInfo->scanMode == TABLE_SCAN__TABLE_ORDER);

L
Liu Jicong 已提交
2858 2859 2860 2861
    if (uid == 0) {
      pInfo->noTable = 1;
      return TSDB_CODE_SUCCESS;
    }
2862 2863 2864 2865 2866 2867

    /*if (pSnapShotScanInfo->dataReader == NULL) {*/
    /*pSnapShotScanInfo->dataReader = tsdbReaderOpen(pHandle->vnode, &pSTInfo->cond, tableList, 0, 0);*/
    /*pSnapShotScanInfo->scanMode = TABLE_SCAN__TABLE_ORDER;*/
    /*}*/

L
Liu Jicong 已提交
2868 2869
    pInfo->noTable = 0;

2870
    if (pInfo->lastStatus.uid != uid || pInfo->lastStatus.ts != ts) {
L
Liu Jicong 已提交
2871 2872 2873 2874 2875 2876 2877 2878 2879 2880 2881
      SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

      int32_t tableSz = taosArrayGetSize(pTaskInfo->tableqinfoList.pTableList);
      bool    found = false;
      for (int32_t i = 0; i < tableSz; i++) {
        STableKeyInfo* pTableInfo = taosArrayGet(pTaskInfo->tableqinfoList.pTableList, i);
        if (pTableInfo->uid == uid) {
          found = true;
          pInfo->currentTable = i;
        }
      }
2882
      // TODO after processing drop, found can be false
L
Liu Jicong 已提交
2883
      ASSERT(found);
2884 2885 2886 2887

      tsdbSetTableId(pInfo->dataReader, uid);
      int64_t oldSkey = pInfo->cond.twindows[0].skey;
      pInfo->cond.twindows[0].skey = ts + 1;
H
Haojun Liao 已提交
2888
      tsdbReaderReset(pInfo->dataReader, &pInfo->cond, 0);
2889 2890 2891 2892
      pInfo->cond.twindows[0].skey = oldSkey;
      pInfo->scanTimes = 0;
      pInfo->curTWinIdx = 0;

L
Liu Jicong 已提交
2893 2894
      qDebug("tsdb reader offset seek to uid %ld ts %ld, table cur set to %d , all table num %d", uid, ts,
             pInfo->currentTable, tableSz);
L
Liu Jicong 已提交
2895
    }
L
Liu Jicong 已提交
2896

L
Liu Jicong 已提交
2897
    return TSDB_CODE_SUCCESS;
2898

L
Liu Jicong 已提交
2899
  } else {
2900 2901 2902 2903 2904
    if (pOperator->numOfDownstream == 1) {
      return doPrepareScan(pOperator->pDownstream[0], uid, ts);
    } else if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator to set the input data block");
      return TSDB_CODE_QRY_APP_ERROR;
L
Liu Jicong 已提交
2905
    } else {
2906 2907
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
L
Liu Jicong 已提交
2908 2909 2910 2911
    }
  }
}

2912 2913 2914
int32_t doGetScanStatus(SOperatorInfo* pOperator, uint64_t* uid, int64_t* ts) {
  int32_t type = pOperator->operatorType;
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
2915 2916
    SStreamScanInfo* pScanInfo = pOperator->info;
    STableScanInfo*  pSnapShotScanInfo = pScanInfo->pTableScanOp->info;
L
Liu Jicong 已提交
2917 2918
    *uid = pSnapShotScanInfo->lastStatus.uid;
    *ts = pSnapShotScanInfo->lastStatus.ts;
2919 2920 2921 2922 2923 2924 2925 2926 2927 2928 2929
  } else {
    if (pOperator->pDownstream[0] == NULL) {
      return TSDB_CODE_INVALID_PARA;
    } else {
      doGetScanStatus(pOperator->pDownstream[0], uid, ts);
    }
  }

  return TSDB_CODE_SUCCESS;
}

2930
// this is a blocking operator
L
Liu Jicong 已提交
2931
static int32_t doOpenAggregateOptr(SOperatorInfo* pOperator) {
H
Haojun Liao 已提交
2932 2933
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
2934 2935
  }

H
Haojun Liao 已提交
2936
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
2937
  SAggOperatorInfo* pAggInfo = pOperator->info;
H
Haojun Liao 已提交
2938

2939 2940
  SExprSupp*     pSup = &pOperator->exprSupp;
  SOperatorInfo* downstream = pOperator->pDownstream[0];
2941

2942 2943
  int64_t st = taosGetTimestampUs();

2944 2945 2946
  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;

H
Haojun Liao 已提交
2947
  while (1) {
2948
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
2949 2950 2951 2952
    if (pBlock == NULL) {
      break;
    }

2953 2954 2955 2956
    int32_t code = getTableScanInfo(pOperator, &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
2957

2958
    // there is an scalar expression that needs to be calculated before apply the group aggregation.
2959 2960 2961
    if (pAggInfo->scalarExprSup.pExprInfo != NULL) {
      SExprSupp* pSup1 = &pAggInfo->scalarExprSup;
      code = projectApplyFunctions(pSup1->pExprInfo, pBlock, pBlock, pSup1->pCtx, pSup1->numOfExprs, NULL);
2962
      if (code != TSDB_CODE_SUCCESS) {
2963
        longjmp(pTaskInfo->env, code);
2964
      }
2965 2966
    }

2967
    // the pDataBlock are always the same one, no need to call this again
2968 2969 2970
    setExecutionContext(pOperator, pOperator->exprSupp.numOfExprs, pBlock->info.groupId, pAggInfo);
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, true);
    code = doAggregateImpl(pOperator, 0, pSup->pCtx);
2971 2972 2973
    if (code != 0) {
      longjmp(pTaskInfo->env, code);
    }
2974

dengyihao's avatar
dengyihao 已提交
2975
#if 0  // test for encode/decode result info
2976
    if(pOperator->fpSet.encodeResultRow){
2977 2978
      char *result = NULL;
      int32_t length = 0;
2979 2980
      pOperator->fpSet.encodeResultRow(pOperator, &result, &length);
      SAggSupporter* pSup = &pAggInfo->aggSup;
2981 2982
      taosHashClear(pSup->pResultRowHashTable);
      pInfo->resultRowInfo.size = 0;
2983
      pOperator->fpSet.decodeResultRow(pOperator, result);
2984 2985 2986
      if(result){
        taosMemoryFree(result);
      }
2987
    }
2988
#endif
2989 2990
  }

H
Haojun Liao 已提交
2991
  closeAllResultRows(&pAggInfo->binfo.resultRowInfo);
2992
  initGroupedResultInfo(&pAggInfo->groupResInfo, pAggInfo->aggSup.pResultRowHashTable, 0);
H
Haojun Liao 已提交
2993
  OPTR_SET_OPENED(pOperator);
2994

2995
  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
H
Haojun Liao 已提交
2996 2997 2998
  return TSDB_CODE_SUCCESS;
}

2999
static SSDataBlock* getAggregateResult(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
3000
  SAggOperatorInfo* pAggInfo = pOperator->info;
H
Haojun Liao 已提交
3001 3002 3003 3004 3005 3006
  SOptrBasicInfo*   pInfo = &pAggInfo->binfo;

  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

L
Liu Jicong 已提交
3007
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
3008
  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
H
Haojun Liao 已提交
3009
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
3010
    doSetOperatorCompleted(pOperator);
H
Haojun Liao 已提交
3011 3012 3013
    return NULL;
  }

H
Haojun Liao 已提交
3014
  blockDataEnsureCapacity(pInfo->pRes, pOperator->resultInfo.capacity);
S
slzhou 已提交
3015 3016 3017 3018 3019 3020 3021 3022
  while (1) {
    doBuildResultDatablock(pOperator, pInfo, &pAggInfo->groupResInfo, pAggInfo->aggSup.pResultBuf);
    doFilter(pAggInfo->pCondition, pInfo->pRes);

    if (!hasDataInGroupInfo(&pAggInfo->groupResInfo)) {
      doSetOperatorCompleted(pOperator);
      break;
    }
3023

S
slzhou 已提交
3024 3025 3026 3027
    if (pInfo->pRes->info.rows > 0) {
      break;
    }
  }
3028
  size_t rows = blockDataGetNumOfRows(pInfo->pRes);
3029 3030
  pOperator->resultInfo.totalRows += rows;

3031
  return (rows == 0) ? NULL : pInfo->pRes;
3032 3033
}

wmmhello's avatar
wmmhello 已提交
3034
int32_t aggEncodeResultRow(SOperatorInfo* pOperator, char** result, int32_t* length) {
3035
  if (result == NULL || length == NULL) {
wmmhello's avatar
wmmhello 已提交
3036 3037 3038
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
3039 3040 3041 3042 3043
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
  int32_t         size = taosHashGetSize(pSup->pResultRowHashTable);
  size_t          keyLen = sizeof(uint64_t) * 2;  // estimate the key length
  int32_t         totalSize =
      sizeof(int32_t) + sizeof(int32_t) + size * (sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize);
wmmhello's avatar
wmmhello 已提交
3044

C
Cary Xu 已提交
3045 3046 3047 3048 3049 3050
  // no result
  if (getTotalBufSize(pSup->pResultBuf) == 0) {
    *result = NULL;
    *length = 0;
    return TSDB_CODE_SUCCESS;
  }
3051

wmmhello's avatar
wmmhello 已提交
3052
  *result = (char*)taosMemoryCalloc(1, totalSize);
L
Liu Jicong 已提交
3053
  if (*result == NULL) {
wmmhello's avatar
wmmhello 已提交
3054
    return TSDB_CODE_OUT_OF_MEMORY;
wmmhello's avatar
wmmhello 已提交
3055
  }
wmmhello's avatar
wmmhello 已提交
3056

wmmhello's avatar
wmmhello 已提交
3057
  int32_t offset = sizeof(int32_t);
wmmhello's avatar
wmmhello 已提交
3058 3059
  *(int32_t*)(*result + offset) = size;
  offset += sizeof(int32_t);
3060 3061

  // prepare memory
3062
  SResultRowPosition* pos = &pInfo->resultRowInfo.cur;
dengyihao's avatar
dengyihao 已提交
3063 3064
  void*               pPage = getBufPage(pSup->pResultBuf, pos->pageId);
  SResultRow*         pRow = (SResultRow*)((char*)pPage + pos->offset);
3065 3066 3067
  setBufPageDirty(pPage, true);
  releaseBufPage(pSup->pResultBuf, pPage);

dengyihao's avatar
dengyihao 已提交
3068
  void* pIter = taosHashIterate(pSup->pResultRowHashTable, NULL);
wmmhello's avatar
wmmhello 已提交
3069
  while (pIter) {
dengyihao's avatar
dengyihao 已提交
3070
    void*               key = taosHashGetKey(pIter, &keyLen);
3071
    SResultRowPosition* p1 = (SResultRowPosition*)pIter;
3072

dengyihao's avatar
dengyihao 已提交
3073
    pPage = (SFilePage*)getBufPage(pSup->pResultBuf, p1->pageId);
3074
    pRow = (SResultRow*)((char*)pPage + p1->offset);
3075 3076
    setBufPageDirty(pPage, true);
    releaseBufPage(pSup->pResultBuf, pPage);
wmmhello's avatar
wmmhello 已提交
3077 3078 3079

    // recalculate the result size
    int32_t realTotalSize = offset + sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize;
L
Liu Jicong 已提交
3080
    if (realTotalSize > totalSize) {
wmmhello's avatar
wmmhello 已提交
3081
      char* tmp = (char*)taosMemoryRealloc(*result, realTotalSize);
L
Liu Jicong 已提交
3082
      if (tmp == NULL) {
wafwerar's avatar
wafwerar 已提交
3083
        taosMemoryFree(*result);
wmmhello's avatar
wmmhello 已提交
3084
        *result = NULL;
wmmhello's avatar
wmmhello 已提交
3085
        return TSDB_CODE_OUT_OF_MEMORY;
L
Liu Jicong 已提交
3086
      } else {
wmmhello's avatar
wmmhello 已提交
3087 3088 3089 3090 3091 3092 3093 3094 3095 3096 3097 3098
        *result = tmp;
      }
    }
    // save key
    *(int32_t*)(*result + offset) = keyLen;
    offset += sizeof(int32_t);
    memcpy(*result + offset, key, keyLen);
    offset += keyLen;

    // save value
    *(int32_t*)(*result + offset) = pSup->resultRowSize;
    offset += sizeof(int32_t);
3099
    memcpy(*result + offset, pRow, pSup->resultRowSize);
wmmhello's avatar
wmmhello 已提交
3100 3101 3102 3103 3104
    offset += pSup->resultRowSize;

    pIter = taosHashIterate(pSup->pResultRowHashTable, pIter);
  }

wmmhello's avatar
wmmhello 已提交
3105 3106 3107 3108
  *(int32_t*)(*result) = offset;
  *length = offset;

  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
3109 3110
}

3111
int32_t aggDecodeResultRow(SOperatorInfo* pOperator, char* result) {
3112
  if (result == NULL) {
wmmhello's avatar
wmmhello 已提交
3113
    return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3114
  }
wmmhello's avatar
wmmhello 已提交
3115
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
3116
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
wmmhello's avatar
wmmhello 已提交
3117 3118

  //  int32_t size = taosHashGetSize(pSup->pResultRowHashTable);
3119
  int32_t length = *(int32_t*)(result);
wmmhello's avatar
wmmhello 已提交
3120
  int32_t offset = sizeof(int32_t);
3121 3122 3123 3124

  int32_t count = *(int32_t*)(result + offset);
  offset += sizeof(int32_t);

L
Liu Jicong 已提交
3125
  while (count-- > 0 && length > offset) {
wmmhello's avatar
wmmhello 已提交
3126 3127 3128
    int32_t keyLen = *(int32_t*)(result + offset);
    offset += sizeof(int32_t);

L
Liu Jicong 已提交
3129
    uint64_t    tableGroupId = *(uint64_t*)(result + offset);
3130
    SResultRow* resultRow = getNewResultRow(pSup->pResultBuf, tableGroupId, pSup->resultRowSize);
L
Liu Jicong 已提交
3131
    if (!resultRow) {
wmmhello's avatar
wmmhello 已提交
3132
      return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3133
    }
3134

wmmhello's avatar
wmmhello 已提交
3135
    // add a new result set for a new group
3136 3137
    SResultRowPosition pos = {.pageId = resultRow->pageId, .offset = resultRow->offset};
    taosHashPut(pSup->pResultRowHashTable, result + offset, keyLen, &pos, sizeof(SResultRowPosition));
wmmhello's avatar
wmmhello 已提交
3138 3139 3140

    offset += keyLen;
    int32_t valueLen = *(int32_t*)(result + offset);
L
Liu Jicong 已提交
3141
    if (valueLen != pSup->resultRowSize) {
wmmhello's avatar
wmmhello 已提交
3142
      return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3143 3144 3145 3146 3147 3148 3149 3150 3151 3152
    }
    offset += sizeof(int32_t);
    int32_t pageId = resultRow->pageId;
    int32_t pOffset = resultRow->offset;
    memcpy(resultRow, result + offset, valueLen);
    resultRow->pageId = pageId;
    resultRow->offset = pOffset;
    offset += valueLen;

    initResultRow(resultRow);
dengyihao's avatar
dengyihao 已提交
3153
    pInfo->resultRowInfo.cur = (SResultRowPosition){.pageId = resultRow->pageId, .offset = resultRow->offset};
wmmhello's avatar
wmmhello 已提交
3154 3155
  }

L
Liu Jicong 已提交
3156
  if (offset != length) {
wmmhello's avatar
wmmhello 已提交
3157
    return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3158
  }
wmmhello's avatar
wmmhello 已提交
3159
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
3160 3161
}

3162 3163
enum {
  PROJECT_RETRIEVE_CONTINUE = 0x1,
L
Liu Jicong 已提交
3164
  PROJECT_RETRIEVE_DONE = 0x2,
3165 3166 3167 3168 3169
};

static int32_t handleLimitOffset(SOperatorInfo* pOperator, SSDataBlock* pBlock) {
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
  SOptrBasicInfo*       pInfo = &pProjectInfo->binfo;
L
Liu Jicong 已提交
3170
  SSDataBlock*          pRes = pInfo->pRes;
3171 3172 3173 3174 3175 3176 3177 3178 3179 3180 3181 3182 3183 3184 3185 3186 3187 3188 3189 3190 3191 3192 3193 3194 3195 3196 3197 3198 3199 3200 3201 3202 3203 3204 3205 3206 3207 3208 3209 3210 3211 3212 3213 3214 3215 3216 3217 3218

  if (pProjectInfo->curSOffset > 0) {
    if (pProjectInfo->groupId == 0) {  // it is the first group
      pProjectInfo->groupId = pBlock->info.groupId;
      blockDataCleanup(pInfo->pRes);
      return PROJECT_RETRIEVE_CONTINUE;
    } else if (pProjectInfo->groupId != pBlock->info.groupId) {
      pProjectInfo->curSOffset -= 1;

      // ignore data block in current group
      if (pProjectInfo->curSOffset > 0) {
        blockDataCleanup(pInfo->pRes);
        return PROJECT_RETRIEVE_CONTINUE;
      }
    }

    // set current group id of the project operator
    pProjectInfo->groupId = pBlock->info.groupId;
  }

  if (pProjectInfo->groupId != 0 && pProjectInfo->groupId != pBlock->info.groupId) {
    pProjectInfo->curGroupOutput += 1;
    if ((pProjectInfo->slimit.limit > 0) && (pProjectInfo->slimit.limit <= pProjectInfo->curGroupOutput)) {
      pOperator->status = OP_EXEC_DONE;
      blockDataCleanup(pRes);

      return PROJECT_RETRIEVE_DONE;
    }

    // reset the value for a new group data
    pProjectInfo->curOffset = 0;
    pProjectInfo->curOutput = 0;
  }

  // here we reach the start position, according to the limit/offset requirements.

  // set current group id
  pProjectInfo->groupId = pBlock->info.groupId;

  if (pProjectInfo->curOffset >= pRes->info.rows) {
    pProjectInfo->curOffset -= pRes->info.rows;
    blockDataCleanup(pRes);
    return PROJECT_RETRIEVE_CONTINUE;
  } else if (pProjectInfo->curOffset < pRes->info.rows && pProjectInfo->curOffset > 0) {
    blockDataTrimFirstNRows(pRes, pProjectInfo->curOffset);
    pProjectInfo->curOffset = 0;
  }

3219
  // check for the limitation in each group
wmmhello's avatar
wmmhello 已提交
3220 3221 3222
  if (pProjectInfo->limit.limit >= 0 && pProjectInfo->curOutput + pRes->info.rows >= pProjectInfo->limit.limit) {
    int32_t keepRows = (int32_t)(pProjectInfo->limit.limit - pProjectInfo->curOutput);
    blockDataKeepFirstNRows(pRes, keepRows);
3223
    if (pProjectInfo->slimit.limit > 0 && pProjectInfo->slimit.limit <= pProjectInfo->curGroupOutput) {
3224 3225 3226
      pOperator->status = OP_EXEC_DONE;
    }

3227
    return PROJECT_RETRIEVE_DONE;
3228
  }
3229

3230
  // todo optimize performance
3231 3232
  // If there are slimit/soffset value exists, multi-round result can not be packed into one group, since the
  // they may not belong to the same group the limit/offset value is not valid in this case.
L
Liu Jicong 已提交
3233 3234
  if (pRes->info.rows >= pOperator->resultInfo.threshold || pProjectInfo->slimit.offset != -1 ||
      pProjectInfo->slimit.limit != -1) {
3235
    return PROJECT_RETRIEVE_DONE;
L
Liu Jicong 已提交
3236
  } else {  // not full enough, continue to accumulate the output data in the buffer.
3237 3238 3239 3240
    return PROJECT_RETRIEVE_CONTINUE;
  }
}

3241
static SSDataBlock* doProjectOperation(SOperatorInfo* pOperator) {
3242
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
L
Liu Jicong 已提交
3243
  SOptrBasicInfo*       pInfo = &pProjectInfo->binfo;
3244

L
Liu Jicong 已提交
3245
  SExprSupp*   pSup = &pOperator->exprSupp;
3246
  SSDataBlock* pRes = pInfo->pRes;
3247
  blockDataCleanup(pRes);
3248

3249
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
3250 3251 3252
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }
dengyihao's avatar
dengyihao 已提交
3253

H
Haojun Liao 已提交
3254
#if 0
3255 3256 3257 3258 3259
  if (pProjectInfo->existDataBlock) {  // TODO refactor
    SSDataBlock* pBlock = pProjectInfo->existDataBlock;
    pProjectInfo->existDataBlock = NULL;

    // the pDataBlock are always the same one, no need to call this again
H
Haojun Liao 已提交
3260
    setInputDataBlock(pOperator, pInfo->pCtx, pBlock, TSDB_ORDER_ASC);
3261

H
Haojun Liao 已提交
3262
    blockDataEnsureCapacity(pInfo->pRes, pBlock->info.rows);
3263
    projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
L
Liu Jicong 已提交
3264
    if (pRes->info.rows >= pProjectInfo->binfo.capacity * 0.8) {
3265 3266
      copyTsColoum(pRes, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      resetResultRowEntryResult(pInfo->pCtx, pOperator->exprSupp.numOfExprs);
3267 3268 3269
      return pRes;
    }
  }
H
Haojun Liao 已提交
3270
#endif
3271

3272
  int64_t st = 0;
3273 3274 3275
  int32_t order = 0;
  int32_t scanFlag = 0;

3276 3277 3278 3279
  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

H
Haojun Liao 已提交
3280 3281
  SOperatorInfo* downstream = pOperator->pDownstream[0];

L
Liu Jicong 已提交
3282
  while (1) {
H
Haojun Liao 已提交
3283
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
3284
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
3285
    if (pBlock == NULL) {
L
Liu Jicong 已提交
3286 3287
      // TODO optimize
      /*if (pTaskInfo->execModel != OPTR_EXEC_MODEL_STREAM) {*/
3288
      doSetOperatorCompleted(pOperator);
L
Liu Jicong 已提交
3289
      /*}*/
3290 3291
      break;
    }
3292 3293 3294 3295
    if (pBlock->info.type == STREAM_RETRIEVE) {
      // for stream interval
      return pBlock;
    }
3296 3297

    // the pDataBlock are always the same one, no need to call this again
3298
    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &order, &scanFlag);
3299 3300 3301
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
3302

3303
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
3304 3305
    blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

3306
    code = projectApplyFunctions(pSup->pExprInfo, pInfo->pRes, pBlock, pSup->pCtx, pSup->numOfExprs,
X
Xiaoyu Wang 已提交
3307
                                 pProjectInfo->pPseudoColInfo);
3308 3309
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
3310 3311
    }

3312
    int32_t status = handleLimitOffset(pOperator, pBlock);
3313 3314 3315 3316

    // filter shall be applied after apply functions and limit/offset on the result
    doFilter(pProjectInfo->pFilterNode, pInfo->pRes);

3317
    if (status == PROJECT_RETRIEVE_CONTINUE) {
H
Haojun Liao 已提交
3318
      continue;
L
Liu Jicong 已提交
3319
    } else if (status == PROJECT_RETRIEVE_DONE) {
3320 3321 3322
      break;
    }
  }
dengyihao's avatar
dengyihao 已提交
3323

H
Haojun Liao 已提交
3324
  pProjectInfo->curOutput += pInfo->pRes->info.rows;
H
Haojun Liao 已提交
3325

3326 3327 3328 3329
  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
3330
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
3331 3332
  }

3333
  return (rows > 0) ? pInfo->pRes : NULL;
3334 3335
}

L
Liu Jicong 已提交
3336 3337
static void doHandleRemainBlockForNewGroupImpl(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo, bool* newgroup,
                                               SExecTaskInfo* pTaskInfo) {
3338
  pInfo->totalInputRows = pInfo->existNewGroupBlock->info.rows;
H
Haojun Liao 已提交
3339

L
Liu Jicong 已提交
3340 3341
  int64_t ekey = Q_STATUS_EQUAL(pTaskInfo->status, TASK_COMPLETED) ? pTaskInfo->window.ekey
                                                                   : pInfo->existNewGroupBlock->info.window.ekey;
3342 3343
  taosResetFillInfo(pInfo->pFillInfo, getFillInfoStart(pInfo->pFillInfo));

3344
  taosFillSetStartInfo(pInfo->pFillInfo, pInfo->existNewGroupBlock->info.rows, ekey);
3345 3346
  taosFillSetInputDataBlock(pInfo->pFillInfo, pInfo->existNewGroupBlock);

3347
  doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pInfo->pRes, pResultInfo->capacity);
3348 3349 3350 3351
  pInfo->existNewGroupBlock = NULL;
  *newgroup = true;
}

L
Liu Jicong 已提交
3352 3353
static void doHandleRemainBlockFromNewGroup(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo, bool* newgroup,
                                            SExecTaskInfo* pTaskInfo) {
3354 3355
  if (taosFillHasMoreResults(pInfo->pFillInfo)) {
    *newgroup = false;
3356
    doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pInfo->pRes, (int32_t)pResultInfo->capacity);
H
Haojun Liao 已提交
3357
    if (pInfo->pRes->info.rows > pResultInfo->threshold || (!pInfo->multigroupResult)) {
3358 3359 3360 3361 3362 3363
      return;
    }
  }

  // handle the cached new group data block
  if (pInfo->existNewGroupBlock) {
3364
    doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, newgroup, pTaskInfo);
3365 3366 3367
  }
}

3368
static SSDataBlock* doFill(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
3369 3370
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;
3371

H
Haojun Liao 已提交
3372
  SResultInfo* pResultInfo = &pOperator->resultInfo;
3373 3374 3375
  SSDataBlock* pResBlock = pInfo->pRes;

  blockDataCleanup(pResBlock);
3376 3377 3378 3379
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

3380
  // todo handle different group data interpolation
X
Xiaoyu Wang 已提交
3381 3382
  bool  n = false;
  bool* newgroup = &n;
3383
  doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, newgroup, pTaskInfo);
3384 3385
  if (pResBlock->info.rows > pResultInfo->threshold || (!pInfo->multigroupResult && pResBlock->info.rows > 0)) {
    return pResBlock;
H
Haojun Liao 已提交
3386
  }
3387

H
Haojun Liao 已提交
3388
  SOperatorInfo* pDownstream = pOperator->pDownstream[0];
L
Liu Jicong 已提交
3389
  while (1) {
3390
    SSDataBlock* pBlock = pDownstream->fpSet.getNextFn(pDownstream);
3391 3392 3393 3394 3395 3396 3397 3398 3399 3400
    if (*newgroup) {
      assert(pBlock != NULL);
    }

    if (*newgroup && pInfo->totalInputRows > 0) {  // there are already processed current group data block
      pInfo->existNewGroupBlock = pBlock;
      *newgroup = false;

      // Fill the previous group data block, before handle the data block of new group.
      // Close the fill operation for previous group data block
3401
      taosFillSetStartInfo(pInfo->pFillInfo, 0, pTaskInfo->window.ekey);
3402 3403 3404 3405 3406 3407 3408
    } else {
      if (pBlock == NULL) {
        if (pInfo->totalInputRows == 0) {
          pOperator->status = OP_EXEC_DONE;
          return NULL;
        }

3409
        taosFillSetStartInfo(pInfo->pFillInfo, 0, pTaskInfo->window.ekey);
3410 3411 3412 3413 3414 3415 3416
      } else {
        pInfo->totalInputRows += pBlock->info.rows;
        taosFillSetStartInfo(pInfo->pFillInfo, pBlock->info.rows, pBlock->info.window.ekey);
        taosFillSetInputDataBlock(pInfo->pFillInfo, pBlock);
      }
    }

3417 3418
    blockDataEnsureCapacity(pResBlock, pOperator->resultInfo.capacity);
    doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pResBlock, pOperator->resultInfo.capacity);
3419 3420

    // current group has no more result to return
3421
    if (pResBlock->info.rows > 0) {
3422 3423
      // 1. The result in current group not reach the threshold of output result, continue
      // 2. If multiple group results existing in one SSDataBlock is not allowed, return immediately
3424 3425
      if (pResBlock->info.rows > pResultInfo->threshold || pBlock == NULL || (!pInfo->multigroupResult)) {
        return pResBlock;
3426 3427
      }

3428
      doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, newgroup, pTaskInfo);
3429 3430
      if (pResBlock->info.rows > pOperator->resultInfo.threshold || pBlock == NULL) {
        return pResBlock;
3431 3432 3433
      }
    } else if (pInfo->existNewGroupBlock) {  // try next group
      assert(pBlock != NULL);
3434
      doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, newgroup, pTaskInfo);
3435 3436
      if (pResBlock->info.rows > pResultInfo->threshold) {
        return pResBlock;
3437 3438 3439 3440 3441 3442 3443
      }
    } else {
      return NULL;
    }
  }
}

H
Haojun Liao 已提交
3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454
static void destroyExprInfo(SExprInfo* pExpr, int32_t numOfExprs) {
  for (int32_t i = 0; i < numOfExprs; ++i) {
    SExprInfo* pExprInfo = &pExpr[i];
    if (pExprInfo->pExpr->nodeType == QUERY_NODE_COLUMN) {
      taosMemoryFree(pExprInfo->base.pParam[0].pCol);
    }
    taosMemoryFree(pExprInfo->base.pParam);
    taosMemoryFree(pExprInfo->pExpr);
  }
}

3455 3456 3457 3458 3459
static void destroyOperatorInfo(SOperatorInfo* pOperator) {
  if (pOperator == NULL) {
    return;
  }

3460
  if (pOperator->fpSet.closeFn != NULL) {
3461
    pOperator->fpSet.closeFn(pOperator->info, pOperator->exprSupp.numOfExprs);
3462 3463
  }

H
Haojun Liao 已提交
3464
  if (pOperator->pDownstream != NULL) {
L
Liu Jicong 已提交
3465
    for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
H
Haojun Liao 已提交
3466
      destroyOperatorInfo(pOperator->pDownstream[i]);
3467 3468
    }

wafwerar's avatar
wafwerar 已提交
3469
    taosMemoryFreeClear(pOperator->pDownstream);
H
Haojun Liao 已提交
3470
    pOperator->numOfDownstream = 0;
3471 3472
  }

3473 3474
  if (pOperator->exprSupp.pExprInfo != NULL) {
    destroyExprInfo(pOperator->exprSupp.pExprInfo, pOperator->exprSupp.numOfExprs);
H
Haojun Liao 已提交
3475 3476
  }

3477
  taosMemoryFreeClear(pOperator->exprSupp.pExprInfo);
wafwerar's avatar
wafwerar 已提交
3478 3479
  taosMemoryFreeClear(pOperator->info);
  taosMemoryFreeClear(pOperator);
3480 3481
}

3482 3483 3484 3485 3486 3487 3488 3489 3490 3491 3492 3493 3494 3495 3496
int32_t getBufferPgSize(int32_t rowSize, uint32_t* defaultPgsz, uint32_t* defaultBufsz) {
  *defaultPgsz = 4096;
  while (*defaultPgsz < rowSize * 4) {
    *defaultPgsz <<= 1u;
  }

  // at least four pages need to be in buffer
  *defaultBufsz = 4096 * 256;
  if ((*defaultBufsz) <= (*defaultPgsz)) {
    (*defaultBufsz) = (*defaultPgsz) * 4;
  }

  return 0;
}

dengyihao's avatar
dengyihao 已提交
3497 3498
int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                         const char* pKey) {
3499 3500
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);

dengyihao's avatar
dengyihao 已提交
3501 3502
  pAggSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pAggSup->keyBuf = taosMemoryCalloc(1, keyBufSize + POINTER_BYTES + sizeof(int64_t));
3503 3504
  pAggSup->pResultRowHashTable = taosHashInit(10, hashFn, true, HASH_NO_LOCK);

H
Haojun Liao 已提交
3505
  if (pAggSup->keyBuf == NULL || pAggSup->pResultRowHashTable == NULL) {
3506 3507 3508
    return TSDB_CODE_OUT_OF_MEMORY;
  }

dengyihao's avatar
dengyihao 已提交
3509
  uint32_t defaultPgsz = 0;
3510 3511
  uint32_t defaultBufsz = 0;
  getBufferPgSize(pAggSup->resultRowSize, &defaultPgsz, &defaultBufsz);
H
Haojun Liao 已提交
3512

3513
  int32_t code = createDiskbasedBuf(&pAggSup->pResultBuf, defaultPgsz, defaultBufsz, pKey, TD_TMP_DIR_PATH);
H
Haojun Liao 已提交
3514 3515 3516 3517
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

3518 3519 3520
  return TSDB_CODE_SUCCESS;
}

3521
void cleanupAggSup(SAggSupporter* pAggSup) {
wafwerar's avatar
wafwerar 已提交
3522
  taosMemoryFreeClear(pAggSup->keyBuf);
3523
  taosHashCleanup(pAggSup->pResultRowHashTable);
H
Haojun Liao 已提交
3524
  destroyDiskbasedBuf(pAggSup->pResultBuf);
3525 3526
}

L
Liu Jicong 已提交
3527 3528
int32_t initAggInfo(SExprSupp* pSup, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols, size_t keyBufSize,
                    const char* pkey) {
3529 3530 3531 3532 3533
  int32_t code = initExprSupp(pSup, pExprInfo, numOfCols);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

3534
  doInitAggInfoSup(pAggSup, pSup->pCtx, numOfCols, keyBufSize, pkey);
L
Liu Jicong 已提交
3535
  for (int32_t i = 0; i < numOfCols; ++i) {
3536
    pSup->pCtx[i].pBuf = pAggSup->pResultBuf;
3537 3538
  }

3539
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
3540 3541
}

3542
void initResultSizeInfo(SOperatorInfo* pOperator, int32_t numOfRows) {
wmmhello's avatar
wmmhello 已提交
3543
  ASSERT(numOfRows != 0);
3544 3545 3546 3547
  pOperator->resultInfo.capacity = numOfRows;
  pOperator->resultInfo.threshold = numOfRows * 0.75;

  if (pOperator->resultInfo.threshold == 0) {
wmmhello's avatar
wmmhello 已提交
3548
    pOperator->resultInfo.threshold = numOfRows;
3549 3550 3551
  }
}

3552 3553 3554 3555 3556
void initBasicInfo(SOptrBasicInfo* pInfo, SSDataBlock* pBlock) {
  pInfo->pRes = pBlock;
  initResultRowInfo(&pInfo->resultRowInfo);
}

3557
int32_t initExprSupp(SExprSupp* pSup, SExprInfo* pExprInfo, int32_t numOfExpr) {
3558 3559 3560 3561
  pSup->pExprInfo = pExprInfo;
  pSup->numOfExprs = numOfExpr;
  if (pSup->pExprInfo != NULL) {
    pSup->pCtx = createSqlFunctionCtx(pExprInfo, numOfExpr, &pSup->rowEntryInfoOffset);
3562 3563 3564
    if (pSup->pCtx == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
3565
  }
3566 3567

  return TSDB_CODE_SUCCESS;
3568 3569
}

L
Liu Jicong 已提交
3570
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
S
slzhou 已提交
3571
                                           SSDataBlock* pResultBlock, SNode* pCondition, SExprInfo* pScalarExprInfo,
wmmhello's avatar
wmmhello 已提交
3572
                                           int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3573
  SAggOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SAggOperatorInfo));
L
Liu Jicong 已提交
3574
  SOperatorInfo*    pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3575 3576 3577
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
H
Haojun Liao 已提交
3578

3579
  int32_t numOfRows = 1024;
dengyihao's avatar
dengyihao 已提交
3580
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3581 3582

  initResultSizeInfo(pOperator, numOfRows);
3583
  int32_t code = initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
L
Liu Jicong 已提交
3584
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3585 3586
    goto _error;
  }
H
Haojun Liao 已提交
3587

3588
  initBasicInfo(&pInfo->binfo, pResultBlock);
3589 3590 3591 3592
  code = initExprSupp(&pInfo->scalarExprSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3593

L
Liu Jicong 已提交
3594
  pInfo->groupId = INT32_MIN;
S
slzhou 已提交
3595
  pInfo->pCondition = pCondition;
dengyihao's avatar
dengyihao 已提交
3596
  pOperator->name = "TableAggregate";
3597
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_HASH_AGG;
3598
  pOperator->blocking = true;
dengyihao's avatar
dengyihao 已提交
3599 3600 3601
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3602

3603 3604
  pOperator->fpSet = createOperatorFpSet(doOpenAggregateOptr, getAggregateResult, NULL, NULL, destroyAggOperatorInfo,
                                         aggEncodeResultRow, aggDecodeResultRow, NULL);
H
Haojun Liao 已提交
3605 3606 3607 3608 3609

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3610 3611

  return pOperator;
L
Liu Jicong 已提交
3612
_error:
H
Haojun Liao 已提交
3613
  destroyAggOperatorInfo(pInfo, numOfCols);
wafwerar's avatar
wafwerar 已提交
3614 3615
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
H
Haojun Liao 已提交
3616 3617
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3618 3619
}

3620 3621 3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634 3635 3636 3637 3638
static void* destroySqlFunctionCtx(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  if (pCtx == NULL) {
    return NULL;
  }

  for (int32_t i = 0; i < numOfOutput; ++i) {
    for (int32_t j = 0; j < pCtx[i].numOfParams; ++j) {
      taosVariantDestroy(&pCtx[i].param[j].param);
    }

    taosMemoryFreeClear(pCtx[i].subsidiaries.pCtx);
    taosMemoryFree(pCtx[i].input.pData);
    taosMemoryFree(pCtx[i].input.pColumnDataAgg);
  }

  taosMemoryFreeClear(pCtx);
  return NULL;
}

3639
void cleanupBasicInfo(SOptrBasicInfo* pInfo) {
3640 3641
  assert(pInfo != NULL);
  cleanupResultRowInfo(&pInfo->resultRowInfo);
H
Haojun Liao 已提交
3642
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
3643 3644
}

H
Haojun Liao 已提交
3645
void destroyBasicOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3646
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)param;
3647
  cleanupBasicInfo(pInfo);
3648
}
H
Haojun Liao 已提交
3649 3650

void destroyAggOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3651
  SAggOperatorInfo* pInfo = (SAggOperatorInfo*)param;
3652
  cleanupBasicInfo(&pInfo->binfo);
3653
}
3654

H
Haojun Liao 已提交
3655
void destroySFillOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3656
  SFillOperatorInfo* pInfo = (SFillOperatorInfo*)param;
3657
  pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
H
Haojun Liao 已提交
3658
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
wafwerar's avatar
wafwerar 已提交
3659
  taosMemoryFreeClear(pInfo->p);
3660 3661
}

H
Haojun Liao 已提交
3662
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput) {
D
fix bug  
dapan 已提交
3663 3664 3665
  if (NULL == param) {
    return;
  }
L
Liu Jicong 已提交
3666
  SProjectOperatorInfo* pInfo = (SProjectOperatorInfo*)param;
3667
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3668
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3669
  taosArrayDestroy(pInfo->pPseudoColInfo);
3670 3671
}

3672
void cleanupExprSupp(SExprSupp* pSupp) {
3673 3674 3675 3676 3677 3678
  destroySqlFunctionCtx(pSupp->pCtx, pSupp->numOfExprs);
  destroyExprInfo(pSupp->pExprInfo, pSupp->numOfExprs);

  taosMemoryFree(pSupp->rowEntryInfoOffset);
}

H
Haojun Liao 已提交
3679
static void destroyIndefinitOperatorInfo(void* param, int32_t numOfOutput) {
3680
  SIndefOperatorInfo* pInfo = (SIndefOperatorInfo*)param;
3681
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3682 3683 3684

  taosArrayDestroy(pInfo->pPseudoColInfo);
  cleanupAggSup(&pInfo->aggSup);
3685
  cleanupExprSupp(&pInfo->scalarSup);
H
Haojun Liao 已提交
3686 3687
}

H
Haojun Liao 已提交
3688
void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3689
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3690 3691 3692 3693
  taosRemoveRef(exchangeObjRefPool, pExInfo->self);
}

void doDestroyExchangeOperatorInfo(void* param) {
X
Xiaoyu Wang 已提交
3694
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3695

H
Haojun Liao 已提交
3696 3697 3698 3699 3700 3701 3702 3703 3704
  taosArrayDestroy(pExInfo->pSources);
  taosArrayDestroy(pExInfo->pSourceDataInfo);
  if (pExInfo->pResult != NULL) {
    blockDataDestroy(pExInfo->pResult);
  }

  tsem_destroy(&pExInfo->ready);
}

H
Haojun Liao 已提交
3705 3706
static SArray* setRowTsColumnOutputInfo(SqlFunctionCtx* pCtx, int32_t numOfCols) {
  SArray* pList = taosArrayInit(4, sizeof(int32_t));
dengyihao's avatar
dengyihao 已提交
3707
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
3708 3709 3710 3711 3712 3713 3714 3715
    if (fmIsPseudoColumnFunc(pCtx[i].functionId)) {
      taosArrayPush(pList, &i);
    }
  }

  return pList;
}

3716 3717 3718 3719
static int64_t getLimit(SNode* pLimit) { return NULL == pLimit ? -1 : ((SLimitNode*)pLimit)->limit; }

static int64_t getOffset(SNode* pLimit) { return NULL == pLimit ? -1 : ((SLimitNode*)pLimit)->offset; }

L
Liu Jicong 已提交
3720
SOperatorInfo* createProjectOperatorInfo(SOperatorInfo* downstream, SProjectPhysiNode* pProjPhyNode,
dengyihao's avatar
dengyihao 已提交
3721
                                         SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3722
  SProjectOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SProjectOperatorInfo));
L
Liu Jicong 已提交
3723
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3724 3725 3726
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
3727

L
Liu Jicong 已提交
3728
  int32_t    numOfCols = 0;
3729 3730 3731
  SExprInfo* pExprInfo = createExprInfo(pProjPhyNode->pProjections, NULL, &numOfCols);

  SSDataBlock* pResBlock = createResDataBlock(pProjPhyNode->node.pOutputDataBlockDesc);
3732 3733
  SLimit       limit = {.limit = getLimit(pProjPhyNode->node.pLimit), .offset = getOffset(pProjPhyNode->node.pLimit)};
  SLimit slimit = {.limit = getLimit(pProjPhyNode->node.pSlimit), .offset = getOffset(pProjPhyNode->node.pSlimit)};
3734

L
Liu Jicong 已提交
3735 3736 3737 3738
  pInfo->limit = limit;
  pInfo->slimit = slimit;
  pInfo->curOffset = limit.offset;
  pInfo->curSOffset = slimit.offset;
H
Haojun Liao 已提交
3739
  pInfo->binfo.pRes = pResBlock;
3740
  pInfo->pFilterNode = pProjPhyNode->node.pConditions;
H
Haojun Liao 已提交
3741 3742

  int32_t numOfRows = 4096;
dengyihao's avatar
dengyihao 已提交
3743
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3744

3745 3746 3747 3748 3749
  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
3750
  initResultSizeInfo(pOperator, numOfRows);
3751

3752 3753
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);
3754
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfCols);
3755

3756
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pOperator->exprSupp.pCtx, numOfCols);
X
Xiaoyu Wang 已提交
3757
  pOperator->name = "ProjectOperator";
H
Haojun Liao 已提交
3758
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
X
Xiaoyu Wang 已提交
3759 3760 3761 3762
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
3763

L
Liu Jicong 已提交
3764 3765
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doProjectOperation, NULL, NULL,
                                         destroyProjectOperatorInfo, NULL, NULL, NULL);
L
Liu Jicong 已提交
3766

3767
  int32_t code = appendDownstream(pOperator, &downstream, 1);
H
Haojun Liao 已提交
3768
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3769 3770
    goto _error;
  }
3771 3772

  return pOperator;
H
Haojun Liao 已提交
3773

L
Liu Jicong 已提交
3774
_error:
H
Haojun Liao 已提交
3775 3776
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3777 3778
}

H
Haojun Liao 已提交
3779 3780
static SSDataBlock* doApplyIndefinitFunction(SOperatorInfo* pOperator) {
  SIndefOperatorInfo* pIndefInfo = pOperator->info;
3781
  SOptrBasicInfo*     pInfo = &pIndefInfo->binfo;
L
Liu Jicong 已提交
3782
  SExprSupp*          pSup = &pOperator->exprSupp;
H
Haojun Liao 已提交
3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801 3802 3803 3804 3805 3806 3807 3808 3809 3810 3811 3812 3813 3814 3815 3816

  SSDataBlock* pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  int64_t st = 0;
  int32_t order = 0;
  int32_t scanFlag = 0;

  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];

  while (1) {
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
    if (pBlock == NULL) {
      doSetOperatorCompleted(pOperator);
      break;
    }

    // the pDataBlock are always the same one, no need to call this again
    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    // there is an scalar expression that needs to be calculated before apply the group aggregation.
3817
    SExprSupp* pScalarSup = &pIndefInfo->scalarSup;
3818 3819
    if (pScalarSup->pExprInfo != NULL) {
      code = projectApplyFunctions(pScalarSup->pExprInfo, pBlock, pBlock, pScalarSup->pCtx, pScalarSup->numOfExprs,
L
Liu Jicong 已提交
3820
                                   pIndefInfo->pPseudoColInfo);
H
Haojun Liao 已提交
3821 3822 3823 3824 3825
      if (code != TSDB_CODE_SUCCESS) {
        longjmp(pTaskInfo->env, code);
      }
    }

3826
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
H
Haojun Liao 已提交
3827 3828
    blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

L
Liu Jicong 已提交
3829 3830
    code = projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pSup->pCtx,
                                 pOperator->exprSupp.numOfExprs, pIndefInfo->pPseudoColInfo);
H
Haojun Liao 已提交
3831 3832 3833 3834 3835 3836 3837 3838 3839 3840 3841 3842 3843 3844 3845
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
  }

  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
  }

  return (rows > 0) ? pInfo->pRes : NULL;
}

3846 3847
SOperatorInfo* createIndefinitOutputOperatorInfo(SOperatorInfo* downstream, SPhysiNode* pNode,
                                                 SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
3848
  SIndefOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SIndefOperatorInfo));
3849
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3850 3851 3852 3853
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

3854 3855
  SExprSupp* pSup = &pOperator->exprSupp;

H
Haojun Liao 已提交
3856 3857 3858
  SIndefRowsFuncPhysiNode* pPhyNode = (SIndefRowsFuncPhysiNode*)pNode;

  int32_t    numOfExpr = 0;
X
Xiaoyu Wang 已提交
3859
  SExprInfo* pExprInfo = createExprInfo(pPhyNode->pFuncs, NULL, &numOfExpr);
H
Haojun Liao 已提交
3860 3861

  if (pPhyNode->pExprs != NULL) {
3862
    int32_t    num = 0;
3863
    SExprInfo* pSExpr = createExprInfo(pPhyNode->pExprs, NULL, &num);
3864
    int32_t    code = initExprSupp(&pInfo->scalarSup, pSExpr, num);
3865 3866 3867
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
H
Haojun Liao 已提交
3868 3869
  }

3870
  SSDataBlock* pResBlock = createResDataBlock(pPhyNode->node.pOutputDataBlockDesc);
H
Haojun Liao 已提交
3871 3872 3873 3874 3875 3876 3877 3878 3879 3880 3881

  int32_t numOfRows = 4096;
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;

  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
  initResultSizeInfo(pOperator, numOfRows);

3882 3883 3884
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfExpr, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);

3885
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfExpr);
H
Haojun Liao 已提交
3886

3887 3888
  pInfo->binfo.pRes = pResBlock;
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pSup->pCtx, numOfExpr);
H
Haojun Liao 已提交
3889

3890
  pOperator->name = "IndefinitOperator";
H
Haojun Liao 已提交
3891
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
3892 3893 3894
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
3895 3896
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->exprSupp.numOfExprs = numOfExpr;
3897
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3898 3899 3900 3901 3902 3903 3904 3905 3906 3907 3908

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doApplyIndefinitFunction, NULL, NULL,
                                         destroyIndefinitOperatorInfo, NULL, NULL, NULL);

  int32_t code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

3909
_error:
H
Haojun Liao 已提交
3910 3911 3912 3913 3914 3915
  taosMemoryFree(pInfo);
  taosMemoryFree(pOperator);
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}

3916
static int32_t initFillInfo(SFillOperatorInfo* pInfo, SExprInfo* pExpr, int32_t numOfCols, SNodeListNode* pValNode,
L
Liu Jicong 已提交
3917
                            STimeWindow win, int32_t capacity, const char* id, SInterval* pInterval, int32_t fillType) {
3918
  SFillColInfo* pColInfo = createFillColInfo(pExpr, numOfCols, pValNode);
H
Haojun Liao 已提交
3919 3920

  STimeWindow w = TSWINDOW_INITIALIZER;
3921
  getAlignQueryTimeWindow(pInterval, pInterval->precision, win.skey, &w);
H
Haojun Liao 已提交
3922 3923

  int32_t order = TSDB_ORDER_ASC;
3924
  pInfo->pFillInfo = taosCreateFillInfo(order, w.skey, 0, capacity, numOfCols, pInterval, fillType, pColInfo, id);
H
Haojun Liao 已提交
3925

wafwerar's avatar
wafwerar 已提交
3926
  pInfo->p = taosMemoryCalloc(numOfCols, POINTER_BYTES);
H
Haojun Liao 已提交
3927
  if (pInfo->pFillInfo == NULL || pInfo->p == NULL) {
H
Haojun Liao 已提交
3928 3929
    taosMemoryFree(pInfo->pFillInfo);
    taosMemoryFree(pInfo->p);
H
Haojun Liao 已提交
3930 3931 3932 3933 3934 3935
    return TSDB_CODE_OUT_OF_MEMORY;
  } else {
    return TSDB_CODE_SUCCESS;
  }
}

3936 3937 3938 3939 3940 3941 3942 3943
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SFillPhysiNode* pPhyFillNode, bool multigroupResult,
                                      SExecTaskInfo* pTaskInfo) {
  SFillOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SFillOperatorInfo));
  SOperatorInfo*     pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

L
Liu Jicong 已提交
3944 3945 3946 3947 3948
  int32_t      num = 0;
  SSDataBlock* pResBlock = createResDataBlock(pPhyFillNode->node.pOutputDataBlockDesc);
  SExprInfo*   pExprInfo = createExprInfo(pPhyFillNode->pTargets, NULL, &num);
  SInterval*   pInterval = &((SIntervalAggOperatorInfo*)downstream->info)->interval;
  int32_t      type = convertFillType(pPhyFillNode->mode);
3949

H
Haojun Liao 已提交
3950
  SResultInfo* pResultInfo = &pOperator->resultInfo;
3951 3952
  initResultSizeInfo(pOperator, 4096);

3953 3954
  int32_t code = initFillInfo(pInfo, pExprInfo, num, (SNodeListNode*)pPhyFillNode->pValues, pPhyFillNode->timeRange,
                              pResultInfo->capacity, pTaskInfo->id.str, pInterval, type);
3955 3956 3957
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3958

L
Liu Jicong 已提交
3959
  pInfo->pRes = pResBlock;
3960
  pInfo->multigroupResult = multigroupResult;
dengyihao's avatar
dengyihao 已提交
3961
  pOperator->name = "FillOperator";
3962
  pOperator->blocking = false;
dengyihao's avatar
dengyihao 已提交
3963
  pOperator->status = OP_NOT_OPENED;
3964
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_FILL;
3965 3966 3967 3968
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->exprSupp.numOfExprs = num;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3969

L
Liu Jicong 已提交
3970 3971
  pOperator->fpSet =
      createOperatorFpSet(operatorDummyOpenFn, doFill, NULL, NULL, destroySFillOperatorInfo, NULL, NULL, NULL);
3972

3973
  code = appendDownstream(pOperator, &downstream, 1);
3974
  return pOperator;
H
Haojun Liao 已提交
3975

L
Liu Jicong 已提交
3976
_error:
wafwerar's avatar
wafwerar 已提交
3977 3978
  taosMemoryFreeClear(pOperator);
  taosMemoryFreeClear(pInfo);
H
Haojun Liao 已提交
3979
  return NULL;
3980 3981
}

D
dapan1121 已提交
3982
static SExecTaskInfo* createExecTaskInfo(uint64_t queryId, uint64_t taskId, EOPTR_EXEC_MODEL model, char* dbFName) {
wafwerar's avatar
wafwerar 已提交
3983
  SExecTaskInfo* pTaskInfo = taosMemoryCalloc(1, sizeof(SExecTaskInfo));
3984
  setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);
H
Haojun Liao 已提交
3985

D
dapan1121 已提交
3986
  pTaskInfo->schemaVer.dbname = strdup(dbFName);
3987
  pTaskInfo->cost.created = taosGetTimestampMs();
H
Haojun Liao 已提交
3988
  pTaskInfo->id.queryId = queryId;
dengyihao's avatar
dengyihao 已提交
3989
  pTaskInfo->execModel = model;
H
Haojun Liao 已提交
3990

wafwerar's avatar
wafwerar 已提交
3991
  char* p = taosMemoryCalloc(1, 128);
L
Liu Jicong 已提交
3992
  snprintf(p, 128, "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, queryId);
H
Haojun Liao 已提交
3993
  pTaskInfo->id.str = p;
H
Haojun Liao 已提交
3994

3995 3996
  return pTaskInfo;
}
H
Haojun Liao 已提交
3997

H
Hongze Cheng 已提交
3998
static STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
H
Haojun Liao 已提交
3999
                                       STableListInfo* pTableListInfo, const char* idstr);
H
Haojun Liao 已提交
4000

H
Haojun Liao 已提交
4001
static SArray* extractColumnInfo(SNodeList* pNodeList);
4002

D
dapan1121 已提交
4003
int32_t extractTableSchemaVersion(SReadHandle* pHandle, uint64_t uid, SExecTaskInfo* pTaskInfo) {
4004 4005
  SMetaReader mr = {0};
  metaReaderInit(&mr, pHandle->meta, 0);
D
dapan1121 已提交
4006
  int32_t code = metaGetTableEntryByUid(&mr, uid);
4007
  if (code != TSDB_CODE_SUCCESS) {
D
dapan1121 已提交
4008
    metaReaderClear(&mr);
4009
    return terrno;
D
dapan1121 已提交
4010
  }
4011 4012 4013 4014

  pTaskInfo->schemaVer.tablename = strdup(mr.me.name);

  if (mr.me.type == TSDB_SUPER_TABLE) {
4015
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
4016
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
4017 4018 4019
  } else if (mr.me.type == TSDB_CHILD_TABLE) {
    tb_uid_t suid = mr.me.ctbEntry.suid;
    metaGetTableEntryByUid(&mr, suid);
4020
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
4021
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
4022
  } else {
4023
    pTaskInfo->schemaVer.sw = tCloneSSchemaWrapper(&mr.me.ntbEntry.schemaRow);
4024
  }
4025 4026

  metaReaderClear(&mr);
D
dapan1121 已提交
4027 4028

  return TSDB_CODE_SUCCESS;
4029 4030
}

4031
static int32_t sortTableGroup(STableListInfo* pTableListInfo, int32_t groupNum) {
wmmhello's avatar
wmmhello 已提交
4032
  taosArrayClear(pTableListInfo->pGroupList);
4033 4034
  SArray* sortSupport = taosArrayInit(groupNum, sizeof(uint64_t));
  if (sortSupport == NULL) return TSDB_CODE_OUT_OF_MEMORY;
wmmhello's avatar
wmmhello 已提交
4035 4036
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
4037
    uint64_t*      groupId = taosHashGet(pTableListInfo->map, &info->uid, sizeof(uint64_t));
wmmhello's avatar
wmmhello 已提交
4038 4039

    int32_t index = taosArraySearchIdx(sortSupport, groupId, compareUint64Val, TD_EQ);
4040 4041 4042 4043
    if (index == -1) {
      void*   p = taosArraySearch(sortSupport, groupId, compareUint64Val, TD_GT);
      SArray* tGroup = taosArrayInit(8, sizeof(STableKeyInfo));
      if (tGroup == NULL) {
wmmhello's avatar
wmmhello 已提交
4044 4045 4046
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
4047
      if (taosArrayPush(tGroup, info) == NULL) {
wmmhello's avatar
wmmhello 已提交
4048 4049 4050 4051
        qError("taos push info array error");
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }
4052
      if (p == NULL) {
wmmhello's avatar
wmmhello 已提交
4053
        if (taosArrayPush(sortSupport, groupId) == NULL) {
wmmhello's avatar
wmmhello 已提交
4054 4055 4056 4057
          qError("taos push support array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
wmmhello's avatar
wmmhello 已提交
4058
        if (taosArrayPush(pTableListInfo->pGroupList, &tGroup) == NULL) {
wmmhello's avatar
wmmhello 已提交
4059 4060 4061 4062
          qError("taos push group array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
4063
      } else {
wmmhello's avatar
wmmhello 已提交
4064
        int32_t pos = TARRAY_ELEM_IDX(sortSupport, p);
4065
        if (taosArrayInsert(sortSupport, pos, groupId) == NULL) {
wmmhello's avatar
wmmhello 已提交
4066 4067 4068 4069
          qError("taos insert support array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
4070
        if (taosArrayInsert(pTableListInfo->pGroupList, pos, &tGroup) == NULL) {
wmmhello's avatar
wmmhello 已提交
4071 4072 4073 4074 4075
          qError("taos insert group array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
      }
4076
    } else {
wmmhello's avatar
wmmhello 已提交
4077
      SArray* tGroup = (SArray*)taosArrayGetP(pTableListInfo->pGroupList, index);
4078
      if (taosArrayPush(tGroup, info) == NULL) {
wmmhello's avatar
wmmhello 已提交
4079 4080 4081 4082 4083 4084 4085 4086 4087 4088
        qError("taos push uid array error");
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }
    }
  }
  taosArrayDestroy(sortSupport);
  return TDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
4089 4090
int32_t generateGroupIdMap(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group) {
  if (group == NULL) {
wmmhello's avatar
wmmhello 已提交
4091 4092 4093 4094 4095 4096 4097 4098
    return TDB_CODE_SUCCESS;
  }

  pTableListInfo->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pTableListInfo->map == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  int32_t keyLen = 0;
X
Xiaoyu Wang 已提交
4099
  void*   keyBuf = NULL;
wmmhello's avatar
wmmhello 已提交
4100

4101
  SNode* node;
wmmhello's avatar
wmmhello 已提交
4102
  FOREACH(node, group) {
4103
    SExprNode* pExpr = (SExprNode*)node;
wmmhello's avatar
wmmhello 已提交
4104
    keyLen += pExpr->resType.bytes;
wmmhello's avatar
wmmhello 已提交
4105 4106
  }

wmmhello's avatar
wmmhello 已提交
4107
  int32_t nullFlagSize = sizeof(int8_t) * LIST_LENGTH(group);
wmmhello's avatar
wmmhello 已提交
4108 4109 4110 4111 4112 4113 4114
  keyLen += nullFlagSize;

  keyBuf = taosMemoryCalloc(1, keyLen);
  if (keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

4115
  int32_t groupNum = 0;
X
Xiaoyu Wang 已提交
4116 4117 4118
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    SMetaReader    mr = {0};
wmmhello's avatar
wmmhello 已提交
4119 4120 4121
    metaReaderInit(&mr, pHandle->meta, 0);
    metaGetTableEntryByUid(&mr, info->uid);

4122
    SNodeList* groupNew = nodesCloneList(group);
wmmhello's avatar
wmmhello 已提交
4123

wmmhello's avatar
wmmhello 已提交
4124
    nodesRewriteExprsPostOrder(groupNew, doTranslateTagExpr, &mr);
wmmhello's avatar
wmmhello 已提交
4125
    char* isNull = (char*)keyBuf;
wmmhello's avatar
wmmhello 已提交
4126 4127
    char* pStart = (char*)keyBuf + nullFlagSize;

4128
    SNode*  pNode;
wmmhello's avatar
wmmhello 已提交
4129
    int32_t index = 0;
4130
    FOREACH(pNode, groupNew) {
wmmhello's avatar
wmmhello 已提交
4131 4132 4133 4134
      SNode*  pNew = NULL;
      int32_t code = scalarCalculateConstants(pNode, &pNew);
      if (TSDB_CODE_SUCCESS == code) {
        REPLACE_NODE(pNew);
X
Xiaoyu Wang 已提交
4135
      } else {
4136
        taosMemoryFree(keyBuf);
wmmhello's avatar
wmmhello 已提交
4137
        nodesClearList(groupNew);
4138
        metaReaderClear(&mr);
wmmhello's avatar
wmmhello 已提交
4139
        return code;
wmmhello's avatar
wmmhello 已提交
4140
      }
4141

wmmhello's avatar
wmmhello 已提交
4142
      ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
4143
      SValueNode* pValue = (SValueNode*)pNew;
4144

wmmhello's avatar
wmmhello 已提交
4145
      if (pValue->node.resType.type == TSDB_DATA_TYPE_NULL || pValue->isNull) {
wmmhello's avatar
wmmhello 已提交
4146 4147 4148 4149
        isNull[index++] = 1;
        continue;
      } else {
        isNull[index++] = 0;
4150
        char* data = nodesGetValueFromNode(pValue);
L
Liu Jicong 已提交
4151 4152
        if (pValue->node.resType.type == TSDB_DATA_TYPE_JSON) {
          if (tTagIsJson(data)) {
wmmhello's avatar
wmmhello 已提交
4153 4154 4155
            terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
            taosMemoryFree(keyBuf);
            nodesClearList(groupNew);
4156
            metaReaderClear(&mr);
wmmhello's avatar
wmmhello 已提交
4157 4158
            return terrno;
          }
wmmhello's avatar
wmmhello 已提交
4159
          int32_t len = getJsonValueLen(data);
wmmhello's avatar
wmmhello 已提交
4160 4161 4162
          memcpy(pStart, data, len);
          pStart += len;
        } else if (IS_VAR_DATA_TYPE(pValue->node.resType.type)) {
wmmhello's avatar
wmmhello 已提交
4163 4164
          memcpy(pStart, data, varDataTLen(data));
          pStart += varDataTLen(data);
wmmhello's avatar
wmmhello 已提交
4165
        } else {
wmmhello's avatar
wmmhello 已提交
4166 4167
          memcpy(pStart, data, pValue->node.resType.bytes);
          pStart += pValue->node.resType.bytes;
wmmhello's avatar
wmmhello 已提交
4168 4169 4170
        }
      }
    }
4171
    int32_t  len = (int32_t)(pStart - (char*)keyBuf);
4172 4173
    uint64_t groupId = calcGroupId(keyBuf, len);
    taosHashPut(pTableListInfo->map, &(info->uid), sizeof(uint64_t), &groupId, sizeof(uint64_t));
S
slzhou 已提交
4174
    info->groupId = groupId;
4175
    groupNum++;
wmmhello's avatar
wmmhello 已提交
4176

wmmhello's avatar
wmmhello 已提交
4177
    nodesClearList(groupNew);
wmmhello's avatar
wmmhello 已提交
4178 4179 4180
    metaReaderClear(&mr);
  }
  taosMemoryFree(keyBuf);
4181

4182
  if (pTableListInfo->needSortTableByGroupId) {
wmmhello's avatar
wmmhello 已提交
4183
    return sortTableGroup(pTableListInfo, groupNum);
4184 4185
  }

wmmhello's avatar
wmmhello 已提交
4186 4187 4188
  return TDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4189
SOperatorInfo* createOperatorTree(SPhysiNode* pPhyNode, SExecTaskInfo* pTaskInfo, SReadHandle* pHandle,
4190 4191
                                  uint64_t queryId, uint64_t taskId, STableListInfo* pTableListInfo,
                                  const char* pUser) {
4192 4193
  int32_t type = nodeType(pPhyNode);

X
Xiaoyu Wang 已提交
4194
  if (pPhyNode->pChildren == NULL || LIST_LENGTH(pPhyNode->pChildren) == 0) {
H
Haojun Liao 已提交
4195
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == type) {
dengyihao's avatar
dengyihao 已提交
4196
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4197

wmmhello's avatar
wmmhello 已提交
4198
      int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
4199
      if (code) {
wmmhello's avatar
wmmhello 已提交
4200
        pTaskInfo->code = code;
D
dapan1121 已提交
4201 4202
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4203

wmmhello's avatar
wmmhello 已提交
4204
      code = extractTableSchemaVersion(pHandle, pTableScanNode->scan.uid, pTaskInfo);
S
slzhou 已提交
4205
      if (code) {
4206
        pTaskInfo->code = terrno;
wmmhello's avatar
wmmhello 已提交
4207 4208 4209
        return NULL;
      }

H
Haojun Liao 已提交
4210
      SOperatorInfo*  pOperator = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo);
4211 4212
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
S
slzhou 已提交
4213
      return pOperator;
L
Liu Jicong 已提交
4214

S
slzhou 已提交
4215 4216
    } else if (QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN == type) {
      STableMergeScanPhysiNode* pTableScanNode = (STableMergeScanPhysiNode*)pPhyNode;
wmmhello's avatar
wmmhello 已提交
4217
      int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
L
Liu Jicong 已提交
4218
      if (code) {
wmmhello's avatar
wmmhello 已提交
4219
        pTaskInfo->code = code;
wmmhello's avatar
wmmhello 已提交
4220 4221 4222 4223 4224 4225 4226
        return NULL;
      }
      code = extractTableSchemaVersion(pHandle, pTableScanNode->scan.uid, pTaskInfo);
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4227

4228 4229
      SOperatorInfo* pOperator =
          createTableMergeScanOperatorInfo(pTableScanNode, pTableListInfo, pHandle, pTaskInfo, queryId, taskId);
wmmhello's avatar
wmmhello 已提交
4230

4231 4232 4233
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
      return pOperator;
L
Liu Jicong 已提交
4234

H
Haojun Liao 已提交
4235
    } else if (QUERY_NODE_PHYSICAL_PLAN_EXCHANGE == type) {
4236
      return createExchangeOperatorInfo(pHandle->pMsgCb->clientRpc, (SExchangePhysiNode*)pPhyNode, pTaskInfo);
L
Liu Jicong 已提交
4237

H
Haojun Liao 已提交
4238
    } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN == type) {
5
54liuyao 已提交
4239
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
4240
      STimeWindowAggSupp   twSup = {
L
Liu Jicong 已提交
4241 4242 4243 4244
            .waterMark = pTableScanNode->watermark,
            .calTrigger = pTableScanNode->triggerType,
            .maxTs = INT64_MIN,
      };
L
Liu Jicong 已提交
4245
      if (pHandle) {
wmmhello's avatar
wmmhello 已提交
4246
        int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
L
Liu Jicong 已提交
4247
        if (code) {
wmmhello's avatar
wmmhello 已提交
4248 4249 4250
          pTaskInfo->code = code;
          return NULL;
        }
5
54liuyao 已提交
4251
      }
4252

4253 4254
      SOperatorInfo* pOperator =
          createStreamScanOperatorInfo(pHandle, pTableScanNode, pTaskInfo, &twSup, queryId, taskId);
H
Haojun Liao 已提交
4255
      return pOperator;
L
Liu Jicong 已提交
4256

H
Haojun Liao 已提交
4257
    } else if (QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN == type) {
L
Liu Jicong 已提交
4258
      SSystemTableScanPhysiNode* pSysScanPhyNode = (SSystemTableScanPhysiNode*)pPhyNode;
4259
      return createSysTableScanOperatorInfo(pHandle, pSysScanPhyNode, pUser, pTaskInfo);
4260
    } else if (QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN == type) {
X
Xiaoyu Wang 已提交
4261
      STagScanPhysiNode* pScanPhyNode = (STagScanPhysiNode*)pPhyNode;
4262

4263
      int32_t code = getTableList(pHandle->meta, pHandle->vnode, pScanPhyNode, pTableListInfo);
4264
      if (code != TSDB_CODE_SUCCESS) {
4265
        pTaskInfo->code = terrno;
4266 4267 4268
        return NULL;
      }

4269
      return createTagScanOperatorInfo(pHandle, pScanPhyNode, pTableListInfo, pTaskInfo);
4270
    } else if (QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN == type) {
4271
      SBlockDistScanPhysiNode* pBlockNode = (SBlockDistScanPhysiNode*)pPhyNode;
4272 4273 4274
      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));

      if (pBlockNode->tableType == TSDB_SUPER_TABLE) {
4275
        int32_t code = vnodeGetAllTableList(pHandle->vnode, pBlockNode->uid, pTableListInfo->pTableList);
4276 4277 4278 4279 4280
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
S
slzhou 已提交
4281
        STableKeyInfo info = {.lastKey = 0, .uid = pBlockNode->uid, .groupId = 0};
4282 4283 4284 4285 4286 4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297 4298 4299 4300 4301 4302 4303
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      SQueryTableDataCond cond = {0};

      {
        cond.order = TSDB_ORDER_ASC;
        cond.numOfCols = 1;
        cond.colList = taosMemoryCalloc(1, sizeof(SColumnInfo));
        if (cond.colList == NULL) {
          terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
          return NULL;
        }

        cond.colList->colId = 1;
        cond.colList->type = TSDB_DATA_TYPE_TIMESTAMP;
        cond.colList->bytes = sizeof(TSKEY);

        cond.numOfTWindows = 1;
        cond.twindows = taosMemoryCalloc(1, sizeof(STimeWindow));
        cond.twindows[0] = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};
        cond.suid = pBlockNode->suid;
H
Haojun Liao 已提交
4304
        cond.type = BLOCK_LOAD_OFFSET_ORDER;
4305
      }
H
Haojun Liao 已提交
4306 4307 4308

      STsdbReader* pReader = NULL;
      tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, "");
4309 4310
      cleanupQueryTableDataCond(&cond);

4311
      return createDataBlockInfoScanOperator(pReader, pHandle, cond.suid, pBlockNode, pTaskInfo);
H
Haojun Liao 已提交
4312 4313 4314
    } else if (QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN == type) {
      SLastRowScanPhysiNode* pScanNode = (SLastRowScanPhysiNode*)pPhyNode;

L
Liu Jicong 已提交
4315 4316 4317 4318 4319
      //      int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
      //      if (code) {
      //        pTaskInfo->code = code;
      //        return NULL;
      //      }
H
Haojun Liao 已提交
4320

4321
      int32_t code = extractTableSchemaVersion(pHandle, pScanNode->uid, pTaskInfo);
4322 4323 4324 4325
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
      }
4326

H
Haojun Liao 已提交
4327
      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));
H
Haojun Liao 已提交
4328
      if (pScanNode->tableType == TSDB_SUPER_TABLE) {
4329
        code = vnodeGetAllTableList(pHandle->vnode, pScanNode->uid, pTableListInfo->pTableList);
H
Haojun Liao 已提交
4330 4331 4332 4333 4334 4335 4336 4337 4338
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
        STableKeyInfo info = {.lastKey = 0, .uid = pScanNode->uid, .groupId = 0};
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

H
Haojun Liao 已提交
4339
      return createLastrowScanOperator(pScanNode, pHandle, pTableListInfo->pTableList, pTaskInfo);
H
Haojun Liao 已提交
4340 4341
    } else {
      ASSERT(0);
H
Haojun Liao 已提交
4342 4343 4344
    }
  }

4345 4346
  int32_t num = 0;
  size_t  size = LIST_LENGTH(pPhyNode->pChildren);
H
Haojun Liao 已提交
4347

4348
  SOperatorInfo** ops = taosMemoryCalloc(size, POINTER_BYTES);
dengyihao's avatar
dengyihao 已提交
4349
  for (int32_t i = 0; i < size; ++i) {
4350
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pPhyNode->pChildren, i);
4351
    ops[i] = createOperatorTree(pChildNode, pTaskInfo, pHandle, queryId, taskId, pTableListInfo, pUser);
4352 4353 4354
    if (ops[i] == NULL) {
      return NULL;
    }
4355
  }
H
Haojun Liao 已提交
4356

4357
  SOperatorInfo* pOptr = NULL;
H
Haojun Liao 已提交
4358
  if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
4359
    pOptr = createProjectOperatorInfo(ops[0], (SProjectPhysiNode*)pPhyNode, pTaskInfo);
4360
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_AGG == type) {
H
Haojun Liao 已提交
4361 4362
    SAggPhysiNode* pAggNode = (SAggPhysiNode*)pPhyNode;
    SExprInfo*     pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
4363
    SSDataBlock*   pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4364

dengyihao's avatar
dengyihao 已提交
4365
    int32_t    numOfScalarExpr = 0;
4366 4367 4368 4369 4370
    SExprInfo* pScalarExprInfo = NULL;
    if (pAggNode->pExprs != NULL) {
      pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
    }

H
Haojun Liao 已提交
4371 4372
    if (pAggNode->pGroupKeys != NULL) {
      SArray* pColList = extractColumnInfo(pAggNode->pGroupKeys);
dengyihao's avatar
dengyihao 已提交
4373
      pOptr = createGroupOperatorInfo(ops[0], pExprInfo, num, pResBlock, pColList, pAggNode->node.pConditions,
wmmhello's avatar
wmmhello 已提交
4374
                                      pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4375
    } else {
L
Liu Jicong 已提交
4376 4377
      pOptr = createAggregateOperatorInfo(ops[0], pExprInfo, num, pResBlock, pAggNode->node.pConditions,
                                          pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4378
    }
X
Xiaoyu Wang 已提交
4379
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_INTERVAL == type || QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type) {
H
Haojun Liao 已提交
4380
    SIntervalPhysiNode* pIntervalPhyNode = (SIntervalPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4381

H
Haojun Liao 已提交
4382
    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
4383
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4384

dengyihao's avatar
dengyihao 已提交
4385 4386 4387 4388 4389 4390
    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
H
Haojun Liao 已提交
4391

X
Xiaoyu Wang 已提交
4392 4393 4394 4395 4396
    STimeWindowAggSupp as = {
        .waterMark = pIntervalPhyNode->window.watermark,
        .calTrigger = pIntervalPhyNode->window.triggerType,
        .maxTs = INT64_MIN,
    };
4397
    ASSERT(as.calTrigger != STREAM_TRIGGER_MAX_DELAY);
4398

4399
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4400
    bool    isStream = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type);
4401 4402
    pOptr = createIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, &as, pIntervalPhyNode,
                                       pTaskInfo, isStream);
4403

4404 4405
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == type) {
    SMergeAlignedIntervalPhysiNode* pIntervalPhyNode = (SMergeAlignedIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4406 4407 4408 4409 4410 4411 4412 4413 4414 4415

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4416

S
shenglian zhou 已提交
4417
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
4418
    pOptr = createMergeAlignedIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
S
shenglian zhou 已提交
4419
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_INTERVAL == type) {
X
Xiaoyu Wang 已提交
4420
    SMergeIntervalPhysiNode* pIntervalPhyNode = (SMergeIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4421 4422 4423 4424 4425 4426 4427 4428 4429 4430

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4431

S
shenglian zhou 已提交
4432 4433
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    pOptr = createMergeIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
5
54liuyao 已提交
4434
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL == type) {
4435
    int32_t children = 0;
5
54liuyao 已提交
4436 4437
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL == type) {
4438
    int32_t children = 1;
5
54liuyao 已提交
4439
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4440
  } else if (QUERY_NODE_PHYSICAL_PLAN_SORT == type) {
4441
    pOptr = createSortOperatorInfo(ops[0], (SSortPhysiNode*)pPhyNode, pTaskInfo);
S
shenglian zhou 已提交
4442 4443
  } else if (QUERY_NODE_PHYSICAL_PLAN_GROUP_SORT == type) {
    pOptr = createGroupSortOperatorInfo(ops[0], (SGroupSortPhysiNode*)pPhyNode, pTaskInfo);
X
Xiaoyu Wang 已提交
4444
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE == type) {
4445
    SMergePhysiNode* pMergePhyNode = (SMergePhysiNode*)pPhyNode;
4446
    pOptr = createMultiwayMergeOperatorInfo(ops, size, pMergePhyNode, pTaskInfo);
4447
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_SESSION == type) {
H
Haojun Liao 已提交
4448 4449
    SSessionWinodwPhysiNode* pSessionNode = (SSessionWinodwPhysiNode*)pPhyNode;

X
Xiaoyu Wang 已提交
4450 4451
    STimeWindowAggSupp as = {.waterMark = pSessionNode->window.watermark,
                             .calTrigger = pSessionNode->window.triggerType};
4452

H
Haojun Liao 已提交
4453
    SExprInfo*   pExprInfo = createExprInfo(pSessionNode->window.pFuncs, NULL, &num);
4454
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4455 4456
    int32_t      tsSlotId = ((SColumnNode*)pSessionNode->window.pTspk)->slotId;

X
Xiaoyu Wang 已提交
4457 4458
    pOptr =
        createSessionAggOperatorInfo(ops[0], pExprInfo, num, pResBlock, pSessionNode->gap, tsSlotId, &as, pTaskInfo);
4459
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == type) {
4460 4461 4462 4463 4464 4465 4466
    pOptr = createStreamSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_SESSION == type) {
    int32_t children = 0;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_SESSION == type) {
    int32_t children = 1;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4467
  } else if (QUERY_NODE_PHYSICAL_PLAN_PARTITION == type) {
4468
    pOptr = createPartitionOperatorInfo(ops[0], (SPartitionPhysiNode*)pPhyNode, pTaskInfo);
4469
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_STATE == type) {
dengyihao's avatar
dengyihao 已提交
4470
    SStateWinodwPhysiNode* pStateNode = (SStateWinodwPhysiNode*)pPhyNode;
4471

4472 4473
    STimeWindowAggSupp as = {.waterMark = pStateNode->window.watermark, .calTrigger = pStateNode->window.triggerType};

dengyihao's avatar
dengyihao 已提交
4474
    SExprInfo*   pExprInfo = createExprInfo(pStateNode->window.pFuncs, NULL, &num);
4475
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4476 4477
    int32_t      tsSlotId = ((SColumnNode*)pStateNode->window.pTspk)->slotId;

4478
    SColumnNode* pColNode = (SColumnNode*)((STargetNode*)pStateNode->pStateKey)->pExpr;
X
Xiaoyu Wang 已提交
4479
    SColumn      col = extractColumnFromColumnNode(pColNode);
4480
    pOptr = createStatewindowOperatorInfo(ops[0], pExprInfo, num, pResBlock, &as, tsSlotId, &col, pTaskInfo);
4481
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == type) {
5
54liuyao 已提交
4482
    pOptr = createStreamStateAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4483
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_JOIN == type) {
4484
    pOptr = createMergeJoinOperatorInfo(ops, size, (SJoinPhysiNode*)pPhyNode, pTaskInfo);
4485
  } else if (QUERY_NODE_PHYSICAL_PLAN_FILL == type) {
4486
    pOptr = createFillOperatorInfo(ops[0], (SFillPhysiNode*)pPhyNode, false, pTaskInfo);
H
Haojun Liao 已提交
4487 4488
  } else if (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC == type) {
    pOptr = createIndefinitOutputOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4489 4490
  } else if (QUERY_NODE_PHYSICAL_PLAN_INTERP_FUNC == type) {
    pOptr = createTimeSliceOperatorInfo(ops[0], pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4491 4492
  } else {
    ASSERT(0);
H
Haojun Liao 已提交
4493
  }
4494 4495 4496

  taosMemoryFree(ops);
  return pOptr;
4497
}
H
Haojun Liao 已提交
4498

4499
int32_t compareTimeWindow(const void* p1, const void* p2, const void* param) {
dengyihao's avatar
dengyihao 已提交
4500 4501 4502
  const SQueryTableDataCond* pCond = param;
  const STimeWindow*         pWin1 = p1;
  const STimeWindow*         pWin2 = p2;
4503 4504 4505 4506 4507 4508 4509 4510
  if (pCond->order == TSDB_ORDER_ASC) {
    return pWin1->skey - pWin2->skey;
  } else if (pCond->order == TSDB_ORDER_DESC) {
    return pWin2->skey - pWin1->skey;
  }
  return 0;
}

H
Haojun Liao 已提交
4511
SArray* extractColumnInfo(SNodeList* pNodeList) {
L
Liu Jicong 已提交
4512
  size_t  numOfCols = LIST_LENGTH(pNodeList);
H
Haojun Liao 已提交
4513 4514 4515 4516 4517 4518
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

L
Liu Jicong 已提交
4519 4520
  for (int32_t i = 0; i < numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);
H
Haojun Liao 已提交
4521

4522 4523 4524
    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

4525
      SColumn c = extractColumnFromColumnNode(pColNode);
4526 4527
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
L
Liu Jicong 已提交
4528 4529
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};
4530
      c.slotId = pNode->slotId;
L
Liu Jicong 已提交
4531 4532 4533 4534
      c.colId = pNode->slotId;
      c.type = pValNode->node.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
4535 4536 4537 4538
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
H
Haojun Liao 已提交
4539 4540 4541 4542 4543
  }

  return pList;
}

L
Liu Jicong 已提交
4544 4545
STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
                                STableListInfo* pTableListInfo, const char* idstr) {
4546
  int32_t code = getTableList(pHandle->meta, pHandle->vnode, &pTableScanNode->scan, pTableListInfo);
wmmhello's avatar
wmmhello 已提交
4547 4548 4549 4550 4551 4552
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  if (taosArrayGetSize(pTableListInfo->pTableList) == 0) {
    code = 0;
H
Haojun Liao 已提交
4553
    qDebug("no table qualified for query, %s", idstr);
wmmhello's avatar
wmmhello 已提交
4554 4555 4556
    goto _error;
  }

4557
  SQueryTableDataCond cond = {0};
wmmhello's avatar
wmmhello 已提交
4558
  code = initQueryTableDataCond(&cond, pTableScanNode);
4559
  if (code != TSDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4560
    goto _error;
X
Xiaoyu Wang 已提交
4561
  }
4562

H
Hongze Cheng 已提交
4563
  STsdbReader* pReader;
H
Haojun Liao 已提交
4564
  code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, idstr);
H
Haojun Liao 已提交
4565 4566 4567 4568
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

4569
  cleanupQueryTableDataCond(&cond);
H
Haojun Liao 已提交
4570 4571

  return pReader;
wmmhello's avatar
wmmhello 已提交
4572 4573 4574 4575

_error:
  terrno = code;
  return NULL;
H
Haojun Liao 已提交
4576 4577
}

L
Liu Jicong 已提交
4578 4579 4580 4581 4582 4583 4584 4585 4586 4587 4588 4589 4590
static int32_t extractTbscanInStreamOpTree(SOperatorInfo* pOperator, STableScanInfo** ppInfo) {
  if (pOperator->operatorType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    if (pOperator->numOfDownstream > 1) {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }
    return extractTbscanInStreamOpTree(pOperator->pDownstream[0], ppInfo);
  } else {
4591 4592 4593
    SStreamScanInfo* pInfo = pOperator->info;
    ASSERT(pInfo->pTableScanOp->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN);
    *ppInfo = pInfo->pTableScanOp->info;
L
Liu Jicong 已提交
4594 4595 4596 4597
    return 0;
  }
}

4598 4599 4600 4601 4602 4603 4604 4605 4606 4607 4608 4609 4610 4611 4612 4613 4614 4615 4616 4617 4618 4619
int32_t extractTableScanNode(SPhysiNode* pNode, STableScanPhysiNode** ppNode) {
  if (pNode->pChildren == NULL || LIST_LENGTH(pNode->pChildren) == 0) {
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == pNode->type) {
      *ppNode = (STableScanPhysiNode*)pNode;
      return 0;
    } else {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }
  } else {
    if (LIST_LENGTH(pNode->pChildren) != 1) {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pNode->pChildren, 0);
    return extractTableScanNode(pChildNode, ppNode);
  }
  return -1;
}

L
Liu Jicong 已提交
4620 4621 4622 4623 4624
int32_t rebuildReader(SOperatorInfo* pOperator, SSubplan* plan, SReadHandle* pHandle, int64_t uid, int64_t ts) {
  STableScanInfo* pTableScanInfo = NULL;
  if (extractTbscanInStreamOpTree(pOperator, &pTableScanInfo) < 0) {
    return -1;
  }
4625

L
Liu Jicong 已提交
4626 4627 4628 4629
  STableScanPhysiNode* pNode = NULL;
  if (extractTableScanNode(plan->pNode, &pNode) < 0) {
    ASSERT(0);
  }
4630

H
Haojun Liao 已提交
4631
  tsdbReaderClose(pTableScanInfo->dataReader);
4632

L
Liu Jicong 已提交
4633
  STableListInfo info = {0};
H
Haojun Liao 已提交
4634
  pTableScanInfo->dataReader = doCreateDataReader(pNode, pHandle, &info, NULL);
L
Liu Jicong 已提交
4635 4636 4637 4638
  if (pTableScanInfo->dataReader == NULL) {
    ASSERT(0);
    qError("failed to create data reader");
    return TSDB_CODE_QRY_APP_ERROR;
4639
  }
L
Liu Jicong 已提交
4640
  // TODO: set uid and ts to data reader
4641 4642 4643
  return 0;
}

C
Cary Xu 已提交
4644
int32_t encodeOperator(SOperatorInfo* ops, char** result, int32_t* length, int32_t* nOptrWithVal) {
wmmhello's avatar
wmmhello 已提交
4645
  int32_t code = TDB_CODE_SUCCESS;
4646
  char*   pCurrent = NULL;
wmmhello's avatar
wmmhello 已提交
4647
  int32_t currLength = 0;
4648
  if (ops->fpSet.encodeResultRow) {
C
Cary Xu 已提交
4649
    if (result == NULL || length == NULL || nOptrWithVal == NULL) {
wmmhello's avatar
wmmhello 已提交
4650 4651 4652
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    code = ops->fpSet.encodeResultRow(ops, &pCurrent, &currLength);
wmmhello's avatar
wmmhello 已提交
4653

4654 4655
    if (code != TDB_CODE_SUCCESS) {
      if (*result != NULL) {
wmmhello's avatar
wmmhello 已提交
4656 4657 4658 4659
        taosMemoryFree(*result);
        *result = NULL;
      }
      return code;
C
Cary Xu 已提交
4660 4661 4662
    } else if (currLength == 0) {
      ASSERT(!pCurrent);
      goto _downstream;
wmmhello's avatar
wmmhello 已提交
4663
    }
wmmhello's avatar
wmmhello 已提交
4664

C
Cary Xu 已提交
4665 4666
    ++(*nOptrWithVal);

C
Cary Xu 已提交
4667
    ASSERT(currLength >= 0);
wmmhello's avatar
wmmhello 已提交
4668

4669
    if (*result == NULL) {
wmmhello's avatar
wmmhello 已提交
4670
      *result = (char*)taosMemoryCalloc(1, currLength + sizeof(int32_t));
wmmhello's avatar
wmmhello 已提交
4671 4672 4673 4674 4675 4676
      if (*result == NULL) {
        taosMemoryFree(pCurrent);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      memcpy(*result + sizeof(int32_t), pCurrent, currLength);
      *(int32_t*)(*result) = currLength + sizeof(int32_t);
4677
    } else {
wmmhello's avatar
wmmhello 已提交
4678
      int32_t sizePre = *(int32_t*)(*result);
4679
      char*   tmp = (char*)taosMemoryRealloc(*result, sizePre + currLength);
wmmhello's avatar
wmmhello 已提交
4680 4681 4682 4683 4684 4685 4686 4687 4688 4689 4690 4691
      if (tmp == NULL) {
        taosMemoryFree(pCurrent);
        taosMemoryFree(*result);
        *result = NULL;
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      *result = tmp;
      memcpy(*result + sizePre, pCurrent, currLength);
      *(int32_t*)(*result) += currLength;
    }
    taosMemoryFree(pCurrent);
    *length = *(int32_t*)(*result);
wmmhello's avatar
wmmhello 已提交
4692 4693
  }

C
Cary Xu 已提交
4694
_downstream:
wmmhello's avatar
wmmhello 已提交
4695
  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
C
Cary Xu 已提交
4696
    code = encodeOperator(ops->pDownstream[i], result, length, nOptrWithVal);
4697
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4698
      return code;
wmmhello's avatar
wmmhello 已提交
4699 4700
    }
  }
wmmhello's avatar
wmmhello 已提交
4701
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
4702 4703
}

H
Haojun Liao 已提交
4704
int32_t decodeOperator(SOperatorInfo* ops, const char* result, int32_t length) {
wmmhello's avatar
wmmhello 已提交
4705
  int32_t code = TDB_CODE_SUCCESS;
4706 4707
  if (ops->fpSet.decodeResultRow) {
    if (result == NULL) {
wmmhello's avatar
wmmhello 已提交
4708 4709
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
H
Haojun Liao 已提交
4710

4711
    ASSERT(length == *(int32_t*)result);
H
Haojun Liao 已提交
4712 4713

    const char* data = result + sizeof(int32_t);
L
Liu Jicong 已提交
4714
    code = ops->fpSet.decodeResultRow(ops, (char*)data);
4715
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4716 4717
      return code;
    }
wmmhello's avatar
wmmhello 已提交
4718

wmmhello's avatar
wmmhello 已提交
4719
    int32_t totalLength = *(int32_t*)result;
4720 4721
    int32_t dataLength = *(int32_t*)data;

4722
    if (totalLength == dataLength + sizeof(int32_t)) {  // the last data
wmmhello's avatar
wmmhello 已提交
4723 4724
      result = NULL;
      length = 0;
4725
    } else {
wmmhello's avatar
wmmhello 已提交
4726 4727 4728 4729
      result += dataLength;
      *(int32_t*)(result) = totalLength - dataLength;
      length = totalLength - dataLength;
    }
wmmhello's avatar
wmmhello 已提交
4730 4731
  }

wmmhello's avatar
wmmhello 已提交
4732 4733
  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    code = decodeOperator(ops->pDownstream[i], result, length);
4734
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4735
      return code;
wmmhello's avatar
wmmhello 已提交
4736 4737
    }
  }
wmmhello's avatar
wmmhello 已提交
4738
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
4739 4740
}

4741
int32_t createDataSinkParam(SDataSinkNode* pNode, void** pParam, qTaskInfo_t* pTaskInfo) {
D
dapan1121 已提交
4742
  SExecTaskInfo* pTask = *(SExecTaskInfo**)pTaskInfo;
4743

D
dapan1121 已提交
4744 4745
  switch (pNode->type) {
    case QUERY_NODE_PHYSICAL_PLAN_DELETE: {
4746
      SDeleterParam* pDeleterParam = taosMemoryCalloc(1, sizeof(SDeleterParam));
D
dapan1121 已提交
4747 4748 4749 4750
      if (NULL == pDeleterParam) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      int32_t tbNum = taosArrayGetSize(pTask->tableqinfoList.pTableList);
D
dapan1121 已提交
4751
      pDeleterParam->suid = pTask->tableqinfoList.suid;
D
dapan1121 已提交
4752 4753 4754 4755 4756 4757
      pDeleterParam->pUidList = taosArrayInit(tbNum, sizeof(uint64_t));
      if (NULL == pDeleterParam->pUidList) {
        taosMemoryFree(pDeleterParam);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      for (int32_t i = 0; i < tbNum; ++i) {
4758
        STableKeyInfo* pTable = taosArrayGet(pTask->tableqinfoList.pTableList, i);
D
dapan1121 已提交
4759 4760 4761 4762 4763 4764 4765 4766 4767 4768 4769 4770 4771
        taosArrayPush(pDeleterParam->pUidList, &pTable->uid);
      }

      *pParam = pDeleterParam;
      break;
    }
    default:
      break;
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
4772
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
4773
                               const char* sql, EOPTR_EXEC_MODEL model) {
H
Haojun Liao 已提交
4774 4775
  uint64_t queryId = pPlan->id.queryId;

H
Haojun Liao 已提交
4776
  int32_t code = TSDB_CODE_SUCCESS;
D
dapan1121 已提交
4777
  *pTaskInfo = createExecTaskInfo(queryId, taskId, model, pPlan->dbFName);
H
Haojun Liao 已提交
4778 4779 4780 4781
  if (*pTaskInfo == NULL) {
    code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    goto _complete;
  }
H
Haojun Liao 已提交
4782

4783
  (*pTaskInfo)->sql = sql;
wmmhello's avatar
wmmhello 已提交
4784 4785
  (*pTaskInfo)->tableqinfoList.pTagCond = pPlan->pTagCond;
  (*pTaskInfo)->tableqinfoList.pTagIndexCond = pPlan->pTagIndexCond;
4786 4787
  (*pTaskInfo)->pRoot = createOperatorTree(pPlan->pNode, *pTaskInfo, pHandle, queryId, taskId,
                                           &(*pTaskInfo)->tableqinfoList, pPlan->user);
L
Liu Jicong 已提交
4788

D
dapan1121 已提交
4789
  if (NULL == (*pTaskInfo)->pRoot) {
4790
    code = (*pTaskInfo)->code;
D
dapan1121 已提交
4791
    goto _complete;
4792 4793
  }

H
Haojun Liao 已提交
4794 4795
  return code;

H
Haojun Liao 已提交
4796
_complete:
wafwerar's avatar
wafwerar 已提交
4797
  taosMemoryFreeClear(*pTaskInfo);
H
Haojun Liao 已提交
4798 4799
  terrno = code;
  return code;
H
Haojun Liao 已提交
4800 4801
}

wmmhello's avatar
wmmhello 已提交
4802 4803 4804
static void doDestroyTableList(STableListInfo* pTableqinfoList) {
  taosArrayDestroy(pTableqinfoList->pTableList);
  taosHashCleanup(pTableqinfoList->map);
4805 4806
  if (pTableqinfoList->needSortTableByGroupId) {
    for (int32_t i = 0; i < taosArrayGetSize(pTableqinfoList->pGroupList); i++) {
wmmhello's avatar
wmmhello 已提交
4807 4808 4809 4810 4811
      SArray* tmp = taosArrayGetP(pTableqinfoList->pGroupList, i);
      taosArrayDestroy(tmp);
    }
  }
  taosArrayDestroy(pTableqinfoList->pGroupList);
4812

wmmhello's avatar
wmmhello 已提交
4813 4814
  pTableqinfoList->pTableList = NULL;
  pTableqinfoList->map = NULL;
4815 4816
}

L
Liu Jicong 已提交
4817
void doDestroyTask(SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
4818 4819
  qDebug("%s execTask is freed", GET_TASKID(pTaskInfo));

wmmhello's avatar
wmmhello 已提交
4820
  doDestroyTableList(&pTaskInfo->tableqinfoList);
H
Haojun Liao 已提交
4821
  destroyOperatorInfo(pTaskInfo->pRoot);
L
Liu Jicong 已提交
4822 4823
  //  taosArrayDestroy(pTaskInfo->summary.queryProfEvents);
  //  taosHashCleanup(pTaskInfo->summary.operatorProfResults);
4824

4825 4826
  taosMemoryFree(pTaskInfo->schemaVer.dbname);
  taosMemoryFree(pTaskInfo->schemaVer.tablename);
wafwerar's avatar
wafwerar 已提交
4827 4828 4829
  taosMemoryFreeClear(pTaskInfo->sql);
  taosMemoryFreeClear(pTaskInfo->id.str);
  taosMemoryFreeClear(pTaskInfo);
4830 4831 4832 4833 4834 4835 4836 4837 4838 4839 4840 4841
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes) {
  if (val == NULL) {
    setNull(output, type, bytes);
    return;
  }

  if (IS_VAR_DATA_TYPE(type)) {
    // Binary data overflows for sort of unknown reasons. Let trim the overflow data
    if (varDataTLen(val) > bytes) {
      int32_t maxLen = bytes - VARSTR_HEADER_SIZE;
L
Liu Jicong 已提交
4842
      int32_t len = (varDataLen(val) > maxLen) ? maxLen : varDataLen(val);
4843 4844 4845 4846 4847 4848 4849 4850 4851 4852 4853 4854
      memcpy(varDataVal(output), varDataVal(val), len);
      varDataSetLen(output, len);
    } else {
      varDataCopy(output, val);
    }
  } else {
    memcpy(output, val, bytes);
  }
}

static int64_t getQuerySupportBufSize(size_t numOfTables) {
  size_t s1 = sizeof(STableQueryInfo);
L
Liu Jicong 已提交
4855 4856
  //  size_t s3 = sizeof(STableCheckInfo);  buffer consumption in tsdb
  return (int64_t)(s1 * 1.5 * numOfTables);
4857 4858 4859 4860 4861 4862 4863
}

int32_t checkForQueryBuf(size_t numOfTables) {
  int64_t t = getQuerySupportBufSize(numOfTables);
  if (tsQueryBufferSizeBytes < 0) {
    return TSDB_CODE_SUCCESS;
  } else if (tsQueryBufferSizeBytes > 0) {
L
Liu Jicong 已提交
4864
    while (1) {
4865 4866 4867 4868 4869 4870 4871 4872 4873 4874 4875 4876 4877 4878 4879 4880 4881 4882 4883 4884 4885 4886 4887 4888 4889 4890
      int64_t s = tsQueryBufferSizeBytes;
      int64_t remain = s - t;
      if (remain >= 0) {
        if (atomic_val_compare_exchange_64(&tsQueryBufferSizeBytes, s, remain) == s) {
          return TSDB_CODE_SUCCESS;
        }
      } else {
        return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
      }
    }
  }

  // disable query processing if the value of tsQueryBufferSize is zero.
  return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
}

void releaseQueryBuf(size_t numOfTables) {
  if (tsQueryBufferSizeBytes < 0) {
    return;
  }

  int64_t t = getQuerySupportBufSize(numOfTables);

  // restore value is not enough buffer available
  atomic_add_fetch_64(&tsQueryBufferSizeBytes, t);
}
D
dapan1121 已提交
4891

dengyihao's avatar
dengyihao 已提交
4892 4893
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SExplainExecInfo** pRes, int32_t* capacity,
                                   int32_t* resNum) {
D
dapan1121 已提交
4894 4895
  if (*resNum >= *capacity) {
    *capacity += 10;
dengyihao's avatar
dengyihao 已提交
4896

D
dapan1121 已提交
4897 4898
    *pRes = taosMemoryRealloc(*pRes, (*capacity) * sizeof(SExplainExecInfo));
    if (NULL == *pRes) {
D
dapan1121 已提交
4899
      qError("malloc %d failed", (*capacity) * (int32_t)sizeof(SExplainExecInfo));
D
dapan1121 已提交
4900 4901 4902 4903
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }
  }

4904 4905 4906 4907 4908
  SExplainExecInfo* pInfo = &(*pRes)[*resNum];

  pInfo->numOfRows = operatorInfo->resultInfo.totalRows;
  pInfo->startupCost = operatorInfo->cost.openCost;
  pInfo->totalCost = operatorInfo->cost.totalCost;
D
dapan1121 已提交
4909

4910
  if (operatorInfo->fpSet.getExplainFn) {
4911
    int32_t code = operatorInfo->fpSet.getExplainFn(operatorInfo, &pInfo->verboseInfo, &pInfo->verboseLen);
D
dapan1121 已提交
4912
    if (code) {
4913
      qError("%s operator getExplainFn failed, code:%s", GET_TASKID(operatorInfo->pTaskInfo), tstrerror(code));
D
dapan1121 已提交
4914 4915
      return code;
    }
4916 4917 4918
  } else {
    pInfo->verboseLen = 0;
    pInfo->verboseInfo = NULL;
D
dapan1121 已提交
4919
  }
dengyihao's avatar
dengyihao 已提交
4920

D
dapan1121 已提交
4921
  ++(*resNum);
dengyihao's avatar
dengyihao 已提交
4922

D
dapan1121 已提交
4923
  int32_t code = 0;
D
dapan1121 已提交
4924 4925
  for (int32_t i = 0; i < operatorInfo->numOfDownstream; ++i) {
    code = getOperatorExplainExecInfo(operatorInfo->pDownstream[i], pRes, capacity, resNum);
D
dapan1121 已提交
4926 4927 4928 4929 4930 4931 4932
    if (code) {
      taosMemoryFreeClear(*pRes);
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
D
dapan1121 已提交
4933
}
5
54liuyao 已提交
4934

L
Liu Jicong 已提交
4935
int32_t initStreamAggSupporter(SStreamAggSupporter* pSup, const char* pKey, SqlFunctionCtx* pCtx, int32_t numOfOutput,
4936
                               int32_t size) {
4937
  pSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
5
54liuyao 已提交
4938 4939
  pSup->keySize = sizeof(int64_t) + sizeof(TSKEY);
  pSup->pKeyBuf = taosMemoryCalloc(1, pSup->keySize);
4940 4941
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pSup->pResultRows = taosHashInit(1024, hashFn, false, HASH_NO_LOCK);
5
54liuyao 已提交
4942 4943 4944
  if (pSup->pKeyBuf == NULL || pSup->pResultRows == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
4945
  pSup->valueSize = size;
5
54liuyao 已提交
4946

5
54liuyao 已提交
4947 4948
  pSup->pScanWindow = taosArrayInit(4, sizeof(STimeWindow));

5
54liuyao 已提交
4949 4950 4951 4952 4953 4954 4955 4956 4957
  int32_t pageSize = 4096;
  while (pageSize < pSup->resultRowSize * 4) {
    pageSize <<= 1u;
  }
  // at least four pages need to be in buffer
  int32_t bufSize = 4096 * 256;
  if (bufSize <= pageSize) {
    bufSize = pageSize * 4;
  }
4958
  int32_t code = createDiskbasedBuf(&pSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
L
Liu Jicong 已提交
4959
  for (int32_t i = 0; i < numOfOutput; ++i) {
4960 4961 4962
    pCtx[i].pBuf = pSup->pResultBuf;
  }
  return code;
5
54liuyao 已提交
4963
}