executorimpl.c 181.5 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

H
Haojun Liao 已提交
16 17
#include "filter.h"
#include "function.h"
18 19
#include "functionMgt.h"
#include "os.h"
H
Haojun Liao 已提交
20
#include "querynodes.h"
21
#include "tfill.h"
dengyihao's avatar
dengyihao 已提交
22
#include "tname.h"
X
Xiaoyu Wang 已提交
23
#include "tref.h"
24

H
Haojun Liao 已提交
25
#include "tdatablock.h"
26
#include "tglobal.h"
H
Haojun Liao 已提交
27
#include "tmsg.h"
H
Haojun Liao 已提交
28
#include "tsort.h"
29
#include "ttime.h"
H
Haojun Liao 已提交
30

31
#include "executorimpl.h"
dengyihao's avatar
dengyihao 已提交
32
#include "index.h"
33
#include "query.h"
34 35
#include "tcompare.h"
#include "tcompression.h"
H
Haojun Liao 已提交
36
#include "thash.h"
37
#include "ttypes.h"
dengyihao's avatar
dengyihao 已提交
38
#include "vnode.h"
39

H
Haojun Liao 已提交
40
#define IS_MAIN_SCAN(runtime)          ((runtime)->scanFlag == MAIN_SCAN)
41 42 43 44
#define SET_REVERSE_SCAN_FLAG(runtime) ((runtime)->scanFlag = REVERSE_SCAN)

#define GET_FORWARD_DIRECTION_FACTOR(ord) (((ord) == TSDB_ORDER_ASC) ? QUERY_ASC_FORWARD_STEP : QUERY_DESC_FORWARD_STEP)

45 46 47 48 49
enum {
  PROJECT_RETRIEVE_CONTINUE = 0x1,
  PROJECT_RETRIEVE_DONE = 0x2,
};

50 51
#if 0
// Fault-injecting stand-in for malloc: returns NULL when the random draw is a multiple of 1000,
// otherwise forwards the request to taosMemoryMalloc.
static UNUSED_FUNC void* u_malloc(size_t __size) {
  const uint32_t draw = taosRand();

  // the remainder of an unsigned value is never negative, so "<= 0" can only match zero
  const bool injectFailure = (draw % 1000 <= 0);

  return injectFailure ? NULL : taosMemoryMalloc(__size);
}

// Fault-injecting stand-in for calloc: returns NULL when the random draw is a multiple of 1000,
// otherwise forwards the request to taosMemoryCalloc.
static UNUSED_FUNC void* u_calloc(size_t num, size_t __size) {
  const uint32_t draw = taosRand();

  // the remainder of an unsigned value is never negative, so "<= 0" can only match zero
  const bool injectFailure = (draw % 1000 <= 0);

  return injectFailure ? NULL : taosMemoryCalloc(num, __size);
}

// Fault-injecting stand-in for realloc: returns NULL when the random draw modulo 5 is 0 or 1,
// otherwise forwards the request to taosMemoryRealloc.
static UNUSED_FUNC void* u_realloc(void* p, size_t __size) {
  const uint32_t draw = taosRand();
  const bool     injectFailure = (draw % 5 <= 1);

  return injectFailure ? NULL : taosMemoryRealloc(p, __size);
}

#define calloc  u_calloc
#define malloc  u_malloc
#define realloc u_realloc
#endif

X
Xiaoyu Wang 已提交
84
#define CLEAR_QUERY_STATUS(q, st)   ((q)->status &= (~(st)))
85 86
#define QUERY_IS_INTERVAL_QUERY(_q) ((_q)->interval.interval > 0)

L
Liu Jicong 已提交
87 88 89
// Returns twice the current value of the tsShellActivityTimer setting.
int32_t getMaximumIdleDurationSec() {
  int32_t idleDuration = tsShellActivityTimer * 2;
  return idleDuration;
}

// Placeholder lookup: validates (in assert-enabled builds) that the expression is a non-NULL
// unary-expression node, then always reports function id 0.
static int32_t getExprFunctionId(SExprInfo* pExprInfo) {
  assert(pExprInfo != NULL && pExprInfo->pExpr != NULL && pExprInfo->pExpr->nodeType == TEXPR_UNARYEXPR_NODE);

  const int32_t functionId = 0;
  return functionId;
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes);

96
static void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExpr, SSDataBlock* pSDataBlock);
97

X
Xiaoyu Wang 已提交
98
static void releaseQueryBuf(size_t numOfTables);
99 100 101 102 103

static void destroySFillOperatorInfo(void* param, int32_t numOfOutput);
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput);
static void destroyOrderOperatorInfo(void* param, int32_t numOfOutput);
static void destroyAggOperatorInfo(void* param, int32_t numOfOutput);
X
Xiaoyu Wang 已提交
104

H
Haojun Liao 已提交
105
static void destroyIntervalOperatorInfo(void* param, int32_t numOfOutput);
H
Haojun Liao 已提交
106 107
static void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput);

108 109
static void destroyOperatorInfo(SOperatorInfo* pOperator);

110
/**
 * Mark an operator as finished.
 *
 * Sets the operator status to OP_EXEC_DONE. When the operator is attached to a task, the total
 * cost is derived from the task start time and the task status is set to TASK_COMPLETED.
 *
 * The task pointer is checked before it is dereferenced: previously the cost computation read
 * pOperator->pTaskInfo->cost.start ahead of the NULL check, so an operator without a task would
 * have crashed instead of being skipped.
 *
 * @param pOperator operator to mark as completed; must not be NULL
 */
void doSetOperatorCompleted(SOperatorInfo* pOperator) {
  pOperator->status = OP_EXEC_DONE;

  if (pOperator->pTaskInfo == NULL) {
    // no owning task: there is no start time to measure against and no task status to update
    return;
  }

  // NOTE(review): cost.start is scaled by 1000 before being subtracted from a microsecond clock,
  // so it is presumably kept in milliseconds; the result is divided back by 1000.0 -- confirm.
  pOperator->cost.totalCost = (taosGetTimestampUs() - pOperator->pTaskInfo->cost.start * 1000) / 1000.0;
  setTaskStatus(pOperator->pTaskInfo, TASK_COMPLETED);
}
118

H
Haojun Liao 已提交
119
// Open callback that does no actual work: records a zero open cost, flags the operator as
// opened and reports success.
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator) {
  pOperator->cost.openCost = 0;
  OPTR_SET_OPENED(pOperator);

  return TSDB_CODE_SUCCESS;
}

125
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
L
Liu Jicong 已提交
126
                                   __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
127
                                   __optr_decode_fn_t decode, __optr_explain_fn_t explain) {
128 129 130 131 132 133 134 135 136 137 138 139 140 141
  SOperatorFpSet fpSet = {
      ._openFn = openFn,
      .getNextFn = nextFn,
      .getStreamResFn = streamFn,
      .cleanupFn = cleanup,
      .closeFn = closeFn,
      .encodeResultRow = encode,
      .decodeResultRow = decode,
      .getExplainFn = explain,
  };

  return fpSet;
}

H
Haojun Liao 已提交
142
// Close callback that intentionally does nothing; both arguments are ignored.
void operatorDummyCloseFn(void* param, int32_t numOfCols) {
  (void)param;
  (void)numOfCols;
}
H
Haojun Liao 已提交
143

X
Xiaoyu Wang 已提交
144 145 146
static int32_t doCopyToSDataBlock(SExecTaskInfo* taskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo,
                                  SDiskbasedBuf* pBuf, SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset,
                                  SqlFunctionCtx* pCtx, int32_t numOfExprs);
H
Haojun Liao 已提交
147

148
static void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size);
L
Liu Jicong 已提交
149 150
static void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                                     uint64_t groupId);
151

L
Liu Jicong 已提交
152 153
// setup the output buffer for each operator
// Tells whether a column may contain NULL values.
// Returns false for columns flagged by TSDB_COL_IS_TAG / TSDB_COL_IS_UD_COL and for the primary
// timestamp column, and also when block statistics are available and report zero NULLs.
// In every other case (including missing statistics) the answer is true.
static bool hasNull(SColumn* pColumn, SColumnDataAgg* pStatis) {
  const bool exemptColumn = TSDB_COL_IS_TAG(pColumn->flag) || TSDB_COL_IS_UD_COL(pColumn->flag) ||
                            (pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID);
  if (exemptColumn) {
    return false;
  }

  const bool statsReportNoNull = (pStatis != NULL) && (pStatis->numOfNull == 0);
  return !statsReportNoNull;
}

166
#if 0
L
Liu Jicong 已提交
167 168
// Checks whether a result row for (uid, pData) is already registered.
// For non-interval queries, and for interval queries outside the master scan, the answer is
// simply whether the key is present in pResultRowHashTable. During the master scan of an
// interval query the key must additionally be present in pResultRowListSet, and only when the
// current result row info holds a number of rows other than 0 or 1.
static bool chkResultRowFromKey(STaskRuntimeEnv* pRuntimeEnv, SResultRowInfo* pResultRowInfo, char* pData,
                                int16_t bytes, bool masterscan, uint64_t uid) {
  SET_RES_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid);

  SResultRow** ppRow =
      (SResultRow**)taosHashGet(pRuntimeEnv->pResultRowHashTable, pRuntimeEnv->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
  const bool keyKnown = (ppRow != NULL);

  // in case of repeat scan/reverse scan, or a non-interval query, the plain lookup decides
  if (!QUERY_IS_INTERVAL_QUERY(pRuntimeEnv->pQueryAttr) || !masterscan) {
    return keyKnown;
  }

  // the single-row comparison was disabled in the original code, so size == 1 reports "not existed"
  if (!keyKnown || pResultRowInfo->size == 0 || pResultRowInfo->size == 1) {
    return false;
  }

  // check if current pResultRowInfo contains the existed pResultRow
  SET_RES_EXT_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid, pResultRowInfo);
  int64_t* index =
      taosHashGet(pRuntimeEnv->pResultRowListSet, pRuntimeEnv->keyBuf, GET_RES_EXT_WINDOW_KEY_LEN(bytes));

  return index != NULL;
}
203
#endif
204

205
/**
 * Reserve room for one result row inside the paged result buffer.
 *
 * The row is placed on the last page registered for tableGroupId when interBufSize more bytes
 * still fit there; otherwise (or when the group has no page yet) a fresh page is requested.
 * The chosen page is flagged dirty and its used-bytes counter (num) is advanced.
 *
 * Every page pointer is checked before use. Previously the "no page yet" branch wrote
 * pData->num right after getNewBufPage() without a NULL check, and the page returned by
 * getBufPage() was dereferenced unchecked.
 *
 * @param pResultBuf    paged buffer that backs the result rows
 * @param tableGroupId  group whose page list is consulted/extended
 * @param interBufSize  number of bytes to reserve for the row
 * @return pointer to the reserved row with pageId/offset filled in, or NULL when no page could
 *         be obtained
 */
SResultRow* getNewResultRow(SDiskbasedBuf* pResultBuf, int64_t tableGroupId, int32_t interBufSize) {
  SFilePage* pData = NULL;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tableGroupId);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
    if (pData != NULL) {
      pData->num = sizeof(SFilePage);
    }
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

    if (pData != NULL && pData->num + interBufSize > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return NULL;
  }

  setBufPageDirty(pData, true);

  // the row starts at the current end of the used area of the page
  SResultRow* pResultRow = (SResultRow*)((char*)pData + pData->num);
  pResultRow->pageId = pageId;
  pResultRow->offset = (int32_t)pData->num;

  pData->num += interBufSize;

  return pResultRow;
}

247 248 249 250 251 252 253
/**
 * the struct of key in hash table
 * +----------+---------------+
 * | group id |   key data    |
 * | 8 bytes  | actual length |
 * +----------+---------------+
 */
254 255 256
/**
 * Locate, or create, the result row that belongs to the key (groupId, pData) and make it the
 * currently active row of pResultRowInfo.
 *
 * An existing hash entry is reused for non-interval queries, and for interval queries only when
 * masterscan is set. In every other case a new row is reserved from pResultBuf, initialized and
 * stored in the hash table under the key.
 *
 * Failure handling (both leave through longjmp on pTaskInfo->env, so the function does not
 * return in these cases):
 *  - TSDB_CODE_OUT_OF_MEMORY when no buffer page can be obtained for a new row. Previously the
 *    NULL result of getNewResultRow() was passed to initResultRow() and dereferenced.
 *  - TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW when the hash table grows beyond MAX_INTERVAL_TIME_WINDOW.
 *
 * @param pResultBuf      paged buffer holding the result rows
 * @param pResultRowInfo  tracks the active row position (cur)
 * @param pData           key bytes
 * @param bytes           length of pData
 * @param masterscan      see above; only consulted for interval queries
 * @param groupId         group id that is combined with pData to build the hash key
 * @param pTaskInfo       task whose jump buffer is used for error exits; must not be NULL
 * @param isIntervalQuery selects the reuse rule described above
 * @param pSup            supplies the key buffer, the hash table and the row size
 * @return the active result row (never NULL)
 */
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo, char* pData,
                                   int16_t bytes, bool masterscan, uint64_t groupId, SExecTaskInfo* pTaskInfo,
                                   bool isIntervalQuery, SAggSupporter* pSup) {
  SET_RES_WINDOW_KEY(pSup->keyBuf, pData, bytes, groupId);

  SResultRowPosition* p1 =
      (SResultRowPosition*)taosHashGet(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));

  SResultRow* pResult = NULL;

  // group-by style queries always reuse the stored row; interval queries do so only in the master scan
  if (p1 != NULL && (masterscan || !isIntervalQuery)) {
    pResult = getResultRowByPos(pResultBuf, p1);
    ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
  }

  // 1. close current opened time window
  if (pResultRowInfo->cur.pageId != -1 && ((pResult == NULL) || (pResult->pageId != pResultRowInfo->cur.pageId))) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_1");
#endif
    SResultRowPosition pos = pResultRowInfo->cur;
    SFilePage*         pPage = getBufPage(pResultBuf, pos.pageId);
    releaseBufPage(pResultBuf, pPage);
  }

  // allocate a new buffer page
  if (pResult == NULL) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_2");
#endif
    ASSERT(pSup->resultRowSize > 0);
    pResult = getNewResultRow(pResultBuf, groupId, pSup->resultRowSize);
    if (pResult == NULL) {
      // no page available for the new row: abort the task instead of dereferencing NULL
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    initResultRow(pResult);

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = pResult->pageId, .offset = pResult->offset};
    taosHashPut(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes), &pos,
                sizeof(SResultRowPosition));
  }

  // 2. set the new time window to be the new active time window
  pResultRowInfo->cur = (SResultRowPosition){.pageId = pResult->pageId, .offset = pResult->offset};

  // too many time window in query
  if (taosHashGetSize(pSup->pResultRowHashTable) > MAX_INTERVAL_TIME_WINDOW) {
    longjmp(pTaskInfo->env, TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW);
  }

  return pResult;
}

317
// a new buffer page for each table. Needs to opt this design
L
Liu Jicong 已提交
318
/**
 * Assign buffer space to a result row that does not have any yet.
 *
 * A row whose pageId is not -1 already owns space and is left untouched. Otherwise the row is
 * placed on the last page registered for tid when size more bytes fit there, or on a freshly
 * requested page.
 *
 * Every page pointer is checked before use. Previously the "no page yet" branch wrote
 * pData->num right after getNewBufPage() without a NULL check, and the page returned by
 * getBufPage() was dereferenced unchecked.
 *
 * @param pWindowRes  row to place; its pageId/offset are filled in on success
 * @param pResultBuf  paged buffer that backs the result rows
 * @param tid         id whose page list is consulted/extended
 * @param size        number of bytes to reserve
 * @return 0 on success (including the "already placed" case), -1 when no page could be obtained
 */
static int32_t addNewWindowResultBuf(SResultRow* pWindowRes, SDiskbasedBuf* pResultBuf, int32_t tid, uint32_t size) {
  if (pWindowRes->pageId != -1) {
    return 0;
  }

  SFilePage* pData = NULL;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tid);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tid, &pageId);
    if (pData != NULL) {
      pData->num = sizeof(SFilePage);
    }
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

    if (pData != NULL && pData->num + size > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tid, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return -1;
  }

  // The early return at the top guarantees the row is still unplaced here, so the space can be
  // claimed unconditionally: the row starts at the current end of the used area of the page.
  pWindowRes->pageId = pageId;
  pWindowRes->offset = (int32_t)pData->num;

  pData->num += size;
  assert(pWindowRes->pageId >= 0);

  return 0;
}

364
//  query_range_start, query_range_end, window_duration, window_start, window_end
365
// Prepares a five-row timestamp column describing the execution time window. Row layout:
//   0: query_range_start, 1: query_range_end, 2: window_duration, 3: window_start, 4: window_end
// Rows 0/3 receive pQueryWindow->skey, rows 1/4 receive pQueryWindow->ekey, row 2 is set to 0.
void initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow) {
  enum {
    ROW_QUERY_START = 0,
    ROW_QUERY_END = 1,
    ROW_WINDOW_DURATION = 2,
    ROW_WINDOW_START = 3,
    ROW_WINDOW_END = 4,
    NUM_OF_WINDOW_ROWS = 5,
  };

  pColData->info.type = TSDB_DATA_TYPE_TIMESTAMP;
  pColData->info.bytes = sizeof(int64_t);
  colInfoDataEnsureCapacity(pColData, NUM_OF_WINDOW_ROWS);

  colDataAppendInt64(pColData, ROW_QUERY_START, &pQueryWindow->skey);
  colDataAppendInt64(pColData, ROW_QUERY_END, &pQueryWindow->ekey);

  // this value may be variable in case of 'n' and 'y'.
  int64_t duration = 0;
  colDataAppendInt64(pColData, ROW_WINDOW_DURATION, &duration);

  colDataAppendInt64(pColData, ROW_WINDOW_START, &pQueryWindow->skey);
  colDataAppendInt64(pColData, ROW_WINDOW_END, &pQueryWindow->ekey);
}

H
Haojun Liao 已提交
379 380 381 382
// Releases the time-window column by handing it to colDataDestroy.
void cleanupExecTimeWindowInfo(SColumnInfoData* pColData) { colDataDestroy(pColData); }

X
Xiaoyu Wang 已提交
383 384 385
// Runs every function context over the row slice [offset, offset + forwardStep) of its input.
// - Window pseudo-column functions are evaluated through the scalar callback against
//   pTimeWindowData and always yield exactly one result.
// - All other functions go through fpSet.process (when they need to execute and a callback is
//   set); a failure is logged, stored in taskInfo->code and escalated via longjmp.
// pWin, tsCol and order are accepted but not used by this implementation.
void doApplyFunctions(SExecTaskInfo* taskInfo, SqlFunctionCtx* pCtx, STimeWindow* pWin,
                      SColumnInfoData* pTimeWindowData, int32_t offset, int32_t forwardStep, TSKEY* tsCol,
                      int32_t numOfTotal, int32_t numOfOutput, int32_t order) {
  for (int32_t k = 0; k < numOfOutput; ++k) {
    SqlFunctionCtx*       pOne = &pCtx[k];
    SInputColumnInfoData* pIn = &pOne->input;

    // remember the caller's view of the input so it can be put back afterwards
    const bool    savedAggIsSet = pIn->colDataAggIsSet;
    const int32_t savedNumOfRows = pIn->numOfRows;
    const int32_t savedStartRow = pIn->startRowIndex;

    pIn->startRowIndex = offset;
    pIn->numOfRows = forwardStep;

    // not a whole block involved in query processing, statistics data can not be used
    if (forwardStep < numOfTotal && pIn->colDataAggIsSet) {
      pIn->colDataAggIsSet = false;
    }

    if (fmIsWindowPseudoColumnFunc(pOne->functionId)) {
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(pOne);

      // the scalar result is written straight into the entry's intermediate buffer
      SColumnInfoData idata = {0};
      idata.info.type = TSDB_DATA_TYPE_BIGINT;
      idata.info.bytes = tDataTypes[TSDB_DATA_TYPE_BIGINT].bytes;
      idata.pData = GET_ROWCELL_INTERBUF(pEntryInfo);

      SScalarParam out = {.columnData = &idata};
      SScalarParam tw = {.numOfRows = 5, .columnData = pTimeWindowData};
      pOne->sfp.process(&tw, 1, &out);
      pEntryInfo->numOfRes = 1;

      // NOTE(review): the saved input state is not restored on this path (same as before this rewrite)
      continue;
    }

    if (functionNeedToExecute(pOne) && pOne->fpSet.process != NULL) {
      int32_t code = pOne->fpSet.process(pOne);
      if (code != TSDB_CODE_SUCCESS) {
        qError("%s apply functions error, code: %s", GET_TASKID(taskInfo), tstrerror(code));
        taskInfo->code = code;
        longjmp(taskInfo->env, code);
      }
    }

    // restore it
    pIn->colDataAggIsSet = savedAggIsSet;
    pIn->startRowIndex = savedStartRow;
    pIn->numOfRows = savedNumOfRows;
  }
}

dengyihao's avatar
dengyihao 已提交
436
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
437
                                   int32_t scanFlag, bool createDummyCol);
438

dengyihao's avatar
dengyihao 已提交
439 440
// For each expression of the operator: records the scan order and the block's row count in the
// matching function context, then lets setBlockStatisInfo attach the block statistics.
static void doSetInputDataBlockInfo(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock,
                                    int32_t order) {
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
    SqlFunctionCtx* pOne = &pCtx[i];

    pOne->order = order;
    pOne->input.numOfRows = pBlock->info.rows;

    setBlockStatisInfo(pOne, &pOperator->exprSupp.pExprInfo[i], pBlock);
  }
}

X
Xiaoyu Wang 已提交
448 449
// Binds pBlock as the input of every function context of the operator.
// Blocks that carry pre-computed aggregates (pBlockAgg) take the statistics path; all other
// blocks are bound column by column. The status returned by the column path is not propagated.
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                       int32_t scanFlag, bool createDummyCol) {
  if (pBlock->pBlockAgg == NULL) {
    doSetInputDataBlock(pOperator, pCtx, pBlock, order, scanFlag, createDummyCol);
    return;
  }

  doSetInputDataBlockInfo(pOperator, pCtx, pBlock, order);
}

L
Liu Jicong 已提交
457 458
/**
 * Materialize a constant function parameter as an input column with numOfRows identical rows.
 *
 * The column stored at pInput->pData[paramIndex] is created on first use (type and byte width
 * taken from the parameter) and reused afterwards. BIGINT/UBIGINT, DOUBLE and VARCHAR constants
 * are filled in; any other type leaves the rows unwritten.
 *
 * Fixes over the previous version: the temporary var-string built for VARCHAR constants is now
 * released after the rows have been appended (it used to leak on every call), and a failed
 * allocation of that temporary is reported instead of being written through.
 *
 * @param pInput      input descriptor that owns the column slots
 * @param pFuncParam  constant parameter to replicate
 * @param paramIndex  slot in pInput->pData to fill
 * @param numOfRows   number of rows to generate
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when an allocation fails
 */
static int32_t doCreateConstantValColumnInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t paramIndex,
                                             int32_t numOfRows) {
  SColumnInfoData* pColInfo = NULL;
  if (pInput->pData[paramIndex] == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
    pColInfo->info.type = pFuncParam->param.nType;
    pColInfo->info.bytes = pFuncParam->param.nLen;

    pInput->pData[paramIndex] = pColInfo;
  } else {
    pColInfo = pInput->pData[paramIndex];
  }

  colInfoDataEnsureCapacity(pColInfo, numOfRows);

  int8_t type = pFuncParam->param.nType;
  if (type == TSDB_DATA_TYPE_BIGINT || type == TSDB_DATA_TYPE_UBIGINT) {
    int64_t v = pFuncParam->param.i;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendInt64(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendDouble(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_VARCHAR) {
    // build one var-string (header + payload) and append it to every row
    char* tmp = taosMemoryMalloc(pFuncParam->param.nLen + VARSTR_HEADER_SIZE);
    if (tmp == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    STR_WITH_SIZE_TO_VARSTR(tmp, pFuncParam->param.pz, pFuncParam->param.nLen);
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppend(pColInfo, i, tmp, false);
    }

    // NOTE(review): relies on colDataAppend copying the value into the column -- confirm
    taosMemoryFree(tmp);
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
499
// Binds the columns of pBlock to the input slots of every function context.
// - Column parameters point straight at the block's column data; for timeline functions the
//   last parameter is additionally recorded as the primary timestamp column (pPTS).
// - A value parameter is expanded into a constant column only when createDummyCol is set and
//   the expression has exactly one parameter.
// Returns TSDB_CODE_SUCCESS, or the error reported while building a constant column.
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                                   int32_t scanFlag, bool createDummyCol) {
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
    SqlFunctionCtx*       pOne = &pCtx[i];
    SInputColumnInfoData* pInput = &pOne->input;

    pOne->order = order;
    pOne->pSrcBlock = pBlock;
    pOne->scanFlag = scanFlag;

    pInput->numOfRows = pBlock->info.rows;
    pInput->uid = pBlock->info.uid;
    pInput->colDataAggIsSet = false;

    SExprInfo* pOneExpr = &pOperator->exprSupp.pExprInfo[i];
    for (int32_t j = 0; j < pOneExpr->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pOneExpr->base.pParam[j];

      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;

        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
        pInput->totalRows = pBlock->info.rows;
        pInput->numOfRows = pBlock->info.rows;
        pInput->startRowIndex = 0;

        // NOTE: the last parameter is the primary timestamp column
        // todo: refactor this
        const bool isLastParam = (j == pOneExpr->base.numOfParams - 1);
        if (fmIsTimelineFunc(pOne->functionId) && isLastParam) {
          // in case of merge function, this is not always the ts column data.
          pInput->pPTS = pInput->pData[j];
        }

        ASSERT(pInput->pData[j] != NULL);
        continue;
      }

      if (pFuncParam->type != FUNC_PARAM_TYPE_VALUE) {
        continue;
      }

      // todo avoid case: top(k, 12), 12 is the value parameter.
      // sum(11), 11 is also the value parameter.
      if (!createDummyCol || pOneExpr->base.numOfParams != 1) {
        continue;
      }

      pInput->totalRows = pBlock->info.rows;
      pInput->numOfRows = pBlock->info.rows;
      pInput->startRowIndex = 0;

      int32_t code = doCreateConstantValColumnInfo(pInput, pFuncParam, j, pBlock->info.rows);
      if (code != TSDB_CODE_SUCCESS) {
        return code;
      }
    }
  }

  return TSDB_CODE_SUCCESS;
}

551
// Invokes the process callback of every function context that needs to execute.
// Contexts without a process callback are skipped. The first failing callback is logged and
// its error code is returned immediately; otherwise TSDB_CODE_SUCCESS is returned.
static int32_t doAggregateImpl(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx) {
  for (int32_t k = 0; k < pOperator->exprSupp.numOfExprs; ++k) {
    SqlFunctionCtx* pOne = &pCtx[k];

    // todo add a dummy funtion to avoid process check
    if (!functionNeedToExecute(pOne) || pOne->fpSet.process == NULL) {
      continue;
    }

    int32_t code = pOne->fpSet.process(pOne);
    if (code != TSDB_CODE_SUCCESS) {
      qError("%s aggregate function error happens, code: %s", GET_TASKID(pOperator->pTaskInfo), tstrerror(code));
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
570
// Points the output of the first N function contexts at the first N columns of pResult, where
// N is the number of entries in pPseudoList. A NULL list leaves every context untouched.
static void setPseudoOutputColInfo(SSDataBlock* pResult, SqlFunctionCtx* pCtx, SArray* pPseudoList) {
  if (pPseudoList == NULL) {
    return;
  }

  size_t numOfPseudo = taosArrayGetSize(pPseudoList);
  for (int32_t i = 0; i < numOfPseudo; ++i) {
    pCtx[i].pOutput = taosArrayGet(pResult->pDataBlock, i);
  }
}

577
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
X
Xiaoyu Wang 已提交
578
                              int32_t numOfOutput, SArray* pPseudoList) {
H
Haojun Liao 已提交
579
  setPseudoOutputColInfo(pResult, pCtx, pPseudoList);
H
Haojun Liao 已提交
580
  pResult->info.groupId = pSrcBlock->info.groupId;
H
Haojun Liao 已提交
581

582 583
  // if the source equals to the destination, it is to create a new column as the result of scalar
  // function or some operators.
584 585
  bool createNewColModel = (pResult == pSrcBlock);

586 587
  int32_t numOfRows = 0;

588
  for (int32_t k = 0; k < numOfOutput; ++k) {
589 590
    int32_t               outputSlotId = pExpr[k].base.resSchema.slotId;
    SqlFunctionCtx*       pfCtx = &pCtx[k];
591
    SInputColumnInfoData* pInputData = &pfCtx->input;
592

L
Liu Jicong 已提交
593
    if (pExpr[k].pExpr->nodeType == QUERY_NODE_COLUMN) {  // it is a project query
594
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
595
      if (pResult->info.rows > 0 && !createNewColModel) {
596 597
        colDataMergeCol(pColInfoData, pResult->info.rows, &pResult->info.capacity, pInputData->pData[0],
                        pInputData->numOfRows);
598
      } else {
599
        colDataAssign(pColInfoData, pInputData->pData[0], pInputData->numOfRows, &pResult->info);
600
      }
601

602
      numOfRows = pInputData->numOfRows;
603
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE) {
604
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
605

dengyihao's avatar
dengyihao 已提交
606
      int32_t offset = createNewColModel ? 0 : pResult->info.rows;
607 608 609 610 611 612 613 614

      int32_t type = pExpr[k].base.pParam[0].param.nType;
      if (TSDB_DATA_TYPE_NULL == type) {
        colDataAppendNNULL(pColInfoData, offset, pSrcBlock->info.rows);
      } else {
        for (int32_t i = 0; i < pSrcBlock->info.rows; ++i) {
          colDataAppend(pColInfoData, i + offset, taosVariantGet(&pExpr[k].base.pParam[0].param, type), false);
        }
615
      }
616 617

      numOfRows = pSrcBlock->info.rows;
H
Haojun Liao 已提交
618
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_OPERATOR) {
619 620 621
      SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
      taosArrayPush(pBlockList, &pSrcBlock);

622
      SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
623
      SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
624

625
      SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
626
      int32_t      code = scalarCalculate(pExpr[k].pExpr->_optrRoot.pRootNode, pBlockList, &dest);
627 628 629 630
      if (code != TSDB_CODE_SUCCESS) {
        taosArrayDestroy(pBlockList);
        return code;
      }
631

dengyihao's avatar
dengyihao 已提交
632
      int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
633
      ASSERT(pResult->info.capacity > 0);
634
      colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
635 636
      colDataDestroy(&idata);
      
637
      numOfRows = dest.numOfRows;
638 639
      taosArrayDestroy(pBlockList);
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_FUNCTION) {
640 641
      // _rowts/_c0, not tbname column
      if (fmIsPseudoColumnFunc(pfCtx->functionId) && (!fmIsScanPseudoColumnFunc(pfCtx->functionId))) {
H
Haojun Liao 已提交
642
        // do nothing
643
      } else if (fmIsIndefiniteRowsFunc(pfCtx->functionId)) {
644 645
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pfCtx);
        pfCtx->fpSet.init(pfCtx, pResInfo);
646 647 648 649 650 651 652 653 654 655 656

        pfCtx->pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
        pfCtx->offset = createNewColModel ? 0 : pResult->info.rows;  // set the start offset

        // set the timestamp(_rowts) output buffer
        if (taosArrayGetSize(pPseudoList) > 0) {
          int32_t* outputColIndex = taosArrayGet(pPseudoList, 0);
          pfCtx->pTsOutput = (SColumnInfoData*)pCtx[*outputColIndex].pOutput;
        }

        numOfRows = pfCtx->fpSet.process(pfCtx);
H
Haojun Liao 已提交
657
      } else if (fmIsAggFunc(pfCtx->functionId)) {
658 659
        // _group_key function for "partition by tbname" + csum(col_name) query
        SColumnInfoData* pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
660
        int32_t          slotId = pfCtx->param[0].pCol->slotId;
661 662 663

        // todo handle the json tag
        SColumnInfoData* pInput = taosArrayGet(pSrcBlock->pDataBlock, slotId);
664
        for (int32_t f = 0; f < pSrcBlock->info.rows; ++f) {
665 666 667 668 669 670 671 672 673
          bool isNull = colDataIsNull_s(pInput, f);
          if (isNull) {
            colDataAppendNULL(pOutput, pResult->info.rows + f);
          } else {
            char* data = colDataGetData(pInput, f);
            colDataAppend(pOutput, pResult->info.rows + f, data, isNull);
          }
        }

H
Haojun Liao 已提交
674 675 676
      } else {
        SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
        taosArrayPush(pBlockList, &pSrcBlock);
G
Ganlin Zhao 已提交
677

678
        SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
679
        SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
H
Haojun Liao 已提交
680

681
        SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
682
        int32_t      code = scalarCalculate((SNode*)pExpr[k].pExpr->_function.pFunctNode, pBlockList, &dest);
683 684 685 686
        if (code != TSDB_CODE_SUCCESS) {
          taosArrayDestroy(pBlockList);
          return code;
        }
687

dengyihao's avatar
dengyihao 已提交
688
        int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
689
        ASSERT(pResult->info.capacity > 0);
690
        colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
691
        colDataDestroy(&idata);
692 693

        numOfRows = dest.numOfRows;
H
Haojun Liao 已提交
694 695
        taosArrayDestroy(pBlockList);
      }
696
    } else {
697
      ASSERT(0);
698 699
    }
  }
700

701 702 703
  if (!createNewColModel) {
    pResult->info.rows += numOfRows;
  }
704 705

  return TSDB_CODE_SUCCESS;
706 707
}

5
54liuyao 已提交
708
// Decides whether the function bound to pCtx has to run for the current input:
//  - a function id of -1 never runs;
//  - during a REPEAT_SCAN only functions accepted by fmIsRepeatScanFunc run;
//  - otherwise the function runs unless its result entry is already completed.
bool functionNeedToExecute(SqlFunctionCtx* pCtx) {
  if (pCtx->functionId == -1) {
    return false;
  }

  if (pCtx->scanFlag == REPEAT_SCAN) {
    return fmIsRepeatScanFunc(pCtx->functionId);
  }

  struct SResultRowEntryInfo* pEntry = GET_RES_INFO(pCtx);
  return !isRowEntryCompleted(pEntry);
}

728 729 730 731 732 733 734
/*
 * Build the pre-aggregation (SColumnDataAgg) entry for a constant-valued function parameter.
 *
 * pInput     : input descriptor whose pData[paramIndex] / pColumnDataAgg[paramIndex] slots are filled
 * pFuncParam : the constant parameter; param.i or param.d is read depending on `type`
 * type       : data type of the constant, must not be a variable-length type
 * paramIndex : index of the parameter slot to populate
 * numOfRows  : number of rows in the block, used to derive the sum
 *
 * Both slots are allocated lazily and reused on later calls.
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY if an allocation fails.
 */
static int32_t doCreateConstantValColumnAggInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t type,
                                                int32_t paramIndex, int32_t numOfRows) {
  SColumnInfoData* pColInfo = pInput->pData[paramIndex];
  if (pColInfo == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    pInput->pData[paramIndex] = pColInfo;
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // only the type and width are recorded; no cell data is attached here
    pColInfo->info.type = type;
    pColInfo->info.bytes = tDataTypes[type].bytes;
  }

  SColumnDataAgg* pAgg = pInput->pColumnDataAgg[paramIndex];
  if (pAgg == NULL) {
    pAgg = taosMemoryCalloc(1, sizeof(SColumnDataAgg));
    pInput->pColumnDataAgg[paramIndex] = pAgg;
    if (pAgg == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  ASSERT(!IS_VAR_DATA_TYPE(type));

  if (type == TSDB_DATA_TYPE_BIGINT) {
    int64_t val = pFuncParam->param.i;
    *pAgg = (SColumnDataAgg){.numOfNull = 0, .min = val, .max = val, .sum = val * numOfRows};
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double val = pFuncParam->param.d;
    *pAgg = (SColumnDataAgg){.numOfNull = 0};

    // the min/max/sum fields are reused as storage for double values
    *(double*)&pAgg->min = val;
    *(double*)&pAgg->max = val;
    *(double*)&pAgg->sum = val * numOfRows;
  } else if (type == TSDB_DATA_TYPE_BOOL) {  // todo validate this data type
    bool val = pFuncParam->param.i;
    *pAgg = (SColumnDataAgg){.numOfNull = 0};

    // NOTE(review): min is pinned to 0 rather than val, and sum is written through a bool
    // lvalue so it can only hold 0 or 1 -- confirm this is what the consumers expect.
    *(bool*)&pAgg->min = 0;
    *(bool*)&pAgg->max = val;
    *(bool*)&pAgg->sum = val * numOfRows;
  } else if (type == TSDB_DATA_TYPE_TIMESTAMP) {
    // nothing is written for timestamp constants
  } else {
    ASSERT(0);
  }

  return TSDB_CODE_SUCCESS;
}
779 780 781 782 783 784 785 786 787 788 789

/*
 * Attach the block-level pre-aggregation results of pBlock to the input of pCtx.
 *
 * The row counters of the input are always refreshed. If the block has no pBlockAgg,
 * colDataAggIsSet is cleared and nothing else is touched. Otherwise every parameter of
 * pExprInfo is visited: column parameters are wired to the matching pBlockAgg entry and
 * column info, constant parameters get a synthesized entry.
 */
void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, SSDataBlock* pBlock) {
  SInputColumnInfoData* pInput = &pCtx->input;
  int32_t               rows = pBlock->info.rows;

  pInput->numOfRows = rows;
  pInput->totalRows = rows;

  if (pBlock->pBlockAgg == NULL) {
    pInput->colDataAggIsSet = false;
    return;
  }

  pInput->colDataAggIsSet = true;

  for (int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
    SFunctParam* pParam = &pExprInfo->base.pParam[j];

    if (pParam->type == FUNC_PARAM_TYPE_COLUMN) {
      int32_t slotId = pParam->pCol->slotId;

      // a single column without statistics disables the whole pre-aggregation path
      pInput->pColumnDataAgg[j] = pBlock->pBlockAgg[slotId];
      if (pInput->pColumnDataAgg[j] == NULL) {
        pInput->colDataAggIsSet = false;
      }

      // The column info is attached because the data type of each column is required;
      // the cell data of that SColumnInfoData is not meant to be used.
      pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
    } else if (pParam->type == FUNC_PARAM_TYPE_VALUE) {
      // the status code returned by the helper is not inspected here
      doCreateConstantValColumnAggInfo(pInput, pParam, pParam->param.nType, j, pBlock->info.rows);
    }
  }

  // Disabled: statistics for the primary timestamp column
  //  if (pCtx->functionId == FUNCTION_SPREAD && pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
  //    pCtx->isAggSet = true;
  //    pCtx->agg.min = pBlock->info.window.skey;
  //    pCtx->agg.max = pBlock->info.window.ekey;
  //  }
}

L
Liu Jicong 已提交
819
/*
 * Report whether the task should be aborted.
 *
 * The idle-timeout check is still evaluated for owned tasks, but the branch that would
 * return true is commented out, so this function currently always returns false.
 */
bool isTaskKilled(SExecTaskInfo* pTaskInfo) {
  // tasks without an owner are never subject to the timeout check
  if (pTaskInfo->owner == 0) {
    return false;
  }

  // the query has been running longer than the allowed idle period and no retrieve arrived
  if ((taosGetTimestampSec() - pTaskInfo->cost.start / 1000) > 10 * getMaximumIdleDurationSec()
      /*(!needBuildResAfterQueryComplete(pTaskInfo))*/) {
    assert(pTaskInfo->cost.start != 0);
    //    qDebug("QInfo:%" PRIu64 " retrieve not arrive beyond %d ms, abort current query execution, start:%" PRId64
    //           ", current:%d", pQInfo->qId, 1, pQInfo->startExecTs, taosGetTimestampSec());
    //    return true;
  }

  return false;
}

L
Liu Jicong 已提交
834
// Mark the task as cancelled by storing TSDB_CODE_TSC_QUERY_CANCELLED in its code field.
void setTaskKilled(SExecTaskInfo* pTaskInfo) {
  pTaskInfo->code = TSDB_CODE_TSC_QUERY_CANCELLED;
}
835 836

/////////////////////////////////////////////////////////////////////////////////////////////
L
Liu Jicong 已提交
837
// todo refactor : return window
838
/*
 * Compute the time window that contains `key`.
 *
 * win->skey is `key` truncated by taosTimeTruncate(); win->ekey is one tick before the
 * result of adding one interval to skey. The result is written to *win.
 */
void getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key, STimeWindow* win) {
  win->skey = taosTimeTruncate(key, pInterval, precision);
  win->ekey = taosTimeAdd(win->skey, pInterval->interval, pInterval->intervalUnit, precision) - 1;

  // An end key that falls below the start key means the addition wrapped around, which can
  // only happen close to INT64_MAX. Clamp the window end instead of adjusting the range.
  if (win->ekey < win->skey) {
    win->ekey = INT64_MAX;
  }
}

851
#if 0
L
Liu Jicong 已提交
852
static int32_t updateBlockLoadStatus(STaskAttr* pQuery, int32_t status) {
853

854 855 856
  bool hasFirstLastFunc = false;
  bool hasOtherFunc = false;

857
  if (status == BLK_DATA_DATA_LOAD || status == BLK_DATA_FILTEROUT) {
858 859 860 861 862
    return status;
  }

  for (int32_t i = 0; i < pQuery->numOfOutput; ++i) {
    int32_t functionId = getExprFunctionId(&pQuery->pExpr1[i]);
863

864 865 866 867 868 869 870 871 872 873
    if (functionId == FUNCTION_TS || functionId == FUNCTION_TS_DUMMY || functionId == FUNCTION_TAG ||
        functionId == FUNCTION_TAG_DUMMY) {
      continue;
    }

    if (functionId == FUNCTION_FIRST_DST || functionId == FUNCTION_LAST_DST) {
      hasFirstLastFunc = true;
    } else {
      hasOtherFunc = true;
    }
874

875 876
  }

877
  if (hasFirstLastFunc && status == BLK_DATA_NOT_LOAD) {
L
Liu Jicong 已提交
878
    if (!hasOtherFunc) {
879
      return BLK_DATA_FILTEROUT;
880
    } else {
881
      return BLK_DATA_DATA_LOAD;
882 883 884 885 886 887
    }
  }

  return status;
}

888 889
#endif

L
Liu Jicong 已提交
890 891
// static void updateDataCheckOrder(SQInfo *pQInfo, SQueryTableReq* pQueryMsg, bool stableQuery) {
//   STaskAttr* pQueryAttr = pQInfo->runtimeEnv.pQueryAttr;
H
Haojun Liao 已提交
892
//
L
Liu Jicong 已提交
893 894 895 896
//   // in case of point-interpolation query, use asc order scan
//   char msg[] = "QInfo:0x%"PRIx64" scan order changed for %s query, old:%d, new:%d, qrange exchanged, old qrange:%"
//   PRId64
//                "-%" PRId64 ", new qrange:%" PRId64 "-%" PRId64;
H
Haojun Liao 已提交
897
//
L
Liu Jicong 已提交
898 899 900 901 902
//   // todo handle the case the the order irrelevant query type mixed up with order critical query type
//   // descending order query for last_row query
//   if (isFirstLastRowQuery(pQueryAttr)) {
//     //qDebug("QInfo:0x%"PRIx64" scan order changed for last_row query, old:%d, new:%d", pQInfo->qId,
//     pQueryAttr->order.order, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
903
//
L
Liu Jicong 已提交
904 905
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
906
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
907
//     }
H
Haojun Liao 已提交
908
//
L
Liu Jicong 已提交
909 910 911
//     pQueryAttr->needReverseScan = false;
//     return;
//   }
H
Haojun Liao 已提交
912
//
L
Liu Jicong 已提交
913 914 915
//   if (pQueryAttr->groupbyColumn && pQueryAttr->order.order == TSDB_ORDER_DESC) {
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
916
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
917
//     }
H
Haojun Liao 已提交
918
//
L
Liu Jicong 已提交
919 920 921 922
//     pQueryAttr->needReverseScan = false;
//     doUpdateLastKey(pQueryAttr);
//     return;
//   }
H
Haojun Liao 已提交
923
//
L
Liu Jicong 已提交
924 925 926 927 928 929
//   if (pQueryAttr->pointInterpQuery && pQueryAttr->interval.interval == 0) {
//     if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       //qDebug(msg, pQInfo->qId, "interp", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey); TSWAP(pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, TSKEY);
//     }
H
Haojun Liao 已提交
930
//
L
Liu Jicong 已提交
931 932 933
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     return;
//   }
H
Haojun Liao 已提交
934
//
L
Liu Jicong 已提交
935 936 937 938
//   if (pQueryAttr->interval.interval == 0) {
//     if (onlyFirstQuery(pQueryAttr)) {
//       if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//         //qDebug(msg, pQInfo->qId, "only-first", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
H
Haojun Liao 已提交
939 940
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
941
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
942 943 944 945 946 947 948 949 950 951
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_ASC;
//      pQueryAttr->needReverseScan = false;
//    } else if (onlyLastQuery(pQueryAttr) && notContainSessionOrStateWindow(pQueryAttr)) {
//      if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//        //qDebug(msg, pQInfo->qId, "only-last", pQueryAttr->order.order, TSDB_ORDER_DESC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
952
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
953 954 955 956 957 958 959 960 961 962 963 964
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_DESC;
//      pQueryAttr->needReverseScan = false;
//    }
//
//  } else {  // interval query
//    if (stableQuery) {
//      if (onlyFirstQuery(pQueryAttr)) {
//        if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-first stable", pQueryAttr->order.order, TSDB_ORDER_ASC,
L
Liu Jicong 已提交
965 966
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
967
//
wafwerar's avatar
wafwerar 已提交
968
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
969 970 971 972 973 974 975 976
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_ASC;
//        pQueryAttr->needReverseScan = false;
//      } else if (onlyLastQuery(pQueryAttr)) {
//        if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-last stable", pQueryAttr->order.order, TSDB_ORDER_DESC,
L
Liu Jicong 已提交
977 978
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
979
//
wafwerar's avatar
wafwerar 已提交
980
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
981 982 983 984 985 986 987 988 989
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_DESC;
//        pQueryAttr->needReverseScan = false;
//      }
//    }
//  }
//}
990

L
Liu Jicong 已提交
991 992 993
// static FORCE_INLINE bool doFilterByBlockStatistics(STaskRuntimeEnv* pRuntimeEnv, SDataStatis *pDataStatis,
// SqlFunctionCtx *pCtx, int32_t numOfRows) {
//   STaskAttr* pQueryAttr = pRuntimeEnv->pQueryAttr;
994
//
L
Liu Jicong 已提交
995 996 997
//   if (pDataStatis == NULL || pQueryAttr->pFilters == NULL) {
//     return true;
//   }
998
//
L
Liu Jicong 已提交
999 1000
//   return filterRangeExecute(pQueryAttr->pFilters, pDataStatis, pQueryAttr->numOfCols, numOfRows);
// }
1001
#if 0
H
Haojun Liao 已提交
1002
static bool overlapWithTimeWindow(STaskAttr* pQueryAttr, SDataBlockInfo* pBlockInfo) {
1003 1004
  STimeWindow w = {0};

dengyihao's avatar
dengyihao 已提交
1005 1006
  TSKEY sk = TMIN(pQueryAttr->window.skey, pQueryAttr->window.ekey);
  TSKEY ek = TMAX(pQueryAttr->window.skey, pQueryAttr->window.ekey);
1007

1008
  if (true) {
L
Liu Jicong 已提交
1009
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.skey, sk, ek, &w);
1010 1011 1012 1013 1014 1015
    assert(w.ekey >= pBlockInfo->window.skey);

    if (w.ekey < pBlockInfo->window.ekey) {
      return true;
    }

L
Liu Jicong 已提交
1016 1017
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1018 1019 1020 1021 1022 1023 1024 1025 1026 1027
      if (w.skey > pBlockInfo->window.ekey) {
        break;
      }

      assert(w.ekey > pBlockInfo->window.ekey);
      if (w.skey <= pBlockInfo->window.ekey && w.skey > pBlockInfo->window.skey) {
        return true;
      }
    }
  } else {
L
Liu Jicong 已提交
1028
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.ekey, sk, ek, &w);
1029 1030 1031 1032 1033 1034
    assert(w.skey <= pBlockInfo->window.ekey);

    if (w.skey > pBlockInfo->window.skey) {
      return true;
    }

L
Liu Jicong 已提交
1035 1036
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1037 1038 1039 1040 1041 1042 1043 1044 1045 1046 1047 1048 1049
      if (w.ekey < pBlockInfo->window.skey) {
        break;
      }

      assert(w.skey < pBlockInfo->window.skey);
      if (w.ekey < pBlockInfo->window.ekey && w.ekey >= pBlockInfo->window.skey) {
        return true;
      }
    }
  }

  return false;
}
1050
#endif
1051 1052

/*
 * Placeholder for the per-block load-requirement check.
 *
 * The previous implementation was compiled out with `#if 0` (and its core call was already
 * commented out), so the only live statement was `return 0;`. The dead code has been
 * dropped; it remains available in version control if the check is re-implemented.
 *
 * Neither argument is read. Always returns 0.
 */
static uint32_t doFilterByBlockTimeWindow(STableScanInfo* pTableScanInfo, SSDataBlock* pBlock) {
  // TODO: re-implement the data-requirement check based on the functions of the scan operator
  return 0;
}

L
Liu Jicong 已提交
1079 1080
/*
 * Reset the load state of a data block before the scan operator decides how to load it.
 *
 * pTaskInfo      : owning task, currently not read
 * pTableScanInfo : table scan operator info, currently not read
 * pBlock         : block whose pDataBlock and pBlockAgg pointers are cleared
 * status         : out parameter, always set to BLK_DATA_NOT_LOAD
 *
 * Always returns TSDB_CODE_SUCCESS.
 *
 * The former on-demand loading logic (time-window overlap test, SMA loading, top/bottom
 * block filter, cost accounting) was entirely compiled out with `#if 0` and referenced
 * identifiers that are not declared in this function. It has been removed together with
 * the local that only the disabled code used; consult version control if it needs to be
 * revived.
 */
int32_t loadDataBlockOnDemand(SExecTaskInfo* pTaskInfo, STableScanInfo* pTableScanInfo, SSDataBlock* pBlock,
                              uint32_t* status) {
  *status = BLK_DATA_NOT_LOAD;

  pBlock->pDataBlock = NULL;
  pBlock->pBlockAgg = NULL;

  // TODO: decide here whether the block data, only its statistics, or nothing must be loaded
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1222
/*
 * Hook for switching per-table state to the reverse scan.
 *
 * Every statement that used to modify the table info is commented out, so the function
 * currently has no effect beyond tolerating a NULL argument.
 */
static void updateTableQueryInfoForReverseScan(STableQueryInfo* pTableQueryInfo) {
  if (pTableQueryInfo == NULL) {
    return;
  }

  // Disabled legacy logic, kept for reference:
  //  TSWAP(pTableQueryInfo->win.skey, pTableQueryInfo->win.ekey);
  //  pTableQueryInfo->lastKey = pTableQueryInfo->win.skey;
  //
  //  SWITCH_ORDER(pTableQueryInfo->cur.order);
  //  pTableQueryInfo->cur.vgroupIndex = -1;
  //
  //  // set the index to be the end slot of result rows array
  //  SResultRowInfo* pResultRowInfo = &pTableQueryInfo->resInfo;
  //  if (pResultRowInfo->size > 0) {
  //    pResultRowInfo->curPos = pResultRowInfo->size - 1;
  //  } else {
  //    pResultRowInfo->curPos = -1;
  //  }
}

H
Haojun Liao 已提交
1242
/*
 * Initialize a result row. The only statement it used to contain is commented out,
 * so the function is currently a no-op.
 */
void initResultRow(SResultRow* pResultRow) {
  // Disabled:
  //  pResultRow->pEntryInfo = (struct SResultRowEntryInfo*)((char*)pResultRow + sizeof(SResultRow));
}

/*
 * The start of each column SResultRowEntryInfo is denoted by RowCellInfoOffset.
 * Note that in case of top/bottom query, the whole multiple rows of result is treated as only one row of results.
H
Haojun Liao 已提交
1249 1250 1251
 * +------------+-----------------result column 1------------+------------------result column 2-----------+
 * | SResultRow | SResultRowEntryInfo | intermediate buffer1 | SResultRowEntryInfo | intermediate buffer 2|
 * +------------+--------------------------------------------+--------------------------------------------+
1252 1253
 *           offset[0]                                  offset[1]                                   offset[2]
 */
1254
// TODO refactor: some function move away
L
Liu Jicong 已提交
1255 1256 1257
/*
 * Bind every function context of the operator to its entry in a freshly obtained result row.
 *
 * pOperator  : operator whose exprSupp.pCtx / exprSupp.rowEntryInfoOffset are used
 * pInfo      : basic operator info; its resultRowInfo is re-initialized
 * pSup       : aggregate supporter providing the result buffer
 * stage      : value stored into the scanFlag of every context
 * numOfExprs : number of contexts to set up
 *
 * The result row is looked up with a zero key and group id 0. Each entry is cleaned, attached
 * to its context, and finally the contexts are handed to initCtxOutputBuffer().
 */
void setFunctionResultOutput(SOperatorInfo* pOperator, SOptrBasicInfo* pInfo, SAggSupporter* pSup, int32_t stage,
                             int32_t numOfExprs) {
  SqlFunctionCtx* pCtxList = pOperator->exprSupp.pCtx;
  int32_t*        pOffsets = pOperator->exprSupp.rowEntryInfoOffset;
  SExecTaskInfo*  pTask = pOperator->pTaskInfo;

  SResultRowInfo* pRowInfo = &pInfo->resultRowInfo;
  initResultRowInfo(pRowInfo);

  int64_t tid = 0;
  int64_t groupId = 0;

  SResultRow* pRow =
      doSetResultOutBufByKey(pSup->pResultBuf, pRowInfo, (char*)&tid, sizeof(tid), true, groupId, pTask, false, pSup);

  for (int32_t i = 0; i < numOfExprs; ++i) {
    SqlFunctionCtx*             pCur = &pCtxList[i];
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, i, pOffsets);

    cleanupResultRowEntry(pEntry);

    pCur->resultInfo = pEntry;
    pCur->scanFlag = stage;
  }

  initCtxOutputBuffer(pCtxList, numOfExprs);
}

H
Haojun Liao 已提交
1280
/*
 * Run the init callback of every context in pCtx[0..size) that still needs it.
 *
 * A context is skipped when its result entry is already initialized, when it has no
 * function (functionId == -1), or when the function manager classifies the function as a
 * pseudo-column or scalar function.
 */
void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size) {
  for (int32_t j = 0; j < size; ++j) {
    SqlFunctionCtx*             pCur = &pCtx[j];
    struct SResultRowEntryInfo* pEntry = GET_RES_INFO(pCur);

    if (isRowEntryInitialized(pEntry)) {
      continue;
    }

    if (fmIsPseudoColumnFunc(pCur->functionId) || pCur->functionId == -1 || fmIsScalarFunc(pCur->functionId)) {
      continue;
    }

    pCur->fpSet.init(pCur, pCur->resultInfo);
  }
}

L
Liu Jicong 已提交
1292
/*
 * Update the status of a task.
 *
 * TASK_NOT_COMPLETED replaces the whole status word. Any other value is OR-ed into the
 * current status after the TASK_NOT_COMPLETED flag has been cleared, because that flag is
 * not compatible with any other status.
 */
void setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status) {
  if (status != TASK_NOT_COMPLETED) {
    CLEAR_QUERY_STATUS(pTaskInfo, TASK_NOT_COMPLETED);
    pTaskInfo->status |= status;
    return;
  }

  pTaskInfo->status = status;
}

L
Liu Jicong 已提交
1302
/*
 * Release the resources owned by a table query info.
 *
 * Both cleanup calls are commented out, so the function currently does nothing besides
 * accepting a NULL argument.
 */
void destroyTableQueryInfoImpl(STableQueryInfo* pTableQueryInfo) {
  if (pTableQueryInfo == NULL) {
    return;
  }

  // Disabled:
  //  taosVariantDestroy(&pTableQueryInfo->tag);
  //  cleanupResultRowInfo(&pTableQueryInfo->resInfo);
}

1311
/*
 * Point every context at its entry inside pResult and initialize entries that need it.
 *
 * pResult            : result row holding the entries
 * pCtx               : array of numOfOutput function contexts
 * rowEntryInfoOffset : per-expression offsets passed on to getResultEntryInfo()
 *
 * resultInfo is always rebound. Initialization is skipped for entries that are both
 * completed and initialized, for window pseudo-column functions, and for entries whose
 * `initialized` flag is already set. Contexts without a function (functionId == -1) are
 * only flagged as initialized; all others go through their init callback.
 */
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowEntryInfoOffset) {
  for (int32_t i = 0; i < numOfOutput; ++i) {
    SqlFunctionCtx* pCur = &pCtx[i];

    pCur->resultInfo = getResultEntryInfo(pResult, i, rowEntryInfoOffset);
    struct SResultRowEntryInfo* pEntry = pCur->resultInfo;

    if (isRowEntryCompleted(pEntry) && isRowEntryInitialized(pEntry)) {
      continue;
    }

    if (fmIsWindowPseudoColumnFunc(pCur->functionId) || pEntry->initialized) {
      continue;
    }

    if (pCur->functionId == -1) {
      pEntry->initialized = true;
    } else {
      pCur->fpSet.init(pCur, pEntry);
    }
  }
}

H
Haojun Liao 已提交
1334
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep);
1335

1336
/*
 * Apply the filter condition pFilterNode to pBlock in place.
 *
 * A NULL filter node leaves the block untouched. Otherwise a filter is built from the
 * node, bound to the block columns and executed; rows that do not qualify are removed by
 * extractQualifiedTupleByFilterResult() and the timestamp window of the block is refreshed.
 *
 * The status codes returned by filterInitFromNode() and filterSetDataFromSlotId() are
 * stored but not inspected.
 */
void doFilter(const SNode* pFilterNode, SSDataBlock* pBlock) {
  if (pFilterNode == NULL) {
    return;
  }

  // todo move to the initialization function
  SFilterInfo* pFilterInfo = NULL;
  int32_t      code = filterInitFromNode((SNode*)pFilterNode, &pFilterInfo, 0);

  size_t             numOfCols = taosArrayGetSize(pBlock->pDataBlock);
  SFilterColumnParam colParam = {.numOfCols = numOfCols, .pDataBlock = pBlock->pDataBlock};
  code = filterSetDataFromSlotId(pFilterInfo, &colParam);

  // todo the keep seems never to be True??
  int8_t* pRowFlags = NULL;
  bool    keepAll = filterExecute(pFilterInfo, pBlock, &pRowFlags, NULL, colParam.numOfCols);
  filterFreeInfo(pFilterInfo);

  extractQualifiedTupleByFilterResult(pBlock, pRowFlags, keepAll);
  blockDataUpdateTsWindow(pBlock, 0);

  taosMemoryFree(pRowFlags);
}

H
Haojun Liao 已提交
1362
/*
 * Compact pBlock so that only the rows accepted by the filter remain.
 *
 * pBlock : block to compact in place
 * rowRes : per-row flags, a zero entry drops the row; may be NULL
 * keep   : when true the block is left untouched
 *
 * If keep is false and rowRes is NULL the block row count is set to 0. Otherwise the
 * block is copied, each destination column that has data is cleaned and refilled from the
 * copy with the accepted rows, and the block row count is updated.
 */
void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep) {
  if (keep) {
    return;
  }

  if (rowRes == NULL) {
    // no per-row result is available: the block ends up empty
    pBlock->info.rows = 0;
    return;
  }

  int32_t      totalRows = pBlock->info.rows;
  SSDataBlock* pCopy = createOneDataBlock(pBlock, true);

  size_t numOfCols = taosArrayGetSize(pBlock->pDataBlock);
  for (int32_t i = 0; i < numOfCols; ++i) {
    SColumnInfoData* pSrc = taosArrayGet(pCopy->pDataBlock, i);
    SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, i);

    // it is a reserved column for scalar function, and no data in this column yet.
    if (pDst->pData == NULL || pSrc->pData == NULL) {
      continue;
    }

    colInfoDataCleanup(pDst, pBlock->info.rows);

    int32_t kept = 0;
    for (int32_t j = 0; j < totalRows; ++j) {
      if (rowRes[j] != 0) {
        if (colDataIsNull_s(pSrc, j)) {
          colDataAppendNULL(pDst, kept);
        } else {
          colDataAppend(pDst, kept, colDataGetData(pSrc, j), false);
        }
        kept += 1;
      }
    }

    // the first processed column fixes the new row count, the others must agree with it
    if (pBlock->info.rows == totalRows) {
      pBlock->info.rows = kept;
    } else {
      ASSERT(pBlock->info.rows == kept);
    }
  }

  blockDataDestroy(pCopy);  // fix memory leak
}

L
Liu Jicong 已提交
1410 1411
/*
 * Select the result row of group `groupId` and bind the operator's contexts to it.
 *
 * For a simple group-by query without interval all tables of a group share one result
 * row, keyed by the group id. If the row has no buffer page yet (pageId == -1) one is
 * added; when that fails the function returns without binding the contexts.
 */
void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                              uint64_t groupId) {
  SExecTaskInfo*  pTask = pOperator->pTaskInfo;
  SResultRowInfo* pRowInfo = &pAggInfo->binfo.resultRowInfo;
  SqlFunctionCtx* pCtxList = pOperator->exprSupp.pCtx;
  int32_t*        pOffsets = pOperator->exprSupp.rowEntryInfoOffset;

  SResultRow* pRow = doSetResultOutBufByKey(pAggInfo->aggSup.pResultBuf, pRowInfo, (char*)&groupId, sizeof(groupId),
                                            true, groupId, pTask, false, &pAggInfo->aggSup);
  assert(pRow != NULL);

  /*
   * not assign result buffer yet, add new result buffer
   * all group belong to one result set, and each group result has different group id so set the id to be one
   */
  if (pRow->pageId == -1) {
    int32_t rc =
        addNewWindowResultBuf(pRow, pAggInfo->aggSup.pResultBuf, groupId, pAggInfo->binfo.pRes->info.rowSize);
    if (rc != TSDB_CODE_SUCCESS) {
      return;
    }
  }

  setResultRowInitCtx(pRow, pCtxList, numOfOutput, pOffsets);
}

1437
/*
 * Make groupId the active output group of the aggregate operator.
 *
 * Nothing is done when pAggInfo->groupId already equals groupId (and is not the INT32_MIN sentinel); otherwise the
 * output buffer is switched via doSetTableGroupOutputBuf() and the new id is remembered in pAggInfo->groupId.
 */
void setExecutionContext(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId, SAggOperatorInfo* pAggInfo) {
  bool alreadyActive = (pAggInfo->groupId != INT32_MIN) && (pAggInfo->groupId == groupId);
  if (!alreadyActive) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_setbuf, groupId:%" PRIu64, groupId);
#endif
    doSetTableGroupOutputBuf(pOperator, pAggInfo, numOfOutput, groupId);

    // remember which group the output buffer now belongs to
    pAggInfo->groupId = groupId;
  }
}

1450 1451
/*
 * Raise pRow->numOfRows to the largest numOfRes found among the initialised result entries of the row.
 * Entries that are not initialised are ignored; pRow->numOfRows is never lowered.
 */
static void doUpdateNumOfRows(SResultRow* pRow, int32_t numOfExprs, const int32_t* rowCellOffset) {
  for (int32_t idx = 0; idx < numOfExprs; ++idx) {
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, idx, rowCellOffset);

    if (isRowEntryInitialized(pEntry) && pRow->numOfRows < pEntry->numOfRes) {
      pRow->numOfRows = pEntry->numOfRes;
    }
  }
}

1463
int32_t finalizeResultRowIntoResultDataBlock(SDiskbasedBuf* pBuf, SResultRowPosition* resultRowPosition,
S
shenglian zhou 已提交
1464 1465 1466
                                             SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, int32_t numOfExprs,
                                             const int32_t* rowCellOffset, SSDataBlock* pBlock,
                                             SExecTaskInfo* pTaskInfo) {
1467 1468 1469 1470 1471 1472 1473 1474 1475
  SFilePage*  page = getBufPage(pBuf, resultRowPosition->pageId);
  SResultRow* pRow = (SResultRow*)((char*)page + resultRowPosition->offset);

  doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
  if (pRow->numOfRows == 0) {
    releaseBufPage(pBuf, page);
    return 0;
  }

1476 1477 1478 1479 1480 1481 1482
  while (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
    int32_t code = blockDataEnsureCapacity(pBlock, pBlock->info.capacity * 1.25);
    if (TAOS_FAILED(code)) {
      releaseBufPage(pBuf, page);
      qError("%s ensure result data capacity failed, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
      longjmp(pTaskInfo->env, code);
    }
1483 1484 1485 1486 1487
  }

  for (int32_t j = 0; j < numOfExprs; ++j) {
    int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1488
    pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1489 1490 1491 1492 1493 1494 1495 1496 1497
    if (pCtx[j].fpSet.finalize) {
      int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
      if (TAOS_FAILED(code)) {
        qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
        longjmp(pTaskInfo->env, code);
      }
    } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
      // do nothing, todo refactor
    } else {
1498 1499
      // expand the result into multiple rows. E.g., _wstart, top(k, 20)
      // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
1500 1501 1502 1503 1504 1505 1506 1507 1508
      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
      char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
      for (int32_t k = 0; k < pRow->numOfRows; ++k) {
        colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
      }
    }
  }

  releaseBufPage(pBuf, page);
1509
  pBlock->info.rows += pRow->numOfRows;
1510 1511 1512 1513

  return 0;
}

X
Xiaoyu Wang 已提交
1514 1515 1516
/*
 * Copy finalized group results into pBlock, starting at pGroupResInfo->index.
 *
 * Result rows are consumed in order until one of the following happens:
 *   - all rows of pGroupResInfo have been consumed,
 *   - the next row belongs to a different group than the one already stored in pBlock->info.groupId,
 *   - the next row does not fit into the remaining capacity of pBlock.
 * Rows that produce no output (numOfRows == 0) are skipped. pGroupResInfo->index is advanced for every row that
 * was skipped or copied, so a later call resumes where this one stopped.
 *
 * Returns 0. A failing finalize callback is logged and raised with longjmp(pTaskInfo->env, code); the buffer page
 * is released before jumping.
 *
 * NOTE(review): a row whose numOfRows exceeds the capacity of an empty pBlock is never consumed here - confirm
 * that callers size the block accordingly.
 */
int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo, SDiskbasedBuf* pBuf,
                           SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset, SqlFunctionCtx* pCtx,
                           int32_t numOfExprs) {
  int32_t numOfRows = getNumOfTotalRes(pGroupResInfo);
  int32_t start = pGroupResInfo->index;

  for (int32_t i = start; i < numOfRows; i += 1) {
    SResKeyPos* pPos = taosArrayGetP(pGroupResInfo->pRows, i);
    SFilePage*  page = getBufPage(pBuf, pPos->pos.pageId);

    SResultRow* pRow = (SResultRow*)((char*)page + pPos->pos.offset);

    doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
    if (pRow->numOfRows == 0) {
      pGroupResInfo->index += 1;
      releaseBufPage(pBuf, page);
      continue;
    }

    if (pBlock->info.groupId == 0) {
      pBlock->info.groupId = pPos->groupId;
    } else {
      // current value belongs to different group, it can't be packed into one datablock
      if (pBlock->info.groupId != pPos->groupId) {
        releaseBufPage(pBuf, page);
        break;
      }
    }

    // output block is full: leave this row for the next call
    if (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
      releaseBufPage(pBuf, page);
      break;
    }

    pGroupResInfo->index += 1;

    for (int32_t j = 0; j < numOfExprs; ++j) {
      int32_t slotId = pExprInfo[j].base.resSchema.slotId;

      pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
      if (pCtx[j].fpSet.finalize) {
#ifdef BUF_PAGE_DEBUG
        qDebug("\npage_finalize %d", numOfExprs);
#endif
        int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
        if (TAOS_FAILED(code)) {
          // do not leave the page pinned when unwinding
          releaseBufPage(pBuf, page);
          qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
          longjmp(pTaskInfo->env, code);
        }
      } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
        // do nothing, todo refactor
      } else {
        // expand the result into multiple rows. E.g., _wstart, top(k, 20)
        // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
        SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
        char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
        if (pCtx[j].increase) {
          // each expanded row gets the previous value plus one
          int64_t ts = *(int64_t*)in;
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, (const char*)&ts, pCtx[j].resultInfo->isNullRes);
            ts++;
          }
        } else {
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
          }
        }
      }
    }

    // pRow lives inside the page: account for its rows before the page is handed back to the buffer
    pBlock->info.rows += pRow->numOfRows;
    releaseBufPage(pBuf, page);
  }

  qDebug("%s result generated, rows:%d, groupId:%" PRIu64, GET_TASKID(pTaskInfo), pBlock->info.rows,
         pBlock->info.groupId);
  blockDataUpdateTsWindow(pBlock, 0);
  return 0;
}

X
Xiaoyu Wang 已提交
1597 1598
/*
 * Reset pbInfo->pRes and refill it with the next batch of group results.
 *
 * The block is always cleaned first. When pGroupResInfo has no data left the block stays empty; otherwise its
 * group id is cleared and doCopyToSDataBlock() copies results using the expression support of pOperator.
 */
void doBuildResultDatablock(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
                            SDiskbasedBuf* pBuf) {
  SSDataBlock* pBlock = pbInfo->pRes;

  blockDataCleanup(pBlock);
  if (hasDataInGroupInfo(pGroupResInfo)) {
    // forget the group id left over from the previous batch
    pBlock->info.groupId = 0;

    doCopyToSDataBlock(pOperator->pTaskInfo, pBlock, pOperator->exprSupp.pExprInfo, pBuf, pGroupResInfo,
                       pOperator->exprSupp.rowEntryInfoOffset, pOperator->exprSupp.pCtx,
                       pOperator->exprSupp.numOfExprs);
  }
}

L
Liu Jicong 已提交
1617
/*
 * Currently a no-op: the whole body is compiled out with "#if 0".
 *
 * The disabled code below is the former implementation, which walked every result row and raised its numOfRows
 * to the largest numOfRes of its non ts/tag cells. It is kept for reference only.
 */
static void updateNumOfRowsInResultRows(SqlFunctionCtx* pCtx, int32_t numOfOutput, SResultRowInfo* pResultRowInfo,
                                        int32_t* rowEntryInfoOffset) {
#if 0
  for (int32_t i = 0; i < pResultRowInfo->size; ++i) {
    SResultRow* pResult = pResultRowInfo->pResult[i];

    for (int32_t j = 0; j < numOfOutput; ++j) {
      int32_t functionId = pCtx[j].functionId;
      if (functionId == FUNCTION_TS || functionId == FUNCTION_TAG || functionId == FUNCTION_TAGPRJ) {
        continue;
      }

      SResultRowEntryInfo* pCell = getResultEntryInfo(pResult, j, rowEntryInfoOffset);
      pResult->numOfRows = (uint16_t)(TMAX(pResult->numOfRows, pCell->numOfRes));
    }
  }
#endif
}

L
Liu Jicong 已提交
1640
/*
 * Compress the data of one result column into `data` using the compression routine registered for the column
 * type in tDataTypes.
 *
 * The input length is info.bytes * numOfRows; the output buffer is declared to the routine as that length plus
 * COMP_OVERFLOW_BYTES. Returns whatever the type specific routine returns.
 */
static int32_t compressQueryColData(SColumnInfoData* pColRes, int32_t numOfRows, char* data, int8_t compressed) {
  int32_t rawLen = pColRes->info.bytes * numOfRows;

  return tDataTypes[pColRes->info.type].compFunc(pColRes->pData, rawLen, numOfRows, data,
                                                 rawLen + COMP_OVERFLOW_BYTES, compressed, NULL, 0);
}

1646 1647 1648
/*
 * Let pFillInfo generate fill results into pBlock, limited to the room left below `capacity`.
 *
 * The count returned by taosFillResultDataBlock() is intentionally not used; the function reports the number of
 * rows held by pBlock after the call.
 */
int32_t doFillTimeIntervalGapsInResults(struct SFillInfo* pFillInfo, SSDataBlock* pBlock, int32_t capacity) {
  (void)taosFillResultDataBlock(pFillInfo, pBlock, capacity - pBlock->info.rows);
  return pBlock->info.rows;
}

L
Liu Jicong 已提交
1651 1652
/*
 * Fold the first stage merge time into the task's elapsed time and, when a block load recorder is attached to
 * the cost summary, write the cost summary to the debug log.
 */
void queryCostStatis(SExecTaskInfo* pTaskInfo) {
  STaskCostInfo* pSummary = &pTaskInfo->cost;

  // the merge time counts towards the total elapsed time
  pSummary->elapsedTime += pSummary->firstStageMergeTime;

  SFileBlockLoadRecorder* pRecorder = pSummary->pRecoder;
  if (pRecorder == NULL) {
    return;
  }

  qDebug("%s :cost summary: elapsed time:%" PRId64 " us, first merge:%" PRId64
         " us, total blocks:%d, "
         "load block statis:%d, load data block:%d, total rows:%" PRId64 ", check rows:%" PRId64,
         GET_TASKID(pTaskInfo), pSummary->elapsedTime, pSummary->firstStageMergeTime, pRecorder->totalBlocks,
         pRecorder->loadBlockStatis, pRecorder->loadBlocks, pRecorder->totalRows, pRecorder->totalCheckedRows);
}

L
Liu Jicong 已提交
1685 1686 1687
// static void updateOffsetVal(STaskRuntimeEnv *pRuntimeEnv, SDataBlockInfo *pBlockInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
1688
//
L
Liu Jicong 已提交
1689
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1690
//
L
Liu Jicong 已提交
1691 1692 1693 1694
//   if (pQueryAttr->limit.offset == pBlockInfo->rows) {  // current block will ignore completed
//     pTableQueryInfo->lastKey = QUERY_IS_ASC_QUERY(pQueryAttr) ? pBlockInfo->window.ekey + step :
//     pBlockInfo->window.skey + step; pQueryAttr->limit.offset = 0; return;
//   }
1695
//
L
Liu Jicong 已提交
1696 1697 1698 1699 1700
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     pQueryAttr->pos = (int32_t)pQueryAttr->limit.offset;
//   } else {
//     pQueryAttr->pos = pBlockInfo->rows - (int32_t)pQueryAttr->limit.offset - 1;
//   }
1701
//
L
Liu Jicong 已提交
1702
//   assert(pQueryAttr->pos >= 0 && pQueryAttr->pos <= pBlockInfo->rows - 1);
1703
//
L
Liu Jicong 已提交
1704 1705
//   SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//   SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1706
//
L
Liu Jicong 已提交
1707 1708
//   // update the pQueryAttr->limit.offset value, and pQueryAttr->pos value
//   TSKEY *keys = (TSKEY *) pColInfoData->pData;
1709
//
L
Liu Jicong 已提交
1710 1711 1712
//   // update the offset value
//   pTableQueryInfo->lastKey = keys[pQueryAttr->pos];
//   pQueryAttr->limit.offset = 0;
1713
//
L
Liu Jicong 已提交
1714
//   int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
1715
//
L
Liu Jicong 已提交
1716 1717 1718 1719
//   //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numBlocksOfStep:%d, numOfRes:%d,
//   lastKey:%"PRId64, GET_TASKID(pRuntimeEnv),
//          pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes, pQuery->current->lastKey);
// }
1720

L
Liu Jicong 已提交
1721 1722
// void skipBlocks(STaskRuntimeEnv *pRuntimeEnv) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
1723
//
L
Liu Jicong 已提交
1724 1725 1726
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0) {
//     return;
//   }
1727
//
L
Liu Jicong 已提交
1728 1729
//   pQueryAttr->pos = 0;
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1730
//
L
Liu Jicong 已提交
1731 1732
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
//   TsdbQueryHandleT pTsdbReadHandle = pRuntimeEnv->pTsdbReadHandle;
1733
//
L
Liu Jicong 已提交
1734 1735 1736 1737 1738
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pTsdbReadHandle)) {
//     if (isTaskKilled(pRuntimeEnv->qinfo)) {
//       longjmp(pRuntimeEnv->env, TSDB_CODE_TSC_QUERY_CANCELLED);
//     }
1739
//
L
Liu Jicong 已提交
1740
//     tsdbRetrieveDataBlockInfo(pTsdbReadHandle, &blockInfo);
1741
//
L
Liu Jicong 已提交
1742 1743 1744 1745
//     if (pQueryAttr->limit.offset > blockInfo.rows) {
//       pQueryAttr->limit.offset -= blockInfo.rows;
//       pTableQueryInfo->lastKey = (QUERY_IS_ASC_QUERY(pQueryAttr)) ? blockInfo.window.ekey : blockInfo.window.skey;
//       pTableQueryInfo->lastKey += step;
1746
//
L
Liu Jicong 已提交
1747 1748 1749 1750 1751 1752 1753
//       //qDebug("QInfo:0x%"PRIx64" skip rows:%d, offset:%" PRId64, GET_TASKID(pRuntimeEnv), blockInfo.rows,
//              pQuery->limit.offset);
//     } else {  // find the appropriated start position in current block
//       updateOffsetVal(pRuntimeEnv, &blockInfo);
//       break;
//     }
//   }
1754
//
L
Liu Jicong 已提交
1755 1756 1757 1758 1759 1760 1761 1762 1763
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
// }

// static TSKEY doSkipIntervalProcess(STaskRuntimeEnv* pRuntimeEnv, STimeWindow* win, SDataBlockInfo* pBlockInfo,
// STableQueryInfo* pTableQueryInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
1764
//
L
Liu Jicong 已提交
1765 1766 1767
//   assert(pQueryAttr->limit.offset == 0);
//   STimeWindow tw = *win;
//   getNextTimeWindow(pQueryAttr, &tw);
1768
//
L
Liu Jicong 已提交
1769 1770
//   if ((tw.skey <= pBlockInfo->window.ekey && QUERY_IS_ASC_QUERY(pQueryAttr)) ||
//       (tw.ekey >= pBlockInfo->window.skey && !QUERY_IS_ASC_QUERY(pQueryAttr))) {
1771
//
L
Liu Jicong 已提交
1772 1773 1774 1775
//     // load the data block and check data remaining in current data block
//     // TODO optimize performance
//     SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//     SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1776
//
L
Liu Jicong 已提交
1777 1778 1779 1780
//     tw = *win;
//     int32_t startPos =
//         getNextQualifiedWindow(pQueryAttr, &tw, pBlockInfo, pColInfoData->pData, binarySearchForKey, -1);
//     assert(startPos >= 0);
1781
//
L
Liu Jicong 已提交
1782 1783
//     // set the abort info
//     pQueryAttr->pos = startPos;
1784
//
L
Liu Jicong 已提交
1785 1786 1787 1788
//     // reset the query start timestamp
//     pTableQueryInfo->win.skey = ((TSKEY *)pColInfoData->pData)[startPos];
//     pQueryAttr->window.skey = pTableQueryInfo->win.skey;
//     TSKEY key = pTableQueryInfo->win.skey;
1789
//
L
Liu Jicong 已提交
1790 1791
//     pWindowResInfo->prevSKey = tw.skey;
//     int32_t index = pRuntimeEnv->resultRowInfo.curIndex;
1792
//
L
Liu Jicong 已提交
1793 1794
//     int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
//     pRuntimeEnv->resultRowInfo.curIndex = index;  // restore the window index
1795
//
L
Liu Jicong 已提交
1796 1797 1798 1799
//     //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numOfRows:%d, numOfRes:%d,
//     lastKey:%" PRId64,
//            GET_TASKID(pRuntimeEnv), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes,
//            pQueryAttr->current->lastKey);
1800
//
L
Liu Jicong 已提交
1801 1802 1803 1804 1805
//     return key;
//   } else {  // do nothing
//     pQueryAttr->window.skey      = tw.skey;
//     pWindowResInfo->prevSKey = tw.skey;
//     pTableQueryInfo->lastKey = tw.skey;
1806
//
L
Liu Jicong 已提交
1807 1808
//     return tw.skey;
//   }
1809
//
L
Liu Jicong 已提交
1810 1811 1812 1813 1814 1815 1816 1817 1818 1819
//   return true;
// }

// static bool skipTimeInterval(STaskRuntimeEnv *pRuntimeEnv, TSKEY* start) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     assert(*start <= pRuntimeEnv->current->lastKey);
//   } else {
//     assert(*start >= pRuntimeEnv->current->lastKey);
//   }
1820
//
L
Liu Jicong 已提交
1821 1822 1823 1824 1825
//   // if queried with value filter, do NOT forward query start position
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0 || pRuntimeEnv->pTsBuf != NULL ||
//   pRuntimeEnv->pFillInfo != NULL) {
//     return true;
//   }
1826
//
L
Liu Jicong 已提交
1827 1828 1829 1830 1831 1832 1833
//   /*
//    * 1. for interval without interpolation query we forward pQueryAttr->interval.interval at a time for
//    *    pQueryAttr->limit.offset times. Since hole exists, pQueryAttr->interval.interval*pQueryAttr->limit.offset
//    value is
//    *    not valid. otherwise, we only forward pQueryAttr->limit.offset number of points
//    */
//   assert(pRuntimeEnv->resultRowInfo.prevSKey == TSKEY_INITIAL_VAL);
1834
//
L
Liu Jicong 已提交
1835 1836
//   STimeWindow w = TSWINDOW_INITIALIZER;
//   bool ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1837
//
L
Liu Jicong 已提交
1838 1839
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
//   STableQueryInfo *pTableQueryInfo = pRuntimeEnv->current;
1840
//
L
Liu Jicong 已提交
1841 1842 1843
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pRuntimeEnv->pTsdbReadHandle)) {
//     tsdbRetrieveDataBlockInfo(pRuntimeEnv->pTsdbReadHandle, &blockInfo);
1844
//
L
Liu Jicong 已提交
1845 1846 1847 1848 1849 1850 1851 1852 1853
//     if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       if (pWindowResInfo->prevSKey == TSKEY_INITIAL_VAL) {
//         getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.skey, blockInfo.window.skey, pQueryAttr->window.ekey,
//         &w); pWindowResInfo->prevSKey = w.skey;
//       }
//     } else {
//       getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.ekey, pQueryAttr->window.ekey, blockInfo.window.ekey, &w);
//       pWindowResInfo->prevSKey = w.skey;
//     }
1854
//
L
Liu Jicong 已提交
1855 1856
//     // the first time window
//     STimeWindow win = getActiveTimeWindow(pWindowResInfo, pWindowResInfo->prevSKey, pQueryAttr);
1857
//
L
Liu Jicong 已提交
1858 1859
//     while (pQueryAttr->limit.offset > 0) {
//       STimeWindow tw = win;
1860
//
L
Liu Jicong 已提交
1861 1862 1863
//       if ((win.ekey <= blockInfo.window.ekey && ascQuery) || (win.ekey >= blockInfo.window.skey && !ascQuery)) {
//         pQueryAttr->limit.offset -= 1;
//         pWindowResInfo->prevSKey = win.skey;
1864
//
L
Liu Jicong 已提交
1865 1866 1867 1868 1869 1870
//         // current time window is aligned with blockInfo.window.ekey
//         // restart it from next data block by set prevSKey to be TSKEY_INITIAL_VAL;
//         if ((win.ekey == blockInfo.window.ekey && ascQuery) || (win.ekey == blockInfo.window.skey && !ascQuery)) {
//           pWindowResInfo->prevSKey = TSKEY_INITIAL_VAL;
//         }
//       }
1871
//
L
Liu Jicong 已提交
1872 1873 1874 1875
//       if (pQueryAttr->limit.offset == 0) {
//         *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//         return true;
//       }
1876
//
L
Liu Jicong 已提交
1877 1878
//       // current window does not ended in current data block, try next data block
//       getNextTimeWindow(pQueryAttr, &tw);
1879
//
L
Liu Jicong 已提交
1880 1881 1882 1883 1884 1885 1886 1887 1888
//       /*
//        * If the next time window still starts from current data block,
//        * load the primary timestamp column first, and then find the start position for the next queried time window.
//        * Note that only the primary timestamp column is required.
//        * TODO: Optimize for this cases. All data blocks are not needed to be loaded, only if the first actually
//        required
//        * time window resides in current data block.
//        */
//       if ((tw.skey <= blockInfo.window.ekey && ascQuery) || (tw.ekey >= blockInfo.window.skey && !ascQuery)) {
1889
//
L
Liu Jicong 已提交
1890 1891
//         SArray *pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//         SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1892
//
L
Liu Jicong 已提交
1893 1894 1895
//         if ((win.ekey > blockInfo.window.ekey && ascQuery) || (win.ekey < blockInfo.window.skey && !ascQuery)) {
//           pQueryAttr->limit.offset -= 1;
//         }
1896
//
L
Liu Jicong 已提交
1897 1898 1899 1900 1901 1902 1903 1904
//         if (pQueryAttr->limit.offset == 0) {
//           *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//           return true;
//         } else {
//           tw = win;
//           int32_t startPos =
//               getNextQualifiedWindow(pQueryAttr, &tw, &blockInfo, pColInfoData->pData, binarySearchForKey, -1);
//           assert(startPos >= 0);
1905
//
L
Liu Jicong 已提交
1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916
//           // set the abort info
//           pQueryAttr->pos = startPos;
//           pTableQueryInfo->lastKey = ((TSKEY *)pColInfoData->pData)[startPos];
//           pWindowResInfo->prevSKey = tw.skey;
//           win = tw;
//         }
//       } else {
//         break;  // offset is not 0, and next time window begins or ends in the next block.
//       }
//     }
//   }
1917
//
L
Liu Jicong 已提交
1918 1919 1920 1921
//   // check for error
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
1922
//
L
Liu Jicong 已提交
1923 1924
//   return true;
// }
1925

1926
/*
 * Install a private copy of the `num` downstream operator pointers in pDownstream as the downstream list of p.
 *
 * Despite the name, the list is replaced, not extended. A previously installed list array is freed (the operators
 * it pointed to are not touched). On allocation failure p is left unchanged.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the copy cannot be allocated.
 */
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num) {
  if (p->pDownstream == NULL) {
    assert(p->numOfDownstream == 0);
  }

  // build the new list first so that a failure does not leave p with a NULL list and a stale count
  void* pList = taosMemoryCalloc(1, num * POINTER_BYTES);
  if (pList == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  memcpy(pList, pDownstream, num * POINTER_BYTES);

  // release the array being replaced; overwriting the pointer alone would leak it
  taosMemoryFree(p->pDownstream);

  p->pDownstream = pList;
  p->numOfDownstream = num;
  return TSDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
1941
static void doDestroyTableList(STableListInfo* pTableqinfoList);
1942

1943
/*
 * Currently a no-op: the whole body is compiled out with "#if 0".
 *
 * The disabled assertions describe the relation that used to be checked between the time window / lastKey of a
 * table and the window of the task, for ascending and descending scans respectively.
 */
static void doTableQueryInfoTimeWindowCheck(SExecTaskInfo* pTaskInfo, STableQueryInfo* pTableQueryInfo, int32_t order) {
#if 0
  if (order == TSDB_ORDER_ASC) {
    assert(
        (pTableQueryInfo->win.skey <= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey >= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey >= pTaskInfo->window.skey && pTableQueryInfo->win.ekey <= pTaskInfo->window.ekey));
  } else {
    assert(
        (pTableQueryInfo->win.skey >= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey <= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey <= pTaskInfo->window.skey && pTableQueryInfo->win.ekey >= pTaskInfo->window.ekey));
  }
#endif
}

1959 1960 1961 1962
// Callback parameter attached to one fetch request (see doSendFetchDataRequest / loadRemoteDataCallback).
typedef struct SFetchRspHandleWrapper {
  uint32_t exchangeId;   // reference id of the exchange operator, resolved through exchangeObjRefPool
  int32_t  sourceIndex;  // index of the source in SExchangeInfo.pSourceDataInfo this response belongs to
} SFetchRspHandleWrapper;
1963

D
dapan1121 已提交
1964
/*
 * Response callback of a fetch request issued by doSendFetchDataRequest().
 *
 * param - SFetchRspHandleWrapper identifying the exchange operator and the source; always freed here
 * pMsg  - response buffer; on success pMsg->pData is handed over to the source data info, in every other case
 *         it is freed here
 * code  - result of the request
 *
 * On success the header fields of the response are converted to host byte order and stored in the source data
 * info; on failure the error code is stored instead. In both cases the source is marked EX_SOURCE_DATA_READY and
 * the exchange operator's `ready` semaphore is posted. If the exchange operator can no longer be acquired the
 * response is dropped.
 *
 * Always returns TSDB_CODE_SUCCESS.
 */
int32_t loadRemoteDataCallback(void* param, SDataBuf* pMsg, int32_t code) {
  SFetchRspHandleWrapper* pWrapper = (SFetchRspHandleWrapper*)param;

  SExchangeInfo* pExchangeInfo = taosAcquireRef(exchangeObjRefPool, pWrapper->exchangeId);
  if (pExchangeInfo == NULL) {
    qWarn("failed to acquire exchange operator, since it may have been released");
    // nobody is left to consume the response: release the payload and the wrapper instead of leaking them
    if (pMsg != NULL) {
      taosMemoryFree(pMsg->pData);
      pMsg->pData = NULL;
    }
    taosMemoryFree(pWrapper);
    return TSDB_CODE_SUCCESS;
  }

  int32_t          index = pWrapper->sourceIndex;
  SSourceDataInfo* pSourceDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, index);

  if (code == TSDB_CODE_SUCCESS) {
    pSourceDataInfo->pRsp = pMsg->pData;

    SRetrieveTableRsp* pRsp = pSourceDataInfo->pRsp;
    ASSERT(pRsp != NULL);  // must hold before the header is touched

    // header fields arrive in network byte order
    pRsp->numOfRows = htonl(pRsp->numOfRows);
    pRsp->compLen = htonl(pRsp->compLen);
    pRsp->numOfCols = htonl(pRsp->numOfCols);
    pRsp->useconds = htobe64(pRsp->useconds);

    qDebug("%s fetch rsp received, index:%d, rows:%d", pSourceDataInfo->taskId, index, pRsp->numOfRows);
  } else {
    // the payload is not handed over on failure, so it has to be released here
    if (pMsg != NULL) {
      taosMemoryFree(pMsg->pData);
      pMsg->pData = NULL;
    }

    pSourceDataInfo->code = code;
    qDebug("%s fetch rsp received, index:%d, error:%s", pSourceDataInfo->taskId, index, tstrerror(code));
  }

  pSourceDataInfo->status = EX_SOURCE_DATA_READY;

  tsem_post(&pExchangeInfo->ready);
  taosReleaseRef(exchangeObjRefPool, pWrapper->exchangeId);

  taosMemoryFree(pWrapper);
  return TSDB_CODE_SUCCESS;
}

/*
 * Release a send-message descriptor: first the request payload it carries (msgInfo.pData), then the descriptor
 * itself. pMsgBody must not be NULL.
 */
static void destroySendMsgInfo(SMsgSendInfo* pMsgBody) {
  assert(pMsgBody != NULL);

  // payload first, it is reached through the descriptor
  taosMemoryFreeClear(pMsgBody->msgInfo.pData);
  taosMemoryFreeClear(pMsgBody);
}

D
dapan1121 已提交
2007
/*
 * Dispatch an rpc response to the callback stored in the SMsgSendInfo carried by pMsg->info.ahandle.
 *
 * The response content is copied into a freshly allocated buffer that is passed to the callback together with
 * pMsg->code. If the copy cannot be allocated, terrno and pMsg->code are set to TSDB_CODE_OUT_OF_MEMORY and the
 * callback receives a NULL data pointer. Afterwards the rpc content and the send info are released.
 */
void qProcessRspMsg(void* parent, SRpcMsg* pMsg, SEpSet* pEpSet) {
  SMsgSendInfo* pSendInfo = (SMsgSendInfo*)pMsg->info.ahandle;
  assert(pMsg->info.ahandle != NULL);

  SDataBuf buf = {.len = pMsg->contLen, .pData = NULL};

  if (pMsg->contLen > 0) {
    buf.pData = taosMemoryCalloc(1, pMsg->contLen);
    if (buf.pData != NULL) {
      memcpy(buf.pData, pMsg->pCont, pMsg->contLen);
    } else {
      // report the allocation failure to the callback through the response code
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      pMsg->code = TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  pSendInfo->fp(pSendInfo->param, &buf, pMsg->code);

  rpcFreeCont(pMsg->pCont);
  destroySendMsgInfo(pSendInfo);
}

L
Liu Jicong 已提交
2028
/*
 * Build a fetch request for the source at sourceIndex and send it asynchronously; the response is delivered to
 * loadRemoteDataCallback().
 *
 * pExchangeInfo - exchange operator state holding the sources and the transporter
 * pTaskInfo     - owning task; its code is set when an allocation fails
 * sourceIndex   - index into pExchangeInfo->pSources / pSourceDataInfo
 *
 * Returns TSDB_CODE_QRY_OUT_OF_MEMORY when one of the request objects cannot be allocated, otherwise the result
 * of asyncSendMsgToServer().
 */
static int32_t doSendFetchDataRequest(SExchangeInfo* pExchangeInfo, SExecTaskInfo* pTaskInfo, int32_t sourceIndex) {
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  SResFetchReq* pMsg = taosMemoryCalloc(1, sizeof(SResFetchReq));
  if (NULL == pMsg) {
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, sourceIndex);
  SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, sourceIndex);

  ASSERT(pDataInfo->status == EX_SOURCE_DATA_NOT_READY);

  qDebug("%s build fetch msg and send to vgId:%d, ep:%s, taskId:0x%" PRIx64 ", execId:%d, %d/%" PRIzu,
         GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->addr.epSet.eps[0].fqdn, pSource->taskId, pSource->execId,
         sourceIndex, totalSources);

  // request fields travel in network byte order
  pMsg->header.vgId = htonl(pSource->addr.nodeId);
  pMsg->sId = htobe64(pSource->schedId);
  pMsg->taskId = htobe64(pSource->taskId);
  pMsg->queryId = htobe64(pTaskInfo->id.queryId);
  pMsg->execId = htonl(pSource->execId);

  // send the fetch remote task result request
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (NULL == pMsgSendInfo) {
    taosMemoryFreeClear(pMsg);
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SMsgSendInfo));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SFetchRspHandleWrapper* pWrapper = taosMemoryCalloc(1, sizeof(SFetchRspHandleWrapper));
  if (NULL == pWrapper) {
    taosMemoryFreeClear(pMsg);
    taosMemoryFreeClear(pMsgSendInfo);
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SFetchRspHandleWrapper));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  // lets the response callback find the exchange operator and the source again
  pWrapper->exchangeId = pExchangeInfo->self;
  pWrapper->sourceIndex = sourceIndex;

  pMsgSendInfo->param = pWrapper;
  pMsgSendInfo->msgInfo.pData = pMsg;
  pMsgSendInfo->msgInfo.len = sizeof(SResFetchReq);
  pMsgSendInfo->msgType = pSource->fetchMsgType;
  pMsgSendInfo->fp = loadRemoteDataCallback;

  int64_t transporterId = 0;
  int32_t code = asyncSendMsgToServer(pExchangeInfo->pTransporter, &pSource->addr.epSet, &transporterId, pMsgSendInfo);
  if (code != TSDB_CODE_SUCCESS) {
    // NOTE(review): ownership of pMsgSendInfo after a failed send is not visible here, so nothing is freed
    qError("%s failed to send fetch msg to vgId:%d, code %s", GET_TASKID(pTaskInfo), pSource->addr.nodeId,
           tstrerror(code));
  }

  return code;
}

2076
/*
 * Decode the payload of a fetch response into pRes and update the load statistics.
 *
 * pRes        - destination block
 * pLoadInfo   - statistics updated with numOfRows, compLen and the time elapsed since startTs
 * numOfRows   - number of rows contained in the payload
 * pData       - payload of the response
 * compLen     - payload length, only used for the statistics
 * numOfOutput - number of output columns
 * startTs     - start timestamp in microseconds used to compute the elapsed time
 * total       - optional row counter that is increased by numOfRows
 * pColList    - NULL: the payload is decoded directly into pRes; otherwise the payload starts with a column
 *               count followed by one SSysTableSchema per column (network byte order), the data is decoded into
 *               a temporary block and relocated into pRes according to pColList
 *
 * Returns TSDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY when the temporary block cannot be created, or the error
 * reported by blockDataEnsureCapacity(). The statistics are not updated on failure.
 */
int32_t extractDataBlockFromFetchRsp(SSDataBlock* pRes, SLoadRemoteDataInfo* pLoadInfo, int32_t numOfRows, char* pData,
                                     int32_t compLen, int32_t numOfOutput, int64_t startTs, uint64_t* total,
                                     SArray* pColList) {
  if (pColList == NULL) {  // data from other sources
    blockDataCleanup(pRes);
    blockDecode(pRes, numOfOutput, numOfRows, pData);
  } else {  // extract data according to pColList
    ASSERT(numOfOutput == taosArrayGetSize(pColList));
    char* pStart = pData;

    int32_t numOfCols = htonl(*(int32_t*)pStart);
    pStart += sizeof(int32_t);

    // todo refactor:extract method
    // convert the schema entries to host byte order in place
    SSysTableSchema* pSchema = (SSysTableSchema*)pStart;
    for (int32_t i = 0; i < numOfCols; ++i) {
      SSysTableSchema* p = (SSysTableSchema*)pStart;

      p->colId = htons(p->colId);
      p->bytes = htonl(p->bytes);
      pStart += sizeof(SSysTableSchema);
    }

    SSDataBlock* pBlock = createDataBlock();
    if (pBlock == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    for (int32_t i = 0; i < numOfCols; ++i) {
      SColumnInfoData idata = createColumnInfoData(pSchema[i].type, pSchema[i].bytes, pSchema[i].colId);
      blockDataAppendColInfo(pBlock, &idata);
    }

    blockDecode(pBlock, numOfCols, numOfRows, pStart);

    // the relocation below writes numOfRows rows into pRes, so a failed resize must not be ignored
    int32_t code = blockDataEnsureCapacity(pRes, numOfRows);
    if (code != TSDB_CODE_SUCCESS) {
      blockDataDestroy(pBlock);
      return code;
    }

    // data from mnode
    pRes->info.rows = numOfRows;
    relocateColumnData(pRes, pColList, pBlock->pDataBlock, false);
    blockDataDestroy(pBlock);
  }

  // todo move this to time window aggregator, since the primary timestamp may not be known by exchange operator.
  blockDataUpdateTsWindow(pRes, 0);

  int64_t el = taosGetTimestampUs() - startTs;

  pLoadInfo->totalRows += numOfRows;
  pLoadInfo->totalSize += compLen;

  if (total != NULL) {
    *total += numOfRows;
  }

  pLoadInfo->totalElapsed += el;
  return TSDB_CODE_SUCCESS;
}
2130

L
Liu Jicong 已提交
2131 2132
// Finish the exchange operator after all of its sources have been consumed.
// The time elapsed since startTs (a taosGetTimestampUs() value) is added to the accumulated load
// statistics, the totals are logged, and the operator is flagged as completed.
// Always returns NULL so that callers can hand the value back directly as their result.
static void* setAllSourcesCompleted(SOperatorInfo* pOperator, int64_t startTs) {
  SExecTaskInfo*       pTask = pOperator->pTaskInfo;
  SExchangeInfo*       pExchange = pOperator->info;
  SLoadRemoteDataInfo* pStat = &pExchange->loadInfo;

  // account for the time spent in the final (empty) round as well
  pStat->totalElapsed += (taosGetTimestampUs() - startTs);

  size_t numOfSources = taosArrayGetSize(pExchange->pSources);
  qDebug("%s all %" PRIzu " sources are exhausted, total rows: %" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
         GET_TASKID(pTask), numOfSources, pStat->totalRows, pStat->totalSize, pStat->totalElapsed / 1000.0);

  doSetOperatorCompleted(pOperator);
  return NULL;
}

L
Liu Jicong 已提交
2149 2150
// Poll all sources that were requested concurrently and return the first block that is ready.
// Each pass walks every source: exhausted sources are counted, sources without a ready response are
// skipped, and the first ready response is decoded into pExchangeInfo->pResult. If the source is not
// finished, a new fetch request is issued for it before the block is returned.
// Returns pExchangeInfo->pResult when data is available, the result of setAllSourcesCompleted()
// (NULL) when every source is exhausted, or NULL with pTaskInfo->code set when an error occurs.
static SSDataBlock* concurrentlyLoadRemoteDataImpl(SOperatorInfo* pOperator, SExchangeInfo* pExchangeInfo,
                                                   SExecTaskInfo* pTaskInfo) {
  int32_t              code = 0;
  int64_t              startTs = taosGetTimestampUs();
  size_t               totalSources = taosArrayGetSize(pExchangeInfo->pSources);
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;

  for (;;) {
    int32_t completed = 0;

    for (int32_t i = 0; i < totalSources; ++i) {
      SSourceDataInfo* pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, i);

      if (pDataInfo->status == EX_SOURCE_DATA_EXHAUSTED) {
        ++completed;
        continue;
      }

      // no response has arrived for this source yet
      if (pDataInfo->status != EX_SOURCE_DATA_READY) {
        continue;
      }

      // the response carries an error: abort the whole task
      if (pDataInfo->code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = pDataInfo->code;
        return NULL;
      }

      SRetrieveTableRsp*     pRsp = pDataInfo->pRsp;
      SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, i);
      SSDataBlock*           pRes = pExchangeInfo->pResult;

      // an empty response means this source has nothing more to deliver
      if (pRsp->numOfRows == 0) {
        qDebug("%s vgId:%d, taskId:0x%" PRIx64 " execId:%d index:%d completed, rowsOfSource:%" PRIu64
               ", totalRows:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pDataInfo->totalRows,
               pLoadInfo->totalRows, completed + 1, i + 1, totalSources);
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
        ++completed;
        taosMemoryFreeClear(pDataInfo->pRsp);
        continue;
      }

      code = extractDataBlockFromFetchRsp(pRes, pLoadInfo, pRsp->numOfRows, pRsp->data, pRsp->compLen,
                                          pRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
      if (code != 0) {
        taosMemoryFreeClear(pDataInfo->pRsp);
        pTaskInfo->code = code;
        return NULL;
      }

      if (pRsp->completed == 1) {
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d"
               " index:%d completed, numOfRows:%d, rowsOfSource:%" PRIu64 ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64
               ", completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pRes->info.rows,
               pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, completed + 1, i + 1, totalSources);
        ++completed;
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      } else {
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
               ", totalBytes:%" PRIu64,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
               pLoadInfo->totalRows, pLoadInfo->totalSize);
      }

      // the payload has been decoded into pRes, the raw response is no longer needed
      taosMemoryFreeClear(pDataInfo->pRsp);

      // the source still has data: ask for its next batch before handing out this one
      if (pDataInfo->status != EX_SOURCE_DATA_EXHAUSTED) {
        pDataInfo->status = EX_SOURCE_DATA_NOT_READY;
        code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
        if (code != TSDB_CODE_SUCCESS) {
          taosMemoryFreeClear(pDataInfo->pRsp);
          pTaskInfo->code = code;
          return NULL;
        }
      }

      return pExchangeInfo->pResult;
    }

    if (completed == totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
    }

    // nothing was ready in this pass: give up the CPU before polling again
    sched_yield();
  }
}

L
Liu Jicong 已提交
2240 2241 2242
// Open step for the concurrent load mode: send one fetch request to every source, then block on
// the exchange operator's "ready" semaphore.
// Returns TSDB_CODE_SUCCESS, or the first non-success code returned by doSendFetchDataRequest()
// (the same code is stored in the task info).
static int32_t prepareConcurrentlyLoad(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchange = pOperator->info;
  SExecTaskInfo* pTask = pOperator->pTaskInfo;

  size_t  numOfSources = taosArrayGetSize(pExchange->pSources);
  int64_t begin = taosGetTimestampUs();

  // Asynchronously send all fetch requests to all sources.
  int32_t idx = 0;
  while (idx < numOfSources) {
    int32_t rc = doSendFetchDataRequest(pExchange, pTask, idx);
    if (rc != TSDB_CODE_SUCCESS) {
      pTask->code = rc;
      return rc;
    }

    idx += 1;
  }

  int64_t finish = taosGetTimestampUs();
  qDebug("%s send all fetch requests to %" PRIzu " sources completed, elapsed:%.2fms", GET_TASKID(pTask),
         numOfSources, (finish - begin) / 1000.0);

  pOperator->status = OP_RES_TO_RETURN;
  pOperator->cost.openCost = taosGetTimestampUs() - begin;

  tsem_wait(&pExchange->ready);
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
2267 2268 2269
// Load data from the sources one after another (sequential mode).
// For the current source a fetch request is sent and the function blocks on the "ready" semaphore
// until the response is signalled. An empty response, or a response flagged as completed, advances
// to the next source.
// Returns pExchangeInfo->pResult when a non-empty block has been decoded, the result of
// setAllSourcesCompleted() (NULL) when all sources are exhausted, or NULL with the task code set
// when sending the request, the response itself, or decoding the response reports an error.
static SSDataBlock* seqLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
  int64_t startTs = taosGetTimestampUs();

  while (1) {
    if (pExchangeInfo->current >= totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
    }

    // Do not wait on the semaphore when the request could not be sent, same handling as in
    // concurrentlyLoadRemoteDataImpl.
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, pExchangeInfo->current);
    if (code != TSDB_CODE_SUCCESS) {
      pTaskInfo->code = code;
      return NULL;
    }

    tsem_wait(&pExchangeInfo->ready);

    SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, pExchangeInfo->current);
    SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, pExchangeInfo->current);

    if (pDataInfo->code != TSDB_CODE_SUCCESS) {
      qError("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d error happens, code:%s", GET_TASKID(pTaskInfo),
             pSource->addr.nodeId, pSource->taskId, pSource->execId, tstrerror(pDataInfo->code));
      pTaskInfo->code = pDataInfo->code;
      return NULL;
    }

    SRetrieveTableRsp*   pRsp = pDataInfo->pRsp;
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;

    // an empty response means the current source is drained: move on to the next one
    if (pRsp->numOfRows == 0) {
      qDebug("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d %d of total completed, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 " try next",
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pExchangeInfo->current + 1,
             pDataInfo->totalRows, pLoadInfo->totalRows);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
      taosMemoryFreeClear(pDataInfo->pRsp);
      continue;
    }

    SSDataBlock* pRes = pExchangeInfo->pResult;

    code = extractDataBlockFromFetchRsp(pRes, pLoadInfo, pRsp->numOfRows, pRsp->data, pRsp->compLen, pRsp->numOfCols,
                                        startTs, &pDataInfo->totalRows, NULL);
    if (code != TSDB_CODE_SUCCESS) {
      // a block that failed to decode must not be returned to the caller
      taosMemoryFreeClear(pDataInfo->pRsp);
      pTaskInfo->code = code;
      return NULL;
    }

    if (pRsp->completed == 1) {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64 " try next %d/%" PRIzu,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, pExchangeInfo->current + 1,
             totalSources);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
    } else {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
             ", totalBytes:%" PRIu64,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pLoadInfo->totalRows, pLoadInfo->totalSize);
    }

    pOperator->resultInfo.totalRows += pRes->info.rows;
    taosMemoryFreeClear(pDataInfo->pRsp);
    return pExchangeInfo->pResult;
  }
}

L
Liu Jicong 已提交
2334
// Open function of the exchange operator.
// Does nothing when the operator is already opened. In concurrent mode (seqLoadData == false) the
// fetch requests are dispatched through prepareConcurrentlyLoad(); in sequential mode nothing is
// sent here. On success the operator is marked as opened and the open cost is recorded.
// Returns TSDB_CODE_SUCCESS or the error code of prepareConcurrentlyLoad().
static int32_t prepareLoadRemoteData(SOperatorInfo* pOperator) {
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
  }

  int64_t        begin = taosGetTimestampUs();
  SExchangeInfo* pExchange = pOperator->info;

  int32_t rc = TSDB_CODE_SUCCESS;
  if (!pExchange->seqLoadData) {
    rc = prepareConcurrentlyLoad(pOperator);
  }

  if (rc != TSDB_CODE_SUCCESS) {
    return rc;
  }

  OPTR_SET_OPENED(pOperator);
  pOperator->cost.openCost = (taosGetTimestampUs() - begin) / 1000.0;
  return TSDB_CODE_SUCCESS;
}

2354
// Fetch the next block for the exchange operator.
// The operator's open function is invoked first and its return code is stored in the task info;
// a non-success code yields NULL. When the operator is already done the totals are logged and
// NULL is returned; otherwise the call is dispatched to the sequential or concurrent loader
// according to seqLoadData.
static SSDataBlock* doLoadRemoteDataImpl(SOperatorInfo* pOperator) {
  SExecTaskInfo* pTask = pOperator->pTaskInfo;
  SExchangeInfo* pExchange = pOperator->info;

  pTask->code = pOperator->fpSet._openFn(pOperator);
  if (pTask->code != TSDB_CODE_SUCCESS) {
    return NULL;
  }

  if (pOperator->status == OP_EXEC_DONE) {
    size_t               numOfSources = taosArrayGetSize(pExchange->pSources);
    SLoadRemoteDataInfo* pStat = &pExchange->loadInfo;

    qDebug("%s all %" PRIzu " source(s) are exhausted, total rows:%" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
           GET_TASKID(pTask), numOfSources, pStat->totalRows, pStat->totalSize, pStat->totalElapsed / 1000.0);
    return NULL;
  }

  return pExchange->seqLoadData ? seqLoadRemoteData(pOperator)
                                : concurrentlyLoadRemoteDataImpl(pOperator, pExchange, pTask);
}
2379

2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417
// Result function of the exchange operator: fetch blocks and apply the limit/offset setting.
// Blocks are pulled through doLoadRemoteDataImpl(). Without limit/offset information the block is
// returned unchanged. Otherwise handleLimitOffset() decides whether another block has to be
// fetched (PROJECT_RETRIEVE_CONTINUE) or the current one is final (PROJECT_RETRIEVE_DONE); in the
// latter case a block with zero rows completes the operator.
// Returns the exchange result block, or NULL when no (more) data is available.
static SSDataBlock* doLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchange = pOperator->info;

  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  for (;;) {
    SSDataBlock* pBlock = doLoadRemoteDataImpl(pOperator);
    if (pBlock == NULL) {
      return NULL;
    }

    ASSERT(pBlock == pExchange->pResult);

    SLimitInfo* pLimit = &pExchange->limitInfo;
    if (!hasLimitOffsetInfo(pLimit)) {
      return pExchange->pResult;
    }

    int32_t status = handleLimitOffset(pOperator, pLimit, pExchange->pResult, false);
    if (status == PROJECT_RETRIEVE_CONTINUE) {
      continue;
    }

    if (status == PROJECT_RETRIEVE_DONE) {
      size_t numOfRows = pExchange->pResult->info.rows;
      pExchange->limitInfo.numOfOutputRows += numOfRows;

      if (numOfRows == 0) {
        doSetOperatorCompleted(pOperator);
        return NULL;
      }

      return pExchange->pResult;
    }

    // any other status: fetch the next block
  }
}

2418
// Create the per-source bookkeeping array of the exchange operator.
// One SSourceDataInfo entry is appended for each source, initialised as "not ready" and tagged
// with the task id string and its index.
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the array cannot be created or
// extended. On failure pInfo->pSourceDataInfo is NULL.
static int32_t initDataSource(int32_t numOfSources, SExchangeInfo* pInfo, const char* id) {
  pInfo->pSourceDataInfo = taosArrayInit(numOfSources, sizeof(SSourceDataInfo));
  if (pInfo->pSourceDataInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  for (int32_t i = 0; i < numOfSources; ++i) {
    SSourceDataInfo dataInfo = {0};
    dataInfo.status = EX_SOURCE_DATA_NOT_READY;
    dataInfo.taskId = id;
    dataInfo.index = i;

    SSourceDataInfo* pDs = taosArrayPush(pInfo->pSourceDataInfo, &dataInfo);
    if (pDs == NULL) {
      taosArrayDestroy(pInfo->pSourceDataInfo);
      // reset the pointer so that a later cleanup of pInfo cannot release the array a second time
      pInfo->pSourceDataInfo = NULL;
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
}

2439
// Initialise the exchange info from the physical plan node.
// Copies every downstream source node of pExNode into pInfo->pSources, sets up the limit info,
// registers pInfo in the exchange reference pool and creates the per-source state array.
// Returns TSDB_CODE_SUCCESS, TSDB_CODE_INVALID_PARA when the node has no (or an invalid) source,
// or TSDB_CODE_OUT_OF_MEMORY. Arrays already created stay attached to pInfo on failure.
// NOTE(review): presumably the caller releases them through its own cleanup of pInfo - confirm.
static int32_t initExchangeOperator(SExchangePhysiNode* pExNode, SExchangeInfo* pInfo, const char* id) {
  size_t numOfSources = LIST_LENGTH(pExNode->pSrcEndPoints);

  if (numOfSources == 0) {
    qError("%s invalid number: %d of sources in exchange operator", id, (int32_t)numOfSources);
    return TSDB_CODE_INVALID_PARA;
  }

  pInfo->pSources = taosArrayInit(numOfSources, sizeof(SDownstreamSourceNode));
  if (pInfo->pSources == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  for (int32_t i = 0; i < (int32_t)numOfSources; ++i) {
    SDownstreamSourceNode* pNode = (SDownstreamSourceNode*)nodesListGetNode((SNodeList*)pExNode->pSrcEndPoints, i);
    if (pNode == NULL) {
      // never copy from a missing list entry
      return TSDB_CODE_INVALID_PARA;
    }

    if (taosArrayPush(pInfo->pSources, pNode) == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  initLimitInfo(pExNode->node.pLimit, pExNode->node.pSlimit, &pInfo->limitInfo);

  // NOTE(review): the result of taosAddRef() is stored without being validated - confirm whether a
  // failure value needs to be handled here.
  pInfo->self = taosAddRef(exchangeObjRefPool, pInfo);

  return initDataSource(numOfSources, pInfo, id);
}

// Create an exchange operator for the given physical plan node.
// pTransporter is stored in the exchange info as is; pTaskInfo is the task this operator belongs to.
// Returns the new operator, or NULL on failure with pTaskInfo->code set to the error code.
SOperatorInfo* createExchangeOperatorInfo(void* pTransporter, SExchangePhysiNode* pExNode, SExecTaskInfo* pTaskInfo) {
  // Declared before the first "goto _error": the error path stores this value in the task info, so
  // it must hold a defined value even when the allocations below fail.
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;

  SExchangeInfo* pInfo = taosMemoryCalloc(1, sizeof(SExchangeInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  code = initExchangeOperator(pExNode, pInfo, GET_TASKID(pTaskInfo));
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  tsem_init(&pInfo->ready, 0, 0);

  pInfo->seqLoadData = false;
  pInfo->pTransporter = pTransporter;
  // NOTE(review): the block returned by createResDataBlock() is dereferenced below without a NULL
  // check - confirm that it cannot fail.
  pInfo->pResult = createResDataBlock(pExNode->node.pOutputDataBlockDesc);

  pOperator->name = "ExchangeOperator";
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_EXCHANGE;
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pResult->pDataBlock);
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(prepareLoadRemoteData, doLoadRemoteData, NULL, NULL,
                                         destroyExchangeOperatorInfo, NULL, NULL, NULL);
  return pOperator;

_error:
  if (pInfo != NULL) {
    doDestroyExchangeOperatorInfo(pInfo);
  }

  taosMemoryFreeClear(pOperator);
  pTaskInfo->code = code;
  return NULL;
}

dengyihao's avatar
dengyihao 已提交
2502 2503
static int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                                const char* pKey);
2504

2505
static void destroySortedMergeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
2506
  SSortedMergeOperatorInfo* pInfo = (SSortedMergeOperatorInfo*)param;
H
Haojun Liao 已提交
2507
  taosArrayDestroy(pInfo->pSortInfo);
2508 2509 2510
  taosArrayDestroy(pInfo->groupInfo);

  if (pInfo->pSortHandle != NULL) {
H
Haojun Liao 已提交
2511
    tsortDestroySortHandle(pInfo->pSortHandle);
2512 2513
  }

H
Haojun Liao 已提交
2514
  blockDataDestroy(pInfo->binfo.pRes);
H
Haojun Liao 已提交
2515
  cleanupAggSup(&pInfo->aggSup);
L
Liu Jicong 已提交
2516

D
dapan1121 已提交
2517
  taosMemoryFreeClear(param);
2518
}
H
Haojun Liao 已提交
2519

L
Liu Jicong 已提交
2520
// Check whether row rowIndex of pBlock belongs to the group whose values are saved in buf.
// groupInfo holds the column indexes (int32_t) of the group-by columns in pBlock; buf[i] is the
// saved value of the i-th group column, or NULL.
// Returns true when there are no group columns or when every group column of the row equals the
// saved value, false as soon as one column differs.
static bool needToMerge(SSDataBlock* pBlock, SArray* groupInfo, char** buf, int32_t rowIndex) {
  size_t size = taosArrayGetSize(groupInfo);
  if (size == 0) {
    return true;
  }

  for (int32_t i = 0; i < size; ++i) {
    int32_t* index = taosArrayGet(groupInfo, i);

    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
    bool             isNull = colDataIsNull(pColInfo, rowIndex, pBlock->info.rows, NULL);

    // exactly one side is NULL: different group
    if ((isNull && buf[i] != NULL) || (!isNull && buf[i] == NULL)) {
      return false;
    }

    // both sides are NULL: the column matches and there is no data to compare
    if (isNull) {
      continue;
    }

    char* pCell = colDataGetData(pColInfo, rowIndex);
    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      if (varDataLen(pCell) != varDataLen(buf[i])) {
        return false;
      }

      if (memcmp(varDataVal(pCell), varDataVal(buf[i]), varDataLen(pCell)) != 0) {
        return false;
      }
    } else if (memcmp(pCell, buf[i], pColInfo->info.bytes) != 0) {
      return false;
    }
  }

  // all group columns are identical: the row is merged into the current group
  return true;
}

L
Liu Jicong 已提交
2555 2556 2557
// Placeholder for merging one input row into the aggregate contexts.
// The actual merge logic is disabled (kept below as comments), so this function currently only
// walks over the contexts without changing anything.
static void doMergeResultImpl(SSortedMergeOperatorInfo* pInfo, SqlFunctionCtx* pCtx, int32_t numOfExpr,
                              int32_t rowIndex) {
  // TODO set row index
  //    pCtx[j].startRow = rowIndex;

  int32_t j = 0;
  while (j < numOfExpr) {
    int32_t functionId = pCtx[j].functionId;
    (void)functionId;
    //    pCtx[j].fpSet->addInput(&pCtx[j]);

    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_MERGE);
    //    } else {
    //      assert(!TSDB_FUNC_IS_SCALAR(functionId));
    //      aAggs[functionId].mergeFunc(&pCtx[j]);
    //    }
    j += 1;
  }
}
2574

L
Liu Jicong 已提交
2575 2576
// Placeholder for finalizing the aggregate result of the current group.
// The finalize calls are disabled (kept below as comments); the function currently has no effect.
static void doFinalizeResultImpl(SqlFunctionCtx* pCtx, int32_t numOfExpr) {
  int32_t j = 0;
  while (j < numOfExpr) {
    int32_t functionId = pCtx[j].functionId;
    (void)functionId;
    //    if (functionId == FUNC_TAG_DUMMY || functionId == FUNC_TS_DUMMY) {
    //      continue;
    //    }

    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_FINALIZE);
    //    } else {
    //    pCtx[j].fpSet.finalize(&pCtx[j]);
    j += 1;
  }
}
2589

2590
// Copy the group column values of row rowIndex into the caller supplied buffers.
// pColumnList holds the column indexes (int32_t) within pBlock; rowColData[i] receives the value of
// the i-th listed column, copied with the length reported by colDataGetLength().
// Always returns true.
static bool saveCurrentTuple(char** rowColData, SArray* pColumnList, SSDataBlock* pBlock, int32_t rowIndex) {
  int32_t numOfCols = (int32_t)taosArrayGetSize(pColumnList);

  int32_t k = 0;
  while (k < numOfCols) {
    int32_t*         pSlot = taosArrayGet(pColumnList, k);
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, *pSlot);

    char* pVal = colDataGetData(pCol, rowIndex);
    memcpy(rowColData[k], pVal, colDataGetLength(pCol, rowIndex));
    k += 1;
  }

  return true;
}
2603

2604 2605
// Merge the rows of pBlock group by group.
// The first row seen starts a group and its group values are saved. Every following row is either
// merged into the current group (needToMerge() is true) or closes it: the group is finalized, the
// number of produced rows is added to the result block, the process function of every context
// with a non-negative function id is invoked, and the row starts a new group.
static void doMergeImpl(SOperatorInfo* pOperator, int32_t numOfExpr, SSDataBlock* pBlock) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  SqlFunctionCtx*           pCtx = pOperator->exprSupp.pCtx;

  for (int32_t row = 0; row < pBlock->info.rows; ++row) {
    // no group has been started yet
    if (!pInfo->hasGroupVal) {
      ASSERT(row == 0);
      doMergeResultImpl(pInfo, pCtx, numOfExpr, row);
      pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, row);
      continue;
    }

    // same group as the saved tuple
    if (needToMerge(pBlock, pInfo->groupInfo, pInfo->groupVal, row)) {
      doMergeResultImpl(pInfo, pCtx, numOfExpr, row);
      continue;
    }

    // the group changed: close the current one
    doFinalizeResultImpl(pCtx, numOfExpr);
    int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
    //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);

    // TODO check for available buffer;

    // next group info data
    pInfo->binfo.pRes->info.rows += numOfRows;
    for (int32_t j = 0; j < numOfExpr; ++j) {
      if (pCtx[j].functionId >= 0) {
        pCtx[j].fpSet.process(&pCtx[j]);
      }
    }

    doMergeResultImpl(pInfo, pCtx, numOfExpr, row);
    pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, row);
  }
}

2641 2642
// Drain the sort handle and merge all sorted tuples into the operator's result block.
// Tuples are collected into a temporary block of at most resultInfo.capacity rows, which is then
// processed by doMergeImpl(); this repeats until the sort handle delivers no more tuples. Finally
// the last group is finalized and its rows are added to the result block.
// Returns the result block when it holds at least one row, otherwise NULL.
static SSDataBlock* doMerge(SOperatorInfo* pOperator) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  SSortHandle*              pHandle = pInfo->pSortHandle;

  SSDataBlock* pDataBlock = createOneDataBlock(pInfo->binfo.pRes, false);
  blockDataEnsureCapacity(pDataBlock, pOperator->resultInfo.capacity);

  while (1) {
    blockDataCleanup(pDataBlock);
    while (1) {
      STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
      if (pTupleHandle == NULL) {
        break;
      }

      // build datablock for merge for one group
      appendOneRowToDataBlock(pDataBlock, pTupleHandle);
      if (pDataBlock->info.rows >= pOperator->resultInfo.capacity) {
        break;
      }
    }

    if (pDataBlock->info.rows == 0) {
      break;
    }

    setInputDataBlock(pOperator, pOperator->exprSupp.pCtx, pDataBlock, TSDB_ORDER_ASC, MAIN_SCAN, true);
    //  updateOutputBuf(&pInfo->binfo, &pAggInfo->bufCapacity, pBlock->info.rows * pAggInfo->resultRowFactor,
    //  pOperator->pRuntimeEnv, true);
    doMergeImpl(pOperator, pOperator->exprSupp.numOfExprs, pDataBlock);
    // flush to tuple store, and after all data have been handled, return to upstream node or sink node
  }

  doFinalizeResultImpl(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs);
  int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
  //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);

  // TODO check for available buffer;

  // next group info data
  pInfo->binfo.pRes->info.rows += numOfRows;

  // The temporary input block is owned by this function; release it only after the contexts have
  // been finalized.
  // NOTE(review): assumes the function contexts do not read their input columns after this point.
  blockDataDestroy(pDataBlock);

  return (pInfo->binfo.pRes->info.rows > 0) ? pInfo->binfo.pRes : NULL;
}
2684

L
Liu Jicong 已提交
2685 2686
// Read up to capacity sorted rows from pHandle and copy them into pDataBlock.
// pDataBlock is cleaned first. The tuples are gathered in a block obtained from
// tsortGetSortedDataBlock(), the columns are assigned to pDataBlock according to pColMatchInfo
// (entries must use COL_MATCH_FROM_SLOT_ID), and the intermediate block is destroyed.
// pInfo is not used. Returns pDataBlock when it holds at least one row, otherwise NULL.
SSDataBlock* getSortedMergeBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity,
                                     SArray* pColMatchInfo, SSortedMergeOperatorInfo* pInfo) {
  blockDataCleanup(pDataBlock);

  SSDataBlock* pSorted = tsortGetSortedDataBlock(pHandle);
  if (pSorted == NULL) {
    return NULL;
  }

  blockDataEnsureCapacity(pSorted, capacity);

  // pull tuples until the handle is drained or the block is full
  for (STupleHandle* pTuple = tsortNextTuple(pHandle); pTuple != NULL; pTuple = tsortNextTuple(pHandle)) {
    appendOneRowToDataBlock(pSorted, pTuple);
    if (pSorted->info.rows >= capacity) {
      break;
    }
  }

  if (pSorted->info.rows > 0) {
    int32_t numOfCols = taosArrayGetSize(pColMatchInfo);

    int32_t c = 0;
    while (c < numOfCols) {
      SColMatchInfo* pMatch = taosArrayGet(pColMatchInfo, c);
      ASSERT(pMatch->matchType == COL_MATCH_FROM_SLOT_ID);

      SColumnInfoData* pFrom = taosArrayGet(pSorted->pDataBlock, pMatch->srcSlotId);
      SColumnInfoData* pTo = taosArrayGet(pDataBlock->pDataBlock, pMatch->targetSlotId);
      colDataAssign(pTo, pFrom, pSorted->info.rows, &pDataBlock->info);
      c += 1;
    }

    pDataBlock->info.rows = pSorted->info.rows;
    pDataBlock->info.capacity = pSorted->info.rows;
  }

  blockDataDestroy(pSorted);

  if (pDataBlock->info.rows > 0) {
    return pDataBlock;
  }

  return NULL;
}

2727
// Result function of the sorted-merge operator.
// On the first call a multi-source merge sort handle is created, every downstream operator is
// registered as a sort source, the sort is opened and the merged result is produced by doMerge().
// Later calls (status OP_RES_TO_RETURN) read the next block through getSortedMergeBlockData().
// Returns NULL when the operator is done or no data is available. Failures while setting up the
// sort are reported by longjmp() to pTaskInfo->env.
static SSDataBlock* doSortedMerge(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExecTaskInfo*            pTaskInfo = pOperator->pTaskInfo;
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  if (pOperator->status == OP_RES_TO_RETURN) {
    return getSortedMergeBlockData(pInfo->pSortHandle, pInfo->binfo.pRes, pOperator->resultInfo.capacity, NULL, pInfo);
  }

  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
  // pass the real task id string, not the text of the macro invocation
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->binfo.pRes, GET_TASKID(pTaskInfo));

  tsortSetFetchRawDataFp(pInfo->pSortHandle, loadNextDataBlock, NULL, NULL);

  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
    if (ps == NULL) {
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    ps->param = pOperator->pDownstream[i];
    tsortAddSource(pInfo->pSortHandle, ps);
  }

  int32_t code = tsortOpen(pInfo->pSortHandle);
  if (code != TSDB_CODE_SUCCESS) {
    // longjmp() with 0 would be delivered as 1; fall back to the returned code when terrno is unset
    longjmp(pTaskInfo->env, (terrno != 0) ? terrno : code);
  }

  pOperator->status = OP_RES_TO_RETURN;
  return doMerge(pOperator);
}
2758

L
Liu Jicong 已提交
2759 2760
// Set up the group-by bookkeeping of the sorted-merge operator.
// For every column in pGroupInfo the matching expression (resSchema.slotId == colId) is looked up
// in pExprInfo; its index is appended to pInfo->groupInfo. pInfo->groupVal is allocated as one
// buffer: an array of one pointer per group column, followed by the value storage those pointers
// refer to (pCol->bytes bytes per column).
// Returns 0 when there is no group column, TSDB_CODE_SUCCESS on success, or
// TSDB_CODE_OUT_OF_MEMORY. pInfo->groupInfo stays attached to pInfo on failure.
static int32_t initGroupCol(SExprInfo* pExprInfo, int32_t numOfCols, SArray* pGroupInfo,
                            SSortedMergeOperatorInfo* pInfo) {
  if (pGroupInfo == NULL || taosArrayGetSize(pGroupInfo) == 0) {
    return 0;
  }

  int32_t len = 0;
  SArray* plist = taosArrayInit(3, sizeof(SColumn));
  pInfo->groupInfo = taosArrayInit(3, sizeof(int32_t));

  if (plist == NULL || pInfo->groupInfo == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // the number of group columns comes from the input list; pInfo->groupInfo is still empty here
  size_t numOfGroupCol = taosArrayGetSize(pGroupInfo);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    SColumn* pCol = taosArrayGet(pGroupInfo, i);
    for (int32_t j = 0; j < numOfCols; ++j) {
      SExprInfo* pe = &pExprInfo[j];
      if (pe->base.resSchema.slotId != pCol->colId) {
        continue;
      }

      if (taosArrayPush(plist, pCol) == NULL || taosArrayPush(pInfo->groupInfo, &j) == NULL) {
        taosArrayDestroy(plist);
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      len += pCol->bytes;
      break;
    }
  }

  // every group column must have a matching expression
  ASSERT(numOfGroupCol == taosArrayGetSize(plist));

  pInfo->groupVal = taosMemoryCalloc(1, (POINTER_BYTES * numOfGroupCol + len));
  if (pInfo->groupVal == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // The value area starts right behind the pointer array. The offset is computed in bytes:
  // arithmetic on the pointer-to-pointer itself would scale it by the pointer size.
  int32_t offset = 0;
  char*   start = (char*)pInfo->groupVal + (POINTER_BYTES * numOfGroupCol);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    pInfo->groupVal[i] = start + offset;
    SColumn* pCol = taosArrayGet(plist, i);
    offset += pCol->bytes;
  }

  taosArrayDestroy(plist);

  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2807

L
Liu Jicong 已提交
2808 2809 2810
// Create a sorted-merge operator on top of the given downstream operators.
// pExprInfo/num describe the output expressions, pSortInfo the sort order (stored in the operator
// info and released together with it) and pGroupInfo the optional group-by columns.
// Returns the new operator, or NULL on failure with terrno set to TSDB_CODE_QRY_OUT_OF_MEMORY.
// NOTE(review): pInfo->binfo.pRes is not assigned anywhere in this function before it is checked
// against NULL below - confirm where the result block is expected to come from.
SOperatorInfo* createSortedMergeOperatorInfo(SOperatorInfo** downstream, int32_t numOfDownstream, SExprInfo* pExprInfo,
                                             int32_t num, SArray* pSortInfo, SArray* pGroupInfo,
                                             SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_SUCCESS;

  SSortedMergeOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SSortedMergeOperatorInfo));
  SOperatorInfo*            pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  code = initExprSupp(&pOperator->exprSupp, pExprInfo, num);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initResultRowInfo(&pInfo->binfo.resultRowInfo);

  if (pOperator->exprSupp.pCtx == NULL || pInfo->binfo.pRes == NULL) {
    goto _error;
  }

  size_t keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
  code = doInitAggInfoSup(&pInfo->aggSup, pOperator->exprSupp.pCtx, num, keyBufSize, pTaskInfo->id.str);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, num);
  code = initGroupCol(pExprInfo, num, pGroupInfo, pInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  //  pInfo->resultRowFactor = (int32_t)(getRowNumForMultioutput(pRuntimeEnv->pQueryAttr,
  //      pRuntimeEnv->pQueryAttr->topBotQuery, false));
  pInfo->sortBufSize = 1024 * 16;  // 16KB
  pInfo->bufPageSize = 1024;
  pInfo->pSortInfo = pSortInfo;

  pOperator->resultInfo.capacity = blockDataGetCapacityInRow(pInfo->binfo.pRes, pInfo->bufPageSize);

  pOperator->name = "SortedMerge";
  // pOperator->operatorType = OP_SortedMerge;
  pOperator->blocking = true;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doSortedMerge, NULL, NULL, destroySortedMergeOperatorInfo,
                                         NULL, NULL, NULL);
  code = appendDownstream(pOperator, downstream, numOfDownstream);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  if (pInfo != NULL) {
    // destroySortedMergeOperatorInfo() also frees pInfo itself, so it must not be freed again here
    destroySortedMergeOperatorInfo(pInfo, num);
    pInfo = NULL;
  }

  taosMemoryFreeClear(pOperator);
  terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
  return NULL;
}

X
Xiaoyu Wang 已提交
2875
// Find the scan order and scan flag that apply to pOperator.
// Exchange, system-table scan, stream scan, tag scan, block-dist scan and last-row scan operators
// report TSDB_ORDER_ASC / MAIN_SCAN. A table scan operator reports the values stored in its scan
// info. Every other operator forwards the question to its first downstream operator.
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_INVALID_PARA when there is no downstream operator to ask.
int32_t getTableScanInfo(SOperatorInfo* pOperator, int32_t* order, int32_t* scanFlag) {
  // todo add more information about exchange operation
  int32_t opType = pOperator->operatorType;

  bool fixedOrder = (opType == QUERY_NODE_PHYSICAL_PLAN_EXCHANGE) ||
                    (opType == QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN) ||
                    (opType == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) ||
                    (opType == QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN) ||
                    (opType == QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN) ||
                    (opType == QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN);
  if (fixedOrder) {
    *order = TSDB_ORDER_ASC;
    *scanFlag = MAIN_SCAN;
    return TSDB_CODE_SUCCESS;
  }

  if (opType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
    STableScanInfo* pScan = pOperator->info;
    *order = pScan->cond.order;
    *scanFlag = pScan->scanFlag;
    return TSDB_CODE_SUCCESS;
  }

  // any other operator: ask the first downstream operator
  if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  return getTableScanInfo(pOperator->pDownstream[0], order, scanFlag);
}
L
Liu Jicong 已提交
2897
#if 0
L
Liu Jicong 已提交
2898
/**
 * Position the table scan that feeds a stream scan operator at (uid, ts).
 *
 * Every operator visited on the way down is marked OP_OPENED. Operators other than the stream
 * scan simply forward the request to their single downstream.
 *
 * @param pOperator operator to start from
 * @param uid       table uid to continue from; 0 marks the scan as having no table
 * @param ts        timestamp already consumed; the reader is reset to start at ts + 1
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_APP_ERROR when no unique stream scan is reachable.
 */
int32_t doPrepareScan(SOperatorInfo* pOperator, uint64_t uid, int64_t ts) {
  uint8_t type = pOperator->operatorType;

  pOperator->status = OP_OPENED;

  if (type != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    switch (pOperator->numOfDownstream) {
      case 1:
        return doPrepareScan(pOperator->pDownstream[0], uid, ts);
      case 0:
        qError("failed to find stream scan operator to set the input data block");
        return TSDB_CODE_QRY_APP_ERROR;
      default:
        qError("join not supported for stream block scan");
        return TSDB_CODE_QRY_APP_ERROR;
    }
  }

  SStreamScanInfo* pStreamInfo = pOperator->info;
  pStreamInfo->blockType = STREAM_INPUT__TABLE_SCAN;
  pStreamInfo->pTableScanOp->status = OP_OPENED;

  STableScanInfo* pInfo = pStreamInfo->pTableScanOp->info;
  ASSERT(pInfo->scanMode == TABLE_SCAN__TABLE_ORDER);

  if (uid == 0) {
    pInfo->noTable = 1;
    return TSDB_CODE_SUCCESS;
  }

  pInfo->noTable = 0;

  // the reader is already positioned right after (uid, ts): nothing to do
  if (pInfo->lastStatus.uid == uid && pInfo->lastStatus.ts == ts) {
    return TSDB_CODE_SUCCESS;
  }

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  // locate the table in the task's table list and remember its index
  int32_t tableSz = taosArrayGetSize(pTaskInfo->tableqinfoList.pTableList);
  bool    found = false;
  int32_t idx = 0;
  while (idx < tableSz) {
    STableKeyInfo* pTableInfo = taosArrayGet(pTaskInfo->tableqinfoList.pTableList, idx);
    if (pTableInfo->uid == uid) {
      found = true;
      pInfo->currentTable = idx;
    }
    idx += 1;
  }

  // TODO after processing drop, found can be false
  ASSERT(found);

  tsdbSetTableId(pInfo->dataReader, uid);

  // temporarily move the window start past ts for the reset, then restore it
  int64_t savedSkey = pInfo->cond.twindows.skey;
  pInfo->cond.twindows.skey = ts + 1;
  tsdbReaderReset(pInfo->dataReader, &pInfo->cond);
  pInfo->cond.twindows.skey = savedSkey;
  pInfo->scanTimes = 0;

  qDebug("tsdb reader offset seek to uid %" PRId64 " ts %" PRId64 ", table cur set to %d , all table num %d", uid, ts,
         pInfo->currentTable, tableSz);

  return TSDB_CODE_SUCCESS;
}

2965 2966 2967
/**
 * Fetch the last (uid, ts) position recorded by the table scan behind a stream scan operator.
 *
 * Operators other than the stream scan forward the request to their first downstream.
 *
 * @param pOperator operator to start from
 * @param uid       [out] lastStatus.uid of the underlying table scan
 * @param ts        [out] lastStatus.ts of the underlying table scan
 * @return TSDB_CODE_SUCCESS when a stream scan was found, TSDB_CODE_INVALID_PARA when the
 *         operator chain ends without one.
 */
int32_t doGetScanStatus(SOperatorInfo* pOperator, uint64_t* uid, int64_t* ts) {
  int32_t type = pOperator->operatorType;
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamScanInfo* pScanInfo = pOperator->info;
    STableScanInfo*  pSnapShotScanInfo = pScanInfo->pTableScanOp->info;
    *uid = pSnapShotScanInfo->lastStatus.uid;
    *ts = pSnapShotScanInfo->lastStatus.ts;
    return TSDB_CODE_SUCCESS;
  }

  // a leaf that is not a stream scan has no downstream array at all
  if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  // propagate the downstream result instead of unconditionally reporting success
  return doGetScanStatus(pOperator->pDownstream[0], uid, ts);
}
L
Liu Jicong 已提交
2982
#endif
2983

2984
// this is a blocking operator
L
Liu Jicong 已提交
2985
static int32_t doOpenAggregateOptr(SOperatorInfo* pOperator) {
H
Haojun Liao 已提交
2986 2987
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
2988 2989
  }

H
Haojun Liao 已提交
2990
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
2991
  SAggOperatorInfo* pAggInfo = pOperator->info;
H
Haojun Liao 已提交
2992

2993 2994
  SExprSupp*     pSup = &pOperator->exprSupp;
  SOperatorInfo* downstream = pOperator->pDownstream[0];
2995

2996 2997
  int64_t st = taosGetTimestampUs();

2998 2999 3000
  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;

H
Haojun Liao 已提交
3001
  while (1) {
3002
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
3003 3004 3005 3006
    if (pBlock == NULL) {
      break;
    }

3007 3008 3009 3010
    int32_t code = getTableScanInfo(pOperator, &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
3011

3012
    // there is an scalar expression that needs to be calculated before apply the group aggregation.
3013 3014 3015
    if (pAggInfo->scalarExprSup.pExprInfo != NULL) {
      SExprSupp* pSup1 = &pAggInfo->scalarExprSup;
      code = projectApplyFunctions(pSup1->pExprInfo, pBlock, pBlock, pSup1->pCtx, pSup1->numOfExprs, NULL);
3016
      if (code != TSDB_CODE_SUCCESS) {
3017
        longjmp(pTaskInfo->env, code);
3018
      }
3019 3020
    }

3021
    // the pDataBlock are always the same one, no need to call this again
3022 3023
    setExecutionContext(pOperator, pOperator->exprSupp.numOfExprs, pBlock->info.groupId, pAggInfo);
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, true);
3024
    code = doAggregateImpl(pOperator, pSup->pCtx);
3025 3026 3027
    if (code != 0) {
      longjmp(pTaskInfo->env, code);
    }
3028 3029
  }

H
Haojun Liao 已提交
3030
  closeAllResultRows(&pAggInfo->binfo.resultRowInfo);
3031
  initGroupedResultInfo(&pAggInfo->groupResInfo, pAggInfo->aggSup.pResultRowHashTable, 0);
H
Haojun Liao 已提交
3032
  OPTR_SET_OPENED(pOperator);
3033

3034
  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
H
Haojun Liao 已提交
3035 3036 3037
  return TSDB_CODE_SUCCESS;
}

3038
/**
 * Produce the next block of aggregate results.
 *
 * Opens the operator through its _openFn, then repeatedly builds a result block and applies
 * the operator's condition until either a non-empty block is available or the grouped results
 * are exhausted (in which case the operator is marked completed).
 *
 * @return the result block, or NULL when the operator is done, opening failed, or no rows remain.
 */
static SSDataBlock* getAggregateResult(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SAggOperatorInfo* pAggInfo = pOperator->info;
  SOptrBasicInfo*   pBasic = &pAggInfo->binfo;
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;

  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
    doSetOperatorCompleted(pOperator);
    return NULL;
  }

  blockDataEnsureCapacity(pBasic->pRes, pOperator->resultInfo.capacity);

  do {
    doBuildResultDatablock(pOperator, pBasic, &pAggInfo->groupResInfo, pAggInfo->aggSup.pResultBuf);
    doFilter(pAggInfo->pCondition, pBasic->pRes);

    if (!hasDataInGroupInfo(&pAggInfo->groupResInfo)) {
      doSetOperatorCompleted(pOperator);
      break;
    }
    // keep going while the filter removed every row of the current batch
  } while (!(pBasic->pRes->info.rows > 0));

  size_t rows = blockDataGetNumOfRows(pBasic->pRes);
  pOperator->resultInfo.totalRows += rows;

  if (rows == 0) {
    return NULL;
  }
  return pBasic->pRes;
}

wmmhello's avatar
wmmhello 已提交
3073
/**
 * Serialize every result row of an aggregate-like operator into one heap buffer.
 *
 * Layout written to *result:
 *   [int32 total length][int32 number of rows]
 *   then for each row: [int32 key length][key bytes][int32 row size][row bytes]
 *
 * The operator's info is expected to start with an SOptrBasicInfo immediately followed by an
 * SAggSupporter (that is how both are located here).
 *
 * @param pOperator operator whose result rows are encoded
 * @param result    [out] newly allocated buffer owned by the caller; NULL when there is no
 *                  result or on failure
 * @param length    [out] number of bytes written; 0 when there is no result
 * @return TSDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT for NULL output pointers, or
 *         TSDB_CODE_OUT_OF_MEMORY.
 */
int32_t aggEncodeResultRow(SOperatorInfo* pOperator, char** result, int32_t* length) {
  if (result == NULL || length == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }

  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
  int32_t         size = taosHashGetSize(pSup->pResultRowHashTable);
  size_t          keyLen = sizeof(uint64_t) * 2;  // estimate the key length
  int32_t         totalSize =
      sizeof(int32_t) + sizeof(int32_t) + size * (sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize);

  // no result
  if (getTotalBufSize(pSup->pResultBuf) == 0) {
    *result = NULL;
    *length = 0;
    return TSDB_CODE_SUCCESS;
  }

  *result = (char*)taosMemoryCalloc(1, totalSize);
  if (*result == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // the first int32 (total length) is filled in at the end; the row count follows it
  int32_t offset = sizeof(int32_t);
  *(int32_t*)(*result + offset) = size;
  offset += sizeof(int32_t);

  // mark the page of the current result row dirty
  SResultRowPosition* pos = &pInfo->resultRowInfo.cur;
  void*               pPage = getBufPage(pSup->pResultBuf, pos->pageId);
  setBufPageDirty(pPage, true);
  releaseBufPage(pSup->pResultBuf, pPage);

  void* pIter = taosHashIterate(pSup->pResultRowHashTable, NULL);
  while (pIter) {
    void*               key = taosHashGetKey(pIter, &keyLen);
    SResultRowPosition* p1 = (SResultRowPosition*)pIter;

    // keep the page referenced until the row has been copied out of it
    pPage = getBufPage(pSup->pResultBuf, p1->pageId);
    SResultRow* pRow = (SResultRow*)((char*)pPage + p1->offset);
    setBufPageDirty(pPage, true);

    // recalculate the result size: the real key may be longer than the estimate
    int32_t realTotalSize = offset + sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize;
    if (realTotalSize > totalSize) {
      char* tmp = (char*)taosMemoryRealloc(*result, realTotalSize);
      if (tmp == NULL) {
        releaseBufPage(pSup->pResultBuf, pPage);
        taosMemoryFree(*result);
        *result = NULL;
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      *result = tmp;
      totalSize = realTotalSize;  // remember the new capacity so later rows do not realloc again needlessly
    }

    // save key
    *(int32_t*)(*result + offset) = keyLen;
    offset += sizeof(int32_t);
    memcpy(*result + offset, key, keyLen);
    offset += keyLen;

    // save value
    *(int32_t*)(*result + offset) = pSup->resultRowSize;
    offset += sizeof(int32_t);
    memcpy(*result + offset, pRow, pSup->resultRowSize);
    offset += pSup->resultRowSize;

    releaseBufPage(pSup->pResultBuf, pPage);

    pIter = taosHashIterate(pSup->pResultRowHashTable, pIter);
  }

  *(int32_t*)(*result) = offset;
  *length = offset;

  return TSDB_CODE_SUCCESS;
}

3150
/**
 * Rebuild the result rows of an aggregate-like operator from a buffer produced by
 * aggEncodeResultRow().
 *
 * Expected layout:
 *   [int32 total length][int32 number of rows]
 *   then for each row: [int32 key length][key bytes][int32 row size][row bytes]
 *
 * Each record is validated against the encoded total length before any result row is
 * allocated or inserted into the hash table, so a truncated or corrupted buffer is rejected
 * without reading past the declared length.
 *
 * @param pOperator operator that receives the rows; its info is expected to start with an
 *                  SOptrBasicInfo immediately followed by an SAggSupporter
 * @param result    encoded buffer
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_TSC_INVALID_INPUT when the buffer is NULL or malformed,
 *         or when a new result row cannot be obtained.
 */
int32_t aggDecodeResultRow(SOperatorInfo* pOperator, char* result) {
  if (result == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }

  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));

  const int32_t fieldLen = (int32_t)sizeof(int32_t);

  int32_t length = *(int32_t*)(result);
  if (length < 2 * fieldLen) {  // too short to even hold the header
    return TSDB_CODE_TSC_INVALID_INPUT;
  }

  int32_t offset = fieldLen;
  int32_t count = *(int32_t*)(result + offset);
  offset += fieldLen;

  while (count-- > 0 && length > offset) {
    // key length field
    if ((int64_t)offset + fieldLen > length) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    int32_t keyLen = *(int32_t*)(result + offset);
    offset += fieldLen;

    // key bytes + value length field, and the 8 bytes read below as the group id
    if (keyLen < 0 || (int64_t)offset + keyLen + fieldLen > length ||
        (int64_t)offset + (int64_t)sizeof(uint64_t) > length) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // the row payload must have exactly the size this operator works with and fit in the buffer
    int32_t valueLen = *(int32_t*)(result + offset + keyLen);
    if (valueLen != pSup->resultRowSize || (int64_t)offset + keyLen + fieldLen + valueLen > length) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    uint64_t    tableGroupId = *(uint64_t*)(result + offset);
    SResultRow* resultRow = getNewResultRow(pSup->pResultBuf, tableGroupId, pSup->resultRowSize);
    if (!resultRow) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = resultRow->pageId, .offset = resultRow->offset};
    taosHashPut(pSup->pResultRowHashTable, result + offset, keyLen, &pos, sizeof(SResultRowPosition));

    offset += keyLen + fieldLen;

    // the copied row carries the encoder's page position; keep the freshly assigned one
    int32_t pageId = resultRow->pageId;
    int32_t pOffset = resultRow->offset;
    memcpy(resultRow, result + offset, valueLen);
    resultRow->pageId = pageId;
    resultRow->offset = pOffset;
    offset += valueLen;

    initResultRow(resultRow);
    pInfo->resultRowInfo.cur = (SResultRowPosition){.pageId = resultRow->pageId, .offset = resultRow->offset};
  }

  if (offset != length) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  return TSDB_CODE_SUCCESS;
}

3201 3202 3203 3204 3205
/**
 * Apply group offset/limit (slimit) and row offset/limit to one produced block, in place.
 *
 * Steps, in order:
 *  1. skip whole groups while remainGroupOffset > 0;
 *  2. on a group switch, count the finished group, stop if the group limit is reached,
 *     otherwise reset the per-group row counters;
 *  3. drop leading rows for the row offset;
 *  4. truncate the block for the row limit;
 *  5. decide whether the caller may keep accumulating rows in its buffer.
 *
 * @param pOperator     operator whose status is set to OP_EXEC_DONE once the group limit is hit
 * @param pLimitInfo    limit/offset state, updated in place
 * @param pBlock        block to trim; may be emptied
 * @param holdDataInBuf true when the caller is able to accumulate several rounds in pBlock
 * @return PROJECT_RETRIEVE_CONTINUE to fetch more input, PROJECT_RETRIEVE_DONE to return pBlock now.
 */
int32_t handleLimitOffset(SOperatorInfo* pOperator, SLimitInfo* pLimitInfo, SSDataBlock* pBlock, bool holdDataInBuf) {
  if (pLimitInfo->remainGroupOffset > 0) {
    if (pLimitInfo->currentGroupId == 0) {  // it is the first group
      pLimitInfo->currentGroupId = pBlock->info.groupId;
      blockDataCleanup(pBlock);
      return PROJECT_RETRIEVE_CONTINUE;
    }

    if (pLimitInfo->currentGroupId != pBlock->info.groupId) {
      // data of a new group arrived, one more group has been skipped
      pLimitInfo->remainGroupOffset -= 1;

      // still inside the group offset: discard this block as well
      if (pLimitInfo->remainGroupOffset > 0) {
        blockDataCleanup(pBlock);
        return PROJECT_RETRIEVE_CONTINUE;
      }
    }

    // set current group id of the project operator
    pLimitInfo->currentGroupId = pBlock->info.groupId;
  }

  if (pLimitInfo->currentGroupId != 0 && pLimitInfo->currentGroupId != pBlock->info.groupId) {
    pLimitInfo->numOfOutputGroups += 1;
    if ((pLimitInfo->slimit.limit > 0) && (pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups)) {
      pOperator->status = OP_EXEC_DONE;
      blockDataCleanup(pBlock);

      return PROJECT_RETRIEVE_DONE;
    }

    // reset the value for a new group data
    pLimitInfo->numOfOutputRows = 0;
    pLimitInfo->remainOffset = pLimitInfo->limit.offset;
  }

  // here we reach the start position, according to the limit/offset requirements.

  // set current group id
  pLimitInfo->currentGroupId = pBlock->info.groupId;

  if (pLimitInfo->remainOffset >= pBlock->info.rows) {
    // the whole block falls inside the row offset
    pLimitInfo->remainOffset -= pBlock->info.rows;
    blockDataCleanup(pBlock);
    return PROJECT_RETRIEVE_CONTINUE;
  }

  if (pLimitInfo->remainOffset > 0) {
    // only the head of the block falls inside the row offset
    blockDataTrimFirstNRows(pBlock, pLimitInfo->remainOffset);
    pLimitInfo->remainOffset = 0;
  }

  // check for the limitation in each group
  if (pLimitInfo->limit.limit >= 0 && pLimitInfo->numOfOutputRows + pBlock->info.rows >= pLimitInfo->limit.limit) {
    int32_t keepRows = (int32_t)(pLimitInfo->limit.limit - pLimitInfo->numOfOutputRows);
    blockDataKeepFirstNRows(pBlock, keepRows);

    if (pLimitInfo->slimit.limit > 0 && pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups) {
      pOperator->status = OP_EXEC_DONE;
    }

    return PROJECT_RETRIEVE_DONE;
  }

  // todo optimize performance
  // When slimit/soffset are present, results of several rounds can not be packed into one block, since they may
  // belong to different groups and the limit/offset bookkeeping would no longer be valid.
  if (holdDataInBuf && (pBlock->info.rows < pOperator->resultInfo.threshold) && pLimitInfo->slimit.offset == -1 &&
      pLimitInfo->slimit.limit == -1) {
    // not full enough, continue to accumulate the output data in the buffer.
    return PROJECT_RETRIEVE_CONTINUE;
  }

  return PROJECT_RETRIEVE_DONE;
}

3272
/**
 * Produce the next block of the project operator.
 *
 * Pulls blocks from the first downstream, evaluates the projection expressions into the
 * operator's result block, applies limit/offset handling and then the filter, and keeps
 * accumulating until handleLimitOffset() reports PROJECT_RETRIEVE_DONE or the input ends.
 * STREAM_RETRIEVE blocks are passed through untouched. Failures are reported through
 * longjmp(pTaskInfo->env, code).
 *
 * @return the result block, a pass-through STREAM_RETRIEVE block, or NULL when there are no rows.
 */
static SSDataBlock* doProjectOperation(SOperatorInfo* pOperator) {
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
  SOptrBasicInfo*       pInfo = &pProjectInfo->binfo;
  SExprSupp*            pSup = &pOperator->exprSupp;
  SExecTaskInfo*        pTaskInfo = pOperator->pTaskInfo;

  SSDataBlock* pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  if (pOperator->status == OP_EXEC_DONE) {
    // in queue mode the operator is re-armed so that it can be driven again later
    if (pTaskInfo->execModel == OPTR_EXEC_MODEL_QUEUE) {
      pOperator->status = OP_OPENED;
    }
    return NULL;
  }

#if 0
  if (pProjectInfo->existDataBlock) {  // TODO refactor
    SSDataBlock* pBlock = pProjectInfo->existDataBlock;
    pProjectInfo->existDataBlock = NULL;

    // the pDataBlock are always the same one, no need to call this again
    setInputDataBlock(pOperator, pInfo->pCtx, pBlock, TSDB_ORDER_ASC);

    blockDataEnsureCapacity(pInfo->pRes, pBlock->info.rows);
    projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
    if (pRes->info.rows >= pProjectInfo->binfo.capacity * 0.8) {
      copyTsColoum(pRes, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      resetResultRowEntryResult(pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      return pRes;
    }
  }
#endif

  int64_t st = 0;
  int32_t order = 0;
  int32_t scanFlag = 0;

  // the open cost is only measured on the call that finds it still unset
  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];

  for (;;) {
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
    qDebug("projection call next");
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
    if (pBlock == NULL) {
      qDebug("projection get null");
      doSetOperatorCompleted(pOperator);
      break;
    }

    if (pBlock->info.type == STREAM_RETRIEVE) {
      // for stream interval
      return pBlock;
    }

    // the pDataBlock are always the same one, no need to call this again
    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
    blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

    code = projectApplyFunctions(pSup->pExprInfo, pInfo->pRes, pBlock, pSup->pCtx, pSup->numOfExprs,
                                 pProjectInfo->pPseudoColInfo);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    int32_t status = handleLimitOffset(pOperator, &pProjectInfo->limitInfo, pInfo->pRes, true);

    // filter shall be applied after apply functions and limit/offset on the result
    doFilter(pProjectInfo->pFilterNode, pInfo->pRes);

    if (status == PROJECT_RETRIEVE_DONE) {
      break;
    }
    // PROJECT_RETRIEVE_CONTINUE (or anything else): fetch the next block
  }

  size_t rows = pInfo->pRes->info.rows;
  pProjectInfo->limitInfo.numOfOutputRows += rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
  }

  if (rows > 0) {
    return pInfo->pRes;
  }
  return NULL;
}

H
Haojun Liao 已提交
3375
static void doHandleRemainBlockForNewGroupImpl(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo,
L
Liu Jicong 已提交
3376
                                               SExecTaskInfo* pTaskInfo) {
3377
  pInfo->totalInputRows = pInfo->existNewGroupBlock->info.rows;
H
Haojun Liao 已提交
3378

L
Liu Jicong 已提交
3379 3380
  int64_t ekey =
      Q_STATUS_EQUAL(pTaskInfo->status, TASK_COMPLETED) ? pInfo->win.ekey : pInfo->existNewGroupBlock->info.window.ekey;
3381 3382
  taosResetFillInfo(pInfo->pFillInfo, getFillInfoStart(pInfo->pFillInfo));

3383
  taosFillSetStartInfo(pInfo->pFillInfo, pInfo->existNewGroupBlock->info.rows, ekey);
3384 3385
  taosFillSetInputDataBlock(pInfo->pFillInfo, pInfo->existNewGroupBlock);

H
Haojun Liao 已提交
3386 3387 3388
  int32_t numOfResultRows = pResultInfo->capacity - pInfo->pRes->info.rows;
  taosFillResultDataBlock(pInfo->pFillInfo, pInfo->pRes, numOfResultRows);

3389
  pInfo->curGroupId = pInfo->existNewGroupBlock->info.groupId;
3390 3391 3392
  pInfo->existNewGroupBlock = NULL;
}

H
Haojun Liao 已提交
3393
static void doHandleRemainBlockFromNewGroup(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo,
L
Liu Jicong 已提交
3394
                                            SExecTaskInfo* pTaskInfo) {
3395
  if (taosFillHasMoreResults(pInfo->pFillInfo)) {
H
Haojun Liao 已提交
3396 3397 3398
    int32_t numOfResultRows = pResultInfo->capacity - pInfo->pRes->info.rows;
    taosFillResultDataBlock(pInfo->pFillInfo, pInfo->pRes, numOfResultRows);
    if (pInfo->pRes->info.rows > pResultInfo->threshold) {
3399 3400 3401 3402 3403 3404
      return;
    }
  }

  // handle the cached new group data block
  if (pInfo->existNewGroupBlock) {
H
Haojun Liao 已提交
3405
    doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, pTaskInfo);
3406 3407 3408
  }
}

S
slzhou 已提交
3409
/**
 * Produce the next (unfiltered) block of fill results.
 *
 * Pending output of the previous call is emitted first. Afterwards blocks are pulled from the
 * first downstream: blocks of the current group are fed to the fill state, while the first
 * block of a different group is cached in pInfo->existNewGroupBlock and the current group is
 * closed. Results of different groups are never mixed in one returned block.
 *
 * @return pInfo->pRes when it holds rows to return, NULL when nothing more can be produced.
 */
static SSDataBlock* doFillImpl(SOperatorInfo* pOperator) {
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;
  SResultInfo*       pResultInfo = &pOperator->resultInfo;
  SSDataBlock*       pResBlock = pInfo->pRes;

  blockDataCleanup(pResBlock);

  doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, pTaskInfo);
  if (pResBlock->info.rows > 0 || pResBlock->info.rows > pResultInfo->threshold) {
    return pResBlock;
  }

  SOperatorInfo* pDownstream = pOperator->pDownstream[0];
  for (;;) {
    SSDataBlock* pBlock = pDownstream->fpSet.getNextFn(pDownstream);

    if (pBlock == NULL) {
      // input exhausted: nothing was ever read, or the last group has to be closed
      if (pInfo->totalInputRows == 0) {
        pOperator->status = OP_EXEC_DONE;
        return NULL;
      }

      taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
    } else {
      blockDataUpdateTsWindow(pBlock, pInfo->primaryTsCol);

      if (pInfo->curGroupId == 0 || pInfo->curGroupId == pBlock->info.groupId) {
        // the first data block, or more data of the current group
        pInfo->curGroupId = pBlock->info.groupId;
        pInfo->totalInputRows += pBlock->info.rows;

        taosFillSetStartInfo(pInfo->pFillInfo, pBlock->info.rows, pBlock->info.window.ekey);
        taosFillSetInputDataBlock(pInfo->pFillInfo, pBlock);
      } else {
        // the new group data block: cache it for later
        pInfo->existNewGroupBlock = pBlock;

        // Fill the previous group data block, before handle the data block of new group.
        // Close the fill operation for previous group data block
        taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
      }
    }

    blockDataEnsureCapacity(pResBlock, pOperator->resultInfo.capacity);

    int32_t numOfResultRows = pOperator->resultInfo.capacity - pResBlock->info.rows;
    taosFillResultDataBlock(pInfo->pFillInfo, pResBlock, numOfResultRows);

    if (!(pResBlock->info.rows > 0)) {
      // current group has no more result to return
      if (!pInfo->existNewGroupBlock) {
        return NULL;
      }

      // try next group
      assert(pBlock != NULL);
      doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, pTaskInfo);
      if (pResBlock->info.rows > pResultInfo->threshold) {
        return pResBlock;
      }
      continue;
    }

    // 1. The result in current group not reach the threshold of output result, continue
    // 2. If multiple group results existing in one SSDataBlock is not allowed, return immediately
    if (pResBlock->info.rows > pResultInfo->threshold || pBlock == NULL || pInfo->existNewGroupBlock != NULL) {
      return pResBlock;
    }

    doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, pTaskInfo);
    if (pResBlock->info.rows >= pOperator->resultInfo.threshold || pBlock == NULL) {
      return pResBlock;
    }
  }
}

S
slzhou 已提交
3481 3482 3483 3484 3485 3486 3487 3488
/**
 * Produce the next filtered block of the fill operator.
 *
 * Calls doFillImpl() until it returns a block that still has rows after the operator's
 * condition was applied, or until it returns NULL, in which case the operator is marked
 * completed.
 *
 * @return a block with at least one row, or NULL when the operator is finished.
 */
static SSDataBlock* doFill(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SFillOperatorInfo* pInfo = pOperator->info;

  for (;;) {
    SSDataBlock* pFilled = doFillImpl(pOperator);
    if (pFilled == NULL) {
      doSetOperatorCompleted(pOperator);
      return NULL;
    }

    doFilter(pInfo->pCondition, pFilled);

    if (pFilled->info.rows > 0) {
      size_t rows = pFilled->info.rows;
      pOperator->resultInfo.totalRows += rows;
      return pFilled;
    }
    // every row was filtered out: try the next batch
  }
}

H
Haojun Liao 已提交
3514 3515 3516
/**
 * Release the memory owned by each entry of an expression array: the column descriptor of
 * every column-typed parameter, the parameter array and the expression node.
 * The array itself (pExpr) is not freed here.
 */
static void destroyExprInfo(SExprInfo* pExpr, int32_t numOfExprs) {
  for (SExprInfo* pOne = pExpr; pOne < pExpr + numOfExprs; ++pOne) {
    int32_t k = 0;
    while (k < pOne->base.numOfParams) {
      if (pOne->base.pParam[k].type == FUNC_PARAM_TYPE_COLUMN) {
        taosMemoryFreeClear(pOne->base.pParam[k].pCol);
      }
      k += 1;
    }

    taosMemoryFree(pOne->base.pParam);
    taosMemoryFree(pOne->pExpr);
  }
}

3528 3529 3530 3531 3532
/**
 * Destroy an operator together with its whole downstream tree.
 *
 * Order: the operator's own closeFn (if any), then every downstream operator recursively,
 * then the expression support data, and finally the operator object itself. NULL is accepted.
 */
static void destroyOperatorInfo(SOperatorInfo* pOperator) {
  if (pOperator == NULL) {
    return;
  }

  if (pOperator->fpSet.closeFn != NULL) {
    pOperator->fpSet.closeFn(pOperator->info, pOperator->exprSupp.numOfExprs);
  }

  if (pOperator->pDownstream != NULL) {
    int32_t child = 0;
    while (child < pOperator->numOfDownstream) {
      destroyOperatorInfo(pOperator->pDownstream[child]);
      child += 1;
    }

    taosMemoryFreeClear(pOperator->pDownstream);
    pOperator->numOfDownstream = 0;
  }

  cleanupExprSupp(&pOperator->exprSupp);
  taosMemoryFreeClear(pOperator);
}

3550 3551 3552 3553 3554 3555 3556 3557 3558 3559 3560 3561 3562 3563 3564
/**
 * Choose the page size and total buffer size for a paged result buffer.
 *
 * The page size is the smallest power-of-two multiple of 4096 that holds at least four rows;
 * the buffer size is at least 4096 * 256 bytes and always holds at least four pages.
 *
 * The size arithmetic is done in 64 bits: the former mixed signed/unsigned 32-bit comparison
 * never terminated for a negative rowSize (or one whose fourfold exceeds 2^31), because the
 * page size wrapped around to 0.
 *
 * @param rowSize      size of one result row in bytes; values <= 0 select the minimum page size
 * @param defaultPgsz  [out] page size in bytes
 * @param defaultBufsz [out] buffer size in bytes
 * @return 0 on success; -1 when the required sizes do not fit in 32 bits, in which case both
 *         outputs are set to 0.
 */
int32_t getBufferPgSize(int32_t rowSize, uint32_t* defaultPgsz, uint32_t* defaultBufsz) {
  const uint64_t minPageSize = 4096;
  const uint64_t minBufSize = 4096 * 256;
  const uint64_t pagesInBuf = 4;

  // room for four rows per page; widen before multiplying so that it cannot overflow
  const uint64_t required = (rowSize > 0) ? ((uint64_t)rowSize) * 4 : 0;

  uint64_t pageSize = minPageSize;
  while (pageSize < required) {
    pageSize <<= 1u;
  }

  // at least four pages need to be in buffer
  uint64_t bufSize = minBufSize;
  if (bufSize < pageSize * pagesInBuf) {
    bufSize = pageSize * pagesInBuf;
  }

  if (bufSize > UINT32_MAX) {
    *defaultPgsz = 0;
    *defaultBufsz = 0;
    return -1;
  }

  *defaultPgsz = (uint32_t)pageSize;
  *defaultBufsz = (uint32_t)bufSize;
  return 0;
}

dengyihao's avatar
dengyihao 已提交
3565 3566
/**
 * Initialize the aggregate support structure: result row size, key buffer, the hash table
 * that maps keys to result row positions, and the disk-based buffer holding the result rows.
 *
 * @param pAggSup     structure to initialize
 * @param pCtx        function contexts used to compute the result row size
 * @param numOfOutput number of entries in pCtx
 * @param keyBufSize  payload size of the key buffer (extra room for a pointer and an int64 is added)
 * @param pKey        identifier passed on to the disk-based buffer
 * @return TSDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY, or the error of createDiskbasedBuf().
 *         Nothing is released here on failure.
 */
int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                         const char* pKey) {
  pAggSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pAggSup->keyBuf = taosMemoryCalloc(1, keyBufSize + POINTER_BYTES + sizeof(int64_t));
  pAggSup->pResultRowHashTable =
      taosHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), true, HASH_NO_LOCK);

  if (pAggSup->pResultRowHashTable == NULL || pAggSup->keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // size the paged buffer according to the size of one result row
  uint32_t pageSize = 0;
  uint32_t bufSize = 0;
  getBufferPgSize(pAggSup->resultRowSize, &pageSize, &bufSize);

  return createDiskbasedBuf(&pAggSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
}

3589
/**
 * Release what doInitAggInfoSup() set up: the disk-based result buffer, the result row hash
 * table and the key buffer. The structure itself is not freed.
 */
void cleanupAggSup(SAggSupporter* pAggSup) {
  destroyDiskbasedBuf(pAggSup->pResultBuf);
  taosHashCleanup(pAggSup->pResultRowHashTable);
  taosMemoryFreeClear(pAggSup->keyBuf);
}

L
Liu Jicong 已提交
3595 3596
/**
 * Initialize the expression support and the aggregate support of an operator, and attach the
 * aggregate result buffer to every function context.
 *
 * @param pSup       expression support to initialize
 * @param pAggSup    aggregate support to initialize
 * @param pExprInfo  expression array, stored in pSup
 * @param numOfCols  number of expressions
 * @param keyBufSize payload size of the key buffer
 * @param pkey       identifier passed on to the result buffer
 * @return TSDB_CODE_SUCCESS, or the error reported by initExprSupp() / doInitAggInfoSup().
 *         Nothing is released here on failure.
 */
int32_t initAggInfo(SExprSupp* pSup, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols, size_t keyBufSize,
                    const char* pkey) {
  int32_t code = initExprSupp(pSup, pExprInfo, numOfCols);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  // do not hand out a result buffer that failed to initialize
  code = doInitAggInfoSup(pAggSup, pSup->pCtx, numOfCols, keyBufSize, pkey);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    pSup->pCtx[i].pBuf = pAggSup->pResultBuf;
  }

  return TSDB_CODE_SUCCESS;
}

3610
/**
 * Set the result capacity of an operator and derive its output threshold (75% of the
 * capacity, falling back to the capacity itself when that rounds down to 0).
 *
 * @param numOfRows capacity in rows; must not be 0
 */
void initResultSizeInfo(SOperatorInfo* pOperator, int32_t numOfRows) {
  ASSERT(numOfRows != 0);

  SResultInfo* pResInfo = &pOperator->resultInfo;
  pResInfo->capacity = numOfRows;
  pResInfo->threshold = numOfRows * 0.75;

  if (pResInfo->threshold == 0) {
    pResInfo->threshold = numOfRows;
  }
}

3620 3621 3622 3623 3624
/**
 * Initialize the basic operator info: reset the result row bookkeeping and attach the block
 * that receives the operator's output. The block pointer is stored as is, not copied.
 */
void initBasicInfo(SOptrBasicInfo* pInfo, SSDataBlock* pBlock) {
  initResultRowInfo(&pInfo->resultRowInfo);
  pInfo->pRes = pBlock;
}

3625 3626 3627 3628 3629 3630 3631 3632 3633 3634 3635 3636 3637 3638 3639 3640 3641 3642 3643
// Destroy an array of numOfOutput function contexts: the parameter variants, the subsidiary context array and
// the input buffers of every entry, followed by the array itself.
// Accepts NULL. Always returns NULL so the caller can reset its pointer in the same statement.
static void* destroySqlFunctionCtx(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  if (pCtx != NULL) {
    for (int32_t idx = 0; idx < numOfOutput; ++idx) {
      SqlFunctionCtx* pOne = &pCtx[idx];

      for (int32_t k = 0; k < pOne->numOfParams; ++k) {
        taosVariantDestroy(&pOne->param[k].param);
      }

      taosMemoryFreeClear(pOne->subsidiaries.pCtx);
      taosMemoryFree(pOne->input.pData);
      taosMemoryFree(pOne->input.pColumnDataAgg);
    }

    taosMemoryFreeClear(pCtx);
  }

  return NULL;
}

3644
// Attach an expression list to pSup and, when the list is not NULL, build the matching function contexts.
// Returns TSDB_CODE_OUT_OF_MEMORY if the contexts cannot be created, TSDB_CODE_SUCCESS otherwise.
// pSup->pExprInfo and pSup->numOfExprs are set before any failure can occur.
int32_t initExprSupp(SExprSupp* pSup, SExprInfo* pExprInfo, int32_t numOfExpr) {
  pSup->pExprInfo = pExprInfo;
  pSup->numOfExprs = numOfExpr;

  // nothing to evaluate: no function context is needed
  if (pSup->pExprInfo == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  pSup->pCtx = createSqlFunctionCtx(pExprInfo, numOfExpr, &pSup->rowEntryInfoOffset);
  return (pSup->pCtx == NULL) ? TSDB_CODE_OUT_OF_MEMORY : TSDB_CODE_SUCCESS;
}

3657 3658 3659 3660 3661 3662 3663 3664 3665 3666
// Release everything owned by an expression support: the function contexts, the expression info array and the
// row-entry offset table. The SExprSupp structure itself is not freed.
// All owned pointers are reset to NULL so the structure does not keep references to released memory.
void cleanupExprSupp(SExprSupp* pSupp) {
  // destroySqlFunctionCtx() always returns NULL, which clears the stale context pointer
  pSupp->pCtx = destroySqlFunctionCtx(pSupp->pCtx, pSupp->numOfExprs);

  if (pSupp->pExprInfo != NULL) {
    destroyExprInfo(pSupp->pExprInfo, pSupp->numOfExprs);
  }

  taosMemoryFreeClear(pSupp->pExprInfo);
  taosMemoryFreeClear(pSupp->rowEntryInfoOffset);
}

L
Liu Jicong 已提交
3667
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
S
slzhou 已提交
3668
                                           SSDataBlock* pResultBlock, SNode* pCondition, SExprInfo* pScalarExprInfo,
wmmhello's avatar
wmmhello 已提交
3669
                                           int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3670
  SAggOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SAggOperatorInfo));
L
Liu Jicong 已提交
3671
  SOperatorInfo*    pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3672 3673 3674
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
H
Haojun Liao 已提交
3675

3676
  int32_t numOfRows = 1024;
dengyihao's avatar
dengyihao 已提交
3677
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3678 3679

  initResultSizeInfo(pOperator, numOfRows);
3680
  int32_t code = initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
L
Liu Jicong 已提交
3681
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3682 3683
    goto _error;
  }
H
Haojun Liao 已提交
3684

3685
  initBasicInfo(&pInfo->binfo, pResultBlock);
3686 3687 3688 3689
  code = initExprSupp(&pInfo->scalarExprSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3690

L
Liu Jicong 已提交
3691
  pInfo->groupId = INT32_MIN;
S
slzhou 已提交
3692
  pInfo->pCondition = pCondition;
dengyihao's avatar
dengyihao 已提交
3693
  pOperator->name = "TableAggregate";
3694
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_HASH_AGG;
3695
  pOperator->blocking = true;
dengyihao's avatar
dengyihao 已提交
3696 3697 3698
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3699

3700 3701
  pOperator->fpSet = createOperatorFpSet(doOpenAggregateOptr, getAggregateResult, NULL, NULL, destroyAggOperatorInfo,
                                         aggEncodeResultRow, aggDecodeResultRow, NULL);
H
Haojun Liao 已提交
3702 3703 3704 3705 3706

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3707 3708

  return pOperator;
L
Liu Jicong 已提交
3709
_error:
H
Haojun Liao 已提交
3710
  destroyAggOperatorInfo(pInfo, numOfCols);
wafwerar's avatar
wafwerar 已提交
3711 3712
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
H
Haojun Liao 已提交
3713 3714
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3715 3716
}

3717
// Release what a basic operator info owns: the result-row bookkeeping and the result data block.
// pInfo must not be NULL; pInfo->pRes is overwritten with the value returned by blockDataDestroy().
void cleanupBasicInfo(SOptrBasicInfo* pInfo) {
  assert(pInfo != NULL);

  SSDataBlock* pBlock = pInfo->pRes;

  cleanupResultRowInfo(&pInfo->resultRowInfo);
  pInfo->pRes = blockDataDestroy(pBlock);
}

H
Haojun Liao 已提交
3723
void destroyBasicOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3724
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)param;
3725
  cleanupBasicInfo(pInfo);
L
Liu Jicong 已提交
3726

D
dapan1121 已提交
3727
  taosMemoryFreeClear(param);
3728
}
H
Haojun Liao 已提交
3729

H
Haojun Liao 已提交
3730 3731 3732 3733 3734 3735 3736 3737

// Element destructor for containers that store heap pointers: pItem points at the stored pointer, which is
// freed and cleared when it is not NULL.
static void freeItem(void* pItem) {
  void** ppSlot = pItem;
  if (*ppSlot == NULL) {
    return;
  }

  taosMemoryFreeClear(*ppSlot);
}

H
Haojun Liao 已提交
3738
void destroyAggOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3739
  SAggOperatorInfo* pInfo = (SAggOperatorInfo*)param;
L
Liu Jicong 已提交
3740 3741
  cleanupBasicInfo(&pInfo->binfo);

H
Haojun Liao 已提交
3742
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3743
  cleanupGroupResInfo(&pInfo->groupResInfo);
D
dapan1121 已提交
3744
  taosMemoryFreeClear(param);
3745
}
3746

H
Haojun Liao 已提交
3747
void destroySFillOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3748
  SFillOperatorInfo* pInfo = (SFillOperatorInfo*)param;
3749
  pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
H
Haojun Liao 已提交
3750
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
wafwerar's avatar
wafwerar 已提交
3751
  taosMemoryFreeClear(pInfo->p);
L
Liu Jicong 已提交
3752

D
dapan1121 已提交
3753
  taosMemoryFreeClear(param);
3754 3755
}

H
Haojun Liao 已提交
3756
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput) {
D
fix bug  
dapan 已提交
3757 3758 3759
  if (NULL == param) {
    return;
  }
L
Liu Jicong 已提交
3760
  SProjectOperatorInfo* pInfo = (SProjectOperatorInfo*)param;
3761
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3762
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3763
  taosArrayDestroy(pInfo->pPseudoColInfo);
L
Liu Jicong 已提交
3764

D
dapan1121 已提交
3765
  taosMemoryFreeClear(param);
3766 3767
}

H
Haojun Liao 已提交
3768
static void destroyIndefinitOperatorInfo(void* param, int32_t numOfOutput) {
3769
  SIndefOperatorInfo* pInfo = (SIndefOperatorInfo*)param;
3770
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3771 3772 3773

  taosArrayDestroy(pInfo->pPseudoColInfo);
  cleanupAggSup(&pInfo->aggSup);
3774
  cleanupExprSupp(&pInfo->scalarSup);
L
Liu Jicong 已提交
3775

D
dapan1121 已提交
3776
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3777 3778
}

H
Haojun Liao 已提交
3779
void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3780
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3781 3782 3783 3784
  taosRemoveRef(exchangeObjRefPool, pExInfo->self);
}

void doDestroyExchangeOperatorInfo(void* param) {
X
Xiaoyu Wang 已提交
3785
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3786

H
Haojun Liao 已提交
3787 3788 3789
  taosArrayDestroy(pExInfo->pSources);
  taosArrayDestroy(pExInfo->pSourceDataInfo);
  if (pExInfo->pResult != NULL) {
H
Haojun Liao 已提交
3790
    pExInfo->pResult = blockDataDestroy(pExInfo->pResult);
H
Haojun Liao 已提交
3791 3792 3793
  }

  tsem_destroy(&pExInfo->ready);
L
Liu Jicong 已提交
3794

D
dapan1121 已提交
3795
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3796 3797
}

H
Haojun Liao 已提交
3798 3799
// Collect the indexes (int32_t) of all function contexts whose function is a pseudo-column function.
// Returns the new list, owned by the caller, or NULL when the list cannot be allocated or extended.
static SArray* setRowTsColumnOutputInfo(SqlFunctionCtx* pCtx, int32_t numOfCols) {
  SArray* pList = taosArrayInit(4, sizeof(int32_t));
  if (pList == NULL) {
    return NULL;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    if (!fmIsPseudoColumnFunc(pCtx[i].functionId)) {
      continue;
    }

    // a silently dropped index would make the caller skip a pseudo column, so treat it as a failure
    if (taosArrayPush(pList, &i) == NULL) {
      taosArrayDestroy(pList);
      return NULL;
    }
  }

  return pList;
}

L
Liu Jicong 已提交
3809
SOperatorInfo* createProjectOperatorInfo(SOperatorInfo* downstream, SProjectPhysiNode* pProjPhyNode,
dengyihao's avatar
dengyihao 已提交
3810
                                         SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3811
  SProjectOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SProjectOperatorInfo));
L
Liu Jicong 已提交
3812
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3813 3814 3815
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
3816

L
Liu Jicong 已提交
3817
  int32_t    numOfCols = 0;
3818 3819 3820
  SExprInfo* pExprInfo = createExprInfo(pProjPhyNode->pProjections, NULL, &numOfCols);

  SSDataBlock* pResBlock = createResDataBlock(pProjPhyNode->node.pOutputDataBlockDesc);
3821
  initLimitInfo(pProjPhyNode->node.pLimit, pProjPhyNode->node.pSlimit, &pInfo->limitInfo);
3822

H
Haojun Liao 已提交
3823
  pInfo->binfo.pRes = pResBlock;
3824
  pInfo->pFilterNode = pProjPhyNode->node.pConditions;
H
Haojun Liao 已提交
3825 3826

  int32_t numOfRows = 4096;
dengyihao's avatar
dengyihao 已提交
3827
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3828

3829 3830 3831 3832 3833
  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
3834
  initResultSizeInfo(pOperator, numOfRows);
3835

3836 3837
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);
3838
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfCols);
3839

3840
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pOperator->exprSupp.pCtx, numOfCols);
X
Xiaoyu Wang 已提交
3841
  pOperator->name = "ProjectOperator";
H
Haojun Liao 已提交
3842
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
X
Xiaoyu Wang 已提交
3843 3844 3845 3846
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
3847

L
Liu Jicong 已提交
3848 3849
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doProjectOperation, NULL, NULL,
                                         destroyProjectOperatorInfo, NULL, NULL, NULL);
L
Liu Jicong 已提交
3850

3851
  int32_t code = appendDownstream(pOperator, &downstream, 1);
H
Haojun Liao 已提交
3852
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3853 3854
    goto _error;
  }
3855 3856

  return pOperator;
H
Haojun Liao 已提交
3857

L
Liu Jicong 已提交
3858
_error:
H
Haojun Liao 已提交
3859 3860
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3861 3862
}

3863 3864
// Apply the indefinite-rows functions of pOperator to one input block and append the output to the operator's
// result block. Optional scalar expressions are evaluated on the input block first (in place).
// Any failure is reported by a longjmp to pTaskInfo->env with the error code.
static void doHandleDataBlock(SOperatorInfo* pOperator, SSDataBlock* pBlock, SOperatorInfo* downstream,
                              SExecTaskInfo* pTaskInfo) {
  SIndefOperatorInfo* pIndef = pOperator->info;
  SOptrBasicInfo*     pBasic = &pIndef->binfo;
  SExprSupp*          pExprSup = &pOperator->exprSupp;
  SExprSupp*          pScalar = &pIndef->scalarSup;

  // the scan order and scan flag come from the downstream table scan
  int32_t order = 0;
  int32_t scanFlag = 0;
  int32_t code = getTableScanInfo(downstream, &order, &scanFlag);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }

  // scalar expressions, if any, must be calculated before the functions are applied
  if (pScalar->pExprInfo != NULL) {
    code = projectApplyFunctions(pScalar->pExprInfo, pBlock, pBlock, pScalar->pCtx, pScalar->numOfExprs,
                                 pIndef->pPseudoColInfo);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
  }

  setInputDataBlock(pOperator, pExprSup->pCtx, pBlock, order, scanFlag, false);

  // make room for the rows already buffered plus the rows of the incoming block
  blockDataEnsureCapacity(pBasic->pRes, pBasic->pRes->info.rows + pBlock->info.rows);

  code = projectApplyFunctions(pExprSup->pExprInfo, pBasic->pRes, pBlock, pExprSup->pCtx, pExprSup->numOfExprs,
                               pIndef->pPseudoColInfo);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, code);
  }
}

H
Haojun Liao 已提交
3898 3899
// getNext function of the indefinite-rows function operator.
//
// Pulls blocks from the downstream operator, applies the functions and accumulates the output until the result
// block reaches the operator threshold, the group id changes, or the downstream is exhausted. The operator
// condition is then applied to the accumulated rows.
//
// If the condition removes every row while the downstream still has data, the loop continues with the next
// input. Returning NULL at that point would signal "no more data" to the caller and lose the remaining rows.
// (The former exit test `rows >= 0` on a size_t was always true and did exactly that.)
//
// Returns the result block when it holds at least one row, NULL otherwise.
static SSDataBlock* doApplyIndefinitFunction(SOperatorInfo* pOperator) {
  SIndefOperatorInfo* pIndefInfo = pOperator->info;
  SOptrBasicInfo*     pInfo = &pIndefInfo->binfo;
  SExprSupp*          pSup = &pOperator->exprSupp;

  SSDataBlock* pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  int64_t st = 0;

  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];
  bool           exhausted = false;  // set once the downstream returned NULL in this call

  while (1) {
    // here we need to handle the existing group results
    if (pIndefInfo->pNextGroupRes != NULL) {  // todo extract method
      for (int32_t k = 0; k < pSup->numOfExprs; ++k) {
        SqlFunctionCtx* pCtx = &pSup->pCtx[k];

        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);
        pResInfo->initialized = false;
        pCtx->pOutput = NULL;
      }

      doHandleDataBlock(pOperator, pIndefInfo->pNextGroupRes, downstream, pTaskInfo);
      pIndefInfo->pNextGroupRes = NULL;
    }

    if (pInfo->pRes->info.rows < pOperator->resultInfo.threshold) {
      while (1) {
        // The downstream exec may change the value of the newgroup, so use a local variable instead.
        SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
        if (pBlock == NULL) {
          doSetOperatorCompleted(pOperator);
          exhausted = true;
          break;
        }

        if (pIndefInfo->groupId == 0 && pBlock->info.groupId != 0) {
          pIndefInfo->groupId = pBlock->info.groupId;  // this is the initial group result
        } else {
          if (pIndefInfo->groupId != pBlock->info.groupId) {  // reset output buffer and computing status
            pIndefInfo->groupId = pBlock->info.groupId;
            pIndefInfo->pNextGroupRes = pBlock;
            break;
          }
        }

        doHandleDataBlock(pOperator, pBlock, downstream, pTaskInfo);
        if (pInfo->pRes->info.rows >= pOperator->resultInfo.threshold) {
          break;
        }
      }
    }

    doFilter(pIndefInfo->pCondition, pInfo->pRes);
    if (pInfo->pRes->info.rows > 0 || exhausted) {
      break;
    }

    // everything was filtered out but more input is available: start over with a clean result block
    blockDataCleanup(pInfo->pRes);
  }

  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
  }

  return (rows > 0) ? pInfo->pRes : NULL;
}

3977 3978
// Create the indefinite-rows function operator ("IndefinitOperator") for the given physical plan node on top of
// `downstream`.
//
// The output capacity starts at 4096 rows and is reduced so that one result block stays within 2MB.
// Returns the new operator, or NULL on failure with pTaskInfo->code set to the error that caused it. On failure
// everything allocated here is released again.
SOperatorInfo* createIndefinitOutputOperatorInfo(SOperatorInfo* downstream, SPhysiNode* pNode,
                                                 SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;

  SIndefOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SIndefOperatorInfo));
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    // nothing has been attached yet, plain frees are sufficient
    taosMemoryFreeClear(pInfo);
    taosMemoryFreeClear(pOperator);
    pTaskInfo->code = code;
    return NULL;
  }

  SExprSupp* pSup = &pOperator->exprSupp;

  SIndefRowsFuncPhysiNode* pPhyNode = (SIndefRowsFuncPhysiNode*)pNode;

  // Set up the optional scalar expressions before anything else is allocated: initExprSupp() records pSExpr in
  // pInfo->scalarSup before it can fail, so the error path is able to release it.
  if (pPhyNode->pExprs != NULL) {
    int32_t    num = 0;
    SExprInfo* pSExpr = createExprInfo(pPhyNode->pExprs, NULL, &num);
    code = initExprSupp(&pInfo->scalarSup, pSExpr, num);
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
  }

  int32_t    numOfExpr = 0;
  SExprInfo* pExprInfo = createExprInfo(pPhyNode->pFuncs, NULL, &numOfExpr);

  SSDataBlock* pResBlock = createResDataBlock(pPhyNode->node.pOutputDataBlockDesc);

  int32_t numOfRows = 4096;
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;

  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }

  initResultSizeInfo(pOperator, numOfRows);

  // hand the result block over to pInfo before the fallible steps, so that it is released on failure
  initBasicInfo(&pInfo->binfo, pResBlock);

  // initExprSupp() (called first inside initAggInfo) records pExprInfo in pSup before it can fail
  code = initAggInfo(pSup, &pInfo->aggSup, pExprInfo, numOfExpr, keyBufSize, pTaskInfo->id.str);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfExpr);

  pInfo->pCondition = pPhyNode->node.pConditions;
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pSup->pCtx, numOfExpr);
  if (pInfo->pPseudoColInfo == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pOperator->name = "IndefinitOperator";
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC;
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doApplyIndefinitFunction, NULL, NULL,
                                         destroyIndefinitOperatorInfo, NULL, NULL, NULL);

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  // releases the result block, the pseudo column list, the aggregation supporter, the scalar expression support
  // and pInfo itself
  destroyIndefinitOperatorInfo(pInfo, 0);

  // the function expressions and their contexts are owned by the operator's expression support
  cleanupExprSupp(&pOperator->exprSupp);
  taosMemoryFreeClear(pOperator);

  pTaskInfo->code = code;
  return NULL;
}

4047
static int32_t initFillInfo(SFillOperatorInfo* pInfo, SExprInfo* pExpr, int32_t numOfCols, SNodeListNode* pValNode,
L
Liu Jicong 已提交
4048
                            STimeWindow win, int32_t capacity, const char* id, SInterval* pInterval, int32_t fillType) {
4049
  SFillColInfo* pColInfo = createFillColInfo(pExpr, numOfCols, pValNode);
H
Haojun Liao 已提交
4050 4051

  STimeWindow w = TSWINDOW_INITIALIZER;
4052
  getAlignQueryTimeWindow(pInterval, pInterval->precision, win.skey, &w);
4053
  w = getFirstQualifiedTimeWindow(win.skey, &w, pInterval, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
4054 4055

  int32_t order = TSDB_ORDER_ASC;
4056 4057
  pInfo->pFillInfo = taosCreateFillInfo(order, w.skey, 0, capacity, numOfCols, pInterval,
      fillType, pColInfo, pInfo->primaryTsCol, id);
H
Haojun Liao 已提交
4058

4059
  pInfo->win = win;
L
Liu Jicong 已提交
4060
  pInfo->p = taosMemoryCalloc(numOfCols, POINTER_BYTES);
4061

H
Haojun Liao 已提交
4062
  if (pInfo->pFillInfo == NULL || pInfo->p == NULL) {
H
Haojun Liao 已提交
4063 4064
    taosMemoryFree(pInfo->pFillInfo);
    taosMemoryFree(pInfo->p);
H
Haojun Liao 已提交
4065 4066 4067 4068 4069 4070
    return TSDB_CODE_OUT_OF_MEMORY;
  } else {
    return TSDB_CODE_SUCCESS;
  }
}

H
Haojun Liao 已提交
4071
// Create the fill operator ("FillOperator") for the given physical plan node on top of `downstream`.
// The interval definition is taken from the downstream operator, which is read either as a merge-aligned
// interval operator or as a plain interval operator depending on its operator type.
//
// Returns the new operator, or NULL on failure with pTaskInfo->code set to the error that caused it. On failure
// everything allocated here is released again.
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SFillPhysiNode* pPhyFillNode, SExecTaskInfo* pTaskInfo) {
  int32_t      code = TSDB_CODE_OUT_OF_MEMORY;
  int32_t      num = 0;
  bool         fillReady = false;  // true once initFillInfo() succeeded and pInfo owns the fill state
  SSDataBlock* pResBlock = NULL;
  SExprInfo*   pExprInfo = NULL;
  SArray*      pColMatchColInfo = NULL;

  SFillOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SFillOperatorInfo));
  SOperatorInfo*     pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  pResBlock = createResDataBlock(pPhyFillNode->node.pOutputDataBlockDesc);
  pExprInfo = createExprInfo(pPhyFillNode->pTargets, NULL, &num);
  SInterval* pInterval =
      QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == downstream->operatorType
            ? &((SMergeAlignedIntervalAggOperatorInfo*)downstream->info)->intervalAggOperatorInfo->interval
            : &((SIntervalAggOperatorInfo*)downstream->info)->interval;

  int32_t type = convertFillType(pPhyFillNode->mode);

  SResultInfo* pResultInfo = &pOperator->resultInfo;
  initResultSizeInfo(pOperator, 4096);
  pInfo->primaryTsCol = ((SColumnNode*)pPhyFillNode->pWStartTs)->slotId;

  int32_t numOfOutputCols = 0;
  pColMatchColInfo = extractColMatchInfo(pPhyFillNode->pTargets, pPhyFillNode->node.pOutputDataBlockDesc,
                                         &numOfOutputCols, COL_MATCH_FROM_SLOT_ID);

  code = initFillInfo(pInfo, pExprInfo, num, (SNodeListNode*)pPhyFillNode->pValues, pPhyFillNode->timeRange,
                      pResultInfo->capacity, pTaskInfo->id.str, pInterval, type);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
  fillReady = true;

  pInfo->pRes = pResBlock;
  pInfo->pCondition = pPhyFillNode->node.pConditions;
  pInfo->pColMatchColInfo = pColMatchColInfo;
  pOperator->name = "FillOperator";
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_FILL;
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->exprSupp.numOfExprs = num;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet =
      createOperatorFpSet(operatorDummyOpenFn, doFill, NULL, NULL, destroySFillOperatorInfo, NULL, NULL, NULL);

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  // The fill state is touched only after a successful initFillInfo(); on failure initFillInfo() has already
  // released whatever it allocated.
  if (fillReady) {
    pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
    taosMemoryFreeClear(pInfo->p);
  }

  if (pColMatchColInfo != NULL) {
    taosArrayDestroy(pColMatchColInfo);
  }

  if (pResBlock != NULL) {
    blockDataDestroy(pResBlock);
  }

  if (pExprInfo != NULL) {
    destroyExprInfo(pExprInfo, num);
    taosMemoryFree(pExprInfo);
  }

  taosMemoryFreeClear(pOperator);
  taosMemoryFreeClear(pInfo);
  pTaskInfo->code = code;
  return NULL;
}

D
dapan1121 已提交
4126
// Allocate and initialize an execution task descriptor.
//
// queryId/taskId: identifiers; both are rendered into the id string "TID:0x<taskId> QID:0x<queryId>".
// model:          execution model stored in the task.
// dbFName:        database name, copied into the task's schema info; may be NULL.
//
// Returns the new task info, or NULL (with terrno set to TSDB_CODE_OUT_OF_MEMORY) when an allocation fails.
static SExecTaskInfo* createExecTaskInfo(uint64_t queryId, uint64_t taskId, EOPTR_EXEC_MODEL model, char* dbFName) {
  const int32_t idStrLen = 128;

  SExecTaskInfo* pTaskInfo = taosMemoryCalloc(1, sizeof(SExecTaskInfo));
  char*          p = taosMemoryCalloc(1, idStrLen);
  char*          dbname = (dbFName != NULL) ? strdup(dbFName) : NULL;

  if (pTaskInfo == NULL || p == NULL || (dbFName != NULL && dbname == NULL)) {
    taosMemoryFree(dbname);
    taosMemoryFree(p);
    taosMemoryFree(pTaskInfo);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);

  pTaskInfo->schemaInfo.dbname = dbname;
  pTaskInfo->cost.created = taosGetTimestampMs();
  pTaskInfo->id.queryId = queryId;
  pTaskInfo->execModel = model;

  snprintf(p, idStrLen, "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, queryId);
  pTaskInfo->id.str = p;

  return pTaskInfo;
}
H
Haojun Liao 已提交
4141

H
Hongze Cheng 已提交
4142
static STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
H
Haojun Liao 已提交
4143
                                       STableListInfo* pTableListInfo, const char* idstr);
H
Haojun Liao 已提交
4144

H
Haojun Liao 已提交
4145
static SArray* extractColumnInfo(SNodeList* pNodeList);
4146

4147
// Load the table name and a copy of the row schema of table `uid` into pTaskInfo->schemaInfo.
// For a super table the schema and the tag schema version are taken from the table entry itself; for a child
// table they are taken from the entry of its super table; for any other table type only the row schema is
// copied.
//
// Returns TSDB_CODE_SUCCESS, or terrno when a meta lookup fails. No table name is left behind in the schema
// info when the lookup of the super table fails.
int32_t extractTableSchemaInfo(SReadHandle* pHandle, uint64_t uid, SExecTaskInfo* pTaskInfo) {
  SMetaReader mr = {0};
  metaReaderInit(&mr, pHandle->meta, 0);
  int32_t code = metaGetTableEntryByUid(&mr, uid);
  if (code != TSDB_CODE_SUCCESS) {
    metaReaderClear(&mr);
    return terrno;
  }

  pTaskInfo->schemaInfo.tablename = strdup(mr.me.name);

  if (mr.me.type == TSDB_SUPER_TABLE) {
    pTaskInfo->schemaInfo.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pTaskInfo->schemaInfo.tversion = mr.me.stbEntry.schemaTag.version;
  } else if (mr.me.type == TSDB_CHILD_TABLE) {
    tDecoderClear(&mr.coder);

    // the schema of a child table lives in the entry of its super table
    tb_uid_t suid = mr.me.ctbEntry.suid;
    code = metaGetTableEntryByUid(&mr, suid);
    if (code != TSDB_CODE_SUCCESS) {
      // do not clone a schema out of an entry that could not be loaded
      taosMemoryFreeClear(pTaskInfo->schemaInfo.tablename);
      metaReaderClear(&mr);
      return terrno;
    }

    pTaskInfo->schemaInfo.sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pTaskInfo->schemaInfo.tversion = mr.me.stbEntry.schemaTag.version;
  } else {
    pTaskInfo->schemaInfo.sw = tCloneSSchemaWrapper(&mr.me.ntbEntry.schemaRow);
  }

  metaReaderClear(&mr);
  return TSDB_CODE_SUCCESS;
}

4176 4177 4178
// Release the strings and the schema wrapper held by a schema info; the structure itself is not freed.
// The table name is released independently of the schema wrapper: extractTableSchemaInfo() sets the name before
// the wrapper, so a name can exist while `sw` is still NULL.
static void cleanupTableSchemaInfo(SSchemaInfo* pSchemaInfo) {
  taosMemoryFreeClear(pSchemaInfo->dbname);
  taosMemoryFreeClear(pSchemaInfo->tablename);

  if (pSchemaInfo->sw == NULL) {
    return;
  }

  taosMemoryFree(pSchemaInfo->sw->pSchema);
  taosMemoryFreeClear(pSchemaInfo->sw);
}

4187
// Rebuild pTableListInfo->pGroupList as a list of table groups ordered by group id.
//
// For every table in pTableList the group id is looked up in pTableListInfo->map. `sortSupport` keeps the group
// ids seen so far in ascending order; position i of sortSupport corresponds to position i of pGroupList, whose
// elements are arrays of STableKeyInfo.
//
// groupNum is used as the initial capacity of the helper array.
// Returns TDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY or TSDB_CODE_QRY_APP_ERROR. A group array that has not been
// handed over to pGroupList is released on failure.
static int32_t sortTableGroup(STableListInfo* pTableListInfo, int32_t groupNum) {
  taosArrayClear(pTableListInfo->pGroupList);
  SArray* sortSupport = taosArrayInit(groupNum, sizeof(uint64_t));
  if (sortSupport == NULL) return TSDB_CODE_OUT_OF_MEMORY;

  int32_t code = TDB_CODE_SUCCESS;
  SArray* tGroup = NULL;  // group under construction, not yet owned by pGroupList

  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    uint64_t*      groupId = taosHashGet(pTableListInfo->map, &info->uid, sizeof(uint64_t));
    if (groupId == NULL) {
      qError("table group id not found in group map");
      code = TSDB_CODE_QRY_APP_ERROR;
      goto _end;
    }

    int32_t index = taosArraySearchIdx(sortSupport, groupId, compareUint64Val, TD_EQ);
    if (index != -1) {
      // known group: append the table to the existing group array
      SArray* pExisting = (SArray*)taosArrayGetP(pTableListInfo->pGroupList, index);
      if (taosArrayPush(pExisting, info) == NULL) {
        qError("taos push uid array error");
        code = TSDB_CODE_QRY_APP_ERROR;
        goto _end;
      }
      continue;
    }

    // new group: find the first larger group id to keep both arrays sorted
    void* p = taosArraySearch(sortSupport, groupId, compareUint64Val, TD_GT);
    tGroup = taosArrayInit(8, sizeof(STableKeyInfo));
    if (tGroup == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _end;
    }

    if (taosArrayPush(tGroup, info) == NULL) {
      qError("taos push info array error");
      code = TSDB_CODE_QRY_APP_ERROR;
      goto _end;
    }

    if (p == NULL) {
      if (taosArrayPush(sortSupport, groupId) == NULL) {
        qError("taos push support array error");
        code = TSDB_CODE_QRY_APP_ERROR;
        goto _end;
      }
      if (taosArrayPush(pTableListInfo->pGroupList, &tGroup) == NULL) {
        qError("taos push group array error");
        code = TSDB_CODE_QRY_APP_ERROR;
        goto _end;
      }
    } else {
      int32_t pos = TARRAY_ELEM_IDX(sortSupport, p);
      if (taosArrayInsert(sortSupport, pos, groupId) == NULL) {
        qError("taos insert support array error");
        code = TSDB_CODE_QRY_APP_ERROR;
        goto _end;
      }
      if (taosArrayInsert(pTableListInfo->pGroupList, pos, &tGroup) == NULL) {
        qError("taos insert group array error");
        code = TSDB_CODE_QRY_APP_ERROR;
        goto _end;
      }
    }

    tGroup = NULL;  // ownership moved to pGroupList
  }

_end:
  if (tGroup != NULL) {
    taosArrayDestroy(tGroup);
  }
  taosArrayDestroy(sortSupport);
  return code;
}

wmmhello's avatar
wmmhello 已提交
4245 4246
// Compute the group id of every table in pTableListInfo->pTableList from the `group` expressions and store it
// both in the table entry and in pTableListInfo->map (table uid -> group id).
//
// For each table the expressions are cloned, rewritten through doTranslateTagExpr with the table's meta entry,
// and folded to constants. The group key consists of one null flag per expression followed by the values of the
// non-null expressions; calcGroupId() turns the key into the group id.
//
// Nothing is done when `group` is NULL. When needSortTableByGroupId is set, the tables are additionally
// arranged into sorted groups by sortTableGroup().
// Returns TDB_CODE_SUCCESS or an error code (out of memory, failed meta lookup, failed constant folding, or
// TSDB_CODE_QRY_JSON_IN_GROUP_ERROR for a JSON value rejected by the tTagIsJson() check).
int32_t generateGroupIdMap(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group) {
  if (group == NULL) {
    return TDB_CODE_SUCCESS;
  }

  pTableListInfo->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pTableListInfo->map == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  int32_t keyLen = 0;
  void*   keyBuf = NULL;

  SNode* node;
  FOREACH(node, group) {
    SExprNode* pExpr = (SExprNode*)node;
    keyLen += pExpr->resType.bytes;
  }

  // one null flag per group expression precedes the values
  int32_t nullFlagSize = sizeof(int8_t) * LIST_LENGTH(group);
  keyLen += nullFlagSize;

  keyBuf = taosMemoryCalloc(1, keyLen);
  if (keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t groupNum = 0;
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    SMetaReader    mr = {0};
    metaReaderInit(&mr, pHandle->meta, 0);

    // the expressions are evaluated against this entry; do not continue with an entry that failed to load
    if (metaGetTableEntryByUid(&mr, info->uid) != TSDB_CODE_SUCCESS) {
      taosMemoryFree(keyBuf);
      metaReaderClear(&mr);
      return (terrno != TSDB_CODE_SUCCESS) ? terrno : TSDB_CODE_QRY_APP_ERROR;
    }

    SNodeList* groupNew = nodesCloneList(group);
    if (groupNew == NULL) {
      taosMemoryFree(keyBuf);
      metaReaderClear(&mr);
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    nodesRewriteExprsPostOrder(groupNew, doTranslateTagExpr, &mr);
    char* isNull = (char*)keyBuf;
    char* pStart = (char*)keyBuf + nullFlagSize;

    SNode*  pNode;
    int32_t index = 0;
    FOREACH(pNode, groupNew) {
      SNode*  pNew = NULL;
      int32_t code = scalarCalculateConstants(pNode, &pNew);
      if (TSDB_CODE_SUCCESS == code) {
        REPLACE_NODE(pNew);
      } else {
        taosMemoryFree(keyBuf);
        nodesClearList(groupNew);
        metaReaderClear(&mr);
        return code;
      }

      ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
      SValueNode* pValue = (SValueNode*)pNew;

      if (pValue->node.resType.type == TSDB_DATA_TYPE_NULL || pValue->isNull) {
        // a null value contributes only its flag to the key
        isNull[index++] = 1;
        continue;
      } else {
        isNull[index++] = 0;
        char* data = nodesGetValueFromNode(pValue);
        if (pValue->node.resType.type == TSDB_DATA_TYPE_JSON) {
          if (tTagIsJson(data)) {
            terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
            taosMemoryFree(keyBuf);
            nodesClearList(groupNew);
            metaReaderClear(&mr);
            return terrno;
          }
          int32_t len = getJsonValueLen(data);
          memcpy(pStart, data, len);
          pStart += len;
        } else if (IS_VAR_DATA_TYPE(pValue->node.resType.type)) {
          memcpy(pStart, data, varDataTLen(data));
          pStart += varDataTLen(data);
        } else {
          memcpy(pStart, data, pValue->node.resType.bytes);
          pStart += pValue->node.resType.bytes;
        }
      }
    }

    int32_t  len = (int32_t)(pStart - (char*)keyBuf);
    uint64_t groupId = calcGroupId(keyBuf, len);
    taosHashPut(pTableListInfo->map, &(info->uid), sizeof(uint64_t), &groupId, sizeof(uint64_t));
    info->groupId = groupId;
    groupNum++;

    nodesClearList(groupNew);
    metaReaderClear(&mr);
  }
  taosMemoryFree(keyBuf);

  if (pTableListInfo->needSortTableByGroupId) {
    return sortTableGroup(pTableListInfo, groupNum);
  }

  return TDB_CODE_SUCCESS;
}

4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364 4365 4366 4367 4368 4369
/*
 * Prepare the read condition used by the block-distribution scan.
 *
 * `pCond` is zeroed and then set up as an ascending scan over the complete
 * time range [INT64_MIN, INT64_MAX] that loads exactly one column: a
 * timestamp column with column id 1. `uid` is recorded in pCond->suid and
 * both version bounds are set to -1.
 *
 * pCond->colList is allocated here and is owned by `pCond` afterwards.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_OUT_OF_MEMORY (also stored in
 * terrno) when the column list cannot be allocated.
 */
static int32_t initTableblockDistQueryCond(uint64_t uid, SQueryTableDataCond* pCond) {
  memset(pCond, 0, sizeof(SQueryTableDataCond));

  pCond->order = TSDB_ORDER_ASC;
  pCond->numOfCols = 1;

  SColumnInfo* pTsCol = taosMemoryCalloc(1, sizeof(SColumnInfo));
  pCond->colList = pTsCol;
  if (pTsCol == NULL) {
    terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return terrno;
  }

  // the single column that is read: the primary timestamp
  pTsCol->colId = 1;
  pTsCol->type = TSDB_DATA_TYPE_TIMESTAMP;
  pTsCol->bytes = sizeof(TSKEY);

  pCond->suid = uid;
  pCond->type = BLOCK_LOAD_OFFSET_ORDER;
  pCond->twindows = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};
  pCond->startVersion = -1;
  pCond->endVersion = -1;

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4370
SOperatorInfo* createOperatorTree(SPhysiNode* pPhyNode, SExecTaskInfo* pTaskInfo, SReadHandle* pHandle,
4371
                                  STableListInfo* pTableListInfo, SNode* pTagCond, SNode* pTagIndexCond, const char* pUser) {
4372 4373
  int32_t type = nodeType(pPhyNode);

X
Xiaoyu Wang 已提交
4374
  if (pPhyNode->pChildren == NULL || LIST_LENGTH(pPhyNode->pChildren) == 0) {
H
Haojun Liao 已提交
4375
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == type) {
dengyihao's avatar
dengyihao 已提交
4376
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4377

4378
      int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
4379
                                             pTableScanNode->groupSort, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
4380
      if (code) {
wmmhello's avatar
wmmhello 已提交
4381
        pTaskInfo->code = code;
D
dapan1121 已提交
4382 4383
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4384

4385
      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
S
slzhou 已提交
4386
      if (code) {
4387
        pTaskInfo->code = terrno;
wmmhello's avatar
wmmhello 已提交
4388 4389 4390
        return NULL;
      }

H
Haojun Liao 已提交
4391
      SOperatorInfo*  pOperator = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo);
4392 4393
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
S
slzhou 已提交
4394
      return pOperator;
L
Liu Jicong 已提交
4395

S
slzhou 已提交
4396 4397
    } else if (QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN == type) {
      STableMergeScanPhysiNode* pTableScanNode = (STableMergeScanPhysiNode*)pPhyNode;
4398
      int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
4399
                                             pTableScanNode->groupSort, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
L
Liu Jicong 已提交
4400
      if (code) {
wmmhello's avatar
wmmhello 已提交
4401
        pTaskInfo->code = code;
wmmhello's avatar
wmmhello 已提交
4402 4403
        return NULL;
      }
4404

4405
      code = extractTableSchemaInfo(pHandle, pTableScanNode->scan.uid, pTaskInfo);
wmmhello's avatar
wmmhello 已提交
4406 4407 4408 4409
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4410

4411
      SOperatorInfo* pOperator =
4412
          createTableMergeScanOperatorInfo(pTableScanNode, pTableListInfo, pHandle, pTaskInfo);
wmmhello's avatar
wmmhello 已提交
4413

4414 4415 4416
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
      return pOperator;
L
Liu Jicong 已提交
4417

H
Haojun Liao 已提交
4418
    } else if (QUERY_NODE_PHYSICAL_PLAN_EXCHANGE == type) {
4419
      return createExchangeOperatorInfo(pHandle->pMsgCb->clientRpc, (SExchangePhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4420
    } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN == type) {
5
54liuyao 已提交
4421
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
4422
      STimeWindowAggSupp   twSup = {
L
Liu Jicong 已提交
4423 4424 4425 4426
            .waterMark = pTableScanNode->watermark,
            .calTrigger = pTableScanNode->triggerType,
            .maxTs = INT64_MIN,
      };
L
Liu Jicong 已提交
4427
      if (pHandle) {
4428
        int32_t code = createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags,
4429
                                               pTableScanNode->groupSort, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
L
Liu Jicong 已提交
4430
        if (code) {
wmmhello's avatar
wmmhello 已提交
4431 4432 4433
          pTaskInfo->code = code;
          return NULL;
        }
5
54liuyao 已提交
4434
      }
4435

4436
      SOperatorInfo* pOperator = createStreamScanOperatorInfo(pHandle, pTableScanNode, pTagCond, pTaskInfo, &twSup);
H
Haojun Liao 已提交
4437
      return pOperator;
L
Liu Jicong 已提交
4438

H
Haojun Liao 已提交
4439
    } else if (QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN == type) {
L
Liu Jicong 已提交
4440
      SSystemTableScanPhysiNode* pSysScanPhyNode = (SSystemTableScanPhysiNode*)pPhyNode;
4441
      return createSysTableScanOperatorInfo(pHandle, pSysScanPhyNode, pUser, pTaskInfo);
4442
    } else if (QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN == type) {
X
Xiaoyu Wang 已提交
4443
      STagScanPhysiNode* pScanPhyNode = (STagScanPhysiNode*)pPhyNode;
4444

4445
      int32_t code = getTableList(pHandle->meta, pHandle->vnode, pScanPhyNode, pTagCond, pTagIndexCond, pTableListInfo);
4446
      if (code != TSDB_CODE_SUCCESS) {
4447
        pTaskInfo->code = terrno;
4448 4449 4450
        return NULL;
      }

4451
      return createTagScanOperatorInfo(pHandle, pScanPhyNode, pTableListInfo, pTaskInfo);
4452
    } else if (QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN == type) {
4453
      SBlockDistScanPhysiNode* pBlockNode = (SBlockDistScanPhysiNode*)pPhyNode;
4454 4455 4456
      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));

      if (pBlockNode->tableType == TSDB_SUPER_TABLE) {
4457
        int32_t code = vnodeGetAllTableList(pHandle->vnode, pBlockNode->uid, pTableListInfo->pTableList);
4458 4459 4460 4461 4462
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
S
slzhou 已提交
4463
        STableKeyInfo info = {.lastKey = 0, .uid = pBlockNode->uid, .groupId = 0};
4464 4465 4466 4467
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      SQueryTableDataCond cond = {0};
4468 4469 4470
      int32_t code = initTableblockDistQueryCond(pBlockNode->suid, &cond);
      if (code != TSDB_CODE_SUCCESS) {
        return NULL;
4471
      }
H
Haojun Liao 已提交
4472 4473 4474

      STsdbReader* pReader = NULL;
      tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, "");
4475 4476
      cleanupQueryTableDataCond(&cond);

4477
      return createDataBlockInfoScanOperator(pReader, pHandle, cond.suid, pBlockNode, pTaskInfo);
H
Haojun Liao 已提交
4478 4479 4480
    } else if (QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN == type) {
      SLastRowScanPhysiNode* pScanNode = (SLastRowScanPhysiNode*)pPhyNode;

4481
      int32_t code = createScanTableListInfo(&pScanNode->scan, pScanNode->pGroupTags, true, pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
4482 4483 4484 4485
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
      }
4486

4487 4488 4489 4490
      code = extractTableSchemaInfo(pHandle, pScanNode->scan.uid, pTaskInfo);
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
H
Haojun Liao 已提交
4491 4492
      }

4493
      return createLastrowScanOperator(pScanNode, pHandle, pTaskInfo);
H
Haojun Liao 已提交
4494 4495
    } else {
      ASSERT(0);
H
Haojun Liao 已提交
4496 4497 4498
    }
  }

4499 4500
  int32_t num = 0;
  size_t  size = LIST_LENGTH(pPhyNode->pChildren);
H
Haojun Liao 已提交
4501

4502
  SOperatorInfo** ops = taosMemoryCalloc(size, POINTER_BYTES);
dengyihao's avatar
dengyihao 已提交
4503
  for (int32_t i = 0; i < size; ++i) {
4504
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pPhyNode->pChildren, i);
4505
    ops[i] = createOperatorTree(pChildNode, pTaskInfo, pHandle, pTableListInfo, pTagCond, pTagIndexCond, pUser);
4506 4507 4508
    if (ops[i] == NULL) {
      return NULL;
    }
4509
  }
H
Haojun Liao 已提交
4510

4511
  SOperatorInfo* pOptr = NULL;
H
Haojun Liao 已提交
4512
  if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
4513
    pOptr = createProjectOperatorInfo(ops[0], (SProjectPhysiNode*)pPhyNode, pTaskInfo);
4514
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_AGG == type) {
H
Haojun Liao 已提交
4515 4516
    SAggPhysiNode* pAggNode = (SAggPhysiNode*)pPhyNode;
    SExprInfo*     pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
4517
    SSDataBlock*   pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4518

dengyihao's avatar
dengyihao 已提交
4519
    int32_t    numOfScalarExpr = 0;
4520 4521 4522 4523 4524
    SExprInfo* pScalarExprInfo = NULL;
    if (pAggNode->pExprs != NULL) {
      pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
    }

H
Haojun Liao 已提交
4525 4526
    if (pAggNode->pGroupKeys != NULL) {
      SArray* pColList = extractColumnInfo(pAggNode->pGroupKeys);
dengyihao's avatar
dengyihao 已提交
4527
      pOptr = createGroupOperatorInfo(ops[0], pExprInfo, num, pResBlock, pColList, pAggNode->node.pConditions,
wmmhello's avatar
wmmhello 已提交
4528
                                      pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4529
    } else {
L
Liu Jicong 已提交
4530 4531
      pOptr = createAggregateOperatorInfo(ops[0], pExprInfo, num, pResBlock, pAggNode->node.pConditions,
                                          pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4532
    }
X
Xiaoyu Wang 已提交
4533
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_INTERVAL == type || QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type) {
H
Haojun Liao 已提交
4534
    SIntervalPhysiNode* pIntervalPhyNode = (SIntervalPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4535

H
Haojun Liao 已提交
4536
    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
4537
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4538

dengyihao's avatar
dengyihao 已提交
4539 4540 4541 4542 4543 4544
    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
H
Haojun Liao 已提交
4545

X
Xiaoyu Wang 已提交
4546 4547 4548 4549 4550
    STimeWindowAggSupp as = {
        .waterMark = pIntervalPhyNode->window.watermark,
        .calTrigger = pIntervalPhyNode->window.triggerType,
        .maxTs = INT64_MIN,
    };
4551
    ASSERT(as.calTrigger != STREAM_TRIGGER_MAX_DELAY);
4552

4553
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4554
    bool    isStream = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type);
4555 4556
    pOptr = createIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, &as, pIntervalPhyNode,
                                       pTaskInfo, isStream);
4557

4558 4559
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == type) {
    SMergeAlignedIntervalPhysiNode* pIntervalPhyNode = (SMergeAlignedIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4560 4561 4562 4563 4564 4565 4566 4567 4568 4569

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4570

S
shenglian zhou 已提交
4571
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4572 4573
    pOptr = createMergeAlignedIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId,
                                                   pPhyNode->pConditions, pTaskInfo);
S
shenglian zhou 已提交
4574
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_INTERVAL == type) {
X
Xiaoyu Wang 已提交
4575
    SMergeIntervalPhysiNode* pIntervalPhyNode = (SMergeIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4576 4577 4578 4579 4580 4581 4582 4583 4584 4585

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4586

S
shenglian zhou 已提交
4587 4588
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    pOptr = createMergeIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
5
54liuyao 已提交
4589
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL == type) {
4590
    int32_t children = 0;
5
54liuyao 已提交
4591 4592
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL == type) {
4593
    int32_t children = 1;
5
54liuyao 已提交
4594
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4595
  } else if (QUERY_NODE_PHYSICAL_PLAN_SORT == type) {
4596
    pOptr = createSortOperatorInfo(ops[0], (SSortPhysiNode*)pPhyNode, pTaskInfo);
S
shenglian zhou 已提交
4597 4598
  } else if (QUERY_NODE_PHYSICAL_PLAN_GROUP_SORT == type) {
    pOptr = createGroupSortOperatorInfo(ops[0], (SGroupSortPhysiNode*)pPhyNode, pTaskInfo);
X
Xiaoyu Wang 已提交
4599
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE == type) {
4600
    SMergePhysiNode* pMergePhyNode = (SMergePhysiNode*)pPhyNode;
4601
    pOptr = createMultiwayMergeOperatorInfo(ops, size, pMergePhyNode, pTaskInfo);
4602
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_SESSION == type) {
H
Haojun Liao 已提交
4603 4604
    SSessionWinodwPhysiNode* pSessionNode = (SSessionWinodwPhysiNode*)pPhyNode;

X
Xiaoyu Wang 已提交
4605 4606
    STimeWindowAggSupp as = {.waterMark = pSessionNode->window.watermark,
                             .calTrigger = pSessionNode->window.triggerType};
4607

H
Haojun Liao 已提交
4608
    SExprInfo*   pExprInfo = createExprInfo(pSessionNode->window.pFuncs, NULL, &num);
4609
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4610 4611
    int32_t      tsSlotId = ((SColumnNode*)pSessionNode->window.pTspk)->slotId;

L
Liu Jicong 已提交
4612 4613
    pOptr = createSessionAggOperatorInfo(ops[0], pExprInfo, num, pResBlock, pSessionNode->gap, tsSlotId, &as,
                                         pPhyNode->pConditions, pTaskInfo);
4614
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == type) {
4615 4616 4617 4618 4619 4620 4621
    pOptr = createStreamSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_SESSION == type) {
    int32_t children = 0;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_SESSION == type) {
    int32_t children = 1;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4622
  } else if (QUERY_NODE_PHYSICAL_PLAN_PARTITION == type) {
4623
    pOptr = createPartitionOperatorInfo(ops[0], (SPartitionPhysiNode*)pPhyNode, pTaskInfo);
4624
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_STATE == type) {
dengyihao's avatar
dengyihao 已提交
4625
    SStateWinodwPhysiNode* pStateNode = (SStateWinodwPhysiNode*)pPhyNode;
4626

4627 4628
    STimeWindowAggSupp as = {.waterMark = pStateNode->window.watermark, .calTrigger = pStateNode->window.triggerType};

dengyihao's avatar
dengyihao 已提交
4629
    SExprInfo*   pExprInfo = createExprInfo(pStateNode->window.pFuncs, NULL, &num);
4630
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4631 4632
    int32_t      tsSlotId = ((SColumnNode*)pStateNode->window.pTspk)->slotId;

4633
    SColumnNode* pColNode = (SColumnNode*)((STargetNode*)pStateNode->pStateKey)->pExpr;
X
Xiaoyu Wang 已提交
4634
    SColumn      col = extractColumnFromColumnNode(pColNode);
L
Liu Jicong 已提交
4635 4636
    pOptr = createStatewindowOperatorInfo(ops[0], pExprInfo, num, pResBlock, &as, tsSlotId, &col, pPhyNode->pConditions,
                                          pTaskInfo);
4637
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == type) {
5
54liuyao 已提交
4638
    pOptr = createStreamStateAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4639
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_JOIN == type) {
4640
    pOptr = createMergeJoinOperatorInfo(ops, size, (SJoinPhysiNode*)pPhyNode, pTaskInfo);
4641
  } else if (QUERY_NODE_PHYSICAL_PLAN_FILL == type) {
H
Haojun Liao 已提交
4642
    pOptr = createFillOperatorInfo(ops[0], (SFillPhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4643 4644
  } else if (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC == type) {
    pOptr = createIndefinitOutputOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4645 4646
  } else if (QUERY_NODE_PHYSICAL_PLAN_INTERP_FUNC == type) {
    pOptr = createTimeSliceOperatorInfo(ops[0], pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4647 4648
  } else {
    ASSERT(0);
H
Haojun Liao 已提交
4649
  }
4650 4651 4652

  taosMemoryFree(ops);
  return pOptr;
4653
}
H
Haojun Liao 已提交
4654

H
Haojun Liao 已提交
4655
/*
 * Build an array of SColumn descriptors from a list of target nodes.
 *
 * Every element of `pNodeList` is read as an STargetNode. Targets whose
 * expression is a column node are converted with
 * extractColumnFromColumnNode(); targets whose expression is a value node
 * get a descriptor assembled from the target slot id and the result type of
 * the value. Targets of any other expression kind are skipped.
 *
 * Returns the new array, or NULL with terrno set to
 * TSDB_CODE_OUT_OF_MEMORY when the array cannot be allocated.
 */
SArray* extractColumnInfo(SNodeList* pNodeList) {
  size_t  numOfCols = LIST_LENGTH(pNodeList);
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  for (int32_t i = 0; i < (int32_t)numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);

    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

      SColumn c = extractColumnFromColumnNode(pColNode);
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};
      c.slotId = pNode->slotId;
      c.colId = pNode->slotId;
      // the data type lives in resType, next to bytes/scale/precision; node.type is the node kind
      c.type = pValNode->node.resType.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
  }

  return pList;
}

4688
#if 0
/*
 * Compiled out. Builds the table list for a table scan node and opens a
 * tsdb reader on it.
 *
 * Returns the reader, or NULL with terrno set to the failure code. When no
 * table qualifies, NULL is returned with terrno set to 0.
 */
STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
                                STableListInfo* pTableListInfo, const char* idstr) {
  int32_t code = getTableList(pHandle->meta, pHandle->vnode, &pTableScanNode->scan, pTableListInfo);
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    return NULL;
  }

  if (taosArrayGetSize(pTableListInfo->pTableList) == 0) {
    // an empty table list is not an error, there is simply nothing to read
    code = 0;
    qDebug("no table qualified for query, %s", idstr);
    terrno = code;
    return NULL;
  }

  SQueryTableDataCond cond = {0};
  code = initQueryTableDataCond(&cond, pTableScanNode);
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    return NULL;
  }

  STsdbReader* pReader;
  code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, idstr);
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    return NULL;
  }

  cleanupQueryTableDataCond(&cond);
  return pReader;
}
#endif
H
Haojun Liao 已提交
4723

L
Liu Jicong 已提交
4724 4725 4726 4727 4728 4729 4730 4731 4732 4733 4734 4735 4736
/*
 * Walk down a single-child operator chain until a stream scan operator is
 * reached and return the info of the table scan operator it wraps.
 *
 * pOperator  operator at which the search starts
 * ppInfo     receives the info pointer of the wrapped table scan operator
 *
 * Returns 0 on success. Returns TSDB_CODE_QRY_APP_ERROR when the chain ends
 * before a stream scan operator is found, or when an operator on the way has
 * more than one downstream operator.
 */
static int32_t extractTbscanInStreamOpTree(SOperatorInfo* pOperator, STableScanInfo** ppInfo) {
  SOperatorInfo* pCur = pOperator;

  while (pCur->operatorType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    if (pCur->numOfDownstream == 0) {
      qError("failed to find stream scan operator");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    if (pCur->numOfDownstream > 1) {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    pCur = pCur->pDownstream[0];
  }

  SStreamScanInfo* pStreamInfo = pCur->info;
  ASSERT(pStreamInfo->pTableScanOp->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN);
  *ppInfo = pStreamInfo->pTableScanOp->info;
  return 0;
}

4744 4745 4746 4747 4748 4749 4750 4751 4752 4753 4754 4755 4756 4757 4758 4759 4760 4761 4762 4763 4764 4765
/*
 * Follow a chain of single-child physical plan nodes down to its leaf and
 * return that leaf when it is a table scan node.
 *
 * pNode   node at which the search starts
 * ppNode  receives the table scan node on success
 *
 * Returns 0 on success. When the leaf is not a table scan node, or a node on
 * the way does not have exactly one child, the function asserts, sets terrno
 * to TSDB_CODE_QRY_APP_ERROR and returns -1.
 */
int32_t extractTableScanNode(SPhysiNode* pNode, STableScanPhysiNode** ppNode) {
  SPhysiNode* pCur = pNode;

  for (;;) {
    bool isLeaf = (pCur->pChildren == NULL) || (LIST_LENGTH(pCur->pChildren) == 0);
    if (isLeaf) {
      if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN != pCur->type) {
        break;
      }

      *ppNode = (STableScanPhysiNode*)pCur;
      return 0;
    }

    if (LIST_LENGTH(pCur->pChildren) != 1) {
      break;
    }

    pCur = (SPhysiNode*)nodesListGetNode(pCur->pChildren, 0);
  }

  // unexpected plan shape
  ASSERT(0);
  terrno = TSDB_CODE_QRY_APP_ERROR;
  return -1;
}

4766
#if 0
/*
 * Compiled out. Replaces the data reader of the table scan that sits below
 * the stream scan operator found under `pOperator` with a freshly created
 * reader for the table scan node of `plan`.
 *
 * Returns 0 on success, -1 when the table scan info cannot be located, and
 * TSDB_CODE_QRY_APP_ERROR when the new reader cannot be created. `uid` and
 * `ts` are not used yet (see the TODO below).
 */
int32_t rebuildReader(SOperatorInfo* pOperator, SSubplan* plan, SReadHandle* pHandle, int64_t uid, int64_t ts) {
  STableScanInfo* pTableScanInfo = NULL;
  int32_t         found = extractTbscanInStreamOpTree(pOperator, &pTableScanInfo);
  if (found < 0) {
    return -1;
  }

  STableScanPhysiNode* pNode = NULL;
  if (extractTableScanNode(plan->pNode, &pNode) < 0) {
    ASSERT(0);
  }

  // drop the old reader before a new one is installed
  tsdbReaderClose(pTableScanInfo->dataReader);

  STableListInfo info = {0};
  pTableScanInfo->dataReader = doCreateDataReader(pNode, pHandle, &info, NULL);
  if (pTableScanInfo->dataReader != NULL) {
    // TODO: set uid and ts to data reader
    return 0;
  }

  ASSERT(0);
  qError("failed to create data reader");
  return TSDB_CODE_QRY_APP_ERROR;
}
#endif
4791

C
Cary Xu 已提交
4792
/*
 * Serialize the result rows of `ops` and of all its downstream operators
 * into one growing buffer.
 *
 * The buffer starts with an int32_t holding its total size (header
 * included), followed by the encoded payload of each operator that produced
 * data, in the order the operators are visited (the operator itself first,
 * then its downstream operators).
 *
 * ops           operator to encode; operators without an encodeResultRow
 *               callback contribute nothing themselves
 * result        in/out buffer pointer; allocated on first use and
 *               reallocated as payloads are appended
 * length        receives the current total size of *result
 * nOptrWithVal  incremented once per operator that produced a payload
 *
 * Returns TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT when an output
 * argument is NULL, TSDB_CODE_OUT_OF_MEMORY when the buffer cannot be grown,
 * or the error reported by an encode callback. On a callback or realloc
 * failure *result is freed and reset to NULL.
 */
int32_t encodeOperator(SOperatorInfo* ops, char** result, int32_t* length, int32_t* nOptrWithVal) {
  if (ops->fpSet.encodeResultRow != NULL) {
    if (result == NULL || length == NULL || nOptrWithVal == NULL) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    char*   pPayload = NULL;
    int32_t payloadLen = 0;
    int32_t rc = ops->fpSet.encodeResultRow(ops, &pPayload, &payloadLen);
    if (rc != TDB_CODE_SUCCESS) {
      if (*result != NULL) {
        taosMemoryFree(*result);
        *result = NULL;
      }
      return rc;
    }

    if (payloadLen == 0) {
      // nothing to store for this operator, continue with its children
      ASSERT(!pPayload);
    } else {
      ++(*nOptrWithVal);

      ASSERT(payloadLen >= 0);

      if (*result != NULL) {
        // append to the existing buffer; its first int32_t is the size used so far
        int32_t usedLen = *(int32_t*)(*result);
        char*   pGrown = (char*)taosMemoryRealloc(*result, usedLen + payloadLen);
        if (pGrown == NULL) {
          taosMemoryFree(pPayload);
          taosMemoryFree(*result);
          *result = NULL;
          return TSDB_CODE_OUT_OF_MEMORY;
        }

        *result = pGrown;
        memcpy(*result + usedLen, pPayload, payloadLen);
        *(int32_t*)(*result) += payloadLen;
      } else {
        // first payload: reserve room for the size header in front of it
        *result = (char*)taosMemoryCalloc(1, payloadLen + sizeof(int32_t));
        if (*result == NULL) {
          taosMemoryFree(pPayload);
          return TSDB_CODE_OUT_OF_MEMORY;
        }

        memcpy(*result + sizeof(int32_t), pPayload, payloadLen);
        *(int32_t*)(*result) = payloadLen + sizeof(int32_t);
      }

      taosMemoryFree(pPayload);
      *length = *(int32_t*)(*result);
    }
  }

  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    int32_t rc = encodeOperator(ops->pDownstream[i], result, length, nOptrWithVal);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }
  }

  return TDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4852
/*
 * Restore the result rows of `ops` and of its downstream operators from a
 * buffer laid out as an int32_t total size followed by the operator
 * payloads.
 *
 * An operator with a decodeResultRow callback consumes the payload at the
 * front of the buffer. The first int32_t of that payload is taken as the
 * payload length; the buffer position is then advanced by that length and a
 * new size header for the remaining data is written at the new position.
 * NOTE: this writes into the buffer although `result` is declared const.
 *
 * ops     operator to restore
 * result  start of the (remaining) buffer
 * length  size of the (remaining) buffer; asserted to equal its size header
 *
 * Returns TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT when data is needed
 * but `result` is NULL, or the error reported by a decode callback.
 */
int32_t decodeOperator(SOperatorInfo* ops, const char* result, int32_t length) {
  if (ops->fpSet.decodeResultRow != NULL) {
    if (result == NULL) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    ASSERT(length == *(int32_t*)result);

    const char* pPayload = result + sizeof(int32_t);
    int32_t     rc = ops->fpSet.decodeResultRow(ops, (char*)pPayload);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }

    int32_t totalLength = *(int32_t*)result;
    int32_t dataLength = *(int32_t*)pPayload;

    if (totalLength != dataLength + sizeof(int32_t)) {
      // more payloads follow: step over this one and re-create the size header in front of the rest
      int32_t remaining = totalLength - dataLength;
      result += dataLength;
      *(int32_t*)(result) = remaining;
      length = remaining;
    } else {  // the last data
      result = NULL;
      length = 0;
    }
  }

  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    int32_t rc = decodeOperator(ops->pDownstream[i], result, length);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }
  }

  return TDB_CODE_SUCCESS;
}

D
dapan1121 已提交
4889
/*
 * Create the parameter object required by the data sink described by
 * `pNode`.
 *
 * pNode       data sink node; only the insert and delete sinks need a
 *             parameter, for any other type *pParam is left untouched
 * pParam      receives the newly allocated parameter (SInserterParam or
 *             SDeleterParam)
 * pTaskInfo   address of the task handle whose table list is used for the
 *             delete sink
 * readHandle  read handle stored in the inserter parameter
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when an allocation
 * fails. Nothing is handed out through pParam on failure.
 */
int32_t createDataSinkParam(SDataSinkNode* pNode, void** pParam, qTaskInfo_t* pTaskInfo, SReadHandle* readHandle) {
  SExecTaskInfo* pTask = *(SExecTaskInfo**)pTaskInfo;

  switch (pNode->type) {
    case QUERY_NODE_PHYSICAL_PLAN_QUERY_INSERT: {
      SInserterParam* pInserterParam = taosMemoryCalloc(1, sizeof(SInserterParam));
      if (NULL == pInserterParam) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      pInserterParam->readHandle = readHandle;

      *pParam = pInserterParam;
      break;
    }
    case QUERY_NODE_PHYSICAL_PLAN_DELETE: {
      SDeleterParam* pDeleterParam = taosMemoryCalloc(1, sizeof(SDeleterParam));
      if (NULL == pDeleterParam) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      int32_t tbNum = taosArrayGetSize(pTask->tableqinfoList.pTableList);
      pDeleterParam->suid = pTask->tableqinfoList.suid;
      pDeleterParam->pUidList = taosArrayInit(tbNum, sizeof(uint64_t));
      if (NULL == pDeleterParam->pUidList) {
        taosMemoryFree(pDeleterParam);
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      // collect the uid of every table of the task
      for (int32_t i = 0; i < tbNum; ++i) {
        STableKeyInfo* pTable = taosArrayGet(pTask->tableqinfoList.pTableList, i);
        if (NULL == taosArrayPush(pDeleterParam->pUidList, &pTable->uid)) {
          // a partial uid list would silently drop tables from the delete, so fail instead
          taosArrayDestroy(pDeleterParam->pUidList);
          taosMemoryFree(pDeleterParam);
          return TSDB_CODE_OUT_OF_MEMORY;
        }
      }

      *pParam = pDeleterParam;
      break;
    }
    default:
      break;
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
4930
/*
 * Create an execution task for `pPlan` and build its operator tree.
 *
 * pPlan      sub plan to execute; stored in the task on success
 * pTaskInfo  receives the new task; set to NULL on failure
 * pHandle    read handle passed to the operator tree
 * taskId     id of the task
 * sql        sql text stored in the task (the pointer itself is stored)
 * model      execution model of the task
 *
 * Returns TSDB_CODE_SUCCESS, or an error code that is also stored in terrno.
 * A failure is never reported as success: when the operator tree cannot be
 * built and no error code was recorded in the task,
 * TSDB_CODE_QRY_APP_ERROR is returned.
 */
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
                               const char* sql, EOPTR_EXEC_MODEL model) {
  uint64_t queryId = pPlan->id.queryId;

  int32_t code = TSDB_CODE_SUCCESS;
  *pTaskInfo = createExecTaskInfo(queryId, taskId, model, pPlan->dbFName);
  if (*pTaskInfo == NULL) {
    code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    goto _complete;
  }

  (*pTaskInfo)->sql = sql;
  (*pTaskInfo)->pSubplan = pPlan;
  (*pTaskInfo)->pRoot = createOperatorTree(pPlan->pNode, *pTaskInfo, pHandle, &(*pTaskInfo)->tableqinfoList, pPlan->pTagCond, pPlan->pTagIndexCond, pPlan->user);

  if (NULL == (*pTaskInfo)->pRoot) {
    code = (*pTaskInfo)->code;
    if (code == TSDB_CODE_SUCCESS) {
      // the tree builder failed without recording a reason; the caller must still see an error
      code = TSDB_CODE_QRY_APP_ERROR;
    }
    goto _complete;
  }

  return code;

_complete:
  // NOTE(review): only the task structure itself is released here.
  taosMemoryFreeClear(*pTaskInfo);
  terrno = code;
  return code;
}

wmmhello's avatar
wmmhello 已提交
4958 4959 4960
/*
 * Release everything owned by a table list: the per-group table arrays (only
 * when the list was sorted by group id), the group list, the table array and
 * the uid map. All released pointers are reset to NULL afterwards.
 */
static void doDestroyTableList(STableListInfo* pTableqinfoList) {
  // The group arrays go first: pTableList may itself be one of the entries and must be
  // skipped, and that identity check has to happen while pTableList is still alive.
  if (pTableqinfoList->needSortTableByGroupId) {
    int32_t numOfGroups = (int32_t)taosArrayGetSize(pTableqinfoList->pGroupList);
    for (int32_t i = 0; i < numOfGroups; i++) {
      SArray* pGroup = taosArrayGetP(pTableqinfoList->pGroupList, i);
      if (pGroup == pTableqinfoList->pTableList) {
        continue;
      }
      taosArrayDestroy(pGroup);
    }
  }
  taosArrayDestroy(pTableqinfoList->pGroupList);

  taosArrayDestroy(pTableqinfoList->pTableList);
  taosHashCleanup(pTableqinfoList->map);

  // no dangling pointers are left behind
  pTableqinfoList->pGroupList = NULL;
  pTableqinfoList->pTableList = NULL;
  pTableqinfoList->map = NULL;
}

L
Liu Jicong 已提交
4976
/*
 * Tear down an execution task: its table list, operator tree, schema info and sub-plan node, followed by
 * the sql text, the id string and finally the task structure itself.
 *
 * Passing NULL is a no-op.
 */
void doDestroyTask(SExecTaskInfo* pTaskInfo) {
  if (pTaskInfo == NULL) {
    return;
  }

  qDebug("%s execTask is freed", GET_TASKID(pTaskInfo));

  doDestroyTableList(&pTaskInfo->tableqinfoList);
  destroyOperatorInfo(pTaskInfo->pRoot);
  cleanupTableSchemaInfo(&pTaskInfo->schemaInfo);

  nodesDestroyNode((SNode*)pTaskInfo->pSubplan);

  taosMemoryFreeClear(pTaskInfo->sql);
  taosMemoryFreeClear(pTaskInfo->id.str);
  taosMemoryFreeClear(pTaskInfo);
}

/*
 * Write one tag value into an output cell.
 *
 * output  destination cell
 * val     source value, or NULL to write the type's null representation
 * type    data type of the value
 * bytes   size of the destination cell
 */
static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes) {
  if (val == NULL) {
    setNull(output, type, bytes);
    return;
  }

  // fixed-width values are copied verbatim
  if (!IS_VAR_DATA_TYPE(type)) {
    memcpy(output, val, bytes);
    return;
  }

  // variable-length value that fits into the cell
  if (varDataTLen(val) <= bytes) {
    varDataCopy(output, val);
    return;
  }

  // Binary data overflows the cell for unknown reasons; trim the payload to what the cell can hold.
  int32_t capacity = bytes - VARSTR_HEADER_SIZE;
  int32_t copyLen = varDataLen(val);
  if (copyLen > capacity) {
    copyLen = capacity;
  }

  memcpy(varDataVal(output), varDataVal(val), copyLen);
  varDataSetLen(output, copyLen);
}

/*
 * Estimate the query buffer needed for numOfTables tables: 1.5 times sizeof(STableQueryInfo) per table.
 * The tsdb-side buffer consumption (STableCheckInfo) is not part of this estimate.
 */
static int64_t getQuerySupportBufSize(size_t numOfTables) {
  const size_t perTableSize = sizeof(STableQueryInfo);
  return (int64_t)(perTableSize * 1.5 * numOfTables);
}

/*
 * Reserve query buffer for numOfTables tables out of the global tsQueryBufferSizeBytes budget.
 *
 * A negative budget means no limit is enforced. A budget of zero disables query processing.
 * Otherwise the estimate from getQuerySupportBufSize() is subtracted with a compare-and-swap retry loop.
 *
 * Returns TSDB_CODE_SUCCESS when the reservation succeeded (or no limit applies),
 * TSDB_CODE_QRY_NOT_ENOUGH_BUFFER otherwise.
 */
int32_t checkForQueryBuf(size_t numOfTables) {
  int64_t required = getQuerySupportBufSize(numOfTables);

  if (tsQueryBufferSizeBytes < 0) {
    return TSDB_CODE_SUCCESS;
  }

  // disable query processing if the value of tsQueryBufferSize is zero.
  if (tsQueryBufferSizeBytes <= 0) {
    return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
  }

  for (;;) {
    int64_t available = tsQueryBufferSizeBytes;
    int64_t left = available - required;
    if (left < 0) {
      return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
    }

    // retry when the budget was changed between the read above and the swap
    if (atomic_val_compare_exchange_64(&tsQueryBufferSizeBytes, available, left) == available) {
      return TSDB_CODE_SUCCESS;
    }
  }
}

/*
 * Return the buffer estimate for numOfTables tables to the global tsQueryBufferSizeBytes budget.
 * Nothing is done when the budget is negative, i.e. when checkForQueryBuf() enforces no limit.
 */
void releaseQueryBuf(size_t numOfTables) {
  if (tsQueryBufferSizeBytes >= 0) {
    int64_t reserved = getQuerySupportBufSize(numOfTables);

    // give the previously reserved amount back to the available budget
    atomic_add_fetch_64(&tsQueryBufferSizeBytes, reserved);
  }
}
D
dapan1121 已提交
5049

dengyihao's avatar
dengyihao 已提交
5050 5051
/*
 * Collect explain/exec statistics for an operator and, recursively, for all of its downstream operators.
 *
 * operatorInfo  operator to report on
 * pRes          [in/out] growable array of results; reallocated in steps of 10 entries when full
 * capacity      [in/out] number of entries *pRes can currently hold
 * resNum        [in/out] number of entries already filled; incremented for every operator visited
 *
 * Returns TSDB_CODE_SUCCESS on success, otherwise the error code of the step that failed. When a
 * downstream operator fails, *pRes is freed and set to NULL before the error is returned.
 */
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SExplainExecInfo** pRes, int32_t* capacity,
                                   int32_t* resNum) {
  int32_t code = TSDB_CODE_SUCCESS;

  if (*resNum >= *capacity) {
    int32_t newCapacity = *capacity + 10;

    // Keep the old buffer and capacity untouched until the reallocation is known to have succeeded;
    // assigning the result straight to *pRes would lose the only reference to the old buffer on failure.
    SExplainExecInfo* pNew = taosMemoryRealloc(*pRes, newCapacity * sizeof(SExplainExecInfo));
    if (NULL == pNew) {
      qError("malloc %d failed", newCapacity * (int32_t)sizeof(SExplainExecInfo));
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }

    *pRes = pNew;
    *capacity = newCapacity;
  }

  SExplainExecInfo* pInfo = &(*pRes)[*resNum];

  pInfo->numOfRows = operatorInfo->resultInfo.totalRows;
  pInfo->startupCost = operatorInfo->cost.openCost;
  pInfo->totalCost = operatorInfo->cost.totalCost;

  if (operatorInfo->fpSet.getExplainFn) {
    code = operatorInfo->fpSet.getExplainFn(operatorInfo, &pInfo->verboseInfo, &pInfo->verboseLen);
    if (code) {
      qError("%s operator getExplainFn failed, code:%s", GET_TASKID(operatorInfo->pTaskInfo), tstrerror(code));
      return code;
    }
  } else {
    pInfo->verboseLen = 0;
    pInfo->verboseInfo = NULL;
  }

  ++(*resNum);

  for (int32_t i = 0; i < operatorInfo->numOfDownstream; ++i) {
    // pInfo must not be used past this point: the recursive call may reallocate *pRes.
    code = getOperatorExplainExecInfo(operatorInfo->pDownstream[i], pRes, capacity, resNum);
    if (code) {
      taosMemoryFreeClear(*pRes);
      // report the real cause instead of masking every failure as out-of-memory
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}
5
54liuyao 已提交
5092

L
Liu Jicong 已提交
5093
/*
 * Initialise a stream aggregate supporter: key buffer, result-row hash, scan-window array and the
 * disk-based result buffer, then point every function context at that result buffer.
 *
 * pSup         supporter to initialise
 * pKey         key forwarded to createDiskbasedBuf()
 * pCtx         array of numOfOutput function contexts; each pBuf is set to the supporter's result buffer
 * numOfOutput  number of entries in pCtx
 * size         stored as pSup->valueSize
 *
 * Returns TSDB_CODE_OUT_OF_MEMORY when one of the allocations fails, otherwise the code returned by
 * createDiskbasedBuf(). Members allocated before a failure are left in pSup and are not released here.
 * NOTE(review): presumably the caller's teardown of pSup releases them - confirm against the callers.
 */
int32_t initStreamAggSupporter(SStreamAggSupporter* pSup, const char* pKey, SqlFunctionCtx* pCtx, int32_t numOfOutput,
                               int32_t size) {
  pSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pSup->keySize = sizeof(int64_t) + sizeof(TSKEY);
  pSup->pKeyBuf = taosMemoryCalloc(1, pSup->keySize);
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pSup->pResultRows = taosHashInit(1024, hashFn, false, HASH_NO_LOCK);
  if (pSup->pKeyBuf == NULL || pSup->pResultRows == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  pSup->valueSize = size;

  pSup->pScanWindow = taosArrayInit(4, sizeof(STimeWindow));
  if (pSup->pScanWindow == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // smallest power-of-two page (>= 4 KiB) that can hold four result rows
  int32_t pageSize = 4096;
  while (pageSize < pSup->resultRowSize * 4) {
    pageSize <<= 1u;
  }

  // At least four pages need to be in buffer. Comparing against pageSize alone would leave only two
  // pages in the default 1 MiB buffer when pageSize is 512 KiB.
  int32_t bufSize = 4096 * 256;
  if (bufSize < pageSize * 4) {
    bufSize = pageSize * 4;
  }

  int32_t code = createDiskbasedBuf(&pSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
  for (int32_t i = 0; i < numOfOutput; ++i) {
    pCtx[i].pBuf = pSup->pResultBuf;
  }
  return code;
}