executorimpl.c 175.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

H
Haojun Liao 已提交
16 17
#include "filter.h"
#include "function.h"
18 19
#include "functionMgt.h"
#include "os.h"
H
Haojun Liao 已提交
20
#include "querynodes.h"
21
#include "tfill.h"
dengyihao's avatar
dengyihao 已提交
22
#include "tname.h"
X
Xiaoyu Wang 已提交
23
#include "tref.h"
24

H
Haojun Liao 已提交
25
#include "tdatablock.h"
26
#include "tglobal.h"
H
Haojun Liao 已提交
27
#include "tmsg.h"
H
Haojun Liao 已提交
28
#include "tsort.h"
29
#include "ttime.h"
H
Haojun Liao 已提交
30

31
#include "executorimpl.h"
dengyihao's avatar
dengyihao 已提交
32
#include "index.h"
33
#include "query.h"
34 35
#include "tcompare.h"
#include "tcompression.h"
H
Haojun Liao 已提交
36
#include "thash.h"
37
#include "ttypes.h"
dengyihao's avatar
dengyihao 已提交
38
#include "vnode.h"
39

H
Haojun Liao 已提交
40
#define IS_MAIN_SCAN(runtime)          ((runtime)->scanFlag == MAIN_SCAN)
41 42 43 44 45 46
#define SET_REVERSE_SCAN_FLAG(runtime) ((runtime)->scanFlag = REVERSE_SCAN)

#define GET_FORWARD_DIRECTION_FACTOR(ord) (((ord) == TSDB_ORDER_ASC) ? QUERY_ASC_FORWARD_STEP : QUERY_DESC_FORWARD_STEP)

#if 0
static UNUSED_FUNC void *u_malloc (size_t __size) {
wafwerar's avatar
wafwerar 已提交
47
  uint32_t v = taosRand();
48 49 50 51

  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
52
    return taosMemoryMalloc(__size);
53 54 55 56
  }
}

static UNUSED_FUNC void* u_calloc(size_t num, size_t __size) {
wafwerar's avatar
wafwerar 已提交
57
  uint32_t v = taosRand();
58 59 60
  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
61
    return taosMemoryCalloc(num, __size);
62 63 64 65
  }
}

static UNUSED_FUNC void* u_realloc(void* p, size_t __size) {
wafwerar's avatar
wafwerar 已提交
66
  uint32_t v = taosRand();
67 68 69
  if (v % 5 <= 1) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
70
    return taosMemoryRealloc(p, __size);
71 72 73 74 75 76 77 78
  }
}

#define calloc  u_calloc
#define malloc  u_malloc
#define realloc u_realloc
#endif

X
Xiaoyu Wang 已提交
79
#define CLEAR_QUERY_STATUS(q, st)   ((q)->status &= (~(st)))
80 81
#define QUERY_IS_INTERVAL_QUERY(_q) ((_q)->interval.interval > 0)

L
Liu Jicong 已提交
82 83 84
int32_t getMaximumIdleDurationSec() { return tsShellActivityTimer * 2; }

static int32_t getExprFunctionId(SExprInfo* pExprInfo) {
85
  assert(pExprInfo != NULL && pExprInfo->pExpr != NULL && pExprInfo->pExpr->nodeType == TEXPR_UNARYEXPR_NODE);
86
  return 0;
87 88 89 90
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes);

91
static void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExpr, SSDataBlock* pSDataBlock);
92

X
Xiaoyu Wang 已提交
93
static void releaseQueryBuf(size_t numOfTables);
94 95 96 97 98

static void destroySFillOperatorInfo(void* param, int32_t numOfOutput);
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput);
static void destroyOrderOperatorInfo(void* param, int32_t numOfOutput);
static void destroyAggOperatorInfo(void* param, int32_t numOfOutput);
X
Xiaoyu Wang 已提交
99

H
Haojun Liao 已提交
100
static void destroyIntervalOperatorInfo(void* param, int32_t numOfOutput);
H
Haojun Liao 已提交
101 102
static void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput);

103 104
static void destroyOperatorInfo(SOperatorInfo* pOperator);

105
void doSetOperatorCompleted(SOperatorInfo* pOperator) {
106
  pOperator->status = OP_EXEC_DONE;
107

108
  pOperator->cost.totalCost = (taosGetTimestampUs() - pOperator->pTaskInfo->cost.start * 1000) / 1000.0;
H
Haojun Liao 已提交
109
  if (pOperator->pTaskInfo != NULL) {
110
    setTaskStatus(pOperator->pTaskInfo, TASK_COMPLETED);
111 112
  }
}
113

H
Haojun Liao 已提交
114
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator) {
115
  OPTR_SET_OPENED(pOperator);
116
  pOperator->cost.openCost = 0;
H
Haojun Liao 已提交
117
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
118 119
}

120
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
L
Liu Jicong 已提交
121
                                   __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
122
                                   __optr_decode_fn_t decode, __optr_explain_fn_t explain) {
123 124 125 126 127 128 129 130 131 132 133 134 135 136
  SOperatorFpSet fpSet = {
      ._openFn = openFn,
      .getNextFn = nextFn,
      .getStreamResFn = streamFn,
      .cleanupFn = cleanup,
      .closeFn = closeFn,
      .encodeResultRow = encode,
      .decodeResultRow = decode,
      .getExplainFn = explain,
  };

  return fpSet;
}

H
Haojun Liao 已提交
137
void operatorDummyCloseFn(void* param, int32_t numOfCols) {}
H
Haojun Liao 已提交
138

X
Xiaoyu Wang 已提交
139 140 141
static int32_t doCopyToSDataBlock(SExecTaskInfo* taskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo,
                                  SDiskbasedBuf* pBuf, SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset,
                                  SqlFunctionCtx* pCtx, int32_t numOfExprs);
H
Haojun Liao 已提交
142

143
static void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size);
L
Liu Jicong 已提交
144 145
static void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                                     uint64_t groupId);
146

L
Liu Jicong 已提交
147 148
// setup the output buffer for each operator
static bool hasNull(SColumn* pColumn, SColumnDataAgg* pStatis) {
dengyihao's avatar
dengyihao 已提交
149 150
  if (TSDB_COL_IS_TAG(pColumn->flag) || TSDB_COL_IS_UD_COL(pColumn->flag) ||
      pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
151 152 153 154 155 156 157 158 159 160
    return false;
  }

  if (pStatis != NULL && pStatis->numOfNull == 0) {
    return false;
  }

  return true;
}

161
#if 0
L
Liu Jicong 已提交
162 163
static bool chkResultRowFromKey(STaskRuntimeEnv* pRuntimeEnv, SResultRowInfo* pResultRowInfo, char* pData,
                                int16_t bytes, bool masterscan, uint64_t uid) {
164 165 166
  bool existed = false;
  SET_RES_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid);

L
Liu Jicong 已提交
167 168
  SResultRow** p1 =
      (SResultRow**)taosHashGet(pRuntimeEnv->pResultRowHashTable, pRuntimeEnv->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
169 170 171 172 173 174 175 176 177 178 179

  // in case of repeat scan/reverse scan, no new time window added.
  if (QUERY_IS_INTERVAL_QUERY(pRuntimeEnv->pQueryAttr)) {
    if (!masterscan) {  // the *p1 may be NULL in case of sliding+offset exists.
      return p1 != NULL;
    }

    if (p1 != NULL) {
      if (pResultRowInfo->size == 0) {
        existed = false;
      } else if (pResultRowInfo->size == 1) {
dengyihao's avatar
dengyihao 已提交
180
        //        existed = (pResultRowInfo->pResult[0] == (*p1));
181 182
      } else {  // check if current pResultRowInfo contains the existed pResultRow
        SET_RES_EXT_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid, pResultRowInfo);
L
Liu Jicong 已提交
183 184
        int64_t* index =
            taosHashGet(pRuntimeEnv->pResultRowListSet, pRuntimeEnv->keyBuf, GET_RES_EXT_WINDOW_KEY_LEN(bytes));
185 186 187 188 189 190 191 192 193 194 195 196 197
        if (index != NULL) {
          existed = true;
        } else {
          existed = false;
        }
      }
    }

    return existed;
  }

  return p1 != NULL;
}
198
#endif
199

200
SResultRow* getNewResultRow(SDiskbasedBuf* pResultBuf, int64_t tableGroupId, int32_t interBufSize) {
L
Liu Jicong 已提交
201
  SFilePage* pData = NULL;
202 203 204 205 206 207 208 209 210 211 212 213 214

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tableGroupId);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
    pData->num = sizeof(SFilePage);
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

wmmhello's avatar
wmmhello 已提交
215
    if (pData->num + interBufSize > getBufPageSize(pResultBuf)) {
216 217 218 219 220 221 222 223 224 225 226 227 228 229
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return NULL;
  }

230 231
  setBufPageDirty(pData, true);

232 233 234 235 236
  // set the number of rows in current disk page
  SResultRow* pResultRow = (SResultRow*)((char*)pData + pData->num);
  pResultRow->pageId = pageId;
  pResultRow->offset = (int32_t)pData->num;

wmmhello's avatar
wmmhello 已提交
237
  pData->num += interBufSize;
238 239 240 241

  return pResultRow;
}

242 243 244 245 246 247 248
/**
 * the struct of key in hash table
 * +----------+---------------+
 * | group id |   key data    |
 * | 8 bytes  | actual length |
 * +----------+---------------+
 */
249 250 251
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo, char* pData,
                                   int16_t bytes, bool masterscan, uint64_t groupId, SExecTaskInfo* pTaskInfo,
                                   bool isIntervalQuery, SAggSupporter* pSup) {
252
  SET_RES_WINDOW_KEY(pSup->keyBuf, pData, bytes, groupId);
H
Haojun Liao 已提交
253

dengyihao's avatar
dengyihao 已提交
254 255
  SResultRowPosition* p1 =
      (SResultRowPosition*)taosHashGet(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
H
Haojun Liao 已提交
256

257 258
  SResultRow* pResult = NULL;

H
Haojun Liao 已提交
259 260
  // in case of repeat scan/reverse scan, no new time window added.
  if (isIntervalQuery) {
261 262
    if (masterscan && p1 != NULL) {  // the *p1 may be NULL in case of sliding+offset exists.
      pResult = getResultRowByPos(pResultBuf, p1);
263
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
H
Haojun Liao 已提交
264 265
    }
  } else {
dengyihao's avatar
dengyihao 已提交
266 267
    // In case of group by column query, the required SResultRow object must be existInCurrentResusltRowInfo in the
    // pResultRowInfo object.
H
Haojun Liao 已提交
268
    if (p1 != NULL) {
269
      // todo
270
      pResult = getResultRowByPos(pResultBuf, p1);
271
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
H
Haojun Liao 已提交
272 273 274
    }
  }

L
Liu Jicong 已提交
275
  // 1. close current opened time window
276
  if (pResultRowInfo->cur.pageId != -1 && ((pResult == NULL) || (pResult->pageId != pResultRowInfo->cur.pageId))) {
277
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
278
    qDebug("page_1");
279
#endif
280
    SResultRowPosition pos = pResultRowInfo->cur;
X
Xiaoyu Wang 已提交
281
    SFilePage*         pPage = getBufPage(pResultBuf, pos.pageId);
282 283 284 285 286
    releaseBufPage(pResultBuf, pPage);
  }

  // allocate a new buffer page
  if (pResult == NULL) {
287
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
288
    qDebug("page_2");
289
#endif
H
Haojun Liao 已提交
290
    ASSERT(pSup->resultRowSize > 0);
291 292
    pResult = getNewResultRow(pResultBuf, groupId, pSup->resultRowSize);

293
    initResultRow(pResult);
H
Haojun Liao 已提交
294

295 296
    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = pResult->pageId, .offset = pResult->offset};
X
Xiaoyu Wang 已提交
297 298
    taosHashPut(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes), &pos,
                sizeof(SResultRowPosition));
H
Haojun Liao 已提交
299 300
  }

301 302 303
  // 2. set the new time window to be the new active time window
  pResultRowInfo->cur = (SResultRowPosition){.pageId = pResult->pageId, .offset = pResult->offset};

H
Haojun Liao 已提交
304
  // too many time window in query
305
  if (taosHashGetSize(pSup->pResultRowHashTable) > MAX_INTERVAL_TIME_WINDOW) {
H
Haojun Liao 已提交
306 307 308
    longjmp(pTaskInfo->env, TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW);
  }

H
Haojun Liao 已提交
309
  return pResult;
H
Haojun Liao 已提交
310 311
}

312
// a new buffer page for each table. Needs to opt this design
L
Liu Jicong 已提交
313
static int32_t addNewWindowResultBuf(SResultRow* pWindowRes, SDiskbasedBuf* pResultBuf, int32_t tid, uint32_t size) {
314 315 316 317
  if (pWindowRes->pageId != -1) {
    return 0;
  }

L
Liu Jicong 已提交
318
  SFilePage* pData = NULL;
319 320 321 322 323 324

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tid);

  if (taosArrayGetSize(list) == 0) {
H
Haojun Liao 已提交
325
    pData = getNewBufPage(pResultBuf, tid, &pageId);
326
    pData->num = sizeof(SFilePage);
327 328
  } else {
    SPageInfo* pi = getLastPageInfo(list);
329
    pData = getBufPage(pResultBuf, getPageId(pi));
330
    pageId = getPageId(pi);
331

332
    if (pData->num + size > getBufPageSize(pResultBuf)) {
333
      // release current page first, and prepare the next one
334
      releaseBufPageInfo(pResultBuf, pi);
335

H
Haojun Liao 已提交
336
      pData = getNewBufPage(pResultBuf, tid, &pageId);
337
      if (pData != NULL) {
338
        pData->num = sizeof(SFilePage);
339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358
      }
    }
  }

  if (pData == NULL) {
    return -1;
  }

  // set the number of rows in current disk page
  if (pWindowRes->pageId == -1) {  // not allocated yet, allocate new buffer
    pWindowRes->pageId = pageId;
    pWindowRes->offset = (int32_t)pData->num;

    pData->num += size;
    assert(pWindowRes->pageId >= 0);
  }

  return 0;
}

359
//  query_range_start, query_range_end, window_duration, window_start, window_end
360
void initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow) {
361 362 363
  pColData->info.type = TSDB_DATA_TYPE_TIMESTAMP;
  pColData->info.bytes = sizeof(int64_t);

364
  colInfoDataEnsureCapacity(pColData, 5);
365 366 367 368 369 370 371 372 373
  colDataAppendInt64(pColData, 0, &pQueryWindow->skey);
  colDataAppendInt64(pColData, 1, &pQueryWindow->ekey);

  int64_t interval = 0;
  colDataAppendInt64(pColData, 2, &interval);  // this value may be variable in case of 'n' and 'y'.
  colDataAppendInt64(pColData, 3, &pQueryWindow->skey);
  colDataAppendInt64(pColData, 4, &pQueryWindow->ekey);
}

X
Xiaoyu Wang 已提交
374 375 376
void doApplyFunctions(SExecTaskInfo* taskInfo, SqlFunctionCtx* pCtx, STimeWindow* pWin,
                      SColumnInfoData* pTimeWindowData, int32_t offset, int32_t forwardStep, TSKEY* tsCol,
                      int32_t numOfTotal, int32_t numOfOutput, int32_t order) {
377
  for (int32_t k = 0; k < numOfOutput; ++k) {
H
Haojun Liao 已提交
378
    // keep it temporarily
379
    // todo no need this??
dengyihao's avatar
dengyihao 已提交
380 381
    bool    hasAgg = pCtx[k].input.colDataAggIsSet;
    int32_t numOfRows = pCtx[k].input.numOfRows;
H
Haojun Liao 已提交
382
    int32_t startOffset = pCtx[k].input.startRowIndex;
383

384
    pCtx[k].input.startRowIndex = offset;
385
    pCtx[k].input.numOfRows = forwardStep;
386 387 388

    // not a whole block involved in query processing, statistics data can not be used
    // NOTE: the original value of isSet have been changed here
389 390
    if (pCtx[k].input.colDataAggIsSet && forwardStep < numOfTotal) {
      pCtx[k].input.colDataAggIsSet = false;
391 392
    }

393 394
    if (fmIsWindowPseudoColumnFunc(pCtx[k].functionId)) {
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(&pCtx[k]);
395 396

      char* p = GET_ROWCELL_INTERBUF(pEntryInfo);
397

398
      SColumnInfoData idata = {0};
dengyihao's avatar
dengyihao 已提交
399
      idata.info.type = TSDB_DATA_TYPE_BIGINT;
400
      idata.info.bytes = tDataTypes[TSDB_DATA_TYPE_BIGINT].bytes;
dengyihao's avatar
dengyihao 已提交
401
      idata.pData = p;
402 403 404 405

      SScalarParam out = {.columnData = &idata};
      SScalarParam tw = {.numOfRows = 5, .columnData = pTimeWindowData};
      pCtx[k].sfp.process(&tw, 1, &out);
406
      pEntryInfo->numOfRes = 1;
407 408 409 410 411 412 413 414 415 416
    } else {
      int32_t code = TSDB_CODE_SUCCESS;
      if (functionNeedToExecute(&pCtx[k]) && pCtx[k].fpSet.process != NULL) {
        code = pCtx[k].fpSet.process(&pCtx[k]);

        if (code != TSDB_CODE_SUCCESS) {
          qError("%s apply functions error, code: %s", GET_TASKID(taskInfo), tstrerror(code));
          taskInfo->code = code;
          longjmp(taskInfo->env, code);
        }
417
      }
418

419 420 421 422 423
      // restore it
      pCtx[k].input.colDataAggIsSet = hasAgg;
      pCtx[k].input.startRowIndex = startOffset;
      pCtx[k].input.numOfRows = numOfRows;
    }
424 425 426
  }
}

dengyihao's avatar
dengyihao 已提交
427
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
428
                                   int32_t scanFlag, bool createDummyCol);
429

dengyihao's avatar
dengyihao 已提交
430 431
static void doSetInputDataBlockInfo(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock,
                                    int32_t order) {
432
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
433
    pCtx[i].order = order;
434
    pCtx[i].input.numOfRows = pBlock->info.rows;
435
    setBlockStatisInfo(&pCtx[i], &pOperator->exprSupp.pExprInfo[i], pBlock);
436 437 438
  }
}

X
Xiaoyu Wang 已提交
439 440
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                       int32_t scanFlag, bool createDummyCol) {
441
  if (pBlock->pBlockAgg != NULL) {
H
Haojun Liao 已提交
442
    doSetInputDataBlockInfo(pOperator, pCtx, pBlock, order);
443
  } else {
444
    doSetInputDataBlock(pOperator, pCtx, pBlock, order, scanFlag, createDummyCol);
H
Haojun Liao 已提交
445
  }
446 447
}

L
Liu Jicong 已提交
448 449
static int32_t doCreateConstantValColumnInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t paramIndex,
                                             int32_t numOfRows) {
450 451 452 453 454 455 456 457
  SColumnInfoData* pColInfo = NULL;
  if (pInput->pData[paramIndex] == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
458 459
    pColInfo->info.type = pFuncParam->param.nType;
    pColInfo->info.bytes = pFuncParam->param.nLen;
460 461

    pInput->pData[paramIndex] = pColInfo;
462 463
  } else {
    pColInfo = pInput->pData[paramIndex];
464 465
  }

466
  colInfoDataEnsureCapacity(pColInfo, numOfRows);
467

468
  int8_t type = pFuncParam->param.nType;
469 470
  if (type == TSDB_DATA_TYPE_BIGINT || type == TSDB_DATA_TYPE_UBIGINT) {
    int64_t v = pFuncParam->param.i;
dengyihao's avatar
dengyihao 已提交
471
    for (int32_t i = 0; i < numOfRows; ++i) {
472 473 474 475
      colDataAppendInt64(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
dengyihao's avatar
dengyihao 已提交
476
    for (int32_t i = 0; i < numOfRows; ++i) {
477 478
      colDataAppendDouble(pColInfo, i, &v);
    }
479
  } else if (type == TSDB_DATA_TYPE_VARCHAR) {
L
Liu Jicong 已提交
480
    char* tmp = taosMemoryMalloc(pFuncParam->param.nLen + VARSTR_HEADER_SIZE);
481
    STR_WITH_SIZE_TO_VARSTR(tmp, pFuncParam->param.pz, pFuncParam->param.nLen);
L
Liu Jicong 已提交
482
    for (int32_t i = 0; i < numOfRows; ++i) {
483 484
      colDataAppend(pColInfo, i, tmp, false);
    }
485 486 487 488 489
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
490
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
X
Xiaoyu Wang 已提交
491
                                   int32_t scanFlag, bool createDummyCol) {
492 493
  int32_t code = TSDB_CODE_SUCCESS;

494
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
L
Liu Jicong 已提交
495
    pCtx[i].order = order;
496 497
    pCtx[i].input.numOfRows = pBlock->info.rows;

L
Liu Jicong 已提交
498
    pCtx[i].pSrcBlock = pBlock;
X
Xiaoyu Wang 已提交
499
    pCtx[i].scanFlag = scanFlag;
H
Haojun Liao 已提交
500

501
    SInputColumnInfoData* pInput = &pCtx[i].input;
502
    pInput->uid = pBlock->info.uid;
C
Cary Xu 已提交
503
    pInput->colDataAggIsSet = false;
504

505
    SExprInfo* pOneExpr = &pOperator->exprSupp.pExprInfo[i];
506
    for (int32_t j = 0; j < pOneExpr->base.numOfParams; ++j) {
dengyihao's avatar
dengyihao 已提交
507
      SFunctParam* pFuncParam = &pOneExpr->base.pParam[j];
G
Ganlin Zhao 已提交
508 509
      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
dengyihao's avatar
dengyihao 已提交
510
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
511 512 513
        pInput->totalRows = pBlock->info.rows;
        pInput->numOfRows = pBlock->info.rows;
        pInput->startRowIndex = 0;
514

515
        // NOTE: the last parameter is the primary timestamp column
516 517 518
        if (fmIsTimelineFunc(pCtx[i].functionId) && (j == pOneExpr->base.numOfParams - 1)) {
          pInput->pPTS = pInput->pData[j];
        }
519 520
        ASSERT(pInput->pData[j] != NULL);
      } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
521 522 523
        // todo avoid case: top(k, 12), 12 is the value parameter.
        // sum(11), 11 is also the value parameter.
        if (createDummyCol && pOneExpr->base.numOfParams == 1) {
524 525 526 527
          pInput->totalRows = pBlock->info.rows;
          pInput->numOfRows = pBlock->info.rows;
          pInput->startRowIndex = 0;

528
          code = doCreateConstantValColumnInfo(pInput, pFuncParam, j, pBlock->info.rows);
529 530 531
          if (code != TSDB_CODE_SUCCESS) {
            return code;
          }
532
        }
G
Ganlin Zhao 已提交
533 534
      }
    }
H
Haojun Liao 已提交
535
  }
536 537

  return code;
H
Haojun Liao 已提交
538 539
}

540
static int32_t doAggregateImpl(SOperatorInfo* pOperator, TSKEY startTs, SqlFunctionCtx* pCtx) {
541
  for (int32_t k = 0; k < pOperator->exprSupp.numOfExprs; ++k) {
H
Haojun Liao 已提交
542
    if (functionNeedToExecute(&pCtx[k])) {
543
      // todo add a dummy funtion to avoid process check
544 545 546
      if (pCtx[k].fpSet.process == NULL) {
        continue;
      }
547
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
548
      qDebug("page_process");
549
#endif
550 551 552 553
      int32_t code = pCtx[k].fpSet.process(&pCtx[k]);
      if (code != TSDB_CODE_SUCCESS) {
        qError("%s aggregate function error happens, code: %s", GET_TASKID(pOperator->pTaskInfo), tstrerror(code));
        return code;
554
      }
555 556
    }
  }
557 558

  return TSDB_CODE_SUCCESS;
559 560
}

H
Haojun Liao 已提交
561
static void setPseudoOutputColInfo(SSDataBlock* pResult, SqlFunctionCtx* pCtx, SArray* pPseudoList) {
dengyihao's avatar
dengyihao 已提交
562
  size_t num = (pPseudoList != NULL) ? taosArrayGetSize(pPseudoList) : 0;
H
Haojun Liao 已提交
563 564 565 566 567
  for (int32_t i = 0; i < num; ++i) {
    pCtx[i].pOutput = taosArrayGet(pResult->pDataBlock, i);
  }
}

568
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
X
Xiaoyu Wang 已提交
569
                              int32_t numOfOutput, SArray* pPseudoList) {
H
Haojun Liao 已提交
570
  setPseudoOutputColInfo(pResult, pCtx, pPseudoList);
H
Haojun Liao 已提交
571
  pResult->info.groupId = pSrcBlock->info.groupId;
H
Haojun Liao 已提交
572

dengyihao's avatar
dengyihao 已提交
573 574
  // if the source equals to the destination, it is to create a new column as the result of scalar function or some
  // operators.
575 576
  bool createNewColModel = (pResult == pSrcBlock);

577 578
  int32_t numOfRows = 0;

579
  for (int32_t k = 0; k < numOfOutput; ++k) {
dengyihao's avatar
dengyihao 已提交
580
    int32_t         outputSlotId = pExpr[k].base.resSchema.slotId;
581 582
    SqlFunctionCtx* pfCtx = &pCtx[k];

L
Liu Jicong 已提交
583
    if (pExpr[k].pExpr->nodeType == QUERY_NODE_COLUMN) {  // it is a project query
584
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
585
      if (pResult->info.rows > 0 && !createNewColModel) {
X
Xiaoyu Wang 已提交
586 587
        colDataMergeCol(pColInfoData, pResult->info.rows, &pResult->info.capacity, pfCtx->input.pData[0],
                        pfCtx->input.numOfRows);
588
      } else {
589
        colDataAssign(pColInfoData, pfCtx->input.pData[0], pfCtx->input.numOfRows, &pResult->info);
590
      }
591

592
      numOfRows = pfCtx->input.numOfRows;
593
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE) {
594
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
595

dengyihao's avatar
dengyihao 已提交
596
      int32_t offset = createNewColModel ? 0 : pResult->info.rows;
597
      for (int32_t i = 0; i < pSrcBlock->info.rows; ++i) {
dengyihao's avatar
dengyihao 已提交
598 599 600
        colDataAppend(pColInfoData, i + offset,
                      taosVariantGet(&pExpr[k].base.pParam[0].param, pExpr[k].base.pParam[0].param.nType),
                      TSDB_DATA_TYPE_NULL == pExpr[k].base.pParam[0].param.nType);
601
      }
602 603

      numOfRows = pSrcBlock->info.rows;
H
Haojun Liao 已提交
604
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_OPERATOR) {
605 606 607
      SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
      taosArrayPush(pBlockList, &pSrcBlock);

608
      SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
609
      SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
610

611
      SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
612
      int32_t      code = scalarCalculate(pExpr[k].pExpr->_optrRoot.pRootNode, pBlockList, &dest);
613 614 615 616
      if (code != TSDB_CODE_SUCCESS) {
        taosArrayDestroy(pBlockList);
        return code;
      }
617

dengyihao's avatar
dengyihao 已提交
618
      int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
619
      ASSERT(pResult->info.capacity > 0);
620
      colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
621 622

      numOfRows = dest.numOfRows;
623 624
      taosArrayDestroy(pBlockList);
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_FUNCTION) {
625
      ASSERT(!fmIsAggFunc(pfCtx->functionId));
626

627 628
      // _rowts/_c0, not tbname column
      if (fmIsPseudoColumnFunc(pfCtx->functionId) && (!fmIsScanPseudoColumnFunc(pfCtx->functionId))) {
H
Haojun Liao 已提交
629
        // do nothing
630 631 632 633 634 635 636 637 638 639 640 641 642 643
      } else if (fmIsIndefiniteRowsFunc(pfCtx->functionId)) {
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(&pCtx[k]);
        pfCtx->fpSet.init(&pCtx[k], pResInfo);

        pfCtx->pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
        pfCtx->offset = createNewColModel ? 0 : pResult->info.rows;  // set the start offset

        // set the timestamp(_rowts) output buffer
        if (taosArrayGetSize(pPseudoList) > 0) {
          int32_t* outputColIndex = taosArrayGet(pPseudoList, 0);
          pfCtx->pTsOutput = (SColumnInfoData*)pCtx[*outputColIndex].pOutput;
        }

        numOfRows = pfCtx->fpSet.process(pfCtx);
H
Haojun Liao 已提交
644 645 646
      } else {
        SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
        taosArrayPush(pBlockList, &pSrcBlock);
G
Ganlin Zhao 已提交
647

648
        SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
649
        SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
H
Haojun Liao 已提交
650

651
        SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
652
        int32_t      code = scalarCalculate((SNode*)pExpr[k].pExpr->_function.pFunctNode, pBlockList, &dest);
653 654 655 656
        if (code != TSDB_CODE_SUCCESS) {
          taosArrayDestroy(pBlockList);
          return code;
        }
657

dengyihao's avatar
dengyihao 已提交
658
        int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
659
        ASSERT(pResult->info.capacity > 0);
660
        colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
661 662

        numOfRows = dest.numOfRows;
H
Haojun Liao 已提交
663 664
        taosArrayDestroy(pBlockList);
      }
665
    } else {
666
      ASSERT(0);
667 668
    }
  }
669

670 671 672
  if (!createNewColModel) {
    pResult->info.rows += numOfRows;
  }
673 674

  return TSDB_CODE_SUCCESS;
675 676
}

677 678 679
static void setResultRowKey(SResultRow* pResultRow, char* pData, int16_t type) {
  if (IS_VAR_DATA_TYPE(type)) {
    // todo disable this
680

681 682 683 684 685 686 687 688 689
    //    if (pResultRow->key == NULL) {
    //      pResultRow->key = taosMemoryMalloc(varDataTLen(pData));
    //      varDataCopy(pResultRow->key, pData);
    //    } else {
    //      ASSERT(memcmp(pResultRow->key, pData, varDataTLen(pData)) == 0);
    //    }
  } else {
    int64_t v = -1;
    GET_TYPED_DATA(v, int64_t, type, pData);
690

691 692
    pResultRow->win.skey = v;
    pResultRow->win.ekey = v;
693 694 695
  }
}

5
54liuyao 已提交
696
bool functionNeedToExecute(SqlFunctionCtx* pCtx) {
697
  struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);
698

699 700 701 702 703
  // in case of timestamp column, always generated results.
  int32_t functionId = pCtx->functionId;
  if (functionId == -1) {
    return false;
  }
704

705 706
  if (pCtx->scanFlag == REPEAT_SCAN) {
    return fmIsRepeatScanFunc(pCtx->functionId);
707 708
  }

709 710
  if (isRowEntryCompleted(pResInfo)) {
    return false;
711 712
  }

713 714 715
  return true;
}

716 717 718 719 720 721 722
static int32_t doCreateConstantValColumnAggInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t type,
                                                int32_t paramIndex, int32_t numOfRows) {
  if (pInput->pData[paramIndex] == NULL) {
    pInput->pData[paramIndex] = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pInput->pData[paramIndex] == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
723

724 725 726
    // Set the correct column info (data type and bytes)
    pInput->pData[paramIndex]->info.type = type;
    pInput->pData[paramIndex]->info.bytes = tDataTypes[type].bytes;
727
  }
H
Haojun Liao 已提交
728

729 730 731 732 733 734
  SColumnDataAgg* da = NULL;
  if (pInput->pColumnDataAgg[paramIndex] == NULL) {
    da = taosMemoryCalloc(1, sizeof(SColumnDataAgg));
    pInput->pColumnDataAgg[paramIndex] = da;
    if (da == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
735 736
    }
  } else {
737
    da = pInput->pColumnDataAgg[paramIndex];
738 739
  }

740
  ASSERT(!IS_VAR_DATA_TYPE(type));
741

742 743 744 745 746 747
  if (type == TSDB_DATA_TYPE_BIGINT) {
    int64_t v = pFuncParam->param.i;
    *da = (SColumnDataAgg){.numOfNull = 0, .min = v, .max = v, .maxIndex = 0, .minIndex = 0, .sum = v * numOfRows};
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
    *da = (SColumnDataAgg){.numOfNull = 0, .maxIndex = 0, .minIndex = 0};
748

749 750 751 752 753 754 755 756 757 758 759 760
    *(double*)&da->min = v;
    *(double*)&da->max = v;
    *(double*)&da->sum = v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_BOOL) {  // todo validate this data type
    bool v = pFuncParam->param.i;

    *da = (SColumnDataAgg){.numOfNull = 0, .maxIndex = 0, .minIndex = 0};
    *(bool*)&da->min = 0;
    *(bool*)&da->max = v;
    *(bool*)&da->sum = v * numOfRows;
  } else if (type == TSDB_DATA_TYPE_TIMESTAMP) {
    // do nothing
761
  } else {
762
    ASSERT(0);
763 764
  }

765 766
  return TSDB_CODE_SUCCESS;
}
767 768 769 770 771 772 773 774 775 776 777

void setBlockStatisInfo(SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, SSDataBlock* pBlock) {
  int32_t numOfRows = pBlock->info.rows;

  SInputColumnInfoData* pInput = &pCtx->input;
  pInput->numOfRows = numOfRows;
  pInput->totalRows = numOfRows;

  if (pBlock->pBlockAgg != NULL) {
    pInput->colDataAggIsSet = true;

778 779
    for (int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pExprInfo->base.pParam[j];
780

781 782
      if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
        int32_t slotId = pFuncParam->pCol->slotId;
783 784 785 786
        pInput->pColumnDataAgg[j] = pBlock->pBlockAgg[slotId];
        if (pInput->pColumnDataAgg[j] == NULL) {
          pInput->colDataAggIsSet = false;
        }
787 788 789 790

        // Here we set the column info data since the data type for each column data is required, but
        // the data in the corresponding SColumnInfoData will not be used.
        pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
791 792
      } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
        doCreateConstantValColumnAggInfo(pInput, pFuncParam, pFuncParam->param.nType, j, pBlock->info.rows);
793 794
      }
    }
795
  } else {
796
    pInput->colDataAggIsSet = false;
797 798 799
  }

  // set the statistics data for primary time stamp column
800 801 802 803 804
  //  if (pCtx->functionId == FUNCTION_SPREAD && pColumn->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
  //    pCtx->isAggSet = true;
  //    pCtx->agg.min = pBlock->info.window.skey;
  //    pCtx->agg.max = pBlock->info.window.ekey;
  //  }
805 806
}

L
Liu Jicong 已提交
807
bool isTaskKilled(SExecTaskInfo* pTaskInfo) {
808 809
  // query has been executed more than tsShellActivityTimer, and the retrieve has not arrived
  // abort current query execution.
L
Liu Jicong 已提交
810 811
  if (pTaskInfo->owner != 0 &&
      ((taosGetTimestampSec() - pTaskInfo->cost.start / 1000) > 10 * getMaximumIdleDurationSec())
812 813
      /*(!needBuildResAfterQueryComplete(pTaskInfo))*/) {
    assert(pTaskInfo->cost.start != 0);
L
Liu Jicong 已提交
814 815 816
    //    qDebug("QInfo:%" PRIu64 " retrieve not arrive beyond %d ms, abort current query execution, start:%" PRId64
    //           ", current:%d", pQInfo->qId, 1, pQInfo->startExecTs, taosGetTimestampSec());
    //    return true;
817 818 819 820 821
  }

  return false;
}

L
Liu Jicong 已提交
822
void setTaskKilled(SExecTaskInfo* pTaskInfo) { pTaskInfo->code = TSDB_CODE_TSC_QUERY_CANCELLED; }
823 824

/////////////////////////////////////////////////////////////////////////////////////////////
L
Liu Jicong 已提交
825
// todo refactor : return window
826
void getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key, STimeWindow* win) {
H
Haojun Liao 已提交
827
  win->skey = taosTimeTruncate(key, pInterval, precision);
828 829

  /*
H
Haojun Liao 已提交
830
   * if the realSkey > INT64_MAX - pInterval->interval, the query duration between
831 832
   * realSkey and realEkey must be less than one interval.Therefore, no need to adjust the query ranges.
   */
833 834
  win->ekey = taosTimeAdd(win->skey, pInterval->interval, pInterval->intervalUnit, precision) - 1;
  if (win->ekey < win->skey) {
835 836 837 838
    win->ekey = INT64_MAX;
  }
}

839
#if 0
L
Liu Jicong 已提交
840
static int32_t updateBlockLoadStatus(STaskAttr* pQuery, int32_t status) {
841

842 843 844
  bool hasFirstLastFunc = false;
  bool hasOtherFunc = false;

845
  if (status == BLK_DATA_DATA_LOAD || status == BLK_DATA_FILTEROUT) {
846 847 848 849 850
    return status;
  }

  for (int32_t i = 0; i < pQuery->numOfOutput; ++i) {
    int32_t functionId = getExprFunctionId(&pQuery->pExpr1[i]);
851

852 853 854 855 856 857 858 859 860 861
    if (functionId == FUNCTION_TS || functionId == FUNCTION_TS_DUMMY || functionId == FUNCTION_TAG ||
        functionId == FUNCTION_TAG_DUMMY) {
      continue;
    }

    if (functionId == FUNCTION_FIRST_DST || functionId == FUNCTION_LAST_DST) {
      hasFirstLastFunc = true;
    } else {
      hasOtherFunc = true;
    }
862

863 864
  }

865
  if (hasFirstLastFunc && status == BLK_DATA_NOT_LOAD) {
L
Liu Jicong 已提交
866
    if (!hasOtherFunc) {
867
      return BLK_DATA_FILTEROUT;
868
    } else {
869
      return BLK_DATA_DATA_LOAD;
870 871 872 873 874 875
    }
  }

  return status;
}

876 877
#endif

L
Liu Jicong 已提交
878 879
// static void updateDataCheckOrder(SQInfo *pQInfo, SQueryTableReq* pQueryMsg, bool stableQuery) {
//   STaskAttr* pQueryAttr = pQInfo->runtimeEnv.pQueryAttr;
H
Haojun Liao 已提交
880
//
L
Liu Jicong 已提交
881 882 883 884
//   // in case of point-interpolation query, use asc order scan
//   char msg[] = "QInfo:0x%"PRIx64" scan order changed for %s query, old:%d, new:%d, qrange exchanged, old qrange:%"
//   PRId64
//                "-%" PRId64 ", new qrange:%" PRId64 "-%" PRId64;
H
Haojun Liao 已提交
885
//
L
Liu Jicong 已提交
886 887 888 889 890
//   // todo handle the case the the order irrelevant query type mixed up with order critical query type
//   // descending order query for last_row query
//   if (isFirstLastRowQuery(pQueryAttr)) {
//     //qDebug("QInfo:0x%"PRIx64" scan order changed for last_row query, old:%d, new:%d", pQInfo->qId,
//     pQueryAttr->order.order, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
891
//
L
Liu Jicong 已提交
892 893
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
894
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
895
//     }
H
Haojun Liao 已提交
896
//
L
Liu Jicong 已提交
897 898 899
//     pQueryAttr->needReverseScan = false;
//     return;
//   }
H
Haojun Liao 已提交
900
//
L
Liu Jicong 已提交
901 902 903
//   if (pQueryAttr->groupbyColumn && pQueryAttr->order.order == TSDB_ORDER_DESC) {
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
904
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
905
//     }
H
Haojun Liao 已提交
906
//
L
Liu Jicong 已提交
907 908 909 910
//     pQueryAttr->needReverseScan = false;
//     doUpdateLastKey(pQueryAttr);
//     return;
//   }
H
Haojun Liao 已提交
911
//
L
Liu Jicong 已提交
912 913 914 915 916 917
//   if (pQueryAttr->pointInterpQuery && pQueryAttr->interval.interval == 0) {
//     if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       //qDebug(msg, pQInfo->qId, "interp", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey); TSWAP(pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, TSKEY);
//     }
H
Haojun Liao 已提交
918
//
L
Liu Jicong 已提交
919 920 921
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     return;
//   }
H
Haojun Liao 已提交
922
//
L
Liu Jicong 已提交
923 924 925 926
//   if (pQueryAttr->interval.interval == 0) {
//     if (onlyFirstQuery(pQueryAttr)) {
//       if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//         //qDebug(msg, pQInfo->qId, "only-first", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
H
Haojun Liao 已提交
927 928
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
929
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
930 931 932 933 934 935 936 937 938 939
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_ASC;
//      pQueryAttr->needReverseScan = false;
//    } else if (onlyLastQuery(pQueryAttr) && notContainSessionOrStateWindow(pQueryAttr)) {
//      if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//        //qDebug(msg, pQInfo->qId, "only-last", pQueryAttr->order.order, TSDB_ORDER_DESC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
940
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
941 942 943 944 945 946 947 948 949 950 951 952
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_DESC;
//      pQueryAttr->needReverseScan = false;
//    }
//
//  } else {  // interval query
//    if (stableQuery) {
//      if (onlyFirstQuery(pQueryAttr)) {
//        if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-first stable", pQueryAttr->order.order, TSDB_ORDER_ASC,
L
Liu Jicong 已提交
953 954
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
955
//
wafwerar's avatar
wafwerar 已提交
956
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
957 958 959 960 961 962 963 964
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_ASC;
//        pQueryAttr->needReverseScan = false;
//      } else if (onlyLastQuery(pQueryAttr)) {
//        if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-last stable", pQueryAttr->order.order, TSDB_ORDER_DESC,
L
Liu Jicong 已提交
965 966
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
967
//
wafwerar's avatar
wafwerar 已提交
968
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
969 970 971 972 973 974 975 976 977
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_DESC;
//        pQueryAttr->needReverseScan = false;
//      }
//    }
//  }
//}
978

L
Liu Jicong 已提交
979 980 981
// static FORCE_INLINE bool doFilterByBlockStatistics(STaskRuntimeEnv* pRuntimeEnv, SDataStatis *pDataStatis,
// SqlFunctionCtx *pCtx, int32_t numOfRows) {
//   STaskAttr* pQueryAttr = pRuntimeEnv->pQueryAttr;
982
//
L
Liu Jicong 已提交
983 984 985
//   if (pDataStatis == NULL || pQueryAttr->pFilters == NULL) {
//     return true;
//   }
986
//
L
Liu Jicong 已提交
987 988
//   return filterRangeExecute(pQueryAttr->pFilters, pDataStatis, pQueryAttr->numOfCols, numOfRows);
// }
989
#if 0
H
Haojun Liao 已提交
990
static bool overlapWithTimeWindow(STaskAttr* pQueryAttr, SDataBlockInfo* pBlockInfo) {
991 992
  STimeWindow w = {0};

dengyihao's avatar
dengyihao 已提交
993 994
  TSKEY sk = TMIN(pQueryAttr->window.skey, pQueryAttr->window.ekey);
  TSKEY ek = TMAX(pQueryAttr->window.skey, pQueryAttr->window.ekey);
995

996
  if (true) {
L
Liu Jicong 已提交
997
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.skey, sk, ek, &w);
998 999 1000 1001 1002 1003
    assert(w.ekey >= pBlockInfo->window.skey);

    if (w.ekey < pBlockInfo->window.ekey) {
      return true;
    }

L
Liu Jicong 已提交
1004 1005
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1006 1007 1008 1009 1010 1011 1012 1013 1014 1015
      if (w.skey > pBlockInfo->window.ekey) {
        break;
      }

      assert(w.ekey > pBlockInfo->window.ekey);
      if (w.skey <= pBlockInfo->window.ekey && w.skey > pBlockInfo->window.skey) {
        return true;
      }
    }
  } else {
L
Liu Jicong 已提交
1016
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.ekey, sk, ek, &w);
1017 1018 1019 1020 1021 1022
    assert(w.skey <= pBlockInfo->window.ekey);

    if (w.skey > pBlockInfo->window.skey) {
      return true;
    }

L
Liu Jicong 已提交
1023 1024
    while (1) {
      //      getNextTimeWindow(pQueryAttr, &w);
1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037
      if (w.ekey < pBlockInfo->window.skey) {
        break;
      }

      assert(w.skey < pBlockInfo->window.skey);
      if (w.ekey < pBlockInfo->window.ekey && w.ekey >= pBlockInfo->window.skey) {
        return true;
      }
    }
  }

  return false;
}
1038
#endif
1039 1040

static uint32_t doFilterByBlockTimeWindow(STableScanInfo* pTableScanInfo, SSDataBlock* pBlock) {
H
Haojun Liao 已提交
1041
  SqlFunctionCtx* pCtx = pTableScanInfo->pCtx;
1042
  uint32_t        status = BLK_DATA_NOT_LOAD;
1043

L
Liu Jicong 已提交
1044
  int32_t numOfOutput = 0;  // pTableScanInfo->numOfOutput;
1045 1046
  for (int32_t i = 0; i < numOfOutput; ++i) {
    int32_t functionId = pCtx[i].functionId;
H
Haojun Liao 已提交
1047
    int32_t colId = pTableScanInfo->pExpr[i].base.pParam[0].pCol->colId;
1048 1049 1050

    // group by + first/last should not apply the first/last block filter
    if (functionId < 0) {
1051
      status |= BLK_DATA_DATA_LOAD;
1052 1053
      return status;
    } else {
L
Liu Jicong 已提交
1054
      //      status |= aAggs[functionId].dataReqFunc(&pTableScanInfo->pCtx[i], &pBlock->info.window, colId);
1055
      //      if ((status & BLK_DATA_DATA_LOAD) == BLK_DATA_DATA_LOAD) {
L
Liu Jicong 已提交
1056 1057
      //        return status;
      //      }
1058 1059 1060 1061 1062 1063
    }
  }

  return status;
}

L
Liu Jicong 已提交
1064 1065
int32_t loadDataBlockOnDemand(SExecTaskInfo* pTaskInfo, STableScanInfo* pTableScanInfo, SSDataBlock* pBlock,
                              uint32_t* status) {
1066
  *status = BLK_DATA_NOT_LOAD;
1067

H
Haojun Liao 已提交
1068
  pBlock->pDataBlock = NULL;
L
Liu Jicong 已提交
1069
  pBlock->pBlockAgg = NULL;
H
Haojun Liao 已提交
1070

L
Liu Jicong 已提交
1071 1072
  //  int64_t groupId = pRuntimeEnv->current->groupIndex;
  //  bool    ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1073

H
Haojun Liao 已提交
1074
  STaskCostInfo* pCost = &pTaskInfo->cost;
1075

1076 1077
//  pCost->totalBlocks += 1;
//  pCost->totalRows += pBlock->info.rows;
H
Haojun Liao 已提交
1078
#if 0
1079 1080 1081
  // Calculate all time windows that are overlapping or contain current data block.
  // If current data block is contained by all possible time window, do not load current data block.
  if (/*pQueryAttr->pFilters || */pQueryAttr->groupbyColumn || pQueryAttr->sw.gap > 0 ||
H
Haojun Liao 已提交
1082
      (QUERY_IS_INTERVAL_QUERY(pQueryAttr) && overlapWithTimeWindow(pTaskInfo, &pBlock->info))) {
1083
    (*status) = BLK_DATA_DATA_LOAD;
1084 1085 1086
  }

  // check if this data block is required to load
1087
  if ((*status) != BLK_DATA_DATA_LOAD) {
1088 1089 1090 1091 1092 1093 1094
    bool needFilter = true;

    // the pCtx[i] result is belonged to previous time window since the outputBuf has not been set yet,
    // the filter result may be incorrect. So in case of interval query, we need to set the correct time output buffer
    if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
      SResultRow* pResult = NULL;

H
Haojun Liao 已提交
1095
      bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
1096 1097 1098 1099 1100 1101
      TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

      STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
      if (pQueryAttr->pointInterpQuery) {
        needFilter = chkWindowOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1102
                                    pTableScanInfo->rowEntryInfoOffset);
1103 1104 1105
      } else {
        if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                    pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1106
                                    pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
1107 1108 1109 1110 1111
          longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
        }
      }
    } else if (pQueryAttr->stableQuery && (!pQueryAttr->tsCompQuery) && (!pQueryAttr->diffQuery)) { // stable aggregate, not interval aggregate or normal column aggregate
      doSetTableGroupOutputBuf(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pTableScanInfo->pCtx,
1112
                               pTableScanInfo->rowEntryInfoOffset, pTableScanInfo->numOfOutput,
1113 1114 1115 1116 1117 1118
                               pRuntimeEnv->current->groupIndex);
    }

    if (needFilter) {
      (*status) = doFilterByBlockTimeWindow(pTableScanInfo, pBlock);
    } else {
1119
      (*status) = BLK_DATA_DATA_LOAD;
1120 1121 1122 1123
    }
  }

  SDataBlockInfo* pBlockInfo = &pBlock->info;
H
Haojun Liao 已提交
1124
//  *status = updateBlockLoadStatus(pRuntimeEnv->pQueryAttr, *status);
1125

1126
  if ((*status) == BLK_DATA_NOT_LOAD || (*status) == BLK_DATA_FILTEROUT) {
1127 1128
    //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//           pBlockInfo->window.ekey, pBlockInfo->rows);
1129
    pCost->skipBlocks += 1;
1130
  } else if ((*status) == BLK_DATA_SMA_LOAD) {
1131 1132
    // this function never returns error?
    pCost->loadBlockStatis += 1;
1133
//    tsdbRetrieveDataBlockStatisInfo(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);
1134 1135

    if (pBlock->pBlockAgg == NULL) {  // data block statistics does not exist, load data block
1136
//      pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
1137 1138 1139
      pCost->totalCheckedRows += pBlock->info.rows;
    }
  } else {
1140
    assert((*status) == BLK_DATA_DATA_LOAD);
1141 1142 1143

    // load the data block statistics to perform further filter
    pCost->loadBlockStatis += 1;
1144
//    tsdbRetrieveDataBlockStatisInfo(pTableScanInfo->pTsdbReadHandle, &pBlock->pBlockAgg);
1145 1146 1147 1148 1149 1150

    if (pQueryAttr->topBotQuery && pBlock->pBlockAgg != NULL) {
      { // set previous window
        if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
          SResultRow* pResult = NULL;

H
Haojun Liao 已提交
1151
          bool  masterScan = IS_MAIN_SCAN(pRuntimeEnv);
1152 1153 1154 1155 1156
          TSKEY k = ascQuery? pBlock->info.window.skey : pBlock->info.window.ekey;

          STimeWindow win = getActiveTimeWindow(pTableScanInfo->pResultRowInfo, k, pQueryAttr);
          if (setResultOutputBufByKey(pRuntimeEnv, pTableScanInfo->pResultRowInfo, pBlock->info.uid, &win, masterScan, &pResult, groupId,
                                      pTableScanInfo->pCtx, pTableScanInfo->numOfOutput,
1157
                                      pTableScanInfo->rowEntryInfoOffset) != TSDB_CODE_SUCCESS) {
1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168
            longjmp(pRuntimeEnv->env, TSDB_CODE_QRY_OUT_OF_MEMORY);
          }
        }
      }
      bool load = false;
      for (int32_t i = 0; i < pQueryAttr->numOfOutput; ++i) {
        int32_t functionId = pTableScanInfo->pCtx[i].functionId;
        if (functionId == FUNCTION_TOP || functionId == FUNCTION_BOTTOM) {
//          load = topbot_datablock_filter(&pTableScanInfo->pCtx[i], (char*)&(pBlock->pBlockAgg[i].min),
//                                         (char*)&(pBlock->pBlockAgg[i].max));
          if (!load) { // current block has been discard due to filter applied
1169
            pCost->skipBlocks += 1;
1170 1171
            //qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId,
//                   pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
1172
            (*status) = BLK_DATA_FILTEROUT;
1173 1174 1175 1176 1177 1178 1179 1180
            return TSDB_CODE_SUCCESS;
          }
        }
      }
    }

    // current block has been discard due to filter applied
//    if (!doFilterByBlockStatistics(pRuntimeEnv, pBlock->pBlockAgg, pTableScanInfo->pCtx, pBlockInfo->rows)) {
1181
//      pCost->skipBlocks += 1;
1182 1183
//      qDebug("QInfo:0x%"PRIx64" data block discard, brange:%" PRId64 "-%" PRId64 ", rows:%d", pQInfo->qId, pBlockInfo->window.skey,
//             pBlockInfo->window.ekey, pBlockInfo->rows);
1184
//      (*status) = BLK_DATA_FILTEROUT;
1185 1186 1187 1188 1189
//      return TSDB_CODE_SUCCESS;
//    }

    pCost->totalCheckedRows += pBlockInfo->rows;
    pCost->loadBlocks += 1;
1190
//    pBlock->pDataBlock = tsdbRetrieveDataBlock(pTableScanInfo->pTsdbReadHandle, NULL);
1191 1192 1193 1194 1195
//    if (pBlock->pDataBlock == NULL) {
//      return terrno;
//    }

//    if (pQueryAttr->pFilters != NULL) {
1196
//      filterSetColFieldData(pQueryAttr->pFilters, taosArrayGetSize(pBlock->pDataBlock), pBlock->pDataBlock);
1197
//    }
1198

1199 1200 1201 1202
//    if (pQueryAttr->pFilters != NULL || pRuntimeEnv->pTsBuf != NULL) {
//      filterColRowsInDataBlock(pRuntimeEnv, pBlock, ascQuery);
//    }
  }
H
Haojun Liao 已提交
1203
#endif
1204 1205 1206
  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1207
static void updateTableQueryInfoForReverseScan(STableQueryInfo* pTableQueryInfo) {
1208 1209 1210 1211
  if (pTableQueryInfo == NULL) {
    return;
  }

wafwerar's avatar
wafwerar 已提交
1212
  //  TSWAP(pTableQueryInfo->win.skey, pTableQueryInfo->win.ekey);
L
Liu Jicong 已提交
1213
  //  pTableQueryInfo->lastKey = pTableQueryInfo->win.skey;
1214

L
Liu Jicong 已提交
1215 1216
  //  SWITCH_ORDER(pTableQueryInfo->cur.order);
  //  pTableQueryInfo->cur.vgroupIndex = -1;
1217 1218

  // set the index to be the end slot of result rows array
dengyihao's avatar
dengyihao 已提交
1219 1220 1221 1222 1223 1224
  //  SResultRowInfo* pResultRowInfo = &pTableQueryInfo->resInfo;
  //  if (pResultRowInfo->size > 0) {
  //    pResultRowInfo->curPos = pResultRowInfo->size - 1;
  //  } else {
  //    pResultRowInfo->curPos = -1;
  //  }
1225 1226
}

H
Haojun Liao 已提交
1227
void initResultRow(SResultRow* pResultRow) {
X
Xiaoyu Wang 已提交
1228
  //  pResultRow->pEntryInfo = (struct SResultRowEntryInfo*)((char*)pResultRow + sizeof(SResultRow));
1229 1230 1231 1232 1233
}

/*
 * The start of each column SResultRowEntryInfo is denote by RowCellInfoOffset.
 * Note that in case of top/bottom query, the whole multiple rows of result is treated as only one row of results.
H
Haojun Liao 已提交
1234 1235 1236
 * +------------+-----------------result column 1------------+------------------result column 2-----------+
 * | SResultRow | SResultRowEntryInfo | intermediate buffer1 | SResultRowEntryInfo | intermediate buffer 2|
 * +------------+--------------------------------------------+--------------------------------------------+
1237 1238
 *           offset[0]                                  offset[1]                                   offset[2]
 */
1239
// TODO refactor: some function move away
L
Liu Jicong 已提交
1240 1241 1242
void setFunctionResultOutput(SOperatorInfo* pOperator, SOptrBasicInfo* pInfo, SAggSupporter* pSup, int32_t stage,
                             int32_t numOfExprs) {
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
1243 1244
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;
H
Haojun Liao 已提交
1245

H
Haojun Liao 已提交
1246
  SResultRowInfo* pResultRowInfo = &pInfo->resultRowInfo;
1247
  initResultRowInfo(pResultRowInfo);
H
Haojun Liao 已提交
1248

L
Liu Jicong 已提交
1249 1250
  int64_t     tid = 0;
  int64_t     groupId = 0;
1251 1252
  SResultRow* pRow = doSetResultOutBufByKey(pSup->pResultBuf, pResultRowInfo, (char*)&tid, sizeof(tid), true, groupId,
                                            pTaskInfo, false, pSup);
H
Haojun Liao 已提交
1253

1254
  for (int32_t i = 0; i < numOfExprs; ++i) {
1255
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, i, rowEntryInfoOffset);
H
Haojun Liao 已提交
1256 1257
    cleanupResultRowEntry(pEntry);

L
Liu Jicong 已提交
1258
    pCtx[i].resultInfo = pEntry;
1259
    pCtx[i].scanFlag = stage;
H
Haojun Liao 已提交
1260 1261
  }

1262
  initCtxOutputBuffer(pCtx, numOfExprs);
H
Haojun Liao 已提交
1263 1264
}

H
Haojun Liao 已提交
1265
void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size) {
1266 1267
  for (int32_t j = 0; j < size; ++j) {
    struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(&pCtx[j]);
dengyihao's avatar
dengyihao 已提交
1268 1269
    if (isRowEntryInitialized(pResInfo) || fmIsPseudoColumnFunc(pCtx[j].functionId) || pCtx[j].functionId == -1 ||
        fmIsScalarFunc(pCtx[j].functionId)) {
1270 1271 1272
      continue;
    }

H
Haojun Liao 已提交
1273
    pCtx[j].fpSet.init(&pCtx[j], pCtx[j].resultInfo);
1274 1275 1276
  }
}

L
Liu Jicong 已提交
1277
void setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status) {
1278
  if (status == TASK_NOT_COMPLETED) {
H
Haojun Liao 已提交
1279
    pTaskInfo->status = status;
1280 1281
  } else {
    // QUERY_NOT_COMPLETED is not compatible with any other status, so clear its position first
1282
    CLEAR_QUERY_STATUS(pTaskInfo, TASK_NOT_COMPLETED);
H
Haojun Liao 已提交
1283
    pTaskInfo->status |= status;
1284 1285 1286
  }
}

L
Liu Jicong 已提交
1287
void destroyTableQueryInfoImpl(STableQueryInfo* pTableQueryInfo) {
1288 1289 1290 1291
  if (pTableQueryInfo == NULL) {
    return;
  }

L
Liu Jicong 已提交
1292
  //  taosVariantDestroy(&pTableQueryInfo->tag);
dengyihao's avatar
dengyihao 已提交
1293
  //  cleanupResultRowInfo(&pTableQueryInfo->resInfo);
1294 1295
}

1296
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowEntryInfoOffset) {
1297
  for (int32_t i = 0; i < numOfOutput; ++i) {
1298
    pCtx[i].resultInfo = getResultEntryInfo(pResult, i, rowEntryInfoOffset);
1299 1300 1301 1302 1303

    struct SResultRowEntryInfo* pResInfo = pCtx[i].resultInfo;
    if (isRowEntryCompleted(pResInfo) && isRowEntryInitialized(pResInfo)) {
      continue;
    }
1304 1305 1306 1307 1308

    if (fmIsWindowPseudoColumnFunc(pCtx[i].functionId)) {
      continue;
    }

1309 1310 1311 1312 1313 1314
    if (!pResInfo->initialized) {
      if (pCtx[i].functionId != -1) {
        pCtx[i].fpSet.init(&pCtx[i], pResInfo);
      } else {
        pResInfo->initialized = true;
      }
1315 1316 1317 1318
    }
  }
}

H
Haojun Liao 已提交
1319
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep);
1320

1321
void doFilter(const SNode* pFilterNode, SSDataBlock* pBlock) {
1322 1323 1324 1325 1326
  if (pFilterNode == NULL) {
    return;
  }

  SFilterInfo* filter = NULL;
H
Haojun Liao 已提交
1327

H
Haojun Liao 已提交
1328
  // todo move to the initialization function
H
Haojun Liao 已提交
1329
  int32_t code = filterInitFromNode((SNode*)pFilterNode, &filter, 0);
1330

1331
  size_t             numOfCols = taosArrayGetSize(pBlock->pDataBlock);
1332
  SFilterColumnParam param1 = {.numOfCols = numOfCols, .pDataBlock = pBlock->pDataBlock};
1333 1334 1335
  code = filterSetDataFromSlotId(filter, &param1);

  int8_t* rowRes = NULL;
1336

1337
  // todo the keep seems never to be True??
1338
  bool keep = filterExecute(filter, pBlock, &rowRes, NULL, param1.numOfCols);
D
dapan1121 已提交
1339
  filterFreeInfo(filter);
1340

H
Haojun Liao 已提交
1341
  extractQualifiedTupleByFilterResult(pBlock, rowRes, keep);
1342
  blockDataUpdateTsWindow(pBlock, 0);
1343 1344
}

H
Haojun Liao 已提交
1345
void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep) {
1346 1347 1348 1349 1350
  if (keep) {
    return;
  }

  if (rowRes != NULL) {
L
Liu Jicong 已提交
1351
    int32_t      totalRows = pBlock->info.rows;
1352
    SSDataBlock* px = createOneDataBlock(pBlock, true);
1353

1354 1355
    size_t numOfCols = taosArrayGetSize(pBlock->pDataBlock);
    for (int32_t i = 0; i < numOfCols; ++i) {
1356 1357
      SColumnInfoData* pSrc = taosArrayGet(px->pDataBlock, i);
      SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, i);
1358
      // it is a reserved column for scalar function, and no data in this column yet.
1359
      if (pDst->pData == NULL || pSrc->pData == NULL) {
1360 1361 1362
        continue;
      }

1363 1364
      colInfoDataCleanup(pDst, pBlock->info.rows);

1365
      int32_t numOfRows = 0;
1366
      for (int32_t j = 0; j < totalRows; ++j) {
D
dapan1121 已提交
1367 1368 1369
        if (rowRes[j] == 0) {
          continue;
        }
1370

D
dapan1121 已提交
1371
        if (colDataIsNull_s(pSrc, j)) {
1372
          colDataAppendNULL(pDst, numOfRows);
D
dapan1121 已提交
1373
        } else {
1374
          colDataAppend(pDst, numOfRows, colDataGetData(pSrc, j), false);
D
dapan1121 已提交
1375
        }
1376
        numOfRows += 1;
H
Haojun Liao 已提交
1377
      }
1378

1379 1380 1381 1382 1383
      if (pBlock->info.rows == totalRows) {
        pBlock->info.rows = numOfRows;
      } else {
        ASSERT(pBlock->info.rows == numOfRows);
      }
1384
    }
1385

dengyihao's avatar
dengyihao 已提交
1386
    blockDataDestroy(px);  // fix memory leak
1387 1388 1389
  } else {
    // do nothing
    pBlock->info.rows = 0;
1390 1391 1392
  }
}

L
Liu Jicong 已提交
1393 1394
void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, SAggOperatorInfo* pAggInfo, int32_t numOfOutput,
                              uint64_t groupId) {
1395
  // for simple group by query without interval, all the tables belong to one group result.
L
Liu Jicong 已提交
1396
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
1397
  SResultRowInfo* pResultRowInfo = &pAggInfo->binfo.resultRowInfo;
1398 1399
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;
1400

1401
  SResultRow* pResultRow = doSetResultOutBufByKey(pAggInfo->aggSup.pResultBuf, pResultRowInfo, (char*)&groupId,
L
Liu Jicong 已提交
1402
                                                  sizeof(groupId), true, groupId, pTaskInfo, false, &pAggInfo->aggSup);
L
Liu Jicong 已提交
1403
  assert(pResultRow != NULL);
1404 1405 1406 1407 1408 1409

  /*
   * not assign result buffer yet, add new result buffer
   * all group belong to one result set, and each group result has different group id so set the id to be one
   */
  if (pResultRow->pageId == -1) {
dengyihao's avatar
dengyihao 已提交
1410 1411
    int32_t ret =
        addNewWindowResultBuf(pResultRow, pAggInfo->aggSup.pResultBuf, groupId, pAggInfo->binfo.pRes->info.rowSize);
1412 1413 1414 1415 1416
    if (ret != TSDB_CODE_SUCCESS) {
      return;
    }
  }

1417
  setResultRowInitCtx(pResultRow, pCtx, numOfOutput, rowEntryInfoOffset);
1418 1419
}

1420
void setExecutionContext(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId, SAggOperatorInfo* pAggInfo) {
H
Haojun Liao 已提交
1421
  if (pAggInfo->groupId != INT32_MIN && pAggInfo->groupId == groupId) {
1422 1423
    return;
  }
1424
#ifdef BUF_PAGE_DEBUG
L
Liu Jicong 已提交
1425
  qDebug("page_setbuf, groupId:%" PRIu64, groupId);
1426
#endif
1427
  doSetTableGroupOutputBuf(pOperator, pAggInfo, numOfOutput, groupId);
1428 1429

  // record the current active group id
H
Haojun Liao 已提交
1430
  pAggInfo->groupId = groupId;
1431 1432
}

1433 1434
static void doUpdateNumOfRows(SResultRow* pRow, int32_t numOfExprs, const int32_t* rowCellOffset) {
  for (int32_t j = 0; j < numOfExprs; ++j) {
1435
    struct SResultRowEntryInfo* pResInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1436 1437 1438 1439 1440 1441 1442 1443 1444 1445
    if (!isRowEntryInitialized(pResInfo)) {
      continue;
    }

    if (pRow->numOfRows < pResInfo->numOfRes) {
      pRow->numOfRows = pResInfo->numOfRes;
    }
  }
}

1446
int32_t finalizeResultRowIntoResultDataBlock(SDiskbasedBuf* pBuf, SResultRowPosition* resultRowPosition,
S
shenglian zhou 已提交
1447 1448 1449
                                             SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, int32_t numOfExprs,
                                             const int32_t* rowCellOffset, SSDataBlock* pBlock,
                                             SExecTaskInfo* pTaskInfo) {
1450 1451 1452 1453 1454 1455 1456 1457 1458
  SFilePage*  page = getBufPage(pBuf, resultRowPosition->pageId);
  SResultRow* pRow = (SResultRow*)((char*)page + resultRowPosition->offset);

  doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
  if (pRow->numOfRows == 0) {
    releaseBufPage(pBuf, page);
    return 0;
  }

1459 1460 1461 1462 1463 1464 1465
  while (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
    int32_t code = blockDataEnsureCapacity(pBlock, pBlock->info.capacity * 1.25);
    if (TAOS_FAILED(code)) {
      releaseBufPage(pBuf, page);
      qError("%s ensure result data capacity failed, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
      longjmp(pTaskInfo->env, code);
    }
1466 1467 1468 1469 1470
  }

  for (int32_t j = 0; j < numOfExprs; ++j) {
    int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1471
    pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491
    if (pCtx[j].fpSet.finalize) {
      int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
      if (TAOS_FAILED(code)) {
        qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
        longjmp(pTaskInfo->env, code);
      }
    } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
      // do nothing, todo refactor
    } else {
      // expand the result into multiple rows. E.g., _wstartts, top(k, 20)
      // the _wstartts needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
      char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
      for (int32_t k = 0; k < pRow->numOfRows; ++k) {
        colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
      }
    }
  }

  releaseBufPage(pBuf, page);
1492
  pBlock->info.rows += pRow->numOfRows;
1493 1494 1495 1496

  return 0;
}

X
Xiaoyu Wang 已提交
1497 1498 1499
int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprInfo* pExprInfo, SDiskbasedBuf* pBuf,
                           SGroupResInfo* pGroupResInfo, const int32_t* rowCellOffset, SqlFunctionCtx* pCtx,
                           int32_t numOfExprs) {
1500
  int32_t numOfRows = getNumOfTotalRes(pGroupResInfo);
1501
  int32_t start = pGroupResInfo->index;
1502
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
1503
  qDebug("\npage_copytoblock rows:%d", numOfRows);
1504
#endif
1505
  for (int32_t i = start; i < numOfRows; i += 1) {
L
Liu Jicong 已提交
1506 1507
    SResKeyPos* pPos = taosArrayGetP(pGroupResInfo->pRows, i);
    SFilePage*  page = getBufPage(pBuf, pPos->pos.pageId);
1508
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
1509
    qDebug("page_copytoblock pos pageId:%d, offset:%d", pPos->pos.pageId, pPos->pos.offset);
1510
#endif
1511
    SResultRow* pRow = (SResultRow*)((char*)page + pPos->pos.offset);
1512 1513

    doUpdateNumOfRows(pRow, numOfExprs, rowCellOffset);
1514 1515
    if (pRow->numOfRows == 0) {
      pGroupResInfo->index += 1;
1516
      releaseBufPage(pBuf, page);
1517 1518 1519
      continue;
    }

1520 1521 1522 1523 1524
    if (pBlock->info.groupId == 0) {
      pBlock->info.groupId = pPos->groupId;
    } else {
      // current value belongs to different group, it can't be packed into one datablock
      if (pBlock->info.groupId != pPos->groupId) {
1525
        releaseBufPage(pBuf, page);
1526 1527 1528 1529
        break;
      }
    }

1530
    if (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
1531
      releaseBufPage(pBuf, page);
1532 1533 1534 1535 1536
      break;
    }

    pGroupResInfo->index += 1;

1537
    for (int32_t j = 0; j < numOfExprs; ++j) {
1538 1539
      int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1540
      pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1541
      if (pCtx[j].fpSet.finalize) {
1542
#ifdef BUF_PAGE_DEBUG
wmmhello's avatar
wmmhello 已提交
1543
        qDebug("\npage_finalize %d", numOfExprs);
1544
#endif
1545
        int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
1546
        if (TAOS_FAILED(code)) {
1547 1548
          qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
          longjmp(pTaskInfo->env, code);
1549
        }
1550 1551
      } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
        // do nothing, todo refactor
1552
      } else {
1553 1554
        // expand the result into multiple rows. E.g., _wstartts, top(k, 20)
        // the _wstartts needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
X
Xiaoyu Wang 已提交
1555 1556
        SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
        char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
1557
        if (pCtx[j].increase) {
L
Liu Jicong 已提交
1558
          int64_t ts = *(int64_t*)in;
1559
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
L
Liu Jicong 已提交
1560
            colDataAppend(pColInfoData, pBlock->info.rows + k, (const char*)&ts, pCtx[j].resultInfo->isNullRes);
1561 1562 1563 1564 1565 1566
            ts++;
          }
        } else {
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
          }
X
Xiaoyu Wang 已提交
1567
        }
1568
      }
1569 1570
    }

1571
    releaseBufPage(pBuf, page);
1572
    pBlock->info.rows += pRow->numOfRows;
L
Liu Jicong 已提交
1573 1574 1575
    //    if (pBlock->info.rows >= pBlock->info.capacity) {  // output buffer is full
    //      break;
    //    }
1576 1577
  }

X
Xiaoyu Wang 已提交
1578 1579
  qDebug("%s result generated, rows:%d, groupId:%" PRIu64, GET_TASKID(pTaskInfo), pBlock->info.rows,
         pBlock->info.groupId);
1580
  blockDataUpdateTsWindow(pBlock, 0);
1581 1582 1583
  return 0;
}

X
Xiaoyu Wang 已提交
1584 1585
void doBuildResultDatablock(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
                            SDiskbasedBuf* pBuf) {
1586 1587
  SExprInfo*     pExprInfo = pOperator->exprSupp.pExprInfo;
  int32_t        numOfExprs = pOperator->exprSupp.numOfExprs;
1588 1589
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

1590
  int32_t*        rowCellOffset = pOperator->exprSupp.rowEntryInfoOffset;
X
Xiaoyu Wang 已提交
1591
  SSDataBlock*    pBlock = pbInfo->pRes;
1592
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
1593

1594
  blockDataCleanup(pBlock);
1595
  if (!hasDataInGroupInfo(pGroupResInfo)) {
1596 1597 1598
    return;
  }

1599 1600
  // clear the existed group id
  pBlock->info.groupId = 0;
1601
  doCopyToSDataBlock(pTaskInfo, pBlock, pExprInfo, pBuf, pGroupResInfo, rowCellOffset, pCtx, numOfExprs);
1602 1603
}

L
Liu Jicong 已提交
1604
static void updateNumOfRowsInResultRows(SqlFunctionCtx* pCtx, int32_t numOfOutput, SResultRowInfo* pResultRowInfo,
1605
                                        int32_t* rowEntryInfoOffset) {
1606
  // update the number of result for each, only update the number of rows for the corresponding window result.
L
Liu Jicong 已提交
1607 1608 1609
  //  if (QUERY_IS_INTERVAL_QUERY(pQueryAttr)) {
  //    return;
  //  }
H
Haojun Liao 已提交
1610
#if 0
1611
  for (int32_t i = 0; i < pResultRowInfo->size; ++i) {
L
Liu Jicong 已提交
1612
    SResultRow* pResult = pResultRowInfo->pResult[i];
1613 1614 1615 1616 1617 1618 1619

    for (int32_t j = 0; j < numOfOutput; ++j) {
      int32_t functionId = pCtx[j].functionId;
      if (functionId == FUNCTION_TS || functionId == FUNCTION_TAG || functionId == FUNCTION_TAGPRJ) {
        continue;
      }

1620
      SResultRowEntryInfo* pCell = getResultEntryInfo(pResult, j, rowEntryInfoOffset);
1621
      pResult->numOfRows = (uint16_t)(TMAX(pResult->numOfRows, pCell->numOfRes));
1622 1623
    }
  }
H
Haojun Liao 已提交
1624
#endif
1625 1626
}

L
Liu Jicong 已提交
1627
static int32_t compressQueryColData(SColumnInfoData* pColRes, int32_t numOfRows, char* data, int8_t compressed) {
1628 1629
  int32_t colSize = pColRes->info.bytes * numOfRows;
  return (*(tDataTypes[pColRes->info.type].compFunc))(pColRes->pData, colSize, numOfRows, data,
L
Liu Jicong 已提交
1630
                                                      colSize + COMP_OVERFLOW_BYTES, compressed, NULL, 0);
1631 1632
}

1633 1634 1635
int32_t doFillTimeIntervalGapsInResults(struct SFillInfo* pFillInfo, SSDataBlock* pBlock, int32_t capacity) {
  int32_t numOfRows = (int32_t)taosFillResultDataBlock(pFillInfo, pBlock, capacity - pBlock->info.rows);
  pBlock->info.rows += numOfRows;
1636

1637
  return pBlock->info.rows;
1638 1639
}

L
Liu Jicong 已提交
1640 1641
void queryCostStatis(SExecTaskInfo* pTaskInfo) {
  STaskCostInfo* pSummary = &pTaskInfo->cost;
1642

L
Liu Jicong 已提交
1643 1644 1645
  //  uint64_t hashSize = taosHashGetMemSize(pQInfo->runtimeEnv.pResultRowHashTable);
  //  hashSize += taosHashGetMemSize(pRuntimeEnv->tableqinfoGroupInfo.map);
  //  pSummary->hashSize = hashSize;
1646 1647 1648 1649

  // add the merge time
  pSummary->elapsedTime += pSummary->firstStageMergeTime;

L
Liu Jicong 已提交
1650 1651 1652 1653 1654 1655 1656 1657 1658 1659 1660
  //  SResultRowPool* p = pTaskInfo->pool;
  //  if (p != NULL) {
  //    pSummary->winInfoSize = getResultRowPoolMemSize(p);
  //    pSummary->numOfTimeWindows = getNumOfAllocatedResultRows(p);
  //  } else {
  //    pSummary->winInfoSize = 0;
  //    pSummary->numOfTimeWindows = 0;
  //  }
  //
  //  calculateOperatorProfResults(pQInfo);

1661 1662
  SFileBlockLoadRecorder* pRecorder = pSummary->pRecoder;
  if (pSummary->pRecoder != NULL) {
X
Xiaoyu Wang 已提交
1663 1664
    qDebug("%s :cost summary: elapsed time:%" PRId64 " us, first merge:%" PRId64
           " us, total blocks:%d, "
1665 1666 1667 1668
           "load block statis:%d, load data block:%d, total rows:%" PRId64 ", check rows:%" PRId64,
           GET_TASKID(pTaskInfo), pSummary->elapsedTime, pSummary->firstStageMergeTime, pRecorder->totalBlocks,
           pRecorder->loadBlockStatis, pRecorder->loadBlocks, pRecorder->totalRows, pRecorder->totalCheckedRows);
  }
L
Liu Jicong 已提交
1669 1670 1671
  // qDebug("QInfo:0x%"PRIx64" :cost summary: winResPool size:%.2f Kb, numOfWin:%"PRId64", tableInfoSize:%.2f Kb,
  // hashTable:%.2f Kb", pQInfo->qId, pSummary->winInfoSize/1024.0,
  //      pSummary->numOfTimeWindows, pSummary->tableInfoSize/1024.0, pSummary->hashSize/1024.0);
1672 1673
}

L
Liu Jicong 已提交
1674 1675 1676
// static void updateOffsetVal(STaskRuntimeEnv *pRuntimeEnv, SDataBlockInfo *pBlockInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
1677
//
L
Liu Jicong 已提交
1678
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1679
//
L
Liu Jicong 已提交
1680 1681 1682 1683
//   if (pQueryAttr->limit.offset == pBlockInfo->rows) {  // current block will ignore completed
//     pTableQueryInfo->lastKey = QUERY_IS_ASC_QUERY(pQueryAttr) ? pBlockInfo->window.ekey + step :
//     pBlockInfo->window.skey + step; pQueryAttr->limit.offset = 0; return;
//   }
1684
//
L
Liu Jicong 已提交
1685 1686 1687 1688 1689
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     pQueryAttr->pos = (int32_t)pQueryAttr->limit.offset;
//   } else {
//     pQueryAttr->pos = pBlockInfo->rows - (int32_t)pQueryAttr->limit.offset - 1;
//   }
1690
//
L
Liu Jicong 已提交
1691
//   assert(pQueryAttr->pos >= 0 && pQueryAttr->pos <= pBlockInfo->rows - 1);
1692
//
L
Liu Jicong 已提交
1693 1694
//   SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//   SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1695
//
L
Liu Jicong 已提交
1696 1697
//   // update the pQueryAttr->limit.offset value, and pQueryAttr->pos value
//   TSKEY *keys = (TSKEY *) pColInfoData->pData;
1698
//
L
Liu Jicong 已提交
1699 1700 1701
//   // update the offset value
//   pTableQueryInfo->lastKey = keys[pQueryAttr->pos];
//   pQueryAttr->limit.offset = 0;
1702
//
L
Liu Jicong 已提交
1703
//   int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
1704
//
L
Liu Jicong 已提交
1705 1706 1707 1708
//   //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numBlocksOfStep:%d, numOfRes:%d,
//   lastKey:%"PRId64, GET_TASKID(pRuntimeEnv),
//          pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes, pQuery->current->lastKey);
// }
1709

L
Liu Jicong 已提交
1710 1711
// void skipBlocks(STaskRuntimeEnv *pRuntimeEnv) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
1712
//
L
Liu Jicong 已提交
1713 1714 1715
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0) {
//     return;
//   }
1716
//
L
Liu Jicong 已提交
1717 1718
//   pQueryAttr->pos = 0;
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1719
//
L
Liu Jicong 已提交
1720 1721
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
//   TsdbQueryHandleT pTsdbReadHandle = pRuntimeEnv->pTsdbReadHandle;
1722
//
L
Liu Jicong 已提交
1723 1724 1725 1726 1727
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pTsdbReadHandle)) {
//     if (isTaskKilled(pRuntimeEnv->qinfo)) {
//       longjmp(pRuntimeEnv->env, TSDB_CODE_TSC_QUERY_CANCELLED);
//     }
1728
//
L
Liu Jicong 已提交
1729
//     tsdbRetrieveDataBlockInfo(pTsdbReadHandle, &blockInfo);
1730
//
L
Liu Jicong 已提交
1731 1732 1733 1734
//     if (pQueryAttr->limit.offset > blockInfo.rows) {
//       pQueryAttr->limit.offset -= blockInfo.rows;
//       pTableQueryInfo->lastKey = (QUERY_IS_ASC_QUERY(pQueryAttr)) ? blockInfo.window.ekey : blockInfo.window.skey;
//       pTableQueryInfo->lastKey += step;
1735
//
L
Liu Jicong 已提交
1736 1737 1738 1739 1740 1741 1742
//       //qDebug("QInfo:0x%"PRIx64" skip rows:%d, offset:%" PRId64, GET_TASKID(pRuntimeEnv), blockInfo.rows,
//              pQuery->limit.offset);
//     } else {  // find the appropriated start position in current block
//       updateOffsetVal(pRuntimeEnv, &blockInfo);
//       break;
//     }
//   }
1743
//
L
Liu Jicong 已提交
1744 1745 1746 1747 1748 1749 1750 1751 1752
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
// }

// static TSKEY doSkipIntervalProcess(STaskRuntimeEnv* pRuntimeEnv, STimeWindow* win, SDataBlockInfo* pBlockInfo,
// STableQueryInfo* pTableQueryInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
1753
//
L
Liu Jicong 已提交
1754 1755 1756
//   assert(pQueryAttr->limit.offset == 0);
//   STimeWindow tw = *win;
//   getNextTimeWindow(pQueryAttr, &tw);
1757
//
L
Liu Jicong 已提交
1758 1759
//   if ((tw.skey <= pBlockInfo->window.ekey && QUERY_IS_ASC_QUERY(pQueryAttr)) ||
//       (tw.ekey >= pBlockInfo->window.skey && !QUERY_IS_ASC_QUERY(pQueryAttr))) {
1760
//
L
Liu Jicong 已提交
1761 1762 1763 1764
//     // load the data block and check data remaining in current data block
//     // TODO optimize performance
//     SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//     SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1765
//
L
Liu Jicong 已提交
1766 1767 1768 1769
//     tw = *win;
//     int32_t startPos =
//         getNextQualifiedWindow(pQueryAttr, &tw, pBlockInfo, pColInfoData->pData, binarySearchForKey, -1);
//     assert(startPos >= 0);
1770
//
L
Liu Jicong 已提交
1771 1772
//     // set the abort info
//     pQueryAttr->pos = startPos;
1773
//
L
Liu Jicong 已提交
1774 1775 1776 1777
//     // reset the query start timestamp
//     pTableQueryInfo->win.skey = ((TSKEY *)pColInfoData->pData)[startPos];
//     pQueryAttr->window.skey = pTableQueryInfo->win.skey;
//     TSKEY key = pTableQueryInfo->win.skey;
1778
//
L
Liu Jicong 已提交
1779 1780
//     pWindowResInfo->prevSKey = tw.skey;
//     int32_t index = pRuntimeEnv->resultRowInfo.curIndex;
1781
//
L
Liu Jicong 已提交
1782 1783
//     int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
//     pRuntimeEnv->resultRowInfo.curIndex = index;  // restore the window index
1784
//
L
Liu Jicong 已提交
1785 1786 1787 1788
//     //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numOfRows:%d, numOfRes:%d,
//     lastKey:%" PRId64,
//            GET_TASKID(pRuntimeEnv), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes,
//            pQueryAttr->current->lastKey);
1789
//
L
Liu Jicong 已提交
1790 1791 1792 1793 1794
//     return key;
//   } else {  // do nothing
//     pQueryAttr->window.skey      = tw.skey;
//     pWindowResInfo->prevSKey = tw.skey;
//     pTableQueryInfo->lastKey = tw.skey;
1795
//
L
Liu Jicong 已提交
1796 1797
//     return tw.skey;
//   }
1798
//
L
Liu Jicong 已提交
1799 1800 1801 1802 1803 1804 1805 1806 1807 1808
//   return true;
// }

// static bool skipTimeInterval(STaskRuntimeEnv *pRuntimeEnv, TSKEY* start) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     assert(*start <= pRuntimeEnv->current->lastKey);
//   } else {
//     assert(*start >= pRuntimeEnv->current->lastKey);
//   }
1809
//
L
Liu Jicong 已提交
1810 1811 1812 1813 1814
//   // if queried with value filter, do NOT forward query start position
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0 || pRuntimeEnv->pTsBuf != NULL ||
//   pRuntimeEnv->pFillInfo != NULL) {
//     return true;
//   }
1815
//
L
Liu Jicong 已提交
1816 1817 1818 1819 1820 1821 1822
//   /*
//    * 1. for interval without interpolation query we forward pQueryAttr->interval.interval at a time for
//    *    pQueryAttr->limit.offset times. Since hole exists, pQueryAttr->interval.interval*pQueryAttr->limit.offset
//    value is
//    *    not valid. otherwise, we only forward pQueryAttr->limit.offset number of points
//    */
//   assert(pRuntimeEnv->resultRowInfo.prevSKey == TSKEY_INITIAL_VAL);
1823
//
L
Liu Jicong 已提交
1824 1825
//   STimeWindow w = TSWINDOW_INITIALIZER;
//   bool ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1826
//
L
Liu Jicong 已提交
1827 1828
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
//   STableQueryInfo *pTableQueryInfo = pRuntimeEnv->current;
1829
//
L
Liu Jicong 已提交
1830 1831 1832
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pRuntimeEnv->pTsdbReadHandle)) {
//     tsdbRetrieveDataBlockInfo(pRuntimeEnv->pTsdbReadHandle, &blockInfo);
1833
//
L
Liu Jicong 已提交
1834 1835 1836 1837 1838 1839 1840 1841 1842
//     if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       if (pWindowResInfo->prevSKey == TSKEY_INITIAL_VAL) {
//         getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.skey, blockInfo.window.skey, pQueryAttr->window.ekey,
//         &w); pWindowResInfo->prevSKey = w.skey;
//       }
//     } else {
//       getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.ekey, pQueryAttr->window.ekey, blockInfo.window.ekey, &w);
//       pWindowResInfo->prevSKey = w.skey;
//     }
1843
//
L
Liu Jicong 已提交
1844 1845
//     // the first time window
//     STimeWindow win = getActiveTimeWindow(pWindowResInfo, pWindowResInfo->prevSKey, pQueryAttr);
1846
//
L
Liu Jicong 已提交
1847 1848
//     while (pQueryAttr->limit.offset > 0) {
//       STimeWindow tw = win;
1849
//
L
Liu Jicong 已提交
1850 1851 1852
//       if ((win.ekey <= blockInfo.window.ekey && ascQuery) || (win.ekey >= blockInfo.window.skey && !ascQuery)) {
//         pQueryAttr->limit.offset -= 1;
//         pWindowResInfo->prevSKey = win.skey;
1853
//
L
Liu Jicong 已提交
1854 1855 1856 1857 1858 1859
//         // current time window is aligned with blockInfo.window.ekey
//         // restart it from next data block by set prevSKey to be TSKEY_INITIAL_VAL;
//         if ((win.ekey == blockInfo.window.ekey && ascQuery) || (win.ekey == blockInfo.window.skey && !ascQuery)) {
//           pWindowResInfo->prevSKey = TSKEY_INITIAL_VAL;
//         }
//       }
1860
//
L
Liu Jicong 已提交
1861 1862 1863 1864
//       if (pQueryAttr->limit.offset == 0) {
//         *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//         return true;
//       }
1865
//
L
Liu Jicong 已提交
1866 1867
//       // current window does not ended in current data block, try next data block
//       getNextTimeWindow(pQueryAttr, &tw);
1868
//
L
Liu Jicong 已提交
1869 1870 1871 1872 1873 1874 1875 1876 1877
//       /*
//        * If the next time window still starts from current data block,
//        * load the primary timestamp column first, and then find the start position for the next queried time window.
//        * Note that only the primary timestamp column is required.
//        * TODO: Optimize for this cases. All data blocks are not needed to be loaded, only if the first actually
//        required
//        * time window resides in current data block.
//        */
//       if ((tw.skey <= blockInfo.window.ekey && ascQuery) || (tw.ekey >= blockInfo.window.skey && !ascQuery)) {
1878
//
L
Liu Jicong 已提交
1879 1880
//         SArray *pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//         SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1881
//
L
Liu Jicong 已提交
1882 1883 1884
//         if ((win.ekey > blockInfo.window.ekey && ascQuery) || (win.ekey < blockInfo.window.skey && !ascQuery)) {
//           pQueryAttr->limit.offset -= 1;
//         }
1885
//
L
Liu Jicong 已提交
1886 1887 1888 1889 1890 1891 1892 1893
//         if (pQueryAttr->limit.offset == 0) {
//           *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//           return true;
//         } else {
//           tw = win;
//           int32_t startPos =
//               getNextQualifiedWindow(pQueryAttr, &tw, &blockInfo, pColInfoData->pData, binarySearchForKey, -1);
//           assert(startPos >= 0);
1894
//
L
Liu Jicong 已提交
1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905
//           // set the abort info
//           pQueryAttr->pos = startPos;
//           pTableQueryInfo->lastKey = ((TSKEY *)pColInfoData->pData)[startPos];
//           pWindowResInfo->prevSKey = tw.skey;
//           win = tw;
//         }
//       } else {
//         break;  // offset is not 0, and next time window begins or ends in the next block.
//       }
//     }
//   }
1906
//
L
Liu Jicong 已提交
1907 1908 1909 1910
//   // check for error
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
1911
//
L
Liu Jicong 已提交
1912 1913
//   return true;
// }
1914

1915
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num) {
H
Haojun Liao 已提交
1916
  if (p->pDownstream == NULL) {
H
Haojun Liao 已提交
1917
    assert(p->numOfDownstream == 0);
1918 1919
  }

wafwerar's avatar
wafwerar 已提交
1920
  p->pDownstream = taosMemoryCalloc(1, num * POINTER_BYTES);
1921 1922 1923 1924 1925 1926 1927
  if (p->pDownstream == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  memcpy(p->pDownstream, pDownstream, num * POINTER_BYTES);
  p->numOfDownstream = num;
  return TSDB_CODE_SUCCESS;
1928 1929
}

wmmhello's avatar
wmmhello 已提交
1930
static void doDestroyTableList(STableListInfo* pTableqinfoList);
1931

1932
static void doTableQueryInfoTimeWindowCheck(SExecTaskInfo* pTaskInfo, STableQueryInfo* pTableQueryInfo, int32_t order) {
H
Haojun Liao 已提交
1933 1934
#if 0
    if (order == TSDB_ORDER_ASC) {
1935 1936
    assert(
        (pTableQueryInfo->win.skey <= pTableQueryInfo->win.ekey) &&
H
Haojun Liao 已提交
1937 1938
        (pTableQueryInfo->lastKey >= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey >= pTaskInfo->window.skey && pTableQueryInfo->win.ekey <= pTaskInfo->window.ekey));
1939 1940 1941
  } else {
    assert(
        (pTableQueryInfo->win.skey >= pTableQueryInfo->win.ekey) &&
H
Haojun Liao 已提交
1942 1943
        (pTableQueryInfo->lastKey <= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey <= pTaskInfo->window.skey && pTableQueryInfo->win.ekey >= pTaskInfo->window.ekey));
1944
  }
H
Haojun Liao 已提交
1945
#endif
1946 1947
}

1948 1949 1950 1951
typedef struct SFetchRspHandleWrapper {
  uint32_t exchangeId;
  int32_t  sourceIndex;
} SFetchRspHandleWrapper;
1952

D
dapan1121 已提交
1953
int32_t loadRemoteDataCallback(void* param, SDataBuf* pMsg, int32_t code) {
X
Xiaoyu Wang 已提交
1954
  SFetchRspHandleWrapper* pWrapper = (SFetchRspHandleWrapper*)param;
1955 1956 1957 1958 1959 1960 1961

  SExchangeInfo* pExchangeInfo = taosAcquireRef(exchangeObjRefPool, pWrapper->exchangeId);
  if (pExchangeInfo == NULL) {
    qWarn("failed to acquire exchange operator, since it may have been released");
    return TSDB_CODE_SUCCESS;
  }

X
Xiaoyu Wang 已提交
1962
  int32_t          index = pWrapper->sourceIndex;
1963
  SSourceDataInfo* pSourceDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, index);
1964

H
Haojun Liao 已提交
1965 1966
  if (code == TSDB_CODE_SUCCESS) {
    pSourceDataInfo->pRsp = pMsg->pData;
1967

H
Haojun Liao 已提交
1968 1969
    SRetrieveTableRsp* pRsp = pSourceDataInfo->pRsp;
    pRsp->numOfRows = htonl(pRsp->numOfRows);
dengyihao's avatar
dengyihao 已提交
1970
    pRsp->compLen = htonl(pRsp->compLen);
1971
    pRsp->numOfCols = htonl(pRsp->numOfCols);
dengyihao's avatar
dengyihao 已提交
1972
    pRsp->useconds = htobe64(pRsp->useconds);
1973

1974
    ASSERT(pRsp != NULL);
1975
    qDebug("%s fetch rsp received, index:%d, rows:%d", pSourceDataInfo->taskId, index, pRsp->numOfRows);
H
Haojun Liao 已提交
1976 1977 1978
  } else {
    pSourceDataInfo->code = code;
  }
H
Haojun Liao 已提交
1979

H
Haojun Liao 已提交
1980
  pSourceDataInfo->status = EX_SOURCE_DATA_READY;
1981 1982 1983 1984 1985

  tsem_post(&pExchangeInfo->ready);
  taosReleaseRef(exchangeObjRefPool, pWrapper->exchangeId);

  taosMemoryFree(pWrapper);
wmmhello's avatar
wmmhello 已提交
1986
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
1987 1988 1989 1990
}

static void destroySendMsgInfo(SMsgSendInfo* pMsgBody) {
  assert(pMsgBody != NULL);
wafwerar's avatar
wafwerar 已提交
1991 1992
  taosMemoryFreeClear(pMsgBody->msgInfo.pData);
  taosMemoryFreeClear(pMsgBody);
H
Haojun Liao 已提交
1993 1994
}

S
Shengliang Guan 已提交
1995
void qProcessFetchRsp(void* parent, SRpcMsg* pMsg, SEpSet* pEpSet) {
S
Shengliang Guan 已提交
1996 1997
  SMsgSendInfo* pSendInfo = (SMsgSendInfo*)pMsg->info.ahandle;
  assert(pMsg->info.ahandle != NULL);
H
Haojun Liao 已提交
1998 1999 2000 2001

  SDataBuf buf = {.len = pMsg->contLen, .pData = NULL};

  if (pMsg->contLen > 0) {
wafwerar's avatar
wafwerar 已提交
2002
    buf.pData = taosMemoryCalloc(1, pMsg->contLen);
H
Haojun Liao 已提交
2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013
    if (buf.pData == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      pMsg->code = TSDB_CODE_OUT_OF_MEMORY;
    } else {
      memcpy(buf.pData, pMsg->pCont, pMsg->contLen);
    }
  }

  pSendInfo->fp(pSendInfo->param, &buf, pMsg->code);
  rpcFreeCont(pMsg->pCont);
  destroySendMsgInfo(pSendInfo);
2014 2015
}

L
Liu Jicong 已提交
2016
static int32_t doSendFetchDataRequest(SExchangeInfo* pExchangeInfo, SExecTaskInfo* pTaskInfo, int32_t sourceIndex) {
2017
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2018

wafwerar's avatar
wafwerar 已提交
2019
  SResFetchReq* pMsg = taosMemoryCalloc(1, sizeof(SResFetchReq));
2020 2021 2022 2023
  if (NULL == pMsg) {
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }
2024

L
Liu Jicong 已提交
2025 2026
  SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, sourceIndex);
  SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, sourceIndex);
2027

2028 2029
  ASSERT(pDataInfo->status == EX_SOURCE_DATA_NOT_READY);

2030 2031 2032
  qDebug("%s build fetch msg and send to vgId:%d, ep:%s, taskId:0x%" PRIx64 ", execId:%d, %d/%" PRIzu,
         GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->addr.epSet.eps[0].fqdn, pSource->taskId, pSource->execId,
         sourceIndex, totalSources);
2033 2034 2035 2036 2037

  pMsg->header.vgId = htonl(pSource->addr.nodeId);
  pMsg->sId = htobe64(pSource->schedId);
  pMsg->taskId = htobe64(pSource->taskId);
  pMsg->queryId = htobe64(pTaskInfo->id.queryId);
D
dapan1121 已提交
2038
  pMsg->execId = htonl(pSource->execId);
2039 2040

  // send the fetch remote task result reques
wafwerar's avatar
wafwerar 已提交
2041
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
2042
  if (NULL == pMsgSendInfo) {
wafwerar's avatar
wafwerar 已提交
2043
    taosMemoryFreeClear(pMsg);
2044 2045 2046
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SMsgSendInfo));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
H
Haojun Liao 已提交
2047 2048
  }

2049
  SFetchRspHandleWrapper* pWrapper = taosMemoryCalloc(1, sizeof(SFetchRspHandleWrapper));
X
Xiaoyu Wang 已提交
2050
  pWrapper->exchangeId = pExchangeInfo->self;
2051 2052 2053
  pWrapper->sourceIndex = sourceIndex;

  pMsgSendInfo->param = pWrapper;
2054 2055
  pMsgSendInfo->msgInfo.pData = pMsg;
  pMsgSendInfo->msgInfo.len = sizeof(SResFetchReq);
D
dapan1121 已提交
2056
  pMsgSendInfo->msgType = TDMT_SCH_FETCH;
2057
  pMsgSendInfo->fp = loadRemoteDataCallback;
2058

2059
  int64_t transporterId = 0;
L
Liu Jicong 已提交
2060
  int32_t code = asyncSendMsgToServer(pExchangeInfo->pTransporter, &pSource->addr.epSet, &transporterId, pMsgSendInfo);
2061 2062 2063
  return TSDB_CODE_SUCCESS;
}

2064
int32_t extractDataBlockFromFetchRsp(SSDataBlock* pRes, SLoadRemoteDataInfo* pLoadInfo, int32_t numOfRows, char* pData,
L
Liu Jicong 已提交
2065 2066
                                     int32_t compLen, int32_t numOfOutput, int64_t startTs, uint64_t* total,
                                     SArray* pColList) {
H
Haojun Liao 已提交
2067
  if (pColList == NULL) {  // data from other sources
2068
    blockDataCleanup(pRes);
2069
    //    blockDataEnsureCapacity(pRes, numOfRows);
2070
    blockDecode(pRes, numOfOutput, numOfRows, pData);
H
Haojun Liao 已提交
2071
  } else {  // extract data according to pColList
2072
    ASSERT(numOfOutput == taosArrayGetSize(pColList));
2073 2074 2075 2076 2077
    char* pStart = pData;

    int32_t numOfCols = htonl(*(int32_t*)pStart);
    pStart += sizeof(int32_t);

2078
    // todo refactor:extract method
2079
    SSysTableSchema* pSchema = (SSysTableSchema*)pStart;
dengyihao's avatar
dengyihao 已提交
2080
    for (int32_t i = 0; i < numOfCols; ++i) {
2081 2082 2083 2084 2085 2086 2087
      SSysTableSchema* p = (SSysTableSchema*)pStart;

      p->colId = htons(p->colId);
      p->bytes = htonl(p->bytes);
      pStart += sizeof(SSysTableSchema);
    }

2088
    SSDataBlock* pBlock = createDataBlock();
dengyihao's avatar
dengyihao 已提交
2089
    for (int32_t i = 0; i < numOfCols; ++i) {
2090 2091
      SColumnInfoData idata = createColumnInfoData(pSchema[i].type, pSchema[i].bytes, pSchema[i].colId);
      blockDataAppendColInfo(pBlock, &idata);
2092 2093
    }

2094
    blockDecode(pBlock, numOfCols, numOfRows, pStart);
2095 2096
    blockDataEnsureCapacity(pRes, numOfRows);

H
Haojun Liao 已提交
2097
    // data from mnode
2098
    pRes->info.rows = numOfRows;
2099 2100
    relocateColumnData(pRes, pColList, pBlock->pDataBlock, false);
    blockDataDestroy(pBlock);
2101
  }
2102

2103 2104
  // todo move this to time window aggregator, since the primary timestamp may not be known by exchange operator.
  blockDataUpdateTsWindow(pRes, 0);
2105

2106
  int64_t el = taosGetTimestampUs() - startTs;
2107

H
Haojun Liao 已提交
2108 2109
  pLoadInfo->totalRows += numOfRows;
  pLoadInfo->totalSize += compLen;
2110

H
Haojun Liao 已提交
2111 2112 2113
  if (total != NULL) {
    *total += numOfRows;
  }
2114

H
Haojun Liao 已提交
2115
  pLoadInfo->totalElapsed += el;
2116 2117
  return TSDB_CODE_SUCCESS;
}
2118

L
Liu Jicong 已提交
2119 2120
static void* setAllSourcesCompleted(SOperatorInfo* pOperator, int64_t startTs) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
2121
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
H
Haojun Liao 已提交
2122

2123
  int64_t              el = taosGetTimestampUs() - startTs;
H
Haojun Liao 已提交
2124
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2125

H
Haojun Liao 已提交
2126
  pLoadInfo->totalElapsed += el;
H
Haojun Liao 已提交
2127

2128
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);
L
Liu Jicong 已提交
2129 2130 2131
  qDebug("%s all %" PRIzu " sources are exhausted, total rows: %" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
         GET_TASKID(pTaskInfo), totalSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
         pLoadInfo->totalElapsed / 1000.0);
2132 2133 2134 2135 2136

  doSetOperatorCompleted(pOperator);
  return NULL;
}

L
Liu Jicong 已提交
2137 2138
static SSDataBlock* concurrentlyLoadRemoteDataImpl(SOperatorInfo* pOperator, SExchangeInfo* pExchangeInfo,
                                                   SExecTaskInfo* pTaskInfo) {
2139 2140 2141 2142 2143 2144 2145 2146
  int32_t code = 0;
  int64_t startTs = taosGetTimestampUs();
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  while (1) {
    int32_t completed = 0;
    for (int32_t i = 0; i < totalSources; ++i) {
      SSourceDataInfo* pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, i);
2147
      if (pDataInfo->status == EX_SOURCE_DATA_EXHAUSTED) {
2148
        completed += 1;
H
Haojun Liao 已提交
2149 2150
        continue;
      }
2151

2152
      if (pDataInfo->status != EX_SOURCE_DATA_READY) {
2153 2154 2155
        continue;
      }

2156 2157 2158 2159 2160
      if (pDataInfo->code != TSDB_CODE_SUCCESS) {
        code = pDataInfo->code;
        goto _error;
      }

L
Liu Jicong 已提交
2161
      SRetrieveTableRsp*     pRsp = pDataInfo->pRsp;
X
Xiaoyu Wang 已提交
2162
      SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, i);
2163

L
Liu Jicong 已提交
2164
      SSDataBlock*         pRes = pExchangeInfo->pResult;
H
Haojun Liao 已提交
2165
      SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2166
      if (pRsp->numOfRows == 0) {
2167 2168
        qDebug("%s vgId:%d, taskId:0x%" PRIx64 " execId:%d index:%d completed, rowsOfSource:%" PRIu64
               ", totalRows:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
D
dapan1121 已提交
2169
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pDataInfo->totalRows,
2170
               pExchangeInfo->loadInfo.totalRows, completed + 1, i + 1, totalSources);
2171
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2172
        completed += 1;
D
dapan1121 已提交
2173
        taosMemoryFreeClear(pDataInfo->pRsp);
2174 2175
        continue;
      }
H
Haojun Liao 已提交
2176

H
Haojun Liao 已提交
2177
      SRetrieveTableRsp* pTableRsp = pDataInfo->pRsp;
L
Liu Jicong 已提交
2178 2179 2180
      code =
          extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pTableRsp->numOfRows, pTableRsp->data,
                                       pTableRsp->compLen, pTableRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
2181
      if (code != 0) {
2182
        taosMemoryFreeClear(pDataInfo->pRsp);
2183 2184 2185
        goto _error;
      }

2186
      if (pRsp->completed == 1) {
2187 2188
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d"
X
Xiaoyu Wang 已提交
2189 2190
               " index:%d completed, numOfRows:%d, rowsOfSource:%" PRIu64 ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64
               ", completed:%d try next %d/%" PRIzu,
2191 2192
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pRes->info.rows,
               pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, completed + 1, i + 1, totalSources);
2193
        completed += 1;
2194
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2195
      } else {
D
dapan1121 已提交
2196
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
dengyihao's avatar
dengyihao 已提交
2197
               ", totalBytes:%" PRIu64,
2198 2199
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
               pLoadInfo->totalRows, pLoadInfo->totalSize);
2200 2201
      }

2202 2203
      taosMemoryFreeClear(pDataInfo->pRsp);

2204 2205
      if (pDataInfo->status != EX_SOURCE_DATA_EXHAUSTED) {
        pDataInfo->status = EX_SOURCE_DATA_NOT_READY;
2206 2207
        code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
        if (code != TSDB_CODE_SUCCESS) {
2208
          taosMemoryFreeClear(pDataInfo->pRsp);
2209 2210 2211 2212 2213 2214 2215
          goto _error;
        }
      }

      return pExchangeInfo->pResult;
    }

2216
    if (completed == totalSources) {
2217 2218 2219 2220 2221 2222 2223 2224 2225
      return setAllSourcesCompleted(pOperator, startTs);
    }
  }

_error:
  pTaskInfo->code = code;
  return NULL;
}

L
Liu Jicong 已提交
2226 2227 2228
static int32_t prepareConcurrentlyLoad(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2229

L
Liu Jicong 已提交
2230
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2231 2232 2233
  int64_t startTs = taosGetTimestampUs();

  // Asynchronously send all fetch requests to all sources.
L
Liu Jicong 已提交
2234
  for (int32_t i = 0; i < totalSources; ++i) {
2235 2236
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
    if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
2237 2238
      pTaskInfo->code = code;
      return code;
2239 2240 2241 2242
    }
  }

  int64_t endTs = taosGetTimestampUs();
2243
  qDebug("%s send all fetch requests to %" PRIzu " sources completed, elapsed:%.2fms", GET_TASKID(pTaskInfo),
X
Xiaoyu Wang 已提交
2244
         totalSources, (endTs - startTs) / 1000.0);
2245

2246
  pOperator->status = OP_RES_TO_RETURN;
H
Haojun Liao 已提交
2247
  pOperator->cost.openCost = taosGetTimestampUs() - startTs;
2248

2249
  tsem_wait(&pExchangeInfo->ready);
H
Haojun Liao 已提交
2250
  return TSDB_CODE_SUCCESS;
2251 2252
}

L
Liu Jicong 已提交
2253 2254 2255
static SSDataBlock* seqLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2256

L
Liu Jicong 已提交
2257
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
2258
  int64_t startTs = taosGetTimestampUs();
2259

L
Liu Jicong 已提交
2260
  while (1) {
2261 2262
    if (pExchangeInfo->current >= totalSources) {
      return setAllSourcesCompleted(pOperator, startTs);
2263
    }
2264

2265 2266 2267
    doSendFetchDataRequest(pExchangeInfo, pTaskInfo, pExchangeInfo->current);
    tsem_wait(&pExchangeInfo->ready);

dengyihao's avatar
dengyihao 已提交
2268
    SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, pExchangeInfo->current);
X
Xiaoyu Wang 已提交
2269
    SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, pExchangeInfo->current);
2270

H
Haojun Liao 已提交
2271
    if (pDataInfo->code != TSDB_CODE_SUCCESS) {
2272 2273
      qError("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d error happens, code:%s", GET_TASKID(pTaskInfo),
             pSource->addr.nodeId, pSource->taskId, pSource->execId, tstrerror(pDataInfo->code));
H
Haojun Liao 已提交
2274 2275 2276 2277
      pOperator->pTaskInfo->code = pDataInfo->code;
      return NULL;
    }

L
Liu Jicong 已提交
2278
    SRetrieveTableRsp*   pRsp = pDataInfo->pRsp;
H
Haojun Liao 已提交
2279
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
2280
    if (pRsp->numOfRows == 0) {
2281 2282
      qDebug("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d %d of total completed, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 " try next",
D
dapan1121 已提交
2283
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pExchangeInfo->current + 1,
H
Haojun Liao 已提交
2284
             pDataInfo->totalRows, pLoadInfo->totalRows);
H
Haojun Liao 已提交
2285

2286
      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2287
      pExchangeInfo->current += 1;
D
dapan1121 已提交
2288
      taosMemoryFreeClear(pDataInfo->pRsp);
2289 2290
      continue;
    }
H
Haojun Liao 已提交
2291

L
Liu Jicong 已提交
2292
    SSDataBlock*       pRes = pExchangeInfo->pResult;
H
Haojun Liao 已提交
2293
    SRetrieveTableRsp* pTableRsp = pDataInfo->pRsp;
L
Liu Jicong 已提交
2294
    int32_t            code =
2295
        extractDataBlockFromFetchRsp(pExchangeInfo->pResult, pLoadInfo, pTableRsp->numOfRows, pTableRsp->data,
L
Liu Jicong 已提交
2296
                                     pTableRsp->compLen, pTableRsp->numOfCols, startTs, &pDataInfo->totalRows, NULL);
2297 2298

    if (pRsp->completed == 1) {
D
dapan1121 已提交
2299
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, rowsOfSource:%" PRIu64
L
Liu Jicong 已提交
2300
             ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64 " try next %d/%" PRIzu,
2301 2302 2303
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, pExchangeInfo->current + 1,
             totalSources);
2304

2305
      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
2306 2307
      pExchangeInfo->current += 1;
    } else {
D
dapan1121 已提交
2308
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
L
Liu Jicong 已提交
2309
             ", totalBytes:%" PRIu64,
2310 2311
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRes->info.rows,
             pLoadInfo->totalRows, pLoadInfo->totalSize);
2312 2313
    }

2314
    pOperator->resultInfo.totalRows += pRes->info.rows;
2315
    taosMemoryFreeClear(pDataInfo->pRsp);
2316 2317
    return pExchangeInfo->pResult;
  }
2318 2319
}

L
Liu Jicong 已提交
2320
static int32_t prepareLoadRemoteData(SOperatorInfo* pOperator) {
2321
  if (OPTR_IS_OPENED(pOperator)) {
H
Haojun Liao 已提交
2322 2323 2324
    return TSDB_CODE_SUCCESS;
  }

2325 2326
  int64_t st = taosGetTimestampUs();

L
Liu Jicong 已提交
2327
  SExchangeInfo* pExchangeInfo = pOperator->info;
2328
  if (!pExchangeInfo->seqLoadData) {
H
Haojun Liao 已提交
2329 2330 2331 2332 2333 2334
    int32_t code = prepareConcurrentlyLoad(pOperator);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }
  }

2335
  OPTR_SET_OPENED(pOperator);
2336
  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
H
Haojun Liao 已提交
2337 2338 2339
  return TSDB_CODE_SUCCESS;
}

2340
static SSDataBlock* doLoadRemoteData(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
2341 2342
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
2343

2344
  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
2345
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
2346 2347
    return NULL;
  }
2348

L
Liu Jicong 已提交
2349
  size_t               totalSources = taosArrayGetSize(pExchangeInfo->pSources);
H
Haojun Liao 已提交
2350
  SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
H
Haojun Liao 已提交
2351

2352
  if (pOperator->status == OP_EXEC_DONE) {
L
Liu Jicong 已提交
2353 2354 2355
    qDebug("%s all %" PRIzu " source(s) are exhausted, total rows:%" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
           GET_TASKID(pTaskInfo), totalSources, pLoadInfo->totalRows, pLoadInfo->totalSize,
           pLoadInfo->totalElapsed / 1000.0);
2356 2357 2358 2359 2360 2361
    return NULL;
  }

  if (pExchangeInfo->seqLoadData) {
    return seqLoadRemoteData(pOperator);
  } else {
2362
    return concurrentlyLoadRemoteDataImpl(pOperator, pExchangeInfo, pTaskInfo);
2363
  }
H
Haojun Liao 已提交
2364
}
2365

2366
static int32_t initDataSource(int32_t numOfSources, SExchangeInfo* pInfo, const char* id) {
2367
  pInfo->pSourceDataInfo = taosArrayInit(numOfSources, sizeof(SSourceDataInfo));
H
Haojun Liao 已提交
2368 2369
  if (pInfo->pSourceDataInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
2370 2371
  }

L
Liu Jicong 已提交
2372
  for (int32_t i = 0; i < numOfSources; ++i) {
2373
    SSourceDataInfo dataInfo = {0};
H
Haojun Liao 已提交
2374
    dataInfo.status = EX_SOURCE_DATA_NOT_READY;
2375
    dataInfo.taskId = id;
L
Liu Jicong 已提交
2376
    dataInfo.index = i;
X
Xiaoyu Wang 已提交
2377
    SSourceDataInfo* pDs = taosArrayPush(pInfo->pSourceDataInfo, &dataInfo);
2378
    if (pDs == NULL) {
H
Haojun Liao 已提交
2379 2380 2381 2382 2383 2384 2385 2386
      taosArrayDestroy(pInfo->pSourceDataInfo);
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
}

2387
static int32_t initExchangeOperator(SExchangePhysiNode* pExNode, SExchangeInfo* pInfo, const char* id) {
2388
  size_t numOfSources = LIST_LENGTH(pExNode->pSrcEndPoints);
H
Haojun Liao 已提交
2389

2390
  if (numOfSources == 0) {
X
Xiaoyu Wang 已提交
2391
    qError("%s invalid number: %d of sources in exchange operator", id, (int32_t)numOfSources);
2392 2393 2394
    return TSDB_CODE_INVALID_PARA;
  }

H
Haojun Liao 已提交
2395
  pInfo->pSources = taosArrayInit(numOfSources, sizeof(SDownstreamSourceNode));
wmmhello's avatar
wmmhello 已提交
2396
  if (pInfo->pSources == NULL) {
2397
    return TSDB_CODE_OUT_OF_MEMORY;
H
Haojun Liao 已提交
2398 2399
  }

L
Liu Jicong 已提交
2400
  for (int32_t i = 0; i < numOfSources; ++i) {
D
dapan1121 已提交
2401
    SDownstreamSourceNode* pNode = (SDownstreamSourceNode*)nodesListGetNode((SNodeList*)pExNode->pSrcEndPoints, i);
H
Haojun Liao 已提交
2402 2403
    taosArrayPush(pInfo->pSources, pNode);
  }
2404

2405 2406
  pInfo->self = taosAddRef(exchangeObjRefPool, pInfo);

2407
  return initDataSource(numOfSources, pInfo, id);
2408 2409 2410 2411 2412 2413
}

SOperatorInfo* createExchangeOperatorInfo(void* pTransporter, SExchangePhysiNode* pExNode, SExecTaskInfo* pTaskInfo) {
  SExchangeInfo* pInfo = taosMemoryCalloc(1, sizeof(SExchangeInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
H
Haojun Liao 已提交
2414
    goto _error;
2415
  }
H
Haojun Liao 已提交
2416

2417
  int32_t code = initExchangeOperator(pExNode, pInfo, GET_TASKID(pTaskInfo));
2418 2419 2420
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
2421 2422

  tsem_init(&pInfo->ready, 0, 0);
2423

2424
  pInfo->seqLoadData = false;
2425
  pInfo->pTransporter = pTransporter;
2426 2427
  pInfo->pResult = createResDataBlock(pExNode->node.pOutputDataBlockDesc);
  pOperator->name = "ExchangeOperator";
X
Xiaoyu Wang 已提交
2428
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_EXCHANGE;
X
Xiaoyu Wang 已提交
2429
  pOperator->blocking = false;
2430 2431
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
2432
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pResult->pDataBlock);
X
Xiaoyu Wang 已提交
2433
  pOperator->pTaskInfo = pTaskInfo;
2434

L
Liu Jicong 已提交
2435 2436
  pOperator->fpSet = createOperatorFpSet(prepareLoadRemoteData, doLoadRemoteData, NULL, NULL,
                                         destroyExchangeOperatorInfo, NULL, NULL, NULL);
2437
  return pOperator;
H
Haojun Liao 已提交
2438

L
Liu Jicong 已提交
2439
_error:
H
Haojun Liao 已提交
2440
  if (pInfo != NULL) {
2441
    doDestroyExchangeOperatorInfo(pInfo);
H
Haojun Liao 已提交
2442 2443
  }

wafwerar's avatar
wafwerar 已提交
2444 2445
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
2446
  pTaskInfo->code = code;
H
Haojun Liao 已提交
2447
  return NULL;
2448 2449
}

dengyihao's avatar
dengyihao 已提交
2450 2451
static int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                                const char* pKey);
2452

2453
static void destroySortedMergeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
2454
  SSortedMergeOperatorInfo* pInfo = (SSortedMergeOperatorInfo*)param;
H
Haojun Liao 已提交
2455
  taosArrayDestroy(pInfo->pSortInfo);
2456 2457 2458
  taosArrayDestroy(pInfo->groupInfo);

  if (pInfo->pSortHandle != NULL) {
H
Haojun Liao 已提交
2459
    tsortDestroySortHandle(pInfo->pSortHandle);
2460 2461
  }

H
Haojun Liao 已提交
2462
  blockDataDestroy(pInfo->binfo.pRes);
H
Haojun Liao 已提交
2463
  cleanupAggSup(&pInfo->aggSup);
2464
}
H
Haojun Liao 已提交
2465

L
Liu Jicong 已提交
2466
static bool needToMerge(SSDataBlock* pBlock, SArray* groupInfo, char** buf, int32_t rowIndex) {
2467 2468 2469 2470
  size_t size = taosArrayGetSize(groupInfo);
  if (size == 0) {
    return true;
  }
2471

2472 2473
  for (int32_t i = 0; i < size; ++i) {
    int32_t* index = taosArrayGet(groupInfo, i);
2474

2475
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
L
Liu Jicong 已提交
2476
    bool             isNull = colDataIsNull(pColInfo, rowIndex, pBlock->info.rows, NULL);
2477

2478 2479 2480
    if ((isNull && buf[i] != NULL) || (!isNull && buf[i] == NULL)) {
      return false;
    }
2481

2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494
    char* pCell = colDataGetData(pColInfo, rowIndex);
    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      if (varDataLen(pCell) != varDataLen(buf[i])) {
        return false;
      } else {
        if (memcmp(varDataVal(pCell), varDataVal(buf[i]), varDataLen(pCell)) != 0) {
          return false;
        }
      }
    } else {
      if (memcmp(pCell, buf[i], pColInfo->info.bytes) != 0) {
        return false;
      }
2495 2496 2497
    }
  }

2498
  return 0;
2499 2500
}

L
Liu Jicong 已提交
2501 2502 2503
static void doMergeResultImpl(SSortedMergeOperatorInfo* pInfo, SqlFunctionCtx* pCtx, int32_t numOfExpr,
                              int32_t rowIndex) {
  for (int32_t j = 0; j < numOfExpr; ++j) {  // TODO set row index
X
Xiaoyu Wang 已提交
2504
                                             //    pCtx[j].startRow = rowIndex;
2505 2506
  }

2507 2508
  for (int32_t j = 0; j < numOfExpr; ++j) {
    int32_t functionId = pCtx[j].functionId;
L
Liu Jicong 已提交
2509 2510 2511 2512 2513 2514 2515 2516 2517
    //    pCtx[j].fpSet->addInput(&pCtx[j]);

    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_MERGE);
    //    } else {
    //      assert(!TSDB_FUNC_IS_SCALAR(functionId));
    //      aAggs[functionId].mergeFunc(&pCtx[j]);
    //    }
2518
  }
2519
}
2520

L
Liu Jicong 已提交
2521 2522
static void doFinalizeResultImpl(SqlFunctionCtx* pCtx, int32_t numOfExpr) {
  for (int32_t j = 0; j < numOfExpr; ++j) {
2523 2524 2525 2526
    int32_t functionId = pCtx[j].functionId;
    //    if (functionId == FUNC_TAG_DUMMY || functionId == FUNC_TS_DUMMY) {
    //      continue;
    //    }
2527

2528 2529 2530 2531
    //    if (functionId < 0) {
    //      SUdfInfo* pUdfInfo = taosArrayGet(pInfo->udfInfo, -1 * functionId - 1);
    //      doInvokeUdf(pUdfInfo, &pCtx[j], 0, TSDB_UDF_FUNC_FINALIZE);
    //    } else {
dengyihao's avatar
dengyihao 已提交
2532
    //    pCtx[j].fpSet.finalize(&pCtx[j]);
2533 2534
  }
}
2535

2536
static bool saveCurrentTuple(char** rowColData, SArray* pColumnList, SSDataBlock* pBlock, int32_t rowIndex) {
L
Liu Jicong 已提交
2537
  int32_t size = (int32_t)taosArrayGetSize(pColumnList);
2538

L
Liu Jicong 已提交
2539 2540
  for (int32_t i = 0; i < size; ++i) {
    int32_t*         index = taosArrayGet(pColumnList, i);
2541
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
H
Haojun Liao 已提交
2542

2543 2544 2545
    char* data = colDataGetData(pColInfo, rowIndex);
    memcpy(rowColData[i], data, colDataGetLength(pColInfo, rowIndex));
  }
2546

2547 2548
  return true;
}
2549

2550 2551
static void doMergeImpl(SOperatorInfo* pOperator, int32_t numOfExpr, SSDataBlock* pBlock) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
2552

2553
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
2554

L
Liu Jicong 已提交
2555
  for (int32_t i = 0; i < pBlock->info.rows; ++i) {
2556 2557 2558 2559 2560 2561 2562 2563 2564
    if (!pInfo->hasGroupVal) {
      ASSERT(i == 0);
      doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
      pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, i);
    } else {
      if (needToMerge(pBlock, pInfo->groupInfo, pInfo->groupVal, i)) {
        doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
      } else {
        doFinalizeResultImpl(pCtx, numOfExpr);
2565 2566
        int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
        //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);
2567

2568
        // TODO check for available buffer;
H
Haojun Liao 已提交
2569

2570 2571 2572 2573 2574
        // next group info data
        pInfo->binfo.pRes->info.rows += numOfRows;
        for (int32_t j = 0; j < numOfExpr; ++j) {
          if (pCtx[j].functionId < 0) {
            continue;
2575
          }
2576

H
Haojun Liao 已提交
2577
          pCtx[j].fpSet.process(&pCtx[j]);
2578
        }
2579 2580 2581

        doMergeResultImpl(pInfo, pCtx, numOfExpr, i);
        pInfo->hasGroupVal = saveCurrentTuple(pInfo->groupVal, pInfo->groupInfo, pBlock, i);
H
Haojun Liao 已提交
2582
      }
2583 2584 2585 2586
    }
  }
}

2587 2588
static SSDataBlock* doMerge(SOperatorInfo* pOperator) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
L
Liu Jicong 已提交
2589
  SSortHandle*              pHandle = pInfo->pSortHandle;
2590

2591
  SSDataBlock* pDataBlock = createOneDataBlock(pInfo->binfo.pRes, false);
2592
  blockDataEnsureCapacity(pDataBlock, pOperator->resultInfo.capacity);
2593

L
Liu Jicong 已提交
2594
  while (1) {
2595
    blockDataCleanup(pDataBlock);
2596
    while (1) {
H
Haojun Liao 已提交
2597
      STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
2598 2599
      if (pTupleHandle == NULL) {
        break;
2600
      }
2601

2602 2603
      // build datablock for merge for one group
      appendOneRowToDataBlock(pDataBlock, pTupleHandle);
2604
      if (pDataBlock->info.rows >= pOperator->resultInfo.capacity) {
2605 2606
        break;
      }
2607
    }
2608

2609 2610 2611
    if (pDataBlock->info.rows == 0) {
      break;
    }
2612

2613
    setInputDataBlock(pOperator, pOperator->exprSupp.pCtx, pDataBlock, TSDB_ORDER_ASC, MAIN_SCAN, true);
L
Liu Jicong 已提交
2614 2615
    //  updateOutputBuf(&pInfo->binfo, &pAggInfo->bufCapacity, pBlock->info.rows * pAggInfo->resultRowFactor,
    //  pOperator->pRuntimeEnv, true);
2616
    doMergeImpl(pOperator, pOperator->exprSupp.numOfExprs, pDataBlock);
2617 2618
    // flush to tuple store, and after all data have been handled, return to upstream node or sink node
  }
2619

2620 2621 2622
  doFinalizeResultImpl(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs);
  int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);
  //        setTagValueForMultipleRows(pCtx, pOperator->exprSupp.numOfExprs, numOfRows);
2623

2624
  // TODO check for available buffer;
2625

2626 2627
  // next group info data
  pInfo->binfo.pRes->info.rows += numOfRows;
L
Liu Jicong 已提交
2628
  return (pInfo->binfo.pRes->info.rows > 0) ? pInfo->binfo.pRes : NULL;
2629
}
2630

L
Liu Jicong 已提交
2631 2632
SSDataBlock* getSortedMergeBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity,
                                     SArray* pColMatchInfo, SSortedMergeOperatorInfo* pInfo) {
2633 2634 2635 2636 2637 2638 2639 2640 2641 2642
  blockDataCleanup(pDataBlock);

  SSDataBlock* p = tsortGetSortedDataBlock(pHandle);
  if (p == NULL) {
    return NULL;
  }

  blockDataEnsureCapacity(p, capacity);

  while (1) {
2643
    STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
2644 2645 2646 2647
    if (pTupleHandle == NULL) {
      break;
    }

2648
    appendOneRowToDataBlock(p, pTupleHandle);
2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661
    if (p->info.rows >= capacity) {
      break;
    }
  }

  if (p->info.rows > 0) {
    int32_t numOfCols = taosArrayGetSize(pColMatchInfo);
    for (int32_t i = 0; i < numOfCols; ++i) {
      SColMatchInfo* pmInfo = taosArrayGet(pColMatchInfo, i);
      ASSERT(pmInfo->matchType == COL_MATCH_FROM_SLOT_ID);

      SColumnInfoData* pSrc = taosArrayGet(p->pDataBlock, pmInfo->srcSlotId);
      SColumnInfoData* pDst = taosArrayGet(pDataBlock->pDataBlock, pmInfo->targetSlotId);
2662
      colDataAssign(pDst, pSrc, p->info.rows, &pDataBlock->info);
2663 2664 2665 2666 2667 2668 2669 2670 2671 2672
    }

    pDataBlock->info.rows = p->info.rows;
    pDataBlock->info.capacity = p->info.rows;
  }

  blockDataDestroy(p);
  return (pDataBlock->info.rows > 0) ? pDataBlock : NULL;
}

2673
static SSDataBlock* doSortedMerge(SOperatorInfo* pOperator) {
2674 2675
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
2676 2677
  }

L
Liu Jicong 已提交
2678
  SExecTaskInfo*            pTaskInfo = pOperator->pTaskInfo;
2679
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
H
Haojun Liao 已提交
2680
  if (pOperator->status == OP_RES_TO_RETURN) {
2681
    return getSortedMergeBlockData(pInfo->pSortHandle, pInfo->binfo.pRes, pOperator->resultInfo.capacity, NULL, pInfo);
2682 2683
  }

2684
  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
L
Liu Jicong 已提交
2685 2686
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->binfo.pRes, "GET_TASKID(pTaskInfo)");
H
Haojun Liao 已提交
2687

2688
  tsortSetFetchRawDataFp(pInfo->pSortHandle, loadNextDataBlock, NULL, NULL);
2689

L
Liu Jicong 已提交
2690
  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
wmmhello's avatar
wmmhello 已提交
2691
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
H
Haojun Liao 已提交
2692
    ps->param = pOperator->pDownstream[i];
H
Haojun Liao 已提交
2693
    tsortAddSource(pInfo->pSortHandle, ps);
2694 2695
  }

H
Haojun Liao 已提交
2696
  int32_t code = tsortOpen(pInfo->pSortHandle);
2697
  if (code != TSDB_CODE_SUCCESS) {
2698
    longjmp(pTaskInfo->env, terrno);
2699 2700
  }

H
Haojun Liao 已提交
2701
  pOperator->status = OP_RES_TO_RETURN;
2702
  return doMerge(pOperator);
2703
}
2704

L
Liu Jicong 已提交
2705 2706
static int32_t initGroupCol(SExprInfo* pExprInfo, int32_t numOfCols, SArray* pGroupInfo,
                            SSortedMergeOperatorInfo* pInfo) {
2707 2708
  if (pGroupInfo == NULL || taosArrayGetSize(pGroupInfo) == 0) {
    return 0;
H
Haojun Liao 已提交
2709 2710
  }

2711 2712 2713 2714 2715 2716 2717 2718
  int32_t len = 0;
  SArray* plist = taosArrayInit(3, sizeof(SColumn));
  pInfo->groupInfo = taosArrayInit(3, sizeof(int32_t));

  if (plist == NULL || pInfo->groupInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

L
Liu Jicong 已提交
2719 2720
  size_t numOfGroupCol = taosArrayGetSize(pInfo->groupInfo);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
2721
    SColumn* pCol = taosArrayGet(pGroupInfo, i);
L
Liu Jicong 已提交
2722
    for (int32_t j = 0; j < numOfCols; ++j) {
H
Haojun Liao 已提交
2723
      SExprInfo* pe = &pExprInfo[j];
2724
      if (pe->base.resSchema.slotId == pCol->colId) {
2725 2726
        taosArrayPush(plist, pCol);
        taosArrayPush(pInfo->groupInfo, &j);
H
Haojun Liao 已提交
2727
        len += pCol->bytes;
2728 2729
        break;
      }
H
Haojun Liao 已提交
2730 2731 2732
    }
  }

2733
  ASSERT(taosArrayGetSize(pGroupInfo) == taosArrayGetSize(plist));
H
Haojun Liao 已提交
2734

wafwerar's avatar
wafwerar 已提交
2735
  pInfo->groupVal = taosMemoryCalloc(1, (POINTER_BYTES * numOfGroupCol + len));
2736 2737 2738 2739
  if (pInfo->groupVal == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }
H
Haojun Liao 已提交
2740

2741
  int32_t offset = 0;
L
Liu Jicong 已提交
2742 2743
  char*   start = (char*)(pInfo->groupVal + (POINTER_BYTES * numOfGroupCol));
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
2744 2745
    pInfo->groupVal[i] = start + offset;
    SColumn* pCol = taosArrayGet(plist, i);
H
Haojun Liao 已提交
2746
    offset += pCol->bytes;
2747
  }
H
Haojun Liao 已提交
2748

2749
  taosArrayDestroy(plist);
H
Haojun Liao 已提交
2750

2751 2752
  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2753

L
Liu Jicong 已提交
2754 2755 2756
SOperatorInfo* createSortedMergeOperatorInfo(SOperatorInfo** downstream, int32_t numOfDownstream, SExprInfo* pExprInfo,
                                             int32_t num, SArray* pSortInfo, SArray* pGroupInfo,
                                             SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
2757
  SSortedMergeOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SSortedMergeOperatorInfo));
L
Liu Jicong 已提交
2758
  SOperatorInfo*            pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
2759
  if (pInfo == NULL || pOperator == NULL) {
2760
    goto _error;
2761
  }
H
Haojun Liao 已提交
2762

2763 2764 2765 2766 2767
  int32_t code = initExprSupp(&pOperator->exprSupp, pExprInfo, num);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

2768
  initResultRowInfo(&pInfo->binfo.resultRowInfo);
H
Haojun Liao 已提交
2769

2770
  if (pOperator->exprSupp.pCtx == NULL || pInfo->binfo.pRes == NULL) {
2771 2772
    goto _error;
  }
H
Haojun Liao 已提交
2773

2774
  size_t keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
2775
  code = doInitAggInfoSup(&pInfo->aggSup, pOperator->exprSupp.pCtx, num, keyBufSize, pTaskInfo->id.str);
2776 2777 2778
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
H
Haojun Liao 已提交
2779

2780
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, num);
H
Haojun Liao 已提交
2781
  code = initGroupCol(pExprInfo, num, pGroupInfo, pInfo);
2782 2783 2784
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
H
Haojun Liao 已提交
2785

L
Liu Jicong 已提交
2786 2787 2788 2789 2790
  //  pInfo->resultRowFactor = (int32_t)(getRowNumForMultioutput(pRuntimeEnv->pQueryAttr,
  //      pRuntimeEnv->pQueryAttr->topBotQuery, false));
  pInfo->sortBufSize = 1024 * 16;  // 1MB
  pInfo->bufPageSize = 1024;
  pInfo->pSortInfo = pSortInfo;
H
Haojun Liao 已提交
2791

2792
  pOperator->resultInfo.capacity = blockDataGetCapacityInRow(pInfo->binfo.pRes, pInfo->bufPageSize);
H
Haojun Liao 已提交
2793

L
Liu Jicong 已提交
2794
  pOperator->name = "SortedMerge";
X
Xiaoyu Wang 已提交
2795
  // pOperator->operatorType = OP_SortedMerge;
2796 2797 2798
  pOperator->blocking = true;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
L
Liu Jicong 已提交
2799
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
2800

2801 2802
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doSortedMerge, NULL, NULL, destroySortedMergeOperatorInfo,
                                         NULL, NULL, NULL);
2803 2804 2805
  code = appendDownstream(pOperator, downstream, numOfDownstream);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
2806
  }
H
Haojun Liao 已提交
2807

2808
  return pOperator;
H
Haojun Liao 已提交
2809

L
Liu Jicong 已提交
2810
_error:
2811
  if (pInfo != NULL) {
H
Haojun Liao 已提交
2812
    destroySortedMergeOperatorInfo(pInfo, num);
H
Haojun Liao 已提交
2813 2814
  }

wafwerar's avatar
wafwerar 已提交
2815 2816
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
2817 2818
  terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
  return NULL;
H
Haojun Liao 已提交
2819 2820
}

X
Xiaoyu Wang 已提交
2821
int32_t getTableScanInfo(SOperatorInfo* pOperator, int32_t* order, int32_t* scanFlag) {
2822
  // todo add more information about exchange operation
2823
  int32_t type = pOperator->operatorType;
X
Xiaoyu Wang 已提交
2824
  if (type == QUERY_NODE_PHYSICAL_PLAN_EXCHANGE || type == QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN ||
2825 2826
      type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN || type == QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN ||
      type == QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN) {
2827 2828 2829
    *order = TSDB_ORDER_ASC;
    *scanFlag = MAIN_SCAN;
    return TSDB_CODE_SUCCESS;
2830
  } else if (type == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
2831 2832 2833 2834 2835
    STableScanInfo* pTableScanInfo = pOperator->info;
    *order = pTableScanInfo->cond.order;
    *scanFlag = pTableScanInfo->scanFlag;
    return TSDB_CODE_SUCCESS;
  } else {
H
Haojun Liao 已提交
2836
    if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
2837
      return TSDB_CODE_INVALID_PARA;
H
Haojun Liao 已提交
2838
    } else {
2839
      return getTableScanInfo(pOperator->pDownstream[0], order, scanFlag);
2840 2841 2842
    }
  }
}
2843

L
Liu Jicong 已提交
2844 2845
int32_t doPrepareScan(SOperatorInfo* pOperator, uint64_t uid, int64_t ts) {
  int32_t type = pOperator->operatorType;
2846 2847 2848

  pOperator->status = OP_OPENED;

L
Liu Jicong 已提交
2849 2850
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamBlockScanInfo* pScanInfo = pOperator->info;
2851 2852
    pScanInfo->blockType = STREAM_INPUT__DATA_SCAN;

2853 2854
    pScanInfo->pSnapshotReadOp->status = OP_OPENED;

2855
    STableScanInfo* pInfo = pScanInfo->pSnapshotReadOp->info;
2856 2857
    ASSERT(pInfo->scanMode == TABLE_SCAN__TABLE_ORDER);

L
Liu Jicong 已提交
2858 2859 2860 2861
    if (uid == 0) {
      pInfo->noTable = 1;
      return TSDB_CODE_SUCCESS;
    }
2862 2863 2864 2865 2866 2867

    /*if (pSnapShotScanInfo->dataReader == NULL) {*/
    /*pSnapShotScanInfo->dataReader = tsdbReaderOpen(pHandle->vnode, &pSTInfo->cond, tableList, 0, 0);*/
    /*pSnapShotScanInfo->scanMode = TABLE_SCAN__TABLE_ORDER;*/
    /*}*/

L
Liu Jicong 已提交
2868 2869
    pInfo->noTable = 0;

2870
    if (pInfo->lastStatus.uid != uid || pInfo->lastStatus.ts != ts) {
L
Liu Jicong 已提交
2871 2872 2873 2874 2875 2876 2877 2878 2879 2880 2881
      SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

      int32_t tableSz = taosArrayGetSize(pTaskInfo->tableqinfoList.pTableList);
      bool    found = false;
      for (int32_t i = 0; i < tableSz; i++) {
        STableKeyInfo* pTableInfo = taosArrayGet(pTaskInfo->tableqinfoList.pTableList, i);
        if (pTableInfo->uid == uid) {
          found = true;
          pInfo->currentTable = i;
        }
      }
2882
      // TODO after processing drop, found can be false
L
Liu Jicong 已提交
2883
      ASSERT(found);
2884 2885 2886 2887 2888 2889 2890 2891 2892

      tsdbSetTableId(pInfo->dataReader, uid);
      int64_t oldSkey = pInfo->cond.twindows[0].skey;
      pInfo->cond.twindows[0].skey = ts + 1;
      tsdbResetReadHandle(pInfo->dataReader, &pInfo->cond, 0);
      pInfo->cond.twindows[0].skey = oldSkey;
      pInfo->scanTimes = 0;
      pInfo->curTWinIdx = 0;

L
Liu Jicong 已提交
2893 2894
      qDebug("tsdb reader offset seek to uid %ld ts %ld, table cur set to %d , all table num %d", uid, ts,
             pInfo->currentTable, tableSz);
L
Liu Jicong 已提交
2895
    }
L
Liu Jicong 已提交
2896

L
Liu Jicong 已提交
2897
    return TSDB_CODE_SUCCESS;
2898

L
Liu Jicong 已提交
2899
  } else {
2900 2901 2902 2903 2904
    if (pOperator->numOfDownstream == 1) {
      return doPrepareScan(pOperator->pDownstream[0], uid, ts);
    } else if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator to set the input data block");
      return TSDB_CODE_QRY_APP_ERROR;
L
Liu Jicong 已提交
2905
    } else {
2906 2907
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
L
Liu Jicong 已提交
2908 2909 2910 2911
    }
  }
}

2912 2913 2914 2915
int32_t doGetScanStatus(SOperatorInfo* pOperator, uint64_t* uid, int64_t* ts) {
  int32_t type = pOperator->operatorType;
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamBlockScanInfo* pScanInfo = pOperator->info;
L
Liu Jicong 已提交
2916 2917 2918
    STableScanInfo*       pSnapShotScanInfo = pScanInfo->pSnapshotReadOp->info;
    *uid = pSnapShotScanInfo->lastStatus.uid;
    *ts = pSnapShotScanInfo->lastStatus.ts;
2919 2920 2921 2922 2923 2924 2925 2926 2927 2928 2929
  } else {
    if (pOperator->pDownstream[0] == NULL) {
      return TSDB_CODE_INVALID_PARA;
    } else {
      doGetScanStatus(pOperator->pDownstream[0], uid, ts);
    }
  }

  return TSDB_CODE_SUCCESS;
}

2930
// this is a blocking operator
L
Liu Jicong 已提交
2931
static int32_t doOpenAggregateOptr(SOperatorInfo* pOperator) {
H
Haojun Liao 已提交
2932 2933
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
2934 2935
  }

H
Haojun Liao 已提交
2936
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
2937
  SAggOperatorInfo* pAggInfo = pOperator->info;
H
Haojun Liao 已提交
2938

2939 2940
  SExprSupp*     pSup = &pOperator->exprSupp;
  SOperatorInfo* downstream = pOperator->pDownstream[0];
2941

2942 2943
  int64_t st = taosGetTimestampUs();

2944 2945 2946
  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;

H
Haojun Liao 已提交
2947
  while (1) {
2948
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
2949 2950 2951 2952
    if (pBlock == NULL) {
      break;
    }

2953 2954 2955 2956
    int32_t code = getTableScanInfo(pOperator, &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
2957

2958
    // there is an scalar expression that needs to be calculated before apply the group aggregation.
2959 2960 2961
    if (pAggInfo->scalarExprSup.pExprInfo != NULL) {
      SExprSupp* pSup1 = &pAggInfo->scalarExprSup;
      code = projectApplyFunctions(pSup1->pExprInfo, pBlock, pBlock, pSup1->pCtx, pSup1->numOfExprs, NULL);
2962
      if (code != TSDB_CODE_SUCCESS) {
2963
        longjmp(pTaskInfo->env, code);
2964
      }
2965 2966
    }

2967
    // the pDataBlock are always the same one, no need to call this again
2968 2969 2970
    setExecutionContext(pOperator, pOperator->exprSupp.numOfExprs, pBlock->info.groupId, pAggInfo);
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, true);
    code = doAggregateImpl(pOperator, 0, pSup->pCtx);
2971 2972 2973
    if (code != 0) {
      longjmp(pTaskInfo->env, code);
    }
2974

dengyihao's avatar
dengyihao 已提交
2975
#if 0  // test for encode/decode result info
2976
    if(pOperator->fpSet.encodeResultRow){
2977 2978
      char *result = NULL;
      int32_t length = 0;
2979 2980
      pOperator->fpSet.encodeResultRow(pOperator, &result, &length);
      SAggSupporter* pSup = &pAggInfo->aggSup;
2981 2982
      taosHashClear(pSup->pResultRowHashTable);
      pInfo->resultRowInfo.size = 0;
2983
      pOperator->fpSet.decodeResultRow(pOperator, result);
2984 2985 2986
      if(result){
        taosMemoryFree(result);
      }
2987
    }
2988
#endif
2989 2990
  }

H
Haojun Liao 已提交
2991
  closeAllResultRows(&pAggInfo->binfo.resultRowInfo);
2992
  initGroupedResultInfo(&pAggInfo->groupResInfo, pAggInfo->aggSup.pResultRowHashTable, 0);
H
Haojun Liao 已提交
2993
  OPTR_SET_OPENED(pOperator);
2994

2995
  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
H
Haojun Liao 已提交
2996 2997 2998
  return TSDB_CODE_SUCCESS;
}

2999
static SSDataBlock* getAggregateResult(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
3000
  SAggOperatorInfo* pAggInfo = pOperator->info;
H
Haojun Liao 已提交
3001 3002 3003 3004 3005 3006
  SOptrBasicInfo*   pInfo = &pAggInfo->binfo;

  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

L
Liu Jicong 已提交
3007
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
3008
  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
H
Haojun Liao 已提交
3009
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
3010
    doSetOperatorCompleted(pOperator);
H
Haojun Liao 已提交
3011 3012 3013
    return NULL;
  }

H
Haojun Liao 已提交
3014
  blockDataEnsureCapacity(pInfo->pRes, pOperator->resultInfo.capacity);
3015
  doBuildResultDatablock(pOperator, pInfo, &pAggInfo->groupResInfo, pAggInfo->aggSup.pResultBuf);
3016
  if (pInfo->pRes->info.rows == 0 || !hasDataInGroupInfo(&pAggInfo->groupResInfo)) {
H
Haojun Liao 已提交
3017 3018
    doSetOperatorCompleted(pOperator);
  }
3019

3020
  size_t rows = blockDataGetNumOfRows(pInfo->pRes);
3021 3022
  pOperator->resultInfo.totalRows += rows;

3023
  return (rows == 0) ? NULL : pInfo->pRes;
3024 3025
}

wmmhello's avatar
wmmhello 已提交
3026
int32_t aggEncodeResultRow(SOperatorInfo* pOperator, char** result, int32_t* length) {
3027
  if (result == NULL || length == NULL) {
wmmhello's avatar
wmmhello 已提交
3028 3029 3030
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
3031 3032 3033 3034 3035
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
  int32_t         size = taosHashGetSize(pSup->pResultRowHashTable);
  size_t          keyLen = sizeof(uint64_t) * 2;  // estimate the key length
  int32_t         totalSize =
      sizeof(int32_t) + sizeof(int32_t) + size * (sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize);
wmmhello's avatar
wmmhello 已提交
3036

C
Cary Xu 已提交
3037 3038 3039 3040 3041 3042
  // no result
  if (getTotalBufSize(pSup->pResultBuf) == 0) {
    *result = NULL;
    *length = 0;
    return TSDB_CODE_SUCCESS;
  }
3043

wmmhello's avatar
wmmhello 已提交
3044
  *result = (char*)taosMemoryCalloc(1, totalSize);
L
Liu Jicong 已提交
3045
  if (*result == NULL) {
wmmhello's avatar
wmmhello 已提交
3046
    return TSDB_CODE_OUT_OF_MEMORY;
wmmhello's avatar
wmmhello 已提交
3047
  }
wmmhello's avatar
wmmhello 已提交
3048

wmmhello's avatar
wmmhello 已提交
3049
  int32_t offset = sizeof(int32_t);
wmmhello's avatar
wmmhello 已提交
3050 3051
  *(int32_t*)(*result + offset) = size;
  offset += sizeof(int32_t);
3052 3053

  // prepare memory
3054
  SResultRowPosition* pos = &pInfo->resultRowInfo.cur;
dengyihao's avatar
dengyihao 已提交
3055 3056
  void*               pPage = getBufPage(pSup->pResultBuf, pos->pageId);
  SResultRow*         pRow = (SResultRow*)((char*)pPage + pos->offset);
3057 3058 3059
  setBufPageDirty(pPage, true);
  releaseBufPage(pSup->pResultBuf, pPage);

dengyihao's avatar
dengyihao 已提交
3060
  void* pIter = taosHashIterate(pSup->pResultRowHashTable, NULL);
wmmhello's avatar
wmmhello 已提交
3061
  while (pIter) {
dengyihao's avatar
dengyihao 已提交
3062
    void*               key = taosHashGetKey(pIter, &keyLen);
3063
    SResultRowPosition* p1 = (SResultRowPosition*)pIter;
3064

dengyihao's avatar
dengyihao 已提交
3065
    pPage = (SFilePage*)getBufPage(pSup->pResultBuf, p1->pageId);
3066
    pRow = (SResultRow*)((char*)pPage + p1->offset);
3067 3068
    setBufPageDirty(pPage, true);
    releaseBufPage(pSup->pResultBuf, pPage);
wmmhello's avatar
wmmhello 已提交
3069 3070 3071

    // recalculate the result size
    int32_t realTotalSize = offset + sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize;
L
Liu Jicong 已提交
3072
    if (realTotalSize > totalSize) {
wmmhello's avatar
wmmhello 已提交
3073
      char* tmp = (char*)taosMemoryRealloc(*result, realTotalSize);
L
Liu Jicong 已提交
3074
      if (tmp == NULL) {
wafwerar's avatar
wafwerar 已提交
3075
        taosMemoryFree(*result);
wmmhello's avatar
wmmhello 已提交
3076
        *result = NULL;
wmmhello's avatar
wmmhello 已提交
3077
        return TSDB_CODE_OUT_OF_MEMORY;
L
Liu Jicong 已提交
3078
      } else {
wmmhello's avatar
wmmhello 已提交
3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090
        *result = tmp;
      }
    }
    // save key
    *(int32_t*)(*result + offset) = keyLen;
    offset += sizeof(int32_t);
    memcpy(*result + offset, key, keyLen);
    offset += keyLen;

    // save value
    *(int32_t*)(*result + offset) = pSup->resultRowSize;
    offset += sizeof(int32_t);
3091
    memcpy(*result + offset, pRow, pSup->resultRowSize);
wmmhello's avatar
wmmhello 已提交
3092 3093 3094 3095 3096
    offset += pSup->resultRowSize;

    pIter = taosHashIterate(pSup->pResultRowHashTable, pIter);
  }

wmmhello's avatar
wmmhello 已提交
3097 3098 3099 3100
  *(int32_t*)(*result) = offset;
  *length = offset;

  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
3101 3102
}

3103
int32_t aggDecodeResultRow(SOperatorInfo* pOperator, char* result) {
3104
  if (result == NULL) {
wmmhello's avatar
wmmhello 已提交
3105
    return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3106
  }
wmmhello's avatar
wmmhello 已提交
3107
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
3108
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
wmmhello's avatar
wmmhello 已提交
3109 3110

  //  int32_t size = taosHashGetSize(pSup->pResultRowHashTable);
3111
  int32_t length = *(int32_t*)(result);
wmmhello's avatar
wmmhello 已提交
3112
  int32_t offset = sizeof(int32_t);
3113 3114 3115 3116

  int32_t count = *(int32_t*)(result + offset);
  offset += sizeof(int32_t);

L
Liu Jicong 已提交
3117
  while (count-- > 0 && length > offset) {
wmmhello's avatar
wmmhello 已提交
3118 3119 3120
    int32_t keyLen = *(int32_t*)(result + offset);
    offset += sizeof(int32_t);

L
Liu Jicong 已提交
3121
    uint64_t    tableGroupId = *(uint64_t*)(result + offset);
3122
    SResultRow* resultRow = getNewResultRow(pSup->pResultBuf, tableGroupId, pSup->resultRowSize);
L
Liu Jicong 已提交
3123
    if (!resultRow) {
wmmhello's avatar
wmmhello 已提交
3124
      return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3125
    }
3126

wmmhello's avatar
wmmhello 已提交
3127
    // add a new result set for a new group
3128 3129
    SResultRowPosition pos = {.pageId = resultRow->pageId, .offset = resultRow->offset};
    taosHashPut(pSup->pResultRowHashTable, result + offset, keyLen, &pos, sizeof(SResultRowPosition));
wmmhello's avatar
wmmhello 已提交
3130 3131 3132

    offset += keyLen;
    int32_t valueLen = *(int32_t*)(result + offset);
L
Liu Jicong 已提交
3133
    if (valueLen != pSup->resultRowSize) {
wmmhello's avatar
wmmhello 已提交
3134
      return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3135 3136 3137 3138 3139 3140 3141 3142 3143 3144
    }
    offset += sizeof(int32_t);
    int32_t pageId = resultRow->pageId;
    int32_t pOffset = resultRow->offset;
    memcpy(resultRow, result + offset, valueLen);
    resultRow->pageId = pageId;
    resultRow->offset = pOffset;
    offset += valueLen;

    initResultRow(resultRow);
dengyihao's avatar
dengyihao 已提交
3145
    pInfo->resultRowInfo.cur = (SResultRowPosition){.pageId = resultRow->pageId, .offset = resultRow->offset};
wmmhello's avatar
wmmhello 已提交
3146 3147
  }

L
Liu Jicong 已提交
3148
  if (offset != length) {
wmmhello's avatar
wmmhello 已提交
3149
    return TSDB_CODE_TSC_INVALID_INPUT;
wmmhello's avatar
wmmhello 已提交
3150
  }
wmmhello's avatar
wmmhello 已提交
3151
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
3152 3153
}

3154 3155
enum {
  PROJECT_RETRIEVE_CONTINUE = 0x1,
L
Liu Jicong 已提交
3156
  PROJECT_RETRIEVE_DONE = 0x2,
3157 3158 3159 3160 3161
};

static int32_t handleLimitOffset(SOperatorInfo* pOperator, SSDataBlock* pBlock) {
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
  SOptrBasicInfo*       pInfo = &pProjectInfo->binfo;
L
Liu Jicong 已提交
3162
  SSDataBlock*          pRes = pInfo->pRes;
3163 3164 3165 3166 3167 3168 3169 3170 3171 3172 3173 3174 3175 3176 3177 3178 3179 3180 3181 3182 3183 3184 3185 3186 3187 3188 3189 3190 3191 3192 3193 3194 3195 3196 3197 3198 3199 3200 3201 3202 3203 3204 3205 3206 3207 3208 3209 3210

  if (pProjectInfo->curSOffset > 0) {
    if (pProjectInfo->groupId == 0) {  // it is the first group
      pProjectInfo->groupId = pBlock->info.groupId;
      blockDataCleanup(pInfo->pRes);
      return PROJECT_RETRIEVE_CONTINUE;
    } else if (pProjectInfo->groupId != pBlock->info.groupId) {
      pProjectInfo->curSOffset -= 1;

      // ignore data block in current group
      if (pProjectInfo->curSOffset > 0) {
        blockDataCleanup(pInfo->pRes);
        return PROJECT_RETRIEVE_CONTINUE;
      }
    }

    // set current group id of the project operator
    pProjectInfo->groupId = pBlock->info.groupId;
  }

  if (pProjectInfo->groupId != 0 && pProjectInfo->groupId != pBlock->info.groupId) {
    pProjectInfo->curGroupOutput += 1;
    if ((pProjectInfo->slimit.limit > 0) && (pProjectInfo->slimit.limit <= pProjectInfo->curGroupOutput)) {
      pOperator->status = OP_EXEC_DONE;
      blockDataCleanup(pRes);

      return PROJECT_RETRIEVE_DONE;
    }

    // reset the value for a new group data
    pProjectInfo->curOffset = 0;
    pProjectInfo->curOutput = 0;
  }

  // here we reach the start position, according to the limit/offset requirements.

  // set current group id
  pProjectInfo->groupId = pBlock->info.groupId;

  if (pProjectInfo->curOffset >= pRes->info.rows) {
    pProjectInfo->curOffset -= pRes->info.rows;
    blockDataCleanup(pRes);
    return PROJECT_RETRIEVE_CONTINUE;
  } else if (pProjectInfo->curOffset < pRes->info.rows && pProjectInfo->curOffset > 0) {
    blockDataTrimFirstNRows(pRes, pProjectInfo->curOffset);
    pProjectInfo->curOffset = 0;
  }

3211
  // check for the limitation in each group
wmmhello's avatar
wmmhello 已提交
3212 3213 3214
  if (pProjectInfo->limit.limit >= 0 && pProjectInfo->curOutput + pRes->info.rows >= pProjectInfo->limit.limit) {
    int32_t keepRows = (int32_t)(pProjectInfo->limit.limit - pProjectInfo->curOutput);
    blockDataKeepFirstNRows(pRes, keepRows);
3215
    if (pProjectInfo->slimit.limit > 0 && pProjectInfo->slimit.limit <= pProjectInfo->curGroupOutput) {
3216 3217 3218
      pOperator->status = OP_EXEC_DONE;
    }

3219
    return PROJECT_RETRIEVE_DONE;
3220
  }
3221

3222
  // todo optimize performance
3223 3224
  // If there are slimit/soffset value exists, multi-round result can not be packed into one group, since the
  // they may not belong to the same group the limit/offset value is not valid in this case.
L
Liu Jicong 已提交
3225 3226
  if (pRes->info.rows >= pOperator->resultInfo.threshold || pProjectInfo->slimit.offset != -1 ||
      pProjectInfo->slimit.limit != -1) {
3227
    return PROJECT_RETRIEVE_DONE;
L
Liu Jicong 已提交
3228
  } else {  // not full enough, continue to accumulate the output data in the buffer.
3229 3230 3231 3232
    return PROJECT_RETRIEVE_CONTINUE;
  }
}

3233
static SSDataBlock* doProjectOperation(SOperatorInfo* pOperator) {
3234
  SProjectOperatorInfo* pProjectInfo = pOperator->info;
L
Liu Jicong 已提交
3235
  SOptrBasicInfo*       pInfo = &pProjectInfo->binfo;
3236

L
Liu Jicong 已提交
3237
  SExprSupp*   pSup = &pOperator->exprSupp;
3238
  SSDataBlock* pRes = pInfo->pRes;
3239
  blockDataCleanup(pRes);
3240

3241
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
3242 3243 3244
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }
dengyihao's avatar
dengyihao 已提交
3245

H
Haojun Liao 已提交
3246
#if 0
3247 3248 3249 3250 3251
  if (pProjectInfo->existDataBlock) {  // TODO refactor
    SSDataBlock* pBlock = pProjectInfo->existDataBlock;
    pProjectInfo->existDataBlock = NULL;

    // the pDataBlock are always the same one, no need to call this again
H
Haojun Liao 已提交
3252
    setInputDataBlock(pOperator, pInfo->pCtx, pBlock, TSDB_ORDER_ASC);
3253

H
Haojun Liao 已提交
3254
    blockDataEnsureCapacity(pInfo->pRes, pBlock->info.rows);
3255
    projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
L
Liu Jicong 已提交
3256
    if (pRes->info.rows >= pProjectInfo->binfo.capacity * 0.8) {
3257 3258
      copyTsColoum(pRes, pInfo->pCtx, pOperator->exprSupp.numOfExprs);
      resetResultRowEntryResult(pInfo->pCtx, pOperator->exprSupp.numOfExprs);
3259 3260 3261
      return pRes;
    }
  }
H
Haojun Liao 已提交
3262
#endif
3263

3264
  int64_t st = 0;
3265 3266 3267
  int32_t order = 0;
  int32_t scanFlag = 0;

3268 3269 3270 3271
  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

H
Haojun Liao 已提交
3272 3273
  SOperatorInfo* downstream = pOperator->pDownstream[0];

L
Liu Jicong 已提交
3274
  while (1) {
H
Haojun Liao 已提交
3275
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
3276
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
3277
    if (pBlock == NULL) {
3278
      doSetOperatorCompleted(pOperator);
3279 3280
      break;
    }
3281 3282 3283 3284
    if (pBlock->info.type == STREAM_RETRIEVE) {
      // for stream interval
      return pBlock;
    }
3285 3286

    // the pDataBlock are always the same one, no need to call this again
3287
    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &order, &scanFlag);
3288 3289 3290
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
3291

3292
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
3293 3294
    blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

3295
    code = projectApplyFunctions(pSup->pExprInfo, pInfo->pRes, pBlock, pSup->pCtx, pSup->numOfExprs,
X
Xiaoyu Wang 已提交
3296
                                 pProjectInfo->pPseudoColInfo);
3297 3298
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
3299 3300
    }

3301
    int32_t status = handleLimitOffset(pOperator, pBlock);
3302 3303 3304 3305

    // filter shall be applied after apply functions and limit/offset on the result
    doFilter(pProjectInfo->pFilterNode, pInfo->pRes);

3306
    if (status == PROJECT_RETRIEVE_CONTINUE) {
H
Haojun Liao 已提交
3307
      continue;
L
Liu Jicong 已提交
3308
    } else if (status == PROJECT_RETRIEVE_DONE) {
3309 3310 3311
      break;
    }
  }
dengyihao's avatar
dengyihao 已提交
3312

H
Haojun Liao 已提交
3313
  pProjectInfo->curOutput += pInfo->pRes->info.rows;
H
Haojun Liao 已提交
3314

3315 3316 3317 3318
  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
3319
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
3320 3321
  }

3322
  return (rows > 0) ? pInfo->pRes : NULL;
3323 3324
}

L
Liu Jicong 已提交
3325 3326
static void doHandleRemainBlockForNewGroupImpl(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo, bool* newgroup,
                                               SExecTaskInfo* pTaskInfo) {
3327
  pInfo->totalInputRows = pInfo->existNewGroupBlock->info.rows;
H
Haojun Liao 已提交
3328

L
Liu Jicong 已提交
3329 3330
  int64_t ekey = Q_STATUS_EQUAL(pTaskInfo->status, TASK_COMPLETED) ? pTaskInfo->window.ekey
                                                                   : pInfo->existNewGroupBlock->info.window.ekey;
3331 3332
  taosResetFillInfo(pInfo->pFillInfo, getFillInfoStart(pInfo->pFillInfo));

3333
  taosFillSetStartInfo(pInfo->pFillInfo, pInfo->existNewGroupBlock->info.rows, ekey);
3334 3335
  taosFillSetInputDataBlock(pInfo->pFillInfo, pInfo->existNewGroupBlock);

3336
  doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pInfo->pRes, pResultInfo->capacity);
3337 3338 3339 3340
  pInfo->existNewGroupBlock = NULL;
  *newgroup = true;
}

L
Liu Jicong 已提交
3341 3342
static void doHandleRemainBlockFromNewGroup(SFillOperatorInfo* pInfo, SResultInfo* pResultInfo, bool* newgroup,
                                            SExecTaskInfo* pTaskInfo) {
3343 3344
  if (taosFillHasMoreResults(pInfo->pFillInfo)) {
    *newgroup = false;
3345
    doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pInfo->pRes, (int32_t)pResultInfo->capacity);
H
Haojun Liao 已提交
3346
    if (pInfo->pRes->info.rows > pResultInfo->threshold || (!pInfo->multigroupResult)) {
3347 3348 3349 3350 3351 3352
      return;
    }
  }

  // handle the cached new group data block
  if (pInfo->existNewGroupBlock) {
3353
    doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, newgroup, pTaskInfo);
3354 3355 3356
  }
}

3357
static SSDataBlock* doFill(SOperatorInfo* pOperator) {
L
Liu Jicong 已提交
3358 3359
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;
3360

H
Haojun Liao 已提交
3361
  SResultInfo* pResultInfo = &pOperator->resultInfo;
3362 3363 3364
  SSDataBlock* pResBlock = pInfo->pRes;

  blockDataCleanup(pResBlock);
3365 3366 3367 3368
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

3369
  // todo handle different group data interpolation
X
Xiaoyu Wang 已提交
3370 3371
  bool  n = false;
  bool* newgroup = &n;
3372
  doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, newgroup, pTaskInfo);
3373 3374
  if (pResBlock->info.rows > pResultInfo->threshold || (!pInfo->multigroupResult && pResBlock->info.rows > 0)) {
    return pResBlock;
H
Haojun Liao 已提交
3375
  }
3376

H
Haojun Liao 已提交
3377
  SOperatorInfo* pDownstream = pOperator->pDownstream[0];
L
Liu Jicong 已提交
3378
  while (1) {
3379
    SSDataBlock* pBlock = pDownstream->fpSet.getNextFn(pDownstream);
3380 3381 3382 3383 3384 3385 3386 3387 3388 3389
    if (*newgroup) {
      assert(pBlock != NULL);
    }

    if (*newgroup && pInfo->totalInputRows > 0) {  // there are already processed current group data block
      pInfo->existNewGroupBlock = pBlock;
      *newgroup = false;

      // Fill the previous group data block, before handle the data block of new group.
      // Close the fill operation for previous group data block
3390
      taosFillSetStartInfo(pInfo->pFillInfo, 0, pTaskInfo->window.ekey);
3391 3392 3393 3394 3395 3396 3397
    } else {
      if (pBlock == NULL) {
        if (pInfo->totalInputRows == 0) {
          pOperator->status = OP_EXEC_DONE;
          return NULL;
        }

3398
        taosFillSetStartInfo(pInfo->pFillInfo, 0, pTaskInfo->window.ekey);
3399 3400 3401 3402 3403 3404 3405
      } else {
        pInfo->totalInputRows += pBlock->info.rows;
        taosFillSetStartInfo(pInfo->pFillInfo, pBlock->info.rows, pBlock->info.window.ekey);
        taosFillSetInputDataBlock(pInfo->pFillInfo, pBlock);
      }
    }

3406 3407
    blockDataEnsureCapacity(pResBlock, pOperator->resultInfo.capacity);
    doFillTimeIntervalGapsInResults(pInfo->pFillInfo, pResBlock, pOperator->resultInfo.capacity);
3408 3409

    // current group has no more result to return
3410
    if (pResBlock->info.rows > 0) {
3411 3412
      // 1. The result in current group not reach the threshold of output result, continue
      // 2. If multiple group results existing in one SSDataBlock is not allowed, return immediately
3413 3414
      if (pResBlock->info.rows > pResultInfo->threshold || pBlock == NULL || (!pInfo->multigroupResult)) {
        return pResBlock;
3415 3416
      }

3417
      doHandleRemainBlockFromNewGroup(pInfo, pResultInfo, newgroup, pTaskInfo);
3418 3419
      if (pResBlock->info.rows > pOperator->resultInfo.threshold || pBlock == NULL) {
        return pResBlock;
3420 3421 3422
      }
    } else if (pInfo->existNewGroupBlock) {  // try next group
      assert(pBlock != NULL);
3423
      doHandleRemainBlockForNewGroupImpl(pInfo, pResultInfo, newgroup, pTaskInfo);
3424 3425
      if (pResBlock->info.rows > pResultInfo->threshold) {
        return pResBlock;
3426 3427 3428 3429 3430 3431 3432
      }
    } else {
      return NULL;
    }
  }
}

H
Haojun Liao 已提交
3433 3434 3435 3436 3437 3438 3439 3440 3441 3442 3443
static void destroyExprInfo(SExprInfo* pExpr, int32_t numOfExprs) {
  for (int32_t i = 0; i < numOfExprs; ++i) {
    SExprInfo* pExprInfo = &pExpr[i];
    if (pExprInfo->pExpr->nodeType == QUERY_NODE_COLUMN) {
      taosMemoryFree(pExprInfo->base.pParam[0].pCol);
    }
    taosMemoryFree(pExprInfo->base.pParam);
    taosMemoryFree(pExprInfo->pExpr);
  }
}

3444 3445 3446 3447 3448
static void destroyOperatorInfo(SOperatorInfo* pOperator) {
  if (pOperator == NULL) {
    return;
  }

3449
  if (pOperator->fpSet.closeFn != NULL) {
3450
    pOperator->fpSet.closeFn(pOperator->info, pOperator->exprSupp.numOfExprs);
3451 3452
  }

H
Haojun Liao 已提交
3453
  if (pOperator->pDownstream != NULL) {
L
Liu Jicong 已提交
3454
    for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
H
Haojun Liao 已提交
3455
      destroyOperatorInfo(pOperator->pDownstream[i]);
3456 3457
    }

wafwerar's avatar
wafwerar 已提交
3458
    taosMemoryFreeClear(pOperator->pDownstream);
H
Haojun Liao 已提交
3459
    pOperator->numOfDownstream = 0;
3460 3461
  }

3462 3463
  if (pOperator->exprSupp.pExprInfo != NULL) {
    destroyExprInfo(pOperator->exprSupp.pExprInfo, pOperator->exprSupp.numOfExprs);
H
Haojun Liao 已提交
3464 3465
  }

3466
  taosMemoryFreeClear(pOperator->exprSupp.pExprInfo);
wafwerar's avatar
wafwerar 已提交
3467 3468
  taosMemoryFreeClear(pOperator->info);
  taosMemoryFreeClear(pOperator);
3469 3470
}

3471 3472 3473 3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484 3485
int32_t getBufferPgSize(int32_t rowSize, uint32_t* defaultPgsz, uint32_t* defaultBufsz) {
  *defaultPgsz = 4096;
  while (*defaultPgsz < rowSize * 4) {
    *defaultPgsz <<= 1u;
  }

  // at least four pages need to be in buffer
  *defaultBufsz = 4096 * 256;
  if ((*defaultBufsz) <= (*defaultPgsz)) {
    (*defaultBufsz) = (*defaultPgsz) * 4;
  }

  return 0;
}

dengyihao's avatar
dengyihao 已提交
3486 3487
int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                         const char* pKey) {
3488 3489
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);

dengyihao's avatar
dengyihao 已提交
3490 3491
  pAggSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pAggSup->keyBuf = taosMemoryCalloc(1, keyBufSize + POINTER_BYTES + sizeof(int64_t));
3492 3493
  pAggSup->pResultRowHashTable = taosHashInit(10, hashFn, true, HASH_NO_LOCK);

H
Haojun Liao 已提交
3494
  if (pAggSup->keyBuf == NULL || pAggSup->pResultRowHashTable == NULL) {
3495 3496 3497
    return TSDB_CODE_OUT_OF_MEMORY;
  }

dengyihao's avatar
dengyihao 已提交
3498
  uint32_t defaultPgsz = 0;
3499 3500
  uint32_t defaultBufsz = 0;
  getBufferPgSize(pAggSup->resultRowSize, &defaultPgsz, &defaultBufsz);
H
Haojun Liao 已提交
3501

3502
  int32_t code = createDiskbasedBuf(&pAggSup->pResultBuf, defaultPgsz, defaultBufsz, pKey, TD_TMP_DIR_PATH);
H
Haojun Liao 已提交
3503 3504 3505 3506
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

3507 3508 3509
  return TSDB_CODE_SUCCESS;
}

3510
void cleanupAggSup(SAggSupporter* pAggSup) {
wafwerar's avatar
wafwerar 已提交
3511
  taosMemoryFreeClear(pAggSup->keyBuf);
3512
  taosHashCleanup(pAggSup->pResultRowHashTable);
H
Haojun Liao 已提交
3513
  destroyDiskbasedBuf(pAggSup->pResultBuf);
3514 3515
}

L
Liu Jicong 已提交
3516 3517
int32_t initAggInfo(SExprSupp* pSup, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols, size_t keyBufSize,
                    const char* pkey) {
3518 3519 3520 3521 3522
  int32_t code = initExprSupp(pSup, pExprInfo, numOfCols);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

3523
  doInitAggInfoSup(pAggSup, pSup->pCtx, numOfCols, keyBufSize, pkey);
L
Liu Jicong 已提交
3524
  for (int32_t i = 0; i < numOfCols; ++i) {
3525
    pSup->pCtx[i].pBuf = pAggSup->pResultBuf;
3526 3527
  }

3528
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
3529 3530
}

3531
void initResultSizeInfo(SOperatorInfo* pOperator, int32_t numOfRows) {
wmmhello's avatar
wmmhello 已提交
3532
  ASSERT(numOfRows != 0);
3533 3534 3535 3536
  pOperator->resultInfo.capacity = numOfRows;
  pOperator->resultInfo.threshold = numOfRows * 0.75;

  if (pOperator->resultInfo.threshold == 0) {
wmmhello's avatar
wmmhello 已提交
3537
    pOperator->resultInfo.threshold = numOfRows;
3538 3539 3540
  }
}

3541 3542 3543 3544 3545
void initBasicInfo(SOptrBasicInfo* pInfo, SSDataBlock* pBlock) {
  pInfo->pRes = pBlock;
  initResultRowInfo(&pInfo->resultRowInfo);
}

3546
int32_t initExprSupp(SExprSupp* pSup, SExprInfo* pExprInfo, int32_t numOfExpr) {
3547 3548 3549 3550
  pSup->pExprInfo = pExprInfo;
  pSup->numOfExprs = numOfExpr;
  if (pSup->pExprInfo != NULL) {
    pSup->pCtx = createSqlFunctionCtx(pExprInfo, numOfExpr, &pSup->rowEntryInfoOffset);
3551 3552 3553
    if (pSup->pCtx == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
3554
  }
3555 3556

  return TSDB_CODE_SUCCESS;
3557 3558
}

L
Liu Jicong 已提交
3559
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
3560
                                           SSDataBlock* pResultBlock, SExprInfo* pScalarExprInfo,
wmmhello's avatar
wmmhello 已提交
3561
                                           int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3562
  SAggOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SAggOperatorInfo));
L
Liu Jicong 已提交
3563
  SOperatorInfo*    pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3564 3565 3566
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
H
Haojun Liao 已提交
3567

3568
  int32_t numOfRows = 1024;
dengyihao's avatar
dengyihao 已提交
3569
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3570 3571

  initResultSizeInfo(pOperator, numOfRows);
3572
  int32_t code = initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
L
Liu Jicong 已提交
3573
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3574 3575
    goto _error;
  }
H
Haojun Liao 已提交
3576

3577
  initBasicInfo(&pInfo->binfo, pResultBlock);
3578 3579 3580 3581
  code = initExprSupp(&pInfo->scalarExprSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3582

L
Liu Jicong 已提交
3583
  pInfo->groupId = INT32_MIN;
dengyihao's avatar
dengyihao 已提交
3584
  pOperator->name = "TableAggregate";
3585
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_HASH_AGG;
3586
  pOperator->blocking = true;
dengyihao's avatar
dengyihao 已提交
3587 3588 3589
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3590

3591 3592
  pOperator->fpSet = createOperatorFpSet(doOpenAggregateOptr, getAggregateResult, NULL, NULL, destroyAggOperatorInfo,
                                         aggEncodeResultRow, aggDecodeResultRow, NULL);
H
Haojun Liao 已提交
3593 3594 3595 3596 3597

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3598 3599

  return pOperator;
L
Liu Jicong 已提交
3600
_error:
H
Haojun Liao 已提交
3601
  destroyAggOperatorInfo(pInfo, numOfCols);
wafwerar's avatar
wafwerar 已提交
3602 3603
  taosMemoryFreeClear(pInfo);
  taosMemoryFreeClear(pOperator);
H
Haojun Liao 已提交
3604 3605
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3606 3607
}

3608 3609 3610 3611 3612 3613 3614 3615 3616 3617 3618 3619 3620 3621 3622 3623 3624 3625 3626
static void* destroySqlFunctionCtx(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  if (pCtx == NULL) {
    return NULL;
  }

  for (int32_t i = 0; i < numOfOutput; ++i) {
    for (int32_t j = 0; j < pCtx[i].numOfParams; ++j) {
      taosVariantDestroy(&pCtx[i].param[j].param);
    }

    taosMemoryFreeClear(pCtx[i].subsidiaries.pCtx);
    taosMemoryFree(pCtx[i].input.pData);
    taosMemoryFree(pCtx[i].input.pColumnDataAgg);
  }

  taosMemoryFreeClear(pCtx);
  return NULL;
}

3627
void cleanupBasicInfo(SOptrBasicInfo* pInfo) {
3628 3629
  assert(pInfo != NULL);
  cleanupResultRowInfo(&pInfo->resultRowInfo);
H
Haojun Liao 已提交
3630
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
3631 3632
}

H
Haojun Liao 已提交
3633
void destroyBasicOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3634
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)param;
3635
  cleanupBasicInfo(pInfo);
3636
}
H
Haojun Liao 已提交
3637 3638

void destroyAggOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3639
  SAggOperatorInfo* pInfo = (SAggOperatorInfo*)param;
3640
  cleanupBasicInfo(&pInfo->binfo);
3641
}
3642

H
Haojun Liao 已提交
3643
void destroySFillOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3644
  SFillOperatorInfo* pInfo = (SFillOperatorInfo*)param;
3645
  pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
H
Haojun Liao 已提交
3646
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
wafwerar's avatar
wafwerar 已提交
3647
  taosMemoryFreeClear(pInfo->p);
3648 3649
}

H
Haojun Liao 已提交
3650
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput) {
D
fix bug  
dapan 已提交
3651 3652 3653
  if (NULL == param) {
    return;
  }
L
Liu Jicong 已提交
3654
  SProjectOperatorInfo* pInfo = (SProjectOperatorInfo*)param;
3655
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3656
  cleanupAggSup(&pInfo->aggSup);
H
Haojun Liao 已提交
3657
  taosArrayDestroy(pInfo->pPseudoColInfo);
3658 3659
}

3660
void cleanupExprSupp(SExprSupp* pSupp) {
3661 3662 3663 3664 3665 3666
  destroySqlFunctionCtx(pSupp->pCtx, pSupp->numOfExprs);
  destroyExprInfo(pSupp->pExprInfo, pSupp->numOfExprs);

  taosMemoryFree(pSupp->rowEntryInfoOffset);
}

H
Haojun Liao 已提交
3667
static void destroyIndefinitOperatorInfo(void* param, int32_t numOfOutput) {
3668
  SIndefOperatorInfo* pInfo = (SIndefOperatorInfo*)param;
3669
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
3670 3671 3672

  taosArrayDestroy(pInfo->pPseudoColInfo);
  cleanupAggSup(&pInfo->aggSup);
3673
  cleanupExprSupp(&pInfo->scalarSup);
H
Haojun Liao 已提交
3674 3675
}

H
Haojun Liao 已提交
3676
void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3677
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3678 3679 3680 3681
  taosRemoveRef(exchangeObjRefPool, pExInfo->self);
}

void doDestroyExchangeOperatorInfo(void* param) {
X
Xiaoyu Wang 已提交
3682
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3683

H
Haojun Liao 已提交
3684 3685 3686 3687 3688 3689 3690 3691 3692
  taosArrayDestroy(pExInfo->pSources);
  taosArrayDestroy(pExInfo->pSourceDataInfo);
  if (pExInfo->pResult != NULL) {
    blockDataDestroy(pExInfo->pResult);
  }

  tsem_destroy(&pExInfo->ready);
}

H
Haojun Liao 已提交
3693 3694
static SArray* setRowTsColumnOutputInfo(SqlFunctionCtx* pCtx, int32_t numOfCols) {
  SArray* pList = taosArrayInit(4, sizeof(int32_t));
dengyihao's avatar
dengyihao 已提交
3695
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
3696 3697 3698 3699 3700 3701 3702 3703
    if (fmIsPseudoColumnFunc(pCtx[i].functionId)) {
      taosArrayPush(pList, &i);
    }
  }

  return pList;
}

3704 3705 3706 3707
static int64_t getLimit(SNode* pLimit) { return NULL == pLimit ? -1 : ((SLimitNode*)pLimit)->limit; }

static int64_t getOffset(SNode* pLimit) { return NULL == pLimit ? -1 : ((SLimitNode*)pLimit)->offset; }

L
Liu Jicong 已提交
3708
SOperatorInfo* createProjectOperatorInfo(SOperatorInfo* downstream, SProjectPhysiNode* pProjPhyNode,
dengyihao's avatar
dengyihao 已提交
3709
                                         SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3710
  SProjectOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SProjectOperatorInfo));
L
Liu Jicong 已提交
3711
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3712 3713 3714
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
3715

L
Liu Jicong 已提交
3716
  int32_t    numOfCols = 0;
3717 3718 3719
  SExprInfo* pExprInfo = createExprInfo(pProjPhyNode->pProjections, NULL, &numOfCols);

  SSDataBlock* pResBlock = createResDataBlock(pProjPhyNode->node.pOutputDataBlockDesc);
3720 3721
  SLimit       limit = {.limit = getLimit(pProjPhyNode->node.pLimit), .offset = getOffset(pProjPhyNode->node.pLimit)};
  SLimit slimit = {.limit = getLimit(pProjPhyNode->node.pSlimit), .offset = getOffset(pProjPhyNode->node.pSlimit)};
3722

L
Liu Jicong 已提交
3723 3724 3725 3726
  pInfo->limit = limit;
  pInfo->slimit = slimit;
  pInfo->curOffset = limit.offset;
  pInfo->curSOffset = slimit.offset;
H
Haojun Liao 已提交
3727
  pInfo->binfo.pRes = pResBlock;
3728
  pInfo->pFilterNode = pProjPhyNode->node.pConditions;
H
Haojun Liao 已提交
3729 3730

  int32_t numOfRows = 4096;
dengyihao's avatar
dengyihao 已提交
3731
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3732

3733 3734 3735 3736 3737
  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
3738
  initResultSizeInfo(pOperator, numOfRows);
3739

3740 3741
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);
3742
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfCols);
3743

3744
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pOperator->exprSupp.pCtx, numOfCols);
X
Xiaoyu Wang 已提交
3745
  pOperator->name = "ProjectOperator";
H
Haojun Liao 已提交
3746
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
X
Xiaoyu Wang 已提交
3747 3748 3749 3750
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
3751

L
Liu Jicong 已提交
3752 3753
  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doProjectOperation, NULL, NULL,
                                         destroyProjectOperatorInfo, NULL, NULL, NULL);
L
Liu Jicong 已提交
3754

3755
  int32_t code = appendDownstream(pOperator, &downstream, 1);
H
Haojun Liao 已提交
3756
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3757 3758
    goto _error;
  }
3759 3760

  return pOperator;
H
Haojun Liao 已提交
3761

L
Liu Jicong 已提交
3762
_error:
H
Haojun Liao 已提交
3763 3764
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3765 3766
}

H
Haojun Liao 已提交
3767 3768
static SSDataBlock* doApplyIndefinitFunction(SOperatorInfo* pOperator) {
  SIndefOperatorInfo* pIndefInfo = pOperator->info;
3769
  SOptrBasicInfo*     pInfo = &pIndefInfo->binfo;
L
Liu Jicong 已提交
3770
  SExprSupp*          pSup = &pOperator->exprSupp;
H
Haojun Liao 已提交
3771 3772 3773 3774 3775 3776 3777 3778 3779 3780 3781 3782 3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801 3802 3803 3804

  SSDataBlock* pRes = pInfo->pRes;
  blockDataCleanup(pRes);

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  int64_t st = 0;
  int32_t order = 0;
  int32_t scanFlag = 0;

  if (pOperator->cost.openCost == 0) {
    st = taosGetTimestampUs();
  }

  SOperatorInfo* downstream = pOperator->pDownstream[0];

  while (1) {
    // The downstream exec may change the value of the newgroup, so use a local variable instead.
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
    if (pBlock == NULL) {
      doSetOperatorCompleted(pOperator);
      break;
    }

    // the pDataBlock are always the same one, no need to call this again
    int32_t code = getTableScanInfo(pOperator->pDownstream[0], &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    // there is an scalar expression that needs to be calculated before apply the group aggregation.
3805
    SExprSupp* pScalarSup = &pIndefInfo->scalarSup;
3806 3807
    if (pScalarSup->pExprInfo != NULL) {
      code = projectApplyFunctions(pScalarSup->pExprInfo, pBlock, pBlock, pScalarSup->pCtx, pScalarSup->numOfExprs,
L
Liu Jicong 已提交
3808
                                   pIndefInfo->pPseudoColInfo);
H
Haojun Liao 已提交
3809 3810 3811 3812 3813
      if (code != TSDB_CODE_SUCCESS) {
        longjmp(pTaskInfo->env, code);
      }
    }

3814
    setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
H
Haojun Liao 已提交
3815 3816
    blockDataEnsureCapacity(pInfo->pRes, pInfo->pRes->info.rows + pBlock->info.rows);

L
Liu Jicong 已提交
3817 3818
    code = projectApplyFunctions(pOperator->exprSupp.pExprInfo, pInfo->pRes, pBlock, pSup->pCtx,
                                 pOperator->exprSupp.numOfExprs, pIndefInfo->pPseudoColInfo);
H
Haojun Liao 已提交
3819 3820 3821 3822 3823 3824 3825 3826 3827 3828 3829 3830 3831 3832 3833
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }
  }

  size_t rows = pInfo->pRes->info.rows;
  pOperator->resultInfo.totalRows += rows;

  if (pOperator->cost.openCost == 0) {
    pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;
  }

  return (rows > 0) ? pInfo->pRes : NULL;
}

3834 3835
SOperatorInfo* createIndefinitOutputOperatorInfo(SOperatorInfo* downstream, SPhysiNode* pNode,
                                                 SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
3836
  SIndefOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SIndefOperatorInfo));
3837
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3838 3839 3840 3841
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

3842 3843
  SExprSupp* pSup = &pOperator->exprSupp;

H
Haojun Liao 已提交
3844 3845 3846
  SIndefRowsFuncPhysiNode* pPhyNode = (SIndefRowsFuncPhysiNode*)pNode;

  int32_t    numOfExpr = 0;
X
Xiaoyu Wang 已提交
3847
  SExprInfo* pExprInfo = createExprInfo(pPhyNode->pFuncs, NULL, &numOfExpr);
H
Haojun Liao 已提交
3848 3849

  if (pPhyNode->pExprs != NULL) {
3850
    int32_t    num = 0;
3851
    SExprInfo* pSExpr = createExprInfo(pPhyNode->pExprs, NULL, &num);
3852
    int32_t    code = initExprSupp(&pInfo->scalarSup, pSExpr, num);
3853 3854 3855
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
H
Haojun Liao 已提交
3856 3857
  }

3858
  SSDataBlock* pResBlock = createResDataBlock(pPhyNode->node.pOutputDataBlockDesc);
H
Haojun Liao 已提交
3859 3860 3861 3862 3863 3864 3865 3866 3867 3868 3869

  int32_t numOfRows = 4096;
  size_t  keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;

  // Make sure the size of SSDataBlock will never exceed the size of 2MB.
  int32_t TWOMB = 2 * 1024 * 1024;
  if (numOfRows * pResBlock->info.rowSize > TWOMB) {
    numOfRows = TWOMB / pResBlock->info.rowSize;
  }
  initResultSizeInfo(pOperator, numOfRows);

3870 3871 3872
  initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfExpr, keyBufSize, pTaskInfo->id.str);
  initBasicInfo(&pInfo->binfo, pResBlock);

3873
  setFunctionResultOutput(pOperator, &pInfo->binfo, &pInfo->aggSup, MAIN_SCAN, numOfExpr);
H
Haojun Liao 已提交
3874

3875 3876
  pInfo->binfo.pRes = pResBlock;
  pInfo->pPseudoColInfo = setRowTsColumnOutputInfo(pSup->pCtx, numOfExpr);
H
Haojun Liao 已提交
3877

3878
  pOperator->name = "IndefinitOperator";
H
Haojun Liao 已提交
3879
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_PROJECT;
3880 3881 3882
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
3883
  pOperator->exprSupp.numOfExprs = numOfExpr;
3884
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3885 3886 3887 3888 3889 3890 3891 3892 3893 3894 3895

  pOperator->fpSet = createOperatorFpSet(operatorDummyOpenFn, doApplyIndefinitFunction, NULL, NULL,
                                         destroyIndefinitOperatorInfo, NULL, NULL, NULL);

  int32_t code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

3896
_error:
H
Haojun Liao 已提交
3897 3898 3899 3900 3901 3902
  taosMemoryFree(pInfo);
  taosMemoryFree(pOperator);
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}

3903
static int32_t initFillInfo(SFillOperatorInfo* pInfo, SExprInfo* pExpr, int32_t numOfCols, SNodeListNode* pValNode,
L
Liu Jicong 已提交
3904
                            STimeWindow win, int32_t capacity, const char* id, SInterval* pInterval, int32_t fillType) {
3905
  SFillColInfo* pColInfo = createFillColInfo(pExpr, numOfCols, pValNode);
H
Haojun Liao 已提交
3906 3907

  STimeWindow w = TSWINDOW_INITIALIZER;
3908
  getAlignQueryTimeWindow(pInterval, pInterval->precision, win.skey, &w);
H
Haojun Liao 已提交
3909 3910

  int32_t order = TSDB_ORDER_ASC;
3911
  pInfo->pFillInfo = taosCreateFillInfo(order, w.skey, 0, capacity, numOfCols, pInterval, fillType, pColInfo, id);
H
Haojun Liao 已提交
3912

wafwerar's avatar
wafwerar 已提交
3913
  pInfo->p = taosMemoryCalloc(numOfCols, POINTER_BYTES);
H
Haojun Liao 已提交
3914
  if (pInfo->pFillInfo == NULL || pInfo->p == NULL) {
H
Haojun Liao 已提交
3915 3916
    taosMemoryFree(pInfo->pFillInfo);
    taosMemoryFree(pInfo->p);
H
Haojun Liao 已提交
3917 3918 3919 3920 3921 3922
    return TSDB_CODE_OUT_OF_MEMORY;
  } else {
    return TSDB_CODE_SUCCESS;
  }
}

3923 3924 3925 3926 3927 3928 3929 3930
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SFillPhysiNode* pPhyFillNode, bool multigroupResult,
                                      SExecTaskInfo* pTaskInfo) {
  SFillOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SFillOperatorInfo));
  SOperatorInfo*     pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

L
Liu Jicong 已提交
3931 3932 3933 3934 3935
  int32_t      num = 0;
  SSDataBlock* pResBlock = createResDataBlock(pPhyFillNode->node.pOutputDataBlockDesc);
  SExprInfo*   pExprInfo = createExprInfo(pPhyFillNode->pTargets, NULL, &num);
  SInterval*   pInterval = &((SIntervalAggOperatorInfo*)downstream->info)->interval;
  int32_t      type = convertFillType(pPhyFillNode->mode);
3936

H
Haojun Liao 已提交
3937
  SResultInfo* pResultInfo = &pOperator->resultInfo;
3938 3939
  initResultSizeInfo(pOperator, 4096);

3940 3941
  int32_t code = initFillInfo(pInfo, pExprInfo, num, (SNodeListNode*)pPhyFillNode->pValues, pPhyFillNode->timeRange,
                              pResultInfo->capacity, pTaskInfo->id.str, pInterval, type);
3942 3943 3944
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3945

L
Liu Jicong 已提交
3946
  pInfo->pRes = pResBlock;
3947
  pInfo->multigroupResult = multigroupResult;
dengyihao's avatar
dengyihao 已提交
3948
  pOperator->name = "FillOperator";
3949
  pOperator->blocking = false;
dengyihao's avatar
dengyihao 已提交
3950
  pOperator->status = OP_NOT_OPENED;
3951
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_FILL;
3952 3953 3954 3955
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->exprSupp.numOfExprs = num;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3956

L
Liu Jicong 已提交
3957 3958
  pOperator->fpSet =
      createOperatorFpSet(operatorDummyOpenFn, doFill, NULL, NULL, destroySFillOperatorInfo, NULL, NULL, NULL);
3959

3960
  code = appendDownstream(pOperator, &downstream, 1);
3961
  return pOperator;
H
Haojun Liao 已提交
3962

L
Liu Jicong 已提交
3963
_error:
wafwerar's avatar
wafwerar 已提交
3964 3965
  taosMemoryFreeClear(pOperator);
  taosMemoryFreeClear(pInfo);
H
Haojun Liao 已提交
3966
  return NULL;
3967 3968
}

D
dapan1121 已提交
3969
static SExecTaskInfo* createExecTaskInfo(uint64_t queryId, uint64_t taskId, EOPTR_EXEC_MODEL model, char* dbFName) {
wafwerar's avatar
wafwerar 已提交
3970
  SExecTaskInfo* pTaskInfo = taosMemoryCalloc(1, sizeof(SExecTaskInfo));
3971
  setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);
H
Haojun Liao 已提交
3972

D
dapan1121 已提交
3973
  pTaskInfo->schemaVer.dbname = strdup(dbFName);
3974
  pTaskInfo->cost.created = taosGetTimestampMs();
H
Haojun Liao 已提交
3975
  pTaskInfo->id.queryId = queryId;
dengyihao's avatar
dengyihao 已提交
3976
  pTaskInfo->execModel = model;
H
Haojun Liao 已提交
3977

wafwerar's avatar
wafwerar 已提交
3978
  char* p = taosMemoryCalloc(1, 128);
L
Liu Jicong 已提交
3979
  snprintf(p, 128, "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, queryId);
H
Haojun Liao 已提交
3980
  pTaskInfo->id.str = p;
H
Haojun Liao 已提交
3981

3982 3983
  return pTaskInfo;
}
H
Haojun Liao 已提交
3984

H
Haojun Liao 已提交
3985
static SArray* extractColumnInfo(SNodeList* pNodeList);
3986

D
dapan1121 已提交
3987
int32_t extractTableSchemaVersion(SReadHandle* pHandle, uint64_t uid, SExecTaskInfo* pTaskInfo) {
3988 3989
  SMetaReader mr = {0};
  metaReaderInit(&mr, pHandle->meta, 0);
D
dapan1121 已提交
3990 3991 3992 3993 3994
  int32_t code = metaGetTableEntryByUid(&mr, uid);
  if (code) {
    metaReaderClear(&mr);
    return code;
  }
3995 3996 3997 3998

  pTaskInfo->schemaVer.tablename = strdup(mr.me.name);

  if (mr.me.type == TSDB_SUPER_TABLE) {
3999 4000
    pTaskInfo->schemaVer.sversion = mr.me.stbEntry.schemaRow.version;
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
4001 4002 4003
  } else if (mr.me.type == TSDB_CHILD_TABLE) {
    tb_uid_t suid = mr.me.ctbEntry.suid;
    metaGetTableEntryByUid(&mr, suid);
4004 4005
    pTaskInfo->schemaVer.sversion = mr.me.stbEntry.schemaRow.version;
    pTaskInfo->schemaVer.tversion = mr.me.stbEntry.schemaTag.version;
4006
  } else {
4007
    pTaskInfo->schemaVer.sversion = mr.me.ntbEntry.schemaRow.version;
4008
  }
4009 4010

  metaReaderClear(&mr);
D
dapan1121 已提交
4011 4012

  return TSDB_CODE_SUCCESS;
4013 4014
}

4015
static int32_t sortTableGroup(STableListInfo* pTableListInfo, int32_t groupNum) {
wmmhello's avatar
wmmhello 已提交
4016
  taosArrayClear(pTableListInfo->pGroupList);
4017 4018
  SArray* sortSupport = taosArrayInit(groupNum, sizeof(uint64_t));
  if (sortSupport == NULL) return TSDB_CODE_OUT_OF_MEMORY;
wmmhello's avatar
wmmhello 已提交
4019 4020
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
4021
    uint64_t*      groupId = taosHashGet(pTableListInfo->map, &info->uid, sizeof(uint64_t));
wmmhello's avatar
wmmhello 已提交
4022 4023

    int32_t index = taosArraySearchIdx(sortSupport, groupId, compareUint64Val, TD_EQ);
4024 4025 4026 4027
    if (index == -1) {
      void*   p = taosArraySearch(sortSupport, groupId, compareUint64Val, TD_GT);
      SArray* tGroup = taosArrayInit(8, sizeof(STableKeyInfo));
      if (tGroup == NULL) {
wmmhello's avatar
wmmhello 已提交
4028 4029 4030
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
4031
      if (taosArrayPush(tGroup, info) == NULL) {
wmmhello's avatar
wmmhello 已提交
4032 4033 4034 4035
        qError("taos push info array error");
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }
4036
      if (p == NULL) {
wmmhello's avatar
wmmhello 已提交
4037
        if (taosArrayPush(sortSupport, groupId) == NULL) {
wmmhello's avatar
wmmhello 已提交
4038 4039 4040 4041
          qError("taos push support array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
wmmhello's avatar
wmmhello 已提交
4042
        if (taosArrayPush(pTableListInfo->pGroupList, &tGroup) == NULL) {
wmmhello's avatar
wmmhello 已提交
4043 4044 4045 4046
          qError("taos push group array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
4047
      } else {
wmmhello's avatar
wmmhello 已提交
4048
        int32_t pos = TARRAY_ELEM_IDX(sortSupport, p);
4049
        if (taosArrayInsert(sortSupport, pos, groupId) == NULL) {
wmmhello's avatar
wmmhello 已提交
4050 4051 4052 4053
          qError("taos insert support array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
4054
        if (taosArrayInsert(pTableListInfo->pGroupList, pos, &tGroup) == NULL) {
wmmhello's avatar
wmmhello 已提交
4055 4056 4057 4058 4059
          qError("taos insert group array error");
          taosArrayDestroy(sortSupport);
          return TSDB_CODE_QRY_APP_ERROR;
        }
      }
4060
    } else {
wmmhello's avatar
wmmhello 已提交
4061
      SArray* tGroup = (SArray*)taosArrayGetP(pTableListInfo->pGroupList, index);
4062
      if (taosArrayPush(tGroup, info) == NULL) {
wmmhello's avatar
wmmhello 已提交
4063 4064 4065 4066 4067 4068 4069 4070 4071 4072
        qError("taos push uid array error");
        taosArrayDestroy(sortSupport);
        return TSDB_CODE_QRY_APP_ERROR;
      }
    }
  }
  taosArrayDestroy(sortSupport);
  return TDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
4073 4074
int32_t generateGroupIdMap(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group) {
  if (group == NULL) {
wmmhello's avatar
wmmhello 已提交
4075 4076 4077 4078 4079 4080 4081 4082
    return TDB_CODE_SUCCESS;
  }

  pTableListInfo->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pTableListInfo->map == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  int32_t keyLen = 0;
X
Xiaoyu Wang 已提交
4083
  void*   keyBuf = NULL;
wmmhello's avatar
wmmhello 已提交
4084

4085
  SNode* node;
wmmhello's avatar
wmmhello 已提交
4086
  FOREACH(node, group) {
4087
    SExprNode* pExpr = (SExprNode*)node;
wmmhello's avatar
wmmhello 已提交
4088
    keyLen += pExpr->resType.bytes;
wmmhello's avatar
wmmhello 已提交
4089 4090
  }

wmmhello's avatar
wmmhello 已提交
4091
  int32_t nullFlagSize = sizeof(int8_t) * LIST_LENGTH(group);
wmmhello's avatar
wmmhello 已提交
4092 4093 4094 4095 4096 4097 4098
  keyLen += nullFlagSize;

  keyBuf = taosMemoryCalloc(1, keyLen);
  if (keyBuf == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

4099
  int32_t groupNum = 0;
X
Xiaoyu Wang 已提交
4100 4101 4102
  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    SMetaReader    mr = {0};
wmmhello's avatar
wmmhello 已提交
4103 4104 4105
    metaReaderInit(&mr, pHandle->meta, 0);
    metaGetTableEntryByUid(&mr, info->uid);

4106
    SNodeList* groupNew = nodesCloneList(group);
wmmhello's avatar
wmmhello 已提交
4107

wmmhello's avatar
wmmhello 已提交
4108
    nodesRewriteExprsPostOrder(groupNew, doTranslateTagExpr, &mr);
wmmhello's avatar
wmmhello 已提交
4109
    char* isNull = (char*)keyBuf;
wmmhello's avatar
wmmhello 已提交
4110 4111
    char* pStart = (char*)keyBuf + nullFlagSize;

4112
    SNode*  pNode;
wmmhello's avatar
wmmhello 已提交
4113
    int32_t index = 0;
4114
    FOREACH(pNode, groupNew) {
wmmhello's avatar
wmmhello 已提交
4115 4116 4117 4118
      SNode*  pNew = NULL;
      int32_t code = scalarCalculateConstants(pNode, &pNew);
      if (TSDB_CODE_SUCCESS == code) {
        REPLACE_NODE(pNew);
X
Xiaoyu Wang 已提交
4119
      } else {
4120
        taosMemoryFree(keyBuf);
wmmhello's avatar
wmmhello 已提交
4121
        nodesClearList(groupNew);
4122
        metaReaderClear(&mr);
wmmhello's avatar
wmmhello 已提交
4123
        return code;
wmmhello's avatar
wmmhello 已提交
4124
      }
4125

wmmhello's avatar
wmmhello 已提交
4126
      ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
4127
      SValueNode* pValue = (SValueNode*)pNew;
4128

wmmhello's avatar
wmmhello 已提交
4129
      if (pValue->node.resType.type == TSDB_DATA_TYPE_NULL || pValue->isNull) {
wmmhello's avatar
wmmhello 已提交
4130 4131 4132 4133
        isNull[index++] = 1;
        continue;
      } else {
        isNull[index++] = 0;
4134
        char* data = nodesGetValueFromNode(pValue);
L
Liu Jicong 已提交
4135 4136
        if (pValue->node.resType.type == TSDB_DATA_TYPE_JSON) {
          if (tTagIsJson(data)) {
wmmhello's avatar
wmmhello 已提交
4137 4138 4139
            terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
            taosMemoryFree(keyBuf);
            nodesClearList(groupNew);
4140
            metaReaderClear(&mr);
wmmhello's avatar
wmmhello 已提交
4141 4142
            return terrno;
          }
wmmhello's avatar
wmmhello 已提交
4143
          int32_t len = getJsonValueLen(data);
wmmhello's avatar
wmmhello 已提交
4144 4145 4146
          memcpy(pStart, data, len);
          pStart += len;
        } else if (IS_VAR_DATA_TYPE(pValue->node.resType.type)) {
wmmhello's avatar
wmmhello 已提交
4147 4148
          memcpy(pStart, data, varDataTLen(data));
          pStart += varDataTLen(data);
wmmhello's avatar
wmmhello 已提交
4149
        } else {
wmmhello's avatar
wmmhello 已提交
4150 4151
          memcpy(pStart, data, pValue->node.resType.bytes);
          pStart += pValue->node.resType.bytes;
wmmhello's avatar
wmmhello 已提交
4152 4153 4154
        }
      }
    }
4155
    int32_t  len = (int32_t)(pStart - (char*)keyBuf);
4156 4157
    uint64_t groupId = calcGroupId(keyBuf, len);
    taosHashPut(pTableListInfo->map, &(info->uid), sizeof(uint64_t), &groupId, sizeof(uint64_t));
S
slzhou 已提交
4158
    info->groupId = groupId;
4159
    groupNum++;
wmmhello's avatar
wmmhello 已提交
4160

wmmhello's avatar
wmmhello 已提交
4161
    nodesClearList(groupNew);
wmmhello's avatar
wmmhello 已提交
4162 4163 4164
    metaReaderClear(&mr);
  }
  taosMemoryFree(keyBuf);
4165

4166
  if (pTableListInfo->needSortTableByGroupId) {
wmmhello's avatar
wmmhello 已提交
4167
    return sortTableGroup(pTableListInfo, groupNum);
4168 4169
  }

wmmhello's avatar
wmmhello 已提交
4170 4171 4172
  return TDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4173
SOperatorInfo* createOperatorTree(SPhysiNode* pPhyNode, SExecTaskInfo* pTaskInfo, SReadHandle* pHandle,
4174 4175
                                  uint64_t queryId, uint64_t taskId, STableListInfo* pTableListInfo,
                                  const char* pUser) {
4176 4177
  int32_t type = nodeType(pPhyNode);

X
Xiaoyu Wang 已提交
4178
  if (pPhyNode->pChildren == NULL || LIST_LENGTH(pPhyNode->pChildren) == 0) {
H
Haojun Liao 已提交
4179
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == type) {
dengyihao's avatar
dengyihao 已提交
4180
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4181

wmmhello's avatar
wmmhello 已提交
4182
      int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
4183
      if (code) {
wmmhello's avatar
wmmhello 已提交
4184
        pTaskInfo->code = code;
D
dapan1121 已提交
4185 4186
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4187
      code = extractTableSchemaVersion(pHandle, pTableScanNode->scan.uid, pTaskInfo);
S
slzhou 已提交
4188
      if (code) {
4189
        pTaskInfo->code = terrno;
wmmhello's avatar
wmmhello 已提交
4190 4191 4192
        return NULL;
      }

wmmhello's avatar
wmmhello 已提交
4193
      SOperatorInfo*  pOperator = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo, queryId, taskId);
4194 4195
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
S
slzhou 已提交
4196
      return pOperator;
L
Liu Jicong 已提交
4197

S
slzhou 已提交
4198 4199
    } else if (QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN == type) {
      STableMergeScanPhysiNode* pTableScanNode = (STableMergeScanPhysiNode*)pPhyNode;
wmmhello's avatar
wmmhello 已提交
4200
      int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
L
Liu Jicong 已提交
4201
      if (code) {
wmmhello's avatar
wmmhello 已提交
4202
        pTaskInfo->code = code;
wmmhello's avatar
wmmhello 已提交
4203 4204 4205 4206 4207 4208 4209
        return NULL;
      }
      code = extractTableSchemaVersion(pHandle, pTableScanNode->scan.uid, pTaskInfo);
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4210

4211 4212
      SOperatorInfo* pOperator =
          createTableMergeScanOperatorInfo(pTableScanNode, pTableListInfo, pHandle, pTaskInfo, queryId, taskId);
wmmhello's avatar
wmmhello 已提交
4213

4214 4215 4216
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
      return pOperator;
L
Liu Jicong 已提交
4217

H
Haojun Liao 已提交
4218
    } else if (QUERY_NODE_PHYSICAL_PLAN_EXCHANGE == type) {
4219
      return createExchangeOperatorInfo(pHandle->pMsgCb->clientRpc, (SExchangePhysiNode*)pPhyNode, pTaskInfo);
L
Liu Jicong 已提交
4220

H
Haojun Liao 已提交
4221
    } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN == type) {
5
54liuyao 已提交
4222
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
4223
      STimeWindowAggSupp   twSup = {
L
Liu Jicong 已提交
4224 4225 4226 4227
            .waterMark = pTableScanNode->watermark,
            .calTrigger = pTableScanNode->triggerType,
            .maxTs = INT64_MIN,
      };
L
Liu Jicong 已提交
4228
      if (pHandle) {
wmmhello's avatar
wmmhello 已提交
4229
        int32_t code = createScanTableListInfo(pTableScanNode, pHandle, pTableListInfo, queryId, taskId);
L
Liu Jicong 已提交
4230
        if (code) {
wmmhello's avatar
wmmhello 已提交
4231 4232 4233
          pTaskInfo->code = code;
          return NULL;
        }
5
54liuyao 已提交
4234
      }
4235

4236 4237
      SOperatorInfo* pOperator =
          createStreamScanOperatorInfo(pHandle, pTableScanNode, pTaskInfo, &twSup, queryId, taskId);
H
Haojun Liao 已提交
4238
      return pOperator;
L
Liu Jicong 已提交
4239

H
Haojun Liao 已提交
4240
    } else if (QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN == type) {
L
Liu Jicong 已提交
4241
      SSystemTableScanPhysiNode* pSysScanPhyNode = (SSystemTableScanPhysiNode*)pPhyNode;
4242
      return createSysTableScanOperatorInfo(pHandle, pSysScanPhyNode, pUser, pTaskInfo);
4243
    } else if (QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN == type) {
X
Xiaoyu Wang 已提交
4244
      STagScanPhysiNode* pScanPhyNode = (STagScanPhysiNode*)pPhyNode;
4245

wmmhello's avatar
wmmhello 已提交
4246
      int32_t code = getTableList(pHandle->meta, pScanPhyNode, pTableListInfo);
4247
      if (code != TSDB_CODE_SUCCESS) {
4248
        pTaskInfo->code = terrno;
4249 4250 4251
        return NULL;
      }

4252
      return createTagScanOperatorInfo(pHandle, pScanPhyNode, pTableListInfo, pTaskInfo);
L
Liu Jicong 已提交
4253

4254
    } else if (QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN == type) {
4255
      SBlockDistScanPhysiNode* pBlockNode = (SBlockDistScanPhysiNode*)pPhyNode;
4256 4257 4258 4259 4260 4261 4262 4263 4264
      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));

      if (pBlockNode->tableType == TSDB_SUPER_TABLE) {
        int32_t code = tsdbGetAllTableList(pHandle->meta, pBlockNode->uid, pTableListInfo->pTableList);
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
S
slzhou 已提交
4265
        STableKeyInfo info = {.lastKey = 0, .uid = pBlockNode->uid, .groupId = 0};
4266 4267 4268 4269 4270 4271 4272 4273 4274 4275 4276 4277 4278 4279 4280 4281 4282 4283 4284 4285 4286 4287 4288 4289
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      SQueryTableDataCond cond = {0};

      {
        cond.order = TSDB_ORDER_ASC;
        cond.numOfCols = 1;
        cond.colList = taosMemoryCalloc(1, sizeof(SColumnInfo));
        if (cond.colList == NULL) {
          terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
          return NULL;
        }

        cond.colList->colId = 1;
        cond.colList->type = TSDB_DATA_TYPE_TIMESTAMP;
        cond.colList->bytes = sizeof(TSKEY);

        cond.numOfTWindows = 1;
        cond.twindows = taosMemoryCalloc(1, sizeof(STimeWindow));
        cond.twindows[0] = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};
        cond.suid = pBlockNode->suid;
        cond.type = BLOCK_LOAD_OFFSET_SEQ_ORDER;
      }
wmmhello's avatar
wmmhello 已提交
4290
      tsdbReaderT* pReader = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, queryId, taskId);
4291 4292
      cleanupQueryTableDataCond(&cond);

4293
      return createDataBlockInfoScanOperator(pReader, pHandle, cond.suid, pBlockNode, pTaskInfo);
H
Haojun Liao 已提交
4294 4295
    } else {
      ASSERT(0);
H
Haojun Liao 已提交
4296 4297 4298
    }
  }

4299 4300
  int32_t num = 0;
  size_t  size = LIST_LENGTH(pPhyNode->pChildren);
H
Haojun Liao 已提交
4301

4302
  SOperatorInfo** ops = taosMemoryCalloc(size, POINTER_BYTES);
dengyihao's avatar
dengyihao 已提交
4303
  for (int32_t i = 0; i < size; ++i) {
4304
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pPhyNode->pChildren, i);
4305
    ops[i] = createOperatorTree(pChildNode, pTaskInfo, pHandle, queryId, taskId, pTableListInfo, pUser);
4306 4307 4308
    if (ops[i] == NULL) {
      return NULL;
    }
4309
  }
H
Haojun Liao 已提交
4310

4311
  SOperatorInfo* pOptr = NULL;
H
Haojun Liao 已提交
4312
  if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
4313
    pOptr = createProjectOperatorInfo(ops[0], (SProjectPhysiNode*)pPhyNode, pTaskInfo);
4314
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_AGG == type) {
H
Haojun Liao 已提交
4315 4316
    SAggPhysiNode* pAggNode = (SAggPhysiNode*)pPhyNode;
    SExprInfo*     pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
4317
    SSDataBlock*   pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4318

dengyihao's avatar
dengyihao 已提交
4319
    int32_t    numOfScalarExpr = 0;
4320 4321 4322 4323 4324
    SExprInfo* pScalarExprInfo = NULL;
    if (pAggNode->pExprs != NULL) {
      pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
    }

H
Haojun Liao 已提交
4325 4326
    if (pAggNode->pGroupKeys != NULL) {
      SArray* pColList = extractColumnInfo(pAggNode->pGroupKeys);
dengyihao's avatar
dengyihao 已提交
4327
      pOptr = createGroupOperatorInfo(ops[0], pExprInfo, num, pResBlock, pColList, pAggNode->node.pConditions,
wmmhello's avatar
wmmhello 已提交
4328
                                      pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4329
    } else {
dengyihao's avatar
dengyihao 已提交
4330 4331
      pOptr =
          createAggregateOperatorInfo(ops[0], pExprInfo, num, pResBlock, pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4332
    }
X
Xiaoyu Wang 已提交
4333
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_INTERVAL == type || QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type) {
H
Haojun Liao 已提交
4334
    SIntervalPhysiNode* pIntervalPhyNode = (SIntervalPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4335

H
Haojun Liao 已提交
4336
    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
4337
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4338

dengyihao's avatar
dengyihao 已提交
4339 4340 4341 4342 4343 4344
    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
H
Haojun Liao 已提交
4345

X
Xiaoyu Wang 已提交
4346 4347 4348 4349 4350
    STimeWindowAggSupp as = {
        .waterMark = pIntervalPhyNode->window.watermark,
        .calTrigger = pIntervalPhyNode->window.triggerType,
        .maxTs = INT64_MIN,
    };
4351
    ASSERT(as.calTrigger != STREAM_TRIGGER_MAX_DELAY);
4352

4353
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4354
    bool    isStream = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type);
4355 4356
    pOptr = createIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, &as, pIntervalPhyNode,
                                       pTaskInfo, isStream);
4357

4358 4359
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == type) {
    SMergeAlignedIntervalPhysiNode* pIntervalPhyNode = (SMergeAlignedIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4360 4361 4362 4363 4364 4365 4366 4367 4368 4369

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4370

S
shenglian zhou 已提交
4371
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
4372
    pOptr = createMergeAlignedIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
S
shenglian zhou 已提交
4373
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_INTERVAL == type) {
X
Xiaoyu Wang 已提交
4374
    SMergeIntervalPhysiNode* pIntervalPhyNode = (SMergeIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4375 4376 4377 4378 4379 4380 4381 4382 4383 4384

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4385

S
shenglian zhou 已提交
4386 4387
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
    pOptr = createMergeIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, pTaskInfo);
5
54liuyao 已提交
4388
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL == type) {
4389
    int32_t children = 0;
5
54liuyao 已提交
4390 4391
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL == type) {
4392
    int32_t children = 1;
5
54liuyao 已提交
4393
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4394
  } else if (QUERY_NODE_PHYSICAL_PLAN_SORT == type) {
4395
    pOptr = createSortOperatorInfo(ops[0], (SSortPhysiNode*)pPhyNode, pTaskInfo);
S
shenglian zhou 已提交
4396 4397
  } else if (QUERY_NODE_PHYSICAL_PLAN_GROUP_SORT == type) {
    pOptr = createGroupSortOperatorInfo(ops[0], (SGroupSortPhysiNode*)pPhyNode, pTaskInfo);
X
Xiaoyu Wang 已提交
4398
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE == type) {
4399
    SMergePhysiNode* pMergePhyNode = (SMergePhysiNode*)pPhyNode;
4400
    pOptr = createMultiwayMergeOperatorInfo(ops, size, pMergePhyNode, pTaskInfo);
4401
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_SESSION == type) {
H
Haojun Liao 已提交
4402 4403
    SSessionWinodwPhysiNode* pSessionNode = (SSessionWinodwPhysiNode*)pPhyNode;

X
Xiaoyu Wang 已提交
4404 4405
    STimeWindowAggSupp as = {.waterMark = pSessionNode->window.watermark,
                             .calTrigger = pSessionNode->window.triggerType};
4406

H
Haojun Liao 已提交
4407
    SExprInfo*   pExprInfo = createExprInfo(pSessionNode->window.pFuncs, NULL, &num);
4408
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4409 4410
    int32_t      tsSlotId = ((SColumnNode*)pSessionNode->window.pTspk)->slotId;

X
Xiaoyu Wang 已提交
4411 4412
    pOptr =
        createSessionAggOperatorInfo(ops[0], pExprInfo, num, pResBlock, pSessionNode->gap, tsSlotId, &as, pTaskInfo);
4413
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == type) {
4414 4415 4416 4417 4418 4419 4420
    pOptr = createStreamSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_SESSION == type) {
    int32_t children = 0;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_SESSION == type) {
    int32_t children = 1;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4421
  } else if (QUERY_NODE_PHYSICAL_PLAN_PARTITION == type) {
4422
    pOptr = createPartitionOperatorInfo(ops[0], (SPartitionPhysiNode*)pPhyNode, pTaskInfo);
4423
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_STATE == type) {
dengyihao's avatar
dengyihao 已提交
4424
    SStateWinodwPhysiNode* pStateNode = (SStateWinodwPhysiNode*)pPhyNode;
4425

4426 4427
    STimeWindowAggSupp as = {.waterMark = pStateNode->window.watermark, .calTrigger = pStateNode->window.triggerType};

dengyihao's avatar
dengyihao 已提交
4428
    SExprInfo*   pExprInfo = createExprInfo(pStateNode->window.pFuncs, NULL, &num);
4429
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4430 4431
    int32_t      tsSlotId = ((SColumnNode*)pStateNode->window.pTspk)->slotId;

4432
    SColumnNode* pColNode = (SColumnNode*)((STargetNode*)pStateNode->pStateKey)->pExpr;
X
Xiaoyu Wang 已提交
4433
    SColumn      col = extractColumnFromColumnNode(pColNode);
4434
    pOptr = createStatewindowOperatorInfo(ops[0], pExprInfo, num, pResBlock, &as, tsSlotId, &col, pTaskInfo);
4435
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == type) {
5
54liuyao 已提交
4436
    pOptr = createStreamStateAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4437
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_JOIN == type) {
4438
    pOptr = createMergeJoinOperatorInfo(ops, size, (SJoinPhysiNode*)pPhyNode, pTaskInfo);
4439
  } else if (QUERY_NODE_PHYSICAL_PLAN_FILL == type) {
4440
    pOptr = createFillOperatorInfo(ops[0], (SFillPhysiNode*)pPhyNode, false, pTaskInfo);
H
Haojun Liao 已提交
4441 4442
  } else if (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC == type) {
    pOptr = createIndefinitOutputOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4443 4444
  } else if (QUERY_NODE_PHYSICAL_PLAN_INTERP_FUNC == type) {
    pOptr = createTimeSliceOperatorInfo(ops[0], pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4445 4446
  } else {
    ASSERT(0);
H
Haojun Liao 已提交
4447
  }
4448 4449 4450

  taosMemoryFree(ops);
  return pOptr;
4451
}
H
Haojun Liao 已提交
4452

4453
int32_t compareTimeWindow(const void* p1, const void* p2, const void* param) {
dengyihao's avatar
dengyihao 已提交
4454 4455 4456
  const SQueryTableDataCond* pCond = param;
  const STimeWindow*         pWin1 = p1;
  const STimeWindow*         pWin2 = p2;
4457 4458 4459 4460 4461 4462 4463 4464
  if (pCond->order == TSDB_ORDER_ASC) {
    return pWin1->skey - pWin2->skey;
  } else if (pCond->order == TSDB_ORDER_DESC) {
    return pWin2->skey - pWin1->skey;
  }
  return 0;
}

H
Haojun Liao 已提交
4465
SArray* extractColumnInfo(SNodeList* pNodeList) {
L
Liu Jicong 已提交
4466
  size_t  numOfCols = LIST_LENGTH(pNodeList);
H
Haojun Liao 已提交
4467 4468 4469 4470 4471 4472
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

L
Liu Jicong 已提交
4473 4474
  for (int32_t i = 0; i < numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);
H
Haojun Liao 已提交
4475

4476 4477 4478
    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

4479
      SColumn c = extractColumnFromColumnNode(pColNode);
4480 4481
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
L
Liu Jicong 已提交
4482 4483
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};
4484
      c.slotId = pNode->slotId;
L
Liu Jicong 已提交
4485 4486 4487 4488
      c.colId = pNode->slotId;
      c.type = pValNode->node.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
4489 4490 4491 4492
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
H
Haojun Liao 已提交
4493 4494 4495 4496 4497
  }

  return pList;
}

L
Liu Jicong 已提交
4498
tsdbReaderT doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
wmmhello's avatar
wmmhello 已提交
4499 4500
                               STableListInfo* pTableListInfo, uint64_t queryId, uint64_t taskId) {
  int32_t code = getTableList(pHandle->meta, &pTableScanNode->scan, pTableListInfo);
wmmhello's avatar
wmmhello 已提交
4501 4502 4503 4504 4505 4506 4507 4508 4509 4510
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  if (taosArrayGetSize(pTableListInfo->pTableList) == 0) {
    code = 0;
    qDebug("no table qualified for query, TID:0x%" PRIx64 ", QID:0x%" PRIx64, taskId, queryId);
    goto _error;
  }

4511
  SQueryTableDataCond cond = {0};
wmmhello's avatar
wmmhello 已提交
4512
  code = initQueryTableDataCond(&cond, pTableScanNode);
4513
  if (code != TSDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4514
    goto _error;
X
Xiaoyu Wang 已提交
4515
  }
4516

wmmhello's avatar
wmmhello 已提交
4517
  tsdbReaderT pReader = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, queryId, taskId);
4518
  cleanupQueryTableDataCond(&cond);
H
Haojun Liao 已提交
4519 4520

  return pReader;
wmmhello's avatar
wmmhello 已提交
4521 4522 4523 4524

_error:
  terrno = code;
  return NULL;
H
Haojun Liao 已提交
4525 4526
}

L
Liu Jicong 已提交
4527 4528 4529 4530 4531 4532 4533 4534 4535 4536 4537 4538 4539 4540 4541 4542 4543 4544 4545 4546
static int32_t extractTbscanInStreamOpTree(SOperatorInfo* pOperator, STableScanInfo** ppInfo) {
  if (pOperator->operatorType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    if (pOperator->numOfDownstream > 1) {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }
    return extractTbscanInStreamOpTree(pOperator->pDownstream[0], ppInfo);
  } else {
    SStreamBlockScanInfo* pInfo = pOperator->info;
    ASSERT(pInfo->pSnapshotReadOp->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN);
    *ppInfo = pInfo->pSnapshotReadOp->info;
    return 0;
  }
}

4547 4548 4549 4550 4551 4552 4553 4554 4555 4556 4557 4558 4559 4560 4561 4562 4563 4564 4565 4566 4567 4568
int32_t extractTableScanNode(SPhysiNode* pNode, STableScanPhysiNode** ppNode) {
  if (pNode->pChildren == NULL || LIST_LENGTH(pNode->pChildren) == 0) {
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == pNode->type) {
      *ppNode = (STableScanPhysiNode*)pNode;
      return 0;
    } else {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }
  } else {
    if (LIST_LENGTH(pNode->pChildren) != 1) {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pNode->pChildren, 0);
    return extractTableScanNode(pChildNode, ppNode);
  }
  return -1;
}

L
Liu Jicong 已提交
4569 4570 4571 4572 4573
int32_t rebuildReader(SOperatorInfo* pOperator, SSubplan* plan, SReadHandle* pHandle, int64_t uid, int64_t ts) {
  STableScanInfo* pTableScanInfo = NULL;
  if (extractTbscanInStreamOpTree(pOperator, &pTableScanInfo) < 0) {
    return -1;
  }
4574

L
Liu Jicong 已提交
4575 4576 4577 4578
  STableScanPhysiNode* pNode = NULL;
  if (extractTableScanNode(plan->pNode, &pNode) < 0) {
    ASSERT(0);
  }
4579

L
Liu Jicong 已提交
4580
  tsdbCleanupReadHandle(pTableScanInfo->dataReader);
4581

L
Liu Jicong 已提交
4582 4583 4584 4585 4586 4587
  STableListInfo info = {0};
  pTableScanInfo->dataReader = doCreateDataReader(pNode, pHandle, &info, 0, 0);
  if (pTableScanInfo->dataReader == NULL) {
    ASSERT(0);
    qError("failed to create data reader");
    return TSDB_CODE_QRY_APP_ERROR;
4588
  }
L
Liu Jicong 已提交
4589
  // TODO: set uid and ts to data reader
4590 4591 4592
  return 0;
}

C
Cary Xu 已提交
4593
int32_t encodeOperator(SOperatorInfo* ops, char** result, int32_t* length, int32_t* nOptrWithVal) {
wmmhello's avatar
wmmhello 已提交
4594
  int32_t code = TDB_CODE_SUCCESS;
4595
  char*   pCurrent = NULL;
wmmhello's avatar
wmmhello 已提交
4596
  int32_t currLength = 0;
4597
  if (ops->fpSet.encodeResultRow) {
C
Cary Xu 已提交
4598
    if (result == NULL || length == NULL || nOptrWithVal == NULL) {
wmmhello's avatar
wmmhello 已提交
4599 4600 4601
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    code = ops->fpSet.encodeResultRow(ops, &pCurrent, &currLength);
wmmhello's avatar
wmmhello 已提交
4602

4603 4604
    if (code != TDB_CODE_SUCCESS) {
      if (*result != NULL) {
wmmhello's avatar
wmmhello 已提交
4605 4606 4607 4608
        taosMemoryFree(*result);
        *result = NULL;
      }
      return code;
C
Cary Xu 已提交
4609 4610 4611
    } else if (currLength == 0) {
      ASSERT(!pCurrent);
      goto _downstream;
wmmhello's avatar
wmmhello 已提交
4612
    }
wmmhello's avatar
wmmhello 已提交
4613

C
Cary Xu 已提交
4614 4615
    ++(*nOptrWithVal);

C
Cary Xu 已提交
4616
    ASSERT(currLength >= 0);
wmmhello's avatar
wmmhello 已提交
4617

4618
    if (*result == NULL) {
wmmhello's avatar
wmmhello 已提交
4619
      *result = (char*)taosMemoryCalloc(1, currLength + sizeof(int32_t));
wmmhello's avatar
wmmhello 已提交
4620 4621 4622 4623 4624 4625
      if (*result == NULL) {
        taosMemoryFree(pCurrent);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      memcpy(*result + sizeof(int32_t), pCurrent, currLength);
      *(int32_t*)(*result) = currLength + sizeof(int32_t);
4626
    } else {
wmmhello's avatar
wmmhello 已提交
4627
      int32_t sizePre = *(int32_t*)(*result);
4628
      char*   tmp = (char*)taosMemoryRealloc(*result, sizePre + currLength);
wmmhello's avatar
wmmhello 已提交
4629 4630 4631 4632 4633 4634 4635 4636 4637 4638 4639 4640
      if (tmp == NULL) {
        taosMemoryFree(pCurrent);
        taosMemoryFree(*result);
        *result = NULL;
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      *result = tmp;
      memcpy(*result + sizePre, pCurrent, currLength);
      *(int32_t*)(*result) += currLength;
    }
    taosMemoryFree(pCurrent);
    *length = *(int32_t*)(*result);
wmmhello's avatar
wmmhello 已提交
4641 4642
  }

C
Cary Xu 已提交
4643
_downstream:
wmmhello's avatar
wmmhello 已提交
4644
  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
C
Cary Xu 已提交
4645
    code = encodeOperator(ops->pDownstream[i], result, length, nOptrWithVal);
4646
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4647
      return code;
wmmhello's avatar
wmmhello 已提交
4648 4649
    }
  }
wmmhello's avatar
wmmhello 已提交
4650
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
4651 4652
}

H
Haojun Liao 已提交
4653
int32_t decodeOperator(SOperatorInfo* ops, const char* result, int32_t length) {
wmmhello's avatar
wmmhello 已提交
4654
  int32_t code = TDB_CODE_SUCCESS;
4655 4656
  if (ops->fpSet.decodeResultRow) {
    if (result == NULL) {
wmmhello's avatar
wmmhello 已提交
4657 4658
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
H
Haojun Liao 已提交
4659

4660
    ASSERT(length == *(int32_t*)result);
H
Haojun Liao 已提交
4661 4662

    const char* data = result + sizeof(int32_t);
L
Liu Jicong 已提交
4663
    code = ops->fpSet.decodeResultRow(ops, (char*)data);
4664
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4665 4666
      return code;
    }
wmmhello's avatar
wmmhello 已提交
4667

wmmhello's avatar
wmmhello 已提交
4668
    int32_t totalLength = *(int32_t*)result;
4669 4670
    int32_t dataLength = *(int32_t*)data;

4671
    if (totalLength == dataLength + sizeof(int32_t)) {  // the last data
wmmhello's avatar
wmmhello 已提交
4672 4673
      result = NULL;
      length = 0;
4674
    } else {
wmmhello's avatar
wmmhello 已提交
4675 4676 4677 4678
      result += dataLength;
      *(int32_t*)(result) = totalLength - dataLength;
      length = totalLength - dataLength;
    }
wmmhello's avatar
wmmhello 已提交
4679 4680
  }

wmmhello's avatar
wmmhello 已提交
4681 4682
  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    code = decodeOperator(ops->pDownstream[i], result, length);
4683
    if (code != TDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
4684
      return code;
wmmhello's avatar
wmmhello 已提交
4685 4686
    }
  }
wmmhello's avatar
wmmhello 已提交
4687
  return TDB_CODE_SUCCESS;
wmmhello's avatar
wmmhello 已提交
4688 4689
}

4690
int32_t createDataSinkParam(SDataSinkNode* pNode, void** pParam, qTaskInfo_t* pTaskInfo) {
D
dapan1121 已提交
4691
  SExecTaskInfo* pTask = *(SExecTaskInfo**)pTaskInfo;
4692

D
dapan1121 已提交
4693 4694
  switch (pNode->type) {
    case QUERY_NODE_PHYSICAL_PLAN_DELETE: {
4695
      SDeleterParam* pDeleterParam = taosMemoryCalloc(1, sizeof(SDeleterParam));
D
dapan1121 已提交
4696 4697 4698 4699
      if (NULL == pDeleterParam) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      int32_t tbNum = taosArrayGetSize(pTask->tableqinfoList.pTableList);
D
dapan1121 已提交
4700
      pDeleterParam->suid = pTask->tableqinfoList.suid;
D
dapan1121 已提交
4701 4702 4703 4704 4705 4706
      pDeleterParam->pUidList = taosArrayInit(tbNum, sizeof(uint64_t));
      if (NULL == pDeleterParam->pUidList) {
        taosMemoryFree(pDeleterParam);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      for (int32_t i = 0; i < tbNum; ++i) {
4707
        STableKeyInfo* pTable = taosArrayGet(pTask->tableqinfoList.pTableList, i);
D
dapan1121 已提交
4708 4709 4710 4711 4712 4713 4714 4715 4716 4717 4718 4719 4720
        taosArrayPush(pDeleterParam->pUidList, &pTable->uid);
      }

      *pParam = pDeleterParam;
      break;
    }
    default:
      break;
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
4721
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
4722
                               const char* sql, EOPTR_EXEC_MODEL model) {
H
Haojun Liao 已提交
4723 4724
  uint64_t queryId = pPlan->id.queryId;

H
Haojun Liao 已提交
4725
  int32_t code = TSDB_CODE_SUCCESS;
D
dapan1121 已提交
4726
  *pTaskInfo = createExecTaskInfo(queryId, taskId, model, pPlan->dbFName);
H
Haojun Liao 已提交
4727 4728 4729 4730
  if (*pTaskInfo == NULL) {
    code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    goto _complete;
  }
H
Haojun Liao 已提交
4731

4732
  (*pTaskInfo)->sql = sql;
wmmhello's avatar
wmmhello 已提交
4733 4734
  (*pTaskInfo)->tableqinfoList.pTagCond = pPlan->pTagCond;
  (*pTaskInfo)->tableqinfoList.pTagIndexCond = pPlan->pTagIndexCond;
4735 4736
  (*pTaskInfo)->pRoot = createOperatorTree(pPlan->pNode, *pTaskInfo, pHandle, queryId, taskId,
                                           &(*pTaskInfo)->tableqinfoList, pPlan->user);
L
Liu Jicong 已提交
4737

D
dapan1121 已提交
4738
  if (NULL == (*pTaskInfo)->pRoot) {
4739
    code = (*pTaskInfo)->code;
D
dapan1121 已提交
4740
    goto _complete;
4741 4742
  }

H
Haojun Liao 已提交
4743 4744
  return code;

H
Haojun Liao 已提交
4745
_complete:
wafwerar's avatar
wafwerar 已提交
4746
  taosMemoryFreeClear(*pTaskInfo);
H
Haojun Liao 已提交
4747 4748
  terrno = code;
  return code;
H
Haojun Liao 已提交
4749 4750
}

wmmhello's avatar
wmmhello 已提交
4751 4752 4753
static void doDestroyTableList(STableListInfo* pTableqinfoList) {
  taosArrayDestroy(pTableqinfoList->pTableList);
  taosHashCleanup(pTableqinfoList->map);
4754 4755
  if (pTableqinfoList->needSortTableByGroupId) {
    for (int32_t i = 0; i < taosArrayGetSize(pTableqinfoList->pGroupList); i++) {
wmmhello's avatar
wmmhello 已提交
4756 4757 4758 4759 4760
      SArray* tmp = taosArrayGetP(pTableqinfoList->pGroupList, i);
      taosArrayDestroy(tmp);
    }
  }
  taosArrayDestroy(pTableqinfoList->pGroupList);
4761

wmmhello's avatar
wmmhello 已提交
4762 4763
  pTableqinfoList->pTableList = NULL;
  pTableqinfoList->map = NULL;
4764 4765
}

L
Liu Jicong 已提交
4766
void doDestroyTask(SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
4767 4768
  qDebug("%s execTask is freed", GET_TASKID(pTaskInfo));

wmmhello's avatar
wmmhello 已提交
4769
  doDestroyTableList(&pTaskInfo->tableqinfoList);
H
Haojun Liao 已提交
4770
  destroyOperatorInfo(pTaskInfo->pRoot);
L
Liu Jicong 已提交
4771 4772
  //  taosArrayDestroy(pTaskInfo->summary.queryProfEvents);
  //  taosHashCleanup(pTaskInfo->summary.operatorProfResults);
4773

4774 4775
  taosMemoryFree(pTaskInfo->schemaVer.dbname);
  taosMemoryFree(pTaskInfo->schemaVer.tablename);
wafwerar's avatar
wafwerar 已提交
4776 4777 4778
  taosMemoryFreeClear(pTaskInfo->sql);
  taosMemoryFreeClear(pTaskInfo->id.str);
  taosMemoryFreeClear(pTaskInfo);
4779 4780 4781 4782 4783 4784 4785 4786 4787 4788 4789 4790
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes) {
  if (val == NULL) {
    setNull(output, type, bytes);
    return;
  }

  if (IS_VAR_DATA_TYPE(type)) {
    // Binary data overflows for sort of unknown reasons. Let trim the overflow data
    if (varDataTLen(val) > bytes) {
      int32_t maxLen = bytes - VARSTR_HEADER_SIZE;
L
Liu Jicong 已提交
4791
      int32_t len = (varDataLen(val) > maxLen) ? maxLen : varDataLen(val);
4792 4793 4794 4795 4796 4797 4798 4799 4800 4801 4802 4803
      memcpy(varDataVal(output), varDataVal(val), len);
      varDataSetLen(output, len);
    } else {
      varDataCopy(output, val);
    }
  } else {
    memcpy(output, val, bytes);
  }
}

static int64_t getQuerySupportBufSize(size_t numOfTables) {
  size_t s1 = sizeof(STableQueryInfo);
L
Liu Jicong 已提交
4804 4805
  //  size_t s3 = sizeof(STableCheckInfo);  buffer consumption in tsdb
  return (int64_t)(s1 * 1.5 * numOfTables);
4806 4807 4808 4809 4810 4811 4812
}

int32_t checkForQueryBuf(size_t numOfTables) {
  int64_t t = getQuerySupportBufSize(numOfTables);
  if (tsQueryBufferSizeBytes < 0) {
    return TSDB_CODE_SUCCESS;
  } else if (tsQueryBufferSizeBytes > 0) {
L
Liu Jicong 已提交
4813
    while (1) {
4814 4815 4816 4817 4818 4819 4820 4821 4822 4823 4824 4825 4826 4827 4828 4829 4830 4831 4832 4833 4834 4835 4836 4837 4838 4839
      int64_t s = tsQueryBufferSizeBytes;
      int64_t remain = s - t;
      if (remain >= 0) {
        if (atomic_val_compare_exchange_64(&tsQueryBufferSizeBytes, s, remain) == s) {
          return TSDB_CODE_SUCCESS;
        }
      } else {
        return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
      }
    }
  }

  // disable query processing if the value of tsQueryBufferSize is zero.
  return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
}

void releaseQueryBuf(size_t numOfTables) {
  if (tsQueryBufferSizeBytes < 0) {
    return;
  }

  int64_t t = getQuerySupportBufSize(numOfTables);

  // restore value is not enough buffer available
  atomic_add_fetch_64(&tsQueryBufferSizeBytes, t);
}
D
dapan1121 已提交
4840

dengyihao's avatar
dengyihao 已提交
4841 4842
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SExplainExecInfo** pRes, int32_t* capacity,
                                   int32_t* resNum) {
D
dapan1121 已提交
4843 4844
  if (*resNum >= *capacity) {
    *capacity += 10;
dengyihao's avatar
dengyihao 已提交
4845

D
dapan1121 已提交
4846 4847
    *pRes = taosMemoryRealloc(*pRes, (*capacity) * sizeof(SExplainExecInfo));
    if (NULL == *pRes) {
D
dapan1121 已提交
4848
      qError("malloc %d failed", (*capacity) * (int32_t)sizeof(SExplainExecInfo));
D
dapan1121 已提交
4849 4850 4851 4852
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }
  }

4853 4854 4855 4856 4857
  SExplainExecInfo* pInfo = &(*pRes)[*resNum];

  pInfo->numOfRows = operatorInfo->resultInfo.totalRows;
  pInfo->startupCost = operatorInfo->cost.openCost;
  pInfo->totalCost = operatorInfo->cost.totalCost;
D
dapan1121 已提交
4858

4859
  if (operatorInfo->fpSet.getExplainFn) {
4860
    int32_t code = operatorInfo->fpSet.getExplainFn(operatorInfo, &pInfo->verboseInfo, &pInfo->verboseLen);
D
dapan1121 已提交
4861
    if (code) {
4862
      qError("%s operator getExplainFn failed, code:%s", GET_TASKID(operatorInfo->pTaskInfo), tstrerror(code));
D
dapan1121 已提交
4863 4864
      return code;
    }
4865 4866 4867
  } else {
    pInfo->verboseLen = 0;
    pInfo->verboseInfo = NULL;
D
dapan1121 已提交
4868
  }
dengyihao's avatar
dengyihao 已提交
4869

D
dapan1121 已提交
4870
  ++(*resNum);
dengyihao's avatar
dengyihao 已提交
4871

D
dapan1121 已提交
4872
  int32_t code = 0;
D
dapan1121 已提交
4873 4874
  for (int32_t i = 0; i < operatorInfo->numOfDownstream; ++i) {
    code = getOperatorExplainExecInfo(operatorInfo->pDownstream[i], pRes, capacity, resNum);
D
dapan1121 已提交
4875 4876 4877 4878 4879 4880 4881
    if (code) {
      taosMemoryFreeClear(*pRes);
      return TSDB_CODE_QRY_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
D
dapan1121 已提交
4882
}
5
54liuyao 已提交
4883

L
Liu Jicong 已提交
4884
int32_t initStreamAggSupporter(SStreamAggSupporter* pSup, const char* pKey, SqlFunctionCtx* pCtx, int32_t numOfOutput,
4885
                               int32_t size) {
4886
  pSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
5
54liuyao 已提交
4887 4888
  pSup->keySize = sizeof(int64_t) + sizeof(TSKEY);
  pSup->pKeyBuf = taosMemoryCalloc(1, pSup->keySize);
4889 4890
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pSup->pResultRows = taosHashInit(1024, hashFn, false, HASH_NO_LOCK);
5
54liuyao 已提交
4891 4892 4893
  if (pSup->pKeyBuf == NULL || pSup->pResultRows == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }
4894
  pSup->valueSize = size;
5
54liuyao 已提交
4895

5
54liuyao 已提交
4896 4897
  pSup->pScanWindow = taosArrayInit(4, sizeof(STimeWindow));

5
54liuyao 已提交
4898 4899 4900 4901 4902 4903 4904 4905 4906
  int32_t pageSize = 4096;
  while (pageSize < pSup->resultRowSize * 4) {
    pageSize <<= 1u;
  }
  // at least four pages need to be in buffer
  int32_t bufSize = 4096 * 256;
  if (bufSize <= pageSize) {
    bufSize = pageSize * 4;
  }
4907
  int32_t code = createDiskbasedBuf(&pSup->pResultBuf, pageSize, bufSize, pKey, TD_TMP_DIR_PATH);
L
Liu Jicong 已提交
4908
  for (int32_t i = 0; i < numOfOutput; ++i) {
4909 4910 4911
    pCtx[i].pBuf = pSup->pResultBuf;
  }
  return code;
5
54liuyao 已提交
4912
}