executorimpl.c 171.4 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
15

H
Haojun Liao 已提交
16 17
#include "filter.h"
#include "function.h"
18 19
#include "functionMgt.h"
#include "os.h"
H
Haojun Liao 已提交
20
#include "querynodes.h"
21
#include "tfill.h"
dengyihao's avatar
dengyihao 已提交
22
#include "tname.h"
X
Xiaoyu Wang 已提交
23
#include "tref.h"
24

H
Haojun Liao 已提交
25
#include "tdatablock.h"
26
#include "tglobal.h"
H
Haojun Liao 已提交
27
#include "tmsg.h"
H
Haojun Liao 已提交
28
#include "tsort.h"
29
#include "ttime.h"
H
Haojun Liao 已提交
30

31
#include "executorimpl.h"
dengyihao's avatar
dengyihao 已提交
32
#include "index.h"
33
#include "query.h"
34 35
#include "tcompare.h"
#include "tcompression.h"
H
Haojun Liao 已提交
36
#include "thash.h"
37
#include "ttypes.h"
dengyihao's avatar
dengyihao 已提交
38
#include "vnode.h"
39

H
Haojun Liao 已提交
40
#define IS_MAIN_SCAN(runtime)          ((runtime)->scanFlag == MAIN_SCAN)
41 42 43 44 45 46
#define SET_REVERSE_SCAN_FLAG(runtime) ((runtime)->scanFlag = REVERSE_SCAN)

#define GET_FORWARD_DIRECTION_FACTOR(ord) (((ord) == TSDB_ORDER_ASC) ? QUERY_ASC_FORWARD_STEP : QUERY_DESC_FORWARD_STEP)

#if 0
static UNUSED_FUNC void *u_malloc (size_t __size) {
wafwerar's avatar
wafwerar 已提交
47
  uint32_t v = taosRand();
48 49 50 51

  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
52
    return taosMemoryMalloc(__size);
53 54 55 56
  }
}

static UNUSED_FUNC void* u_calloc(size_t num, size_t __size) {
wafwerar's avatar
wafwerar 已提交
57
  uint32_t v = taosRand();
58 59 60
  if (v % 1000 <= 0) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
61
    return taosMemoryCalloc(num, __size);
62 63 64 65
  }
}

static UNUSED_FUNC void* u_realloc(void* p, size_t __size) {
wafwerar's avatar
wafwerar 已提交
66
  uint32_t v = taosRand();
67 68 69
  if (v % 5 <= 1) {
    return NULL;
  } else {
wafwerar's avatar
wafwerar 已提交
70
    return taosMemoryRealloc(p, __size);
71 72 73 74 75 76 77 78
  }
}

#define calloc  u_calloc
#define malloc  u_malloc
#define realloc u_realloc
#endif

H
Haojun Liao 已提交
79 80 81 82 83 84
/*
 * Jump back to the setjmp() point stored in _obj, delivering the code _c.
 * _c must not be -1 (checked with assert). Note that _c is evaluated twice.
 *
 * The expansion deliberately has NO trailing semicolon after `while (0)`: the caller's own
 * `;` terminates the statement, so the macro can be used safely in an unbraced if/else.
 */
#define T_LONG_JMP(_obj, _c) \
  do {                       \
    assert((_c) != -1);      \
    longjmp((_obj), (_c));   \
  } while (0)

X
Xiaoyu Wang 已提交
85
#define CLEAR_QUERY_STATUS(q, st)   ((q)->status &= (~(st)))
86 87
#define QUERY_IS_INTERVAL_QUERY(_q) ((_q)->interval.interval > 0)

L
Liu Jicong 已提交
88 89 90
// Returns the maximum idle duration, computed as twice the configured shell activity timer.
int32_t getMaximumIdleDurationSec() {
  int32_t idleDuration = tsShellActivityTimer * 2;
  return idleDuration;
}

// Sanity-checks that pExprInfo wraps a unary expression node and returns 0.
// The function id itself is not looked up here; the result is always 0.
static int32_t getExprFunctionId(SExprInfo* pExprInfo) {
  // the expression must exist and must be a unary expression node
  assert(pExprInfo != NULL && pExprInfo->pExpr != NULL && pExprInfo->pExpr->nodeType == TEXPR_UNARYEXPR_NODE);

  return 0;
}

static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes);

97
static void setBlockSMAInfo(SqlFunctionCtx* pCtx, SExprInfo* pExpr, SSDataBlock* pSDataBlock);
98

X
Xiaoyu Wang 已提交
99
static void releaseQueryBuf(size_t numOfTables);
100

101
static void destroyFillOperatorInfo(void* param, int32_t numOfOutput);
102 103 104
static void destroyProjectOperatorInfo(void* param, int32_t numOfOutput);
static void destroyOrderOperatorInfo(void* param, int32_t numOfOutput);
static void destroyAggOperatorInfo(void* param, int32_t numOfOutput);
X
Xiaoyu Wang 已提交
105

H
Haojun Liao 已提交
106
static void destroyIntervalOperatorInfo(void* param, int32_t numOfOutput);
H
Haojun Liao 已提交
107 108
static void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput);

109 110
static void destroyOperatorInfo(SOperatorInfo* pOperator);

111
/*
 * Mark the operator as finished (OP_EXEC_DONE).
 *
 * When the operator is attached to a task, the total cost is computed from the task's
 * start time and the task status is switched to TASK_COMPLETED. When pTaskInfo is NULL
 * only the operator status is updated and cost.totalCost is left untouched; previously
 * the task info was dereferenced before the NULL check.
 */
void doSetOperatorCompleted(SOperatorInfo* pOperator) {
  pOperator->status = OP_EXEC_DONE;

  if (pOperator->pTaskInfo != NULL) {
    // cost.start is scaled by 1000 to match the microsecond timestamp; the result is scaled back by 1000
    pOperator->cost.totalCost = (taosGetTimestampUs() - pOperator->pTaskInfo->cost.start * 1000) / 1000.0;
    setTaskStatus(pOperator->pTaskInfo, TASK_COMPLETED);
  }
}
119

H
Haojun Liao 已提交
120
// Default "open" callback for operators that need no preparation:
// flags the operator as opened, records a zero open cost and reports success.
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator) {
  OPTR_SET_OPENED(pOperator);

  // nothing was done while opening, so no cost is charged
  pOperator->cost.openCost = 0;

  return TSDB_CODE_SUCCESS;
}

126
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
L
Liu Jicong 已提交
127
                                   __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
128
                                   __optr_decode_fn_t decode, __optr_explain_fn_t explain) {
129 130 131 132 133 134 135 136 137 138 139 140 141 142
  SOperatorFpSet fpSet = {
      ._openFn = openFn,
      .getNextFn = nextFn,
      .getStreamResFn = streamFn,
      .cleanupFn = cleanup,
      .closeFn = closeFn,
      .encodeResultRow = encode,
      .decodeResultRow = decode,
      .getExplainFn = explain,
  };

  return fpSet;
}

H
Haojun Liao 已提交
143
// No-op "close" callback: both arguments are ignored and nothing is released.
void operatorDummyCloseFn(void* param, int32_t numOfCols) {
  (void)param;
  (void)numOfCols;
}
H
Haojun Liao 已提交
144

145 146
static int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprSupp* pSup, SDiskbasedBuf* pBuf,
                                  SGroupResInfo* pGroupResInfo);
H
Haojun Liao 已提交
147

148
static void initCtxOutputBuffer(SqlFunctionCtx* pCtx, int32_t size);
149
static void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId);
150

151
#if 0
L
Liu Jicong 已提交
152 153
static bool chkResultRowFromKey(STaskRuntimeEnv* pRuntimeEnv, SResultRowInfo* pResultRowInfo, char* pData,
                                int16_t bytes, bool masterscan, uint64_t uid) {
154 155 156
  bool existed = false;
  SET_RES_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid);

L
Liu Jicong 已提交
157 158
  SResultRow** p1 =
      (SResultRow**)taosHashGet(pRuntimeEnv->pResultRowHashTable, pRuntimeEnv->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));
159 160 161 162 163 164 165 166 167 168 169

  // in case of repeat scan/reverse scan, no new time window added.
  if (QUERY_IS_INTERVAL_QUERY(pRuntimeEnv->pQueryAttr)) {
    if (!masterscan) {  // the *p1 may be NULL in case of sliding+offset exists.
      return p1 != NULL;
    }

    if (p1 != NULL) {
      if (pResultRowInfo->size == 0) {
        existed = false;
      } else if (pResultRowInfo->size == 1) {
dengyihao's avatar
dengyihao 已提交
170
        //        existed = (pResultRowInfo->pResult[0] == (*p1));
171 172
      } else {  // check if current pResultRowInfo contains the existed pResultRow
        SET_RES_EXT_WINDOW_KEY(pRuntimeEnv->keyBuf, pData, bytes, uid, pResultRowInfo);
L
Liu Jicong 已提交
173 174
        int64_t* index =
            taosHashGet(pRuntimeEnv->pResultRowListSet, pRuntimeEnv->keyBuf, GET_RES_EXT_WINDOW_KEY_LEN(bytes));
175 176 177 178 179 180 181 182 183 184 185 186 187
        if (index != NULL) {
          existed = true;
        } else {
          existed = false;
        }
      }
    }

    return existed;
  }

  return p1 != NULL;
}
188
#endif
189

190
/*
 * Reserve interBufSize bytes for a new SResultRow inside the paged buffer of the given group.
 *
 * The last page of the group is reused while the row still fits; otherwise (or when the
 * group has no page yet) a new page is requested. The returned row has its pageId/offset
 * set to the reserved location and the page is marked dirty.
 *
 * Returns NULL when no buffer page could be obtained. Both page-allocation paths are now
 * NULL-checked; previously the "first page of the group" path dereferenced the result of
 * getNewBufPage() unconditionally.
 */
SResultRow* getNewResultRow(SDiskbasedBuf* pResultBuf, int64_t tableGroupId, int32_t interBufSize) {
  SFilePage* pData = NULL;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tableGroupId);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
    if (pData != NULL) {
      pData->num = sizeof(SFilePage);
    }
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

    if (pData->num + interBufSize > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tableGroupId, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return NULL;
  }

  setBufPageDirty(pData, true);

  // the new row starts at the current end of the used area of the page
  SResultRow* pResultRow = (SResultRow*)((char*)pData + pData->num);
  pResultRow->pageId = pageId;
  pResultRow->offset = (int32_t)pData->num;

  pData->num += interBufSize;

  return pResultRow;
}

232 233 234 235 236 237 238
/**
 * the struct of key in hash table
 * +----------+---------------+
 * | group id |   key data    |
 * | 8 bytes  | actual length |
 * +----------+---------------+
 */
239 240 241
/*
 * Locate, or create, the result row that belongs to the key (groupId, pData[0..bytes)).
 *
 * An existing row is looked up through pSup->pResultRowHashTable. For interval queries the
 * lookup result is only used during the master scan; for other queries it is used whenever
 * the key exists. If no row is selected, a new one is allocated from pResultBuf, initialized
 * and registered in the hash table. The selected row becomes pResultRowInfo->cur.
 *
 * The function never returns NULL. It leaves through longjmp(pTaskInfo->env, ...) when
 *   - a new result row cannot be allocated (TSDB_CODE_OUT_OF_MEMORY); previously the NULL
 *     result of getNewResultRow() was dereferenced, or
 *   - in batch execution mode the number of rows in the hash table exceeds
 *     MAX_INTERVAL_TIME_WINDOW (TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW).
 */
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo, char* pData,
                                   int16_t bytes, bool masterscan, uint64_t groupId, SExecTaskInfo* pTaskInfo,
                                   bool isIntervalQuery, SAggSupporter* pSup) {
  SET_RES_WINDOW_KEY(pSup->keyBuf, pData, bytes, groupId);

  SResultRowPosition* p1 =
      (SResultRowPosition*)taosHashGet(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes));

  SResultRow* pResult = NULL;

  // in case of repeat scan/reverse scan, no new time window added.
  if (isIntervalQuery) {
    if (masterscan && p1 != NULL) {  // p1 may be NULL in case of sliding+offset exists.
      pResult = getResultRowByPos(pResultBuf, p1, true);
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
    }
  } else {
    // In case of group by column query, the required SResultRow object must exist in the
    // pResultRowInfo object.
    if (p1 != NULL) {
      // todo
      pResult = getResultRowByPos(pResultBuf, p1, true);
      ASSERT(pResult->pageId == p1->pageId && pResult->offset == p1->offset);
    }
  }

  // 1. close current opened time window
  if (pResultRowInfo->cur.pageId != -1 && ((pResult == NULL) || (pResult->pageId != pResultRowInfo->cur.pageId))) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_1");
#endif
    SResultRowPosition pos = pResultRowInfo->cur;
    SFilePage*         pPage = getBufPage(pResultBuf, pos.pageId);
    releaseBufPage(pResultBuf, pPage);
  }

  // allocate a new buffer page
  if (pResult == NULL) {
#ifdef BUF_PAGE_DEBUG
    qDebug("page_2");
#endif
    ASSERT(pSup->resultRowSize > 0);
    pResult = getNewResultRow(pResultBuf, groupId, pSup->resultRowSize);
    if (pResult == NULL) {
      // no buffer page available for the new row: abort the task instead of dereferencing NULL
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    initResultRow(pResult);

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = pResult->pageId, .offset = pResult->offset};
    taosHashPut(pSup->pResultRowHashTable, pSup->keyBuf, GET_RES_WINDOW_KEY_LEN(bytes), &pos,
                sizeof(SResultRowPosition));
  }

  // 2. set the new time window to be the new active time window
  pResultRowInfo->cur = (SResultRowPosition){.pageId = pResult->pageId, .offset = pResult->offset};

  // too many time window in query
  if (pTaskInfo->execModel == OPTR_EXEC_MODEL_BATCH &&
      taosHashGetSize(pSup->pResultRowHashTable) > MAX_INTERVAL_TIME_WINDOW) {
    longjmp(pTaskInfo->env, TSDB_CODE_QRY_TOO_MANY_TIMEWINDOW);
  }

  return pResult;
}

303
// A new buffer page is used for each table. TODO: optimize this design.
L
Liu Jicong 已提交
304
/*
 * Reserve `size` bytes in the paged buffer of table/group `tid` for pWindowRes, unless the
 * row already has a location (pageId != -1), in which case nothing is done.
 *
 * The last page of the group is reused while the row still fits; otherwise (or when the
 * group has no page yet) a new page is requested.
 *
 * Returns 0 on success and -1 when no buffer page could be obtained. Both page-allocation
 * paths are NULL-checked; previously the first-page path dereferenced the result of
 * getNewBufPage() unconditionally.
 */
static int32_t addNewWindowResultBuf(SResultRow* pWindowRes, SDiskbasedBuf* pResultBuf, int32_t tid, uint32_t size) {
  if (pWindowRes->pageId != -1) {
    return 0;
  }

  SFilePage* pData = NULL;

  // in the first scan, new space needed for results
  int32_t pageId = -1;
  SIDList list = getDataBufPagesIdList(pResultBuf, tid);

  if (taosArrayGetSize(list) == 0) {
    pData = getNewBufPage(pResultBuf, tid, &pageId);
    if (pData != NULL) {
      pData->num = sizeof(SFilePage);
    }
  } else {
    SPageInfo* pi = getLastPageInfo(list);
    pData = getBufPage(pResultBuf, getPageId(pi));
    pageId = getPageId(pi);

    if (pData->num + size > getBufPageSize(pResultBuf)) {
      // release current page first, and prepare the next one
      releaseBufPageInfo(pResultBuf, pi);

      pData = getNewBufPage(pResultBuf, tid, &pageId);
      if (pData != NULL) {
        pData->num = sizeof(SFilePage);
      }
    }
  }

  if (pData == NULL) {
    return -1;
  }

  // pWindowRes->pageId is still -1 here (checked on entry), so place the row at the end of
  // the used area of the page and advance the used size
  pWindowRes->pageId = pageId;
  pWindowRes->offset = (int32_t)pData->num;

  pData->num += size;
  assert(pWindowRes->pageId >= 0);

  return 0;
}

350
//  query_range_start, query_range_end, window_duration, window_start, window_end
351
// Fills pColData with five timestamp rows describing the query window:
//   row 0/1: skey/ekey of pQueryWindow, row 2: interval (always written as 0 here),
//   row 3/4: skey/ekey of pQueryWindow again.
void initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow) {
  pColData->info.type = TSDB_DATA_TYPE_TIMESTAMP;
  pColData->info.bytes = sizeof(int64_t);

  colInfoDataEnsureCapacity(pColData, 5);

  // the interval slot may be variable in case of 'n' and 'y', so it is initialized with 0
  int64_t rowValues[5] = {pQueryWindow->skey, pQueryWindow->ekey, 0, pQueryWindow->skey, pQueryWindow->ekey};
  for (int32_t row = 0; row < 5; ++row) {
    colDataAppendInt64(pColData, row, &rowValues[row]);
  }
}

L
Liu Jicong 已提交
365
// Releases the column data held by pColData via colDataDestroy().
void cleanupExecTimeWindowInfo(SColumnInfoData* pColData) {
  colDataDestroy(pColData);
}
H
Haojun Liao 已提交
366

367 368 369 370 371 372 373 374 375 376 377 378 379 380
// Snapshot of the input settings of a SqlFunctionCtx, filled by functionCtxSave() and
// written back by functionCtxRestore().
typedef struct {
  bool    hasAgg;       // saved value of input.colDataAggIsSet
  int32_t numOfRows;    // saved value of input.numOfRows
  int32_t startOffset;  // saved value of input.startRowIndex
} SFunctionCtxStatus;

// Copies the current input settings of pCtx (agg flag, row count, start row) into pStatus.
static void functionCtxSave(SqlFunctionCtx* pCtx, SFunctionCtxStatus* pStatus) {
  *pStatus = (SFunctionCtxStatus){
      .hasAgg = pCtx->input.colDataAggIsSet,
      .numOfRows = pCtx->input.numOfRows,
      .startOffset = pCtx->input.startRowIndex,
  };
}

// Writes the input settings stored in pStatus (agg flag, row count, start row) back into pCtx.
static void functionCtxRestore(SqlFunctionCtx* pCtx, SFunctionCtxStatus* pStatus) {
  SInputColumnInfoData* pInput = &pCtx->input;

  pInput->colDataAggIsSet = pStatus->hasAgg;
  pInput->numOfRows = pStatus->numOfRows;
  pInput->startRowIndex = pStatus->startOffset;
}

/*
 * Run every function context in pCtx[0..numOfOutput) over the row range
 * [offset, offset + forwardStep) of the current input.
 *
 * For each context the input range is narrowed to that window; block statistics are
 * switched off when the window covers fewer rows than numOfTotal. Window pseudo-column
 * functions are evaluated through sfp.process() on pTimeWindowData and their saved input
 * state is NOT restored. All other functions go through fpSet.process() (when they need to
 * execute) and get their saved input state restored afterwards.
 *
 * On a processing error the code is stored in taskInfo->code and control leaves through
 * longjmp(taskInfo->env, code).
 */
void doApplyFunctions(SExecTaskInfo* taskInfo, SqlFunctionCtx* pCtx, SColumnInfoData* pTimeWindowData, int32_t offset,
                      int32_t forwardStep, int32_t numOfTotal, int32_t numOfOutput) {
  for (int32_t k = 0; k < numOfOutput; ++k) {
    SqlFunctionCtx* pOneCtx = &pCtx[k];

    // remember the current input settings so they can be put back later
    SFunctionCtxStatus saved = {0};
    functionCtxSave(pOneCtx, &saved);

    pOneCtx->input.startRowIndex = offset;
    pOneCtx->input.numOfRows = forwardStep;

    // only part of the block is involved, so the pre-computed statistics can not be used
    // NOTE: the original value of colDataAggIsSet is changed here
    if (pOneCtx->input.colDataAggIsSet && forwardStep < numOfTotal) {
      pOneCtx->input.colDataAggIsSet = false;
    }

    if (fmIsWindowPseudoColumnFunc(pOneCtx->functionId)) {
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(pOneCtx);
      char*                pInterBuf = GET_ROWCELL_INTERBUF(pEntryInfo);

      // wrap the intermediate buffer of the result entry as a BIGINT output column
      SColumnInfoData idata = {0};
      idata.info.type = TSDB_DATA_TYPE_BIGINT;
      idata.info.bytes = tDataTypes[TSDB_DATA_TYPE_BIGINT].bytes;
      idata.pData = pInterBuf;

      SScalarParam out = {.columnData = &idata};
      SScalarParam tw = {.numOfRows = 5, .columnData = pTimeWindowData};
      pOneCtx->sfp.process(&tw, 1, &out);

      pEntryInfo->numOfRes = 1;
      continue;
    }

    if (functionNeedToExecute(pOneCtx) && pOneCtx->fpSet.process != NULL) {
      int32_t code = pOneCtx->fpSet.process(pOneCtx);
      if (code != TSDB_CODE_SUCCESS) {
        qError("%s apply functions error, code: %s", GET_TASKID(taskInfo), tstrerror(code));
        taskInfo->code = code;
        longjmp(taskInfo->env, code);
      }
    }

    // put the saved input settings back
    functionCtxRestore(pOneCtx, &saved);
  }
}

dengyihao's avatar
dengyihao 已提交
433
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
434
                                   int32_t scanFlag, bool createDummyCol);
435

dengyihao's avatar
dengyihao 已提交
436 437
// Attaches pBlock to every expression context of the operator: sets the scan order and the
// number of input rows, lets setBlockSMAInfo() bind the block statistics, and records the
// source block.
static void doSetInputDataBlockInfo(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock,
                                    int32_t order) {
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
    SqlFunctionCtx* pOneCtx = &pCtx[i];

    pOneCtx->order = order;
    pOneCtx->input.numOfRows = pBlock->info.rows;

    setBlockSMAInfo(pOneCtx, &pOperator->exprSupp.pExprInfo[i], pBlock);

    pOneCtx->pSrcBlock = pBlock;
  }
}

X
Xiaoyu Wang 已提交
446 447
// Binds pBlock as the input of all function contexts of the operator.
// Blocks without pre-computed aggregates (pBlockAgg == NULL) are bound column by column;
// blocks that carry aggregates are bound through their statistics instead.
// The status code returned by the column-wise path is not propagated.
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                       int32_t scanFlag, bool createDummyCol) {
  if (pBlock->pBlockAgg == NULL) {
    doSetInputDataBlock(pOperator, pCtx, pBlock, order, scanFlag, createDummyCol);
    return;
  }

  doSetInputDataBlockInfo(pOperator, pCtx, pBlock, order);
}

L
Liu Jicong 已提交
455 456
/*
 * Materialize a constant function parameter as a column of numOfRows identical values and
 * bind it to pInput->pData[paramIndex].
 *
 * The SColumnInfoData is allocated on first use (type and bytes are taken from the
 * parameter) and reused on later calls. Values are written for BIGINT/UBIGINT, DOUBLE and
 * VARCHAR parameters; other types leave the column content untouched.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the column descriptor or the
 * temporary VARCHAR buffer cannot be allocated.
 */
static int32_t doCreateConstantValColumnInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t paramIndex,
                                             int32_t numOfRows) {
  SColumnInfoData* pColInfo = pInput->pData[paramIndex];
  if (pColInfo == NULL) {
    pColInfo = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    if (pColInfo == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // Set the correct column info (data type and bytes)
    pColInfo->info.type = pFuncParam->param.nType;
    pColInfo->info.bytes = pFuncParam->param.nLen;

    pInput->pData[paramIndex] = pColInfo;
  }

  colInfoDataEnsureCapacity(pColInfo, numOfRows);

  int8_t type = pFuncParam->param.nType;
  if (type == TSDB_DATA_TYPE_BIGINT || type == TSDB_DATA_TYPE_UBIGINT) {
    int64_t v = pFuncParam->param.i;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendInt64(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_DOUBLE) {
    double v = pFuncParam->param.d;
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppendDouble(pColInfo, i, &v);
    }
  } else if (type == TSDB_DATA_TYPE_VARCHAR) {
    // build the var-string (header + payload) once and append it for every row
    char* tmp = taosMemoryMalloc(pFuncParam->param.nLen + VARSTR_HEADER_SIZE);
    if (tmp == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    STR_WITH_SIZE_TO_VARSTR(tmp, pFuncParam->param.pz, pFuncParam->param.nLen);
    for (int32_t i = 0; i < numOfRows; ++i) {
      colDataAppend(pColInfo, i, tmp, false);
    }

    // the column holds its own copy of each appended value, so the scratch buffer is
    // released here; it used to be leaked on every call
    taosMemoryFree(tmp);
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
497
/*
 * Bind the columns of pBlock as the input of every expression context of the operator.
 *
 * For each expression the scan order, scan flag, source block, row count and block uid are
 * recorded and block statistics are disabled. Then every parameter is bound:
 *   - column parameters point at the matching column (by slot id) of pBlock; for implicit
 *     timestamp functions the last parameter is additionally recorded as pPTS;
 *   - a value parameter is expanded into a constant column only when createDummyCol is set
 *     and it is the single parameter of the expression.
 *
 * Returns TSDB_CODE_SUCCESS, or the error code from building a constant column.
 */
static int32_t doSetInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order,
                                   int32_t scanFlag, bool createDummyCol) {
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
    SqlFunctionCtx*       pOneCtx = &pCtx[i];
    SInputColumnInfoData* pInput = &pOneCtx->input;

    pOneCtx->order = order;
    pInput->numOfRows = pBlock->info.rows;

    pOneCtx->pSrcBlock = pBlock;
    pOneCtx->scanFlag = scanFlag;

    pInput->uid = pBlock->info.uid;
    pInput->colDataAggIsSet = false;

    SExprInfo* pOneExpr = &pOperator->exprSupp.pExprInfo[i];
    for (int32_t j = 0; j < pOneExpr->base.numOfParams; ++j) {
      SFunctParam* pFuncParam = &pOneExpr->base.pParam[j];

      if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
        // todo avoid case: top(k, 12), 12 is the value parameter.
        // sum(11), 11 is also the value parameter.
        if (!createDummyCol || pOneExpr->base.numOfParams != 1) {
          continue;
        }

        pInput->totalRows = pBlock->info.rows;
        pInput->numOfRows = pBlock->info.rows;
        pInput->startRowIndex = 0;

        int32_t code = doCreateConstantValColumnInfo(pInput, pFuncParam, j, pBlock->info.rows);
        if (code != TSDB_CODE_SUCCESS) {
          return code;
        }

        continue;
      }

      if (pFuncParam->type != FUNC_PARAM_TYPE_COLUMN) {
        continue;
      }

      int32_t slotId = pFuncParam->pCol->slotId;
      pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
      pInput->totalRows = pBlock->info.rows;
      pInput->numOfRows = pBlock->info.rows;
      pInput->startRowIndex = 0;

      // NOTE: the last parameter is the primary timestamp column
      // todo: refactor this
      if (fmIsImplicitTsFunc(pOneCtx->functionId) && (j == pOneExpr->base.numOfParams - 1)) {
        // in case of merge function, this is not always the ts column data.
        pInput->pPTS = pInput->pData[j];
      }

      ASSERT(pInput->pData[j] != NULL);
    }
  }

  return TSDB_CODE_SUCCESS;
}

549
// Runs the process callback of every expression context that needs to execute.
// Contexts without a process callback are skipped. Returns TSDB_CODE_SUCCESS, or the first
// error code reported by a callback (which is also logged).
static int32_t doAggregateImpl(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx) {
  for (int32_t k = 0; k < pOperator->exprSupp.numOfExprs; ++k) {
    SqlFunctionCtx* pOneCtx = &pCtx[k];

    // todo add a dummy function to avoid the process check
    if (!functionNeedToExecute(pOneCtx) || pOneCtx->fpSet.process == NULL) {
      continue;
    }

    int32_t code = pOneCtx->fpSet.process(pOneCtx);
    if (code != TSDB_CODE_SUCCESS) {
      qError("%s aggregate function error happens, code: %s", GET_TASKID(pOperator->pTaskInfo), tstrerror(code));
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
568
// For as many contexts as there are entries in pPseudoList, points pCtx[i].pOutput at the
// i-th column of pResult. Does nothing when pPseudoList is NULL.
static void setPseudoOutputColInfo(SSDataBlock* pResult, SqlFunctionCtx* pCtx, SArray* pPseudoList) {
  if (pPseudoList == NULL) {
    return;
  }

  size_t numOfPseudo = taosArrayGetSize(pPseudoList);
  for (int32_t i = 0; i < numOfPseudo; ++i) {
    pCtx[i].pOutput = taosArrayGet(pResult->pDataBlock, i);
  }
}

575
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
X
Xiaoyu Wang 已提交
576
                              int32_t numOfOutput, SArray* pPseudoList) {
H
Haojun Liao 已提交
577
  setPseudoOutputColInfo(pResult, pCtx, pPseudoList);
578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597

  if (pSrcBlock == NULL) {
    for (int32_t k = 0; k < numOfOutput; ++k) {
      int32_t outputSlotId = pExpr[k].base.resSchema.slotId;

      ASSERT(pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE);
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);

      int32_t type = pExpr[k].base.pParam[0].param.nType;
      if (TSDB_DATA_TYPE_NULL == type) {
        colDataAppendNNULL(pColInfoData, 0, 1);
      } else {
        colDataAppend(pColInfoData, 0, taosVariantGet(&pExpr[k].base.pParam[0].param, type), false);
      }
    }

    pResult->info.rows = 1;
    return TSDB_CODE_SUCCESS;
  }

H
Haojun Liao 已提交
598
  pResult->info.groupId = pSrcBlock->info.groupId;
H
Haojun Liao 已提交
599

600 601
  // if the source equals to the destination, it is to create a new column as the result of scalar
  // function or some operators.
602 603
  bool createNewColModel = (pResult == pSrcBlock);

604 605
  int32_t numOfRows = 0;

606
  for (int32_t k = 0; k < numOfOutput; ++k) {
607 608
    int32_t               outputSlotId = pExpr[k].base.resSchema.slotId;
    SqlFunctionCtx*       pfCtx = &pCtx[k];
609
    SInputColumnInfoData* pInputData = &pfCtx->input;
610

L
Liu Jicong 已提交
611
    if (pExpr[k].pExpr->nodeType == QUERY_NODE_COLUMN) {  // it is a project query
612
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
613
      if (pResult->info.rows > 0 && !createNewColModel) {
614 615
        colDataMergeCol(pColInfoData, pResult->info.rows, &pResult->info.capacity, pInputData->pData[0],
                        pInputData->numOfRows);
616
      } else {
617
        colDataAssign(pColInfoData, pInputData->pData[0], pInputData->numOfRows, &pResult->info);
618
      }
619

620
      numOfRows = pInputData->numOfRows;
621
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_VALUE) {
622
      SColumnInfoData* pColInfoData = taosArrayGet(pResult->pDataBlock, outputSlotId);
623

dengyihao's avatar
dengyihao 已提交
624
      int32_t offset = createNewColModel ? 0 : pResult->info.rows;
625 626 627 628 629 630 631 632

      int32_t type = pExpr[k].base.pParam[0].param.nType;
      if (TSDB_DATA_TYPE_NULL == type) {
        colDataAppendNNULL(pColInfoData, offset, pSrcBlock->info.rows);
      } else {
        for (int32_t i = 0; i < pSrcBlock->info.rows; ++i) {
          colDataAppend(pColInfoData, i + offset, taosVariantGet(&pExpr[k].base.pParam[0].param, type), false);
        }
633
      }
634 635

      numOfRows = pSrcBlock->info.rows;
H
Haojun Liao 已提交
636
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_OPERATOR) {
637 638 639
      SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
      taosArrayPush(pBlockList, &pSrcBlock);

640
      SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
641
      SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
642

643
      SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
644
      int32_t      code = scalarCalculate(pExpr[k].pExpr->_optrRoot.pRootNode, pBlockList, &dest);
645 646 647 648
      if (code != TSDB_CODE_SUCCESS) {
        taosArrayDestroy(pBlockList);
        return code;
      }
649

dengyihao's avatar
dengyihao 已提交
650
      int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
651
      ASSERT(pResult->info.capacity > 0);
652
      colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
653
      colDataDestroy(&idata);
L
Liu Jicong 已提交
654

655
      numOfRows = dest.numOfRows;
656 657
      taosArrayDestroy(pBlockList);
    } else if (pExpr[k].pExpr->nodeType == QUERY_NODE_FUNCTION) {
658 659
      // _rowts/_c0, not tbname column
      if (fmIsPseudoColumnFunc(pfCtx->functionId) && (!fmIsScanPseudoColumnFunc(pfCtx->functionId))) {
H
Haojun Liao 已提交
660
        // do nothing
661
      } else if (fmIsIndefiniteRowsFunc(pfCtx->functionId)) {
662 663
        SResultRowEntryInfo* pResInfo = GET_RES_INFO(pfCtx);
        pfCtx->fpSet.init(pfCtx, pResInfo);
664 665 666 667 668 669 670 671 672 673

        pfCtx->pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
        pfCtx->offset = createNewColModel ? 0 : pResult->info.rows;  // set the start offset

        // set the timestamp(_rowts) output buffer
        if (taosArrayGetSize(pPseudoList) > 0) {
          int32_t* outputColIndex = taosArrayGet(pPseudoList, 0);
          pfCtx->pTsOutput = (SColumnInfoData*)pCtx[*outputColIndex].pOutput;
        }

674 675 676 677 678
        // link pDstBlock to set selectivity value
        if (pfCtx->subsidiaries.num > 0) {
          pfCtx->pDstBlock = pResult;
        }

679
        numOfRows = pfCtx->fpSet.process(pfCtx);
H
Haojun Liao 已提交
680
      } else if (fmIsAggFunc(pfCtx->functionId)) {
G
Ganlin Zhao 已提交
681
        // selective value output should be set during corresponding function execution
682 683 684
        if (fmIsSelectValueFunc(pfCtx->functionId)) {
          continue;
        }
685 686
        // _group_key function for "partition by tbname" + csum(col_name) query
        SColumnInfoData* pOutput = taosArrayGet(pResult->pDataBlock, outputSlotId);
687
        int32_t          slotId = pfCtx->param[0].pCol->slotId;
688 689 690

        // todo handle the json tag
        SColumnInfoData* pInput = taosArrayGet(pSrcBlock->pDataBlock, slotId);
691
        for (int32_t f = 0; f < pSrcBlock->info.rows; ++f) {
692 693 694 695 696 697 698 699 700
          bool isNull = colDataIsNull_s(pInput, f);
          if (isNull) {
            colDataAppendNULL(pOutput, pResult->info.rows + f);
          } else {
            char* data = colDataGetData(pInput, f);
            colDataAppend(pOutput, pResult->info.rows + f, data, isNull);
          }
        }

H
Haojun Liao 已提交
701 702 703
      } else {
        SArray* pBlockList = taosArrayInit(4, POINTER_BYTES);
        taosArrayPush(pBlockList, &pSrcBlock);
G
Ganlin Zhao 已提交
704

705
        SColumnInfoData* pResColData = taosArrayGet(pResult->pDataBlock, outputSlotId);
706
        SColumnInfoData  idata = {.info = pResColData->info, .hasNull = true};
H
Haojun Liao 已提交
707

708
        SScalarParam dest = {.columnData = &idata};
X
Xiaoyu Wang 已提交
709
        int32_t      code = scalarCalculate((SNode*)pExpr[k].pExpr->_function.pFunctNode, pBlockList, &dest);
710 711 712 713
        if (code != TSDB_CODE_SUCCESS) {
          taosArrayDestroy(pBlockList);
          return code;
        }
714

dengyihao's avatar
dengyihao 已提交
715
        int32_t startOffset = createNewColModel ? 0 : pResult->info.rows;
716
        ASSERT(pResult->info.capacity > 0);
717
        colDataMergeCol(pResColData, startOffset, &pResult->info.capacity, &idata, dest.numOfRows);
D
dapan1121 已提交
718
        colDataDestroy(&idata);
719 720

        numOfRows = dest.numOfRows;
H
Haojun Liao 已提交
721 722
        taosArrayDestroy(pBlockList);
      }
723
    } else {
724
      return TSDB_CODE_OPS_NOT_SUPPORT;
725 726
    }
  }
727

728 729 730
  if (!createNewColModel) {
    pResult->info.rows += numOfRows;
  }
731 732

  return TSDB_CODE_SUCCESS;
733 734
}

5
54liuyao 已提交
735
// Decides whether the function bound to pCtx has to run on the current input:
//   - never when functionId is -1,
//   - during a repeat scan only if the function is a repeat-scan function,
//   - otherwise only while its result entry is not completed yet.
bool functionNeedToExecute(SqlFunctionCtx* pCtx) {
  struct SResultRowEntryInfo* pResInfo = GET_RES_INFO(pCtx);

  if (pCtx->functionId == -1) {
    return false;
  }

  if (pCtx->scanFlag == REPEAT_SCAN) {
    return fmIsRepeatScanFunc(pCtx->functionId);
  }

  return !isRowEntryCompleted(pResInfo);
}

755 756 757 758 759 760 761
/*
 * Build the column info and the pre-aggregated statistics for a constant-valued function
 * parameter, as if the constant were a column of numOfRows identical values.
 *
 * pInput      input descriptor whose pData[paramIndex] / pColumnDataAgg[paramIndex] slots are
 *             lazily allocated here and reused on later calls
 * pFuncParam  the constant parameter; param.i or param.d is read depending on type
 * type        data type of the constant; variable-length types are rejected by ASSERT
 * paramIndex  slot of the parameter inside pInput
 * numOfRows   number of rows the constant stands for (used to compute the sum)
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when one of the allocations fails.
 */
static int32_t doCreateConstantValColumnAggInfo(SInputColumnInfoData* pInput, SFunctParam* pFuncParam, int32_t type,
                                                int32_t paramIndex, int32_t numOfRows) {
  if (pInput->pData[paramIndex] == NULL) {
    SColumnInfoData* pCol = taosMemoryCalloc(1, sizeof(SColumnInfoData));
    pInput->pData[paramIndex] = pCol;
    if (pCol == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // only the type and width are filled in for the freshly allocated column info
    pCol->info.type = type;
    pCol->info.bytes = tDataTypes[type].bytes;
  }

  SColumnDataAgg* pAgg = pInput->pColumnDataAgg[paramIndex];
  if (pAgg == NULL) {
    pAgg = taosMemoryCalloc(1, sizeof(SColumnDataAgg));
    pInput->pColumnDataAgg[paramIndex] = pAgg;
    if (pAgg == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  ASSERT(!IS_VAR_DATA_TYPE(type));

  switch (type) {
    case TSDB_DATA_TYPE_BIGINT: {
      int64_t v = pFuncParam->param.i;
      *pAgg = (SColumnDataAgg){.numOfNull = 0, .min = v, .max = v, .sum = v * numOfRows};
      break;
    }

    case TSDB_DATA_TYPE_DOUBLE: {
      double v = pFuncParam->param.d;
      *pAgg = (SColumnDataAgg){.numOfNull = 0};

      // the statistics fields are reinterpreted as double storage for this type
      *(double*)&pAgg->min = v;
      *(double*)&pAgg->max = v;
      *(double*)&pAgg->sum = v * numOfRows;
      break;
    }

    case TSDB_DATA_TYPE_BOOL: {  // todo validate this data type
      bool v = pFuncParam->param.i;
      *pAgg = (SColumnDataAgg){.numOfNull = 0};

      // NOTE(review): min is always written as false, even when v is true, and sum is stored
      // through a bool pointer so it collapses to 0/1 -- confirm this is what consumers expect.
      *(bool*)&pAgg->min = 0;
      *(bool*)&pAgg->max = v;
      *(bool*)&pAgg->sum = v * numOfRows;
      break;
    }

    case TSDB_DATA_TYPE_TIMESTAMP:
      // no statistics are generated for timestamp constants
      break;

    default:
      ASSERT(0);
      break;
  }

  return TSDB_CODE_SUCCESS;
}
806

807
/*
 * Bind the pre-aggregated statistics (SMA) of pBlock to the input of one function context.
 *
 * pCtx       function context whose input descriptor is filled in
 * pExprInfo  expression the context evaluates; its parameter list drives the binding
 * pBlock     data block; pBlock->pBlockAgg == NULL means no statistics are available
 *
 * On return pCtx->input.colDataAggIsSet is true only if the block carries statistics, every
 * column parameter has a non-NULL statistics entry and every constant parameter could be
 * materialized.
 */
void setBlockSMAInfo(SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, SSDataBlock* pBlock) {
  int32_t numOfRows = pBlock->info.rows;

  SInputColumnInfoData* pInput = &pCtx->input;
  pInput->numOfRows = numOfRows;
  pInput->totalRows = numOfRows;

  if (pBlock->pBlockAgg == NULL) {
    pInput->colDataAggIsSet = false;
    return;
  }

  pInput->colDataAggIsSet = true;

  for (int32_t j = 0; j < pExprInfo->base.numOfParams; ++j) {
    SFunctParam* pFuncParam = &pExprInfo->base.pParam[j];

    if (pFuncParam->type == FUNC_PARAM_TYPE_COLUMN) {
      int32_t slotId = pFuncParam->pCol->slotId;
      pInput->pColumnDataAgg[j] = pBlock->pBlockAgg[slotId];
      if (pInput->pColumnDataAgg[j] == NULL) {
        pInput->colDataAggIsSet = false;
      }

      // Here we set the column info data since the data type for each column data is required, but
      // the data in the corresponding SColumnInfoData will not be used.
      pInput->pData[j] = taosArrayGet(pBlock->pDataBlock, slotId);
    } else if (pFuncParam->type == FUNC_PARAM_TYPE_VALUE) {
      int32_t code = doCreateConstantValColumnAggInfo(pInput, pFuncParam, pFuncParam->param.nType, j, numOfRows);
      if (code != TSDB_CODE_SUCCESS) {
        // This function cannot report errors, so treat the failure like a missing column
        // statistic: do not advertise aggregated input that may be incomplete.
        qError("failed to build statistics for constant parameter %d, code %s", j, tstrerror(code));
        pInput->colDataAggIsSet = false;
      }
    }
  }

  // todo: set the statistics data for the primary timestamp column (previously done for the
  //       spread function using pBlock->info.window.skey/ekey as min/max)
}

L
Liu Jicong 已提交
846
/*
 * Report whether the task should be aborted.
 *
 * Currently this always returns false. For an owned task whose elapsed time exceeds ten times
 * the maximum idle duration, the only remaining action is an assertion that the start time was
 * recorded; the code that logged the timeout and returned true is disabled.
 */
bool isTaskKilled(SExecTaskInfo* pTaskInfo) {
  if (pTaskInfo->owner == 0) {
    return false;
  }

  // query has been executed more than tsShellActivityTimer, and the retrieve has not arrived
  if ((taosGetTimestampSec() - pTaskInfo->cost.start / 1000) > 10 * getMaximumIdleDurationSec()) {
    /*(!needBuildResAfterQueryComplete(pTaskInfo))*/
    assert(pTaskInfo->cost.start != 0);

    // disabled: abort current query execution
    //    qDebug("QInfo:%" PRIu64 " retrieve not arrive beyond %d ms, abort current query execution, start:%" PRId64
    //           ", current:%d", pQInfo->qId, 1, pQInfo->startExecTs, taosGetTimestampSec());
    //    return true;
  }

  return false;
}

L
Liu Jicong 已提交
861
// Mark the task as cancelled by storing TSDB_CODE_TSC_QUERY_CANCELLED in its result code.
void setTaskKilled(SExecTaskInfo* pTaskInfo) {
  pTaskInfo->code = TSDB_CODE_TSC_QUERY_CANCELLED;
}
862 863

/////////////////////////////////////////////////////////////////////////////////////////////
864
/*
 * Compute the interval-aligned time window for the timestamp `key`.
 *
 * The start key is `key` truncated by taosTimeTruncate(); the end key is one tick before the
 * start key advanced by one interval. If the computed end key falls below the start key
 * (presumably arithmetic overflow near INT64_MAX -- confirm), it is clamped to INT64_MAX.
 */
STimeWindow getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key) {
  STimeWindow aligned = {.skey = taosTimeTruncate(key, pInterval, precision)};

  aligned.ekey = taosTimeAdd(aligned.skey, pInterval->interval, pInterval->intervalUnit, precision) - 1;
  if (aligned.ekey < aligned.skey) {
    aligned.ekey = INT64_MAX;
  }

  return aligned;
}

880
#if 0
L
Liu Jicong 已提交
881
/*
 * (disabled code) Refine the block load status according to the functions in the query.
 *
 * A status of BLK_DATA_DATA_LOAD or BLK_DATA_FILTEROUT is returned unchanged. Otherwise, when
 * the query contains first/last functions and the status is BLK_DATA_NOT_LOAD, the block is
 * filtered out if no other function is present, and fully loaded if one is.
 */
static int32_t updateBlockLoadStatus(STaskAttr* pQuery, int32_t status) {
  if (status == BLK_DATA_DATA_LOAD || status == BLK_DATA_FILTEROUT) {
    return status;
  }

  bool sawFirstLast = false;
  bool sawOther = false;

  for (int32_t idx = 0; idx < pQuery->numOfOutput; ++idx) {
    const int32_t fid = getExprFunctionId(&pQuery->pExpr1[idx]);

    // timestamp and tag pseudo functions do not influence the decision
    const bool isPseudo = (fid == FUNCTION_TS || fid == FUNCTION_TS_DUMMY || fid == FUNCTION_TAG ||
                           fid == FUNCTION_TAG_DUMMY);
    if (isPseudo) {
      continue;
    }

    const bool isFirstLast = (fid == FUNCTION_FIRST_DST || fid == FUNCTION_LAST_DST);
    sawFirstLast = sawFirstLast || isFirstLast;
    sawOther = sawOther || !isFirstLast;
  }

  if (!(sawFirstLast && status == BLK_DATA_NOT_LOAD)) {
    return status;
  }

  return sawOther ? BLK_DATA_DATA_LOAD : BLK_DATA_FILTEROUT;
}

917 918
#endif

L
Liu Jicong 已提交
919 920
// static void updateDataCheckOrder(SQInfo *pQInfo, SQueryTableReq* pQueryMsg, bool stableQuery) {
//   STaskAttr* pQueryAttr = pQInfo->runtimeEnv.pQueryAttr;
H
Haojun Liao 已提交
921
//
L
Liu Jicong 已提交
922 923 924 925
//   // in case of point-interpolation query, use asc order scan
//   char msg[] = "QInfo:0x%"PRIx64" scan order changed for %s query, old:%d, new:%d, qrange exchanged, old qrange:%"
//   PRId64
//                "-%" PRId64 ", new qrange:%" PRId64 "-%" PRId64;
H
Haojun Liao 已提交
926
//
L
Liu Jicong 已提交
927 928 929 930 931
//   // todo handle the case the the order irrelevant query type mixed up with order critical query type
//   // descending order query for last_row query
//   if (isFirstLastRowQuery(pQueryAttr)) {
//     //qDebug("QInfo:0x%"PRIx64" scan order changed for last_row query, old:%d, new:%d", pQInfo->qId,
//     pQueryAttr->order.order, TSDB_ORDER_ASC);
H
Haojun Liao 已提交
932
//
L
Liu Jicong 已提交
933 934
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
935
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
936
//     }
H
Haojun Liao 已提交
937
//
L
Liu Jicong 已提交
938 939 940
//     pQueryAttr->needReverseScan = false;
//     return;
//   }
H
Haojun Liao 已提交
941
//
L
Liu Jicong 已提交
942 943 944
//   if (pQueryAttr->groupbyColumn && pQueryAttr->order.order == TSDB_ORDER_DESC) {
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     if (pQueryAttr->window.skey > pQueryAttr->window.ekey) {
wafwerar's avatar
wafwerar 已提交
945
//       TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
L
Liu Jicong 已提交
946
//     }
H
Haojun Liao 已提交
947
//
L
Liu Jicong 已提交
948 949 950 951
//     pQueryAttr->needReverseScan = false;
//     doUpdateLastKey(pQueryAttr);
//     return;
//   }
H
Haojun Liao 已提交
952
//
L
Liu Jicong 已提交
953 954 955 956 957 958
//   if (pQueryAttr->pointInterpQuery && pQueryAttr->interval.interval == 0) {
//     if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       //qDebug(msg, pQInfo->qId, "interp", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey); TSWAP(pQueryAttr->window.skey,
//       pQueryAttr->window.ekey, TSKEY);
//     }
H
Haojun Liao 已提交
959
//
L
Liu Jicong 已提交
960 961 962
//     pQueryAttr->order.order = TSDB_ORDER_ASC;
//     return;
//   }
H
Haojun Liao 已提交
963
//
L
Liu Jicong 已提交
964 965 966 967
//   if (pQueryAttr->interval.interval == 0) {
//     if (onlyFirstQuery(pQueryAttr)) {
//       if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//         //qDebug(msg, pQInfo->qId, "only-first", pQueryAttr->order.order, TSDB_ORDER_ASC, pQueryAttr->window.skey,
H
Haojun Liao 已提交
968 969
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
970
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
971 972 973 974 975 976 977 978 979 980
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_ASC;
//      pQueryAttr->needReverseScan = false;
//    } else if (onlyLastQuery(pQueryAttr) && notContainSessionOrStateWindow(pQueryAttr)) {
//      if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//        //qDebug(msg, pQInfo->qId, "only-last", pQueryAttr->order.order, TSDB_ORDER_DESC, pQueryAttr->window.skey,
////               pQueryAttr->window.ekey, pQueryAttr->window.ekey, pQueryAttr->window.skey);
//
wafwerar's avatar
wafwerar 已提交
981
//        TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
982 983 984 985 986 987 988 989 990 991 992 993
//        doUpdateLastKey(pQueryAttr);
//      }
//
//      pQueryAttr->order.order = TSDB_ORDER_DESC;
//      pQueryAttr->needReverseScan = false;
//    }
//
//  } else {  // interval query
//    if (stableQuery) {
//      if (onlyFirstQuery(pQueryAttr)) {
//        if (!QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-first stable", pQueryAttr->order.order, TSDB_ORDER_ASC,
L
Liu Jicong 已提交
994 995
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
996
//
wafwerar's avatar
wafwerar 已提交
997
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
998 999 1000 1001 1002 1003 1004 1005
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_ASC;
//        pQueryAttr->needReverseScan = false;
//      } else if (onlyLastQuery(pQueryAttr)) {
//        if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//          //qDebug(msg, pQInfo->qId, "only-last stable", pQueryAttr->order.order, TSDB_ORDER_DESC,
L
Liu Jicong 已提交
1006 1007
////                 pQueryAttr->window.skey, pQueryAttr->window.ekey, pQueryAttr->window.ekey,
/// pQueryAttr->window.skey);
H
Haojun Liao 已提交
1008
//
wafwerar's avatar
wafwerar 已提交
1009
//          TSWAP(pQueryAttr->window.skey, pQueryAttr->window.ekey);
H
Haojun Liao 已提交
1010 1011 1012 1013 1014 1015 1016 1017 1018
//          doUpdateLastKey(pQueryAttr);
//        }
//
//        pQueryAttr->order.order = TSDB_ORDER_DESC;
//        pQueryAttr->needReverseScan = false;
//      }
//    }
//  }
//}
1019

1020
#if 0
H
Haojun Liao 已提交
1021
/*
 * (disabled code) Check whether a data block straddles an interval window boundary.
 *
 * NOTE(review): the calls that would position and advance the window `w` are commented out,
 * so `w` stays zero-initialized; the loops below only terminate through their break/return
 * conditions on that fixed value. This must be restored before the function is re-enabled.
 */
static bool overlapWithTimeWindow(STaskAttr* pQueryAttr, SDataBlockInfo* pBlockInfo) {
  STimeWindow w = {0};

  TSKEY sk = TMIN(pQueryAttr->window.skey, pQueryAttr->window.ekey);
  TSKEY ek = TMAX(pQueryAttr->window.skey, pQueryAttr->window.ekey);

  const TSKEY blockStart = pBlockInfo->window.skey;
  const TSKEY blockEnd = pBlockInfo->window.ekey;

  if (true) {
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.skey, sk, ek, &w);
    assert(w.ekey >= blockStart);

    if (w.ekey < blockEnd) {
      return true;
    }

    for (;;) {
      //      getNextTimeWindow(pQueryAttr, &w);
      if (w.skey > blockEnd) {
        return false;
      }

      assert(w.ekey > blockEnd);
      if (w.skey <= blockEnd && w.skey > blockStart) {
        return true;
      }
    }
  } else {
    //    getAlignQueryTimeWindow(pQueryAttr, pBlockInfo->window.ekey, sk, ek, &w);
    assert(w.skey <= blockEnd);

    if (w.skey > blockStart) {
      return true;
    }

    for (;;) {
      //      getNextTimeWindow(pQueryAttr, &w);
      if (w.ekey < blockStart) {
        return false;
      }

      assert(w.skey < blockStart);
      if (w.ekey < blockEnd && w.ekey >= blockStart) {
        return true;
      }
    }
  }

  return false;
}
1069
#endif
1070 1071

/*
 * Decide how much of a block has to be loaded based on the functions of the scan.
 *
 * The per-function logic is compiled out; the function currently always returns 0.
 */
static uint32_t doFilterByBlockTimeWindow(STableScanInfo* pTableScanInfo, SSDataBlock* pBlock) {
#if 0
  SqlFunctionCtx* pCtx = pTableScanInfo->pCtx;
  uint32_t        loadStatus = BLK_DATA_NOT_LOAD;

  int32_t numOfOutput = 0;  // pTableScanInfo->numOfOutput;
  for (int32_t idx = 0; idx < numOfOutput; ++idx) {
    int32_t functionId = pCtx[idx].functionId;
    int32_t colId = pTableScanInfo->pExpr[idx].base.pParam[0].pCol->colId;

    // group by + first/last should not apply the first/last block filter
    if (functionId < 0) {
      return loadStatus | BLK_DATA_DATA_LOAD;
    }

    //      loadStatus |= aAggs[functionId].dataReqFunc(&pTableScanInfo->pCtx[idx], &pBlock->info.window, colId);
    //      if ((loadStatus & BLK_DATA_DATA_LOAD) == BLK_DATA_DATA_LOAD) {
    //        return loadStatus;
    //      }
  }

  return loadStatus;
#endif
  return 0;
}

L
Liu Jicong 已提交
1098 1099
/*
 * Reset the load state of a block before it is handed to the scan operator.
 *
 * pTaskInfo        unused at present
 * pTableScanInfo   unused at present
 * pBlock           its pDataBlock and pBlockAgg pointers are reset to NULL
 * status           receives BLK_DATA_NOT_LOAD
 *
 * Always returns TSDB_CODE_SUCCESS.
 *
 * The previous on-demand loading logic was compiled out with `#if 0` and has been removed
 * from this body: it referenced identifiers that are no longer declared here (pQueryAttr,
 * pRuntimeEnv, groupId, ascQuery) and therefore could not be re-enabled as written. In outline
 * it (1) forced a full load for group-by, session-window and overlapping interval queries,
 * (2) otherwise asked doFilterByBlockTimeWindow() for the required load level, (3) counted
 * skipped/loaded blocks in the task cost info, and (4) applied top/bottom and SMA based block
 * filters before loading the data. Consult the version history when reviving it.
 *
 * NOTE(review): the existing pDataBlock / pBlockAgg pointers are overwritten without being
 * released; presumably the caller still owns them -- confirm.
 */
int32_t loadDataBlockOnDemand(SExecTaskInfo* pTaskInfo, STableScanInfo* pTableScanInfo, SSDataBlock* pBlock,
                              uint32_t* status) {
  (void)pTaskInfo;
  (void)pTableScanInfo;

  *status = BLK_DATA_NOT_LOAD;

  pBlock->pDataBlock = NULL;
  pBlock->pBlockAgg = NULL;

  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
1241
/*
 * Prepare per-table query state for a reverse scan.
 *
 * Every step is currently disabled, so the function has no effect; the disabled steps are
 * kept below for reference.
 */
static void updateTableQueryInfoForReverseScan(STableQueryInfo* pTableQueryInfo) {
  if (pTableQueryInfo != NULL) {
    // swap the scan range and restart from its new beginning
    //  TSWAP(pTableQueryInfo->win.skey, pTableQueryInfo->win.ekey);
    //  pTableQueryInfo->lastKey = pTableQueryInfo->win.skey;

    //  SWITCH_ORDER(pTableQueryInfo->cur.order);
    //  pTableQueryInfo->cur.vgroupIndex = -1;

    // set the index to be the end slot of result rows array
    //  SResultRowInfo* pResultRowInfo = &pTableQueryInfo->resInfo;
    //  if (pResultRowInfo->size > 0) {
    //    pResultRowInfo->curPos = pResultRowInfo->size - 1;
    //  } else {
    //    pResultRowInfo->curPos = -1;
    //  }
  }
}

H
Haojun Liao 已提交
1261
/*
 * Initialize a result row. Currently a no-op: the assignment of the entry-info pointer
 * (placed right after the SResultRow header) is disabled.
 */
void initResultRow(SResultRow* pResultRow) {
  (void)pResultRow;
  //  pResultRow->pEntryInfo = (struct SResultRowEntryInfo*)((char*)pResultRow + sizeof(SResultRow));
}

L
Liu Jicong 已提交
1265
/*
 * Update the status of a task.
 *
 * TASK_NOT_COMPLETED replaces the current status as a whole. Any other value is OR-ed into
 * the status after TASK_NOT_COMPLETED has been cleared from it, because that state is not
 * compatible with any other one.
 */
void setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status) {
  if (status != TASK_NOT_COMPLETED) {
    CLEAR_QUERY_STATUS(pTaskInfo, TASK_NOT_COMPLETED);
    pTaskInfo->status |= status;
    return;
  }

  pTaskInfo->status = status;
}

L
Liu Jicong 已提交
1275
/*
 * Release the resources held by a table query info object.
 *
 * Both cleanup steps are currently disabled, so the function has no effect; NULL is accepted.
 */
void destroyTableQueryInfoImpl(STableQueryInfo* pTableQueryInfo) {
  if (pTableQueryInfo != NULL) {
    //  taosVariantDestroy(&pTableQueryInfo->tag);
    //  cleanupResultRowInfo(&pTableQueryInfo->resInfo);
  }
}

1284
/*
 * Point every function context at its entry inside pResult and initialize entries on demand.
 *
 * pResult             result row that holds the per-function entries
 * pCtx                array of numOfOutput function contexts
 * numOfOutput         number of contexts / entries
 * rowEntryInfoOffset  offsets handed to getResultEntryInfo() to locate each entry
 *
 * The resultInfo pointer is refreshed for all contexts. Initialization is skipped for entries
 * that are both completed and initialized and for window pseudo-column functions. As soon as
 * one entry is found to be initialized already, the remaining entries are only re-bound and
 * no further initialization is attempted.
 */
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowEntryInfoOffset) {
  bool rowAlreadyInit = false;

  for (int32_t idx = 0; idx < numOfOutput; ++idx) {
    SqlFunctionCtx* pCur = &pCtx[idx];
    pCur->resultInfo = getResultEntryInfo(pResult, idx, rowEntryInfoOffset);

    struct SResultRowEntryInfo* pEntry = pCur->resultInfo;
    if (rowAlreadyInit || (isRowEntryCompleted(pEntry) && isRowEntryInitialized(pEntry)) ||
        fmIsWindowPseudoColumnFunc(pCur->functionId)) {
      continue;
    }

    if (pEntry->initialized) {
      rowAlreadyInit = true;
    } else if (pCur->functionId == -1) {
      // no function attached: just flag the entry as initialized
      pEntry->initialized = true;
    } else {
      pCur->fpSet.init(pCur, pEntry);
    }
  }
}

H
Haojun Liao 已提交
1313
static void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep);
1314

1315
/*
 * Apply a filter condition to a data block in place.
 *
 * pFilterNode    filter expression; NULL means nothing to do
 * pBlock         block to filter; an empty block is returned untouched
 * pColMatchInfo  optional column match list; when it contains the primary timestamp column
 *                and the target column is of timestamp type, the block's time window is
 *                refreshed after filtering
 *
 * The filter is built from the node on every call, executed, and released again. Rows that
 * do not qualify are removed by extractQualifiedTupleByFilterResult().
 *
 * Failures of the filter set-up calls cannot be propagated through the void signature; they
 * are logged and processing continues exactly as before.
 */
void doFilter(const SNode* pFilterNode, SSDataBlock* pBlock, const SArray* pColMatchInfo) {
  if (pFilterNode == NULL || pBlock->info.rows == 0) {
    return;
  }

  SFilterInfo* filter = NULL;

  // todo move to the initialization function
  int32_t code = filterInitFromNode((SNode*)pFilterNode, &filter, 0);
  if (code != TSDB_CODE_SUCCESS) {
    qError("failed to init filter from condition node, code %s", tstrerror(code));
  }

  size_t             numOfCols = taosArrayGetSize(pBlock->pDataBlock);
  SFilterColumnParam param1 = {.numOfCols = numOfCols, .pDataBlock = pBlock->pDataBlock};
  code = filterSetDataFromSlotId(filter, &param1);
  if (code != TSDB_CODE_SUCCESS) {
    qError("failed to bind block columns to filter, code %s", tstrerror(code));
  }

  int8_t* rowRes = NULL;

  // todo the keep seems never to be True??
  bool keep = filterExecute(filter, pBlock, &rowRes, NULL, param1.numOfCols);
  filterFreeInfo(filter);

  extractQualifiedTupleByFilterResult(pBlock, rowRes, keep);

  if (pColMatchInfo != NULL) {
    // the list is not modified inside the loop, so its size is read once
    size_t numOfMatched = taosArrayGetSize(pColMatchInfo);
    for (size_t i = 0; i < numOfMatched; ++i) {
      SColMatchInfo* pInfo = taosArrayGet(pColMatchInfo, i);
      if (pInfo->colId != PRIMARYKEY_TIMESTAMP_COL_ID) {
        continue;
      }

      SColumnInfoData* pColData = taosArrayGet(pBlock->pDataBlock, pInfo->targetSlotId);
      if (pColData->info.type == TSDB_DATA_TYPE_TIMESTAMP) {
        blockDataUpdateTsWindow(pBlock, pInfo->targetSlotId);
        break;
      }
    }
  }

  taosMemoryFree(rowRes);
}

H
Haojun Liao 已提交
1353
/*
 * Compact pBlock so that only the rows accepted by the filter remain.
 *
 * pBlock  block to compact in place
 * rowRes  per-row filter result; a zero entry means the row is dropped. NULL means no row
 *         qualified and the block's row count is set to 0
 * keep    when true the block is left unchanged
 *
 * The surviving rows are copied column by column from a snapshot of the block. Columns that
 * have no data buffer yet (reserved for scalar function output) are skipped.
 */
void extractQualifiedTupleByFilterResult(SSDataBlock* pBlock, const int8_t* rowRes, bool keep) {
  if (keep) {
    return;
  }

  if (rowRes == NULL) {
    pBlock->info.rows = 0;
    return;
  }

  const int32_t totalRows = pBlock->info.rows;

  // NOTE(review): the snapshot pointer is used without a NULL check -- confirm whether
  // createOneDataBlock() can fail here.
  SSDataBlock* pSnapshot = createOneDataBlock(pBlock, true);

  const size_t numOfCols = taosArrayGetSize(pBlock->pDataBlock);
  for (int32_t col = 0; col < numOfCols; ++col) {
    SColumnInfoData* pSrc = taosArrayGet(pSnapshot->pDataBlock, col);
    SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, col);

    // it is a reserved column for scalar function, and no data in this column yet.
    if (pDst->pData == NULL || pSrc->pData == NULL) {
      continue;
    }

    colInfoDataCleanup(pDst, pBlock->info.rows);

    int32_t kept = 0;
    for (int32_t row = 0; row < totalRows; ++row) {
      if (rowRes[row] != 0) {
        if (colDataIsNull_s(pSrc, row)) {
          colDataAppendNULL(pDst, kept);
        } else {
          colDataAppend(pDst, kept, colDataGetData(pSrc, row), false);
        }
        ++kept;
      }
    }

    // the first processed column fixes the new row count; later columns must agree with it
    if (pBlock->info.rows != totalRows) {
      ASSERT(pBlock->info.rows == kept);
    } else {
      pBlock->info.rows = kept;
    }
  }

  blockDataDestroy(pSnapshot);
}

1401
/*
 * Select (and create if necessary) the result row of a group and bind the operator's function
 * contexts to it.
 *
 * pOperator    aggregate operator; its info is an SAggOperatorInfo
 * numOfOutput  number of function contexts to bind
 * groupId      id of the group whose result row becomes the active output
 *
 * For simple group by query without interval, all the tables belong to one group result.
 *
 * If no result buffer page can be attached to a new result row, the failure is logged and
 * execution is aborted through longjmp(pTaskInfo->env, code). Returning silently would leave
 * the function contexts unbound from this row although the caller treats the group as set.
 */
void doSetTableGroupOutputBuf(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId) {
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
  SAggOperatorInfo* pAggInfo = pOperator->info;

  SResultRowInfo* pResultRowInfo = &pAggInfo->binfo.resultRowInfo;
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
  int32_t*        rowEntryInfoOffset = pOperator->exprSupp.rowEntryInfoOffset;

  SResultRow* pResultRow = doSetResultOutBufByKey(pAggInfo->aggSup.pResultBuf, pResultRowInfo, (char*)&groupId,
                                                  sizeof(groupId), true, groupId, pTaskInfo, false, &pAggInfo->aggSup);
  assert(pResultRow != NULL);

  /*
   * not assign result buffer yet, add new result buffer
   * all group belong to one result set, and each group result has different group id so set the id to be one
   */
  if (pResultRow->pageId == -1) {
    int32_t ret =
        addNewWindowResultBuf(pResultRow, pAggInfo->aggSup.pResultBuf, groupId, pAggInfo->binfo.pRes->info.rowSize);
    if (ret != TSDB_CODE_SUCCESS) {
      qError("%s failed to add new result buffer for group, code %s", GET_TASKID(pTaskInfo), tstrerror(ret));
      longjmp(pTaskInfo->env, ret);
    }
  }

  setResultRowInitCtx(pResultRow, pCtx, numOfOutput, rowEntryInfoOffset);
}

1429 1430 1431
/*
 * Make `groupId` the active group of the aggregate operator.
 *
 * Nothing is done when the operator already works on that group. A stored group id of
 * UINT64_MAX never counts as a match, so the output buffer is always set up in that case.
 */
static void setExecutionContext(SOperatorInfo* pOperator, int32_t numOfOutput, uint64_t groupId) {
  SAggOperatorInfo* pAggInfo = pOperator->info;

  const bool sameGroup = (pAggInfo->groupId != UINT64_MAX) && (pAggInfo->groupId == groupId);
  if (!sameGroup) {
    doSetTableGroupOutputBuf(pOperator, numOfOutput, groupId);

    // record the current active group id
    pAggInfo->groupId = groupId;
  }
}

dengyihao's avatar
dengyihao 已提交
1441 1442
/*
 * Derive the number of output rows of a result row from its function entries.
 *
 * pCtx           function contexts, one per expression
 * pRow           result row whose numOfRows is raised to the largest numOfRes found
 * numOfExprs     number of expressions / entries
 * rowCellOffset  offsets handed to getResultEntryInfo() to locate each entry
 *
 * Only initialized entries are considered. If all expressions produced nothing (e.g. max()
 * over NULL-only input), one row is still emitted, unless an initialized entry belongs to a
 * function that requires a not-null output (first/last), in which case no row is emitted.
 */
static void doUpdateNumOfRows(SqlFunctionCtx* pCtx, SResultRow* pRow, int32_t numOfExprs,
                              const int32_t* rowCellOffset) {
  bool requiresNotNull = false;

  for (int32_t idx = 0; idx < numOfExprs; ++idx) {
    struct SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, idx, rowCellOffset);
    if (isRowEntryInitialized(pEntry)) {
      if (pEntry->numOfRes > pRow->numOfRows) {
        pRow->numOfRows = pEntry->numOfRes;
      }

      if (fmIsNotNullOutputFunc(pCtx[idx].functionId)) {
        requiresNotNull = true;
      }
    }
  }

  if (!requiresNotNull && pRow->numOfRows == 0) {
    pRow->numOfRows = 1;
  }
}

1465
// todo extract method with copytoSSDataBlock
1466
int32_t finalizeResultRowIntoResultDataBlock(SDiskbasedBuf* pBuf, SResultRowPosition* resultRowPosition,
S
shenglian zhou 已提交
1467 1468 1469
                                             SqlFunctionCtx* pCtx, SExprInfo* pExprInfo, int32_t numOfExprs,
                                             const int32_t* rowCellOffset, SSDataBlock* pBlock,
                                             SExecTaskInfo* pTaskInfo) {
1470 1471 1472
  SFilePage*  page = getBufPage(pBuf, resultRowPosition->pageId);
  SResultRow* pRow = (SResultRow*)((char*)page + resultRowPosition->offset);

1473
  doUpdateNumOfRows(pCtx, pRow, numOfExprs, rowCellOffset);
1474 1475 1476 1477 1478
  if (pRow->numOfRows == 0) {
    releaseBufPage(pBuf, page);
    return 0;
  }

1479 1480 1481 1482 1483 1484 1485
  while (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
    int32_t code = blockDataEnsureCapacity(pBlock, pBlock->info.capacity * 1.25);
    if (TAOS_FAILED(code)) {
      releaseBufPage(pBuf, page);
      qError("%s ensure result data capacity failed, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
      longjmp(pTaskInfo->env, code);
    }
1486 1487 1488 1489 1490
  }

  for (int32_t j = 0; j < numOfExprs; ++j) {
    int32_t slotId = pExprInfo[j].base.resSchema.slotId;

1491
    pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowCellOffset);
1492 1493 1494 1495 1496 1497 1498 1499 1500
    if (pCtx[j].fpSet.finalize) {
      int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
      if (TAOS_FAILED(code)) {
        qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
        longjmp(pTaskInfo->env, code);
      }
    } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
      // do nothing, todo refactor
    } else {
1501 1502
      // expand the result into multiple rows. E.g., _wstart, top(k, 20)
      // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
1503 1504 1505 1506 1507 1508 1509 1510 1511
      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
      char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
      for (int32_t k = 0; k < pRow->numOfRows; ++k) {
        colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
      }
    }
  }

  releaseBufPage(pBuf, page);
1512
  pBlock->info.rows += pRow->numOfRows;
1513 1514 1515 1516

  return 0;
}

1517 1518 1519 1520 1521 1522 1523
// Copy finalized result rows of pGroupResInfo into pBlock, starting at pGroupResInfo->index.
// Rows are consumed (index advanced) one by one until one of the following happens:
//   - all rows have been consumed;
//   - the next row belongs to a group different from the one already in pBlock;
//   - the next row does not fit into the remaining capacity of pBlock.
// Rows that produce no output are consumed without being copied.
// Afterwards the block's timestamp window is refreshed via blockDataUpdateTsWindow().
// Returns 0. When a finalize function fails, the buffer page is released and control is transferred
// with longjmp(pTaskInfo->env, code).
int32_t doCopyToSDataBlock(SExecTaskInfo* pTaskInfo, SSDataBlock* pBlock, SExprSupp* pSup, SDiskbasedBuf* pBuf,
                           SGroupResInfo* pGroupResInfo) {
  SExprInfo*      pExprInfo = pSup->pExprInfo;
  int32_t         numOfExprs = pSup->numOfExprs;
  int32_t*        rowEntryOffset = pSup->rowEntryInfoOffset;
  SqlFunctionCtx* pCtx = pSup->pCtx;

  int32_t numOfRows = getNumOfTotalRes(pGroupResInfo);

  for (int32_t i = pGroupResInfo->index; i < numOfRows; i += 1) {
    SResKeyPos* pPos = taosArrayGetP(pGroupResInfo->pRows, i);
    SFilePage*  page = getBufPage(pBuf, pPos->pos.pageId);
    SResultRow* pRow = (SResultRow*)((char*)page + pPos->pos.offset);

    doUpdateNumOfRows(pCtx, pRow, numOfExprs, rowEntryOffset);

    // no results, continue to check the next one
    if (pRow->numOfRows == 0) {
      pGroupResInfo->index += 1;
      releaseBufPage(pBuf, page);
      continue;
    }

    if (pBlock->info.groupId == 0) {
      pBlock->info.groupId = pPos->groupId;
    } else if (pBlock->info.groupId != pPos->groupId) {
      // current value belongs to different group, it can't be packed into one datablock
      releaseBufPage(pBuf, page);
      break;
    }

    if (pBlock->info.rows + pRow->numOfRows > pBlock->info.capacity) {
      ASSERT(pBlock->info.rows > 0);
      releaseBufPage(pBuf, page);
      break;
    }

    pGroupResInfo->index += 1;

    for (int32_t j = 0; j < numOfExprs; ++j) {
      int32_t slotId = pExprInfo[j].base.resSchema.slotId;

      pCtx[j].resultInfo = getResultEntryInfo(pRow, j, rowEntryOffset);
      if (pCtx[j].fpSet.finalize) {
#ifdef BUF_PAGE_DEBUG
        qDebug("\npage_finalize %d", numOfExprs);
#endif
        int32_t code = pCtx[j].fpSet.finalize(&pCtx[j], pBlock);
        if (TAOS_FAILED(code)) {
          // hand the page back before the non-local exit, otherwise it is never released
          releaseBufPage(pBuf, page);
          qError("%s build result data block error, code %s", GET_TASKID(pTaskInfo), tstrerror(code));
          longjmp(pTaskInfo->env, code);
        }
      } else if (strcmp(pCtx[j].pExpr->pExpr->_function.functionName, "_select_value") == 0) {
        // do nothing, todo refactor
      } else {
        // expand the result into multiple rows. E.g., _wstart, top(k, 20)
        // the _wstart needs to copy to 20 following rows, since the results of top-k expands to 20 different rows.
        SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
        char*            in = GET_ROWCELL_INTERBUF(pCtx[j].resultInfo);
        if (pCtx[j].increase) {
          // each expanded row receives the previous value plus one
          int64_t ts = *(int64_t*)in;
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, (const char*)&ts, pCtx[j].resultInfo->isNullRes);
            ts++;
          }
        } else {
          for (int32_t k = 0; k < pRow->numOfRows; ++k) {
            colDataAppend(pColInfoData, pBlock->info.rows + k, in, pCtx[j].resultInfo->isNullRes);
          }
        }
      }
    }

    // pRow lives inside the page, so read it before the page is handed back
    pBlock->info.rows += pRow->numOfRows;
    releaseBufPage(pBuf, page);
  }

  qDebug("%s result generated, rows:%d, groupId:%" PRIu64, GET_TASKID(pTaskInfo), pBlock->info.rows,
         pBlock->info.groupId);

  blockDataUpdateTsWindow(pBlock, 0);
  return 0;
}

X
Xiaoyu Wang 已提交
1604 1605
// Fill the operator's result block (pbInfo->pRes) from the pending rows of pGroupResInfo.
// The block is stamped with the task version and emptied first; nothing else happens when no rows
// remain. Without mergeResultBlock a single doCopyToSDataBlock() pass is made. With it, passes are
// repeated -- resetting the group id between them so rows of different groups can share the block --
// until the rows run out or the block reaches the operator's result threshold.
void doBuildResultDatablock(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
                            SDiskbasedBuf* pBuf) {
  SExecTaskInfo* pTask = pOperator->pTaskInfo;
  SSDataBlock*   pRes = pbInfo->pRes;

  // set output datablock version
  pRes->info.version = pTask->version;
  blockDataCleanup(pRes);

  if (hasRemainResults(pGroupResInfo)) {
    // clear the existed group id
    pRes->info.groupId = 0;

    if (pbInfo->mergeResultBlock) {
      while (hasRemainResults(pGroupResInfo)) {
        doCopyToSDataBlock(pTask, pRes, &pOperator->exprSupp, pBuf, pGroupResInfo);
        if (pRes->info.rows >= pOperator->resultInfo.threshold) {
          break;
        }

        // clearing group id to continue to merge data that belong to different groups
        pRes->info.groupId = 0;
      }

      // clear the group id info in SSDataBlock, since the client does not need it
      pRes->info.groupId = 0;
    } else {
      doCopyToSDataBlock(pTask, pRes, &pOperator->exprSupp, pBuf, pGroupResInfo);
    }
  }
}

L
Liu Jicong 已提交
1637
// Compress the data of one result column into `data` using the compression routine registered for
// the column's type in tDataTypes. The input size is bytes-per-value * numOfRows and the output
// size passed to the routine is that size plus COMP_OVERFLOW_BYTES.
// Returns whatever the type's compFunc returns.
static int32_t compressQueryColData(SColumnInfoData* pColRes, int32_t numOfRows, char* data, int8_t compressed) {
  int32_t rawBytes = pColRes->info.bytes * numOfRows;

  return tDataTypes[pColRes->info.type].compFunc(pColRes->pData, rawBytes, numOfRows, data,
                                                 rawBytes + COMP_OVERFLOW_BYTES, compressed, NULL, 0);
}

L
Liu Jicong 已提交
1643 1644
// Log the cost summary of a task: elapsed time plus the block/row counters of its file-block load
// recorder. Nothing is logged when the task has no recorder.
// (The hash-table size and result-row-pool statistics that used to be reported here are disabled.)
void queryCostStatis(SExecTaskInfo* pTaskInfo) {
  STaskCostInfo*          pCost = &pTaskInfo->cost;
  SFileBlockLoadRecorder* pRec = pCost->pRecoder;

  if (pRec == NULL) {
    return;
  }

  qDebug(
      "%s :cost summary: elapsed time:%.2f ms, total blocks:%d, load block SMA:%d, load data block:%d, total "
      "rows:%" PRId64 ", check rows:%" PRId64,
      GET_TASKID(pTaskInfo), pCost->elapsedTime / 1000.0, pRec->totalBlocks, pRec->loadBlockStatis,
      pRec->loadBlocks, pRec->totalRows, pRec->totalCheckedRows);
}

L
Liu Jicong 已提交
1673 1674 1675
// static void updateOffsetVal(STaskRuntimeEnv *pRuntimeEnv, SDataBlockInfo *pBlockInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
1676
//
L
Liu Jicong 已提交
1677
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1678
//
L
Liu Jicong 已提交
1679 1680 1681 1682
//   if (pQueryAttr->limit.offset == pBlockInfo->rows) {  // current block will ignore completed
//     pTableQueryInfo->lastKey = QUERY_IS_ASC_QUERY(pQueryAttr) ? pBlockInfo->window.ekey + step :
//     pBlockInfo->window.skey + step; pQueryAttr->limit.offset = 0; return;
//   }
1683
//
L
Liu Jicong 已提交
1684 1685 1686 1687 1688
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     pQueryAttr->pos = (int32_t)pQueryAttr->limit.offset;
//   } else {
//     pQueryAttr->pos = pBlockInfo->rows - (int32_t)pQueryAttr->limit.offset - 1;
//   }
1689
//
L
Liu Jicong 已提交
1690
//   assert(pQueryAttr->pos >= 0 && pQueryAttr->pos <= pBlockInfo->rows - 1);
1691
//
L
Liu Jicong 已提交
1692 1693
//   SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//   SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1694
//
L
Liu Jicong 已提交
1695 1696
//   // update the pQueryAttr->limit.offset value, and pQueryAttr->pos value
//   TSKEY *keys = (TSKEY *) pColInfoData->pData;
1697
//
L
Liu Jicong 已提交
1698 1699 1700
//   // update the offset value
//   pTableQueryInfo->lastKey = keys[pQueryAttr->pos];
//   pQueryAttr->limit.offset = 0;
1701
//
L
Liu Jicong 已提交
1702
//   int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
1703
//
L
Liu Jicong 已提交
1704 1705 1706 1707
//   //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numBlocksOfStep:%d, numOfRes:%d,
//   lastKey:%"PRId64, GET_TASKID(pRuntimeEnv),
//          pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes, pQuery->current->lastKey);
// }
1708

L
Liu Jicong 已提交
1709 1710
// void skipBlocks(STaskRuntimeEnv *pRuntimeEnv) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
1711
//
L
Liu Jicong 已提交
1712 1713 1714
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0) {
//     return;
//   }
1715
//
L
Liu Jicong 已提交
1716 1717
//   pQueryAttr->pos = 0;
//   int32_t step = GET_FORWARD_DIRECTION_FACTOR(pQueryAttr->order.order);
1718
//
L
Liu Jicong 已提交
1719 1720
//   STableQueryInfo* pTableQueryInfo = pRuntimeEnv->current;
//   TsdbQueryHandleT pTsdbReadHandle = pRuntimeEnv->pTsdbReadHandle;
1721
//
L
Liu Jicong 已提交
1722 1723 1724 1725 1726
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pTsdbReadHandle)) {
//     if (isTaskKilled(pRuntimeEnv->qinfo)) {
//       longjmp(pRuntimeEnv->env, TSDB_CODE_TSC_QUERY_CANCELLED);
//     }
1727
//
L
Liu Jicong 已提交
1728
//     tsdbRetrieveDataBlockInfo(pTsdbReadHandle, &blockInfo);
1729
//
L
Liu Jicong 已提交
1730 1731 1732 1733
//     if (pQueryAttr->limit.offset > blockInfo.rows) {
//       pQueryAttr->limit.offset -= blockInfo.rows;
//       pTableQueryInfo->lastKey = (QUERY_IS_ASC_QUERY(pQueryAttr)) ? blockInfo.window.ekey : blockInfo.window.skey;
//       pTableQueryInfo->lastKey += step;
1734
//
L
Liu Jicong 已提交
1735 1736 1737 1738 1739 1740 1741
//       //qDebug("QInfo:0x%"PRIx64" skip rows:%d, offset:%" PRId64, GET_TASKID(pRuntimeEnv), blockInfo.rows,
//              pQuery->limit.offset);
//     } else {  // find the appropriated start position in current block
//       updateOffsetVal(pRuntimeEnv, &blockInfo);
//       break;
//     }
//   }
1742
//
L
Liu Jicong 已提交
1743 1744 1745 1746 1747 1748 1749 1750 1751
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
// }

// static TSKEY doSkipIntervalProcess(STaskRuntimeEnv* pRuntimeEnv, STimeWindow* win, SDataBlockInfo* pBlockInfo,
// STableQueryInfo* pTableQueryInfo) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
1752
//
L
Liu Jicong 已提交
1753 1754 1755
//   assert(pQueryAttr->limit.offset == 0);
//   STimeWindow tw = *win;
//   getNextTimeWindow(pQueryAttr, &tw);
1756
//
L
Liu Jicong 已提交
1757 1758
//   if ((tw.skey <= pBlockInfo->window.ekey && QUERY_IS_ASC_QUERY(pQueryAttr)) ||
//       (tw.ekey >= pBlockInfo->window.skey && !QUERY_IS_ASC_QUERY(pQueryAttr))) {
1759
//
L
Liu Jicong 已提交
1760 1761 1762 1763
//     // load the data block and check data remaining in current data block
//     // TODO optimize performance
//     SArray *         pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//     SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1764
//
L
Liu Jicong 已提交
1765 1766 1767 1768
//     tw = *win;
//     int32_t startPos =
//         getNextQualifiedWindow(pQueryAttr, &tw, pBlockInfo, pColInfoData->pData, binarySearchForKey, -1);
//     assert(startPos >= 0);
1769
//
L
Liu Jicong 已提交
1770 1771
//     // set the abort info
//     pQueryAttr->pos = startPos;
1772
//
L
Liu Jicong 已提交
1773 1774 1775 1776
//     // reset the query start timestamp
//     pTableQueryInfo->win.skey = ((TSKEY *)pColInfoData->pData)[startPos];
//     pQueryAttr->window.skey = pTableQueryInfo->win.skey;
//     TSKEY key = pTableQueryInfo->win.skey;
1777
//
L
Liu Jicong 已提交
1778 1779
//     pWindowResInfo->prevSKey = tw.skey;
//     int32_t index = pRuntimeEnv->resultRowInfo.curIndex;
1780
//
L
Liu Jicong 已提交
1781 1782
//     int32_t numOfRes = tableApplyFunctionsOnBlock(pRuntimeEnv, pBlockInfo, NULL, binarySearchForKey, pDataBlock);
//     pRuntimeEnv->resultRowInfo.curIndex = index;  // restore the window index
1783
//
L
Liu Jicong 已提交
1784 1785 1786 1787
//     //qDebug("QInfo:0x%"PRIx64" check data block, brange:%" PRId64 "-%" PRId64 ", numOfRows:%d, numOfRes:%d,
//     lastKey:%" PRId64,
//            GET_TASKID(pRuntimeEnv), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, numOfRes,
//            pQueryAttr->current->lastKey);
1788
//
L
Liu Jicong 已提交
1789 1790 1791 1792 1793
//     return key;
//   } else {  // do nothing
//     pQueryAttr->window.skey      = tw.skey;
//     pWindowResInfo->prevSKey = tw.skey;
//     pTableQueryInfo->lastKey = tw.skey;
1794
//
L
Liu Jicong 已提交
1795 1796
//     return tw.skey;
//   }
1797
//
L
Liu Jicong 已提交
1798 1799 1800 1801 1802 1803 1804 1805 1806 1807
//   return true;
// }

// static bool skipTimeInterval(STaskRuntimeEnv *pRuntimeEnv, TSKEY* start) {
//   STaskAttr *pQueryAttr = pRuntimeEnv->pQueryAttr;
//   if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//     assert(*start <= pRuntimeEnv->current->lastKey);
//   } else {
//     assert(*start >= pRuntimeEnv->current->lastKey);
//   }
1808
//
L
Liu Jicong 已提交
1809 1810 1811 1812 1813
//   // if queried with value filter, do NOT forward query start position
//   if (pQueryAttr->limit.offset <= 0 || pQueryAttr->numOfFilterCols > 0 || pRuntimeEnv->pTsBuf != NULL ||
//   pRuntimeEnv->pFillInfo != NULL) {
//     return true;
//   }
1814
//
L
Liu Jicong 已提交
1815 1816 1817 1818 1819 1820 1821
//   /*
//    * 1. for interval without interpolation query we forward pQueryAttr->interval.interval at a time for
//    *    pQueryAttr->limit.offset times. Since hole exists, pQueryAttr->interval.interval*pQueryAttr->limit.offset
//    value is
//    *    not valid. otherwise, we only forward pQueryAttr->limit.offset number of points
//    */
//   assert(pRuntimeEnv->resultRowInfo.prevSKey == TSKEY_INITIAL_VAL);
1822
//
L
Liu Jicong 已提交
1823 1824
//   STimeWindow w = TSWINDOW_INITIALIZER;
//   bool ascQuery = QUERY_IS_ASC_QUERY(pQueryAttr);
1825
//
L
Liu Jicong 已提交
1826 1827
//   SResultRowInfo *pWindowResInfo = &pRuntimeEnv->resultRowInfo;
//   STableQueryInfo *pTableQueryInfo = pRuntimeEnv->current;
1828
//
L
Liu Jicong 已提交
1829 1830 1831
//   SDataBlockInfo blockInfo = SDATA_BLOCK_INITIALIZER;
//   while (tsdbNextDataBlock(pRuntimeEnv->pTsdbReadHandle)) {
//     tsdbRetrieveDataBlockInfo(pRuntimeEnv->pTsdbReadHandle, &blockInfo);
1832
//
L
Liu Jicong 已提交
1833 1834 1835 1836 1837 1838 1839 1840 1841
//     if (QUERY_IS_ASC_QUERY(pQueryAttr)) {
//       if (pWindowResInfo->prevSKey == TSKEY_INITIAL_VAL) {
//         getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.skey, blockInfo.window.skey, pQueryAttr->window.ekey,
//         &w); pWindowResInfo->prevSKey = w.skey;
//       }
//     } else {
//       getAlignQueryTimeWindow(pQueryAttr, blockInfo.window.ekey, pQueryAttr->window.ekey, blockInfo.window.ekey, &w);
//       pWindowResInfo->prevSKey = w.skey;
//     }
1842
//
L
Liu Jicong 已提交
1843 1844
//     // the first time window
//     STimeWindow win = getActiveTimeWindow(pWindowResInfo, pWindowResInfo->prevSKey, pQueryAttr);
1845
//
L
Liu Jicong 已提交
1846 1847
//     while (pQueryAttr->limit.offset > 0) {
//       STimeWindow tw = win;
1848
//
L
Liu Jicong 已提交
1849 1850 1851
//       if ((win.ekey <= blockInfo.window.ekey && ascQuery) || (win.ekey >= blockInfo.window.skey && !ascQuery)) {
//         pQueryAttr->limit.offset -= 1;
//         pWindowResInfo->prevSKey = win.skey;
1852
//
L
Liu Jicong 已提交
1853 1854 1855 1856 1857 1858
//         // current time window is aligned with blockInfo.window.ekey
//         // restart it from next data block by set prevSKey to be TSKEY_INITIAL_VAL;
//         if ((win.ekey == blockInfo.window.ekey && ascQuery) || (win.ekey == blockInfo.window.skey && !ascQuery)) {
//           pWindowResInfo->prevSKey = TSKEY_INITIAL_VAL;
//         }
//       }
1859
//
L
Liu Jicong 已提交
1860 1861 1862 1863
//       if (pQueryAttr->limit.offset == 0) {
//         *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//         return true;
//       }
1864
//
L
Liu Jicong 已提交
1865 1866
//       // current window does not ended in current data block, try next data block
//       getNextTimeWindow(pQueryAttr, &tw);
1867
//
L
Liu Jicong 已提交
1868 1869 1870 1871 1872 1873 1874 1875 1876
//       /*
//        * If the next time window still starts from current data block,
//        * load the primary timestamp column first, and then find the start position for the next queried time window.
//        * Note that only the primary timestamp column is required.
//        * TODO: Optimize for this cases. All data blocks are not needed to be loaded, only if the first actually
//        required
//        * time window resides in current data block.
//        */
//       if ((tw.skey <= blockInfo.window.ekey && ascQuery) || (tw.ekey >= blockInfo.window.skey && !ascQuery)) {
1877
//
L
Liu Jicong 已提交
1878 1879
//         SArray *pDataBlock = tsdbRetrieveDataBlock(pRuntimeEnv->pTsdbReadHandle, NULL);
//         SColumnInfoData *pColInfoData = taosArrayGet(pDataBlock, 0);
1880
//
L
Liu Jicong 已提交
1881 1882 1883
//         if ((win.ekey > blockInfo.window.ekey && ascQuery) || (win.ekey < blockInfo.window.skey && !ascQuery)) {
//           pQueryAttr->limit.offset -= 1;
//         }
1884
//
L
Liu Jicong 已提交
1885 1886 1887 1888 1889 1890 1891 1892
//         if (pQueryAttr->limit.offset == 0) {
//           *start = doSkipIntervalProcess(pRuntimeEnv, &win, &blockInfo, pTableQueryInfo);
//           return true;
//         } else {
//           tw = win;
//           int32_t startPos =
//               getNextQualifiedWindow(pQueryAttr, &tw, &blockInfo, pColInfoData->pData, binarySearchForKey, -1);
//           assert(startPos >= 0);
1893
//
L
Liu Jicong 已提交
1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904
//           // set the abort info
//           pQueryAttr->pos = startPos;
//           pTableQueryInfo->lastKey = ((TSKEY *)pColInfoData->pData)[startPos];
//           pWindowResInfo->prevSKey = tw.skey;
//           win = tw;
//         }
//       } else {
//         break;  // offset is not 0, and next time window begins or ends in the next block.
//       }
//     }
//   }
1905
//
L
Liu Jicong 已提交
1906 1907 1908 1909
//   // check for error
//   if (terrno != TSDB_CODE_SUCCESS) {
//     longjmp(pRuntimeEnv->env, terrno);
//   }
1910
//
L
Liu Jicong 已提交
1911 1912
//   return true;
// }
1913

1914
// Install `num` downstream operators on `p` by copying the pointer array `pDownstream`.
// Despite the name, the array replaces whatever was installed before; a previously installed array
// is freed rather than leaked.
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the copy cannot be allocated, in which
// case `p` is left unchanged.
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num) {
  if (p->pDownstream == NULL) {
    assert(p->numOfDownstream == 0);
  }

  SOperatorInfo** pList = taosMemoryCalloc(1, num * POINTER_BYTES);
  if (pList == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // copy first, so the call stays valid even if pDownstream aliases the array being replaced
  memcpy(pList, pDownstream, num * POINTER_BYTES);

  if (p->pDownstream != NULL) {
    taosMemoryFree(p->pDownstream);
  }

  p->pDownstream = pList;
  p->numOfDownstream = num;
  return TSDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
1929
static void doDestroyTableList(STableListInfo* pTableqinfoList);
1930

1931
// Consistency check of a table's query window and last key against the task window for the given
// scan order. The assertions are compiled out (#if 0), so this function currently does nothing.
static void doTableQueryInfoTimeWindowCheck(SExecTaskInfo* pTaskInfo, STableQueryInfo* pTableQueryInfo, int32_t order) {
#if 0
  if (order == TSDB_ORDER_ASC) {
    assert(
        (pTableQueryInfo->win.skey <= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey >= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey >= pTaskInfo->window.skey && pTableQueryInfo->win.ekey <= pTaskInfo->window.ekey));
  } else {
    assert(
        (pTableQueryInfo->win.skey >= pTableQueryInfo->win.ekey) &&
        (pTableQueryInfo->lastKey <= pTaskInfo->window.skey) &&
        (pTableQueryInfo->win.skey <= pTaskInfo->window.skey && pTableQueryInfo->win.ekey >= pTaskInfo->window.ekey));
  }
#endif
}

1947 1948 1949 1950
// Callback parameter attached to every fetch request sent by the exchange operator; it lets
// loadRemoteDataCallback() find the exchange operator and the source the response belongs to.
typedef struct SFetchRspHandleWrapper {
  uint32_t exchangeId;   // reference id of the exchange operator in exchangeObjRefPool
  int32_t  sourceIndex;  // index of the source in the exchange operator's pSourceDataInfo array
} SFetchRspHandleWrapper;
1951

D
dapan1121 已提交
1952
// Response callback of a fetch request issued by the exchange operator.
//   param  SFetchRspHandleWrapper identifying the exchange operator and the source index
//   pMsg   response buffer; pMsg->pData is either handed over to the source's pRsp (success) or
//          freed here (error, or exchange operator no longer available)
//   code   result code of the request
// On success the header fields of the response are converted from network byte order in place.
// In every case where the exchange operator is still alive, the source is marked
// EX_SOURCE_DATA_READY and the operator's `ready` semaphore is posted.
// Always returns TSDB_CODE_SUCCESS.
int32_t loadRemoteDataCallback(void* param, SDataBuf* pMsg, int32_t code) {
  SFetchRspHandleWrapper* pWrapper = (SFetchRspHandleWrapper*)param;

  SExchangeInfo* pExchangeInfo = taosAcquireRef(exchangeObjRefPool, pWrapper->exchangeId);
  if (pExchangeInfo == NULL) {
    qWarn("failed to acquire exchange operator, since it may have been released");
    taosMemoryFree(pMsg->pData);
    return TSDB_CODE_SUCCESS;
  }

  int32_t          index = pWrapper->sourceIndex;
  SSourceDataInfo* pSourceDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, index);

  if (code == TSDB_CODE_SUCCESS) {
    pSourceDataInfo->pRsp = pMsg->pData;

    SRetrieveTableRsp* pRsp = pSourceDataInfo->pRsp;
    // check before the first dereference, not after it
    ASSERT(pRsp != NULL);

    pRsp->numOfRows = htonl(pRsp->numOfRows);
    pRsp->compLen = htonl(pRsp->compLen);
    pRsp->numOfCols = htonl(pRsp->numOfCols);
    pRsp->useconds = htobe64(pRsp->useconds);
    pRsp->numOfBlocks = htonl(pRsp->numOfBlocks);

    qDebug("%s fetch rsp received, index:%d, blocks:%d, rows:%d", pSourceDataInfo->taskId, index, pRsp->numOfBlocks,
           pRsp->numOfRows);
  } else {
    taosMemoryFree(pMsg->pData);
    pSourceDataInfo->code = code;
    // tstrerror() yields a string, so it must be printed with %s
    qDebug("%s fetch rsp received, index:%d, error:%s", pSourceDataInfo->taskId, index, tstrerror(code));
  }

  pSourceDataInfo->status = EX_SOURCE_DATA_READY;

  tsem_post(&pExchangeInfo->ready);
  taosReleaseRef(exchangeObjRefPool, pWrapper->exchangeId);

  return TSDB_CODE_SUCCESS;
}

D
dapan1121 已提交
1992
// Dispatch an RPC response to the callback registered in its SMsgSendInfo (pMsg->info.ahandle).
// The payload is duplicated into a freshly allocated buffer that is handed to the callback; when
// that allocation fails, the callback receives a NULL payload and TSDB_CODE_OUT_OF_MEMORY instead.
// The RPC content and the send info are released afterwards.
void qProcessRspMsg(void* parent, SRpcMsg* pMsg, SEpSet* pEpSet) {
  assert(pMsg->info.ahandle != NULL);
  SMsgSendInfo* pSendInfo = (SMsgSendInfo*)pMsg->info.ahandle;

  SDataBuf buf = {.len = pMsg->contLen, .pData = NULL};

  if (pMsg->contLen > 0) {
    buf.pData = taosMemoryCalloc(1, pMsg->contLen);
    if (buf.pData != NULL) {
      memcpy(buf.pData, pMsg->pCont, pMsg->contLen);
    } else {
      // report the failure through both terrno and the code passed to the callback
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      pMsg->code = TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  pSendInfo->fp(pSendInfo->param, &buf, pMsg->code);

  rpcFreeCont(pMsg->pCont);
  destroySendMsgInfo(pSendInfo);
}

L
Liu Jicong 已提交
2013
// Build a fetch request for the source at `sourceIndex` and send it asynchronously; the response is
// delivered to loadRemoteDataCallback().
// Returns TSDB_CODE_SUCCESS once the request has been handed to asyncSendMsgToServer(), or
// TSDB_CODE_QRY_OUT_OF_MEMORY (also stored in pTaskInfo->code) when one of the request objects
// cannot be allocated; everything allocated so far is freed in that case.
static int32_t doSendFetchDataRequest(SExchangeInfo* pExchangeInfo, SExecTaskInfo* pTaskInfo, int32_t sourceIndex) {
  size_t totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  SResFetchReq* pMsg = taosMemoryCalloc(1, sizeof(SResFetchReq));
  if (NULL == pMsg) {
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, sourceIndex);
  SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, sourceIndex);

  ASSERT(pDataInfo->status == EX_SOURCE_DATA_NOT_READY);

  qDebug("%s build fetch msg and send to vgId:%d, ep:%s, taskId:0x%" PRIx64 ", execId:%d, %d/%" PRIzu,
         GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->addr.epSet.eps[0].fqdn, pSource->taskId, pSource->execId,
         sourceIndex, totalSources);

  // all request fields travel in network byte order
  pMsg->header.vgId = htonl(pSource->addr.nodeId);
  pMsg->sId = htobe64(pSource->schedId);
  pMsg->taskId = htobe64(pSource->taskId);
  pMsg->queryId = htobe64(pTaskInfo->id.queryId);
  pMsg->execId = htonl(pSource->execId);

  // send the fetch remote task result request
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (NULL == pMsgSendInfo) {
    taosMemoryFreeClear(pMsg);
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SMsgSendInfo));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  SFetchRspHandleWrapper* pWrapper = taosMemoryCalloc(1, sizeof(SFetchRspHandleWrapper));
  if (NULL == pWrapper) {
    // the wrapper is dereferenced right below, so a failed allocation must not fall through
    taosMemoryFreeClear(pMsgSendInfo);
    taosMemoryFreeClear(pMsg);
    qError("%s prepare message %d failed", GET_TASKID(pTaskInfo), (int32_t)sizeof(SFetchRspHandleWrapper));
    pTaskInfo->code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return pTaskInfo->code;
  }

  pWrapper->exchangeId = pExchangeInfo->self;
  pWrapper->sourceIndex = sourceIndex;

  pMsgSendInfo->param = pWrapper;
  pMsgSendInfo->paramFreeFp = taosMemoryFree;
  pMsgSendInfo->msgInfo.pData = pMsg;
  pMsgSendInfo->msgInfo.len = sizeof(SResFetchReq);
  pMsgSendInfo->msgType = pSource->fetchMsgType;
  pMsgSendInfo->fp = loadRemoteDataCallback;

  int64_t transporterId = 0;
  int32_t code = asyncSendMsgToServer(pExchangeInfo->pTransporter, &pSource->addr.epSet, &transporterId, pMsgSendInfo);
  if (code != TSDB_CODE_SUCCESS) {
    // NOTE(review): the result used to be dropped silently. It is only logged here because the
    // ownership of pMsgSendInfo after a failed send is not visible from this function -- confirm
    // before propagating the code to the caller.
    qError("%s failed to send fetch request to vgId:%d, code %s", GET_TASKID(pTaskInfo), pSource->addr.nodeId,
           tstrerror(code));
  }

  return TSDB_CODE_SUCCESS;
}

2062 2063 2064 2065 2066 2067 2068 2069 2070
// Account for one batch of remotely loaded data: add its row count and byte size to the load
// statistics, add the time elapsed since startTs (taosGetTimestampUs() based), and add the row
// count to the operator's total result rows.
void updateLoadRemoteInfo(SLoadRemoteDataInfo* pInfo, int32_t numOfRows, int32_t dataLen, int64_t startTs,
                          SOperatorInfo* pOperator) {
  // volume counters
  pInfo->totalRows += numOfRows;
  pInfo->totalSize += dataLen;

  // time spent on this batch
  int64_t elapsed = taosGetTimestampUs() - startTs;
  pInfo->totalElapsed += elapsed;

  pOperator->resultInfo.totalRows += numOfRows;
}

// Decode the payload of a fetch response into pRes.
//   pColList == NULL  the payload is decoded directly into pRes and *pNextStart receives the value
//                     returned by blockDecode()
//   pColList != NULL  the payload starts with a column count and that many SSysTableSchema entries
//                     (converted from network byte order in place), followed by the encoded block;
//                     the block is decoded into a temporary block and its columns are relocated
//                     into pRes according to pColList. *pNextStart is not written on this path.
// Returns TSDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY when the temporary block cannot be created,
// or the error code of blockDataEnsureCapacity().
int32_t extractDataBlockFromFetchRsp(SSDataBlock* pRes, char* pData, int32_t numOfOutput, SArray* pColList,
                                     char** pNextStart) {
  if (pColList == NULL) {  // data from other sources
    blockDataCleanup(pRes);
    *pNextStart = (char*)blockDecode(pRes, pData);
  } else {  // extract data according to pColList
    ASSERT(numOfOutput == taosArrayGetSize(pColList));
    char* pStart = pData;

    int32_t numOfCols = htonl(*(int32_t*)pStart);
    pStart += sizeof(int32_t);

    // todo refactor:extract method
    SSysTableSchema* pSchema = (SSysTableSchema*)pStart;
    for (int32_t i = 0; i < numOfCols; ++i) {
      SSysTableSchema* p = (SSysTableSchema*)pStart;

      p->colId = htons(p->colId);
      p->bytes = htonl(p->bytes);
      pStart += sizeof(SSysTableSchema);
    }

    SSDataBlock* pBlock = createDataBlock();
    if (pBlock == NULL) {
      // presumably only on allocation failure; without this check the block is dereferenced below
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    for (int32_t i = 0; i < numOfCols; ++i) {
      SColumnInfoData idata = createColumnInfoData(pSchema[i].type, pSchema[i].bytes, pSchema[i].colId);
      blockDataAppendColInfo(pBlock, &idata);
    }

    blockDecode(pBlock, pStart);

    int32_t code = blockDataEnsureCapacity(pRes, pBlock->info.rows);
    if (code != TSDB_CODE_SUCCESS) {
      // pRes cannot hold the rows; do not relocate into it and do not leak the temporary block
      blockDataDestroy(pBlock);
      return code;
    }

    // data from mnode
    pRes->info.rows = pBlock->info.rows;
    relocateColumnData(pRes, pColList, pBlock->pDataBlock, false);
    blockDataDestroy(pBlock);
  }

  // todo move this to time window aggregator, since the primary timestamp may not be known by exchange operator.
  blockDataUpdateTsWindow(pRes, 0);
  return TSDB_CODE_SUCCESS;
}
2111

L
Liu Jicong 已提交
2112 2113
// Called when every source of the exchange operator is exhausted: adds the time elapsed since
// startTs to the load statistics, logs the totals and marks the operator as completed.
// Always returns NULL.
static void* setAllSourcesCompleted(SOperatorInfo* pOperator, int64_t startTs) {
  SExchangeInfo*       pExchange = pOperator->info;
  SExecTaskInfo*       pTask = pOperator->pTaskInfo;
  SLoadRemoteDataInfo* pStat = &pExchange->loadInfo;

  int64_t elapsed = taosGetTimestampUs() - startTs;
  pStat->totalElapsed += elapsed;

  size_t numOfSources = taosArrayGetSize(pExchange->pSources);
  qDebug("%s all %" PRIzu " sources are exhausted, total rows: %" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
         GET_TASKID(pTask), numOfSources, pStat->totalRows, pStat->totalSize, pStat->totalElapsed / 1000.0);

  doSetOperatorCompleted(pOperator);
  return NULL;
}

2130 2131
/*
 * Consume one ready response from the data sources of the exchange operator.
 *
 * Each pass walks all sources: exhausted sources are counted, sources whose response is not ready
 * are skipped, and the first ready response is decoded into data blocks that are appended to
 * pExchangeInfo->pResultBlockList. Once a response has been consumed the function returns; if that
 * source is not finished yet, the next fetch request for it is sent first. When all sources are
 * exhausted the operator is marked as completed. If a pass finds nothing to consume, the thread
 * yields and polls again.
 *
 * On failure the error code is stored in pTaskInfo->code.
 */
static void concurrentlyLoadRemoteDataImpl(SOperatorInfo* pOperator, SExchangeInfo* pExchangeInfo,
                                           SExecTaskInfo* pTaskInfo) {
  int32_t code = 0;
  int64_t startTs = taosGetTimestampUs();
  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);

  while (1) {
    int32_t completed = 0;
    for (int32_t i = 0; i < totalSources; ++i) {
      SSourceDataInfo* pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, i);
      if (pDataInfo->status == EX_SOURCE_DATA_EXHAUSTED) {
        completed += 1;
        continue;
      }

      if (pDataInfo->status != EX_SOURCE_DATA_READY) {
        continue;
      }

      if (pDataInfo->code != TSDB_CODE_SUCCESS) {
        code = pDataInfo->code;
        goto _error;
      }

      SRetrieveTableRsp*     pRsp = pDataInfo->pRsp;
      SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, i);

      SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
      if (pRsp->numOfRows == 0) {
        qDebug("%s vgId:%d, taskId:0x%" PRIx64 " execId:%d index:%d completed, rowsOfSource:%" PRIu64
               ", totalRows:%" PRIu64 ", completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pDataInfo->totalRows,
               pExchangeInfo->loadInfo.totalRows, completed + 1, i + 1, totalSources);
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
        completed += 1;
        taosMemoryFreeClear(pDataInfo->pRsp);
        continue;
      }

      SRetrieveTableRsp* pRetrieveRsp = pDataInfo->pRsp;
      int32_t            index = 0;
      char*              pStart = pRetrieveRsp->data;
      while (index++ < pRetrieveRsp->numOfBlocks) {
        SSDataBlock* pb = createOneDataBlock(pExchangeInfo->pDummyBlock, false);
        if (pb == NULL) {
          code = TSDB_CODE_OUT_OF_MEMORY;
          taosMemoryFreeClear(pDataInfo->pRsp);
          goto _error;
        }

        code = extractDataBlockFromFetchRsp(pb, pStart, pRetrieveRsp->numOfCols, NULL, &pStart);
        if (code != 0) {
          // pb is not owned by pResultBlockList yet, release it here to avoid a leak
          blockDataDestroy(pb);
          taosMemoryFreeClear(pDataInfo->pRsp);
          goto _error;
        }

        if (taosArrayPush(pExchangeInfo->pResultBlockList, &pb) == NULL) {
          blockDataDestroy(pb);
          code = TSDB_CODE_OUT_OF_MEMORY;
          taosMemoryFreeClear(pDataInfo->pRsp);
          goto _error;
        }
      }

      updateLoadRemoteInfo(pLoadInfo, pRetrieveRsp->numOfRows, pRetrieveRsp->compLen, startTs, pOperator);
      // keep the per-source counter up to date, it is reported as "rowsOfSource" in the logs
      pDataInfo->totalRows += pRetrieveRsp->numOfRows;

      if (pRsp->completed == 1) {
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d"
               " index:%d completed, blocks:%d, numOfRows:%d, rowsOfSource:%" PRIu64 ", totalRows:%" PRIu64
               ", total:%.2f Kb,"
               " completed:%d try next %d/%" PRIzu,
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, i, pRsp->numOfBlocks,
               pRsp->numOfRows, pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize / 1024.0,
               completed + 1, i + 1, totalSources);
        completed += 1;
        pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      } else {
        qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64
               " execId:%d blocks:%d, numOfRows:%d, totalRows:%" PRIu64 ", total:%.2f Kb",
               GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRsp->numOfBlocks,
               pRsp->numOfRows, pLoadInfo->totalRows, pLoadInfo->totalSize / 1024.0);
      }

      // the response has been fully decoded; pRsp/pRetrieveRsp must not be used after this point
      taosMemoryFreeClear(pDataInfo->pRsp);

      if (pDataInfo->status != EX_SOURCE_DATA_EXHAUSTED) {
        pDataInfo->status = EX_SOURCE_DATA_NOT_READY;
        code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, i);
        if (code != TSDB_CODE_SUCCESS) {
          taosMemoryFreeClear(pDataInfo->pRsp);
          goto _error;
        }
      }

      return;
    }

    if (completed == totalSources) {
      setAllSourcesCompleted(pOperator, startTs);
      return;
    }

    sched_yield();
  }

_error:
  pTaskInfo->code = code;
}

L
Liu Jicong 已提交
2229 2230 2231
/*
 * Send a fetch request to every data source of the exchange operator, then wait on the
 * exchange operator's "ready" semaphore.
 *
 * Returns TSDB_CODE_SUCCESS, or the code of the first request that could not be sent; in the
 * latter case the code is also stored in the task info and no further requests are sent.
 */
static int32_t prepareConcurrentlyLoad(SOperatorInfo* pOperator) {
  SExecTaskInfo* pTask = pOperator->pTaskInfo;
  SExchangeInfo* pExchange = pOperator->info;

  int64_t beginUs = taosGetTimestampUs();
  size_t  numOfSources = taosArrayGetSize(pExchange->pSources);

  // Asynchronously send all fetch requests to all sources.
  int32_t srcIndex = 0;
  while (srcIndex < numOfSources) {
    int32_t rc = doSendFetchDataRequest(pExchange, pTask, srcIndex);
    if (rc != TSDB_CODE_SUCCESS) {
      pTask->code = rc;
      return rc;
    }

    srcIndex += 1;
  }

  int64_t sentUs = taosGetTimestampUs();
  qDebug("%s send all fetch requests to %" PRIzu " sources completed, elapsed:%.2fms", GET_TASKID(pTask),
         numOfSources, (sentUs - beginUs) / 1000.0);

  pOperator->status = OP_RES_TO_RETURN;
  pOperator->cost.openCost = taosGetTimestampUs() - beginUs;

  tsem_wait(&pExchange->ready);
  return TSDB_CODE_SUCCESS;
}

2256
/*
 * Load data from the sources of the exchange operator one source at a time.
 *
 * A fetch request is sent to the current source and the function waits on the "ready" semaphore
 * for its response. An empty response marks the source as exhausted and moves on to the next one.
 * A non-empty response is decoded into data blocks appended to pExchangeInfo->pResultBlockList
 * (the same way concurrentlyLoadRemoteDataImpl does) and the function returns. When the current
 * index passes the last source, the operator is marked as completed.
 *
 * Returns TSDB_CODE_SUCCESS or an error code; on error the code is also stored in the task info.
 */
static int32_t seqLoadRemoteData(SOperatorInfo* pOperator) {
  SExchangeInfo* pExchangeInfo = pOperator->info;
  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;

  size_t  totalSources = taosArrayGetSize(pExchangeInfo->pSources);
  int64_t startTs = taosGetTimestampUs();

  while (1) {
    if (pExchangeInfo->current >= totalSources) {
      setAllSourcesCompleted(pOperator, startTs);
      return TSDB_CODE_SUCCESS;
    }

    // if the request was not sent, waiting on the semaphore below would never be woken up by a response
    int32_t code = doSendFetchDataRequest(pExchangeInfo, pTaskInfo, pExchangeInfo->current);
    if (code != TSDB_CODE_SUCCESS) {
      pTaskInfo->code = code;
      return code;
    }

    tsem_wait(&pExchangeInfo->ready);

    SSourceDataInfo*       pDataInfo = taosArrayGet(pExchangeInfo->pSourceDataInfo, pExchangeInfo->current);
    SDownstreamSourceNode* pSource = taosArrayGet(pExchangeInfo->pSources, pExchangeInfo->current);

    if (pDataInfo->code != TSDB_CODE_SUCCESS) {
      qError("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d error happens, code:%s", GET_TASKID(pTaskInfo),
             pSource->addr.nodeId, pSource->taskId, pSource->execId, tstrerror(pDataInfo->code));
      pOperator->pTaskInfo->code = pDataInfo->code;
      return pOperator->pTaskInfo->code;
    }

    SRetrieveTableRsp*   pRsp = pDataInfo->pRsp;
    SLoadRemoteDataInfo* pLoadInfo = &pExchangeInfo->loadInfo;
    if (pRsp->numOfRows == 0) {
      qDebug("%s vgId:%d, taskID:0x%" PRIx64 " execId:%d %d of total completed, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 " try next",
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pExchangeInfo->current + 1,
             pDataInfo->totalRows, pLoadInfo->totalRows);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
      taosMemoryFreeClear(pDataInfo->pRsp);
      continue;
    }

    // decode every block of the response into the result block list
    char* pStart = pRsp->data;
    for (int32_t index = 0; index < pRsp->numOfBlocks; ++index) {
      SSDataBlock* pb = createOneDataBlock(pExchangeInfo->pDummyBlock, false);
      if (pb == NULL) {
        code = TSDB_CODE_OUT_OF_MEMORY;
      } else {
        code = extractDataBlockFromFetchRsp(pb, pStart, pRsp->numOfCols, NULL, &pStart);
        if (code == TSDB_CODE_SUCCESS && taosArrayPush(pExchangeInfo->pResultBlockList, &pb) == NULL) {
          code = TSDB_CODE_OUT_OF_MEMORY;
        }
      }

      if (code != TSDB_CODE_SUCCESS) {
        blockDataDestroy(pb);  // not owned by pResultBlockList
        taosMemoryFreeClear(pDataInfo->pRsp);
        pTaskInfo->code = code;
        return code;
      }
    }

    if (pRsp->completed == 1) {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, rowsOfSource:%" PRIu64
             ", totalRows:%" PRIu64 ", totalBytes:%" PRIu64 " try next %d/%" PRIzu,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRsp->numOfRows,
             pDataInfo->totalRows, pLoadInfo->totalRows, pLoadInfo->totalSize, pExchangeInfo->current + 1,
             totalSources);

      pDataInfo->status = EX_SOURCE_DATA_EXHAUSTED;
      pExchangeInfo->current += 1;
    } else {
      qDebug("%s fetch msg rsp from vgId:%d, taskId:0x%" PRIx64 " execId:%d numOfRows:%d, totalRows:%" PRIu64
             ", totalBytes:%" PRIu64,
             GET_TASKID(pTaskInfo), pSource->addr.nodeId, pSource->taskId, pSource->execId, pRsp->numOfRows,
             pLoadInfo->totalRows, pLoadInfo->totalSize);
    }

    updateLoadRemoteInfo(pLoadInfo, pRsp->numOfRows, pRsp->compLen, startTs, pOperator);
    pDataInfo->totalRows += pRsp->numOfRows;

    taosMemoryFreeClear(pDataInfo->pRsp);
    return TSDB_CODE_SUCCESS;
  }
}

L
Liu Jicong 已提交
2325
/*
 * Open function of the exchange operator. Does nothing if the operator is already opened.
 * Otherwise, unless the operator loads its sources sequentially, the fetch requests are sent
 * through prepareConcurrentlyLoad(); on success the operator is flagged as opened and the open
 * cost is recorded.
 */
static int32_t prepareLoadRemoteData(SOperatorInfo* pOperator) {
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
  }

  int64_t        beginUs = taosGetTimestampUs();
  SExchangeInfo* pExchange = pOperator->info;

  int32_t rc = pExchange->seqLoadData ? TSDB_CODE_SUCCESS : prepareConcurrentlyLoad(pOperator);
  if (rc != TSDB_CODE_SUCCESS) {
    return rc;
  }

  OPTR_SET_OPENED(pOperator);
  pOperator->cost.openCost = (taosGetTimestampUs() - beginUs) / 1000.0;
  return TSDB_CODE_SUCCESS;
}

2345 2346 2347 2348 2349
// Element destructor for arrays of SSDataBlock pointers: pParam points at the array slot.
static void freeBlock(void* pParam) {
  SSDataBlock** ppBlock = (SSDataBlock**)pParam;
  blockDataDestroy(*ppBlock);
}

2350
/*
 * Return the next buffered data block of the exchange operator, or NULL.
 *
 * The operator is opened first; a failure to open is stored in the task info and NULL is
 * returned. When the buffered block list is empty or fully consumed it is cleared and refilled
 * from the remote sources (sequentially or concurrently, depending on seqLoadData). NULL is
 * returned if the operator is already done or if the refill produced no block.
 */
static SSDataBlock* doLoadRemoteDataImpl(SOperatorInfo* pOperator) {
  SExecTaskInfo* pTask = pOperator->pTaskInfo;
  SExchangeInfo* pExchange = pOperator->info;

  pTask->code = pOperator->fpSet._openFn(pOperator);
  if (pTask->code != TSDB_CODE_SUCCESS) {
    return NULL;
  }

  size_t               numOfSources = taosArrayGetSize(pExchange->pSources);
  SLoadRemoteDataInfo* pStat = &pExchange->loadInfo;

  if (pOperator->status == OP_EXEC_DONE) {
    qDebug("%s all %" PRIzu " source(s) are exhausted, total rows:%" PRIu64 " bytes:%" PRIu64 ", elapsed:%.2f ms",
           GET_TASKID(pTask), numOfSources, pStat->totalRows, pStat->totalSize, pStat->totalElapsed / 1000.0);
    return NULL;
  }

  size_t numOfBuffered = taosArrayGetSize(pExchange->pResultBlockList);
  bool   hasBuffered = (numOfBuffered != 0) && !(pExchange->rspBlockIndex >= numOfBuffered);

  if (!hasBuffered) {
    // everything buffered so far has been handed out: drop it and fetch the next batch
    pExchange->rspBlockIndex = 0;
    taosArrayClearEx(pExchange->pResultBlockList, freeBlock);

    if (!pExchange->seqLoadData) {
      concurrentlyLoadRemoteDataImpl(pOperator, pExchange, pTask);
    } else {
      seqLoadRemoteData(pOperator);
    }

    if (taosArrayGetSize(pExchange->pResultBlockList) == 0) {
      return NULL;
    }
  }

  // hand out the next buffered block and advance the read position
  return taosArrayGetP(pExchange->pResultBlockList, pExchange->rspBlockIndex++);
}
2387

2388 2389 2390 2391 2392 2393 2394 2395
/*
 * Result function of the exchange operator: return the next data block after the limit/offset
 * handling has been applied, or NULL when there is nothing more to return.
 *
 * Without limit/offset information every loaded block is returned as is. Otherwise blocks are
 * passed to handleLimitOffset() until it reports PROJECT_RETRIEVE_DONE; a resulting empty block
 * completes the operator.
 */
static SSDataBlock* doLoadRemoteData(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExchangeInfo* pExchange = pOperator->info;
  SLimitInfo*    pLimit = &pExchange->limitInfo;

  for (;;) {
    SSDataBlock* pLoaded = doLoadRemoteDataImpl(pOperator);
    if (pLoaded == NULL) {
      return NULL;
    }

    if (!hasLimitOffsetInfo(pLimit)) {
      return pLoaded;
    }

    int32_t status = handleLimitOffset(pOperator, pLimit, pLoaded, false);
    if (status != PROJECT_RETRIEVE_DONE) {
      // PROJECT_RETRIEVE_CONTINUE (or any other status): load the next block
      continue;
    }

    size_t numOfRows = pLoaded->info.rows;
    pExchange->limitInfo.numOfOutputRows += numOfRows;

    if (numOfRows != 0) {
      return pLoaded;
    }

    doSetOperatorCompleted(pOperator);
    return NULL;
  }
}

2424
/*
 * Create pInfo->pSourceDataInfo and fill it with one SSourceDataInfo entry per source. Every
 * entry starts in the EX_SOURCE_DATA_NOT_READY state and records the task id string and its own
 * index.
 *
 * Returns TSDB_CODE_SUCCESS or TSDB_CODE_OUT_OF_MEMORY. On failure pInfo->pSourceDataInfo is
 * left as NULL, so a later cleanup of pInfo cannot release the array a second time.
 */
static int32_t initDataSource(int32_t numOfSources, SExchangeInfo* pInfo, const char* id) {
  pInfo->pSourceDataInfo = taosArrayInit(numOfSources, sizeof(SSourceDataInfo));
  if (pInfo->pSourceDataInfo == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  for (int32_t i = 0; i < numOfSources; ++i) {
    SSourceDataInfo dataInfo = {0};
    dataInfo.status = EX_SOURCE_DATA_NOT_READY;
    dataInfo.taskId = id;
    dataInfo.index = i;

    SSourceDataInfo* pDs = taosArrayPush(pInfo->pSourceDataInfo, &dataInfo);
    if (pDs == NULL) {
      taosArrayDestroy(pInfo->pSourceDataInfo);
      pInfo->pSourceDataInfo = NULL;  // do not leave a dangling pointer behind
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return TSDB_CODE_SUCCESS;
}

2445
/*
 * Initialize the exchange operator info from the physical plan node: copy the downstream source
 * nodes into pInfo->pSources, set up the limit information, register pInfo in the exchange
 * object reference pool and create the per-source data info.
 *
 * Returns TSDB_CODE_INVALID_PARA if the plan node has no source, TSDB_CODE_OUT_OF_MEMORY if a
 * source cannot be stored, otherwise the result of initDataSource(). Arrays that were already
 * created stay attached to pInfo on failure.
 */
static int32_t initExchangeOperator(SExchangePhysiNode* pExNode, SExchangeInfo* pInfo, const char* id) {
  size_t numOfSources = LIST_LENGTH(pExNode->pSrcEndPoints);

  if (numOfSources == 0) {
    qError("%s invalid number: %d of sources in exchange operator", id, (int32_t)numOfSources);
    return TSDB_CODE_INVALID_PARA;
  }

  pInfo->pSources = taosArrayInit(numOfSources, sizeof(SDownstreamSourceNode));
  if (pInfo->pSources == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  for (int32_t i = 0; i < numOfSources; ++i) {
    SDownstreamSourceNode* pNode = (SDownstreamSourceNode*)nodesListGetNode((SNodeList*)pExNode->pSrcEndPoints, i);
    // a source that is not stored would later be looked up by index and read out of bounds
    if (taosArrayPush(pInfo->pSources, pNode) == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  initLimitInfo(pExNode->node.pLimit, pExNode->node.pSlimit, &pInfo->limitInfo);
  pInfo->self = taosAddRef(exchangeObjRefPool, pInfo);

  return initDataSource(numOfSources, pInfo, id);
}

/*
 * Create the exchange operator for the given physical plan node.
 *
 * pTransporter is stored in the operator info as is. Returns the new operator, or NULL on
 * failure; in that case everything allocated here is released and the error code is stored in
 * pTaskInfo->code.
 */
SOperatorInfo* createExchangeOperatorInfo(void* pTransporter, SExchangePhysiNode* pExNode, SExecTaskInfo* pTaskInfo) {
  // declared before the first goto so that the error path never reads an uninitialized value
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;

  SExchangeInfo* pInfo = taosMemoryCalloc(1, sizeof(SExchangeInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  code = initExchangeOperator(pExNode, pInfo, GET_TASKID(pTaskInfo));
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  tsem_init(&pInfo->ready, 0, 0);
  pInfo->pDummyBlock = createResDataBlock(pExNode->node.pOutputDataBlockDesc);
  pInfo->pResultBlockList = taosArrayInit(1, POINTER_BYTES);
  if (pInfo->pDummyBlock == NULL || pInfo->pResultBlockList == NULL) {
    // pDummyBlock is dereferenced below and both objects are required when loading data
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pInfo->seqLoadData = false;
  pInfo->pTransporter = pTransporter;

  pOperator->name = "ExchangeOperator";
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_EXCHANGE;
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pDummyBlock->pDataBlock);
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet = createOperatorFpSet(prepareLoadRemoteData, doLoadRemoteData, NULL, NULL,
                                         destroyExchangeOperatorInfo, NULL, NULL, NULL);
  return pOperator;

_error:
  if (pInfo != NULL) {
    doDestroyExchangeOperatorInfo(pInfo);
  }

  taosMemoryFreeClear(pOperator);
  pTaskInfo->code = code;
  return NULL;
}

dengyihao's avatar
dengyihao 已提交
2510 2511
// Forward declaration only; the definition is not located in this part of the file.
static int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                                const char* pKey);
2512

2513
static void destroySortedMergeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
2514
  SSortedMergeOperatorInfo* pInfo = (SSortedMergeOperatorInfo*)param;
H
Haojun Liao 已提交
2515
  taosArrayDestroy(pInfo->pSortInfo);
2516 2517 2518
  taosArrayDestroy(pInfo->groupInfo);

  if (pInfo->pSortHandle != NULL) {
H
Haojun Liao 已提交
2519
    tsortDestroySortHandle(pInfo->pSortHandle);
2520 2521
  }

H
Haojun Liao 已提交
2522
  blockDataDestroy(pInfo->binfo.pRes);
H
Haojun Liao 已提交
2523
  cleanupAggSup(&pInfo->aggSup);
L
Liu Jicong 已提交
2524

D
dapan1121 已提交
2525
  taosMemoryFreeClear(param);
2526
}
H
Haojun Liao 已提交
2527

L
Liu Jicong 已提交
2528
/*
 * Check whether the row rowIndex of pBlock belongs to the group whose column values are saved
 * in buf.
 *
 * groupInfo holds the indexes of the group columns in pBlock and buf[i] is the saved value of the
 * i-th group column (NULL denotes a null value). Returns true if there is no group column or if
 * every group column of the row equals the saved value, false otherwise.
 */
static bool needToMerge(SSDataBlock* pBlock, SArray* groupInfo, char** buf, int32_t rowIndex) {
  size_t size = taosArrayGetSize(groupInfo);
  if (size == 0) {
    return true;
  }

  for (int32_t i = 0; i < size; ++i) {
    int32_t* index = taosArrayGet(groupInfo, i);

    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, *index);
    bool             isNull = colDataIsNull(pColInfo, rowIndex, pBlock->info.rows, NULL);

    if ((isNull && buf[i] != NULL) || (!isNull && buf[i] == NULL)) {
      return false;
    }

    if (isNull) {
      // both values are null: they are equal and there is no data to compare
      continue;
    }

    char* pCell = colDataGetData(pColInfo, rowIndex);
    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      if (varDataLen(pCell) != varDataLen(buf[i])) {
        return false;
      }

      if (memcmp(varDataVal(pCell), varDataVal(buf[i]), varDataLen(pCell)) != 0) {
        return false;
      }
    } else if (memcmp(pCell, buf[i], pColInfo->info.bytes) != 0) {
      return false;
    }
  }

  // no group column differs, the row belongs to the current group
  return true;
}

L
Liu Jicong 已提交
2563 2564 2565
/*
 * Merge the row rowIndex into the intermediate results of the numOfExpr function contexts.
 *
 * The merge itself (invoking the UDF merge or the aggregate merge function of each context) is
 * disabled at the moment, so this function only visits every context without modifying anything.
 */
static void doMergeResultImpl(SSortedMergeOperatorInfo* pInfo, SqlFunctionCtx* pCtx, int32_t numOfExpr,
                              int32_t rowIndex) {
  // TODO set row index: pCtx[k].startRow = rowIndex;

  for (int32_t k = 0; k < numOfExpr; ++k) {
    int32_t funcId = pCtx[k].functionId;
    (void)funcId;

    // TODO: pCtx[k].fpSet->addInput(&pCtx[k]);
    // TODO: for funcId < 0 invoke the UDF with TSDB_UDF_FUNC_MERGE, otherwise call the merge
    //       function of the aggregate.
  }
}
2582

L
Liu Jicong 已提交
2583 2584
/*
 * Finalize the results of the numOfExpr function contexts.
 *
 * The finalize step (UDF finalize or pCtx[k].fpSet.finalize) is disabled at the moment, so this
 * function only visits every context without modifying anything.
 */
static void doFinalizeResultImpl(SqlFunctionCtx* pCtx, int32_t numOfExpr) {
  int32_t k = 0;
  while (k < numOfExpr) {
    int32_t funcId = pCtx[k].functionId;
    (void)funcId;

    // TODO: skip FUNC_TAG_DUMMY/FUNC_TS_DUMMY, invoke the UDF with TSDB_UDF_FUNC_FINALIZE for
    //       funcId < 0, otherwise call pCtx[k].fpSet.finalize(&pCtx[k]).
    k += 1;
  }
}
2597

2598
/*
 * Copy the values of the row rowIndex of pBlock into rowColData. pColumnList holds the indexes
 * of the columns to copy; the value of the k-th listed column goes to rowColData[k].
 *
 * Always returns true.
 */
static bool saveCurrentTuple(char** rowColData, SArray* pColumnList, SSDataBlock* pBlock, int32_t rowIndex) {
  const int32_t numOfCols = (int32_t)taosArrayGetSize(pColumnList);

  int32_t k = 0;
  while (k < numOfCols) {
    int32_t*         pSlot = taosArrayGet(pColumnList, k);
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, *pSlot);

    char* pCell = colDataGetData(pCol, rowIndex);
    memcpy(rowColData[k], pCell, colDataGetLength(pCol, rowIndex));

    k += 1;
  }

  return true;
}
2611

2612 2613
/*
 * Feed every row of pBlock into the merge of the sorted-merge operator.
 *
 * The first row seen starts a group: it is merged and its group values are saved. A following
 * row with the same group values is merged into the current group. A row with different group
 * values closes the current group (finalize, add its number of results to the result block, run
 * the process function of the contexts with a non-negative function id) and starts a new one.
 */
static void doMergeImpl(SOperatorInfo* pOperator, int32_t numOfExpr, SSDataBlock* pBlock) {
  SSortedMergeOperatorInfo* pMergeInfo = pOperator->info;
  SqlFunctionCtx*           pFuncCtx = pOperator->exprSupp.pCtx;

  for (int32_t i = 0; i < pBlock->info.rows; ++i) {
    if (!pMergeInfo->hasGroupVal) {
      ASSERT(i == 0);
      doMergeResultImpl(pMergeInfo, pFuncCtx, numOfExpr, i);
      pMergeInfo->hasGroupVal = saveCurrentTuple(pMergeInfo->groupVal, pMergeInfo->groupInfo, pBlock, i);
      continue;
    }

    if (needToMerge(pBlock, pMergeInfo->groupInfo, pMergeInfo->groupVal, i)) {
      doMergeResultImpl(pMergeInfo, pFuncCtx, numOfExpr, i);
      continue;
    }

    // the row starts a new group: close the current one first
    doFinalizeResultImpl(pFuncCtx, numOfExpr);
    int32_t numOfResults = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);

    // TODO check for available buffer;

    // next group info data
    pMergeInfo->binfo.pRes->info.rows += numOfResults;
    for (int32_t k = 0; k < numOfExpr; ++k) {
      if (pFuncCtx[k].functionId >= 0) {
        pFuncCtx[k].fpSet.process(&pFuncCtx[k]);
      }
    }

    doMergeResultImpl(pMergeInfo, pFuncCtx, numOfExpr, i);
    pMergeInfo->hasGroupVal = saveCurrentTuple(pMergeInfo->groupVal, pMergeInfo->groupInfo, pBlock, i);
  }
}

2649 2650
/*
 * Drain the sort handle of the sorted-merge operator and merge the sorted rows group by group.
 *
 * Rows are pulled from the sort handle into a scratch block of at most resultInfo.capacity rows,
 * which is then handed to doMergeImpl(); this repeats until the sort handle is exhausted. After
 * that the last group is finalized and its number of results is added to the result block.
 *
 * Returns the result block of the operator, or NULL if it holds no row.
 */
static SSDataBlock* doMerge(SOperatorInfo* pOperator) {
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  SSortHandle*              pHandle = pInfo->pSortHandle;

  SSDataBlock* pDataBlock = createOneDataBlock(pInfo->binfo.pRes, false);
  blockDataEnsureCapacity(pDataBlock, pOperator->resultInfo.capacity);

  while (1) {
    blockDataCleanup(pDataBlock);
    while (1) {
      STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
      if (pTupleHandle == NULL) {
        break;
      }

      // build datablock for merge for one group
      appendOneRowToDataBlock(pDataBlock, pTupleHandle);
      if (pDataBlock->info.rows >= pOperator->resultInfo.capacity) {
        break;
      }
    }

    if (pDataBlock->info.rows == 0) {
      break;
    }

    setInputDataBlock(pOperator, pOperator->exprSupp.pCtx, pDataBlock, TSDB_ORDER_ASC, MAIN_SCAN, true);
    doMergeImpl(pOperator, pOperator->exprSupp.numOfExprs, pDataBlock);
    // flush to tuple store, and after all data have been handled, return to upstream node or sink node
  }

  doFinalizeResultImpl(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs);
  int32_t numOfRows = getNumOfResult(pOperator->exprSupp.pCtx, pOperator->exprSupp.numOfExprs, NULL);

  // TODO check for available buffer;

  // next group info data
  pInfo->binfo.pRes->info.rows += numOfRows;

  // the scratch block is owned by this function only, release it before leaving
  // NOTE(review): assumes the function contexts do not read their input block after this point - confirm
  blockDataDestroy(pDataBlock);

  return (pInfo->binfo.pRes->info.rows > 0) ? pInfo->binfo.pRes : NULL;
}
2692

L
Liu Jicong 已提交
2693 2694
/*
 * Fetch up to capacity sorted rows from pHandle and copy them into pDataBlock.
 *
 * pDataBlock is cleaned up first. The rows are collected in a block obtained from
 * tsortGetSortedDataBlock() and then copied column by column according to pColMatchInfo
 * (source slot id -> target slot id); the intermediate block is destroyed afterwards.
 *
 * Returns pDataBlock, or NULL if no sorted block is available or no row was fetched.
 */
SSDataBlock* getSortedMergeBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity,
                                     SArray* pColMatchInfo, SSortedMergeOperatorInfo* pInfo) {
  blockDataCleanup(pDataBlock);

  SSDataBlock* pSorted = tsortGetSortedDataBlock(pHandle);
  if (pSorted == NULL) {
    return NULL;
  }

  blockDataEnsureCapacity(pSorted, capacity);

  // pull tuples until the sort handle is drained or the block is full
  STupleHandle* pTuple = NULL;
  while ((pTuple = tsortNextTuple(pHandle)) != NULL) {
    appendOneRowToDataBlock(pSorted, pTuple);
    if (pSorted->info.rows >= capacity) {
      break;
    }
  }

  if (pSorted->info.rows > 0) {
    int32_t numOfMatched = taosArrayGetSize(pColMatchInfo);

    int32_t k = 0;
    while (k < numOfMatched) {
      SColMatchInfo* pmInfo = taosArrayGet(pColMatchInfo, k);
      ASSERT(pmInfo->matchType == COL_MATCH_FROM_SLOT_ID);

      SColumnInfoData* pFrom = taosArrayGet(pSorted->pDataBlock, pmInfo->srcSlotId);
      SColumnInfoData* pTo = taosArrayGet(pDataBlock->pDataBlock, pmInfo->targetSlotId);
      colDataAssign(pTo, pFrom, pSorted->info.rows, &pDataBlock->info);

      k += 1;
    }

    pDataBlock->info.rows = pSorted->info.rows;
    pDataBlock->info.capacity = pSorted->info.rows;
  }

  blockDataDestroy(pSorted);

  if (pDataBlock->info.rows > 0) {
    return pDataBlock;
  }

  return NULL;
}

2735
/*
 * Result function of the sorted-merge operator.
 *
 * On the first call a multi-source merge sort handle is created with every downstream operator
 * as one sort source, the sort is opened and the merged result is produced by doMerge(). On later
 * calls (status OP_RES_TO_RETURN) the data is fetched through getSortedMergeBlockData().
 *
 * Failures are reported by a longjmp to pTaskInfo->env.
 */
static SSDataBlock* doSortedMerge(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExecTaskInfo*            pTaskInfo = pOperator->pTaskInfo;
  SSortedMergeOperatorInfo* pInfo = pOperator->info;
  if (pOperator->status == OP_RES_TO_RETURN) {
    return getSortedMergeBlockData(pInfo->pSortHandle, pInfo->binfo.pRes, pOperator->resultInfo.capacity, NULL, pInfo);
  }

  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
  // pass the real task id string; it used to be the literal text "GET_TASKID(pTaskInfo)"
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->binfo.pRes, GET_TASKID(pTaskInfo));

  tsortSetFetchRawDataFp(pInfo->pSortHandle, loadNextDataBlock, NULL, NULL);

  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
    if (ps == NULL) {
      longjmp(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    ps->param = pOperator->pDownstream[i];
    tsortAddSource(pInfo->pSortHandle, ps);
  }

  int32_t code = tsortOpen(pInfo->pSortHandle);
  if (code != TSDB_CODE_SUCCESS) {
    longjmp(pTaskInfo->env, terrno);
  }

  pOperator->status = OP_RES_TO_RETURN;
  return doMerge(pOperator);
}
2766

L
Liu Jicong 已提交
2767 2768
/*
 * Set up the group-by information of the sorted-merge operator.
 *
 * For every column in pGroupInfo the first expression whose result slot id equals the column id
 * is looked up; its index is stored in pInfo->groupInfo. pInfo->groupVal is allocated as a single
 * buffer: an array of one pointer per group column, followed by the value storage that these
 * pointers refer to (pCol->bytes for each column).
 *
 * Returns 0 if there is no group column, TSDB_CODE_SUCCESS on success and TSDB_CODE_OUT_OF_MEMORY
 * if an allocation fails.
 */
static int32_t initGroupCol(SExprInfo* pExprInfo, int32_t numOfCols, SArray* pGroupInfo,
                            SSortedMergeOperatorInfo* pInfo) {
  if (pGroupInfo == NULL || taosArrayGetSize(pGroupInfo) == 0) {
    return 0;
  }

  int32_t len = 0;
  SArray* plist = taosArrayInit(3, sizeof(SColumn));
  pInfo->groupInfo = taosArrayInit(3, sizeof(int32_t));

  if (plist == NULL || pInfo->groupInfo == NULL) {
    // plist is local to this function, pInfo->groupInfo stays with pInfo
    if (plist != NULL) {
      taosArrayDestroy(plist);
    }
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // iterate over the requested group columns (pInfo->groupInfo has just been created and is empty)
  size_t numOfGroupCol = taosArrayGetSize(pGroupInfo);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    SColumn* pCol = taosArrayGet(pGroupInfo, i);
    for (int32_t j = 0; j < numOfCols; ++j) {
      SExprInfo* pe = &pExprInfo[j];
      if (pe->base.resSchema.slotId == pCol->colId) {
        taosArrayPush(plist, pCol);
        taosArrayPush(pInfo->groupInfo, &j);
        len += pCol->bytes;
        break;
      }
    }
  }

  ASSERT(taosArrayGetSize(pGroupInfo) == taosArrayGetSize(plist));

  pInfo->groupVal = taosMemoryCalloc(1, (POINTER_BYTES * numOfGroupCol + len));
  if (pInfo->groupVal == NULL) {
    taosArrayDestroy(plist);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // the value storage starts right behind the pointer array; the offset is computed in bytes
  int32_t offset = 0;
  char*   start = (char*)pInfo->groupVal + (POINTER_BYTES * numOfGroupCol);
  for (int32_t i = 0; i < numOfGroupCol; ++i) {
    pInfo->groupVal[i] = start + offset;
    SColumn* pCol = taosArrayGet(plist, i);
    offset += pCol->bytes;
  }

  taosArrayDestroy(plist);

  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2815

X
Xiaoyu Wang 已提交
2816
/*
 * Determine the scan order and scan flag that apply to pOperator.
 *
 * Starting at pOperator, the chain of first downstream operators is followed until an operator
 * is found that defines the values: exchange, system table scan, stream scan, tag scan, block
 * distribution scan and last row scan report TSDB_ORDER_ASC/MAIN_SCAN, table scan and table merge
 * scan report the values stored in their scan info.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_INVALID_PARA if the chain ends before such an operator
 * is found.
 */
int32_t getTableScanInfo(SOperatorInfo* pOperator, int32_t* order, int32_t* scanFlag) {
  // todo add more information about exchange operation
  SOperatorInfo* pCurrent = pOperator;

  for (;;) {
    int32_t type = pCurrent->operatorType;

    switch (type) {
      case QUERY_NODE_PHYSICAL_PLAN_EXCHANGE:
      case QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN:
      case QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN:
      case QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN:
      case QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN:
      case QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN:
        *order = TSDB_ORDER_ASC;
        *scanFlag = MAIN_SCAN;
        return TSDB_CODE_SUCCESS;

      case QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN: {
        STableScanInfo* pScan = pCurrent->info;
        *order = pScan->cond.order;
        *scanFlag = pScan->scanFlag;
        return TSDB_CODE_SUCCESS;
      }

      case QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN: {
        STableMergeScanInfo* pMergeScan = pCurrent->info;
        *order = pMergeScan->cond.order;
        *scanFlag = pMergeScan->scanFlag;
        return TSDB_CODE_SUCCESS;
      }

      default:
        break;
    }

    // not a scan-like operator: continue with its first downstream operator, if there is one
    if (pCurrent->pDownstream == NULL || pCurrent->pDownstream[0] == NULL) {
      return TSDB_CODE_INVALID_PARA;
    }

    pCurrent = pCurrent->pDownstream[0];
  }
}
L
Liu Jicong 已提交
2843
#if 0
L
Liu Jicong 已提交
2844
/*
 * Position the table scan that sits below the stream scan operator at (uid, ts).
 *
 * Every operator visited on the way down is marked OP_OPENED. When the stream scan operator is
 * found, its inner table scan is switched to table-order input and, unless it is already at the
 * requested position, its reader is reset to start right after ts for table uid.
 * uid == 0 marks the scan as having no table.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_APP_ERROR when no stream scan operator is reachable
 * through a chain of single-downstream operators.
 */
int32_t doPrepareScan(SOperatorInfo* pOperator, uint64_t uid, int64_t ts) {
  uint8_t type = pOperator->operatorType;

  pOperator->status = OP_OPENED;

  if (type != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    // keep looking for the stream scan operator; only a single downstream is supported
    if (pOperator->numOfDownstream == 1) {
      return doPrepareScan(pOperator->pDownstream[0], uid, ts);
    }

    if (pOperator->numOfDownstream == 0) {
      qError("failed to find stream scan operator to set the input data block");
    } else {
      qError("join not supported for stream block scan");
    }
    return TSDB_CODE_QRY_APP_ERROR;
  }

  SStreamScanInfo* pStreamScan = pOperator->info;
  pStreamScan->blockType = STREAM_INPUT__TABLE_SCAN;
  pStreamScan->pTableScanOp->status = OP_OPENED;

  STableScanInfo* pTableScan = pStreamScan->pTableScanOp->info;
  ASSERT(pTableScan->scanMode == TABLE_SCAN__TABLE_ORDER);

  if (uid == 0) {
    pTableScan->noTable = 1;
    return TSDB_CODE_SUCCESS;
  }

  pTableScan->noTable = 0;

  // already positioned at the requested (uid, ts): nothing to do
  if (pTableScan->lastStatus.uid == uid && pTableScan->lastStatus.ts == ts) {
    return TSDB_CODE_SUCCESS;
  }

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  int32_t        tableSz = taosArrayGetSize(pTaskInfo->tableqinfoList.pTableList);

  // the whole list is scanned, so the last entry with a matching uid wins
  bool found = false;
  for (int32_t idx = 0; idx < tableSz; idx++) {
    STableKeyInfo* pKeyInfo = taosArrayGet(pTaskInfo->tableqinfoList.pTableList, idx);
    if (pKeyInfo->uid == uid) {
      pTableScan->currentTable = idx;
      found = true;
    }
  }

  // TODO after processing drop, found can be false
  ASSERT(found);

  tsdbSetTableId(pTableScan->dataReader, uid);

  // temporarily move the window start right after ts for the reset, then restore it
  int64_t savedSkey = pTableScan->cond.twindows.skey;
  pTableScan->cond.twindows.skey = ts + 1;
  tsdbReaderReset(pTableScan->dataReader, &pTableScan->cond);
  pTableScan->cond.twindows.skey = savedSkey;
  pTableScan->scanTimes = 0;

  qDebug("tsdb reader offset seek to uid %" PRId64 " ts %" PRId64 ", table cur set to %d , all table num %d", uid, ts,
         pTableScan->currentTable, tableSz);

  return TSDB_CODE_SUCCESS;
}

2911 2912 2913
/*
 * Fetch the last scanned position (table uid and timestamp) recorded by the table scan that sits
 * below the stream scan operator.
 *
 * Descends along the first downstream operator until the stream scan operator is found.
 * uid/ts are only written on success.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_INVALID_PARA when the chain ends before a stream scan
 * operator is found. The result of the recursive lookup is propagated to the caller instead of
 * being dropped.
 */
int32_t doGetScanStatus(SOperatorInfo* pOperator, uint64_t* uid, int64_t* ts) {
  int32_t type = pOperator->operatorType;
  if (type == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamScanInfo* pScanInfo = pOperator->info;
    STableScanInfo*  pSnapShotScanInfo = pScanInfo->pTableScanOp->info;
    *uid = pSnapShotScanInfo->lastStatus.uid;
    *ts = pSnapShotScanInfo->lastStatus.ts;
    return TSDB_CODE_SUCCESS;
  }

  // a leaf operator has no downstream array at all, so check the array before indexing it
  if (pOperator->pDownstream == NULL || pOperator->pDownstream[0] == NULL) {
    return TSDB_CODE_INVALID_PARA;
  }

  return doGetScanStatus(pOperator->pDownstream[0], uid, ts);
}
L
Liu Jicong 已提交
2928
#endif
2929

2930
// this is a blocking operator
L
Liu Jicong 已提交
2931
/*
 * Open the aggregate operator: drain the downstream operator and aggregate every block it yields.
 *
 * Does nothing if the operator is already opened. For each downstream block the scan order/flag is
 * looked up, the optional scalar expressions are applied in place on the block, and the block is
 * fed to doAggregateImpl(). Any failure inside the loop leaves through longjmp(pTaskInfo->env, code).
 * Once the input is exhausted the grouped result info is initialised, the operator is marked opened
 * and the elapsed time is stored in cost.openCost.
 */
static int32_t doOpenAggregateOptr(SOperatorInfo* pOperator) {
  if (OPTR_IS_OPENED(pOperator)) {
    return TSDB_CODE_SUCCESS;
  }

  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;
  SAggOperatorInfo* pAggInfo = pOperator->info;
  SExprSupp*        pAggSup = &pOperator->exprSupp;
  SExprSupp*        pScalarSup = &pAggInfo->scalarExprSup;
  SOperatorInfo*    pChild = pOperator->pDownstream[0];

  int64_t startUs = taosGetTimestampUs();

  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;

  for (SSDataBlock* pBlock = pChild->fpSet.getNextFn(pChild); pBlock != NULL;
       pBlock = pChild->fpSet.getNextFn(pChild)) {
    int32_t code = getTableScanInfo(pOperator, &order, &scanFlag);
    if (code != TSDB_CODE_SUCCESS) {
      longjmp(pTaskInfo->env, code);
    }

    // there is an scalar expression that needs to be calculated before apply the group aggregation.
    if (pScalarSup->pExprInfo != NULL) {
      code = projectApplyFunctions(pScalarSup->pExprInfo, pBlock, pBlock, pScalarSup->pCtx, pScalarSup->numOfExprs,
                                   NULL);
      if (code != TSDB_CODE_SUCCESS) {
        longjmp(pTaskInfo->env, code);
      }
    }

    // the pDataBlock are always the same one, no need to call this again
    setExecutionContext(pOperator, pAggSup->numOfExprs, pBlock->info.groupId);
    setInputDataBlock(pOperator, pAggSup->pCtx, pBlock, order, scanFlag, true);

    code = doAggregateImpl(pOperator, pAggSup->pCtx);
    if (code != 0) {
      longjmp(pTaskInfo->env, code);
    }
  }

  initGroupedResultInfo(&pAggInfo->groupResInfo, pAggInfo->aggSup.pResultRowHashTable, 0);
  OPTR_SET_OPENED(pOperator);

  pOperator->cost.openCost = (taosGetTimestampUs() - startUs) / 1000.0;
  return TSDB_CODE_SUCCESS;
}

2983
/*
 * Return the next non-empty result block of the aggregate operator, or NULL when there is none.
 *
 * The operator is opened through fpSet._openFn first; its return code is stored in pTaskInfo->code
 * and a failure completes the operator and yields NULL. Result blocks are then built and filtered
 * with pCondition until either a block with rows is produced or the grouped results are exhausted,
 * in which case the operator is marked completed.
 */
static SSDataBlock* getAggregateResult(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SAggOperatorInfo* pAggInfo = pOperator->info;
  SOptrBasicInfo*   pBasic = &pAggInfo->binfo;
  SExecTaskInfo*    pTaskInfo = pOperator->pTaskInfo;

  pTaskInfo->code = pOperator->fpSet._openFn(pOperator);
  if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
    doSetOperatorCompleted(pOperator);
    return NULL;
  }

  blockDataEnsureCapacity(pBasic->pRes, pOperator->resultInfo.capacity);

  for (;;) {
    doBuildResultDatablock(pOperator, pBasic, &pAggInfo->groupResInfo, pAggInfo->aggSup.pResultBuf);
    doFilter(pAggInfo->pCondition, pBasic->pRes, NULL);

    // nothing left to build: finish with whatever the last round produced
    if (!hasRemainResults(&pAggInfo->groupResInfo)) {
      doSetOperatorCompleted(pOperator);
      break;
    }

    // the filter may have removed every row; only stop once something survives
    if (pBasic->pRes->info.rows > 0) {
      break;
    }
  }

  size_t numOfRows = blockDataGetNumOfRows(pBasic->pRes);
  pOperator->resultInfo.totalRows += numOfRows;

  if (numOfRows == 0) {
    return NULL;
  }
  return pBasic->pRes;
}

wmmhello's avatar
wmmhello 已提交
3019
/*
 * Serialise every result row of the aggregate operator into one heap buffer.
 *
 * Layout written to *result:
 *   int32 total length | int32 number of rows | { int32 keyLen | key | int32 valueLen | row } ...
 *
 * @param pOperator  aggregate operator; pOperator->info is read as an SOptrBasicInfo immediately
 *                   followed by an SAggSupporter
 * @param result     [out] buffer obtained from taosMemoryCalloc/taosMemoryRealloc; set to NULL when
 *                   there is no result or on allocation failure. Presumably released by the caller
 *                   with taosMemoryFree -- confirm against the callers.
 * @param length     [out] number of bytes written; 0 when there is no result
 * @return TSDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT for NULL out-parameters, or
 *         TSDB_CODE_OUT_OF_MEMORY
 */
int32_t aggEncodeResultRow(SOperatorInfo* pOperator, char** result, int32_t* length) {
  if (result == NULL || length == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));
  int32_t         size = taosHashGetSize(pSup->pResultRowHashTable);
  size_t          keyLen = sizeof(uint64_t) * 2;  // estimate the key length
  int32_t         totalSize =
      sizeof(int32_t) + sizeof(int32_t) + size * (sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize);

  // no result
  if (getTotalBufSize(pSup->pResultBuf) == 0) {
    *result = NULL;
    *length = 0;
    return TSDB_CODE_SUCCESS;
  }

  *result = (char*)taosMemoryCalloc(1, totalSize);
  if (*result == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // the first int32 (total length) is filled in at the end; the row count comes second
  int32_t offset = sizeof(int32_t);
  *(int32_t*)(*result + offset) = size;
  offset += sizeof(int32_t);

  // prepare memory: mark the page of the current result row dirty
  SResultRowPosition* pos = &pInfo->resultRowInfo.cur;
  void*               pPage = getBufPage(pSup->pResultBuf, pos->pageId);
  setBufPageDirty(pPage, true);
  releaseBufPage(pSup->pResultBuf, pPage);

  void* pIter = taosHashIterate(pSup->pResultRowHashTable, NULL);
  while (pIter) {
    void*               key = taosHashGetKey(pIter, &keyLen);
    SResultRowPosition* p1 = (SResultRowPosition*)pIter;

    // NOTE(review): pRow is read below after its page has been released; presumably safe because no
    // other page is requested in between -- confirm against the paged buffer implementation.
    pPage = (SFilePage*)getBufPage(pSup->pResultBuf, p1->pageId);
    SResultRow* pRow = (SResultRow*)((char*)pPage + p1->offset);
    setBufPageDirty(pPage, true);
    releaseBufPage(pSup->pResultBuf, pPage);

    // recalculate the result size, the real key may be longer than the estimate
    int32_t realTotalSize = offset + sizeof(int32_t) + keyLen + sizeof(int32_t) + pSup->resultRowSize;
    if (realTotalSize > totalSize) {
      char* tmp = (char*)taosMemoryRealloc(*result, realTotalSize);
      if (tmp == NULL) {
        taosMemoryFree(*result);
        *result = NULL;
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      *result = tmp;
      // remember the new capacity, otherwise every following entry triggers another realloc
      totalSize = realTotalSize;
    }

    // save key
    *(int32_t*)(*result + offset) = keyLen;
    offset += sizeof(int32_t);
    memcpy(*result + offset, key, keyLen);
    offset += keyLen;

    // save value
    *(int32_t*)(*result + offset) = pSup->resultRowSize;
    offset += sizeof(int32_t);
    memcpy(*result + offset, pRow, pSup->resultRowSize);
    offset += pSup->resultRowSize;

    pIter = taosHashIterate(pSup->pResultRowHashTable, pIter);
  }

  *(int32_t*)(*result) = offset;
  *length = offset;

  return TSDB_CODE_SUCCESS;
}

3096
/*
 * Rebuild the aggregate result rows from a buffer laid out as
 *   int32 total length | int32 number of rows | { int32 keyLen | key | int32 valueLen | row } ...
 *
 * For every entry a new result row is allocated in the paged result buffer, registered in the
 * result row hash table under the encoded key, and filled with the encoded row (keeping the page
 * id / offset of the newly allocated row). The first 8 bytes of the key are used as the group id
 * when allocating the row. resultRowInfo.cur ends up pointing at the last decoded row.
 *
 * Each entry is validated against the encoded total length before anything is read from it or
 * registered, so a truncated or corrupted buffer is rejected without reading past its end and
 * without leaving a half-initialised row in the hash table.
 *
 * @param pOperator  aggregate operator; pOperator->info is read as an SOptrBasicInfo immediately
 *                   followed by an SAggSupporter
 * @param result     encoded buffer
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_TSC_INVALID_INPUT when result is NULL, malformed, or a
 *         new result row cannot be obtained
 */
int32_t aggDecodeResultRow(SOperatorInfo* pOperator, char* result) {
  if (result == NULL) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)(pOperator->info);
  SAggSupporter*  pSup = (SAggSupporter*)POINTER_SHIFT(pOperator->info, sizeof(SOptrBasicInfo));

  int32_t length = *(int32_t*)(result);
  int32_t offset = sizeof(int32_t);

  int32_t count = *(int32_t*)(result + offset);
  offset += sizeof(int32_t);

  while (count-- > 0 && length > offset) {
    // the key length header must fit
    if ((int64_t)offset + (int64_t)sizeof(int32_t) > (int64_t)length) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }
    int32_t keyLen = *(int32_t*)(result + offset);
    offset += sizeof(int32_t);

    // the key, the 8-byte group id read from its start, and the value length header must fit
    int64_t remain = (int64_t)length - (int64_t)offset;
    if (keyLen < 0 || (int64_t)keyLen + (int64_t)sizeof(int32_t) > remain || (int64_t)sizeof(uint64_t) > remain) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    char*   pKey = result + offset;
    int32_t valueLen = *(int32_t*)(pKey + keyLen);
    if (valueLen < 0 || valueLen != pSup->resultRowSize ||
        (int64_t)keyLen + (int64_t)sizeof(int32_t) + (int64_t)valueLen > remain) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    uint64_t    tableGroupId = *(uint64_t*)pKey;
    SResultRow* resultRow = getNewResultRow(pSup->pResultBuf, tableGroupId, pSup->resultRowSize);
    if (!resultRow) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    // add a new result set for a new group
    SResultRowPosition pos = {.pageId = resultRow->pageId, .offset = resultRow->offset};
    taosHashPut(pSup->pResultRowHashTable, pKey, keyLen, &pos, sizeof(SResultRowPosition));

    offset += keyLen;
    offset += sizeof(int32_t);

    // the encoded row carries the page position of the source; keep the one of the new row
    int32_t pageId = resultRow->pageId;
    int32_t pOffset = resultRow->offset;
    memcpy(resultRow, result + offset, valueLen);
    resultRow->pageId = pageId;
    resultRow->offset = pOffset;
    offset += valueLen;

    initResultRow(resultRow);
    pInfo->resultRowInfo.cur = (SResultRowPosition){.pageId = resultRow->pageId, .offset = resultRow->offset};
  }

  if (offset != length) {
    return TSDB_CODE_TSC_INVALID_INPUT;
  }
  return TSDB_CODE_SUCCESS;
}

3148 3149 3150 3151 3152
/*
 * Apply the group offset/limit (soffset/slimit) and the per-group row offset/limit to pBlock.
 *
 * pBlock is modified in place: it may be emptied, have leading rows trimmed, or be cut to the
 * remaining per-group limit. pLimitInfo tracks the current group, the remaining offsets and the
 * number of emitted groups; pOperator->status is set to OP_EXEC_DONE once the group limit is hit.
 *
 * @return PROJECT_RETRIEVE_DONE when the caller should stop accumulating for this round,
 *         PROJECT_RETRIEVE_CONTINUE when it should fetch more input
 */
int32_t handleLimitOffset(SOperatorInfo* pOperator, SLimitInfo* pLimitInfo, SSDataBlock* pBlock, bool holdDataInBuf) {
  // 1. whole groups that still have to be skipped
  if (pLimitInfo->remainGroupOffset > 0) {
    if (pLimitInfo->currentGroupId == 0) {  // it is the first group
      pLimitInfo->currentGroupId = pBlock->info.groupId;
      blockDataCleanup(pBlock);
      return PROJECT_RETRIEVE_CONTINUE;
    }

    if (pLimitInfo->currentGroupId != pBlock->info.groupId) {
      // now it is the data from a new group
      pLimitInfo->remainGroupOffset -= 1;

      // ignore data block in current group
      if (pLimitInfo->remainGroupOffset > 0) {
        blockDataCleanup(pBlock);
        return PROJECT_RETRIEVE_CONTINUE;
      }
    }

    // set current group id of the project operator
    pLimitInfo->currentGroupId = pBlock->info.groupId;
  }

  // 2. a block of a new group arrives: close the previous group first
  bool isNewGroup = (pLimitInfo->currentGroupId != 0) && (pLimitInfo->currentGroupId != pBlock->info.groupId);
  if (isNewGroup) {
    pLimitInfo->numOfOutputGroups += 1;

    bool groupLimitReached =
        (pLimitInfo->slimit.limit > 0) && (pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups);
    if (groupLimitReached) {
      pOperator->status = OP_EXEC_DONE;
      blockDataCleanup(pBlock);
      return PROJECT_RETRIEVE_DONE;
    }

    // reset the value for a new group data
    pLimitInfo->numOfOutputRows = 0;
    pLimitInfo->remainOffset = pLimitInfo->limit.offset;

    // existing rows that belongs to previous group.
    if (pBlock->info.rows > 0) {
      return PROJECT_RETRIEVE_DONE;
    }
  }

  // 3. here we reach the start position, according to the limit/offset requirements.
  pLimitInfo->currentGroupId = pBlock->info.groupId;

  // 4. per-group row offset
  if (pLimitInfo->remainOffset >= pBlock->info.rows) {
    // the whole block is still inside the offset
    pLimitInfo->remainOffset -= pBlock->info.rows;
    blockDataCleanup(pBlock);
    return PROJECT_RETRIEVE_CONTINUE;
  }

  if (pLimitInfo->remainOffset > 0) {
    // only the head of the block is inside the offset
    blockDataTrimFirstNRows(pBlock, pLimitInfo->remainOffset);
    pLimitInfo->remainOffset = 0;
  }

  // 5. check for the limitation in each group
  if (pLimitInfo->limit.limit >= 0 && pLimitInfo->numOfOutputRows + pBlock->info.rows >= pLimitInfo->limit.limit) {
    int32_t keepRows = (int32_t)(pLimitInfo->limit.limit - pLimitInfo->numOfOutputRows);
    blockDataKeepFirstNRows(pBlock, keepRows);

    if (pLimitInfo->slimit.limit > 0 && pLimitInfo->slimit.limit <= pLimitInfo->numOfOutputGroups) {
      pOperator->status = OP_EXEC_DONE;
    }

    return PROJECT_RETRIEVE_DONE;
  }

  // todo optimize performance
  // If there are slimit/soffset value exists, multi-round result can not be packed into one group, since the
  // they may not belong to the same group the limit/offset value is not valid in this case.
  bool flushNow = (!holdDataInBuf) || (pBlock->info.rows >= pOperator->resultInfo.threshold) ||
                  pLimitInfo->slimit.offset != -1 || pLimitInfo->slimit.limit != -1;

  // when not flushing, the block is not full enough: continue to accumulate the output data in the buffer.
  return flushNow ? PROJECT_RETRIEVE_DONE : PROJECT_RETRIEVE_CONTINUE;
}

3225
static void doApplyScalarCalculation(SOperatorInfo* pOperator, SSDataBlock* pBlock, int32_t order, int32_t scanFlag);
L
Liu Jicong 已提交
3226 3227
/*
 * Start filling the cached first block of a new group (pInfo->existNewGroupBlock).
 *
 * Resets the fill state, runs the scalar calculation on the cached block, hands the calculated
 * block (pInfo->pRes) to the fill info and produces as many rows into pInfo->pFinalRes as its
 * remaining capacity allows. Afterwards the cached block becomes the current group and the cache
 * slot is cleared. The caller must make sure existNewGroupBlock is not NULL.
 */
static void doHandleRemainBlockForNewGroupImpl(SOperatorInfo* pOperator, SFillOperatorInfo* pInfo,
                                               SResultInfo* pResultInfo, SExecTaskInfo* pTaskInfo) {
  SSDataBlock* pNewGroupBlock = pInfo->existNewGroupBlock;
  SSDataBlock* pOut = pInfo->pFinalRes;

  pInfo->totalInputRows = pNewGroupBlock->info.rows;

  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;
  getTableScanInfo(pOperator, &order, &scanFlag);

  // a completed task fills up to the end of the fill window, otherwise up to the end of the block
  int64_t ekey;
  if (Q_STATUS_EQUAL(pTaskInfo->status, TASK_COMPLETED)) {
    ekey = pInfo->win.ekey;
  } else {
    ekey = pNewGroupBlock->info.window.ekey;
  }

  taosResetFillInfo(pInfo->pFillInfo, getFillInfoStart(pInfo->pFillInfo));

  doApplyScalarCalculation(pOperator, pNewGroupBlock, order, scanFlag);

  taosFillSetStartInfo(pInfo->pFillInfo, pInfo->pRes->info.rows, ekey);
  taosFillSetInputDataBlock(pInfo->pFillInfo, pInfo->pRes);

  int32_t freeRows = pResultInfo->capacity - pOut->info.rows;
  taosFillResultDataBlock(pInfo->pFillInfo, pOut, freeRows);

  pInfo->curGroupId = pNewGroupBlock->info.groupId;
  pInfo->existNewGroupBlock = NULL;
}

L
Liu Jicong 已提交
3251 3252
/*
 * Continue producing fill output from state left over by a previous round.
 *
 * If the fill info still has pending results they are emitted into pInfo->pFinalRes first and
 * nothing else is done; otherwise a cached block of a new group, if any, is started.
 */
static void doHandleRemainBlockFromNewGroup(SOperatorInfo* pOperator, SFillOperatorInfo* pInfo,
                                            SResultInfo* pResultInfo, SExecTaskInfo* pTaskInfo) {
  if (!taosFillHasMoreResults(pInfo->pFillInfo)) {
    // handle the cached new group data block
    if (pInfo->existNewGroupBlock) {
      doHandleRemainBlockForNewGroupImpl(pOperator, pInfo, pResultInfo, pTaskInfo);
    }
    return;
  }

  // the current group still has rows to emit
  int32_t freeRows = pResultInfo->capacity - pInfo->pFinalRes->info.rows;
  taosFillResultDataBlock(pInfo->pFillInfo, pInfo->pFinalRes, freeRows);
  pInfo->pRes->info.groupId = pInfo->curGroupId;
}

/*
 * Evaluate the fill operator's expressions on pBlock and store the outcome in pInfo->pRes.
 *
 * After the projection, pInfo->pRes takes over the group id of pBlock, the primary timestamp
 * column is copied from the source slot (primarySrcSlotId) to the destination slot (primaryTsCol),
 * and every "not fill" column is copied from the slot of its first parameter to its result slot.
 */
static void doApplyScalarCalculation(SOperatorInfo* pOperator, SSDataBlock* pBlock, int32_t order, int32_t scanFlag) {
  SFillOperatorInfo* pInfo = pOperator->info;
  SExprSupp*         pSup = &pOperator->exprSupp;
  SSDataBlock*       pCalcRes = pInfo->pRes;
  SSDataBlock*       pFinalRes = pInfo->pFinalRes;

  setInputDataBlock(pOperator, pSup->pCtx, pBlock, order, scanFlag, false);
  projectApplyFunctions(pSup->pExprInfo, pCalcRes, pBlock, pSup->pCtx, pSup->numOfExprs, NULL);
  pCalcRes->info.groupId = pBlock->info.groupId;

  // primary timestamp column
  SColumnInfoData* pTsDst = taosArrayGet(pCalcRes->pDataBlock, pInfo->primaryTsCol);
  SColumnInfoData* pTsSrc = taosArrayGet(pBlock->pDataBlock, pInfo->primarySrcSlotId);
  colDataAssign(pTsDst, pTsSrc, pCalcRes->info.rows, &pFinalRes->info);

  // the columns that are not filled are stored after the filled expressions in pFillCol
  SFillColInfo* pNotFillCols = &pInfo->pFillInfo->pFillCol[pInfo->numOfExpr];
  for (int32_t k = 0; k < pInfo->numOfNotFillExpr; ++k) {
    SFillColInfo* pCol = &pNotFillCols[k];
    ASSERT(pCol->notFillCol);

    SExprInfo* pExpr = pCol->pExpr;

    SColumnInfoData* pColDst = taosArrayGet(pCalcRes->pDataBlock, pExpr->base.resSchema.slotId);
    SColumnInfoData* pColSrc = taosArrayGet(pBlock->pDataBlock, pExpr->base.pParam[0].pCol->slotId);
    colDataAssign(pColDst, pColSrc, pCalcRes->info.rows, &pFinalRes->info);
  }
}

S
slzhou 已提交
3293
/*
 * Produce the next block of fill output (pInfo->pFinalRes), or NULL when nothing can be produced.
 *
 * Pending output of the current group and a cached block of a new group are handled first. Then
 * blocks are pulled from the downstream operator: blocks of the current group are fed to the fill
 * info; the first block of a different group is cached in existNewGroupBlock and the current group
 * is closed at the end of the fill window. The returned block always carries curGroupId, so one
 * block never mixes the output of two groups.
 */
static SSDataBlock* doFillImpl(SOperatorInfo* pOperator) {
  SFillOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*     pTaskInfo = pOperator->pTaskInfo;
  SResultInfo*       pResultInfo = &pOperator->resultInfo;
  SSDataBlock*       pOut = pInfo->pFinalRes;

  blockDataCleanup(pOut);
  blockDataCleanup(pInfo->pRes);

  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;
  getTableScanInfo(pOperator, &order, &scanFlag);

  doHandleRemainBlockFromNewGroup(pOperator, pInfo, pResultInfo, pTaskInfo);
  if (pOut->info.rows > 0) {
    pOut->info.groupId = pInfo->curGroupId;
    return pOut;
  }

  SOperatorInfo* pDownstream = pOperator->pDownstream[0];
  for (;;) {
    SSDataBlock* pBlock = pDownstream->fpSet.getNextFn(pDownstream);

    if (pBlock == NULL) {
      // no input at all means there is nothing to fill
      if (pInfo->totalInputRows == 0) {
        doSetOperatorCompleted(pOperator);
        return NULL;
      }

      // input exhausted: close the current group at the end of the fill window
      taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
    } else {
      blockDataUpdateTsWindow(pBlock, pInfo->primarySrcSlotId);
      doApplyScalarCalculation(pOperator, pBlock, order, scanFlag);

      if (pInfo->curGroupId == 0 || pInfo->curGroupId == pInfo->pRes->info.groupId) {
        pInfo->curGroupId = pInfo->pRes->info.groupId;  // the first data block
        pInfo->totalInputRows += pInfo->pRes->info.rows;

        // the block boundary facing the fill direction depends on whether the scan order matches it
        int64_t boundKey = (order == pInfo->pFillInfo->order) ? pBlock->info.window.ekey : pBlock->info.window.skey;
        taosFillSetStartInfo(pInfo->pFillInfo, pInfo->pRes->info.rows, boundKey);
        taosFillSetInputDataBlock(pInfo->pFillInfo, pInfo->pRes);
      } else if (pInfo->curGroupId != pBlock->info.groupId) {  // the new group data block
        pInfo->existNewGroupBlock = pBlock;

        // Fill the previous group data block, before handle the data block of new group.
        // Close the fill operation for previous group data block
        taosFillSetStartInfo(pInfo->pFillInfo, 0, pInfo->win.ekey);
      }
    }

    int32_t freeRows = pResultInfo->capacity - pOut->info.rows;
    taosFillResultDataBlock(pInfo->pFillInfo, pOut, freeRows);

    if (pOut->info.rows > 0) {
      // 1. The result in current group not reach the threshold of output result, continue
      // 2. If multiple group results existing in one SSDataBlock is not allowed, return immediately
      if (pOut->info.rows > pResultInfo->threshold || pBlock == NULL || pInfo->existNewGroupBlock != NULL) {
        pOut->info.groupId = pInfo->curGroupId;
        return pOut;
      }

      doHandleRemainBlockFromNewGroup(pOperator, pInfo, pResultInfo, pTaskInfo);
      if (pOut->info.rows >= pResultInfo->threshold || pBlock == NULL) {
        pOut->info.groupId = pInfo->curGroupId;
        return pOut;
      }

      continue;
    }

    // current group has no more result to return
    if (!pInfo->existNewGroupBlock) {
      return NULL;
    }

    // try next group
    assert(pBlock != NULL);

    blockDataCleanup(pOut);
    blockDataCleanup(pInfo->pRes);

    doHandleRemainBlockForNewGroupImpl(pOperator, pInfo, pResultInfo, pTaskInfo);
    if (pOut->info.rows > pResultInfo->threshold) {
      pOut->info.groupId = pInfo->curGroupId;
      return pOut;
    }
  }
}

S
slzhou 已提交
3380 3381 3382 3383 3384 3385 3386 3387
/*
 * Return the next non-empty, filtered block of fill output, or NULL when the operator is done.
 *
 * doFillImpl() is called repeatedly until it yields a block that still has rows after pCondition
 * has been applied. When doFillImpl() returns NULL the operator is marked completed. The rows of
 * the returned block are added to resultInfo.totalRows.
 */
static SSDataBlock* doFill(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SFillOperatorInfo* pInfo = pOperator->info;

  for (;;) {
    SSDataBlock* pFilled = doFillImpl(pOperator);
    if (pFilled == NULL) {
      doSetOperatorCompleted(pOperator);
      return NULL;
    }

    doFilter(pInfo->pCondition, pFilled, pInfo->pColMatchColInfo);

    // the filter may have removed every row; try the next block in that case
    if (pFilled->info.rows > 0) {
      pOperator->resultInfo.totalRows += pFilled->info.rows;
      return pFilled;
    }
  }
}

3409
/*
 * Release the memory owned by each of the numOfExprs entries of pExpr: the column descriptor of
 * every column-type parameter, the parameter array and the pExpr member.
 * The pExpr array itself is not freed here.
 */
void destroyExprInfo(SExprInfo* pExpr, int32_t numOfExprs) {
  for (int32_t exprIdx = 0; exprIdx < numOfExprs; ++exprIdx) {
    SExprInfo* pOne = pExpr + exprIdx;

    int32_t paramIdx = 0;
    while (paramIdx < pOne->base.numOfParams) {
      // only column parameters own a separately allocated descriptor
      if (pOne->base.pParam[paramIdx].type == FUNC_PARAM_TYPE_COLUMN) {
        taosMemoryFreeClear(pOne->base.pParam[paramIdx].pCol);
      }
      ++paramIdx;
    }

    taosMemoryFree(pOne->base.pParam);
    taosMemoryFree(pOne->pExpr);
  }
}

3423 3424 3425 3426 3427
/*
 * Destroy an operator and, recursively, all of its downstream operators.
 *
 * The operator's own closeFn (if set) runs first, then the downstream operators are destroyed in
 * index order and the downstream array is freed, and finally the expression support and the
 * operator structure itself are released. NULL is accepted and ignored.
 */
static void destroyOperatorInfo(SOperatorInfo* pOperator) {
  if (pOperator == NULL) {
    return;
  }

  if (pOperator->fpSet.closeFn != NULL) {
    pOperator->fpSet.closeFn(pOperator->info, pOperator->exprSupp.numOfExprs);
  }

  if (pOperator->pDownstream != NULL) {
    int32_t childIdx = 0;
    while (childIdx < pOperator->numOfDownstream) {
      destroyOperatorInfo(pOperator->pDownstream[childIdx]);
      ++childIdx;
    }

    taosMemoryFreeClear(pOperator->pDownstream);
    pOperator->numOfDownstream = 0;
  }

  cleanupExprSupp(&pOperator->exprSupp);
  taosMemoryFreeClear(pOperator);
}

3445 3446 3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459
/*
 * Choose the page size and the in-memory buffer size for a paged result buffer.
 *
 * The page size is the smallest power of two that is at least 4096 bytes and at least four times
 * rowSize. The buffer size is 1 MiB (4096 * 256), raised if needed so that it holds at least four
 * pages.
 *
 * The sizing is done in 64-bit arithmetic so that a negative rowSize (treated as 0) or a very
 * large one can neither overflow `rowSize * 4` nor make the doubling loop wrap to 0 and spin
 * forever. The page size is capped at 2^31 and the buffer size at UINT32_MAX.
 *
 * @param rowSize       size of one result row in bytes
 * @param defaultPgsz   [out] page size in bytes
 * @param defaultBufsz  [out] in-memory buffer size in bytes
 * @return always 0
 */
int32_t getBufferPgSize(int32_t rowSize, uint32_t* defaultPgsz, uint32_t* defaultBufsz) {
  const uint32_t minPgsz = 4096;
  const uint32_t minBufsz = 4096 * 256;

  // a page should be able to hold four rows
  uint64_t required = (rowSize > 0) ? ((uint64_t)rowSize * 4) : 0;

  uint32_t pgsz = minPgsz;
  while (pgsz < required && pgsz <= (UINT32_MAX >> 1)) {
    pgsz <<= 1u;
  }

  // at least four pages need to be in buffer
  uint64_t bufsz = minBufsz;
  if (bufsz < (uint64_t)pgsz * 4) {
    bufsz = (uint64_t)pgsz * 4;
  }
  if (bufsz > UINT32_MAX) {
    bufsz = UINT32_MAX;
  }

  *defaultPgsz = pgsz;
  *defaultBufsz = (uint32_t)bufsz;
  return 0;
}

dengyihao's avatar
dengyihao 已提交
3460 3461
/*
 * Initialise the aggregate supporter: result row size, key buffer, result row hash table and the
 * disk-based result buffer.
 *
 * @param pAggSup      supporter to initialise
 * @param pCtx         function contexts used to compute the result row size
 * @param numOfOutput  number of entries in pCtx
 * @param keyBufSize   payload size of the key buffer; POINTER_BYTES + sizeof(int64_t) bytes are added
 * @param pKey         identifier handed to createDiskbasedBuf
 * @return TSDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY, TSDB_CODE_NO_AVAIL_DISK (also stored in terrno)
 *         or the error of createDiskbasedBuf. Nothing is released here on failure;
 *         presumably the caller runs cleanupAggSup() -- confirm against the callers.
 */
int32_t doInitAggInfoSup(SAggSupporter* pAggSup, SqlFunctionCtx* pCtx, int32_t numOfOutput, size_t keyBufSize,
                         const char* pKey) {
  _hash_fn_t binaryHashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);

  pAggSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pAggSup->keyBuf = taosMemoryCalloc(1, keyBufSize + POINTER_BYTES + sizeof(int64_t));
  pAggSup->pResultRowHashTable = taosHashInit(10, binaryHashFn, true, HASH_NO_LOCK);

  bool allocated = (pAggSup->keyBuf != NULL) && (pAggSup->pResultRowHashTable != NULL);
  if (!allocated) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  uint32_t pageSize = 0;
  uint32_t bufSize = 0;
  getBufferPgSize(pAggSup->resultRowSize, &pageSize, &bufSize);

  // the paged buffer is created under tsTempDir, so that location has to be usable
  if (!osTempSpaceAvailable()) {
    terrno = TSDB_CODE_NO_AVAIL_DISK;
    qError("Init stream agg supporter failed since %s", terrstr(terrno));
    return terrno;
  }

  int32_t code = createDiskbasedBuf(&pAggSup->pResultBuf, pageSize, bufSize, pKey, tsTempDir);
  if (code == TSDB_CODE_SUCCESS) {
    return TSDB_CODE_SUCCESS;
  }

  qError("Create agg result buf failed since %s", tstrerror(code));
  return code;
}

3491
/*
 * Release everything owned by the aggregate supporter: the key buffer, the result row hash table
 * and the disk-based result buffer. The supporter structure itself is not freed.
 *
 * All three handles are reset to NULL afterwards (keyBuf already was, through
 * taosMemoryFreeClear), so no dangling pointer is left behind in the supporter.
 */
void cleanupAggSup(SAggSupporter* pAggSup) {
  taosMemoryFreeClear(pAggSup->keyBuf);

  taosHashCleanup(pAggSup->pResultRowHashTable);
  pAggSup->pResultRowHashTable = NULL;

  destroyDiskbasedBuf(pAggSup->pResultBuf);
  pAggSup->pResultBuf = NULL;
}

L
Liu Jicong 已提交
3497 3498
/*
 * Initialise the expression support and the aggregate supporter of an aggregating operator and
 * attach the supporter's result buffer to every function context.
 *
 * @return TSDB_CODE_SUCCESS, or the first error reported by initExprSupp() / doInitAggInfoSup()
 */
int32_t initAggInfo(SExprSupp* pSup, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols, size_t keyBufSize,
                    const char* pkey) {
  int32_t code = initExprSupp(pSup, pExprInfo, numOfCols);
  if (code == TSDB_CODE_SUCCESS) {
    code = doInitAggInfoSup(pAggSup, pSup->pCtx, numOfCols, keyBufSize, pkey);
  }

  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  // every function context works on the shared result buffer
  SqlFunctionCtx* pCtx = pSup->pCtx;
  for (int32_t col = 0; col < numOfCols; ++col) {
    pCtx[col].pBuf = pAggSup->pResultBuf;
  }

  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
3516
/*
 * Set the capacity of the result block to numOfRows and the output threshold to 75% of it.
 * If that product ends up as 0, the threshold falls back to numOfRows.
 * numOfRows must not be 0.
 */
void initResultSizeInfo(SResultInfo* pResultInfo, int32_t numOfRows) {
  ASSERT(numOfRows != 0);

  pResultInfo->capacity = numOfRows;
  pResultInfo->threshold = numOfRows * 0.75;

  // never leave the threshold at zero
  if (pResultInfo->threshold != 0) {
    return;
  }
  pResultInfo->threshold = numOfRows;
}

3526 3527 3528 3529 3530
/*
 * Initialise the basic operator info: reset the result row info and attach pBlock as the result
 * block. Only the pointer is stored; the block is not copied.
 */
void initBasicInfo(SOptrBasicInfo* pInfo, SSDataBlock* pBlock) {
  initResultRowInfo(&pInfo->resultRowInfo);
  pInfo->pRes = pBlock;
}

5
54liuyao 已提交
3531
/*
 * Destroy an array of numOfOutput function contexts: the variant of every parameter, the
 * subsidiary context array and the input data / column aggregate arrays of each context, and
 * finally the array itself.
 *
 * @return always NULL, so the result can be assigned back to the caller's pointer
 */
void* destroySqlFunctionCtx(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  if (pCtx != NULL) {
    for (int32_t ctxIdx = 0; ctxIdx < numOfOutput; ++ctxIdx) {
      SqlFunctionCtx* pOne = &pCtx[ctxIdx];

      for (int32_t paramIdx = 0; paramIdx < pOne->numOfParams; ++paramIdx) {
        taosVariantDestroy(&pOne->param[paramIdx].param);
      }

      taosMemoryFreeClear(pOne->subsidiaries.pCtx);
      taosMemoryFree(pOne->input.pData);
      taosMemoryFree(pOne->input.pColumnDataAgg);
    }

    taosMemoryFreeClear(pCtx);
  }

  return NULL;
}

3550
/*
 * Attach an expression array to pSup and create the matching function contexts.
 *
 * pExprInfo and numOfExpr are stored as given. When pExprInfo is NULL no function context is
 * created and pSup->pCtx is left untouched.
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the contexts cannot be created
 */
int32_t initExprSupp(SExprSupp* pSup, SExprInfo* pExprInfo, int32_t numOfExpr) {
  pSup->pExprInfo = pExprInfo;
  pSup->numOfExprs = numOfExpr;

  // nothing to evaluate, so no context is needed
  if (pSup->pExprInfo == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  pSup->pCtx = createSqlFunctionCtx(pExprInfo, numOfExpr, &pSup->rowEntryInfoOffset);
  return (pSup->pCtx == NULL) ? TSDB_CODE_OUT_OF_MEMORY : TSDB_CODE_SUCCESS;
}

3563 3564 3565 3566
// Release everything held by an expression support struct: the function contexts,
// the expression array (when present) and the row-entry offset table.
void cleanupExprSupp(SExprSupp* pSupp) {
  const int32_t numOfExprs = pSupp->numOfExprs;

  destroySqlFunctionCtx(pSupp->pCtx, numOfExprs);

  if (pSupp->pExprInfo != NULL) {
    destroyExprInfo(pSupp->pExprInfo, numOfExprs);
    taosMemoryFreeClear(pSupp->pExprInfo);
  }

  taosMemoryFree(pSupp->rowEntryInfoOffset);
}

L
Liu Jicong 已提交
3572
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
S
slzhou 已提交
3573
                                           SSDataBlock* pResultBlock, SNode* pCondition, SExprInfo* pScalarExprInfo,
3574
                                           int32_t numOfScalarExpr, bool mergeResult, SExecTaskInfo* pTaskInfo) {
wafwerar's avatar
wafwerar 已提交
3575
  SAggOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SAggOperatorInfo));
L
Liu Jicong 已提交
3576
  SOperatorInfo*    pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
H
Haojun Liao 已提交
3577 3578 3579
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }
H
Haojun Liao 已提交
3580

dengyihao's avatar
dengyihao 已提交
3581
  size_t keyBufSize = sizeof(int64_t) + sizeof(int64_t) + POINTER_BYTES;
3582

3583
  initResultSizeInfo(&pOperator->resultInfo, 4096);
3584
  int32_t code = initAggInfo(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, numOfCols, keyBufSize, pTaskInfo->id.str);
L
Liu Jicong 已提交
3585
  if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
3586 3587
    goto _error;
  }
H
Haojun Liao 已提交
3588

3589
  initBasicInfo(&pInfo->binfo, pResultBlock);
3590 3591 3592 3593
  code = initExprSupp(&pInfo->scalarExprSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3594

3595
  pInfo->binfo.mergeResultBlock = mergeResult;
3596
  pInfo->groupId = UINT64_MAX;
S
slzhou 已提交
3597
  pInfo->pCondition = pCondition;
dengyihao's avatar
dengyihao 已提交
3598
  pOperator->name = "TableAggregate";
3599
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_HASH_AGG;
3600
  pOperator->blocking = true;
dengyihao's avatar
dengyihao 已提交
3601 3602 3603
  pOperator->status = OP_NOT_OPENED;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;
H
Haojun Liao 已提交
3604

3605 3606
  pOperator->fpSet = createOperatorFpSet(doOpenAggregateOptr, getAggregateResult, NULL, NULL, destroyAggOperatorInfo,
                                         aggEncodeResultRow, aggDecodeResultRow, NULL);
H
Haojun Liao 已提交
3607

3608 3609 3610 3611 3612 3613
  if (downstream->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
    STableScanInfo* pTableScanInfo = downstream->info;
    pTableScanInfo->pdInfo.pExprSup = &pOperator->exprSupp;
    pTableScanInfo->pdInfo.pAggSup = &pInfo->aggSup;
  }

H
Haojun Liao 已提交
3614 3615 3616 3617
  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
3618 3619

  return pOperator;
L
Liu Jicong 已提交
3620
_error:
H
Haojun Liao 已提交
3621
  destroyAggOperatorInfo(pInfo, numOfCols);
wafwerar's avatar
wafwerar 已提交
3622
  taosMemoryFreeClear(pOperator);
H
Haojun Liao 已提交
3623 3624
  pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
3625 3626
}

3627
// Destroy the result block held by pInfo and store what blockDataDestroy returns
// back into pInfo->pRes. pInfo must not be NULL (asserted).
void cleanupBasicInfo(SOptrBasicInfo* pInfo) {
  assert(pInfo != NULL);

  SSDataBlock* pResBlock = pInfo->pRes;
  pInfo->pRes = blockDataDestroy(pResBlock);
}

H
Haojun Liao 已提交
3632
void destroyBasicOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3633
  SOptrBasicInfo* pInfo = (SOptrBasicInfo*)param;
3634
  cleanupBasicInfo(pInfo);
L
Liu Jicong 已提交
3635

D
dapan1121 已提交
3636
  taosMemoryFreeClear(param);
3637
}
H
Haojun Liao 已提交
3638

H
Haojun Liao 已提交
3639 3640 3641 3642 3643 3644 3645
// Element destructor for containers that store pointers: pItem is the address of the
// stored pointer; the pointed-to memory is freed and the slot is cleared.
static void freeItem(void* pItem) {
  void** ppElem = (void**)pItem;
  if (*ppElem == NULL) {
    return;
  }

  taosMemoryFreeClear(*ppElem);
}

H
Haojun Liao 已提交
3646
void destroyAggOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3647
  SAggOperatorInfo* pInfo = (SAggOperatorInfo*)param;
L
Liu Jicong 已提交
3648 3649
  cleanupBasicInfo(&pInfo->binfo);

H
Haojun Liao 已提交
3650
  cleanupAggSup(&pInfo->aggSup);
S
shenglian zhou 已提交
3651
  cleanupExprSupp(&pInfo->scalarExprSup);
H
Haojun Liao 已提交
3652
  cleanupGroupResInfo(&pInfo->groupResInfo);
D
dapan1121 已提交
3653
  taosMemoryFreeClear(param);
3654
}
3655

3656
void destroyFillOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3657
  SFillOperatorInfo* pInfo = (SFillOperatorInfo*)param;
3658
  pInfo->pFillInfo = taosDestroyFillInfo(pInfo->pFillInfo);
H
Haojun Liao 已提交
3659
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
H
Haojun Liao 已提交
3660 3661 3662 3663 3664 3665 3666
  pInfo->pFinalRes = blockDataDestroy(pInfo->pFinalRes);

  if (pInfo->pNotFillExprInfo != NULL) {
    destroyExprInfo(pInfo->pNotFillExprInfo, pInfo->numOfNotFillExpr);
    taosMemoryFree(pInfo->pNotFillExprInfo);
  }

wafwerar's avatar
wafwerar 已提交
3667
  taosMemoryFreeClear(pInfo->p);
3668
  taosArrayDestroy(pInfo->pColMatchColInfo);
D
dapan1121 已提交
3669
  taosMemoryFreeClear(param);
3670 3671
}

H
Haojun Liao 已提交
3672
void destroyExchangeOperatorInfo(void* param, int32_t numOfOutput) {
L
Liu Jicong 已提交
3673
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3674 3675 3676
  taosRemoveRef(exchangeObjRefPool, pExInfo->self);
}

L
Liu Jicong 已提交
3677
void freeSourceDataInfo(void* p) {
3678 3679 3680 3681
  SSourceDataInfo* pInfo = (SSourceDataInfo*)p;
  taosMemoryFreeClear(pInfo->pRsp);
}

3682
void doDestroyExchangeOperatorInfo(void* param) {
X
Xiaoyu Wang 已提交
3683
  SExchangeInfo* pExInfo = (SExchangeInfo*)param;
3684

H
Haojun Liao 已提交
3685
  taosArrayDestroy(pExInfo->pSources);
3686
  taosArrayDestroyEx(pExInfo->pSourceDataInfo, freeSourceDataInfo);
3687 3688 3689 3690

  if (pExInfo->pResultBlockList != NULL) {
    taosArrayDestroyEx(pExInfo->pResultBlockList, freeBlock);
    pExInfo->pResultBlockList = NULL;
H
Haojun Liao 已提交
3691 3692
  }

3693
  blockDataDestroy(pExInfo->pDummyBlock);
L
Liu Jicong 已提交
3694

3695
  tsem_destroy(&pExInfo->ready);
D
dapan1121 已提交
3696
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
3697 3698
}

H
Haojun Liao 已提交
3699 3700 3701 3702
// Build the fill state of a fill operator.
//
// Creates the fill column descriptors from the fill / not-fill expressions, aligns
// the start key (win.skey for ascending order, win.ekey otherwise) to the first
// qualified interval window, creates pInfo->pFillInfo from it, stores the query
// window in pInfo->win (swapped for descending order) and allocates the per-column
// pointer buffer pInfo->p.
//
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when either the fill info or
// the pointer buffer could not be created. On failure both pInfo->pFillInfo and
// pInfo->p are released and reset to NULL.
static int32_t initFillInfo(SFillOperatorInfo* pInfo, SExprInfo* pExpr, int32_t numOfCols, SExprInfo* pNotFillExpr,
                            int32_t numOfNotFillCols, SNodeListNode* pValNode, STimeWindow win, int32_t capacity,
                            const char* id, SInterval* pInterval, int32_t fillType, int32_t order) {
  SFillColInfo* pColInfo = createFillColInfo(pExpr, numOfCols, pNotFillExpr, numOfNotFillCols, pValNode);

  int64_t     startKey = (order == TSDB_ORDER_ASC) ? win.skey : win.ekey;
  STimeWindow w = getAlignQueryTimeWindow(pInterval, pInterval->precision, startKey);
  w = getFirstQualifiedTimeWindow(startKey, &w, pInterval, order);

  pInfo->pFillInfo = taosCreateFillInfo(w.skey, numOfCols, numOfNotFillCols, capacity, pInterval, fillType, pColInfo,
                                        pInfo->primaryTsCol, order, id);

  if (order == TSDB_ORDER_ASC) {
    pInfo->win.skey = win.skey;
    pInfo->win.ekey = win.ekey;
  } else {
    pInfo->win.skey = win.ekey;
    pInfo->win.ekey = win.skey;
  }

  pInfo->p = taosMemoryCalloc(numOfCols, POINTER_BYTES);

  if (pInfo->pFillInfo == NULL || pInfo->p == NULL) {
    // Tear the fill info down with its own destructor (the same one
    // destroyFillOperatorInfo uses) rather than a raw free, and never leave freed
    // pointers behind in pInfo.
    if (pInfo->pFillInfo != NULL) {
      taosDestroyFillInfo(pInfo->pFillInfo);
      pInfo->pFillInfo = NULL;
    }

    taosMemoryFreeClear(pInfo->p);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  return TSDB_CODE_SUCCESS;
}

L
Liu Jicong 已提交
3729 3730
// Create the non-blocking fill operator ("FillOperator") on top of `downstream`.
//
//   downstream    input operator; its info must be an interval aggregate (or a merge
//                 aligned interval aggregate), from which the interval is taken
//   pPhyFillNode  physical plan node describing fill / not-fill expressions, fill
//                 mode, fill values, time range and input timestamp order
//   pTaskInfo     owning task; its id string is passed to the fill info
//
// Returns the new operator, or NULL on failure, in which case everything created so
// far is released and pTaskInfo->code holds the error code.
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SFillPhysiNode* pPhyFillNode,
                                      SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;

  SFillOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SFillOperatorInfo));
  SOperatorInfo*     pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    goto _error;
  }

  // Every resource is stored in pInfo / pOperator as soon as it is created, so that
  // the error path can release it without tracking extra locals.
  pInfo->pRes = createResDataBlock(pPhyFillNode->node.pOutputDataBlockDesc);
  SExprInfo* pExprInfo = createExprInfo(pPhyFillNode->pFillExprs, NULL, &pInfo->numOfExpr);
  pInfo->pNotFillExprInfo = createExprInfo(pPhyFillNode->pNotFillExprs, NULL, &pInfo->numOfNotFillExpr);

  SInterval* pInterval =
      QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == downstream->operatorType
          ? &((SMergeAlignedIntervalAggOperatorInfo*)downstream->info)->intervalAggOperatorInfo->interval
          : &((SIntervalAggOperatorInfo*)downstream->info)->interval;

  int32_t order = (pPhyFillNode->inputTsOrder == ORDER_ASC) ? TSDB_ORDER_ASC : TSDB_ORDER_DESC;
  int32_t type = convertFillType(pPhyFillNode->mode);

  SResultInfo* pResultInfo = &pOperator->resultInfo;
  initResultSizeInfo(pResultInfo, 4096);
  blockDataEnsureCapacity(pInfo->pRes, pResultInfo->capacity);

  // initExprSupp stores pExprInfo in pOperator->exprSupp before it can fail, so
  // cleanupExprSupp() on the error path releases it as well.
  code = initExprSupp(&pOperator->exprSupp, pExprInfo, pInfo->numOfExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  pInfo->primaryTsCol = ((STargetNode*)pPhyFillNode->pWStartTs)->slotId;
  pInfo->primarySrcSlotId = ((SColumnNode*)((STargetNode*)pPhyFillNode->pWStartTs)->pExpr)->slotId;

  int32_t numOfOutputCols = 0;
  pInfo->pColMatchColInfo = extractColMatchInfo(pPhyFillNode->pFillExprs, pPhyFillNode->node.pOutputDataBlockDesc,
                                                &numOfOutputCols, COL_MATCH_FROM_SLOT_ID);

  code = initFillInfo(pInfo, pExprInfo, pInfo->numOfExpr, pInfo->pNotFillExprInfo, pInfo->numOfNotFillExpr,
                      (SNodeListNode*)pPhyFillNode->pValues, pPhyFillNode->timeRange, pResultInfo->capacity,
                      pTaskInfo->id.str, pInterval, type, order);
  if (code != TSDB_CODE_SUCCESS) {
    // initFillInfo releases pFillInfo and p itself when it fails; make sure the
    // destructor below does not free them a second time.
    pInfo->pFillInfo = NULL;
    pInfo->p = NULL;
    goto _error;
  }

  pInfo->pFinalRes = createOneDataBlock(pInfo->pRes, false);
  blockDataEnsureCapacity(pInfo->pFinalRes, pResultInfo->capacity);

  pInfo->pCondition = pPhyFillNode->node.pConditions;
  pOperator->name = "FillOperator";
  pOperator->blocking = false;
  pOperator->status = OP_NOT_OPENED;
  pOperator->operatorType = QUERY_NODE_PHYSICAL_PLAN_FILL;
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->exprSupp.numOfExprs = pInfo->numOfExpr;
  pOperator->info = pInfo;
  pOperator->pTaskInfo = pTaskInfo;

  pOperator->fpSet =
      createOperatorFpSet(operatorDummyOpenFn, doFill, NULL, NULL, destroyFillOperatorInfo, NULL, NULL, NULL);

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  // NOTE(review): relies on taosDestroyFillInfo / blockDataDestroy / taosArrayDestroy
  // accepting NULL, since pInfo may be only partially populated here; confirm.
  if (pInfo != NULL) {
    destroyFillOperatorInfo(pInfo, 0);  // also frees pInfo itself
  }

  if (pOperator != NULL) {
    cleanupExprSupp(&pOperator->exprSupp);
  }

  taosMemoryFreeClear(pOperator);
  pTaskInfo->code = code;
  return NULL;
}

D
dapan1121 已提交
3795
// Allocate and initialise an execution task descriptor.
//
// The task starts in TASK_NOT_COMPLETED state, records its creation time, query id,
// execution model and a copy of dbFName, and gets an id string of the form
// "TID:0x<taskId> QID:0x<queryId>" used for logging.
//
// Returns NULL (with terrno set to TSDB_CODE_OUT_OF_MEMORY) if the descriptor or its
// id string cannot be allocated.
static SExecTaskInfo* createExecTaskInfo(uint64_t queryId, uint64_t taskId, EOPTR_EXEC_MODEL model, char* dbFName) {
  enum { TASK_ID_STR_LEN = 128 };

  SExecTaskInfo* pTaskInfo = taosMemoryCalloc(1, sizeof(SExecTaskInfo));
  if (pTaskInfo == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // allocate the id string first, so a failure here leaves nothing else to undo
  char* p = taosMemoryCalloc(1, TASK_ID_STR_LEN);
  if (p == NULL) {
    taosMemoryFree(pTaskInfo);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);

  pTaskInfo->schemaInfo.dbname = strdup(dbFName);
  pTaskInfo->cost.created = taosGetTimestampMs();
  pTaskInfo->id.queryId = queryId;
  pTaskInfo->execModel = model;

  snprintf(p, TASK_ID_STR_LEN, "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, queryId);
  pTaskInfo->id.str = p;

  return pTaskInfo;
}
H
Haojun Liao 已提交
3810

H
Haojun Liao 已提交
3811
static SArray* extractColumnInfo(SNodeList* pNodeList);
3812

H
Haojun Liao 已提交
3813 3814
SSchemaWrapper* extractQueriedColumnSchema(SScanPhysiNode* pScanNode);

3815
// Fill pTaskInfo->schemaInfo for the table scanned by pScanNode.
//
// Looks the table up by uid in the meta store, copies its name, clones the row
// schema (for a child table the schema of its super table is used, which needs a
// second lookup by suid), and finally builds the schema of the queried columns.
//
// Returns TSDB_CODE_SUCCESS, or terrno when a meta lookup fails.
int32_t extractTableSchemaInfo(SReadHandle* pHandle, SScanPhysiNode* pScanNode, SExecTaskInfo* pTaskInfo) {
  SMetaReader mr = {0};
  metaReaderInit(&mr, pHandle->meta, 0);
  int32_t code = metaGetTableEntryByUid(&mr, pScanNode->uid);
  if (code != TSDB_CODE_SUCCESS) {
    qError("failed to get the table meta, uid:0x%" PRIx64 ", suid:0x%" PRIx64 ", %s", pScanNode->uid, pScanNode->suid,
           GET_TASKID(pTaskInfo));

    metaReaderClear(&mr);
    return terrno;
  }

  SSchemaInfo* pSchemaInfo = &pTaskInfo->schemaInfo;
  pSchemaInfo->tablename = strdup(mr.me.name);

  if (mr.me.type == TSDB_SUPER_TABLE) {
    pSchemaInfo->sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pSchemaInfo->tversion = mr.me.stbEntry.schemaTag.version;
  } else if (mr.me.type == TSDB_CHILD_TABLE) {
    tDecoderClear(&mr.coder);

    // a child table carries no row schema of its own: load the super table entry
    tb_uid_t suid = mr.me.ctbEntry.suid;
    code = metaGetTableEntryByUid(&mr, suid);
    if (code != TSDB_CODE_SUCCESS) {
      // without this check the schema would be cloned from a stale/invalid entry
      qError("failed to get the super table meta, suid:0x%" PRIx64 ", %s", suid, GET_TASKID(pTaskInfo));

      metaReaderClear(&mr);
      return terrno;
    }

    pSchemaInfo->sw = tCloneSSchemaWrapper(&mr.me.stbEntry.schemaRow);
    pSchemaInfo->tversion = mr.me.stbEntry.schemaTag.version;
  } else {
    pSchemaInfo->sw = tCloneSSchemaWrapper(&mr.me.ntbEntry.schemaRow);
  }

  metaReaderClear(&mr);

  pSchemaInfo->qsw = extractQueriedColumnSchema(pScanNode);
  return TSDB_CODE_SUCCESS;
}

SSchemaWrapper* extractQueriedColumnSchema(SScanPhysiNode* pScanNode) {
3851 3852 3853
  int32_t numOfCols = LIST_LENGTH(pScanNode->pScanCols);
  int32_t numOfTags = LIST_LENGTH(pScanNode->pScanPseudoCols);

3854
  SSchemaWrapper* pqSw = taosMemoryCalloc(1, sizeof(SSchemaWrapper));
3855
  pqSw->pSchema = taosMemoryCalloc(numOfCols + numOfTags, sizeof(SSchema));
3856

L
Liu Jicong 已提交
3857
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
3858
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pScanNode->pScanCols, i);
3859 3860
    SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

H
Haojun Liao 已提交
3861 3862 3863 3864 3865
    SSchema* pSchema = &pqSw->pSchema[pqSw->nCols++];
    pSchema->colId = pColNode->colId;
    pSchema->type = pColNode->node.resType.type;
    pSchema->type = pColNode->node.resType.bytes;
    strncpy(pSchema->name, pColNode->colName, tListLen(pSchema->name));
3866 3867
  }

3868
  // this the tags and pseudo function columns, we only keep the tag columns
3869
  for (int32_t i = 0; i < numOfTags; ++i) {
3870 3871 3872 3873 3874 3875 3876 3877 3878 3879 3880 3881 3882 3883
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pScanNode->pScanPseudoCols, i);

    int32_t type = nodeType(pNode->pExpr);
    if (type == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

      SSchema* pSchema = &pqSw->pSchema[pqSw->nCols++];
      pSchema->colId = pColNode->colId;
      pSchema->type = pColNode->node.resType.type;
      pSchema->type = pColNode->node.resType.bytes;
      strncpy(pSchema->name, pColNode->colName, tListLen(pSchema->name));
    }
  }

H
Haojun Liao 已提交
3884
  return pqSw;
3885 3886
}

3887 3888
// Release the strings and schema wrappers held by a task's schema info.
static void cleanupTableSchemaInfo(SSchemaInfo* pSchemaInfo) {
  // names
  taosMemoryFreeClear(pSchemaInfo->dbname);
  taosMemoryFreeClear(pSchemaInfo->tablename);

  // full table schema and queried-column schema
  tDeleteSSchemaWrapper(pSchemaInfo->sw);
  tDeleteSSchemaWrapper(pSchemaInfo->qsw);
}

wmmhello's avatar
wmmhello 已提交
3894
// Rebuild pTableListInfo->pGroupList so that tables are bucketed by group id, with
// the buckets ordered by ascending group id.
//
// `sortSupport` is a sorted array of the group ids seen so far; its positions mirror
// those of pGroupList, so the index found in one is the index of the bucket in the
// other. Group ids are looked up in pTableListInfo->map by table uid.
//
// Returns TDB_CODE_SUCCESS, TSDB_CODE_OUT_OF_MEMORY when an array cannot be created,
// or TSDB_CODE_QRY_APP_ERROR when an array operation fails or a table has no group id.
static int32_t sortTableGroup(STableListInfo* pTableListInfo) {
  taosArrayClear(pTableListInfo->pGroupList);
  SArray* sortSupport = taosArrayInit(16, sizeof(uint64_t));
  if (sortSupport == NULL) return TSDB_CODE_OUT_OF_MEMORY;

  int32_t code = TDB_CODE_SUCCESS;

  for (int32_t i = 0; i < taosArrayGetSize(pTableListInfo->pTableList); i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);
    uint64_t*      groupId = taosHashGet(pTableListInfo->map, &info->uid, sizeof(uint64_t));
    if (groupId == NULL) {
      // the comparator below dereferences the key, so a missing entry must stop here
      qError("no group id found for table uid:%" PRIu64, (uint64_t)info->uid);
      code = TSDB_CODE_QRY_APP_ERROR;
      break;
    }

    int32_t index = taosArraySearchIdx(sortSupport, groupId, compareUint64Val, TD_EQ);
    if (index != -1) {
      // known group: append the table to its existing bucket
      SArray* tGroup = (SArray*)taosArrayGetP(pTableListInfo->pGroupList, index);
      if (taosArrayPush(tGroup, info) == NULL) {
        qError("taos push uid array error");
        code = TSDB_CODE_QRY_APP_ERROR;
        break;
      }
      continue;
    }

    // new group: find the first larger group id to keep both arrays sorted
    void*   p = taosArraySearch(sortSupport, groupId, compareUint64Val, TD_GT);
    SArray* tGroup = taosArrayInit(8, sizeof(STableKeyInfo));
    if (tGroup == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      break;
    }

    // Until tGroup has been stored in pGroupList it is owned here and must be
    // destroyed on every failure path.
    if (taosArrayPush(tGroup, info) == NULL) {
      qError("taos push info array error");
      taosArrayDestroy(tGroup);
      code = TSDB_CODE_QRY_APP_ERROR;
      break;
    }

    if (p == NULL) {
      // largest group id so far: append at the end
      if (taosArrayPush(sortSupport, groupId) == NULL) {
        qError("taos push support array error");
        taosArrayDestroy(tGroup);
        code = TSDB_CODE_QRY_APP_ERROR;
        break;
      }
      if (taosArrayPush(pTableListInfo->pGroupList, &tGroup) == NULL) {
        qError("taos push group array error");
        taosArrayDestroy(tGroup);
        code = TSDB_CODE_QRY_APP_ERROR;
        break;
      }
    } else {
      // insert in front of the first larger group id
      int32_t pos = TARRAY_ELEM_IDX(sortSupport, p);
      if (taosArrayInsert(sortSupport, pos, groupId) == NULL) {
        qError("taos insert support array error");
        taosArrayDestroy(tGroup);
        code = TSDB_CODE_QRY_APP_ERROR;
        break;
      }
      if (taosArrayInsert(pTableListInfo->pGroupList, pos, &tGroup) == NULL) {
        qError("taos insert group array error");
        taosArrayDestroy(tGroup);
        code = TSDB_CODE_QRY_APP_ERROR;
        break;
      }
    }
  }

  taosArrayDestroy(sortSupport);
  return code;
}

3952
// Tell whether the first entry of the group list is the function "tbname", i.e. the
// query is "partition by tbname" / "group by tbname". An empty list yields false.
bool groupbyTbname(SNodeList* pGroupList) {
  if (LIST_LENGTH(pGroupList) <= 0) {
    return false;
  }

  SNode* pFirst = nodesListGetNode(pGroupList, 0);
  if (pFirst->type != QUERY_NODE_FUNCTION) {
    return false;
  }

  const char* funcName = ((struct SFunctionNode*)pFirst)->functionName;
  return strcmp(funcName, "tbname") == 0;
}

wmmhello's avatar
wmmhello 已提交
3965 3966
// Assign a group id to every table of pTableListInfo and record it in
// pTableListInfo->map (table uid -> group id).
//
// Nothing is done when `group` is NULL. When grouping by tbname each table forms its
// own group and its uid is used as the group id; otherwise the ids are produced by
// getColInfoResultForGroupby(). If needSortTableByGroupId is set, the tables are then
// bucketed by group id via sortTableGroup().
int32_t generateGroupIdMap(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group) {
  if (group == NULL) {
    return TDB_CODE_SUCCESS;
  }

  pTableListInfo->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pTableListInfo->map == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  if (!groupbyTbname(group)) {
    int32_t code = getColInfoResultForGroupby(pHandle->meta, group, pTableListInfo);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }
  } else {
    size_t numOfTables = taosArrayGetSize(pTableListInfo->pTableList);

    for (int32_t i = 0; i < numOfTables; i++) {
      STableKeyInfo* pKey = taosArrayGet(pTableListInfo->pTableList, i);
      pKey->groupId = pKey->uid;
      taosHashPut(pTableListInfo->map, &(pKey->uid), sizeof(uint64_t), &pKey->groupId, sizeof(uint64_t));
    }
  }

  return pTableListInfo->needSortTableByGroupId ? sortTableGroup(pTableListInfo) : TDB_CODE_SUCCESS;
}

3999 4000 4001 4002 4003 4004 4005 4006 4007 4008 4009 4010 4011 4012 4013 4014 4015
// Initialise a table-data query condition for the block-distribution scan: ascending
// order, a single timestamp column with column id 1, the full time range, and no
// version limits (start/end version are -1). `uid` is stored as the condition's suid.
//
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_OUT_OF_MEMORY (also stored in terrno)
// when the column list cannot be allocated.
static int32_t initTableblockDistQueryCond(uint64_t uid, SQueryTableDataCond* pCond) {
  memset(pCond, 0, sizeof(SQueryTableDataCond));

  pCond->order = TSDB_ORDER_ASC;
  pCond->numOfCols = 1;
  pCond->colList = taosMemoryCalloc(1, sizeof(SColumnInfo));
  if (pCond->colList == NULL) {
    terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return terrno;
  }

  // the only column requested is the timestamp column
  pCond->colList[0].colId = 1;
  pCond->colList[0].type = TSDB_DATA_TYPE_TIMESTAMP;
  pCond->colList[0].bytes = sizeof(TSKEY);

  pCond->suid = uid;
  pCond->type = TIMEWINDOW_RANGE_CONTAINED;
  pCond->twindows = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};
  pCond->startVersion = -1;
  pCond->endVersion = -1;

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4023
SOperatorInfo* createOperatorTree(SPhysiNode* pPhyNode, SExecTaskInfo* pTaskInfo, SReadHandle* pHandle,
L
Liu Jicong 已提交
4024 4025
                                  STableListInfo* pTableListInfo, SNode* pTagCond, SNode* pTagIndexCond,
                                  const char* pUser) {
4026 4027
  int32_t type = nodeType(pPhyNode);

X
Xiaoyu Wang 已提交
4028
  if (pPhyNode->pChildren == NULL || LIST_LENGTH(pPhyNode->pChildren) == 0) {
4029
    SOperatorInfo* pOperator = NULL;
H
Haojun Liao 已提交
4030
    if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN == type) {
dengyihao's avatar
dengyihao 已提交
4031
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4032

L
Liu Jicong 已提交
4033 4034 4035
      int32_t code =
          createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags, pTableScanNode->groupSort, pHandle,
                                  pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
4036
      if (code) {
wmmhello's avatar
wmmhello 已提交
4037
        pTaskInfo->code = code;
4038
        qError("failed to createScanTableListInfo, code: %s", tstrerror(code));
D
dapan1121 已提交
4039 4040
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4041

4042
      code = extractTableSchemaInfo(pHandle, &pTableScanNode->scan, pTaskInfo);
S
slzhou 已提交
4043
      if (code) {
4044
        pTaskInfo->code = terrno;
wmmhello's avatar
wmmhello 已提交
4045 4046 4047
        return NULL;
      }

4048
      pOperator = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo);
4049 4050
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
S
slzhou 已提交
4051 4052
    } else if (QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN == type) {
      STableMergeScanPhysiNode* pTableScanNode = (STableMergeScanPhysiNode*)pPhyNode;
L
Liu Jicong 已提交
4053 4054 4055
      int32_t                   code =
          createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags, pTableScanNode->groupSort, pHandle,
                                  pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
L
Liu Jicong 已提交
4056
      if (code) {
wmmhello's avatar
wmmhello 已提交
4057
        pTaskInfo->code = code;
4058
        qError("failed to createScanTableListInfo, code: %s", tstrerror(code));
wmmhello's avatar
wmmhello 已提交
4059 4060
        return NULL;
      }
4061

4062
      code = extractTableSchemaInfo(pHandle, &pTableScanNode->scan, pTaskInfo);
wmmhello's avatar
wmmhello 已提交
4063 4064 4065 4066
      if (code) {
        pTaskInfo->code = terrno;
        return NULL;
      }
wmmhello's avatar
wmmhello 已提交
4067

4068
      pOperator = createTableMergeScanOperatorInfo(pTableScanNode, pTableListInfo, pHandle, pTaskInfo);
wmmhello's avatar
wmmhello 已提交
4069

4070 4071
      STableScanInfo* pScanInfo = pOperator->info;
      pTaskInfo->cost.pRecoder = &pScanInfo->readRecorder;
H
Haojun Liao 已提交
4072
    } else if (QUERY_NODE_PHYSICAL_PLAN_EXCHANGE == type) {
4073
      pOperator = createExchangeOperatorInfo(pHandle->pMsgCb->clientRpc, (SExchangePhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4074
    } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN == type) {
5
54liuyao 已提交
4075
      STableScanPhysiNode* pTableScanNode = (STableScanPhysiNode*)pPhyNode;
5
54liuyao 已提交
4076
      if (pHandle->vnode) {
L
Liu Jicong 已提交
4077 4078 4079
        int32_t code =
            createScanTableListInfo(&pTableScanNode->scan, pTableScanNode->pGroupTags, pTableScanNode->groupSort,
                                    pHandle, pTableListInfo, pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
L
Liu Jicong 已提交
4080
        if (code) {
wmmhello's avatar
wmmhello 已提交
4081
          pTaskInfo->code = code;
4082
          qError("failed to createScanTableListInfo, code: %s", tstrerror(code));
wmmhello's avatar
wmmhello 已提交
4083 4084
          return NULL;
        }
L
Liu Jicong 已提交
4085 4086 4087 4088 4089

#ifndef NDEBUG
        int32_t sz = taosArrayGetSize(pTableListInfo->pTableList);
        for (int32_t i = 0; i < sz; i++) {
          STableKeyInfo* pKeyInfo = taosArrayGet(pTableListInfo->pTableList, i);
S
Shengliang Guan 已提交
4090
          qDebug("creating stream task: add table %" PRId64, pKeyInfo->uid);
L
Liu Jicong 已提交
4091
        }
5
54liuyao 已提交
4092
      }
L
Liu Jicong 已提交
4093
#endif
4094

H
Haojun Liao 已提交
4095
      pTaskInfo->schemaInfo.qsw = extractQueriedColumnSchema(&pTableScanNode->scan);
4096
      pOperator = createStreamScanOperatorInfo(pHandle, pTableScanNode, pTagCond, pTaskInfo);
H
Haojun Liao 已提交
4097
    } else if (QUERY_NODE_PHYSICAL_PLAN_SYSTABLE_SCAN == type) {
L
Liu Jicong 已提交
4098
      SSystemTableScanPhysiNode* pSysScanPhyNode = (SSystemTableScanPhysiNode*)pPhyNode;
4099
      pOperator = createSysTableScanOperatorInfo(pHandle, pSysScanPhyNode, pUser, pTaskInfo);
4100
    } else if (QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN == type) {
X
Xiaoyu Wang 已提交
4101
      STagScanPhysiNode* pScanPhyNode = (STagScanPhysiNode*)pPhyNode;
4102
      int32_t code = getTableList(pHandle->meta, pHandle->vnode, pScanPhyNode, pTagCond, pTagIndexCond, pTableListInfo);
4103
      if (code != TSDB_CODE_SUCCESS) {
4104
        pTaskInfo->code = terrno;
4105
        qError("failed to getTableList, code: %s", tstrerror(code));
4106 4107 4108
        return NULL;
      }

4109
      pOperator = createTagScanOperatorInfo(pHandle, pScanPhyNode, pTableListInfo, pTaskInfo);
4110
    } else if (QUERY_NODE_PHYSICAL_PLAN_BLOCK_DIST_SCAN == type) {
4111
      SBlockDistScanPhysiNode* pBlockNode = (SBlockDistScanPhysiNode*)pPhyNode;
4112 4113 4114
      pTableListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));

      if (pBlockNode->tableType == TSDB_SUPER_TABLE) {
4115
        int32_t code = vnodeGetAllTableList(pHandle->vnode, pBlockNode->uid, pTableListInfo->pTableList);
4116 4117 4118 4119 4120
        if (code != TSDB_CODE_SUCCESS) {
          pTaskInfo->code = terrno;
          return NULL;
        }
      } else {  // Create one table group.
4121
        STableKeyInfo info = {.uid = pBlockNode->uid, .groupId = 0};
4122 4123 4124 4125
        taosArrayPush(pTableListInfo->pTableList, &info);
      }

      SQueryTableDataCond cond = {0};
L
Liu Jicong 已提交
4126
      int32_t             code = initTableblockDistQueryCond(pBlockNode->suid, &cond);
4127 4128
      if (code != TSDB_CODE_SUCCESS) {
        return NULL;
4129
      }
H
Haojun Liao 已提交
4130 4131 4132

      STsdbReader* pReader = NULL;
      tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, "");
4133 4134
      cleanupQueryTableDataCond(&cond);

4135
      pOperator = createDataBlockInfoScanOperator(pReader, pHandle, cond.suid, pBlockNode, pTaskInfo);
H
Haojun Liao 已提交
4136 4137 4138
    } else if (QUERY_NODE_PHYSICAL_PLAN_LAST_ROW_SCAN == type) {
      SLastRowScanPhysiNode* pScanNode = (SLastRowScanPhysiNode*)pPhyNode;

L
Liu Jicong 已提交
4139 4140
      int32_t code = createScanTableListInfo(&pScanNode->scan, pScanNode->pGroupTags, true, pHandle, pTableListInfo,
                                             pTagCond, pTagIndexCond, GET_TASKID(pTaskInfo));
4141 4142 4143 4144
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
      }
4145

4146
      code = extractTableSchemaInfo(pHandle, &pScanNode->scan, pTaskInfo);
4147 4148 4149
      if (code != TSDB_CODE_SUCCESS) {
        pTaskInfo->code = code;
        return NULL;
H
Haojun Liao 已提交
4150 4151
      }

4152
      pOperator = createLastrowScanOperator(pScanNode, pHandle, pTaskInfo);
4153
    } else if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
4154
      pOperator = createProjectOperatorInfo(NULL, (SProjectPhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4155 4156
    } else {
      ASSERT(0);
H
Haojun Liao 已提交
4157
    }
4158 4159 4160 4161 4162

    if (pOperator != NULL) {
      pOperator->resultDataBlockId = pPhyNode->pOutputDataBlockDesc->dataBlockId;
    }

4163
    return pOperator;
H
Haojun Liao 已提交
4164 4165
  }

4166 4167
  int32_t num = 0;
  size_t  size = LIST_LENGTH(pPhyNode->pChildren);
H
Haojun Liao 已提交
4168

4169
  SOperatorInfo** ops = taosMemoryCalloc(size, POINTER_BYTES);
dengyihao's avatar
dengyihao 已提交
4170
  for (int32_t i = 0; i < size; ++i) {
4171
    SPhysiNode* pChildNode = (SPhysiNode*)nodesListGetNode(pPhyNode->pChildren, i);
4172
    ops[i] = createOperatorTree(pChildNode, pTaskInfo, pHandle, pTableListInfo, pTagCond, pTagIndexCond, pUser);
4173
    if (ops[i] == NULL) {
H
Haojun Liao 已提交
4174
      taosMemoryFree(ops);
4175
      return NULL;
4176 4177
    } else {
      ops[i]->resultDataBlockId = pChildNode->pOutputDataBlockDesc->dataBlockId;
4178
    }
4179
  }
H
Haojun Liao 已提交
4180

4181
  SOperatorInfo* pOptr = NULL;
H
Haojun Liao 已提交
4182
  if (QUERY_NODE_PHYSICAL_PLAN_PROJECT == type) {
4183
    pOptr = createProjectOperatorInfo(ops[0], (SProjectPhysiNode*)pPhyNode, pTaskInfo);
4184
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_AGG == type) {
H
Haojun Liao 已提交
4185 4186
    SAggPhysiNode* pAggNode = (SAggPhysiNode*)pPhyNode;
    SExprInfo*     pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
4187
    SSDataBlock*   pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4188

dengyihao's avatar
dengyihao 已提交
4189
    int32_t    numOfScalarExpr = 0;
4190 4191 4192 4193 4194
    SExprInfo* pScalarExprInfo = NULL;
    if (pAggNode->pExprs != NULL) {
      pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
    }

H
Haojun Liao 已提交
4195 4196
    if (pAggNode->pGroupKeys != NULL) {
      SArray* pColList = extractColumnInfo(pAggNode->pGroupKeys);
dengyihao's avatar
dengyihao 已提交
4197
      pOptr = createGroupOperatorInfo(ops[0], pExprInfo, num, pResBlock, pColList, pAggNode->node.pConditions,
wmmhello's avatar
wmmhello 已提交
4198
                                      pScalarExprInfo, numOfScalarExpr, pTaskInfo);
H
Haojun Liao 已提交
4199
    } else {
L
Liu Jicong 已提交
4200
      pOptr = createAggregateOperatorInfo(ops[0], pExprInfo, num, pResBlock, pAggNode->node.pConditions,
4201
                                          pScalarExprInfo, numOfScalarExpr, pAggNode->mergeDataBlock, pTaskInfo);
H
Haojun Liao 已提交
4202
    }
X
Xiaoyu Wang 已提交
4203
  } else if (QUERY_NODE_PHYSICAL_PLAN_HASH_INTERVAL == type || QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type) {
H
Haojun Liao 已提交
4204
    SIntervalPhysiNode* pIntervalPhyNode = (SIntervalPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4205

H
Haojun Liao 已提交
4206
    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
4207
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
H
Haojun Liao 已提交
4208

dengyihao's avatar
dengyihao 已提交
4209 4210 4211 4212 4213 4214
    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
H
Haojun Liao 已提交
4215

X
Xiaoyu Wang 已提交
4216 4217 4218 4219 4220
    STimeWindowAggSupp as = {
        .waterMark = pIntervalPhyNode->window.watermark,
        .calTrigger = pIntervalPhyNode->window.triggerType,
        .maxTs = INT64_MIN,
    };
4221
    ASSERT(as.calTrigger != STREAM_TRIGGER_MAX_DELAY);
4222

4223
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4224
    bool    isStream = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == type);
4225 4226
    pOptr = createIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId, &as, pIntervalPhyNode,
                                       pTaskInfo, isStream);
4227

4228 4229
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_ALIGNED_INTERVAL == type) {
    SMergeAlignedIntervalPhysiNode* pIntervalPhyNode = (SMergeAlignedIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4230 4231 4232 4233 4234 4235 4236 4237 4238 4239

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4240

S
shenglian zhou 已提交
4241
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
L
Liu Jicong 已提交
4242
    pOptr = createMergeAlignedIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId,
dengyihao's avatar
dengyihao 已提交
4243 4244
                                                   pPhyNode->pConditions, pIntervalPhyNode->window.mergeDataBlock,
                                                   pTaskInfo);
S
shenglian zhou 已提交
4245
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_INTERVAL == type) {
X
Xiaoyu Wang 已提交
4246
    SMergeIntervalPhysiNode* pIntervalPhyNode = (SMergeIntervalPhysiNode*)pPhyNode;
S
shenglian zhou 已提交
4247 4248 4249 4250 4251 4252 4253 4254 4255 4256

    SExprInfo*   pExprInfo = createExprInfo(pIntervalPhyNode->window.pFuncs, NULL, &num);
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);

    SInterval interval = {.interval = pIntervalPhyNode->interval,
                          .sliding = pIntervalPhyNode->sliding,
                          .intervalUnit = pIntervalPhyNode->intervalUnit,
                          .slidingUnit = pIntervalPhyNode->slidingUnit,
                          .offset = pIntervalPhyNode->offset,
                          .precision = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->node.resType.precision};
4257

S
shenglian zhou 已提交
4258
    int32_t tsSlotId = ((SColumnNode*)pIntervalPhyNode->window.pTspk)->slotId;
dengyihao's avatar
dengyihao 已提交
4259 4260
    pOptr = createMergeIntervalOperatorInfo(ops[0], pExprInfo, num, pResBlock, &interval, tsSlotId,
                                            pIntervalPhyNode->window.mergeDataBlock, pTaskInfo);
5
54liuyao 已提交
4261
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL == type) {
4262
    int32_t children = 0;
5
54liuyao 已提交
4263 4264
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL == type) {
5
54liuyao 已提交
4265
    int32_t children = pHandle->numOfVgroups;
5
54liuyao 已提交
4266
    pOptr = createStreamFinalIntervalOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4267
  } else if (QUERY_NODE_PHYSICAL_PLAN_SORT == type) {
4268
    pOptr = createSortOperatorInfo(ops[0], (SSortPhysiNode*)pPhyNode, pTaskInfo);
S
shenglian zhou 已提交
4269 4270
  } else if (QUERY_NODE_PHYSICAL_PLAN_GROUP_SORT == type) {
    pOptr = createGroupSortOperatorInfo(ops[0], (SGroupSortPhysiNode*)pPhyNode, pTaskInfo);
X
Xiaoyu Wang 已提交
4271
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE == type) {
4272
    SMergePhysiNode* pMergePhyNode = (SMergePhysiNode*)pPhyNode;
4273
    pOptr = createMultiwayMergeOperatorInfo(ops, size, pMergePhyNode, pTaskInfo);
4274
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_SESSION == type) {
H
Haojun Liao 已提交
4275
    SSessionWinodwPhysiNode* pSessionNode = (SSessionWinodwPhysiNode*)pPhyNode;
H
Haojun Liao 已提交
4276
    pOptr = createSessionAggOperatorInfo(ops[0], pSessionNode, pTaskInfo);
4277
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == type) {
4278 4279 4280 4281 4282
    pOptr = createStreamSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_SESSION == type) {
    int32_t children = 0;
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_SESSION == type) {
4283
    int32_t children = pHandle->numOfVgroups;
4284
    pOptr = createStreamFinalSessionAggOperatorInfo(ops[0], pPhyNode, pTaskInfo, children);
H
Haojun Liao 已提交
4285
  } else if (QUERY_NODE_PHYSICAL_PLAN_PARTITION == type) {
4286
    pOptr = createPartitionOperatorInfo(ops[0], (SPartitionPhysiNode*)pPhyNode, pTaskInfo);
4287
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_STATE == type) {
dengyihao's avatar
dengyihao 已提交
4288
    SStateWinodwPhysiNode* pStateNode = (SStateWinodwPhysiNode*)pPhyNode;
4289

4290 4291
    STimeWindowAggSupp as = {.waterMark = pStateNode->window.watermark, .calTrigger = pStateNode->window.triggerType};

dengyihao's avatar
dengyihao 已提交
4292
    SExprInfo*   pExprInfo = createExprInfo(pStateNode->window.pFuncs, NULL, &num);
4293
    SSDataBlock* pResBlock = createResDataBlock(pPhyNode->pOutputDataBlockDesc);
4294 4295
    int32_t      tsSlotId = ((SColumnNode*)pStateNode->window.pTspk)->slotId;

4296
    SColumnNode* pColNode = (SColumnNode*)((STargetNode*)pStateNode->pStateKey)->pExpr;
X
Xiaoyu Wang 已提交
4297
    SColumn      col = extractColumnFromColumnNode(pColNode);
L
Liu Jicong 已提交
4298 4299
    pOptr = createStatewindowOperatorInfo(ops[0], pExprInfo, num, pResBlock, &as, tsSlotId, &col, pPhyNode->pConditions,
                                          pTaskInfo);
4300
  } else if (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == type) {
5
54liuyao 已提交
4301
    pOptr = createStreamStateAggOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4302
  } else if (QUERY_NODE_PHYSICAL_PLAN_MERGE_JOIN == type) {
4303
    pOptr = createMergeJoinOperatorInfo(ops, size, (SSortMergeJoinPhysiNode*)pPhyNode, pTaskInfo);
4304
  } else if (QUERY_NODE_PHYSICAL_PLAN_FILL == type) {
H
Haojun Liao 已提交
4305
    pOptr = createFillOperatorInfo(ops[0], (SFillPhysiNode*)pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4306 4307
  } else if (QUERY_NODE_PHYSICAL_PLAN_INDEF_ROWS_FUNC == type) {
    pOptr = createIndefinitOutputOperatorInfo(ops[0], pPhyNode, pTaskInfo);
4308 4309
  } else if (QUERY_NODE_PHYSICAL_PLAN_INTERP_FUNC == type) {
    pOptr = createTimeSliceOperatorInfo(ops[0], pPhyNode, pTaskInfo);
H
Haojun Liao 已提交
4310 4311
  } else {
    ASSERT(0);
H
Haojun Liao 已提交
4312
  }
4313
  taosMemoryFree(ops);
dengyihao's avatar
dengyihao 已提交
4314
  if (pOptr) pOptr->resultDataBlockId = pPhyNode->pOutputDataBlockDesc->dataBlockId;
4315
  return pOptr;
4316
}
H
Haojun Liao 已提交
4317

H
Haojun Liao 已提交
4318
/**
 * Build an array of SColumn descriptors from a list of target nodes.
 *
 * Only targets whose expression is a column reference (QUERY_NODE_COLUMN) or a
 * constant value (QUERY_NODE_VALUE) produce an entry; any other expression kind
 * is skipped without an error.
 *
 * @param pNodeList list whose items are read as STargetNode
 * @return a new SArray of SColumn, or NULL with terrno set to
 *         TSDB_CODE_OUT_OF_MEMORY when the array cannot be created
 */
SArray* extractColumnInfo(SNodeList* pNodeList) {
  size_t  numOfCols = LIST_LENGTH(pNodeList);
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);

    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

      SColumn c = extractColumnFromColumnNode(pColNode);
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};

      // A constant has no real column id, so the output slot id is used for both.
      c.slotId = pNode->slotId;
      c.colId = pNode->slotId;

      // Take the data type from resType, like bytes/scale/precision below.
      // node.type holds the node kind (QUERY_NODE_VALUE), not a data type.
      c.type = pValNode->node.resType.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
  }

  return pList;
}

4351
#if 0
/**
 * Disabled helper: resolve the table list for a table scan node and open a
 * tsdb reader on it.
 *
 * @return the opened reader, or NULL with terrno set to the failure code.
 *         NULL with terrno == 0 means no table qualified for the query.
 */
STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle* pHandle,
                                STableListInfo* pTableListInfo, const char* idstr) {
  int32_t code = getTableList(pHandle->meta, pHandle->vnode, &pTableScanNode->scan, pTableListInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  if (taosArrayGetSize(pTableListInfo->pTableList) == 0) {
    code = 0;
    qDebug("no table qualified for query, %s", idstr);
    goto _error;
  }

  SQueryTableDataCond cond = {0};
  code = initQueryTableDataCond(&cond, pTableScanNode);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  STsdbReader* pReader = NULL;
  code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo->pTableList, &pReader, idstr);

  // The condition is only needed while opening the reader; release it on both
  // the success and the failure path so it is not leaked when the open fails.
  cleanupQueryTableDataCond(&cond);

  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pReader;

_error:
  terrno = code;
  return NULL;
}
#endif
H
Haojun Liao 已提交
4386

L
Liu Jicong 已提交
4387 4388 4389 4390 4391 4392 4393 4394 4395 4396 4397 4398 4399
/**
 * Walk down a single-child operator chain until a stream scan operator is
 * reached and hand back the info of the table scan operator it wraps.
 *
 * @param pOperator root of the operator chain to search
 * @param ppInfo    receives the table scan info on success
 * @return 0 on success; TSDB_CODE_QRY_APP_ERROR when the chain ends without a
 *         stream scan or when an operator has more than one downstream
 */
static int32_t extractTbscanInStreamOpTree(SOperatorInfo* pOperator, STableScanInfo** ppInfo) {
  SOperatorInfo* pCur = pOperator;

  while (pCur->operatorType != QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    if (pCur->numOfDownstream == 0) {
      qError("failed to find stream scan operator");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    if (pCur->numOfDownstream > 1) {
      qError("join not supported for stream block scan");
      return TSDB_CODE_QRY_APP_ERROR;
    }

    pCur = pCur->pDownstream[0];
  }

  SStreamScanInfo* pStreamScan = pCur->info;
  ASSERT(pStreamScan->pTableScanOp->operatorType == QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN);
  *ppInfo = pStreamScan->pTableScanOp->info;
  return 0;
}

4407 4408 4409 4410 4411 4412 4413 4414 4415 4416 4417 4418 4419 4420 4421 4422 4423 4424 4425 4426 4427 4428
/**
 * Follow a chain of single-child physical plan nodes down to its leaf and
 * return that leaf as a table scan node.
 *
 * @param pNode  plan node to start from
 * @param ppNode receives the leaf when it is a QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN
 * @return 0 on success; -1 with terrno set to TSDB_CODE_QRY_APP_ERROR when the
 *         leaf is not a table scan or when a node on the way has more than one child
 */
int32_t extractTableScanNode(SPhysiNode* pNode, STableScanPhysiNode** ppNode) {
  SPhysiNode* pCur = pNode;

  for (;;) {
    bool isLeaf = (pCur->pChildren == NULL) || (LIST_LENGTH(pCur->pChildren) == 0);

    if (isLeaf) {
      if (QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN != pCur->type) {
        ASSERT(0);
        terrno = TSDB_CODE_QRY_APP_ERROR;
        return -1;
      }

      *ppNode = (STableScanPhysiNode*)pCur;
      return 0;
    }

    if (LIST_LENGTH(pCur->pChildren) != 1) {
      ASSERT(0);
      terrno = TSDB_CODE_QRY_APP_ERROR;
      return -1;
    }

    // exactly one child: keep descending
    pCur = (SPhysiNode*)nodesListGetNode(pCur->pChildren, 0);
  }
}

4429
#if 0
/**
 * Disabled helper: close the data reader of the table scan found below a
 * stream operator tree and open a new one from the plan's table scan node.
 *
 * @return 0 on success; -1 when the table scan operator or plan node cannot be
 *         located; TSDB_CODE_QRY_APP_ERROR when the new reader cannot be created
 */
int32_t rebuildReader(SOperatorInfo* pOperator, SSubplan* plan, SReadHandle* pHandle, int64_t uid, int64_t ts) {
  STableScanInfo* pTableScanInfo = NULL;
  if (extractTbscanInStreamOpTree(pOperator, &pTableScanInfo) < 0) {
    return -1;
  }

  STableScanPhysiNode* pNode = NULL;
  if (extractTableScanNode(plan->pNode, &pNode) < 0) {
    ASSERT(0);
    // Do not continue with a NULL plan node when assertions are compiled out.
    return -1;
  }

  tsdbReaderClose(pTableScanInfo->dataReader);

  STableListInfo info = {0};
  pTableScanInfo->dataReader = doCreateDataReader(pNode, pHandle, &info, NULL);
  if (pTableScanInfo->dataReader == NULL) {
    ASSERT(0);
    qError("failed to create data reader");
    return TSDB_CODE_QRY_APP_ERROR;
  }
  // TODO: set uid and ts to data reader
  return 0;
}
#endif
4454

C
Cary Xu 已提交
4455
/**
 * Serialize the result rows of an operator and all of its downstream operators
 * into one growing buffer.
 *
 * Buffer layout: a leading int32_t holding the total size (header included),
 * followed by the chunks produced by each operator's encodeResultRow callback,
 * appended in visiting order (this operator first, then its downstreams).
 *
 * @param ops          operator to encode
 * @param result       in/out buffer pointer; allocated on the first chunk and
 *                     reallocated afterwards; freed and reset to NULL when the
 *                     encode callback fails or the buffer cannot be grown
 * @param length       receives the total buffer size after a chunk is appended
 * @param nOptrWithVal incremented once for every operator that produced data
 * @return TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT for missing output
 *         arguments, TSDB_CODE_OUT_OF_MEMORY, or the callback's error code
 */
int32_t encodeOperator(SOperatorInfo* ops, char** result, int32_t* length, int32_t* nOptrWithVal) {
  int32_t code = TDB_CODE_SUCCESS;

  if (ops->fpSet.encodeResultRow) {
    if (result == NULL || length == NULL || nOptrWithVal == NULL) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    char*   pChunk = NULL;
    int32_t chunkLen = 0;
    code = ops->fpSet.encodeResultRow(ops, &pChunk, &chunkLen);

    if (code != TDB_CODE_SUCCESS) {
      if (*result != NULL) {
        taosMemoryFree(*result);
        *result = NULL;
      }
      return code;
    }

    if (chunkLen == 0) {
      // nothing was produced by this operator; only the downstreams are visited
      ASSERT(!pChunk);
    } else {
      ++(*nOptrWithVal);

      ASSERT(chunkLen >= 0);

      if (*result != NULL) {
        // append to the existing buffer and bump the size stored in its header
        int32_t usedLen = *(int32_t*)(*result);
        char*   pGrown = (char*)taosMemoryRealloc(*result, usedLen + chunkLen);
        if (pGrown == NULL) {
          taosMemoryFree(pChunk);
          taosMemoryFree(*result);
          *result = NULL;
          return TSDB_CODE_OUT_OF_MEMORY;
        }
        *result = pGrown;
        memcpy(*result + usedLen, pChunk, chunkLen);
        *(int32_t*)(*result) += chunkLen;
      } else {
        // first chunk: create the buffer with room for the size header
        *result = (char*)taosMemoryCalloc(1, chunkLen + sizeof(int32_t));
        if (*result == NULL) {
          taosMemoryFree(pChunk);
          return TSDB_CODE_OUT_OF_MEMORY;
        }
        memcpy(*result + sizeof(int32_t), pChunk, chunkLen);
        *(int32_t*)(*result) = chunkLen + sizeof(int32_t);
      }

      taosMemoryFree(pChunk);
      *length = *(int32_t*)(*result);
    }
  }

  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    code = encodeOperator(ops->pDownstream[i], result, length, nOptrWithVal);
    if (code != TDB_CODE_SUCCESS) {
      return code;
    }
  }

  return TDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
4515
/**
 * Restore the result rows of an operator and its downstream operators from a
 * serialized buffer.
 *
 * The buffer starts with an int32_t total size; the payload handed to the
 * operator's decodeResultRow callback follows that header, and the first
 * int32_t of the payload is read as the size of the consumed chunk.
 *
 * NOTE: when more data follows the consumed chunk, a new size header is written
 * into the buffer (through a cast that drops the const qualifier) immediately
 * before the remaining data, so the input buffer is modified in place.
 *
 * @param ops    operator to decode into
 * @param result serialized buffer; must not be NULL when the operator has a
 *               decode callback
 * @param length expected to equal the size stored in the buffer header
 * @return TDB_CODE_SUCCESS, TSDB_CODE_TSC_INVALID_INPUT when the buffer is
 *         missing, or the callback's error code
 */
int32_t decodeOperator(SOperatorInfo* ops, const char* result, int32_t length) {
  if (ops->fpSet.decodeResultRow) {
    if (NULL == result) {
      return TSDB_CODE_TSC_INVALID_INPUT;
    }

    ASSERT(length == *(int32_t*)result);

    const char* pPayload = result + sizeof(int32_t);
    int32_t     rc = ops->fpSet.decodeResultRow(ops, (char*)pPayload);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }

    int32_t totalLength = *(int32_t*)result;
    int32_t dataLength = *(int32_t*)pPayload;

    if (totalLength != dataLength + sizeof(int32_t)) {
      // more chunks follow: step over the consumed one and store the new header
      int32_t remaining = totalLength - dataLength;
      result += dataLength;
      *(int32_t*)(result) = remaining;
      length = remaining;
    } else {
      // that was the last chunk
      result = NULL;
      length = 0;
    }
  }

  for (int32_t i = 0; i < ops->numOfDownstream; ++i) {
    int32_t rc = decodeOperator(ops->pDownstream[i], result, length);
    if (rc != TDB_CODE_SUCCESS) {
      return rc;
    }
  }

  return TDB_CODE_SUCCESS;
}

D
dapan1121 已提交
4552
/**
 * Create the parameter object required by a data sink node.
 *
 * - QUERY_NODE_PHYSICAL_PLAN_QUERY_INSERT: an SInserterParam carrying readHandle.
 * - QUERY_NODE_PHYSICAL_PLAN_DELETE: an SDeleterParam carrying the task's suid
 *   and the uid of every table in the task's table list.
 * - any other node type: *pParam is left untouched.
 *
 * @param pNode      data sink node whose type selects the parameter kind
 * @param pParam     receives the newly allocated parameter object
 * @param pTaskInfo  pointer to the task handle (read as SExecTaskInfo**)
 * @param readHandle stored in the inserter parameter
 * @return TSDB_CODE_SUCCESS or TSDB_CODE_OUT_OF_MEMORY
 */
int32_t createDataSinkParam(SDataSinkNode* pNode, void** pParam, qTaskInfo_t* pTaskInfo, SReadHandle* readHandle) {
  SExecTaskInfo* pTask = *(SExecTaskInfo**)pTaskInfo;

  if (QUERY_NODE_PHYSICAL_PLAN_QUERY_INSERT == pNode->type) {
    SInserterParam* pInserter = taosMemoryCalloc(1, sizeof(SInserterParam));
    if (pInserter == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pInserter->readHandle = readHandle;
    *pParam = pInserter;
  } else if (QUERY_NODE_PHYSICAL_PLAN_DELETE == pNode->type) {
    SDeleterParam* pDeleter = taosMemoryCalloc(1, sizeof(SDeleterParam));
    if (pDeleter == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    int32_t numOfTables = taosArrayGetSize(pTask->tableqinfoList.pTableList);
    pDeleter->suid = pTask->tableqinfoList.suid;
    pDeleter->pUidList = taosArrayInit(numOfTables, sizeof(uint64_t));
    if (pDeleter->pUidList == NULL) {
      taosMemoryFree(pDeleter);
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // collect the uid of every table the task works on
    for (int32_t idx = 0; idx < numOfTables; ++idx) {
      STableKeyInfo* pKey = taosArrayGet(pTask->tableqinfoList.pTableList, idx);
      taosArrayPush(pDeleter->pUidList, &pKey->uid);
    }

    *pParam = pDeleter;
  }

  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
4593
/**
 * Create an execution task for a sub plan and build its operator tree.
 *
 * On success the task stores `sql` and `pPlan`. On failure the partially built
 * task (if any) is destroyed, *pTaskInfo is reset to NULL, terrno is set and a
 * non-success code is returned.
 *
 * @param pPlan     sub plan to execute
 * @param pTaskInfo receives the created task, or NULL on failure
 * @param pHandle   read handle passed to the operator tree; may be NULL
 * @param taskId    task identifier
 * @param sql       SQL text; stored in the task on success, freed here when the
 *                  task itself cannot be allocated
 * @param model     execution model
 * @return TSDB_CODE_SUCCESS or an error code
 */
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
                               char* sql, EOPTR_EXEC_MODEL model) {
  uint64_t queryId = pPlan->id.queryId;

  int32_t code = TSDB_CODE_SUCCESS;
  *pTaskInfo = createExecTaskInfo(queryId, taskId, model, pPlan->dbFName);
  if (*pTaskInfo == NULL) {
    code = TSDB_CODE_QRY_OUT_OF_MEMORY;
    goto _complete;
  }

  if (pHandle && pHandle->pStateBackend) {
    (*pTaskInfo)->streamInfo.pState = pHandle->pStateBackend;
  }

  // The task now holds the sql string; clear the local copy so that the error
  // path below does not free it a second time.
  (*pTaskInfo)->sql = sql;
  sql = NULL;
  (*pTaskInfo)->pSubplan = pPlan;
  (*pTaskInfo)->pRoot = createOperatorTree(pPlan->pNode, *pTaskInfo, pHandle, &(*pTaskInfo)->tableqinfoList,
                                           pPlan->pTagCond, pPlan->pTagIndexCond, pPlan->user);

  if (NULL == (*pTaskInfo)->pRoot) {
    code = (*pTaskInfo)->code;
    if (code == TSDB_CODE_SUCCESS) {
      // The tree could not be built but no code was recorded in the task.
      // Never report success for a task that is destroyed below.
      code = TSDB_CODE_QRY_APP_ERROR;
    }
    goto _complete;
  }

  return code;

_complete:
  taosMemoryFree(sql);
  if (*pTaskInfo != NULL) {
    // doDestroyTask dereferences its argument, so it must not see NULL; reset
    // the out pointer afterwards so the caller is not left with a freed task.
    doDestroyTask(*pTaskInfo);
    *pTaskInfo = NULL;
  }
  terrno = code;
  return code;
}

wmmhello's avatar
wmmhello 已提交
4628 4629 4630
/**
 * Release every container held by a table list: the table array, the lookup
 * map and the group list. All three pointers are reset to NULL afterwards.
 *
 * When needSortTableByGroupId is set, the arrays stored inside pGroupList are
 * destroyed as well, except for an entry that is the table array itself, which
 * has already been destroyed.
 */
static void doDestroyTableList(STableListInfo* pTableqinfoList) {
  taosArrayDestroy(pTableqinfoList->pTableList);
  taosHashCleanup(pTableqinfoList->map);

  if (pTableqinfoList->needSortTableByGroupId) {
    for (int32_t i = 0; i < taosArrayGetSize(pTableqinfoList->pGroupList); i++) {
      SArray* tmp = taosArrayGetP(pTableqinfoList->pGroupList, i);
      if (tmp == pTableqinfoList->pTableList) {
        // same array as pTableList, which was destroyed above
        continue;
      }
      taosArrayDestroy(tmp);
    }
  }
  taosArrayDestroy(pTableqinfoList->pGroupList);

  pTableqinfoList->pTableList = NULL;
  pTableqinfoList->map = NULL;
  // reset like the two members above so no dangling pointer is left behind
  pTableqinfoList->pGroupList = NULL;
}

L
Liu Jicong 已提交
4646
/**
 * Destroy an execution task together with everything it holds: the table list,
 * the operator tree, the schema info, the sub plan, the sql string, the task id
 * string and finally the task object itself.
 *
 * @param pTaskInfo task to destroy; NULL is accepted and ignored
 */
void doDestroyTask(SExecTaskInfo* pTaskInfo) {
  if (pTaskInfo == NULL) {
    // createExecTaskInfoImpl reaches this function with NULL when the task
    // allocation itself failed
    return;
  }

  qDebug("%s execTask is freed", GET_TASKID(pTaskInfo));

  doDestroyTableList(&pTaskInfo->tableqinfoList);
  destroyOperatorInfo(pTaskInfo->pRoot);
  cleanupTableSchemaInfo(&pTaskInfo->schemaInfo);

  nodesDestroyNode((SNode*)pTaskInfo->pSubplan);

  taosMemoryFreeClear(pTaskInfo->sql);
  taosMemoryFreeClear(pTaskInfo->id.str);
  taosMemoryFreeClear(pTaskInfo);
}

/**
 * Copy one tag value into an output buffer.
 *
 * @param output destination buffer
 * @param val    source value; NULL writes the type's null representation
 * @param type   data type of the value
 * @param bytes  number of bytes available for the value in the output
 *
 * A variable-length value whose total length exceeds `bytes` is truncated so
 * that header plus data fit into `bytes`.
 */
static void doSetTagValueToResultBuf(char* output, const char* val, int16_t type, int16_t bytes) {
  if (val == NULL) {
    setNull(output, type, bytes);
    return;
  }

  if (!IS_VAR_DATA_TYPE(type)) {
    memcpy(output, val, bytes);
    return;
  }

  if (varDataTLen(val) <= bytes) {
    varDataCopy(output, val);
    return;
  }

  // The value does not fit: keep only as much data as the output can hold.
  int32_t maxLen = bytes - VARSTR_HEADER_SIZE;
  int32_t len = varDataLen(val);
  if (len > maxLen) {
    len = maxLen;
  }

  memcpy(varDataVal(output), varDataVal(val), len);
  varDataSetLen(output, len);
}

/**
 * Estimate the buffer size reserved for a query over `numOfTables` tables:
 * 1.5 times sizeof(STableQueryInfo) per table, truncated to an integer.
 */
static int64_t getQuerySupportBufSize(size_t numOfTables) {
  return (int64_t)(sizeof(STableQueryInfo) * 1.5 * numOfTables);
}

/**
 * Reserve query buffer space for `numOfTables` tables from the global budget
 * tsQueryBufferSizeBytes.
 *
 * @return TSDB_CODE_SUCCESS when the budget is negative (no reservation is
 *         made) or when the reservation succeeded;
 *         TSDB_CODE_QRY_NOT_ENOUGH_BUFFER when the budget is zero or smaller
 *         than the requested amount
 */
int32_t checkForQueryBuf(size_t numOfTables) {
  int64_t required = getQuerySupportBufSize(numOfTables);

  if (tsQueryBufferSizeBytes < 0) {
    return TSDB_CODE_SUCCESS;
  }

  if (tsQueryBufferSizeBytes <= 0) {
    // disable query processing if the value of tsQueryBufferSize is zero.
    return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
  }

  // Retry until the compare-and-swap succeeds or the budget is too small.
  for (;;) {
    int64_t current = tsQueryBufferSizeBytes;
    int64_t remain = current - required;
    if (remain < 0) {
      return TSDB_CODE_QRY_NOT_ENOUGH_BUFFER;
    }

    if (atomic_val_compare_exchange_64(&tsQueryBufferSizeBytes, current, remain) == current) {
      return TSDB_CODE_SUCCESS;
    }
  }
}

/**
 * Give the buffer estimate for `numOfTables` tables back to the global budget
 * tsQueryBufferSizeBytes.
 *
 * Nothing is done when the budget is negative, the same setting under which
 * checkForQueryBuf() performs no accounting.
 *
 * @param numOfTables number of tables the estimate is computed for
 */
void releaseQueryBuf(size_t numOfTables) {
  if (tsQueryBufferSizeBytes >= 0) {
    int64_t reserved = getQuerySupportBufSize(numOfTables);

    // atomically add the estimate back to the available budget
    atomic_add_fetch_64(&tsQueryBufferSizeBytes, reserved);
  }
}
D
dapan1121 已提交
4719

H
Haojun Liao 已提交
4720
/**
 * Collect the explain/execution statistics of an operator tree.
 *
 * One SExplainExecInfo entry is appended to `pExecInfoList` for `operatorInfo`
 * itself, then the function recurses into every downstream operator in index
 * order, so entries end up in pre-order.
 *
 * @param operatorInfo  root of the operator (sub)tree to report on
 * @param pExecInfoList array of SExplainExecInfo that receives the entries
 * @return TSDB_CODE_SUCCESS on success;
 *         TSDB_CODE_QRY_OUT_OF_MEMORY if the entry could not be appended;
 *         otherwise the error code reported by the operator's getExplainFn or by
 *         a downstream operator (propagated unchanged).
 */
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SArray* pExecInfoList) {
  SExplainExecInfo  execInfo = {0};
  SExplainExecInfo* pExplainInfo = taosArrayPush(pExecInfoList, &execInfo);
  if (pExplainInfo == NULL) {
    // the push failed, so there is no entry to fill in
    return TSDB_CODE_QRY_OUT_OF_MEMORY;
  }

  pExplainInfo->numOfRows = operatorInfo->resultInfo.totalRows;
  pExplainInfo->startupCost = operatorInfo->cost.openCost;
  pExplainInfo->totalCost = operatorInfo->cost.totalCost;
  pExplainInfo->verboseLen = 0;
  pExplainInfo->verboseInfo = NULL;

  int32_t code = TSDB_CODE_SUCCESS;
  if (operatorInfo->fpSet.getExplainFn) {
    code = operatorInfo->fpSet.getExplainFn(operatorInfo, &pExplainInfo->verboseInfo, &pExplainInfo->verboseLen);
    if (code) {
      qError("%s operator getExplainFn failed, code:%s", GET_TASKID(operatorInfo->pTaskInfo), tstrerror(code));
      return code;
    }
  }

  // NOTE(review): pExplainInfo points into the array and is not used past this point;
  // presumably the pushes done by the recursive calls may move the array storage.
  for (int32_t i = 0; i < operatorInfo->numOfDownstream; ++i) {
    code = getOperatorExplainExecInfo(operatorInfo->pDownstream[i], pExecInfoList);
    if (code != TSDB_CODE_SUCCESS) {
      // report the real failure instead of masking it as out-of-memory
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}
5
54liuyao 已提交
4750

L
Liu Jicong 已提交
4751
/**
 * Initialise a stream aggregation supporter.
 *
 * Sets the result-row/key/value sizes, allocates the key buffer, the result-row
 * hash table and the STREAM_CLEAR scan block, creates the disk-based result
 * buffer under tsTempDir, and finally points every function context's pBuf at
 * that result buffer.
 *
 * @param pSup        supporter to initialise
 * @param pKey        key/name handed to createDiskbasedBuf
 * @param pCtx        array of `numOfOutput` function contexts
 * @param numOfOutput number of entries in `pCtx`
 * @param size        stored as pSup->valueSize
 * @return TSDB_CODE_OUT_OF_MEMORY if the key buffer or hash table could not be created,
 *         TSDB_CODE_NO_AVAIL_DISK (also stored in terrno) if no temp space is available,
 *         otherwise the result of createDiskbasedBuf
 */
int32_t initStreamAggSupporter(SStreamAggSupporter* pSup, const char* pKey, SqlFunctionCtx* pCtx, int32_t numOfOutput,
                               int32_t size) {
  pSup->resultRowSize = getResultRowSize(pCtx, numOfOutput);
  pSup->keySize = sizeof(int64_t) + sizeof(TSKEY);

  pSup->pKeyBuf = taosMemoryCalloc(1, pSup->keySize);
  pSup->pResultRows =
      taosHashInit(1024, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_NO_LOCK);
  if (pSup->pKeyBuf == NULL || pSup->pResultRows == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  pSup->valueSize = size;
  pSup->pScanBlock = createSpecialDataBlock(STREAM_CLEAR);

  // page size: smallest power-of-two multiple of 4096 that is >= 4 result rows
  int32_t pageSize = 4096;
  for (; pageSize < pSup->resultRowSize * 4; pageSize <<= 1u) {
  }

  // at least four pages need to be in buffer
  // NOTE(review): a page size strictly between a quarter of the default and the
  // default itself keeps the default buffer, i.e. fewer than four pages; confirm intended.
  int32_t bufSize = 4096 * 256;
  if (pageSize >= bufSize) {
    bufSize = pageSize * 4;
  }

  if (!osTempSpaceAvailable()) {
    terrno = TSDB_CODE_NO_AVAIL_DISK;
    qError("Init stream agg supporter failed since %s", terrstr(terrno));
    return terrno;
  }

  int32_t code = createDiskbasedBuf(&pSup->pResultBuf, pageSize, bufSize, pKey, tsTempDir);

  // NOTE(review): the contexts are wired to pResultBuf even when `code` reports a failure.
  int32_t idx = 0;
  while (idx < numOfOutput) {
    pCtx[idx].pBuf = pSup->pResultBuf;
    ++idx;
  }

  return code;
}