scanoperator.c 128.6 KB
Newer Older
H
Haojun Liao 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

16
#include "executorimpl.h"
H
Haojun Liao 已提交
17
#include "filter.h"
18
#include "function.h"
19
#include "functionMgt.h"
L
Liu Jicong 已提交
20
#include "os.h"
H
Haojun Liao 已提交
21
#include "querynodes.h"
22
#include "systable.h"
H
Haojun Liao 已提交
23
#include "tname.h"
24
#include "ttime.h"
H
Haojun Liao 已提交
25 26 27 28 29 30 31 32 33

#include "tdatablock.h"
#include "tmsg.h"

#include "query.h"
#include "tcompare.h"
#include "thash.h"
#include "ttypes.h"

D
dapan1121 已提交
34 35 36
// Global switch, zero by default; presumably enables extra scan debugging (not read in the visible part of this file).
int32_t scanDebug = 0;

#define MULTI_READER_MAX_TABLE_NUM 5000

// Put the given scan info into the reverse-scan phase.
#define SET_REVERSE_SCAN_FLAG(_info) ((_info)->scanFlag = REVERSE_SCAN)

// Flip an order value in place: ascending becomes descending, any other value becomes ascending.
#define SWITCH_ORDER(n) ((n) = (((n) == TSDB_ORDER_ASC) ? TSDB_ORDER_DESC : TSDB_ORDER_ASC))
40

H
Haojun Liao 已提交
41 42 43 44 45 46 47 48 49
// Pairs a file-block load recorder with sort execution info. Judging by the name this is the execution
// statistics record of the table merge scan operator (it is not used in the visible part of this file).
typedef struct STableMergeScanExecInfo {
  SFileBlockLoadRecorder blockRecorder;
  SSortExecInfo          sortExecInfo;
} STableMergeScanExecInfo;

typedef struct STableMergeScanSortSourceParam {
  SOperatorInfo* pOperator;
  int32_t        readerIdx;
  uint64_t       uid;
50
  SSDataBlock*   inputBlock;  
D
dapan1121 已提交
51
  bool           multiReader;
52
  STsdbReader*   dataReader;
H
Haojun Liao 已提交
53 54
} STableMergeScanSortSourceParam;

L
Liu Jicong 已提交
55
static bool processBlockWithProbability(const SSampleExecInfo* pInfo);

/*
 * Decide whether the current data block takes part in the scan.
 *
 * Ratio-based sampling (accept a block when a random draw modulo 1/sampleRatio is zero) is switched off in
 * this build, so every block is accepted and pInfo is not consulted.
 *
 * @param pInfo  sampling settings of the scan operator (currently unused)
 * @return always true
 */
bool processBlockWithProbability(const SSampleExecInfo* pInfo) {
  (void)pInfo;
  return true;
}

70
// Flip the order field (ascending <-> descending) of the first numOfOutput function contexts in pCtx.
// Nothing is touched when numOfOutput is zero or negative.
static void switchCtxOrder(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  int32_t idx = 0;
  while (idx < numOfOutput) {
    SWITCH_ORDER(pCtx[idx].order);
    ++idx;
  }
}

76 77 78 79 80 81 82 83 84
/*
 * Advance *tw to the next time window in scan direction.
 *
 * For every interval unit except 'n' and 'y' the window start moves by one sliding step and the end is
 * start + interval - 1. For the 'n' and 'y' units the interval is counted in months ('y' is multiplied by 12),
 * so the new bounds are derived through broken-down local time.
 *
 * @param pInterval  interval definition (interval, sliding, unit, precision)
 * @param tw         in: current window, out: next window
 * @param order      scan order, translated into the step direction by GET_FORWARD_DIRECTION_FACTOR
 */
static void getNextTimeWindow(SInterval* pInterval, STimeWindow* tw, int32_t order) {
  int32_t step = GET_FORWARD_DIRECTION_FACTOR(order);

  bool monthBased = (pInterval->intervalUnit == 'n') || (pInterval->intervalUnit == 'y');
  if (!monthBased) {
    tw->skey += pInterval->sliding * step;
    tw->ekey = tw->skey + pInterval->interval - 1;
    return;
  }

  int64_t months = pInterval->interval;
  if (pInterval->intervalUnit == 'y') {
    months *= 12;
  }

  // convert key to second
  int64_t seconds = tw->skey;
  seconds = convertTimePrecision(seconds, pInterval->precision, TSDB_TIME_PRECISION_MILLI) / 1000;

  struct tm tm;
  time_t    t = (time_t)seconds;
  taosLocalTime(&t, &tm);

  // shift the window start by the interval, in months, along the scan direction
  int mon = (int)(tm.tm_year * 12 + tm.tm_mon + months * step);
  tm.tm_year = mon / 12;
  tm.tm_mon = mon % 12;
  tw->skey = convertTimePrecision((int64_t)taosMktime(&tm) * 1000LL, TSDB_TIME_PRECISION_MILLI, pInterval->precision);

  // the window ends one tick before the start of the window that lies one interval later
  mon = (int)(mon + months);
  tm.tm_year = mon / 12;
  tm.tm_mon = mon % 12;
  tw->ekey = convertTimePrecision((int64_t)taosMktime(&tm) * 1000LL, TSDB_TIME_PRECISION_MILLI, pInterval->precision);
  tw->ekey -= 1;
}

109
/*
 * Tell whether the time range of a data block is touched by more than one interval window.
 *
 * The first window is the one aligned to the block boundary that is met first in scan direction (block start
 * for ascending, block end for descending). The block overlaps when that window stops inside the block, or
 * when one of the following (sliding) windows still intersects the block.
 *
 * @param pInterval   interval definition; interval == 0 means there is no interval operator upstream
 * @param pBlockInfo  block whose window (skey/ekey) is examined
 * @param order       scan order (TSDB_ORDER_ASC or descending)
 * @return true if the block crosses a window boundary, false otherwise (always false when interval == 0)
 */
static bool overlapWithTimeWindow(SInterval* pInterval, SDataBlockInfo* pBlockInfo, int32_t order) {
  STimeWindow w = {0};

  // 0 by default, which means it is not a interval operator of the upstream operator.
  if (pInterval->interval == 0) {
    return false;
  }

  if (order == TSDB_ORDER_ASC) {
    w = getAlignQueryTimeWindow(pInterval, pInterval->precision, pBlockInfo->window.skey);
    ASSERT(w.ekey >= pBlockInfo->window.skey);

    // the first window ends before the block does: the block spans at least two windows
    if (w.ekey < pBlockInfo->window.ekey) {
      return true;
    }

    while (1) {
      getNextTimeWindow(pInterval, &w, order);
      if (w.skey > pBlockInfo->window.ekey) {
        break;
      }

      ASSERT(w.ekey > pBlockInfo->window.ekey);
      if (TMAX(w.skey, pBlockInfo->window.skey) <= pBlockInfo->window.ekey) {
        return true;
      }
    }
  } else {
    w = getAlignQueryTimeWindow(pInterval, pInterval->precision, pBlockInfo->window.ekey);
    ASSERT(w.skey <= pBlockInfo->window.ekey);

    // the first window starts after the block does: the block spans at least two windows
    if (w.skey > pBlockInfo->window.skey) {
      return true;
    }

    while (1) {
      getNextTimeWindow(pInterval, &w, order);
      if (w.ekey < pBlockInfo->window.skey) {
        break;
      }

      // same assertion macro as the other three checks in this function
      ASSERT(w.skey < pBlockInfo->window.skey);
      if (pBlockInfo->window.skey <= TMIN(w.ekey, pBlockInfo->window.ekey)) {
        return true;
      }
    }
  }

  return false;
}

160 161 162 163 164 165 166 167 168 169 170
/*
 * Used by the table scanner to look up the temporary result row that the upstream aggregate keeps for a group.
 *
 * @param pOperator  must be a QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN operator, otherwise NULL is returned
 * @param groupId    group whose result row is wanted
 * @param pPage      out: buffer page obtained through getBufPage; written only when a position for the group
 *                   exists (it is NULL if the page could not be obtained)
 * @return the result row inside *pPage, or NULL when the operator type does not match, the group has no
 *         entry in the result-row hash table, or the page is not available
 */
static SResultRow* getTableGroupOutputBuf(SOperatorInfo* pOperator, uint64_t groupId, SFilePage** pPage) {
  if (pOperator->operatorType != QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN) {
    return NULL;
  }

  STableScanInfo* pScan = pOperator->info;

  // build the hash key for this group
  int64_t keyBuf[2] = {0};
  SET_RES_WINDOW_KEY((char*)keyBuf, &groupId, sizeof(groupId), groupId);

  SResultRowPosition* pPos = (SResultRowPosition*)tSimpleHashGet(
      pScan->base.pdInfo.pAggSup->pResultRowHashTable, keyBuf, GET_RES_WINDOW_KEY_LEN(sizeof(groupId)));
  if (pPos == NULL) {
    return NULL;
  }

  *pPage = getBufPage(pScan->base.pdInfo.pAggSup->pResultBuf, pPos->pageId);
  if (*pPage == NULL) {
    return NULL;
  }

  char* pPageStart = (char*)(*pPage);
  return (SResultRow*)(pPageStart + pPos->offset);
}

/*
 * Ask every pushed-down function whether, given the current result row of the block's group, the block still
 * has to be loaded. If all of them answer FUNC_DATA_REQUIRED_NOT_LOAD, *status is set to that value;
 * otherwise *status is left as it was.
 *
 * Nothing happens when no expression supporter is attached to the scan or when the group has no result row.
 *
 * @return TSDB_CODE_SUCCESS in all cases
 */
static int32_t doDynamicPruneDataBlock(SOperatorInfo* pOperator, SDataBlockInfo* pBlockInfo, uint32_t* status) {
  STableScanInfo* pScan = pOperator->info;

  SExprSupp* pExprSup = pScan->base.pdInfo.pExprSup;
  if (pExprSup == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  SFilePage*  pPage = NULL;
  SResultRow* pRow = getTableGroupOutputBuf(pOperator, pBlockInfo->id.groupId, &pPage);
  if (pRow == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  // stop at the first function that still needs the block data
  bool needLoad = false;
  for (int32_t i = 0; (i < pExprSup->numOfExprs) && (!needLoad); ++i) {
    int32_t              functionId = pExprSup->pCtx[i].functionId;
    SResultRowEntryInfo* pEntry = getResultEntryInfo(pRow, i, pExprSup->rowEntryInfoOffset);

    int32_t reqStatus = fmFuncDynDataRequired(functionId, pEntry, &pBlockInfo->window);
    needLoad = (reqStatus != FUNC_DATA_REQUIRED_NOT_LOAD);
  }

  // release buffer pages
  releaseBufPage(pScan->base.pdInfo.pAggSup->pResultBuf, pPage);

  if (!needLoad) {
    *status = FUNC_DATA_REQUIRED_NOT_LOAD;
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
225
// Evaluate the filter against the per-column block aggregates (SMA).
// Returns the verdict of filterRangeExecute; when either the aggregates or the filter are missing the block
// is kept (true).
static bool doFilterByBlockSMA(SFilterInfo* pFilterInfo, SColumnDataAgg** pColsAgg, int32_t numOfCols,
                               int32_t numOfRows) {
  bool canEvaluate = (pColsAgg != NULL) && (pFilterInfo != NULL);
  if (!canEvaluate) {
    return true;
  }

  return filterRangeExecute(pFilterInfo, pColsAgg, numOfCols, numOfRows);
}

H
Haojun Liao 已提交
235
// Retrieve the block-level aggregates (SMA) for pBlock from the reader.
// Returns true only if tsdbRetrieveDatablockSMA reports that all columns have aggregates.
// A retrieval error does not return: it long-jumps out through pTaskInfo->env with the error code.
static bool doLoadBlockSMA(STableScanBase* pTableScanInfo, SSDataBlock* pBlock, SExecTaskInfo* pTaskInfo) {
  bool hasAggForAllCols = true;

  int32_t code = tsdbRetrieveDatablockSMA(pTableScanInfo->dataReader, pBlock, &hasAggForAllCols);
  if (code != TSDB_CODE_SUCCESS) {
    T_LONG_JMP(pTaskInfo->env, code);
  }

  return hasAggForAllCols;
}

H
Haojun Liao 已提交
248
// Fill the tag / pseudo columns of pBlock for `rows` rows, if the scan has any pseudo expressions.
// A "table not exists" error is tolerated; any other error long-jumps out through pTaskInfo->env.
// terrno is reset to 0 afterwards.
static void doSetTagColumnData(STableScanBase* pTableScanInfo, SSDataBlock* pBlock, SExecTaskInfo* pTaskInfo,
                               int32_t rows) {
  SExprSupp* pPseudoSup = &pTableScanInfo->pseudoSup;
  if (pPseudoSup->numOfExprs <= 0) {
    return;
  }

  int32_t code = addTagPseudoColumnData(&pTableScanInfo->readHandle, pPseudoSup->pExprInfo, pPseudoSup->numOfExprs,
                                        pBlock, rows, GET_TASKID(pTaskInfo), &pTableScanInfo->metaCache);

  // ignore the table not exists error, since this table may have been dropped during the scan procedure.
  bool fatal = (code != TSDB_CODE_SUCCESS) && (code != TSDB_CODE_PAR_TABLE_NOT_EXIST);
  if (fatal) {
    T_LONG_JMP(pTaskInfo->env, code);
  }

  // reset the error code.
  terrno = 0;
}

265
/*
 * Apply the remaining OFFSET and the LIMIT of pLimitInfo to pBlock.
 *
 * Offset: a block that lies entirely inside the remaining offset is emptied and consumed from the offset;
 * otherwise the leading rows covered by the offset are trimmed.
 * Limit: when this block reaches the limit (limit != -1), only the rows still allowed are kept.
 * numOfOutputRows is advanced by the rows left in the block, except for a block emptied by the offset.
 *
 * @return true when the limit has been reached with this block, false otherwise
 */
bool applyLimitOffset(SLimitInfo* pLimitInfo, SSDataBlock* pBlock, SExecTaskInfo* pTaskInfo) {
  const char* id = GET_TASKID(pTaskInfo);
  SLimit*     pLimit = &pLimitInfo->limit;

  if (pLimitInfo->remainOffset > 0) {
    if (pLimitInfo->remainOffset >= pBlock->info.rows) {
      // the whole block is swallowed by the offset
      pLimitInfo->remainOffset -= pBlock->info.rows;
      blockDataEmpty(pBlock);
      qDebug("current block ignore due to offset, current:%" PRId64 ", %s", pLimitInfo->remainOffset, id);
      return false;
    }

    blockDataTrimFirstRows(pBlock, pLimitInfo->remainOffset);
    pLimitInfo->remainOffset = 0;
  }

  bool limitReached =
      (pLimit->limit != -1) && (pLimit->limit <= (pLimitInfo->numOfOutputRows + pBlock->info.rows));

  if (limitReached) {
    // limit the output rows
    int32_t keep = (int32_t)(pLimit->limit - pLimitInfo->numOfOutputRows);
    blockDataKeepFirstNRows(pBlock, keep);
  }

  pLimitInfo->numOfOutputRows += pBlock->info.rows;

  if (limitReached) {
    qDebug("output limit %" PRId64 " has reached, %s", pLimit->limit, id);
  }

  return limitReached;
}

H
Haojun Liao 已提交
295
/*
 * Decide how much of the current reader block is needed and load it accordingly.
 *
 * The starting point is the operator's dataBlockLoadFlag; a filter on the operator or a block that crosses an
 * interval window boundary forces a full data load. Depending on the resulting status the block is
 *   - dropped                       (FUNC_DATA_REQUIRED_FILTEROUT),
 *   - skipped, only tags are set    (FUNC_DATA_REQUIRED_NOT_LOAD),
 *   - answered from the block SMA   (FUNC_DATA_REQUIRED_SMA_LOAD, falls back to a data load if not every
 *                                    column has SMA),
 *   - fully loaded, filtered and limited (FUNC_DATA_REQUIRED_DATA_LOAD). Before the actual load the block may
 *     still be rejected by the SMA-based filter or by dynamic pruning; both report FILTEROUT.
 *
 * @param pOperator       scan operator (filter info, completion flag)
 * @param pTableScanInfo  scan state shared by the table scan operators
 * @param pBlock          result block the reader fills
 * @param status          out: final FUNC_DATA_REQUIRED_* status of the block
 * @return TSDB_CODE_SUCCESS, the error code of the dynamic pruning step, or terrno when the reader returns no
 *         block. Errors inside SMA loading and tag filling long-jump through pTaskInfo->env instead.
 */
static int32_t loadDataBlock(SOperatorInfo* pOperator, STableScanBase* pTableScanInfo, SSDataBlock* pBlock,
                             uint32_t* status) {
  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;
  SFileBlockLoadRecorder* pCost = &pTableScanInfo->readRecorder;

  pCost->totalBlocks += 1;
  pCost->totalRows += pBlock->info.rows;

  bool loadSMA = false;
  *status = pTableScanInfo->dataBlockLoadFlag;
  if (pOperator->exprSupp.pFilterInfo != NULL ||
      overlapWithTimeWindow(&pTableScanInfo->pdInfo.interval, &pBlock->info, pTableScanInfo->cond.order)) {
    (*status) = FUNC_DATA_REQUIRED_DATA_LOAD;
  }

  SDataBlockInfo* pBlockInfo = &pBlock->info;
  taosMemoryFreeClear(pBlock->pBlockAgg);

  if (*status == FUNC_DATA_REQUIRED_FILTEROUT) {
    qDebug("%s data block filter out, brange:%" PRId64 "-%" PRId64 ", rows:%d", GET_TASKID(pTaskInfo),
           pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
    pCost->filterOutBlocks += 1;
    // NOTE(review): the rows of this block were already added to totalRows at the top of the function, so
    // this path counts them twice -- confirm whether that is intended.
    pCost->totalRows += pBlock->info.rows;
    tsdbReleaseDataBlock(pTableScanInfo->dataReader);
    return TSDB_CODE_SUCCESS;
  } else if (*status == FUNC_DATA_REQUIRED_NOT_LOAD) {
    qDebug("%s data block skipped, brange:%" PRId64 "-%" PRId64 ", rows:%d, uid:%" PRIu64, GET_TASKID(pTaskInfo),
           pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, pBlockInfo->id.uid);
    doSetTagColumnData(pTableScanInfo, pBlock, pTaskInfo, 1);
    pCost->skipBlocks += 1;
    tsdbReleaseDataBlock(pTableScanInfo->dataReader);
    return TSDB_CODE_SUCCESS;
  } else if (*status == FUNC_DATA_REQUIRED_SMA_LOAD) {
    pCost->loadBlockStatis += 1;
    loadSMA = true;  // mark the operation of load sma;
    bool success = doLoadBlockSMA(pTableScanInfo, pBlock, pTaskInfo);
    if (success) {
      qDebug("%s data block SMA loaded, brange:%" PRId64 "-%" PRId64 ", rows:%d", GET_TASKID(pTaskInfo),
             pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
      doSetTagColumnData(pTableScanInfo, pBlock, pTaskInfo, 1);
      tsdbReleaseDataBlock(pTableScanInfo->dataReader);
      return TSDB_CODE_SUCCESS;
    } else {
      // failed to load the block sma data, data block statistics does not exist, load data block instead
      qDebug("%s failed to load SMA, since not all columns have SMA", GET_TASKID(pTaskInfo));
      *status = FUNC_DATA_REQUIRED_DATA_LOAD;
    }
  }

  ASSERT(*status == FUNC_DATA_REQUIRED_DATA_LOAD);

  // try to filter data block according to sma info
  if (pOperator->exprSupp.pFilterInfo != NULL && (!loadSMA)) {
    bool success = doLoadBlockSMA(pTableScanInfo, pBlock, pTaskInfo);
    if (success) {
      size_t size = taosArrayGetSize(pBlock->pDataBlock);
      bool   keep = doFilterByBlockSMA(pOperator->exprSupp.pFilterInfo, pBlock->pBlockAgg, size, pBlockInfo->rows);
      if (!keep) {
        qDebug("%s data block filter out by block SMA, brange:%" PRId64 "-%" PRId64 ", rows:%d", GET_TASKID(pTaskInfo),
               pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
        pCost->filterOutBlocks += 1;
        (*status) = FUNC_DATA_REQUIRED_FILTEROUT;

        tsdbReleaseDataBlock(pTableScanInfo->dataReader);
        return TSDB_CODE_SUCCESS;
      }
    }
  }

  // free the sma info, since it should not be involved in later computing process.
  taosMemoryFreeClear(pBlock->pBlockAgg);

  // try to filter data block according to current results
  int32_t code = doDynamicPruneDataBlock(pOperator, pBlockInfo, status);
  if (code != TSDB_CODE_SUCCESS) {
    // do not swallow a pruning failure; hand it to the caller like the other error paths
    tsdbReleaseDataBlock(pTableScanInfo->dataReader);
    return code;
  }

  if (*status == FUNC_DATA_REQUIRED_NOT_LOAD) {
    qDebug("%s data block skipped due to dynamic prune, brange:%" PRId64 "-%" PRId64 ", rows:%d", GET_TASKID(pTaskInfo),
           pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows);
    pCost->skipBlocks += 1;
    tsdbReleaseDataBlock(pTableScanInfo->dataReader);
    *status = FUNC_DATA_REQUIRED_FILTEROUT;
    return TSDB_CODE_SUCCESS;
  }

  pCost->totalCheckedRows += pBlock->info.rows;
  pCost->loadBlocks += 1;

  SSDataBlock* p = tsdbRetrieveDataBlock(pTableScanInfo->dataReader, NULL);
  if (p == NULL) {
    return terrno;
  }

  ASSERT(p == pBlock);
  doSetTagColumnData(pTableScanInfo, pBlock, pTaskInfo, pBlock->info.rows);

  // restore the previous value: the rows are added again below, after filter and limit have been applied
  pCost->totalRows -= pBlock->info.rows;

  if (pOperator->exprSupp.pFilterInfo != NULL) {
    int64_t st = taosGetTimestampUs();
    doFilter(pBlock, pOperator->exprSupp.pFilterInfo, &pTableScanInfo->matchInfo);

    double el = (taosGetTimestampUs() - st) / 1000.0;
    pTableScanInfo->readRecorder.filterTime += el;

    if (pBlock->info.rows == 0) {
      pCost->filterOutBlocks += 1;
      qDebug("%s data block filter out, brange:%" PRId64 "-%" PRId64 ", rows:%d, elapsed time:%.2f ms",
             GET_TASKID(pTaskInfo), pBlockInfo->window.skey, pBlockInfo->window.ekey, pBlockInfo->rows, el);
    } else {
      qDebug("%s data block filter applied, elapsed time:%.2f ms", GET_TASKID(pTaskInfo), el);
    }
  }

  bool limitReached = applyLimitOffset(&pTableScanInfo->limitInfo, pBlock, pTaskInfo);
  if (limitReached) {  // set operator flag is done
    setOperatorCompleted(pOperator);
  }

  pCost->totalRows += pBlock->info.rows;
  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
416
// Switch the scan state to a descending (reverse) pass: raise the reverse-scan flag, flip the order of the
// first numOfOutput function contexts, set the query condition order to descending and swap the two ends of
// the query time window.
static void prepareForDescendingScan(STableScanBase* pTableScanInfo, SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  SET_REVERSE_SCAN_FLAG(pTableScanInfo);
  switchCtxOrder(pCtx, numOfOutput);

  pTableScanInfo->cond.order = TSDB_ORDER_DESC;

  STimeWindow* pWin = &pTableScanInfo->cond.twindows;
  TSWAP(pWin->skey, pWin->ekey);
}

425 426
typedef struct STableCachedVal {
  const char* pName;
427
  STag*       pTags;
428 429
} STableCachedVal;

430 431 432 433 434 435 436 437 438 439 440
// Release a heap-allocated STableCachedVal together with the name and tag buffers it owns.
// A NULL argument is accepted and ignored.
static void freeTableCachedVal(void* param) {
  STableCachedVal* pCached = param;
  if (pCached != NULL) {
    taosMemoryFree((void*)pCached->pName);
    taosMemoryFree(pCached->pTags);
    taosMemoryFree(pCached);
  }
}

H
Haojun Liao 已提交
441 442
static STableCachedVal* createTableCacheVal(const SMetaReader* pMetaReader) {
  STableCachedVal* pVal = taosMemoryMalloc(sizeof(STableCachedVal));
443
  pVal->pName = taosStrdup(pMetaReader->me.name);
H
Haojun Liao 已提交
444 445 446 447
  pVal->pTags = NULL;

  // only child table has tag value
  if (pMetaReader->me.type == TSDB_CHILD_TABLE) {
448
    STag* pTag = (STag*)pMetaReader->me.ctbEntry.pTags;
H
Haojun Liao 已提交
449 450 451 452 453 454 455
    pVal->pTags = taosMemoryMalloc(pTag->len);
    memcpy(pVal->pTags, pTag, pTag->len);
  }

  return pVal;
}

456 457
// Deleter callback passed to taosLRUCacheInsert for table meta entries; signature:
// (const void *key, size_t keyLen, void *value). Only the value is released, the key is not touched.
static void freeCachedMetaItem(const void* key, size_t keyLen, void* value) {
  (void)key;
  (void)keyLen;
  freeTableCachedVal(value);
}
458

459 460 461 462 463
// Set rows [0, pBlock->info.rows) to NULL in the destination column of each of the numOfExpr expressions.
static void doSetNullValue(SSDataBlock* pBlock, const SExprInfo* pExpr, int32_t numOfExpr) {
  int32_t idx = 0;
  while (idx < numOfExpr) {
    int32_t          slotId = pExpr[idx].base.resSchema.slotId;
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, slotId);

    colDataSetNNULL(pCol, 0, pBlock->info.rows);
    ++idx;
  }
}

468 469
int32_t addTagPseudoColumnData(SReadHandle* pHandle, const SExprInfo* pExpr, int32_t numOfExpr, SSDataBlock* pBlock,
                               int32_t rows, const char* idStr, STableMetaCacheInfo* pCache) {
470
  // currently only the tbname pseudo column
471
  if (numOfExpr <= 0) {
H
Haojun Liao 已提交
472
    return TSDB_CODE_SUCCESS;
473 474
  }

475 476
  int32_t code = 0;

477 478 479 480
  // backup the rows
  int32_t backupRows = pBlock->info.rows;
  pBlock->info.rows = rows;

481
  bool            freeReader = false;
482
  STableCachedVal val = {0};
483 484

  SMetaReader mr = {0};
485
  LRUHandle*  h = NULL;
486

487 488 489
  // todo refactor: extract method
  // the handling of the null data should be packed in the extracted method

490
  // 1. check if it is existed in meta cache
491
  if (pCache == NULL) {
492
    metaReaderInit(&mr, pHandle->meta, 0);
H
Haojun Liao 已提交
493
    code = metaGetTableEntryByUidCache(&mr, pBlock->info.id.uid);
494
    if (code != TSDB_CODE_SUCCESS) {
495
      // when encounter the TSDB_CODE_PAR_TABLE_NOT_EXIST error, we proceed.
H
Haojun Liao 已提交
496
      if (terrno == TSDB_CODE_PAR_TABLE_NOT_EXIST) {
S
slzhou 已提交
497 498
        qWarn("failed to get table meta, table may have been dropped, uid:0x%" PRIx64 ", code:%s, %s",
              pBlock->info.id.uid, tstrerror(terrno), idStr);
499 500 501

        // append null value before return to caller, since the caller will ignore this error code and proceed
        doSetNullValue(pBlock, pExpr, numOfExpr);
H
Haojun Liao 已提交
502
      } else {
S
slzhou 已提交
503 504
        qError("failed to get table meta, uid:0x%" PRIx64 ", code:%s, %s", pBlock->info.id.uid, tstrerror(terrno),
               idStr);
H
Haojun Liao 已提交
505
      }
506 507 508 509 510
      metaReaderClear(&mr);
      return terrno;
    }

    metaReaderReleaseLock(&mr);
511

512 513
    val.pName = mr.me.name;
    val.pTags = (STag*)mr.me.ctbEntry.pTags;
514 515

    freeReader = true;
516
  } else {
517 518
    pCache->metaFetch += 1;

H
Haojun Liao 已提交
519
    h = taosLRUCacheLookup(pCache->pTableMetaEntryCache, &pBlock->info.id.uid, sizeof(pBlock->info.id.uid));
520 521
    if (h == NULL) {
      metaReaderInit(&mr, pHandle->meta, 0);
H
Haojun Liao 已提交
522
      code = metaGetTableEntryByUidCache(&mr, pBlock->info.id.uid);
523
      if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
524
        if (terrno == TSDB_CODE_PAR_TABLE_NOT_EXIST) {
525
          qWarn("failed to get table meta, table may have been dropped, uid:0x%" PRIx64 ", code:%s, %s",
H
Haojun Liao 已提交
526
                pBlock->info.id.uid, tstrerror(terrno), idStr);
527 528
          // append null value before return to caller, since the caller will ignore this error code and proceed
          doSetNullValue(pBlock, pExpr, numOfExpr);
H
Haojun Liao 已提交
529
        } else {
H
Haojun Liao 已提交
530
          qError("failed to get table meta, uid:0x%" PRIx64 ", code:%s, %s", pBlock->info.id.uid, tstrerror(terrno),
531
                 idStr);
H
Haojun Liao 已提交
532
        }
533 534 535 536 537 538
        metaReaderClear(&mr);
        return terrno;
      }

      metaReaderReleaseLock(&mr);

H
Haojun Liao 已提交
539
      STableCachedVal* pVal = createTableCacheVal(&mr);
540

H
Haojun Liao 已提交
541
      val = *pVal;
542
      freeReader = true;
H
Haojun Liao 已提交
543

H
Haojun Liao 已提交
544
      int32_t ret = taosLRUCacheInsert(pCache->pTableMetaEntryCache, &pBlock->info.id.uid, sizeof(uint64_t), pVal,
545
                                       sizeof(STableCachedVal), freeCachedMetaItem, NULL, TAOS_LRU_PRIORITY_LOW);
546 547 548 549 550 551 552 553
      if (ret != TAOS_LRU_STATUS_OK) {
        qError("failed to put meta into lru cache, code:%d, %s", ret, idStr);
        freeTableCachedVal(pVal);
      }
    } else {
      pCache->cacheHit += 1;
      STableCachedVal* pVal = taosLRUCacheValue(pCache->pTableMetaEntryCache, h);
      val = *pVal;
H
Haojun Liao 已提交
554

H
Haojun Liao 已提交
555
      taosLRUCacheRelease(pCache->pTableMetaEntryCache, h, false);
556
    }
H
Haojun Liao 已提交
557

558 559
    qDebug("retrieve table meta from cache:%" PRIu64 ", hit:%" PRIu64 " miss:%" PRIu64 ", %s", pCache->metaFetch,
           pCache->cacheHit, (pCache->metaFetch - pCache->cacheHit), idStr);
H
Haojun Liao 已提交
560
  }
561

562 563
  for (int32_t j = 0; j < numOfExpr; ++j) {
    const SExprInfo* pExpr1 = &pExpr[j];
564
    int32_t          dstSlotId = pExpr1->base.resSchema.slotId;
565 566

    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, dstSlotId);
D
dapan1121 已提交
567
    colInfoDataCleanup(pColInfoData, pBlock->info.rows);
568

569
    int32_t functionId = pExpr1->pExpr->_function.functionId;
570 571 572

    // this is to handle the tbname
    if (fmIsScanPseudoColumnFunc(functionId)) {
573
      setTbNameColData(pBlock, pColInfoData, functionId, val.pName);
574
    } else {  // these are tags
wmmhello's avatar
wmmhello 已提交
575
      STagVal tagVal = {0};
576 577
      tagVal.cid = pExpr1->base.pParam[0].pCol->colId;
      const char* p = metaGetTableTagVal(val.pTags, pColInfoData->info.type, &tagVal);
wmmhello's avatar
wmmhello 已提交
578

579 580 581 582
      char* data = NULL;
      if (pColInfoData->info.type != TSDB_DATA_TYPE_JSON && p != NULL) {
        data = tTagValToData((const STagVal*)p, false);
      } else {
wmmhello's avatar
wmmhello 已提交
583
        data = (char*)p;
wmmhello's avatar
wmmhello 已提交
584
      }
585

H
Haojun Liao 已提交
586 587
      bool isNullVal = (data == NULL) || (pColInfoData->info.type == TSDB_DATA_TYPE_JSON && tTagIsJsonNull(data));
      if (isNullVal) {
588
        colDataSetNNULL(pColInfoData, 0, pBlock->info.rows);
H
Haojun Liao 已提交
589
      } else if (pColInfoData->info.type != TSDB_DATA_TYPE_JSON) {
590
        colDataSetNItems(pColInfoData, 0, data, pBlock->info.rows);
H
Haojun Liao 已提交
591 592 593
        if (IS_VAR_DATA_TYPE(((const STagVal*)p)->type)) {
          taosMemoryFree(data);
        }
L
Liu Jicong 已提交
594
      } else {  // todo opt for json tag
H
Haojun Liao 已提交
595
        for (int32_t i = 0; i < pBlock->info.rows; ++i) {
596
          colDataSetVal(pColInfoData, i, data, false);
H
Haojun Liao 已提交
597
        }
598 599 600 601
      }
    }
  }

602 603
  // restore the rows
  pBlock->info.rows = backupRows;
604 605 606 607
  if (freeReader) {
    metaReaderClear(&mr);
  }

H
Haojun Liao 已提交
608
  return TSDB_CODE_SUCCESS;
609 610
}

H
Haojun Liao 已提交
611
/*
 * Fill pColInfoData with the table name by running the scalar implementation of `functionId`.
 *
 * The name is wrapped into a one-row VARCHAR column and handed to the function as its only input, with
 * numOfRows taken from pBlock->info.rows; pColInfoData is the output column. When no scalar implementation
 * is registered for functionId an error is logged and the output column is not written.
 */
void setTbNameColData(const SSDataBlock* pBlock, SColumnInfoData* pColInfoData, int32_t functionId, const char* name) {
  struct SScalarFuncExecFuncs execFuncs = {0};
  fmGetScalarFuncExecFuncs(functionId, &execFuncs);

  // the table name in var-string layout
  char   nameBuf[TSDB_TABLE_FNAME_LEN + VARSTR_HEADER_SIZE] = {0};
  size_t bytes = TSDB_TABLE_FNAME_LEN + VARSTR_HEADER_SIZE;
  STR_TO_VARSTR(nameBuf, name)

  // temporary single-row input column holding the name
  SColumnInfoData nameCol = createColumnInfoData(TSDB_DATA_TYPE_VARCHAR, bytes, 1);
  colInfoDataEnsureCapacity(&nameCol, 1, false);
  colDataSetVal(&nameCol, 0, nameBuf, false);

  SScalarParam input = {.numOfRows = pBlock->info.rows, .columnData = &nameCol};
  SScalarParam output = {.columnData = pColInfoData};

  if (execFuncs.process == NULL) {
    qError("failed to get the corresponding callback function, functionId:%d", functionId);
  } else {
    execFuncs.process(&input, 1, &output);
  }

  colDataDestroy(&nameCol);
}

636
/*
 * Pull blocks from the reader until one survives loadDataBlock, and return it.
 *
 * For the returned block the operator's row count and cost are refreshed from the read recorder, and the
 * task's stream status (type, uid, ts) is set to the block's uid and window end.
 *
 * @return the operator's result block, or NULL when the reader has no more blocks or the operator has been
 *         marked done. A killed task or a load error long-jumps out through pTaskInfo->env instead.
 */
static SSDataBlock* doTableScanImpl(SOperatorInfo* pOperator) {
  STableScanInfo* pScan = pOperator->info;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
  SSDataBlock*    pResBlock = pScan->pResBlock;

  int64_t startUs = taosGetTimestampUs();

  while (tsdbNextDataBlock(pScan->base.dataReader)) {
    if (isTaskKilled(pTaskInfo)) {
      tsdbReleaseDataBlock(pScan->base.dataReader);
      T_LONG_JMP(pTaskInfo->env, pTaskInfo->code);
    }

    if (pOperator->status == OP_EXEC_DONE) {
      tsdbReleaseDataBlock(pScan->base.dataReader);
      return NULL;
    }

    // process this data block based on the probabilities
    if (!processBlockWithProbability(&pScan->sample)) {
      continue;
    }

    if (pResBlock->info.id.uid) {
      pResBlock->info.id.groupId = getTableGroupId(pTaskInfo->pTableInfoList, pResBlock->info.id.uid);
    }

    uint32_t loadStatus = 0;
    int32_t  code = loadDataBlock(pOperator, &pScan->base, pResBlock, &loadStatus);
    if (code != TSDB_CODE_SUCCESS) {
      T_LONG_JMP(pTaskInfo->env, code);
    }

    // current block is filter out according to filter condition, continue load the next block
    bool discarded = (loadStatus == FUNC_DATA_REQUIRED_FILTEROUT) || (pResBlock->info.rows == 0);
    if (discarded) {
      continue;
    }

    pOperator->resultInfo.totalRows = pScan->base.readRecorder.totalRows;
    pScan->base.readRecorder.elapsedTime += (taosGetTimestampUs() - startUs) / 1000.0;

    pOperator->cost.totalCost = pScan->base.readRecorder.elapsedTime;

    // todo refactor
    pTaskInfo->streamInfo.lastStatus.type = TMQ_OFFSET__SNAPSHOT_DATA;
    pTaskInfo->streamInfo.lastStatus.uid = pResBlock->info.id.uid;
    pTaskInfo->streamInfo.lastStatus.ts = pResBlock->info.window.ekey;

    return pResBlock;
  }

  return NULL;
}

H
Haojun Liao 已提交
692
/*
 * Produce the next block for the tables currently attached to the reader, running the configured number of
 * ascending passes (scanInfo.numOfAsc) followed by the descending passes (scanInfo.numOfDesc).
 *
 * Whenever a pass is exhausted and another pass of the same direction follows, the task status and scan flag
 * are reset and the reader is rewound. Before the first descending pass the scan state is switched to
 * descending order.
 *
 * @return the next block, or NULL when there is no reader, the operator is done, or all passes are finished
 */
static SSDataBlock* doGroupedTableScan(SOperatorInfo* pOperator) {
  STableScanInfo* pScan = pOperator->info;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;

  // The read handle is not initialized yet, since no qualified tables exists
  if (pScan->base.dataReader == NULL || pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  // do the ascending order traverse in the first place.
  while (pScan->scanTimes < pScan->scanInfo.numOfAsc) {
    SSDataBlock* pRes = doTableScanImpl(pOperator);
    if (pRes != NULL) {
      return pRes;
    }

    pScan->scanTimes += 1;
    if (pScan->scanTimes >= pScan->scanInfo.numOfAsc) {
      break;  // that was the last ascending pass
    }

    setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);
    pScan->base.scanFlag = MAIN_SCAN;
    pScan->base.dataBlockLoadFlag = FUNC_DATA_REQUIRED_DATA_LOAD;
    qDebug("start to repeat ascending order scan data blocks due to query func required, %s", GET_TASKID(pTaskInfo));

    // do prepare for the next round table scan operation
    tsdbReaderReset(pScan->base.dataReader, &pScan->base.cond);
  }

  int32_t total = pScan->scanInfo.numOfAsc + pScan->scanInfo.numOfDesc;
  if (pScan->scanTimes >= total) {
    return NULL;
  }

  // first descending pass: turn the scan around and rewind the reader
  if (pScan->base.cond.order == TSDB_ORDER_ASC) {
    prepareForDescendingScan(&pScan->base, pOperator->exprSupp.pCtx, 0);
    tsdbReaderReset(pScan->base.dataReader, &pScan->base.cond);
    qDebug("%s start to descending order scan data blocks due to query func required", GET_TASKID(pTaskInfo));
  }

  while (pScan->scanTimes < total) {
    SSDataBlock* pRes = doTableScanImpl(pOperator);
    if (pRes != NULL) {
      return pRes;
    }

    pScan->scanTimes += 1;
    if (pScan->scanTimes >= total) {
      break;  // that was the last descending pass
    }

    setTaskStatus(pTaskInfo, TASK_NOT_COMPLETED);
    pScan->base.scanFlag = MAIN_SCAN;

    qDebug("%s start to repeat descending order scan data blocks", GET_TASKID(pTaskInfo));
    tsdbReaderReset(pScan->base.dataReader, &pScan->base.cond);
  }

  return NULL;
}

// Produce the next data block of the table scan operator, or NULL when nothing more can be returned.
//
// Two modes are supported, selected by pInfo->scanMode:
//  - TABLE_SCAN__TABLE_ORDER: tables are scanned one at a time; when the current table yields no
//    block the reader is re-targeted at the next table of the task's table list.
//  - otherwise: tables are scanned group by group. The reader is opened lazily for the first group
//    (currentGroupId == -1) and re-targeted for every following group.
//
// In group mode an empty group must not terminate the scan: the loop keeps advancing until a group
// yields a block, the operator reports OP_EXEC_DONE, or the groups are exhausted (in which case the
// operator is marked completed).
static SSDataBlock* doTableScan(SOperatorInfo* pOperator) {
  STableScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;

  // scan table one by one sequentially
  if (pInfo->scanMode == TABLE_SCAN__TABLE_ORDER) {
    int32_t numOfTables = tableListGetSize(pTaskInfo->pTableInfoList);

    while (1) {
      SSDataBlock* result = doGroupedTableScan(pOperator);
      if (result || (pOperator->status == OP_EXEC_DONE)) {
        return result;
      }

      // if no data, switch to next table and continue scan
      pInfo->currentTable++;
      if (pInfo->currentTable >= numOfTables) {
        return NULL;
      }

      STableKeyInfo* pTableInfo = tableListGetInfo(pTaskInfo->pTableInfoList, pInfo->currentTable);
      tsdbSetTableList(pInfo->base.dataReader, pTableInfo, 1);
      qDebug("set uid:%" PRIu64 " into scanner, total tables:%d, index:%d %s", pTableInfo->uid, numOfTables,
             pInfo->currentTable, pTaskInfo->id.str);

      tsdbReaderReset(pInfo->base.dataReader, &pInfo->base.cond);
      pInfo->scanTimes = 0;
    }
  }

  // scan table group by group sequentially
  if (pInfo->currentGroupId == -1) {
    if ((++pInfo->currentGroupId) >= tableListGetOutputGroups(pTaskInfo->pTableInfoList)) {
      setOperatorCompleted(pOperator);
      return NULL;
    }

    int32_t        num = 0;
    STableKeyInfo* pList = NULL;
    tableListGetGroupList(pTaskInfo->pTableInfoList, pInfo->currentGroupId, &pList, &num);
    ASSERT(pInfo->base.dataReader == NULL);

    int32_t code = tsdbReaderOpen(pInfo->base.readHandle.vnode, &pInfo->base.cond, pList, num, pInfo->pResBlock,
                                  (STsdbReader**)&pInfo->base.dataReader, GET_TASKID(pTaskInfo), pInfo->countOnly);
    if (code != TSDB_CODE_SUCCESS) {
      T_LONG_JMP(pTaskInfo->env, code);
    }

    // the reader may have enlarged the result block; keep the operator's capacity in sync
    if (pInfo->pResBlock->info.capacity > pOperator->resultInfo.capacity) {
      pOperator->resultInfo.capacity = pInfo->pResBlock->info.capacity;
    }
  }

  SSDataBlock* result = doGroupedTableScan(pOperator);
  if (result != NULL) {
    return result;
  }

  // The current group is exhausted: walk the remaining groups until one of them yields data.
  while (1) {
    if ((++pInfo->currentGroupId) >= tableListGetOutputGroups(pTaskInfo->pTableInfoList)) {
      setOperatorCompleted(pOperator);
      return NULL;
    }

    // reset value for the next group data output
    pOperator->status = OP_OPENED;
    resetLimitInfoForNextGroup(&pInfo->base.limitInfo);

    int32_t        num = 0;
    STableKeyInfo* pList = NULL;
    tableListGetGroupList(pTaskInfo->pTableInfoList, pInfo->currentGroupId, &pList, &num);

    tsdbSetTableList(pInfo->base.dataReader, pList, num);
    tsdbReaderReset(pInfo->base.dataReader, &pInfo->base.cond);
    pInfo->scanTimes = 0;

    result = doGroupedTableScan(pOperator);
    if (result != NULL || pOperator->status == OP_EXEC_DONE) {
      return result;
    }
  }
}

833 834
static int32_t getTableScannerExecInfo(struct SOperatorInfo* pOptr, void** pOptrExplain, uint32_t* len) {
  SFileBlockLoadRecorder* pRecorder = taosMemoryCalloc(1, sizeof(SFileBlockLoadRecorder));
835
  STableScanInfo*         pTableScanInfo = pOptr->info;
H
Haojun Liao 已提交
836
  *pRecorder = pTableScanInfo->base.readRecorder;
837 838 839 840 841
  *pOptrExplain = pRecorder;
  *len = sizeof(SFileBlockLoadRecorder);
  return 0;
}

842
static void destroyTableScanOperatorInfo(void* param) {
843
  STableScanInfo* pTableScanInfo = (STableScanInfo*)param;
H
Haojun Liao 已提交
844
  blockDataDestroy(pTableScanInfo->pResBlock);
H
Haojun Liao 已提交
845
  cleanupQueryTableDataCond(&pTableScanInfo->base.cond);
H
Haojun Liao 已提交
846

H
Haojun Liao 已提交
847 848
  tsdbReaderClose(pTableScanInfo->base.dataReader);
  pTableScanInfo->base.dataReader = NULL;
849

H
Haojun Liao 已提交
850 851
  if (pTableScanInfo->base.matchInfo.pList != NULL) {
    taosArrayDestroy(pTableScanInfo->base.matchInfo.pList);
852
  }
L
Liu Jicong 已提交
853

H
Haojun Liao 已提交
854 855
  taosLRUCacheCleanup(pTableScanInfo->base.metaCache.pTableMetaEntryCache);
  cleanupExprSupp(&pTableScanInfo->base.pseudoSup);
D
dapan1121 已提交
856
  taosMemoryFreeClear(param);
857 858
}

859
SOperatorInfo* createTableScanOperatorInfo(STableScanPhysiNode* pTableScanNode, SReadHandle* readHandle,
860
                                           SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
861 862 863
  STableScanInfo* pInfo = taosMemoryCalloc(1, sizeof(STableScanInfo));
  SOperatorInfo*  pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
864
    goto _error;
H
Haojun Liao 已提交
865 866
  }

867
  SScanPhysiNode*     pScanNode = &pTableScanNode->scan;
H
Haojun Liao 已提交
868
  SDataBlockDescNode* pDescNode = pScanNode->node.pOutputDataBlockDesc;
869 870

  int32_t numOfCols = 0;
871
  int32_t code =
H
Haojun Liao 已提交
872
      extractColMatchInfo(pScanNode->pScanCols, pDescNode, &numOfCols, COL_MATCH_FROM_COL_ID, &pInfo->base.matchInfo);
873 874 875 876
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

H
Haojun Liao 已提交
877
  initLimitInfo(pScanNode->node.pLimit, pScanNode->node.pSlimit, &pInfo->base.limitInfo);
H
Haojun Liao 已提交
878
  code = initQueryTableDataCond(&pInfo->base.cond, pTableScanNode);
879
  if (code != TSDB_CODE_SUCCESS) {
880
    goto _error;
881 882
  }

H
Haojun Liao 已提交
883
  if (pScanNode->pScanPseudoCols != NULL) {
H
Haojun Liao 已提交
884
    SExprSupp* pSup = &pInfo->base.pseudoSup;
H
Haojun Liao 已提交
885
    pSup->pExprInfo = createExprInfo(pScanNode->pScanPseudoCols, NULL, &pSup->numOfExprs);
886
    pSup->pCtx = createSqlFunctionCtx(pSup->pExprInfo, pSup->numOfExprs, &pSup->rowEntryInfoOffset);
887 888
  }

889
  pInfo->scanInfo = (SScanInfo){.numOfAsc = pTableScanNode->scanSeq[0], .numOfDesc = pTableScanNode->scanSeq[1]};
G
Ganlin Zhao 已提交
890
  pInfo->base.scanFlag = (pInfo->scanInfo.numOfAsc > 1) ? PRE_SCAN : MAIN_SCAN;
H
Haojun Liao 已提交
891

H
Haojun Liao 已提交
892 893
  pInfo->base.pdInfo.interval = extractIntervalInfo(pTableScanNode);
  pInfo->base.readHandle = *readHandle;
H
Haojun Liao 已提交
894 895
  pInfo->base.dataBlockLoadFlag = pTableScanNode->dataRequired;

896 897
  pInfo->sample.sampleRatio = pTableScanNode->ratio;
  pInfo->sample.seed = taosGetTimestampSec();
898

H
Haojun Liao 已提交
899
  initResultSizeInfo(&pOperator->resultInfo, 4096);
H
Haojun Liao 已提交
900
  pInfo->pResBlock = createDataBlockFromDescNode(pDescNode);
X
Xiaoyu Wang 已提交
901
  //  blockDataEnsureCapacity(pInfo->pResBlock, pOperator->resultInfo.capacity);
H
Haojun Liao 已提交
902

H
Haojun Liao 已提交
903 904 905
  code = filterInitFromNode((SNode*)pTableScanNode->scan.node.pConditions, &pOperator->exprSupp.pFilterInfo, 0);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
H
Haojun Liao 已提交
906 907
  }

wmmhello's avatar
wmmhello 已提交
908
  pInfo->currentGroupId = -1;
909
  pInfo->assignBlockUid = pTableScanNode->assignBlockUid;
910
  pInfo->hasGroupByTag = pTableScanNode->pGroupTags ? true : false;
911

L
Liu Jicong 已提交
912 913
  setOperatorInfo(pOperator, "TableScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN, false, OP_NOT_OPENED, pInfo,
                  pTaskInfo);
914
  pOperator->exprSupp.numOfExprs = numOfCols;
915

H
Haojun Liao 已提交
916 917
  pInfo->base.metaCache.pTableMetaEntryCache = taosLRUCacheInit(1024 * 128, -1, .5);
  if (pInfo->base.metaCache.pTableMetaEntryCache == NULL) {
918 919 920
    code = terrno;
    goto _error;
  }
921

D
dapan1121 已提交
922 923 924 925
  if (scanDebug) {
    pInfo->countOnly = true;
  }

H
Haojun Liao 已提交
926
  taosLRUCacheSetStrictCapacity(pInfo->base.metaCache.pTableMetaEntryCache, false);
927 928
  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, doTableScan, NULL, destroyTableScanOperatorInfo,
                                         optrDefaultBufFn, getTableScannerExecInfo);
929 930 931

  // for non-blocking operator, the open cost is always 0
  pOperator->cost.openCost = 0;
H
Haojun Liao 已提交
932
  return pOperator;
933

934
_error:
935 936 937
  if (pInfo != NULL) {
    destroyTableScanOperatorInfo(pInfo);
  }
938

939 940
  taosMemoryFreeClear(pOperator);
  pTaskInfo->code = code;
941
  return NULL;
H
Haojun Liao 已提交
942 943
}

944
// Build a sequential table scan operator around an already opened reader.
//
// pReadHandle  reader handle stored as the scan's data reader
// pTaskInfo    owning task; receives TSDB_CODE_OUT_OF_MEMORY in `code` when allocation fails
//
// Returns the new operator, or NULL when memory cannot be allocated.
SOperatorInfo* createTableSeqScanOperatorInfo(void* pReadHandle, SExecTaskInfo* pTaskInfo) {
  STableScanInfo* pInfo = taosMemoryCalloc(1, sizeof(STableScanInfo));
  SOperatorInfo*  pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    // either allocation may have succeeded; release whichever did
    taosMemoryFreeClear(pInfo);
    taosMemoryFreeClear(pOperator);
    pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pInfo->base.dataReader = pReadHandle;
  //  pInfo->prevGroupId       = -1;

  setOperatorInfo(pOperator, "TableSeqScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_SEQ_SCAN, false, OP_NOT_OPENED,
                  pInfo, pTaskInfo);
  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, doTableScanImpl, NULL, NULL, optrDefaultBufFn, NULL);
  return pOperator;
}

957
// Drop every buffered block of the stream scan and rewind the read cursor to the first slot.
FORCE_INLINE void doClearBufferedBlocks(SStreamScanInfo* pInfo) {
  int32_t numOfBuffered = (int32_t)taosArrayGetSize(pInfo->pBlockLists);
  qDebug("clear buff blocks:%d", numOfBuffered);

  taosArrayClear(pInfo->pBlockLists);
  pInfo->validBlockIndex = 0;
}

963
// True when the parent of this stream scan is a stream session window operator.
static bool isSessionWindow(SStreamScanInfo* pInfo) {
  bool parentIsSession = (QUERY_NODE_PHYSICAL_PLAN_STREAM_SESSION == pInfo->windowSup.parentType);
  return parentIsSession;
}

967
// True when the parent of this stream scan is a stream state window operator.
static bool isStateWindow(SStreamScanInfo* pInfo) {
  bool parentIsState = (QUERY_NODE_PHYSICAL_PLAN_STREAM_STATE == pInfo->windowSup.parentType);
  return parentIsState;
}
5
54liuyao 已提交
970

L
Liu Jicong 已提交
971
// True when the parent of this stream scan is any flavour of stream interval operator
// (plain, semi or final).
static bool isIntervalWindow(SStreamScanInfo* pInfo) {
  switch (pInfo->windowSup.parentType) {
    case QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL:
    case QUERY_NODE_PHYSICAL_PLAN_STREAM_SEMI_INTERVAL:
    case QUERY_NODE_PHYSICAL_PLAN_STREAM_FINAL_INTERVAL:
      return true;
    default:
      return false;
  }
}

// True only when the parent of this stream scan is the plain (single) stream interval operator.
static bool isSignleIntervalWindow(SStreamScanInfo* pInfo) {
  bool parentIsInterval = (QUERY_NODE_PHYSICAL_PLAN_STREAM_INTERVAL == pInfo->windowSup.parentType);
  return parentIsInterval;
}

981 982 983 984
// True when the parent is an interval operator whose sliding step differs from its interval length.
static bool isSlidingWindow(SStreamScanInfo* pInfo) {
  if (!isIntervalWindow(pInfo)) {
    return false;
  }

  return pInfo->interval.sliding != pInfo->interval.interval;
}

985
// Copy the group id found at (groupColIndex, rowIndex) of pBlock into pInfo->groupId.
// The column payload is read as an array of uint64_t.
static void setGroupId(SStreamScanInfo* pInfo, SSDataBlock* pBlock, int32_t groupColIndex, int32_t rowIndex) {
  SColumnInfoData* pGroupColumn = taosArrayGet(pBlock->pDataBlock, groupColIndex);
  const uint64_t*  groupIds = (uint64_t*)pGroupColumn->pData;

  ASSERT(rowIndex < pBlock->info.rows);
  pInfo->groupId = groupIds[rowIndex];
}

L
Liu Jicong 已提交
992
// Re-arm a table scan for a new time window: install the window into the query condition, reset the
// scan counters so the next scan starts from the first group, and close the current reader (the
// handle is cleared so it is no longer referenced after being closed).
void resetTableScanInfo(STableScanInfo* pTableScanInfo, STimeWindow* pWin) {
  STableScanInfo* pScan = pTableScanInfo;

  pScan->base.cond.twindows = *pWin;
  pScan->scanTimes = 0;
  pScan->currentGroupId = -1;

  tsdbReaderClose(pScan->base.dataReader);
  qDebug("1");
  pScan->base.dataReader = NULL;
}

L
Liu Jicong 已提交
1001 1002
// Read the rows of one table inside [startTs, endTs] as they were at version <= maxVersion.
//
// A temporary reader is opened with a copy of the table scan's query condition (version range and
// time window overridden) and closed before returning. Data is loaded into the table scan's own
// result block.
//
// Returns that result block when it holds at least one row, NULL otherwise. A reader open failure
// long-jumps out through the task's env.
static SSDataBlock* readPreVersionData(SOperatorInfo* pTableScanOp, uint64_t tbUid, TSKEY startTs, TSKEY endTs,
                                       int64_t maxVersion) {
  STableScanInfo* pScanInfo = pTableScanOp->info;
  SExecTaskInfo*  pTaskInfo = pTableScanOp->pTaskInfo;
  SSDataBlock*    pBlock = pScanInfo->pResBlock;

  // the single table to read
  STableKeyInfo tblInfo = {.uid = tbUid, .groupId = 0};

  // private copy of the scan condition, narrowed to the requested version and time range
  SQueryTableDataCond cond = pScanInfo->base.cond;
  cond.startVersion = -1;
  cond.endVersion = maxVersion;
  cond.twindows = (STimeWindow){.skey = startTs, .ekey = endTs};

  STsdbReader* pReader = NULL;
  int32_t      code = tsdbReaderOpen(pScanInfo->base.readHandle.vnode, &cond, &tblInfo, 1, pBlock,
                                     (STsdbReader**)&pReader, GET_TASKID(pTaskInfo), false);
  if (TSDB_CODE_SUCCESS != code) {
    terrno = code;
    T_LONG_JMP(pTaskInfo->env, code);
    return NULL;
  }

  if (tsdbNextDataBlock(pReader)) {
    /*SSDataBlock* p = */ tsdbRetrieveDataBlock(pReader, NULL);
    doSetTagColumnData(&pScanInfo->base, pBlock, pTaskInfo, pBlock->info.rows);
    pBlock->info.id.groupId = getTableGroupId(pTaskInfo->pTableInfoList, pBlock->info.id.uid);
  }

  tsdbReaderClose(pReader);
  qDebug("retrieve prev rows:%d, skey:%" PRId64 ", ekey:%" PRId64 " uid:%" PRIu64 ", max ver:%" PRId64
         ", suid:%" PRIu64,
         pBlock->info.rows, startTs, endTs, tbUid, maxVersion, cond.suid);

  if (pBlock->info.rows > 0) {
    return pBlock;
  }
  return NULL;
}

// Compute the group id of the row identified by (uid, ts) from its column data as of maxVersion.
// Returns 0 when no such row exists in the previous version.
static uint64_t getGroupIdByCol(SStreamScanInfo* pInfo, uint64_t uid, TSKEY ts, int64_t maxVersion) {
  SSDataBlock* pPrevRow = readPreVersionData(pInfo->pTableScanOp, uid, ts, ts, maxVersion);
  if (pPrevRow == NULL || pPrevRow->info.rows == 0) {
    return 0;
  }

  // a single timestamp is expected to match exactly one row
  ASSERT(pPrevRow->info.rows == 1);
  return calGroupIdByData(&pInfo->partitionSup, pInfo->pPartScalarSup, pPrevRow, 0);
}

5
54liuyao 已提交
1047
// Look up the group id of table `uid` in the table list of the underlying table scan's task.
static uint64_t getGroupIdByUid(SStreamScanInfo* pInfo, uint64_t uid) {
  SExecTaskInfo* pScanTask = pInfo->pTableScanOp->pTaskInfo;
  return getTableGroupId(pScanTask->pTableInfoList, uid);
}

5
54liuyao 已提交
1051 1052 1053 1054 1055 1056 1057 1058
// Resolve the group id of a row: computed from column data when the partition needs calculation,
// otherwise taken from the table list by uid.
static uint64_t getGroupIdByData(SStreamScanInfo* pInfo, uint64_t uid, TSKEY ts, int64_t maxVersion) {
  if (!pInfo->partitionSup.needCalc) {
    return getGroupIdByUid(pInfo, uid);
  }

  return getGroupIdByCol(pInfo, uid, ts, maxVersion);
}

L
Liu Jicong 已提交
1059
// Set up the table scan for the next range described by pBlock, starting at row *pRowIndex.
//
// The row at *pRowIndex seeds a time window and a group id; following rows of the same group that
// share the window's start key (or whose end key equals it) are folded into the window. *pRowIndex
// is advanced past every consumed row. The table scan is then reset to that window and re-opened.
//
// Returns false when the block is empty or fully consumed, true when a new range was prepared.
static bool prepareRangeScan(SStreamScanInfo* pInfo, SSDataBlock* pBlock, int32_t* pRowIndex) {
  if (pBlock->info.rows == 0 || (*pRowIndex) == pBlock->info.rows) {
    return false;
  }

  ASSERT(taosArrayGetSize(pBlock->pDataBlock) >= 3);

  SColumnInfoData* pStartTsCol = taosArrayGet(pBlock->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pEndTsCol = taosArrayGet(pBlock->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pGpCol = taosArrayGet(pBlock->pDataBlock, GROUPID_COLUMN_INDEX);
  SColumnInfoData* pCalStartTsCol = taosArrayGet(pBlock->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX);
  SColumnInfoData* pCalEndTsCol = taosArrayGet(pBlock->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX);

  TSKEY*    startData = (TSKEY*)pStartTsCol->pData;
  TSKEY*    endData = (TSKEY*)pEndTsCol->pData;
  uint64_t* gpData = (uint64_t*)pGpCol->pData;
  TSKEY*    calStartData = (TSKEY*)pCalStartTsCol->pData;
  TSKEY*    calEndData = (TSKEY*)pCalEndTsCol->pData;

  // the seed row defines the initial window and the group being scanned
  int32_t     idx = *pRowIndex;
  STimeWindow win = {.skey = startData[idx], .ekey = endData[idx]};
  uint64_t    groupId = gpData[idx];

  setGroupId(pInfo, pBlock, GROUPID_COLUMN_INDEX, idx);
  if (isSlidingWindow(pInfo)) {
    pInfo->updateWin.skey = calStartData[idx];
    pInfo->updateWin.ekey = calEndData[idx];
  }

  // fold the following rows of the same group into the window while they stay adjacent to it
  for (idx += 1; idx < pBlock->info.rows; idx++) {
    bool sameGroup = (groupId == gpData[idx]);

    if (sameGroup && win.skey == startData[idx]) {
      win.ekey = TMAX(win.ekey, endData[idx]);
      continue;
    }

    if (sameGroup && win.skey == endData[idx]) {
      win.skey = TMIN(win.skey, startData[idx]);
      continue;
    }

    ASSERT(!(win.skey > startData[idx] && win.ekey < endData[idx]) ||
           !(isInTimeWindow(&win, startData[idx], 0) || isInTimeWindow(&win, endData[idx], 0)));
    break;
  }
  *pRowIndex = idx;

  resetTableScanInfo(pInfo->pTableScanOp->info, &win);
  pInfo->pTableScanOp->status = OP_OPENED;
  return true;
}

5
54liuyao 已提交
1108
static STimeWindow getSlidingWindow(TSKEY* startTsCol, TSKEY* endTsCol, uint64_t* gpIdCol, SInterval* pInterval,
1109
                                    SDataBlockInfo* pDataBlockInfo, int32_t* pRowIndex, bool hasGroup) {
H
Haojun Liao 已提交
1110
  SResultRowInfo dumyInfo = {0};
5
54liuyao 已提交
1111
  dumyInfo.cur.pageId = -1;
1112
  STimeWindow win = getActiveTimeWindow(NULL, &dumyInfo, startTsCol[*pRowIndex], pInterval, TSDB_ORDER_ASC);
5
54liuyao 已提交
1113 1114
  STimeWindow endWin = win;
  STimeWindow preWin = win;
5
54liuyao 已提交
1115
  uint64_t    groupId = gpIdCol[*pRowIndex];
H
Haojun Liao 已提交
1116

5
54liuyao 已提交
1117
  while (1) {
1118 1119 1120
    if (hasGroup) {
      (*pRowIndex) += 1;
    } else {
5
54liuyao 已提交
1121
      while ((groupId == gpIdCol[(*pRowIndex)] && startTsCol[*pRowIndex] <= endWin.ekey)) {
5
54liuyao 已提交
1122 1123 1124 1125 1126
        (*pRowIndex) += 1;
        if ((*pRowIndex) == pDataBlockInfo->rows) {
          break;
        }
      }
1127
    }
5
54liuyao 已提交
1128

5
54liuyao 已提交
1129 1130 1131
    do {
      preWin = endWin;
      getNextTimeWindow(pInterval, &endWin, TSDB_ORDER_ASC);
1132
    } while (endTsCol[(*pRowIndex) - 1] >= endWin.skey);
5
54liuyao 已提交
1133
    endWin = preWin;
5
54liuyao 已提交
1134
    if (win.ekey == endWin.ekey || (*pRowIndex) == pDataBlockInfo->rows || groupId != gpIdCol[*pRowIndex]) {
5
54liuyao 已提交
1135 1136 1137 1138 1139 1140
      win.ekey = endWin.ekey;
      return win;
    }
    win.ekey = endWin.ekey;
  }
}
5
54liuyao 已提交
1141

L
Liu Jicong 已提交
1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152
// Return the next non-empty block of the range scan that belongs to pInfo->groupId.
//
// Blocks are pulled from the table scan; when it is drained the next range of pSDB is prepared and
// the scan is restarted. Once no range is left, pSDB is cleaned, *pRowIndex and the update window
// are reset, the table scan reader is closed and NULL is returned.
//
// When the partition needs calculation, each block is filtered row by row so that only rows whose
// computed group id equals pInfo->groupId remain; otherwise the whole block is accepted or skipped
// according to its group id.
static SSDataBlock* doRangeScan(SStreamScanInfo* pInfo, SSDataBlock* pSDB, int32_t tsColIndex, int32_t* pRowIndex) {
  for (;;) {
    SSDataBlock* pRes = doTableScan(pInfo->pTableScanOp);
    if (pRes == NULL && prepareRangeScan(pInfo, pSDB, pRowIndex)) {
      // scan next window data
      pRes = doTableScan(pInfo->pTableScanOp);
    }

    if (pRes == NULL) {
      blockDataCleanup(pSDB);
      *pRowIndex = 0;
      pInfo->updateWin = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};

      STableScanInfo* pScan = pInfo->pTableScanOp->info;
      tsdbReaderClose(pScan->base.dataReader);
      qDebug("2");
      pScan->base.dataReader = NULL;
      return NULL;
    }

    doFilter(pRes, pInfo->pTableScanOp->exprSupp.pFilterInfo, NULL);
    if (pRes->info.rows == 0) {
      continue;
    }

    if (!pInfo->partitionSup.needCalc) {
      if (pRes->info.id.groupId == pInfo->groupId) {
        pRes->info.calWin = pInfo->updateWin;
        return pRes;
      }
      continue;
    }

    // keep only the rows whose computed group id matches the group being scanned
    SSDataBlock* pCopy = createOneDataBlock(pRes, true);
    blockDataCleanup(pRes);

    for (int32_t row = 0; row < pCopy->info.rows; row++) {
      if (calGroupIdByData(&pInfo->partitionSup, pInfo->pPartScalarSup, pCopy, row) != pInfo->groupId) {
        continue;
      }

      for (int32_t col = 0; col < pInfo->pTableScanOp->exprSupp.numOfExprs; col++) {
        SColumnInfoData* pSrcCol = taosArrayGet(pCopy->pDataBlock, col);
        SColumnInfoData* pDestCol = taosArrayGet(pRes->pDataBlock, col);
        bool             isNull = colDataIsNull(pSrcCol, pCopy->info.rows, row, NULL);
        char*            pSrcData = colDataGetData(pSrcCol, row);
        colDataSetVal(pDestCol, pRes->info.rows, pSrcData, isNull);
      }
      pRes->info.rows++;
    }

    blockDataDestroy(pCopy);

    if (pRes->info.rows > 0) {
      pRes->info.calWin = pInfo->updateWin;
      return pRes;
    }
  }
}
1194

1195
static int32_t getPreSessionWindow(SStreamAggSupporter* pAggSup, TSKEY startTs, TSKEY endTs, uint64_t groupId,
X
Xiaoyu Wang 已提交
1196
                                   SSessionKey* pKey) {
1197 1198 1199
  pKey->win.skey = startTs;
  pKey->win.ekey = endTs;
  pKey->groupId = groupId;
X
Xiaoyu Wang 已提交
1200

1201 1202 1203 1204 1205
  SStreamStateCur* pCur = streamStateSessionSeekKeyCurrentPrev(pAggSup->pState, pKey);
  int32_t          code = streamStateSessionGetKVByCur(pCur, pKey, NULL, 0);
  if (code != TSDB_CODE_SUCCESS) {
    SET_SESSION_WIN_KEY_INVALID(pKey);
  }
H
Haojun Liao 已提交
1206 1207

  taosMemoryFree(pCur);
1208 1209 1210
  return code;
}

1211
// Translate each (start ts, end ts, uid) row of pSrcBlock into a session-window scan range row in
// pDestBlock.
//
// For every source row the session window containing the start timestamp and the one containing the
// end timestamp (falling back to the window positioned by getPreSessionWindow) are looked up; the
// output row spans from the start window's skey to the end window's ekey. Source rows whose start
// or end window cannot be resolved are skipped.
//
// Output rows are appended densely: the destination row index is pDestBlock->info.rows, not the
// source row index, so skipped source rows never leave holes or push data beyond the reported row
// count.
//
// Returns TSDB_CODE_SUCCESS, or the error from blockDataEnsureCapacity.
static int32_t generateSessionScanRange(SStreamScanInfo* pInfo, SSDataBlock* pSrcBlock, SSDataBlock* pDestBlock) {
  blockDataCleanup(pDestBlock);
  if (pSrcBlock->info.rows == 0) {
    return TSDB_CODE_SUCCESS;
  }

  int32_t code = blockDataEnsureCapacity(pDestBlock, pSrcBlock->info.rows);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  ASSERT(taosArrayGetSize(pSrcBlock->pDataBlock) >= 3);
  SColumnInfoData* pStartTsCol = taosArrayGet(pSrcBlock->pDataBlock, START_TS_COLUMN_INDEX);
  TSKEY*           startData = (TSKEY*)pStartTsCol->pData;
  SColumnInfoData* pEndTsCol = taosArrayGet(pSrcBlock->pDataBlock, END_TS_COLUMN_INDEX);
  TSKEY*           endData = (TSKEY*)pEndTsCol->pData;
  SColumnInfoData* pUidCol = taosArrayGet(pSrcBlock->pDataBlock, UID_COLUMN_INDEX);
  uint64_t*        uidCol = (uint64_t*)pUidCol->pData;

  SColumnInfoData* pDestStartCol = taosArrayGet(pDestBlock->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pDestEndCol = taosArrayGet(pDestBlock->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pDestUidCol = taosArrayGet(pDestBlock->pDataBlock, UID_COLUMN_INDEX);
  SColumnInfoData* pDestGpCol = taosArrayGet(pDestBlock->pDataBlock, GROUPID_COLUMN_INDEX);
  SColumnInfoData* pDestCalStartTsCol = taosArrayGet(pDestBlock->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX);
  SColumnInfoData* pDestCalEndTsCol = taosArrayGet(pDestBlock->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX);
  int64_t          version = pSrcBlock->info.version - 1;

  for (int32_t i = 0; i < pSrcBlock->info.rows; i++) {
    uint64_t groupId = getGroupIdByData(pInfo, uidCol[i], startData[i], version);

    // gap must be 0.
    SSessionKey startWin = {0};
    getCurSessionWindow(pInfo->windowSup.pStreamAggSup, startData[i], startData[i], groupId, &startWin);
    if (IS_INVALID_SESSION_WIN_KEY(startWin)) {
      // window has been closed.
      continue;
    }

    SSessionKey endWin = {0};
    getCurSessionWindow(pInfo->windowSup.pStreamAggSup, endData[i], endData[i], groupId, &endWin);
    if (IS_INVALID_SESSION_WIN_KEY(endWin)) {
      getPreSessionWindow(pInfo->windowSup.pStreamAggSup, endData[i], endData[i], groupId, &endWin);
    }
    if (IS_INVALID_SESSION_WIN_KEY(endWin)) {
      // neither lookup resolved the end of the range; an invalid end key must not be emitted
      qError("generate session scan range failed. rang start:%" PRIx64 ", end:%" PRIx64, startData[i], endData[i]);
      continue;
    }

    // append at the next free destination row (source rows may have been skipped)
    int32_t destRow = pDestBlock->info.rows;
    colDataSetVal(pDestStartCol, destRow, (const char*)&startWin.win.skey, false);
    colDataSetVal(pDestEndCol, destRow, (const char*)&endWin.win.ekey, false);

    colDataSetNULL(pDestUidCol, destRow);
    colDataSetVal(pDestGpCol, destRow, (const char*)&groupId, false);
    colDataSetNULL(pDestCalStartTsCol, destRow);
    colDataSetNULL(pDestCalEndTsCol, destRow);
    pDestBlock->info.rows++;
  }
  return TSDB_CODE_SUCCESS;
}
1265 1266 1267 1268 1269 1270

// Translate the rows of pSrcBlock into interval-window scan range rows in pDestBlock.
//
// When the partition needs calculation and the first source row covers a real range
// (start != end), pSrcBlock is first rebuilt from the previous-version data of that range: one row
// per previous row, carrying the row's timestamp and its computed group id. If no previous-version
// data exists there is nothing to recompute: pSrcBlock is left empty and pDestBlock stays empty.
//
// Each run of source rows is then merged by getSlidingWindow into one destination row holding the
// calculation range, the uid, the covering window and the group id.
//
// Returns TSDB_CODE_SUCCESS, or the error from blockDataEnsureCapacity.
static int32_t generateIntervalScanRange(SStreamScanInfo* pInfo, SSDataBlock* pSrcBlock, SSDataBlock* pDestBlock) {
  blockDataCleanup(pDestBlock);
  int32_t rows = pSrcBlock->info.rows;
  if (rows == 0) {
    return TSDB_CODE_SUCCESS;
  }

  int32_t code = TSDB_CODE_SUCCESS;

  SColumnInfoData* pSrcStartTsCol = (SColumnInfoData*)taosArrayGet(pSrcBlock->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pSrcEndTsCol = (SColumnInfoData*)taosArrayGet(pSrcBlock->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pSrcUidCol = taosArrayGet(pSrcBlock->pDataBlock, UID_COLUMN_INDEX);
  SColumnInfoData* pSrcGpCol = taosArrayGet(pSrcBlock->pDataBlock, GROUPID_COLUMN_INDEX);

  uint64_t* srcUidData = (uint64_t*)pSrcUidCol->pData;
  ASSERT(pSrcStartTsCol->info.type == TSDB_DATA_TYPE_TIMESTAMP);
  TSKEY*  srcStartTsCol = (TSKEY*)pSrcStartTsCol->pData;
  TSKEY*  srcEndTsCol = (TSKEY*)pSrcEndTsCol->pData;
  int64_t version = pSrcBlock->info.version - 1;

  if (pInfo->partitionSup.needCalc && srcStartTsCol[0] != srcEndTsCol[0]) {
    uint64_t     srcUid = srcUidData[0];
    TSKEY        startTs = srcStartTsCol[0];
    TSKEY        endTs = srcEndTsCol[0];
    SSDataBlock* pPreRes = readPreVersionData(pInfo->pTableScanOp, srcUid, startTs, endTs, version);
    if (pPreRes == NULL) {
      // readPreVersionData returns NULL when the range held no rows: nothing to recompute
      blockDataCleanup(pSrcBlock);
      return TSDB_CODE_SUCCESS;
    }

    printDataBlock(pPreRes, "pre res");
    blockDataCleanup(pSrcBlock);
    code = blockDataEnsureCapacity(pSrcBlock, pPreRes->info.rows);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }

    SColumnInfoData* pTsCol = (SColumnInfoData*)taosArrayGet(pPreRes->pDataBlock, pInfo->primaryTsIndex);
    rows = pPreRes->info.rows;

    for (int32_t i = 0; i < rows; i++) {
      uint64_t groupId = calGroupIdByData(&pInfo->partitionSup, pInfo->pPartScalarSup, pPreRes, i);
      appendOneRowToStreamSpecialBlock(pSrcBlock, ((TSKEY*)pTsCol->pData) + i, ((TSKEY*)pTsCol->pData) + i, &srcUid,
                                       &groupId, NULL);
    }
    printDataBlock(pSrcBlock, "new delete");
  }

  // re-read the payload pointers: the source block may have been rebuilt above
  uint64_t* srcGp = (uint64_t*)pSrcGpCol->pData;
  srcStartTsCol = (TSKEY*)pSrcStartTsCol->pData;
  srcEndTsCol = (TSKEY*)pSrcEndTsCol->pData;
  srcUidData = (uint64_t*)pSrcUidCol->pData;

  code = blockDataEnsureCapacity(pDestBlock, rows);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  SColumnInfoData* pStartTsCol = taosArrayGet(pDestBlock->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pEndTsCol = taosArrayGet(pDestBlock->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pDeUidCol = taosArrayGet(pDestBlock->pDataBlock, UID_COLUMN_INDEX);
  SColumnInfoData* pGpCol = taosArrayGet(pDestBlock->pDataBlock, GROUPID_COLUMN_INDEX);
  SColumnInfoData* pCalStartTsCol = taosArrayGet(pDestBlock->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX);
  SColumnInfoData* pCalEndTsCol = taosArrayGet(pDestBlock->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX);

  // `i` is advanced by getSlidingWindow, which consumes one run of source rows per iteration
  for (int32_t i = 0; i < rows;) {
    uint64_t srcUid = srcUidData[i];
    uint64_t groupId = srcGp[i];
    if (groupId == 0) {
      groupId = getGroupIdByData(pInfo, srcUid, srcStartTsCol[i], version);
    }
    TSKEY calStartTs = srcStartTsCol[i];
    colDataSetVal(pCalStartTsCol, pDestBlock->info.rows, (const char*)(&calStartTs), false);
    STimeWindow win = getSlidingWindow(srcStartTsCol, srcEndTsCol, srcGp, &pInfo->interval, &pSrcBlock->info, &i,
                                       pInfo->partitionSup.needCalc);
    TSKEY       calEndTs = srcStartTsCol[i - 1];
    colDataSetVal(pCalEndTsCol, pDestBlock->info.rows, (const char*)(&calEndTs), false);
    colDataSetVal(pDeUidCol, pDestBlock->info.rows, (const char*)(&srcUid), false);
    colDataSetVal(pStartTsCol, pDestBlock->info.rows, (const char*)(&win.skey), false);
    colDataSetVal(pEndTsCol, pDestBlock->info.rows, (const char*)(&win.ekey), false);
    colDataSetVal(pGpCol, pDestBlock->info.rows, (const char*)(&groupId), false);
    pDestBlock->info.rows++;
  }
  return TSDB_CODE_SUCCESS;
}
1342

1343
// Copy the delete ranges of pSrcBlock into pDestBlock, resolving missing group ids and, when table
// name calculation is configured, attaching the partition table name of each group.
//
// The table name is staged in a var-string buffer (length header followed by the name). The buffer
// is a zero-initialized char array with one spare byte, so the name is always NUL-terminated when
// its length is measured. A NULL name is passed on when no name is configured, none is returned by
// the state store, or the returned name is empty.
//
// Returns TSDB_CODE_SUCCESS, or the error from blockDataEnsureCapacity.
static int32_t generateDeleteResultBlock(SStreamScanInfo* pInfo, SSDataBlock* pSrcBlock, SSDataBlock* pDestBlock) {
  blockDataCleanup(pDestBlock);
  int32_t rows = pSrcBlock->info.rows;
  if (rows == 0) {
    return TSDB_CODE_SUCCESS;
  }
  int32_t code = blockDataEnsureCapacity(pDestBlock, rows);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  SColumnInfoData* pSrcStartTsCol = (SColumnInfoData*)taosArrayGet(pSrcBlock->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pSrcEndTsCol = (SColumnInfoData*)taosArrayGet(pSrcBlock->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pSrcUidCol = taosArrayGet(pSrcBlock->pDataBlock, UID_COLUMN_INDEX);
  uint64_t*        srcUidData = (uint64_t*)pSrcUidCol->pData;
  SColumnInfoData* pSrcGpCol = taosArrayGet(pSrcBlock->pDataBlock, GROUPID_COLUMN_INDEX);
  uint64_t*        srcGp = (uint64_t*)pSrcGpCol->pData;
  ASSERT(pSrcStartTsCol->info.type == TSDB_DATA_TYPE_TIMESTAMP);
  TSKEY*  srcStartTsCol = (TSKEY*)pSrcStartTsCol->pData;
  TSKEY*  srcEndTsCol = (TSKEY*)pSrcEndTsCol->pData;
  int64_t version = pSrcBlock->info.version - 1;

  for (int32_t i = 0; i < rows; i++) {
    uint64_t srcUid = srcUidData[i];
    uint64_t groupId = srcGp[i];
    // +1 keeps a terminating NUL behind a name that fills all TSDB_TABLE_NAME_LEN bytes
    char     tbname[VARSTR_HEADER_SIZE + TSDB_TABLE_NAME_LEN + 1] = {0};
    bool     hasTbname = false;

    if (groupId == 0) {
      groupId = getGroupIdByData(pInfo, srcUid, srcStartTsCol[i], version);
    }

    if (pInfo->tbnameCalSup.pExprInfo) {
      void* parTbname = NULL;
      streamStateGetParName(pInfo->pStreamScanOp->pTaskInfo->streamInfo.pState, groupId, &parTbname);

      if (parTbname != NULL) {
        char* name = varDataVal(tbname);
        memcpy(name, parTbname, TSDB_TABLE_NAME_LEN);
        varDataSetLen(tbname, strlen(name));
        hasTbname = (name[0] != 0);
        tdbFree(parTbname);
      }
    }

    appendOneRowToStreamSpecialBlock(pDestBlock, srcStartTsCol + i, srcEndTsCol + i, srcUidData + i, &groupId,
                                     hasTbname ? tbname : NULL);
  }
  return TSDB_CODE_SUCCESS;
}

1385 1386 1387 1388
// Fills pDestBlock with the scan ranges derived from pSrcBlock. The generator is chosen by the
// window kind of the stream: interval, session/state, or (for anything else) the delete-result
// generator. Afterwards the destination block is stamped as STREAM_CLEAR, takes over the source
// block version, is flagged as loaded and gets its ts window refreshed; this stamping is done
// regardless of the generator's result.
//
// Returns the code produced by the selected generator.
static int32_t generateScanRange(SStreamScanInfo* pInfo, SSDataBlock* pSrcBlock, SSDataBlock* pDestBlock) {
  int32_t rc;
  if (isIntervalWindow(pInfo)) {
    rc = generateIntervalScanRange(pInfo, pSrcBlock, pDestBlock);
  } else if (!isSessionWindow(pInfo) && !isStateWindow(pInfo)) {
    rc = generateDeleteResultBlock(pInfo, pSrcBlock, pDestBlock);
  } else {
    rc = generateSessionScanRange(pInfo, pSrcBlock, pDestBlock);
  }

  SDataBlockInfo* pDstInfo = &pDestBlock->info;
  pDstInfo->type = STREAM_CLEAR;
  pDstInfo->version = pSrcBlock->info.version;
  pDstInfo->dataLoad = 1;
  blockDataUpdateTsWindow(pDestBlock, 0);

  return rc;
}

L
Liu Jicong 已提交
1401 1402 1403
#if 0
// NOTE: this function is compiled out by the surrounding #if 0.
//
// Looks up the partition tag stored in the stream state for the group id of pBlock and copies it
// into pBlock->info.pTag / pBlock->info.tagLen. Nothing is done when there are no tag expressions
// or when the block is NULL/empty. When no tag is stored, or when the buffer cannot be resized,
// the previously held tag buffer is released and pTag/tagLen are reset.
void calBlockTag(SStreamScanInfo* pInfo, SSDataBlock* pBlock) {
  SExprSupp*    pTagCalSup = &pInfo->tagCalSup;
  SStreamState* pState = pInfo->pStreamScanOp->pTaskInfo->streamInfo.pState;
  if (pTagCalSup == NULL || pTagCalSup->numOfExprs == 0) return;
  if (pBlock == NULL || pBlock->info.rows == 0) return;

  void*   tag = NULL;
  int32_t tagLen = 0;
  if (streamStateGetParTag(pState, pBlock->info.id.groupId, &tag, &tagLen) != 0) {
    // No tag for this group: drop the old buffer instead of just overwriting the pointer, and
    // keep tagLen consistent with the (now absent) buffer.
    taosMemoryFree(pBlock->info.pTag);
    pBlock->info.pTag = NULL;
    pBlock->info.tagLen = 0;
    tdbFree(tag);
    return;
  }

  void* pTag = taosMemoryRealloc(pBlock->info.pTag, tagLen);
  if (pTag == NULL) {
    // the old buffer is still owned by the block after a failed realloc, release it here
    tdbFree(tag);
    taosMemoryFree(pBlock->info.pTag);
    pBlock->info.pTag = NULL;
    pBlock->info.tagLen = 0;
    return;
  }

  pBlock->info.pTag = pTag;
  pBlock->info.tagLen = tagLen;
  memcpy(pBlock->info.pTag, tag, tagLen);
  tdbFree(tag);
}
#endif
L
Liu Jicong 已提交
1430

5
54liuyao 已提交
1431
// Resets pInfo->pCreateTbRes and then, if the stream has table-name or tag expressions, asks
// appendCreateTableRow() to add a row for the group of pBlock. Without any such expression the
// partition table name of pBlock is cleared instead.
static void calBlockTbName(SStreamScanInfo* pInfo, SSDataBlock* pBlock) {
  SExprSupp*    pNameSup = &pInfo->tbnameCalSup;
  SExprSupp*    pTagSup = &pInfo->tagCalSup;
  SStreamState* pStreamState = pInfo->pStreamScanOp->pTaskInfo->streamInfo.pState;

  blockDataCleanup(pInfo->pCreateTbRes);

  bool hasNamingExprs = (pNameSup->numOfExprs != 0) || (pTagSup->numOfExprs != 0);
  if (!hasNamingExprs) {
    pBlock->info.parTbName[0] = 0;
    return;
  }

  appendCreateTableRow(pStreamState, pNameSup, pTagSup, pBlock->info.id.groupId, pBlock, 0, pInfo->pCreateTbRes);
}

1443 1444
// Appends one row at index pBlock->info.rows of a stream "special" block and bumps the row count.
// The start/end timestamps are written both to the plain and to the calculate start/end columns.
// The table-name column is set to NULL when pTbName is NULL.
// The function does not grow the block; the caller is expected to have reserved capacity.
void appendOneRowToStreamSpecialBlock(SSDataBlock* pBlock, TSKEY* pStartTs, TSKEY* pEndTs, uint64_t* pUid,
                                      uint64_t* pGp, void* pTbName) {
  // never-null cells, listed in the order they are written
  const struct {
    int32_t     slotId;
    const char* pData;
  } fixedCells[] = {
      {START_TS_COLUMN_INDEX, (const char*)pStartTs},
      {END_TS_COLUMN_INDEX, (const char*)pEndTs},
      {UID_COLUMN_INDEX, (const char*)pUid},
      {GROUPID_COLUMN_INDEX, (const char*)pGp},
      {CALCULATE_START_TS_COLUMN_INDEX, (const char*)pStartTs},
      {CALCULATE_END_TS_COLUMN_INDEX, (const char*)pEndTs},
  };
  const int32_t numOfFixedCells = (int32_t)(sizeof(fixedCells) / sizeof(fixedCells[0]));

  for (int32_t k = 0; k < numOfFixedCells; ++k) {
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, fixedCells[k].slotId);
    colDataSetVal(pCol, pBlock->info.rows, fixedCells[k].pData, false);
  }

  SColumnInfoData* pNameCol = taosArrayGet(pBlock->pDataBlock, TABLE_NAME_COLUMN_INDEX);
  colDataSetVal(pNameCol, pBlock->info.rows, (const char*)pTbName, pTbName == NULL);

  pBlock->info.rows++;
}

1462
// Runs the update check for every row of pBlock.
//
// For each row (rows that are overdue are skipped when pInfo->igExpired is set) the row timestamp
// is passed to updateInfoIsUpdated(); for overdue rows of an already inserted table it is also
// checked whether the row falls into a closed, deleted window of a single interval stream.
// When `out` is true, rows that are updates or hit such a closed window are appended to
// pInfo->pUpdateDataRes (group id 0, plus a second row carrying the calculated group id when the
// window is closed and partition calculation is needed). The result block is finally typed as
// STREAM_DELETE_DATA when partition calculation is needed, otherwise STREAM_CLEAR.
//
// pInfo       stream scan info holding the update info and the result block
// invertible  not used by this function
// pBlock      input data block; its primary ts column must be of timestamp type
// out         true: reset and fill pInfo->pUpdateDataRes; false: only run the update check
static void checkUpdateData(SStreamScanInfo* pInfo, bool invertible, SSDataBlock* pBlock, bool out) {
  bool canAppend = out;
  if (out) {
    blockDataCleanup(pInfo->pUpdateDataRes);
    // every input row appends at most two rows below
    int32_t code = blockDataEnsureCapacity(pInfo->pUpdateDataRes, pBlock->info.rows * 2);
    if (code != TSDB_CODE_SUCCESS) {
      // Appending without reserved capacity would write past the column buffers. The update
      // check itself is still executed below so that the update info stays in sync.
      qError("failed to ensure capacity of stream update result block, code:%d", code);
      canAppend = false;
    }
  }

  SColumnInfoData* pColDataInfo = taosArrayGet(pBlock->pDataBlock, pInfo->primaryTsIndex);
  ASSERT(pColDataInfo->info.type == TSDB_DATA_TYPE_TIMESTAMP);
  TSKEY* tsCol = (TSKEY*)pColDataInfo->pData;
  bool   tableInserted = updateInfoIsTableInserted(pInfo->pUpdateInfo, pBlock->info.id.uid);

  for (int32_t rowId = 0; rowId < pBlock->info.rows; rowId++) {
    // zero the whole struct so that no indeterminate field is handed to getActiveTimeWindow()
    SResultRowInfo dumyInfo = {0};
    dumyInfo.cur.pageId = -1;

    bool        isClosed = false;
    STimeWindow win = {.skey = INT64_MIN, .ekey = INT64_MAX};
    bool        overDue = isOverdue(tsCol[rowId], &pInfo->twAggSup);
    if (pInfo->igExpired && overDue) {
      continue;
    }

    if (tableInserted && overDue) {
      win = getActiveTimeWindow(NULL, &dumyInfo, tsCol[rowId], &pInfo->interval, TSDB_ORDER_ASC);
      isClosed = isCloseWindow(&win, &pInfo->twAggSup);
    }

    // must check update info first.
    bool update = updateInfoIsUpdated(pInfo->pUpdateInfo, pBlock->info.id.uid, tsCol[rowId]);
    bool closedWin = isClosed && isSignleIntervalWindow(pInfo) &&
                     isDeletedStreamWindow(&win, pBlock->info.id.groupId,
                                           pInfo->pTableScanOp->pTaskInfo->streamInfo.pState, &pInfo->twAggSup);
    if ((update || closedWin) && canAppend) {
      qDebug("stream update check not pass, update %d, closedWin %d", update, closedWin);
      uint64_t gpId = 0;
      appendOneRowToStreamSpecialBlock(pInfo->pUpdateDataRes, tsCol + rowId, tsCol + rowId, &pBlock->info.id.uid, &gpId,
                                       NULL);
      if (closedWin && pInfo->partitionSup.needCalc) {
        gpId = calGroupIdByData(&pInfo->partitionSup, pInfo->pPartScalarSup, pBlock, rowId);
        appendOneRowToStreamSpecialBlock(pInfo->pUpdateDataRes, tsCol + rowId, tsCol + rowId, &pBlock->info.id.uid,
                                         &gpId, NULL);
      }
    }
  }

  if (canAppend && pInfo->pUpdateDataRes->info.rows > 0) {
    pInfo->pUpdateDataRes->info.version = pBlock->info.version;
    pInfo->pUpdateDataRes->info.dataLoad = 1;
    blockDataUpdateTsWindow(pInfo->pUpdateDataRes, 0);
    pInfo->pUpdateDataRes->info.type = pInfo->partitionSup.needCalc ? STREAM_DELETE_DATA : STREAM_CLEAR;
  }
}
L
Liu Jicong 已提交
1509

1510
// Moves the content of pBlock into the result block pInfo->pRes.
//
// Steps: reserve capacity in pRes, copy block meta (rows, uid, version, group id; type is set to
// STREAM_NORMAL), copy every column marked as needOutput (columns missing in pBlock are filled
// with NULLs), add the tag pseudo columns, optionally apply the operator filter, refresh the ts
// window and finally compute the partition table name for pRes.
//
// Ownership: the resources of pBlock are released with blockDataFreeRes() on every path, even
// though the parameter is declared const.
//
// pInfo   stream scan info that owns the result block
// pBlock  source block, consumed by this call
// filter  true to run doFilter() on the result block
//
// Returns 0. Allocation failures and pseudo-column errors (other than "table not exist") do not
// return: they leave through T_LONG_JMP on the task's jump buffer.
static int32_t setBlockIntoRes(SStreamScanInfo* pInfo, const SSDataBlock* pBlock, bool filter) {
  SDataBlockInfo* pBlockInfo = &pInfo->pRes->info;
  SOperatorInfo*  pOperator = pInfo->pStreamScanOp;
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;

  // the column copies below rely on this capacity, so a failure must not be ignored
  int32_t ensureCode = blockDataEnsureCapacity(pInfo->pRes, pBlock->info.rows);
  if (ensureCode != TSDB_CODE_SUCCESS) {
    blockDataFreeRes((SSDataBlock*)pBlock);
    T_LONG_JMP(pTaskInfo->env, ensureCode);
  }

  pInfo->pRes->info.rows = pBlock->info.rows;
  pInfo->pRes->info.id.uid = pBlock->info.id.uid;
  pInfo->pRes->info.type = STREAM_NORMAL;
  pInfo->pRes->info.version = pBlock->info.version;

  pInfo->pRes->info.id.groupId = getTableGroupId(pTaskInfo->pTableInfoList, pBlock->info.id.uid);

  // todo extract method
  size_t numOfMatch = taosArrayGetSize(pInfo->matchInfo.pList);  // the list is not modified in the loop
  for (int32_t i = 0; i < numOfMatch; ++i) {
    SColMatchItem* pColMatchInfo = taosArrayGet(pInfo->matchInfo.pList, i);
    if (!pColMatchInfo->needOutput) {
      continue;
    }

    bool colExists = false;
    for (int32_t j = 0; j < blockDataGetNumOfCols(pBlock); ++j) {
      SColumnInfoData* pResCol = bdGetColumnInfoData(pBlock, j);
      if (pResCol->info.colId == pColMatchInfo->colId) {
        SColumnInfoData* pDst = taosArrayGet(pInfo->pRes->pDataBlock, pColMatchInfo->dstSlotId);
        colDataAssign(pDst, pResCol, pBlock->info.rows, &pInfo->pRes->info);
        colExists = true;
        break;
      }
    }

    // the required column does not exists in submit block, let's set it to be all null value
    if (!colExists) {
      SColumnInfoData* pDst = taosArrayGet(pInfo->pRes->pDataBlock, pColMatchInfo->dstSlotId);
      colDataSetNNULL(pDst, 0, pBlockInfo->rows);
    }
  }

  // currently only the tbname pseudo column
  if (pInfo->numOfPseudoExpr > 0) {
    int32_t code = addTagPseudoColumnData(&pInfo->readHandle, pInfo->pPseudoExpr, pInfo->numOfPseudoExpr, pInfo->pRes,
                                          pInfo->pRes->info.rows, GET_TASKID(pTaskInfo), NULL);
    // ignore the table not exists error, since this table may have been dropped during the scan procedure.
    if (code != TSDB_CODE_SUCCESS && code != TSDB_CODE_PAR_TABLE_NOT_EXIST) {
      blockDataFreeRes((SSDataBlock*)pBlock);
      T_LONG_JMP(pTaskInfo->env, code);
    }

    // reset the error code.
    terrno = 0;
  }

  if (filter) {
    doFilter(pInfo->pRes, pOperator->exprSupp.pFilterInfo, NULL);
  }

  pInfo->pRes->info.dataLoad = 1;
  blockDataUpdateTsWindow(pInfo->pRes, pInfo->primaryTsIndex);
  blockDataFreeRes((SSDataBlock*)pBlock);

  calBlockTbName(pInfo, pInfo->pRes);
  return 0;
}
5
54liuyao 已提交
1574

L
Liu Jicong 已提交
1575
// Produces the next block for a queue (tmq) scan. Three sources are tried in this order:
//   1. a submit message attached to the task (streamInfo.submit): its blocks are decoded one by
//      one and the first non-empty filtered result is returned; when exhausted the message is
//      detached from both the reader and the task and NULL is returned;
//   2. the tsdb snapshot (prepareStatus.type == TMQ_OFFSET__SNAPSHOT_DATA): blocks come from the
//      table scan operator; if the table scan yields nothing and no block was ever returned, the
//      data reader is closed and the scan switches over to the wal at snapshotVer + 1;
//   3. the wal (prepareStatus.type == TMQ_OFFSET__LOG): blocks are fetched until a non-empty
//      result is produced or the reader reports that nothing more is available.
// Returns NULL when no data is available right now or the prepare type is unexpected.
static SSDataBlock* doQueueScan(SOperatorInfo* pOperator) {
  SStreamScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*   pTaskInfo = pOperator->pTaskInfo;
  STqReader*       pReader = pInfo->tqReader;

  qDebug("start to exec queue scan");

  // ---- source 1: submit message handed over by the task ----
  if (pTaskInfo->streamInfo.submit.msgStr != NULL) {
    if (pReader->msg2.msgStr == NULL) {
      /*pInfo->tqReader->pMsg = pTaskInfo->streamInfo.pReq;*/

      /*const SSubmitReq* pSubmit = pInfo->tqReader->pMsg;*/
      /*if (tqReaderSetDataMsg(pInfo->tqReader, pSubmit, 0) < 0) {*/
      /*void* msgStr = pTaskInfo->streamInfo.*/
      SPackedData submit = pTaskInfo->streamInfo.submit;
      if (tqReaderSetSubmitReq2(pReader, submit.msgStr, submit.msgLen, submit.ver) < 0) {
        qError("submit msg messed up when initing stream submit block %p", submit.msgStr);
        pReader->msg2 = (SPackedData){0};
        pReader->setMsg = 0;
        ASSERT(0);
      }
    }

    blockDataCleanup(pInfo->pRes);

    while (tqNextDataBlock2(pReader)) {
      SSDataBlock block = {0};

      // skip blocks that cannot be decoded or carry no rows
      if (tqRetrieveDataBlock2(&block, pReader, NULL) != TSDB_CODE_SUCCESS || block.info.rows == 0) {
        continue;
      }

      setBlockIntoRes(pInfo, &block, true);

      // the filter may have removed every row, in which case the next block is tried
      if (pInfo->pRes->info.rows > 0) {
        return pInfo->pRes;
      }
    }

    // message fully consumed: detach it from the reader and from the task
    pReader->msg2 = (SPackedData){0};
    pReader->setMsg = 0;
    pTaskInfo->streamInfo.submit = (SPackedData){0};
    return NULL;
  }

  // ---- source 2: tsdb snapshot ----
  if (pTaskInfo->streamInfo.prepareStatus.type == TMQ_OFFSET__SNAPSHOT_DATA) {
    SSDataBlock* pResult = doTableScan(pInfo->pTableScanOp);
    if (pResult != NULL && pResult->info.rows > 0) {
      qDebug("queue scan tsdb return %d rows min:%" PRId64 " max:%" PRId64 " wal curVersion:%" PRId64, pResult->info.rows,
             pResult->info.window.skey, pResult->info.window.ekey, pReader->pWalReader->curVersion);
      pTaskInfo->streamInfo.returned = 1;
      return pResult;
    }

    if (pTaskInfo->streamInfo.returned) {
      return NULL;
    }

    // nothing was ever returned from the snapshot: release the reader and continue with the wal
    STableScanInfo* pTSInfo = pInfo->pTableScanOp->info;
    tsdbReaderClose(pTSInfo->base.dataReader);
    qDebug("3");
    pTSInfo->base.dataReader = NULL;
    tqOffsetResetToLog(&pTaskInfo->streamInfo.prepareStatus, pTaskInfo->streamInfo.snapshotVer);
    qDebug("queue scan tsdb over, switch to wal ver %" PRId64 "", pTaskInfo->streamInfo.snapshotVer + 1);
    if (tqSeekVer(pReader, pTaskInfo->streamInfo.snapshotVer + 1, pTaskInfo->id.str) < 0) {
      tqOffsetResetToLog(&pTaskInfo->streamInfo.lastStatus, pTaskInfo->streamInfo.snapshotVer);
      return NULL;
    }
  }

  // ---- source 3: wal ----
  if (pTaskInfo->streamInfo.prepareStatus.type != TMQ_OFFSET__LOG) {
    qError("unexpected streamInfo prepare type: %d", pTaskInfo->streamInfo.prepareStatus.type);
    return NULL;
  }

  for (;;) {
    SFetchRet ret = {0};
    // if the end is reached, terrno is 0
    if (tqNextBlock(pReader, &ret) < 0 && terrno != 0) {
      qError("failed to get next log block since %s", terrstr());
    }

    if (ret.fetchType == FETCH_TYPE__DATA) {
      blockDataCleanup(pInfo->pRes);
      setBlockIntoRes(pInfo, &ret.data, true);
      if (pInfo->pRes->info.rows > 0) {
        pOperator->status = OP_EXEC_RECV;
        qDebug("queue scan log return %d rows", pInfo->pRes->info.rows);
        return pInfo->pRes;
      }
      continue;
    }

    if (ret.fetchType == FETCH_TYPE__META) {
      qError("unexpected ret.fetchType:%d", ret.fetchType);
      continue;
      //        pTaskInfo->streamInfo.lastStatus = ret.offset;
      //        pTaskInfo->streamInfo.metaBlk = ret.meta;
      //        return NULL;
    }

    bool sepAfterData = (ret.fetchType == FETCH_TYPE__SEP) && (pOperator->status == OP_EXEC_RECV);
    if (ret.fetchType == FETCH_TYPE__NONE || sepAfterData) {
      pTaskInfo->streamInfo.lastStatus = ret.offset;
      char formatBuf[80];
      tFormatOffset(formatBuf, 80, &ret.offset);
      qDebug("queue scan log return null, offset %s", formatBuf);
      pOperator->status = OP_OPENED;
      return NULL;
    }
  }
}

L
Liu Jicong 已提交
1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703
// Copies into pDst the rows of the delete block pSrc whose uid is present in the tq reader's
// table id hash (pInfo->tqReader->tbIdHash). Only the start ts, end ts and uid columns are
// copied; the group id and calculate start/end columns of the kept rows are set to NULL.
// On success pDst->info is overwritten with pSrc->info, except that rows becomes the number of
// kept rows and the capacity of pDst is preserved.
//
// Returns 0 on success, or the code of blockDataEnsureCapacity() when the destination block
// could not be sized; in that case pDst is left without any copied row or block info.
static int32_t filterDelBlockByUid(SSDataBlock* pDst, const SSDataBlock* pSrc, SStreamScanInfo* pInfo) {
  STqReader* pReader = pInfo->tqReader;
  int32_t    rows = pSrc->info.rows;

  // the writes below index up to `rows` entries of pDst, so the reservation must have succeeded
  int32_t code = blockDataEnsureCapacity(pDst, rows);
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

  SColumnInfoData* pSrcStartCol = taosArrayGet(pSrc->pDataBlock, START_TS_COLUMN_INDEX);
  uint64_t*        startCol = (uint64_t*)pSrcStartCol->pData;
  SColumnInfoData* pSrcEndCol = taosArrayGet(pSrc->pDataBlock, END_TS_COLUMN_INDEX);
  uint64_t*        endCol = (uint64_t*)pSrcEndCol->pData;
  SColumnInfoData* pSrcUidCol = taosArrayGet(pSrc->pDataBlock, UID_COLUMN_INDEX);
  uint64_t*        uidCol = (uint64_t*)pSrcUidCol->pData;

  SColumnInfoData* pDstStartCol = taosArrayGet(pDst->pDataBlock, START_TS_COLUMN_INDEX);
  SColumnInfoData* pDstEndCol = taosArrayGet(pDst->pDataBlock, END_TS_COLUMN_INDEX);
  SColumnInfoData* pDstUidCol = taosArrayGet(pDst->pDataBlock, UID_COLUMN_INDEX);
  // looked up once instead of once per kept row
  SColumnInfoData* pDstGpCol = taosArrayGet(pDst->pDataBlock, GROUPID_COLUMN_INDEX);
  SColumnInfoData* pDstCalStartCol = taosArrayGet(pDst->pDataBlock, CALCULATE_START_TS_COLUMN_INDEX);
  SColumnInfoData* pDstCalEndCol = taosArrayGet(pDst->pDataBlock, CALCULATE_END_TS_COLUMN_INDEX);

  int32_t j = 0;  // next free row in pDst
  for (int32_t i = 0; i < rows; i++) {
    if (taosHashGet(pReader->tbIdHash, &uidCol[i], sizeof(uint64_t))) {
      colDataSetVal(pDstStartCol, j, (const char*)&startCol[i], false);
      colDataSetVal(pDstEndCol, j, (const char*)&endCol[i], false);
      colDataSetVal(pDstUidCol, j, (const char*)&uidCol[i], false);

      colDataSetNULL(pDstGpCol, j);
      colDataSetNULL(pDstCalStartCol, j);
      colDataSetNULL(pDstCalEndCol, j);
      j++;
    }
  }

  // take over the source block info but keep the destination's own capacity
  uint32_t cap = pDst->info.capacity;
  pDst->info = pSrc->info;
  pDst->info.rows = j;
  pDst->info.capacity = cap;

  return 0;
}

5
54liuyao 已提交
1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733
// for partition by tag
// Overwrites the group id column of every row in pBlock with the group id resolved from the
// row's uid via getGroupIdByUid(). Nothing is touched when pInfo->partitionSup.needCalc is set.
static void setBlockGroupIdByUid(SStreamScanInfo* pInfo, SSDataBlock* pBlock) {
  if (pInfo->partitionSup.needCalc) {
    return;
  }

  SColumnInfoData* pGpCol = taosArrayGet(pBlock->pDataBlock, GROUPID_COLUMN_INDEX);
  SColumnInfoData* pUidCol = taosArrayGet(pBlock->pDataBlock, UID_COLUMN_INDEX);
  uint64_t*        uidCol = (uint64_t*)pUidCol->pData;
  int32_t          rows = pBlock->info.rows;

  for (int32_t i = 0; i < rows; i++) {
    uint64_t groupId = getGroupIdByUid(pInfo, uidCol[i]);
    colDataSetVal(pGpCol, i, (const char*)&groupId, false);
  }
}

5
54liuyao 已提交
1739
// Runs the update check on pBlock when the stream keeps update info, raises twAggSup.maxTs to
// endKey if that is larger, and, when the check produced rows in pInfo->pUpdateDataRes, resets
// updateResIndex and selects the next scan mode from the type of that result block.
static void doCheckUpdate(SStreamScanInfo* pInfo, TSKEY endKey, SSDataBlock* pBlock) {
  if (pInfo->pUpdateInfo == NULL) {
    return;
  }

  checkUpdateData(pInfo, true, pBlock, true);
  pInfo->twAggSup.maxTs = TMAX(pInfo->twAggSup.maxTs, endKey);

  SSDataBlock* pUpdRes = pInfo->pUpdateDataRes;
  if (pUpdRes->info.rows <= 0) {
    return;
  }

  pInfo->updateResIndex = 0;
  switch (pUpdRes->info.type) {
    case STREAM_CLEAR:
      pInfo->scanMode = STREAM_SCAN_FROM_UPDATERES;
      break;
    case STREAM_INVERT:
      pInfo->scanMode = STREAM_SCAN_FROM_RES;
      // return pInfo->pUpdateDataRes;
      break;
    case STREAM_DELETE_DATA:
      pInfo->scanMode = STREAM_SCAN_FROM_DELETE_DATA;
      break;
    default:
      // any other block type leaves the scan mode untouched
      break;
  }
}

L
Liu Jicong 已提交
1757 1758 1759 1760 1761
static SSDataBlock* doStreamScan(SOperatorInfo* pOperator) {
  // NOTE: this operator does never check if current status is done or not
  SExecTaskInfo*   pTaskInfo = pOperator->pTaskInfo;
  SStreamScanInfo* pInfo = pOperator->info;

L
Liu Jicong 已提交
1762
  qDebug("stream scan called");
H
Haojun Liao 已提交
1763

1764 1765
  if (pTaskInfo->streamInfo.recoverStep == STREAM_RECOVER_STEP__PREPARE1 ||
      pTaskInfo->streamInfo.recoverStep == STREAM_RECOVER_STEP__PREPARE2) {
L
Liu Jicong 已提交
1766
    STableScanInfo* pTSInfo = pInfo->pTableScanOp->info;
H
Haojun Liao 已提交
1767
    memcpy(&pTSInfo->base.cond, &pTaskInfo->streamInfo.tableCond, sizeof(SQueryTableDataCond));
1768
    if (pTaskInfo->streamInfo.recoverStep == STREAM_RECOVER_STEP__PREPARE1) {
H
Haojun Liao 已提交
1769 1770 1771 1772
      pTSInfo->base.cond.startVersion = 0;
      pTSInfo->base.cond.endVersion = pTaskInfo->streamInfo.fillHistoryVer1;
      qDebug("stream recover step 1, from %" PRId64 " to %" PRId64, pTSInfo->base.cond.startVersion,
             pTSInfo->base.cond.endVersion);
5
54liuyao 已提交
1773
      pTaskInfo->streamInfo.recoverStep = STREAM_RECOVER_STEP__SCAN1;
1774
    } else {
H
Haojun Liao 已提交
1775 1776 1777 1778
      pTSInfo->base.cond.startVersion = pTaskInfo->streamInfo.fillHistoryVer1 + 1;
      pTSInfo->base.cond.endVersion = pTaskInfo->streamInfo.fillHistoryVer2;
      qDebug("stream recover step 2, from %" PRId64 " to %" PRId64, pTSInfo->base.cond.startVersion,
             pTSInfo->base.cond.endVersion);
5
54liuyao 已提交
1779
      pTaskInfo->streamInfo.recoverStep = STREAM_RECOVER_STEP__SCAN2;
1780
    }
L
Liu Jicong 已提交
1781 1782

    /*resetTableScanInfo(pTSInfo, pWin);*/
H
Haojun Liao 已提交
1783
    tsdbReaderClose(pTSInfo->base.dataReader);
H
Haojun Liao 已提交
1784 1785
    qDebug("4");

H
Haojun Liao 已提交
1786
    pTSInfo->base.dataReader = NULL;
L
Liu Jicong 已提交
1787
    pInfo->pTableScanOp->status = OP_OPENED;
L
Liu Jicong 已提交
1788

L
Liu Jicong 已提交
1789 1790
    pTSInfo->scanTimes = 0;
    pTSInfo->currentGroupId = -1;
L
Liu Jicong 已提交
1791
    pTaskInfo->streamInfo.recoverScanFinished = false;
L
Liu Jicong 已提交
1792 1793
  }

5
54liuyao 已提交
1794 1795
  if (pTaskInfo->streamInfo.recoverStep == STREAM_RECOVER_STEP__SCAN1 ||
      pTaskInfo->streamInfo.recoverStep == STREAM_RECOVER_STEP__SCAN2) {
L
Liu Jicong 已提交
1796 1797 1798 1799 1800
    if (pInfo->blockRecoverContiCnt > 100) {
      pInfo->blockRecoverTotCnt += pInfo->blockRecoverContiCnt;
      pInfo->blockRecoverContiCnt = 0;
      return NULL;
    }
5
54liuyao 已提交
1801 1802 1803 1804 1805 1806 1807

    switch (pInfo->scanMode) {
      case STREAM_SCAN_FROM_RES: {
        pInfo->scanMode = STREAM_SCAN_FROM_READERHANDLE;
        printDataBlock(pInfo->pRecoverRes, "scan recover");
        return pInfo->pRecoverRes;
      } break;
5
54liuyao 已提交
1808 1809 1810 1811
      case STREAM_SCAN_FROM_UPDATERES: {
        generateScanRange(pInfo, pInfo->pUpdateDataRes, pInfo->pUpdateRes);
        prepareRangeScan(pInfo, pInfo->pUpdateRes, &pInfo->updateResIndex);
        pInfo->scanMode = STREAM_SCAN_FROM_DATAREADER_RANGE;
1812
        printDataBlock(pInfo->pUpdateRes, "recover update");
5
54liuyao 已提交
1813 1814 1815 1816 1817 1818 1819 1820 1821 1822
        return pInfo->pUpdateRes;
      } break;
      case STREAM_SCAN_FROM_DATAREADER_RANGE: {
        SSDataBlock* pSDB = doRangeScan(pInfo, pInfo->pUpdateRes, pInfo->primaryTsIndex, &pInfo->updateResIndex);
        if (pSDB) {
          STableScanInfo* pTableScanInfo = pInfo->pTableScanOp->info;
          uint64_t        version = getReaderMaxVersion(pTableScanInfo->base.dataReader);
          updateInfoSetScanRange(pInfo->pUpdateInfo, &pTableScanInfo->base.cond.twindows, pInfo->groupId, version);
          pSDB->info.type = pInfo->scanMode == STREAM_SCAN_FROM_DATAREADER_RANGE ? STREAM_NORMAL : STREAM_PULL_DATA;
          checkUpdateData(pInfo, true, pSDB, false);
1823
          printDataBlock(pSDB, "scan recover update");
5
54liuyao 已提交
1824 1825 1826 1827 1828 1829
          calBlockTbName(pInfo, pSDB);
          return pSDB;
        }
        blockDataCleanup(pInfo->pUpdateDataRes);
        pInfo->scanMode = STREAM_SCAN_FROM_READERHANDLE;
      } break;
5
54liuyao 已提交
1830 1831 1832 1833 1834 1835
      default:
        break;
    }

    pInfo->pRecoverRes = doTableScan(pInfo->pTableScanOp);
    if (pInfo->pRecoverRes != NULL) {
L
Liu Jicong 已提交
1836
      pInfo->blockRecoverContiCnt++;
5
54liuyao 已提交
1837
      calBlockTbName(pInfo, pInfo->pRecoverRes);
1838
      if (pInfo->pUpdateInfo) {
5
54liuyao 已提交
1839 1840 1841 1842 1843 1844
        if (pTaskInfo->streamInfo.recoverStep == STREAM_RECOVER_STEP__SCAN1) {
          TSKEY maxTs = updateInfoFillBlockData(pInfo->pUpdateInfo, pInfo->pRecoverRes, pInfo->primaryTsIndex);
          pInfo->twAggSup.maxTs = TMAX(pInfo->twAggSup.maxTs, maxTs);
        } else {
          doCheckUpdate(pInfo, pInfo->pRecoverRes->info.window.ekey, pInfo->pRecoverRes);
        }
1845
      }
5
54liuyao 已提交
1846 1847
      if (pInfo->pCreateTbRes->info.rows > 0) {
        pInfo->scanMode = STREAM_SCAN_FROM_RES;
1848
        printDataBlock(pInfo->pCreateTbRes, "recover createTbl");
5
54liuyao 已提交
1849 1850 1851 1852 1853
        return pInfo->pCreateTbRes;
      }
      qDebug("stream recover scan get block, rows %d", pInfo->pRecoverRes->info.rows);
      printDataBlock(pInfo->pRecoverRes, "scan recover");
      return pInfo->pRecoverRes;
L
Liu Jicong 已提交
1854 1855
    }
    pTaskInfo->streamInfo.recoverStep = STREAM_RECOVER_STEP__NONE;
L
Liu Jicong 已提交
1856
    STableScanInfo* pTSInfo = pInfo->pTableScanOp->info;
H
Haojun Liao 已提交
1857
    tsdbReaderClose(pTSInfo->base.dataReader);
H
Haojun Liao 已提交
1858 1859
    qDebug("5");

H
Haojun Liao 已提交
1860
    pTSInfo->base.dataReader = NULL;
1861

H
Haojun Liao 已提交
1862 1863
    pTSInfo->base.cond.startVersion = -1;
    pTSInfo->base.cond.endVersion = -1;
L
Liu Jicong 已提交
1864

L
Liu Jicong 已提交
1865
    pTaskInfo->streamInfo.recoverScanFinished = true;
L
Liu Jicong 已提交
1866 1867 1868
    return NULL;
  }

5
54liuyao 已提交
1869
  size_t total = taosArrayGetSize(pInfo->pBlockLists);
5
54liuyao 已提交
1870
// TODO: refactor
L
Liu Jicong 已提交
1871
FETCH_NEXT_BLOCK:
L
Liu Jicong 已提交
1872
  if (pInfo->blockType == STREAM_INPUT__DATA_BLOCK) {
H
Haojun Liao 已提交
1873
    if (pInfo->validBlockIndex >= total) {
L
Liu Jicong 已提交
1874
      doClearBufferedBlocks(pInfo);
L
Liu Jicong 已提交
1875
      /*pOperator->status = OP_EXEC_DONE;*/
H
Haojun Liao 已提交
1876 1877 1878
      return NULL;
    }

1879
    int32_t      current = pInfo->validBlockIndex++;
L
Liu Jicong 已提交
1880 1881
    SPackedData* pPacked = taosArrayGet(pInfo->pBlockLists, current);
    SSDataBlock* pBlock = pPacked->pDataBlock;
5
54liuyao 已提交
1882
    if (pBlock->info.parTbName[0]) {
H
Haojun Liao 已提交
1883
      streamStatePutParName(pTaskInfo->streamInfo.pState, pBlock->info.id.groupId, pBlock->info.parTbName);
1884
    }
1885
    // TODO move into scan
5
54liuyao 已提交
1886 1887
    pBlock->info.calWin.skey = INT64_MIN;
    pBlock->info.calWin.ekey = INT64_MAX;
1888
    pBlock->info.dataLoad = 1;
1889
    blockDataUpdateTsWindow(pBlock, 0);
1890
    switch (pBlock->info.type) {
L
Liu Jicong 已提交
1891 1892 1893
      case STREAM_NORMAL:
      case STREAM_GET_ALL:
        return pBlock;
1894 1895 1896
      case STREAM_RETRIEVE: {
        pInfo->blockType = STREAM_INPUT__DATA_SUBMIT;
        pInfo->scanMode = STREAM_SCAN_FROM_DATAREADER_RETRIEVE;
1897 1898
        copyDataBlock(pInfo->pUpdateRes, pBlock);
        prepareRangeScan(pInfo, pInfo->pUpdateRes, &pInfo->updateResIndex);
1899 1900 1901
        updateInfoAddCloseWindowSBF(pInfo->pUpdateInfo);
      } break;
      case STREAM_DELETE_DATA: {
1902
        printDataBlock(pBlock, "stream scan delete recv");
L
Liu Jicong 已提交
1903
        SSDataBlock* pDelBlock = NULL;
L
Liu Jicong 已提交
1904
        if (pInfo->tqReader) {
L
Liu Jicong 已提交
1905
          pDelBlock = createSpecialDataBlock(STREAM_DELETE_DATA);
L
Liu Jicong 已提交
1906
          filterDelBlockByUid(pDelBlock, pBlock, pInfo);
L
Liu Jicong 已提交
1907 1908
        } else {
          pDelBlock = pBlock;
L
Liu Jicong 已提交
1909
        }
5
54liuyao 已提交
1910 1911
        setBlockGroupIdByUid(pInfo, pDelBlock);
        printDataBlock(pDelBlock, "stream scan delete recv filtered");
5
54liuyao 已提交
1912 1913 1914 1915 1916 1917
        if (pDelBlock->info.rows == 0) {
          if (pInfo->tqReader) {
            blockDataDestroy(pDelBlock);
          }
          goto FETCH_NEXT_BLOCK;
        }
1918
        if (!isIntervalWindow(pInfo) && !isSessionWindow(pInfo) && !isStateWindow(pInfo)) {
L
Liu Jicong 已提交
1919
          generateDeleteResultBlock(pInfo, pDelBlock, pInfo->pDeleteDataRes);
1920
          pInfo->pDeleteDataRes->info.type = STREAM_DELETE_RESULT;
L
Liu Jicong 已提交
1921
          printDataBlock(pDelBlock, "stream scan delete result");
H
Haojun Liao 已提交
1922 1923
          blockDataDestroy(pDelBlock);

L
Liu Jicong 已提交
1924 1925 1926 1927 1928
          if (pInfo->pDeleteDataRes->info.rows > 0) {
            return pInfo->pDeleteDataRes;
          } else {
            goto FETCH_NEXT_BLOCK;
          }
1929 1930 1931
        } else {
          pInfo->blockType = STREAM_INPUT__DATA_SUBMIT;
          pInfo->updateResIndex = 0;
L
Liu Jicong 已提交
1932
          generateScanRange(pInfo, pDelBlock, pInfo->pUpdateRes);
1933 1934 1935
          prepareRangeScan(pInfo, pInfo->pUpdateRes, &pInfo->updateResIndex);
          copyDataBlock(pInfo->pDeleteDataRes, pInfo->pUpdateRes);
          pInfo->pDeleteDataRes->info.type = STREAM_DELETE_DATA;
L
Liu Jicong 已提交
1936 1937 1938 1939
          printDataBlock(pDelBlock, "stream scan delete data");
          if (pInfo->tqReader) {
            blockDataDestroy(pDelBlock);
          }
L
Liu Jicong 已提交
1940
          if (pInfo->pDeleteDataRes->info.rows > 0) {
5
54liuyao 已提交
1941
            pInfo->scanMode = STREAM_SCAN_FROM_DATAREADER_RANGE;
L
Liu Jicong 已提交
1942 1943 1944 1945
            return pInfo->pDeleteDataRes;
          } else {
            goto FETCH_NEXT_BLOCK;
          }
1946
        }
1947 1948 1949
      } break;
      default:
        break;
5
54liuyao 已提交
1950
    }
1951
    // printDataBlock(pBlock, "stream scan recv");
1952
    return pBlock;
L
Liu Jicong 已提交
1953
  } else if (pInfo->blockType == STREAM_INPUT__DATA_SUBMIT) {
L
Liu Jicong 已提交
1954
    qDebug("scan mode %d", pInfo->scanMode);
5
54liuyao 已提交
1955 1956 1957
    switch (pInfo->scanMode) {
      case STREAM_SCAN_FROM_RES: {
        pInfo->scanMode = STREAM_SCAN_FROM_READERHANDLE;
5
54liuyao 已提交
1958
        doCheckUpdate(pInfo, pInfo->pRes->info.window.ekey, pInfo->pRes);
5
54liuyao 已提交
1959 1960 1961
        doFilter(pInfo->pRes, pOperator->exprSupp.pFilterInfo, NULL);
        pInfo->pRes->info.dataLoad = 1;
        blockDataUpdateTsWindow(pInfo->pRes, pInfo->primaryTsIndex);
5
54liuyao 已提交
1962 1963 1964
        if (pInfo->pRes->info.rows > 0) {
          return pInfo->pRes;
        }
5
54liuyao 已提交
1965
      } break;
1966
      case STREAM_SCAN_FROM_DELETE_DATA: {
1967 1968 1969 1970 1971 1972 1973
        generateScanRange(pInfo, pInfo->pUpdateDataRes, pInfo->pUpdateRes);
        prepareRangeScan(pInfo, pInfo->pUpdateRes, &pInfo->updateResIndex);
        pInfo->scanMode = STREAM_SCAN_FROM_DATAREADER_RANGE;
        copyDataBlock(pInfo->pDeleteDataRes, pInfo->pUpdateRes);
        pInfo->pDeleteDataRes->info.type = STREAM_DELETE_DATA;
        return pInfo->pDeleteDataRes;
      } break;
5
54liuyao 已提交
1974 1975 1976 1977 1978 1979 1980 1981 1982 1983
      case STREAM_SCAN_FROM_UPDATERES: {
        generateScanRange(pInfo, pInfo->pUpdateDataRes, pInfo->pUpdateRes);
        prepareRangeScan(pInfo, pInfo->pUpdateRes, &pInfo->updateResIndex);
        pInfo->scanMode = STREAM_SCAN_FROM_DATAREADER_RANGE;
        return pInfo->pUpdateRes;
      } break;
      case STREAM_SCAN_FROM_DATAREADER_RANGE:
      case STREAM_SCAN_FROM_DATAREADER_RETRIEVE: {
        SSDataBlock* pSDB = doRangeScan(pInfo, pInfo->pUpdateRes, pInfo->primaryTsIndex, &pInfo->updateResIndex);
        if (pSDB) {
1984
          STableScanInfo* pTableScanInfo = pInfo->pTableScanOp->info;
H
Haojun Liao 已提交
1985 1986
          uint64_t        version = getReaderMaxVersion(pTableScanInfo->base.dataReader);
          updateInfoSetScanRange(pInfo->pUpdateInfo, &pTableScanInfo->base.cond.twindows, pInfo->groupId, version);
5
54liuyao 已提交
1987 1988
          pSDB->info.type = pInfo->scanMode == STREAM_SCAN_FROM_DATAREADER_RANGE ? STREAM_NORMAL : STREAM_PULL_DATA;
          checkUpdateData(pInfo, true, pSDB, false);
1989
          // printDataBlock(pSDB, "stream scan update");
L
Liu Jicong 已提交
1990
          calBlockTbName(pInfo, pSDB);
5
54liuyao 已提交
1991 1992
          return pSDB;
        }
1993
        blockDataCleanup(pInfo->pUpdateDataRes);
5
54liuyao 已提交
1994 1995 1996 1997
        pInfo->scanMode = STREAM_SCAN_FROM_READERHANDLE;
      } break;
      default:
        break;
1998
    }
1999

2000
    SStreamAggSupporter* pSup = pInfo->windowSup.pStreamAggSup;
5
54liuyao 已提交
2001
    if (isStateWindow(pInfo) && pSup->pScanBlock->info.rows > 0) {
2002 2003
      pInfo->scanMode = STREAM_SCAN_FROM_DATAREADER_RANGE;
      pInfo->updateResIndex = 0;
5
54liuyao 已提交
2004 2005
      copyDataBlock(pInfo->pUpdateRes, pSup->pScanBlock);
      blockDataCleanup(pSup->pScanBlock);
2006 2007
      prepareRangeScan(pInfo, pInfo->pUpdateRes, &pInfo->updateResIndex);
      return pInfo->pUpdateRes;
5
54liuyao 已提交
2008
    }
5
54liuyao 已提交
2009

H
Haojun Liao 已提交
2010 2011
    SDataBlockInfo* pBlockInfo = &pInfo->pRes->info;

2012
    int32_t totBlockNum = taosArrayGetSize(pInfo->pBlockLists);
2013

L
Liu Jicong 已提交
2014
  NEXT_SUBMIT_BLK:
2015
    while (1) {
L
Liu Jicong 已提交
2016
      if (pInfo->tqReader->msg2.msgStr == NULL) {
2017
        if (pInfo->validBlockIndex >= totBlockNum) {
5
54liuyao 已提交
2018
          updateInfoDestoryColseWinSBF(pInfo->pUpdateInfo);
L
Liu Jicong 已提交
2019
          doClearBufferedBlocks(pInfo);
L
Liu Jicong 已提交
2020
          qDebug("stream scan return empty, consume block %d", totBlockNum);
2021 2022
          return NULL;
        }
2023

L
Liu Jicong 已提交
2024 2025
        int32_t      current = pInfo->validBlockIndex++;
        SPackedData* pSubmit = taosArrayGet(pInfo->pBlockLists, current);
L
Liu Jicong 已提交
2026
        /*if (tqReaderSetDataMsg(pInfo->tqReader, pSubmit, 0) < 0) {*/
L
Liu Jicong 已提交
2027
        if (tqReaderSetSubmitReq2(pInfo->tqReader, pSubmit->msgStr, pSubmit->msgLen, pSubmit->ver) < 0) {
2028 2029 2030 2031
          qError("submit msg messed up when initing stream submit block %p, current %d, total %d", pSubmit, current,
                 totBlockNum);
          continue;
        }
H
Haojun Liao 已提交
2032 2033
      }

2034 2035
      blockDataCleanup(pInfo->pRes);

L
Liu Jicong 已提交
2036
      while (tqNextDataBlock2(pInfo->tqReader)) {
2037
        SSDataBlock block = {0};
2038

2039
        int32_t code = tqRetrieveDataBlock2(&block, pInfo->tqReader, NULL);
2040 2041 2042 2043 2044

        if (code != TSDB_CODE_SUCCESS || block.info.rows == 0) {
          continue;
        }

2045
        setBlockIntoRes(pInfo, &block, false);
2046

H
Haojun Liao 已提交
2047
        if (updateInfoIgnore(pInfo->pUpdateInfo, &pInfo->pRes->info.window, pInfo->pRes->info.id.groupId,
L
Liu Jicong 已提交
2048
                             pInfo->pRes->info.version)) {
2049 2050 2051 2052 2053
          printDataBlock(pInfo->pRes, "stream scan ignore");
          blockDataCleanup(pInfo->pRes);
          continue;
        }

5
54liuyao 已提交
2054 2055 2056
        if (pInfo->pCreateTbRes->info.rows > 0) {
          pInfo->scanMode = STREAM_SCAN_FROM_RES;
          return pInfo->pCreateTbRes;
2057 2058
        }

5
54liuyao 已提交
2059
        doCheckUpdate(pInfo, pBlockInfo->window.ekey, pInfo->pRes);
H
Haojun Liao 已提交
2060
        doFilter(pInfo->pRes, pOperator->exprSupp.pFilterInfo, NULL);
2061
        pInfo->pRes->info.dataLoad = 1;
2062 2063 2064
        blockDataUpdateTsWindow(pInfo->pRes, pInfo->primaryTsIndex);

        if (pBlockInfo->rows > 0 || pInfo->pUpdateDataRes->info.rows > 0) {
2065 2066 2067
          break;
        }
      }
2068
      if (pBlockInfo->rows > 0 || pInfo->pUpdateDataRes->info.rows > 0) {
5
54liuyao 已提交
2069
        break;
J
jiacy-jcy 已提交
2070
      } else {
2071
        continue;
5
54liuyao 已提交
2072
      }
H
Haojun Liao 已提交
2073 2074 2075 2076
    }

    // record the scan action.
    pInfo->numOfExec++;
2077
    pOperator->resultInfo.totalRows += pBlockInfo->rows;
2078
    // printDataBlock(pInfo->pRes, "stream scan");
H
Haojun Liao 已提交
2079

L
Liu Jicong 已提交
2080
    qDebug("scan rows: %d", pBlockInfo->rows);
L
Liu Jicong 已提交
2081 2082 2083
    if (pBlockInfo->rows > 0) {
      return pInfo->pRes;
    }
2084 2085 2086 2087 2088 2089

    if (pInfo->pUpdateDataRes->info.rows > 0) {
      goto FETCH_NEXT_BLOCK;
    }

    goto NEXT_SUBMIT_BLK;
L
Liu Jicong 已提交
2090 2091 2092
  } else {
    ASSERT(0);
    return NULL;
H
Haojun Liao 已提交
2093 2094 2095
  }
}

H
Haojun Liao 已提交
2096
static SArray* extractTableIdList(const STableListInfo* pTableListInfo) {
2097 2098 2099
  SArray* tableIdList = taosArrayInit(4, sizeof(uint64_t));

  // Transfer the Array of STableKeyInfo into uid list.
H
Haojun Liao 已提交
2100 2101 2102
  size_t size = tableListGetSize(pTableListInfo);
  for (int32_t i = 0; i < size; ++i) {
    STableKeyInfo* pkeyInfo = tableListGetInfo(pTableListInfo, i);
2103 2104 2105 2106 2107 2108
    taosArrayPush(tableIdList, &pkeyInfo->uid);
  }

  return tableIdList;
}

2109
/**
 * Produce the next result of a raw (tmq snapshot) scan.
 *
 * The behaviour depends on pTaskInfo->streamInfo.prepareStatus.type:
 *  - TMQ_OFFSET__SNAPSHOT_DATA: return the next data block from the tsdb reader and record its
 *    uid/ts in streamInfo.lastStatus. When the reader has nothing more, look up the next table
 *    in the snapshot context, prepare the scan for it (or switch lastStatus to TMQ_OFFSET__LOG
 *    when no table is left) and return NULL.
 *  - TMQ_OFFSET__SNAPSHOT_META: fetch one meta entry from the snapshot context and publish it
 *    through streamInfo.metaRsp; always returns NULL.
 *  - any other type: returns NULL.
 *
 * On a killed task or a failed block retrieval the function leaves via longjmp(pTaskInfo->env).
 *
 * @param pOperator the raw scan operator; pOperator->info is a SStreamRawScanInfo.
 * @return a data block, or NULL when no data block is available for this call.
 */
static SSDataBlock* doRawScan(SOperatorInfo* pOperator) {
  // NOTE: this operator never checks whether its current status is already done
  SStreamRawScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*      pTaskInfo = pOperator->pTaskInfo;

  // metaRspLen != 0 is used to judge whether the result is meta
  pTaskInfo->streamInfo.metaRsp.metaRspLen = 0;
  pTaskInfo->streamInfo.metaRsp.metaRsp = NULL;

  qDebug("tmqsnap doRawScan called");

  if (pTaskInfo->streamInfo.prepareStatus.type == TMQ_OFFSET__SNAPSHOT_DATA) {
    bool hasBlock = (pInfo->dataReader != NULL) && tsdbNextDataBlock(pInfo->dataReader);
    if (hasBlock) {
      if (isTaskKilled(pTaskInfo)) {
        // give the block back to the reader before unwinding
        tsdbReleaseDataBlock(pInfo->dataReader);
        longjmp(pTaskInfo->env, pTaskInfo->code);
      }

      SSDataBlock* pBlock = tsdbRetrieveDataBlock(pInfo->dataReader, NULL);
      if (pBlock == NULL) {
        longjmp(pTaskInfo->env, terrno);
      }

      qDebug("tmqsnap doRawScan get data uid:%" PRId64 "", pBlock->info.id.uid);

      // remember how far the snapshot data scan has progressed
      pTaskInfo->streamInfo.lastStatus.type = TMQ_OFFSET__SNAPSHOT_DATA;
      pTaskInfo->streamInfo.lastStatus.uid = pBlock->info.id.uid;
      pTaskInfo->streamInfo.lastStatus.ts = pBlock->info.window.ekey;
      return pBlock;
    }

    // the current reader is exhausted (or absent): move on to the next table of the snapshot
    SMetaTableInfo mtInfo = getUidfromSnapShot(pInfo->sContext);
    if (mtInfo.uid != 0) {
      pTaskInfo->streamInfo.prepareStatus.uid = mtInfo.uid;
      pTaskInfo->streamInfo.prepareStatus.ts = INT64_MIN;
      qDebug("tmqsnap change get data uid:%" PRId64 "", mtInfo.uid);
      qStreamPrepareScan(pTaskInfo, &pTaskInfo->streamInfo.prepareStatus, pInfo->sContext->subType);
    } else {
      // read snapshot done, change to get data from wal
      qDebug("tmqsnap read snapshot done, change to get data from wal");
      pTaskInfo->streamInfo.prepareStatus.uid = mtInfo.uid;
      pTaskInfo->streamInfo.lastStatus.type = TMQ_OFFSET__LOG;
      pTaskInfo->streamInfo.lastStatus.version = pInfo->sContext->snapVersion;
    }

    tDeleteSSchemaWrapper(mtInfo.schema);
    qDebug("tmqsnap stream scan tsdb return null");
    return NULL;
  }

  if (pTaskInfo->streamInfo.prepareStatus.type == TMQ_OFFSET__SNAPSHOT_META) {
    SSnapContext* sContext = pInfo->sContext;

    int64_t uid = 0;
    int16_t type = 0;
    int32_t dataLen = 0;
    void*   data = NULL;
    if (getMetafromSnapShot(sContext, &data, &dataLen, &type, &uid) < 0) {
      qError("tmqsnap getMetafromSnapShot error");
      taosMemoryFreeClear(data);
      return NULL;
    }

    // both outcomes record the meta position that was just consumed
    pTaskInfo->streamInfo.lastStatus.type = TMQ_OFFSET__SNAPSHOT_META;
    pTaskInfo->streamInfo.lastStatus.uid = uid;

    if (sContext->queryMetaOrData) {
      // hand the meta entry to the caller through metaRsp
      pTaskInfo->streamInfo.metaRsp.rspOffset = pTaskInfo->streamInfo.lastStatus;
      pTaskInfo->streamInfo.metaRsp.resMsgType = type;
      pTaskInfo->streamInfo.metaRsp.metaRspLen = dataLen;
      pTaskInfo->streamInfo.metaRsp.metaRsp = data;
    } else {
      // change to get data next poll request
      pTaskInfo->streamInfo.metaRsp.rspOffset.type = TMQ_OFFSET__SNAPSHOT_DATA;
      pTaskInfo->streamInfo.metaRsp.rspOffset.uid = 0;
      pTaskInfo->streamInfo.metaRsp.rspOffset.ts = INT64_MIN;
    }

    return NULL;
  }

  // A TMQ_OFFSET__LOG branch that read from the wal used to follow here but is disabled;
  // every other offset type simply yields no block.
  return NULL;
}

wmmhello's avatar
wmmhello 已提交
2221
static void destroyRawScanOperatorInfo(void* param) {
wmmhello's avatar
wmmhello 已提交
2222 2223 2224 2225 2226 2227
  SStreamRawScanInfo* pRawScan = (SStreamRawScanInfo*)param;
  tsdbReaderClose(pRawScan->dataReader);
  destroySnapContext(pRawScan->sContext);
  taosMemoryFree(pRawScan);
}

L
Liu Jicong 已提交
2228 2229 2230
// for subscribing db or stb (not including column),
// if this scan is used, meta data can be return
// and schemas are decided when scanning
2231
/**
 * Create the raw scan operator.
 *
 * The operator info borrows the vnode and snapshot context pointers from the read handle and
 * is driven by doRawScan / released by destroyRawScanOperatorInfo.
 *
 * @param pHandle   read handle supplying vnode and sContext.
 * @param pTaskInfo owning task; pTaskInfo->code is set to TSDB_CODE_OUT_OF_MEMORY on failure.
 * @return the new operator, or NULL when either allocation fails.
 */
SOperatorInfo* createRawScanOperatorInfo(SReadHandle* pHandle, SExecTaskInfo* pTaskInfo) {
  SStreamRawScanInfo* pInfo = taosMemoryCalloc(1, sizeof(SStreamRawScanInfo));
  SOperatorInfo*      pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));

  if (pInfo != NULL && pOperator != NULL) {
    pInfo->vnode = pHandle->vnode;
    pInfo->sContext = pHandle->sContext;

    setOperatorInfo(pOperator, "RawScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_SCAN, false, OP_NOT_OPENED, pInfo,
                    pTaskInfo);
    pOperator->fpSet = createOperatorFpSet(NULL, doRawScan, NULL, destroyRawScanOperatorInfo, optrDefaultBufFn, NULL);
    return pOperator;
  }

  // at least one allocation failed: release whichever one succeeded and report the error
  int32_t code = TSDB_CODE_OUT_OF_MEMORY;
  taosMemoryFree(pInfo);
  taosMemoryFree(pOperator);
  pTaskInfo->code = code;
  return NULL;
}

2262
static void destroyStreamScanOperatorInfo(void* param) {
2263 2264
  SStreamScanInfo* pStreamScan = (SStreamScanInfo*)param;
  if (pStreamScan->pTableScanOp && pStreamScan->pTableScanOp->info) {
5
54liuyao 已提交
2265
    destroyOperatorInfo(pStreamScan->pTableScanOp);
2266 2267 2268 2269
  }
  if (pStreamScan->tqReader) {
    tqCloseReader(pStreamScan->tqReader);
  }
H
Haojun Liao 已提交
2270 2271
  if (pStreamScan->matchInfo.pList) {
    taosArrayDestroy(pStreamScan->matchInfo.pList);
2272
  }
C
Cary Xu 已提交
2273 2274
  if (pStreamScan->pPseudoExpr) {
    destroyExprInfo(pStreamScan->pPseudoExpr, pStreamScan->numOfPseudoExpr);
L
Liu Jicong 已提交
2275
    taosMemoryFree(pStreamScan->pPseudoExpr);
C
Cary Xu 已提交
2276
  }
C
Cary Xu 已提交
2277

L
Liu Jicong 已提交
2278
  cleanupExprSupp(&pStreamScan->tbnameCalSup);
5
54liuyao 已提交
2279
  cleanupExprSupp(&pStreamScan->tagCalSup);
L
Liu Jicong 已提交
2280

L
Liu Jicong 已提交
2281
  updateInfoDestroy(pStreamScan->pUpdateInfo);
2282 2283 2284 2285
  blockDataDestroy(pStreamScan->pRes);
  blockDataDestroy(pStreamScan->pUpdateRes);
  blockDataDestroy(pStreamScan->pPullDataRes);
  blockDataDestroy(pStreamScan->pDeleteDataRes);
5
54liuyao 已提交
2286
  blockDataDestroy(pStreamScan->pUpdateDataRes);
5
54liuyao 已提交
2287
  blockDataDestroy(pStreamScan->pCreateTbRes);
2288 2289 2290 2291
  taosArrayDestroy(pStreamScan->pBlockLists);
  taosMemoryFree(pStreamScan);
}

2292
SOperatorInfo* createStreamScanOperatorInfo(SReadHandle* pHandle, STableScanPhysiNode* pTableScanNode, SNode* pTagCond,
2293
                                            SExecTaskInfo* pTaskInfo) {
H
Haojun Liao 已提交
2294
  SArray*          pColIds = NULL;
2295 2296
  SStreamScanInfo* pInfo = taosMemoryCalloc(1, sizeof(SStreamScanInfo));
  SOperatorInfo*   pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
2297

H
Haojun Liao 已提交
2298
  if (pInfo == NULL || pOperator == NULL) {
S
Shengliang Guan 已提交
2299
    terrno = TSDB_CODE_OUT_OF_MEMORY;
2300
    goto _error;
H
Haojun Liao 已提交
2301 2302
  }

2303
  SScanPhysiNode*     pScanPhyNode = &pTableScanNode->scan;
2304
  SDataBlockDescNode* pDescNode = pScanPhyNode->node.pOutputDataBlockDesc;
H
Haojun Liao 已提交
2305

2306
  pInfo->pTagCond = pTagCond;
2307
  pInfo->pGroupTags = pTableScanNode->pGroupTags;
2308

2309
  int32_t numOfCols = 0;
2310 2311
  int32_t code =
      extractColMatchInfo(pScanPhyNode->pScanCols, pDescNode, &numOfCols, COL_MATCH_FROM_COL_ID, &pInfo->matchInfo);
H
Haojun Liao 已提交
2312 2313 2314
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
2315

H
Haojun Liao 已提交
2316
  int32_t numOfOutput = taosArrayGetSize(pInfo->matchInfo.pList);
H
Haojun Liao 已提交
2317
  pColIds = taosArrayInit(numOfOutput, sizeof(int16_t));
2318
  for (int32_t i = 0; i < numOfOutput; ++i) {
H
Haojun Liao 已提交
2319
    SColMatchItem* id = taosArrayGet(pInfo->matchInfo.pList, i);
2320 2321

    int16_t colId = id->colId;
2322
    taosArrayPush(pColIds, &colId);
2323
    if (id->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
H
Haojun Liao 已提交
2324
      pInfo->primaryTsIndex = id->dstSlotId;
5
54liuyao 已提交
2325
    }
H
Haojun Liao 已提交
2326 2327
  }

L
Liu Jicong 已提交
2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340
  if (pTableScanNode->pSubtable != NULL) {
    SExprInfo* pSubTableExpr = taosMemoryCalloc(1, sizeof(SExprInfo));
    if (pSubTableExpr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }
    pInfo->tbnameCalSup.pExprInfo = pSubTableExpr;
    createExprFromOneNode(pSubTableExpr, pTableScanNode->pSubtable, 0);
    if (initExprSupp(&pInfo->tbnameCalSup, pSubTableExpr, 1) != 0) {
      goto _error;
    }
  }

2341 2342
  if (pTableScanNode->pTags != NULL) {
    int32_t    numOfTags;
5
54liuyao 已提交
2343
    SExprInfo* pTagExpr = createExpr(pTableScanNode->pTags, &numOfTags);
2344 2345 2346 2347 2348 2349 2350 2351 2352 2353
    if (pTagExpr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }
    if (initExprSupp(&pInfo->tagCalSup, pTagExpr, numOfTags) != 0) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }
  }

L
Liu Jicong 已提交
2354
  pInfo->pBlockLists = taosArrayInit(4, sizeof(SPackedData));
H
Haojun Liao 已提交
2355
  if (pInfo->pBlockLists == NULL) {
2356 2357
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
H
Haojun Liao 已提交
2358 2359
  }

5
54liuyao 已提交
2360
  if (pHandle->vnode) {
L
Liu Jicong 已提交
2361
    SOperatorInfo*  pTableScanOp = createTableScanOperatorInfo(pTableScanNode, pHandle, pTaskInfo);
L
Liu Jicong 已提交
2362
    STableScanInfo* pTSInfo = (STableScanInfo*)pTableScanOp->info;
2363
    if (pHandle->version > 0) {
H
Haojun Liao 已提交
2364
      pTSInfo->base.cond.endVersion = pHandle->version;
2365
    }
L
Liu Jicong 已提交
2366

2367
    STableKeyInfo* pList = NULL;
5
54liuyao 已提交
2368
    int32_t        num = 0;
H
Haojun Liao 已提交
2369
    tableListGetGroupList(pTaskInfo->pTableInfoList, 0, &pList, &num);
2370

2371
    if (pHandle->initTableReader) {
L
Liu Jicong 已提交
2372
      pTSInfo->scanMode = TABLE_SCAN__TABLE_ORDER;
H
Haojun Liao 已提交
2373
      pTSInfo->base.dataReader = NULL;
2374
      pTaskInfo->streamInfo.lastStatus.uid = -1;
L
Liu Jicong 已提交
2375 2376
    }

L
Liu Jicong 已提交
2377 2378 2379 2380
    if (pHandle->initTqReader) {
      ASSERT(pHandle->tqReader == NULL);
      pInfo->tqReader = tqOpenReader(pHandle->vnode);
      ASSERT(pInfo->tqReader);
2381
    } else {
L
Liu Jicong 已提交
2382 2383
      ASSERT(pHandle->tqReader);
      pInfo->tqReader = pHandle->tqReader;
2384 2385
    }

2386
    pInfo->pUpdateInfo = NULL;
2387
    pInfo->pTableScanOp = pTableScanOp;
2388 2389 2390
    if (pInfo->pTableScanOp->pTaskInfo->streamInfo.pState) {
      streamStateSetNumber(pInfo->pTableScanOp->pTaskInfo->streamInfo.pState, -1);
    }
L
Liu Jicong 已提交
2391

L
Liu Jicong 已提交
2392 2393
    pInfo->readHandle = *pHandle;
    pInfo->tableUid = pScanPhyNode->uid;
L
Liu Jicong 已提交
2394
    pTaskInfo->streamInfo.snapshotVer = pHandle->version;
5
54liuyao 已提交
2395 2396
    pInfo->pCreateTbRes = buildCreateTableBlock(&pInfo->tbnameCalSup, &pInfo->tagCalSup);
    blockDataEnsureCapacity(pInfo->pCreateTbRes, 8);
L
Liu Jicong 已提交
2397

L
Liu Jicong 已提交
2398
    // set the extract column id to streamHandle
L
Liu Jicong 已提交
2399
    tqReaderSetColIdList(pInfo->tqReader, pColIds);
H
Haojun Liao 已提交
2400
    SArray* tableIdList = extractTableIdList(pTaskInfo->pTableInfoList);
2401
    code = tqReaderSetTbUidList(pInfo->tqReader, tableIdList);
L
Liu Jicong 已提交
2402 2403 2404 2405 2406
    if (code != 0) {
      taosArrayDestroy(tableIdList);
      goto _error;
    }
    taosArrayDestroy(tableIdList);
H
Haojun Liao 已提交
2407
    memcpy(&pTaskInfo->streamInfo.tableCond, &pTSInfo->base.cond, sizeof(SQueryTableDataCond));
L
Liu Jicong 已提交
2408 2409
  } else {
    taosArrayDestroy(pColIds);
H
Haojun Liao 已提交
2410
    pColIds = NULL;
5
54liuyao 已提交
2411 2412
  }

2413 2414 2415 2416 2417
  // create the pseduo columns info
  if (pTableScanNode->scan.pScanPseudoCols != NULL) {
    pInfo->pPseudoExpr = createExprInfo(pTableScanNode->scan.pScanPseudoCols, NULL, &pInfo->numOfPseudoExpr);
  }

H
Haojun Liao 已提交
2418 2419 2420 2421 2422
  code = filterInitFromNode((SNode*)pScanPhyNode->node.pConditions, &pOperator->exprSupp.pFilterInfo, 0);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

H
Haojun Liao 已提交
2423
  pInfo->pRes = createDataBlockFromDescNode(pDescNode);
2424
  pInfo->pUpdateRes = createSpecialDataBlock(STREAM_CLEAR);
2425
  pInfo->scanMode = STREAM_SCAN_FROM_READERHANDLE;
L
Liu Jicong 已提交
2426
  pInfo->windowSup = (SWindowSupporter){.pStreamAggSup = NULL, .gap = -1, .parentType = QUERY_NODE_PHYSICAL_PLAN};
2427
  pInfo->groupId = 0;
2428
  pInfo->pPullDataRes = createSpecialDataBlock(STREAM_RETRIEVE);
2429
  pInfo->pStreamScanOp = pOperator;
2430
  pInfo->deleteDataIndex = 0;
2431
  pInfo->pDeleteDataRes = createSpecialDataBlock(STREAM_DELETE_DATA);
5
54liuyao 已提交
2432
  pInfo->updateWin = (STimeWindow){.skey = INT64_MAX, .ekey = INT64_MAX};
2433
  pInfo->pUpdateDataRes = createSpecialDataBlock(STREAM_CLEAR);
X
Xiaoyu Wang 已提交
2434
  pInfo->assignBlockUid = pTableScanNode->assignBlockUid;
2435
  pInfo->partitionSup.needCalc = false;
5
54liuyao 已提交
2436 2437
  pInfo->igCheckUpdate = pTableScanNode->igCheckUpdate;
  pInfo->igExpired = pTableScanNode->igExpired;
2438
  pInfo->twAggSup.maxTs = INT64_MIN;
L
Liu Jicong 已提交
2439

L
Liu Jicong 已提交
2440 2441
  setOperatorInfo(pOperator, "StreamScanOperator", QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN, false, OP_NOT_OPENED, pInfo,
                  pTaskInfo);
2442
  pOperator->exprSupp.numOfExprs = taosArrayGetSize(pInfo->pRes->pDataBlock);
H
Haojun Liao 已提交
2443

L
Liu Jicong 已提交
2444
  __optr_fn_t nextFn = pTaskInfo->execModel == OPTR_EXEC_MODEL_STREAM ? doStreamScan : doQueueScan;
L
Liu Jicong 已提交
2445 2446
  pOperator->fpSet =
      createOperatorFpSet(optrDummyOpenFn, nextFn, NULL, destroyStreamScanOperatorInfo, optrDefaultBufFn, NULL);
2447

H
Haojun Liao 已提交
2448
  return pOperator;
2449

L
Liu Jicong 已提交
2450
_error:
H
Haojun Liao 已提交
2451 2452 2453 2454 2455 2456 2457 2458
  if (pColIds != NULL) {
    taosArrayDestroy(pColIds);
  }

  if (pInfo != NULL) {
    destroyStreamScanOperatorInfo(pInfo);
  }

2459 2460
  taosMemoryFreeClear(pOperator);
  return NULL;
H
Haojun Liao 已提交
2461 2462
}

2463
/**
 * Produce the next batch of rows for the tag scan operator.
 *
 * Starting at pInfo->curPos, one output row is built per table of the task's table list until
 * either the list is exhausted or resultInfo.capacity rows have been produced. For each output
 * expression the row receives either the table name (scan pseudo column functions) or the
 * value of the referenced tag. When the last table has been consumed the operator and the task
 * are marked completed.
 *
 * A failing meta lookup leaves through T_LONG_JMP(pTaskInfo->env, terrno).
 *
 * @param pOperator the tag scan operator; pOperator->info is a STagScanInfo.
 * @return pInfo->pRes filled with the produced rows, or NULL when no row was produced.
 */
static SSDataBlock* doTagScan(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExecTaskInfo* pTaskInfo = pOperator->pTaskInfo;
  STagScanInfo*  pInfo = pOperator->info;
  SExprInfo*     pExprInfo = &pOperator->exprSupp.pExprInfo[0];
  SSDataBlock*   pRes = pInfo->pRes;

  blockDataCleanup(pRes);

  int32_t size = tableListGetSize(pTaskInfo->pTableInfoList);
  if (size == 0) {
    setTaskStatus(pTaskInfo, TASK_COMPLETED);
    return NULL;
  }

  char        str[512] = {0};  // scratch buffer for the table name in varstr form
  int32_t     count = 0;       // rows produced by this call
  SMetaReader mr = {0};
  metaReaderInit(&mr, pInfo->readHandle.meta, 0);

  while (pInfo->curPos < size && count < pOperator->resultInfo.capacity) {
    STableKeyInfo* item = tableListGetInfo(pTaskInfo->pTableInfoList, pInfo->curPos);

    int32_t code = metaGetTableEntryByUid(&mr, item->uid);
    tDecoderClear(&mr.coder);
    if (code != TSDB_CODE_SUCCESS) {
      qError("failed to get table meta, uid:0x%" PRIx64 ", code:%s, %s", item->uid, tstrerror(terrno),
             GET_TASKID(pTaskInfo));
      metaReaderClear(&mr);
      T_LONG_JMP(pTaskInfo->env, terrno);
    }

    for (int32_t j = 0; j < pOperator->exprSupp.numOfExprs; ++j) {
      SExprInfo*       pOneExpr = &pExprInfo[j];
      SColumnInfoData* pDst = taosArrayGet(pRes->pDataBlock, pOneExpr->base.resSchema.slotId);

      // refactor later
      if (fmIsScanPseudoColumnFunc(pOneExpr->pExpr->_function.functionId)) {
        STR_TO_VARSTR(str, mr.me.name);
        colDataSetVal(pDst, count, str, false);
        continue;
      }

      // it is a tag value
      STagVal val = {0};
      val.cid = pOneExpr->base.pParam[0].pCol->colId;
      const char* p = metaGetTableTagVal(mr.me.ctbEntry.pTags, pDst->info.type, &val);

      bool isJson = (pDst->info.type == TSDB_DATA_TYPE_JSON);

      // non-json tags are converted from the STagVal; json tags are used as returned
      char* data = (!isJson && p != NULL) ? tTagValToData((const STagVal*)p, false) : (char*)p;

      bool isNull = (data == NULL) || (isJson && tTagIsJsonNull(data));
      colDataSetVal(pDst, count, data, isNull);

      // release the converted copy of a variable-length, non-json tag value
      if (!isJson && p != NULL && IS_VAR_DATA_TYPE(((const STagVal*)p)->type) && data != NULL) {
        taosMemoryFree(data);
      }
    }

    count += 1;
    pInfo->curPos += 1;
    if (pInfo->curPos >= size) {
      setOperatorCompleted(pOperator);
    }
  }

  metaReaderClear(&mr);

  // qDebug("QInfo:0x%"PRIx64" create tag values results completed, rows:%d", GET_TASKID(pRuntimeEnv), count);
  if (pOperator->status == OP_EXEC_DONE) {
    setTaskStatus(pTaskInfo, TASK_COMPLETED);
  }

  pRes->info.rows = count;
  pOperator->resultInfo.totalRows += count;

  if (pRes->info.rows == 0) {
    return NULL;
  }
  return pInfo->pRes;
}

2544
static void destroyTagScanOperatorInfo(void* param) {
H
Haojun Liao 已提交
2545 2546
  STagScanInfo* pInfo = (STagScanInfo*)param;
  pInfo->pRes = blockDataDestroy(pInfo->pRes);
H
Haojun Liao 已提交
2547
  taosArrayDestroy(pInfo->matchInfo.pList);
D
dapan1121 已提交
2548
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
2549 2550
}

S
slzhou 已提交
2551 2552
/*
 * Build the tag scan operator for the given physical plan node.
 *
 * Returns the new operator, or NULL on failure. On failure terrno carries the
 * code reported by the failing step (TSDB_CODE_OUT_OF_MEMORY for allocation
 * failures) and everything allocated so far is released.
 */
SOperatorInfo* createTagScanOperatorInfo(SReadHandle* pReadHandle, STagScanPhysiNode* pPhyNode,
                                         SExecTaskInfo* pTaskInfo) {
  // declared before the first goto so the error path always reads a defined value
  int32_t code = TSDB_CODE_SUCCESS;

  STagScanInfo*  pInfo = taosMemoryCalloc(1, sizeof(STagScanInfo));
  SOperatorInfo* pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  SDataBlockDescNode* pDescNode = pPhyNode->node.pOutputDataBlockDesc;

  int32_t    numOfExprs = 0;
  SExprInfo* pExprInfo = createExprInfo(pPhyNode->pScanPseudoCols, NULL, &numOfExprs);
  code = initExprSupp(&pOperator->exprSupp, pExprInfo, numOfExprs);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  int32_t num = 0;
  code = extractColMatchInfo(pPhyNode->pScanPseudoCols, pDescNode, &num, COL_MATCH_FROM_COL_ID, &pInfo->matchInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  pInfo->pRes = createDataBlockFromDescNode(pDescNode);
  if (pInfo->pRes == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pInfo->readHandle = *pReadHandle;
  pInfo->curPos = 0;

  setOperatorInfo(pOperator, "TagScanOperator", QUERY_NODE_PHYSICAL_PLAN_TAG_SCAN, false, OP_NOT_OPENED, pInfo,
                  pTaskInfo);
  initResultSizeInfo(&pOperator->resultInfo, 4096);
  blockDataEnsureCapacity(pInfo->pRes, pOperator->resultInfo.capacity);

  pOperator->fpSet =
      createOperatorFpSet(optrDummyOpenFn, doTagScan, NULL, destroyTagScanOperatorInfo, optrDefaultBufFn, NULL);

  return pOperator;

_error:
  if (pInfo != NULL) {
    // releases pRes and matchInfo.pList (whichever were created) together with pInfo
    destroyTagScanOperatorInfo(pInfo);
  }
  if (pOperator != NULL) {
    // NOTE(review): assumes initExprSupp stores pExprInfo in exprSupp even when it fails - confirm
    cleanupExprSupp(&pOperator->exprSupp);
    taosMemoryFree(pOperator);
  }
  terrno = (code != TSDB_CODE_SUCCESS) ? code : TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}
2594

dengyihao's avatar
dengyihao 已提交
2595
static SSDataBlock* getTableDataBlockImpl(void* param) {
dengyihao's avatar
opt mem  
dengyihao 已提交
2596 2597 2598 2599 2600 2601
  STableMergeScanSortSourceParam* source = param;
  SOperatorInfo*                  pOperator = source->pOperator;
  STableMergeScanInfo*            pInfo = pOperator->info;
  SExecTaskInfo*                  pTaskInfo = pOperator->pTaskInfo;
  int32_t                         readIdx = source->readerIdx;
  SSDataBlock*                    pBlock = source->inputBlock;
2602
  int32_t                         code = 0;
dengyihao's avatar
opt mem  
dengyihao 已提交
2603

H
Haojun Liao 已提交
2604
  SQueryTableDataCond* pQueryCond = taosArrayGet(pInfo->queryConds, readIdx);
dengyihao's avatar
opt mem  
dengyihao 已提交
2605

L
Liu Jicong 已提交
2606 2607
  int64_t      st = taosGetTimestampUs();
  void*        p = tableListGetInfo(pTaskInfo->pTableInfoList, readIdx + pInfo->tableStartIndex);
H
Haojun Liao 已提交
2608
  SReadHandle* pHandle = &pInfo->base.readHandle;
dengyihao's avatar
dengyihao 已提交
2609

D
dapan1121 已提交
2610
  if (NULL == source->dataReader || !source->multiReader) {
D
dapan1121 已提交
2611
    code = tsdbReaderOpen(pHandle->vnode, pQueryCond, p, 1, pBlock, &source->dataReader, GET_TASKID(pTaskInfo), false);
2612 2613 2614
    if (code != 0) {
      T_LONG_JMP(pTaskInfo->env, code);
    }
dengyihao's avatar
dengyihao 已提交
2615
  }
2616 2617
  
  pInfo->base.dataReader = source->dataReader;
H
Haojun Liao 已提交
2618
  STsdbReader* reader = pInfo->base.dataReader;
2619
  qTrace("tsdb/read-table-data: %p, enter next reader", reader);
dengyihao's avatar
opt mem  
dengyihao 已提交
2620
  while (tsdbNextDataBlock(reader)) {
H
Haojun Liao 已提交
2621
    if (isTaskKilled(pTaskInfo)) {
X
Xiaoyu Wang 已提交
2622
      tsdbReleaseDataBlock(reader);
D
dapan1121 已提交
2623
      pInfo->base.dataReader = NULL;
2624
      T_LONG_JMP(pTaskInfo->env, pTaskInfo->code);
dengyihao's avatar
opt mem  
dengyihao 已提交
2625 2626 2627
    }

    // process this data block based on the probabilities
H
Haojun Liao 已提交
2628
    bool processThisBlock = processBlockWithProbability(&pInfo->sample);
dengyihao's avatar
opt mem  
dengyihao 已提交
2629 2630 2631 2632
    if (!processThisBlock) {
      continue;
    }

H
Haojun Liao 已提交
2633
    if (pQueryCond->order == TSDB_ORDER_ASC) {
dengyihao's avatar
opt mem  
dengyihao 已提交
2634 2635 2636 2637
      pQueryCond->twindows.skey = pBlock->info.window.ekey + 1;
    } else {
      pQueryCond->twindows.ekey = pBlock->info.window.skey - 1;
    }
dengyihao's avatar
opt mem  
dengyihao 已提交
2638 2639

    uint32_t status = 0;
2640
    code = loadDataBlock(pOperator, &pInfo->base, pBlock, &status);
S
slzhou 已提交
2641
    //    code = loadDataBlockFromOneTable(pOperator, pTableScanInfo, pBlock, &status);
dengyihao's avatar
opt mem  
dengyihao 已提交
2642
    if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
2643
      T_LONG_JMP(pTaskInfo->env, code);
dengyihao's avatar
opt mem  
dengyihao 已提交
2644 2645 2646 2647 2648 2649 2650
    }

    // current block is filter out according to filter condition, continue load the next block
    if (status == FUNC_DATA_REQUIRED_FILTEROUT || pBlock->info.rows == 0) {
      continue;
    }

H
Haojun Liao 已提交
2651
    pBlock->info.id.groupId = getTableGroupId(pTaskInfo->pTableInfoList, pBlock->info.id.uid);
dengyihao's avatar
opt mem  
dengyihao 已提交
2652

H
Haojun Liao 已提交
2653
    pOperator->resultInfo.totalRows += pBlock->info.rows;
H
Haojun Liao 已提交
2654
    pInfo->base.readRecorder.elapsedTime += (taosGetTimestampUs() - st) / 1000.0;
dengyihao's avatar
opt mem  
dengyihao 已提交
2655

2656
    qTrace("tsdb/read-table-data: %p, close reader", reader);
D
dapan1121 已提交
2657 2658 2659 2660
    if (!source->multiReader) {
      tsdbReaderClose(pInfo->base.dataReader);
      source->dataReader = NULL;
    }
H
Haojun Liao 已提交
2661
    pInfo->base.dataReader = NULL;
dengyihao's avatar
opt mem  
dengyihao 已提交
2662 2663
    return pBlock;
  }
H
Haojun Liao 已提交
2664

D
dapan1121 已提交
2665 2666 2667 2668
  if (!source->multiReader) {
    tsdbReaderClose(pInfo->base.dataReader);
    source->dataReader = NULL;
  }
H
Haojun Liao 已提交
2669
  pInfo->base.dataReader = NULL;
dengyihao's avatar
opt mem  
dengyihao 已提交
2670 2671 2672
  return NULL;
}

2673 2674 2675
/*
 * Build the single-entry sort-order list used to merge blocks by timestamp.
 *
 * The entry's slot id is the destination slot of the primary timestamp column
 * found in `colMatchInfo` (slot 0 when none is found; the last match wins),
 * its order is `order`, and nulls are placed first.
 *
 * Returns a new SArray of SBlockOrderInfo owned by the caller, or NULL when the
 * array cannot be allocated.
 */
SArray* generateSortByTsInfo(SArray* colMatchInfo, int32_t order) {
  int32_t tsTargetSlotId = 0;
  int32_t numOfItems = (int32_t)taosArrayGetSize(colMatchInfo);
  for (int32_t i = 0; i < numOfItems; ++i) {
    SColMatchItem* colInfo = taosArrayGet(colMatchInfo, i);
    if (colInfo->colId == PRIMARYKEY_TIMESTAMP_COL_ID) {
      tsTargetSlotId = colInfo->dstSlotId;
    }
  }

  SArray* pList = taosArrayInit(1, sizeof(SBlockOrderInfo));
  if (pList == NULL) {
    return NULL;
  }

  SBlockOrderInfo bi = {0};
  bi.order = order;
  bi.slotId = tsTargetSlotId;
  bi.nullFirst = NULL_ORDER_FIRST;

  taosArrayPush(pList, &bi);

  return pList;
}

H
Haojun Liao 已提交
2693
/*
 * Copy a query condition: all fields are copied bitwise from `src`, except
 * colList, which gets its own freshly allocated array holding a copy of the
 * src->numOfCols column descriptors. The caller frees dst->colList.
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the column list
 * cannot be allocated (dst->colList is NULL in that case).
 */
int32_t dumpQueryTableCond(const SQueryTableDataCond* src, SQueryTableDataCond* dst) {
  memcpy((void*)dst, (const void*)src, sizeof(SQueryTableDataCond));

  dst->colList = taosMemoryCalloc(src->numOfCols, sizeof(SColumnInfo));
  if (dst->colList == NULL) {
    // a NULL result for an empty column list is not an error
    return (src->numOfCols > 0) ? TSDB_CODE_OUT_OF_MEMORY : TSDB_CODE_SUCCESS;
  }

  for (int32_t i = 0; i < src->numOfCols; i++) {
    dst->colList[i] = src->colList[i];
  }
  return TSDB_CODE_SUCCESS;
}
H
Haojun Liao 已提交
2701

2702
/*
 * Start the merge scan of one table group.
 *
 * Determines the last table (tableEndIndex) that shares pInfo->groupId with the
 * table at tableStartIndex, creates a multi-source merge sort handle with one
 * sort source per table of the group, and opens the sort.
 *
 * Returns TSDB_CODE_SUCCESS. Failures (allocation failures, failure to open the
 * sort) leave through T_LONG_JMP on the task's jump buffer.
 */
int32_t startGroupTableMergeScan(SOperatorInfo* pOperator) {
  STableMergeScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;
  int32_t              code = TSDB_CODE_SUCCESS;

  {
    // extend the group until the first table with a different group id
    size_t  numOfTables = tableListGetSize(pTaskInfo->pTableInfoList);
    int32_t i = pInfo->tableStartIndex + 1;
    for (; i < numOfTables; ++i) {
      STableKeyInfo* tableKeyInfo = tableListGetInfo(pTaskInfo->pTableInfoList, i);
      if (tableKeyInfo->groupId != pInfo->groupId) {
        break;
      }
    }
    pInfo->tableEndIndex = i - 1;
  }

  int32_t tableStartIdx = pInfo->tableStartIndex;
  int32_t tableEndIdx = pInfo->tableEndIndex;

  pInfo->base.dataReader = NULL;

  // todo the total available buffer should be determined by total capacity of buffer of this task.
  // the additional one is reserved for merge result
  pInfo->sortBufSize = pInfo->bufPageSize * (tableEndIdx - tableStartIdx + 1 + 1);
  int32_t numOfBufPage = pInfo->sortBufSize / pInfo->bufPageSize;
  pInfo->pSortHandle = tsortCreateSortHandle(pInfo->pSortInfo, SORT_MULTISOURCE_MERGE, pInfo->bufPageSize, numOfBufPage,
                                             pInfo->pSortInputBlock, pTaskInfo->id.str);
  if (pInfo->pSortHandle == NULL) {
    T_LONG_JMP(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
  }

  tsortSetFetchRawDataFp(pInfo->pSortHandle, getTableDataBlockImpl, NULL, NULL);

  // one table has one data block
  int32_t numOfTable = tableEndIdx - tableStartIdx + 1;
  pInfo->queryConds = taosArrayInit(numOfTable, sizeof(SQueryTableDataCond));
  if (pInfo->queryConds == NULL) {
    T_LONG_JMP(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
  }

  for (int32_t i = 0; i < numOfTable; ++i) {
    STableMergeScanSortSourceParam param = {0};
    param.readerIdx = i;
    param.pOperator = pOperator;
    param.multiReader = (numOfTable <= MULTI_READER_MAX_TABLE_NUM) ? true : false;
    param.inputBlock = createOneDataBlock(pInfo->pResBlock, false);
    if (param.inputBlock == NULL) {
      T_LONG_JMP(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }
    blockDataEnsureCapacity(param.inputBlock, pOperator->resultInfo.capacity);

    SQueryTableDataCond cond;
    code = dumpQueryTableCond(&pInfo->base.cond, &cond);
    if (code != TSDB_CODE_SUCCESS) {
      // nothing has been published for this table yet, release its block here
      blockDataDestroy(param.inputBlock);
      T_LONG_JMP(pTaskInfo->env, code);
    }

    // publish both entries together: the stop/destroy routines walk
    // sortSourceParams using the size of queryConds
    taosArrayPush(pInfo->sortSourceParams, &param);
    taosArrayPush(pInfo->queryConds, &cond);
  }

  // second pass: the sort sources keep pointers into sortSourceParams, so they
  // are taken only after the array has stopped growing
  for (int32_t i = 0; i < numOfTable; ++i) {
    SSortSource* ps = taosMemoryCalloc(1, sizeof(SSortSource));
    if (ps == NULL) {
      T_LONG_JMP(pTaskInfo->env, TSDB_CODE_OUT_OF_MEMORY);
    }

    STableMergeScanSortSourceParam* param = taosArrayGet(pInfo->sortSourceParams, i);
    ps->param = param;
    ps->onlyRef = true;
    tsortAddSource(pInfo->pSortHandle, ps);
  }

  code = tsortOpen(pInfo->pSortHandle);

  if (code != TSDB_CODE_SUCCESS) {
    T_LONG_JMP(pTaskInfo->env, terrno);
  }

  return TSDB_CODE_SUCCESS;
}

/*
 * Finish the merge scan of the current table group: fold the sort statistics of
 * the group into the operator's totals, release the per-table sort sources
 * (input block and reader), destroy the sort handle and the per-table query
 * conditions, and reset the limit info for the next group.
 *
 * Always returns TSDB_CODE_SUCCESS.
 */
int32_t stopGroupTableMergeScan(SOperatorInfo* pOperator) {
  STableMergeScanInfo* pScan = pOperator->info;

  int32_t nTables = taosArrayGetSize(pScan->queryConds);

  // sort method/buffer describe the latest group, the counters accumulate
  SSortExecInfo groupStat = tsortGetSortExecInfo(pScan->pSortHandle);
  pScan->sortExecInfo.sortMethod = groupStat.sortMethod;
  pScan->sortExecInfo.sortBuffer = groupStat.sortBuffer;
  pScan->sortExecInfo.loops += groupStat.loops;
  pScan->sortExecInfo.readBytes += groupStat.readBytes;
  pScan->sortExecInfo.writeBytes += groupStat.writeBytes;

  int32_t idx = 0;
  while (idx < nTables) {
    STableMergeScanSortSourceParam* pSrc = taosArrayGet(pScan->sortSourceParams, idx);
    blockDataDestroy(pSrc->inputBlock);
    tsdbReaderClose(pSrc->dataReader);
    pSrc->dataReader = NULL;
    ++idx;
  }
  taosArrayClear(pScan->sortSourceParams);

  tsortDestroySortHandle(pScan->pSortHandle);
  pScan->pSortHandle = NULL;

  // each condition owns its column list (see dumpQueryTableCond)
  for (idx = 0; idx < nTables; ++idx) {
    SQueryTableDataCond* pCond = taosArrayGet(pScan->queryConds, idx);
    taosMemoryFree(pCond->colList);
  }
  taosArrayDestroy(pScan->queryConds);
  pScan->queryConds = NULL;

  resetLimitInfoForNextGroup(&pScan->limitInfo);
  return TSDB_CODE_SUCCESS;
}

2803 2804
// all data produced by this function only belongs to one group
// slimit/soffset does not need to be concerned here, since this function only deal with data within one group.
L
Liu Jicong 已提交
2805 2806
SSDataBlock* getSortedTableMergeScanBlockData(SSortHandle* pHandle, SSDataBlock* pResBlock, int32_t capacity,
                                              SOperatorInfo* pOperator) {
2807 2808 2809
  STableMergeScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;

2810
  blockDataCleanup(pResBlock);
2811 2812

  while (1) {
2813
    STupleHandle* pTupleHandle = tsortNextTuple(pHandle);
2814 2815 2816 2817
    if (pTupleHandle == NULL) {
      break;
    }

2818 2819
    appendOneRowToDataBlock(pResBlock, pTupleHandle);
    if (pResBlock->info.rows >= capacity) {
2820 2821 2822 2823
      break;
    }
  }

2824
  bool limitReached = applyLimitOffset(&pInfo->limitInfo, pResBlock, pTaskInfo);
X
Xiaoyu Wang 已提交
2825
  qDebug("%s get sorted row block, rows:%d, limit:%" PRId64, GET_TASKID(pTaskInfo), pResBlock->info.rows,
2826
         pInfo->limitInfo.numOfOutputRows);
2827

2828
  return (pResBlock->info.rows > 0) ? pResBlock : NULL;
2829 2830 2831 2832 2833 2834 2835 2836 2837 2838 2839 2840
}

/*
 * "Get next" function of the table merge scan operator.
 *
 * Tables are processed group by group: the first call starts the scan of the
 * group of table 0; whenever the current group is drained the scan is stopped
 * and restarted on the next group. Each returned block carries the id of the
 * group it was produced from.
 *
 * Returns the next non-empty block, or NULL once the operator is completed.
 */
SSDataBlock* doTableMergeScan(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  STableMergeScanInfo* pInfo = pOperator->info;
  SExecTaskInfo*       pTaskInfo = pOperator->pTaskInfo;

  int32_t code = pOperator->fpSet._openFn(pOperator);
  if (code != TSDB_CODE_SUCCESS) {
    T_LONG_JMP(pTaskInfo->env, code);
  }

  size_t tableListSize = tableListGetSize(pTaskInfo->pTableInfoList);

  // first invocation: pick the first group and start scanning it
  if (!pInfo->hasGroupId) {
    pInfo->hasGroupId = true;

    if (tableListSize == 0) {
      setOperatorCompleted(pOperator);
      return NULL;
    }

    pInfo->tableStartIndex = 0;
    pInfo->groupId = ((STableKeyInfo*)tableListGetInfo(pTaskInfo->pTableInfoList, pInfo->tableStartIndex))->groupId;
    startGroupTableMergeScan(pOperator);
  }

  while (pInfo->tableStartIndex < tableListSize) {
    if (isTaskKilled(pTaskInfo)) {
      T_LONG_JMP(pTaskInfo->env, pTaskInfo->code);
    }

    SSDataBlock* pSorted = getSortedTableMergeScanBlockData(pInfo->pSortHandle, pInfo->pResBlock,
                                                            pOperator->resultInfo.capacity, pOperator);
    if (pSorted != NULL) {
      pSorted->info.id.groupId = pInfo->groupId;
      pOperator->resultInfo.totalRows += pSorted->info.rows;
      return pSorted;
    }

    // Data of this group are all dumped, let's try the next group
    stopGroupTableMergeScan(pOperator);
    if (pInfo->tableEndIndex >= tableListSize - 1) {
      setOperatorCompleted(pOperator);
      break;
    }

    pInfo->tableStartIndex = pInfo->tableEndIndex + 1;
    pInfo->groupId = tableListGetInfo(pTaskInfo->pTableInfoList, pInfo->tableStartIndex)->groupId;
    startGroupTableMergeScan(pOperator);
    resetLimitInfoForNextGroup(&pInfo->limitInfo);
  }

  // every path reaching this point has no block to hand out
  return NULL;
}

2887
void destroyTableMergeScanOperatorInfo(void* param) {
2888
  STableMergeScanInfo* pTableScanInfo = (STableMergeScanInfo*)param;
H
Haojun Liao 已提交
2889
  cleanupQueryTableDataCond(&pTableScanInfo->base.cond);
2890

dengyihao's avatar
dengyihao 已提交
2891 2892 2893
  int32_t numOfTable = taosArrayGetSize(pTableScanInfo->queryConds);

  for (int32_t i = 0; i < numOfTable; i++) {
H
Haojun Liao 已提交
2894 2895
    STableMergeScanSortSourceParam* p = taosArrayGet(pTableScanInfo->sortSourceParams, i);
    blockDataDestroy(p->inputBlock);
2896 2897
    tsdbReaderClose(p->dataReader);
    p->dataReader = NULL;
2898
  }
H
Haojun Liao 已提交
2899

D
dapan1121 已提交
2900 2901 2902
  tsdbReaderClose(pTableScanInfo->base.dataReader);
  pTableScanInfo->base.dataReader = NULL;

2903
  taosArrayDestroy(pTableScanInfo->sortSourceParams);
dengyihao's avatar
dengyihao 已提交
2904 2905
  tsortDestroySortHandle(pTableScanInfo->pSortHandle);
  pTableScanInfo->pSortHandle = NULL;
2906

dengyihao's avatar
opt mem  
dengyihao 已提交
2907 2908 2909
  for (int i = 0; i < taosArrayGetSize(pTableScanInfo->queryConds); i++) {
    SQueryTableDataCond* pCond = taosArrayGet(pTableScanInfo->queryConds, i);
    taosMemoryFree(pCond->colList);
2910
  }
dengyihao's avatar
opt mem  
dengyihao 已提交
2911
  taosArrayDestroy(pTableScanInfo->queryConds);
2912

H
Haojun Liao 已提交
2913 2914
  if (pTableScanInfo->base.matchInfo.pList != NULL) {
    taosArrayDestroy(pTableScanInfo->base.matchInfo.pList);
2915 2916 2917 2918 2919 2920
  }

  pTableScanInfo->pResBlock = blockDataDestroy(pTableScanInfo->pResBlock);
  pTableScanInfo->pSortInputBlock = blockDataDestroy(pTableScanInfo->pSortInputBlock);

  taosArrayDestroy(pTableScanInfo->pSortInfo);
H
Haojun Liao 已提交
2921
  cleanupExprSupp(&pTableScanInfo->base.pseudoSup);
L
Liu Jicong 已提交
2922

H
Haojun Liao 已提交
2923 2924
  taosLRUCacheCleanup(pTableScanInfo->base.metaCache.pTableMetaEntryCache);

D
dapan1121 已提交
2925
  taosMemoryFreeClear(param);
2926 2927 2928 2929
}

/*
 * Produce the explain/analyze record of a table merge scan operator.
 *
 * On success *pOptrExplain points to a newly allocated STableMergeScanExecInfo
 * (block load recorder plus sort statistics) owned by the caller and *len is its
 * size. On allocation failure *pOptrExplain is NULL, *len is 0 and
 * TSDB_CODE_OUT_OF_MEMORY is returned.
 */
int32_t getTableMergeScanExplainExecInfo(SOperatorInfo* pOptr, void** pOptrExplain, uint32_t* len) {
  ASSERT(pOptr != NULL);
  // TODO: merge these two info into one struct
  STableMergeScanExecInfo* execInfo = taosMemoryCalloc(1, sizeof(STableMergeScanExecInfo));
  if (execInfo == NULL) {
    *pOptrExplain = NULL;
    *len = 0;
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  STableMergeScanInfo* pInfo = pOptr->info;
  execInfo->blockRecorder = pInfo->base.readRecorder;
  execInfo->sortExecInfo = pInfo->sortExecInfo;

  *pOptrExplain = execInfo;
  *len = sizeof(STableMergeScanExecInfo);

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
2942 2943
/*
 * Build the table merge scan operator for the given table scan plan node.
 *
 * Returns the new operator, or NULL on failure. On failure pTaskInfo->code holds
 * the code of the failing step (TSDB_CODE_OUT_OF_MEMORY for allocation failures)
 * and everything created so far is released through the operator's destructor.
 */
SOperatorInfo* createTableMergeScanOperatorInfo(STableScanPhysiNode* pTableScanNode, SReadHandle* readHandle,
                                                SExecTaskInfo* pTaskInfo) {
  // declared before the first goto so the error path always reads a defined value
  int32_t code = TSDB_CODE_SUCCESS;

  STableMergeScanInfo* pInfo = taosMemoryCalloc(1, sizeof(STableMergeScanInfo));
  SOperatorInfo*       pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  SDataBlockDescNode* pDescNode = pTableScanNode->scan.node.pOutputDataBlockDesc;

  int32_t numOfCols = 0;
  code = extractColMatchInfo(pTableScanNode->scan.pScanCols, pDescNode, &numOfCols, COL_MATCH_FROM_COL_ID,
                             &pInfo->base.matchInfo);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  code = initQueryTableDataCond(&pInfo->base.cond, pTableScanNode);
  if (code != TSDB_CODE_SUCCESS) {
    // the match list is released by the destructor call in _error
    goto _error;
  }

  if (pTableScanNode->scan.pScanPseudoCols != NULL) {
    SExprSupp* pSup = &pInfo->base.pseudoSup;
    pSup->pExprInfo = createExprInfo(pTableScanNode->scan.pScanPseudoCols, NULL, &pSup->numOfExprs);
    pSup->pCtx = createSqlFunctionCtx(pSup->pExprInfo, pSup->numOfExprs, &pSup->rowEntryInfoOffset);
  }

  pInfo->scanInfo = (SScanInfo){.numOfAsc = pTableScanNode->scanSeq[0], .numOfDesc = pTableScanNode->scanSeq[1]};

  pInfo->base.metaCache.pTableMetaEntryCache = taosLRUCacheInit(1024 * 128, -1, .5);
  if (pInfo->base.metaCache.pTableMetaEntryCache == NULL) {
    code = terrno;
    goto _error;
  }

  pInfo->base.dataBlockLoadFlag = FUNC_DATA_REQUIRED_DATA_LOAD;
  pInfo->base.scanFlag = MAIN_SCAN;
  pInfo->base.readHandle = *readHandle;

  pInfo->base.limitInfo.limit.limit = -1;
  pInfo->base.limitInfo.slimit.limit = -1;

  pInfo->sample.sampleRatio = pTableScanNode->ratio;
  pInfo->sample.seed = taosGetTimestampSec();

  code = filterInitFromNode((SNode*)pTableScanNode->scan.node.pConditions, &pOperator->exprSupp.pFilterInfo, 0);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initResultSizeInfo(&pOperator->resultInfo, 1024);
  pInfo->pResBlock = createDataBlockFromDescNode(pDescNode);
  if (pInfo->pResBlock == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }
  blockDataEnsureCapacity(pInfo->pResBlock, pOperator->resultInfo.capacity);

  pInfo->sortSourceParams = taosArrayInit(64, sizeof(STableMergeScanSortSourceParam));
  if (pInfo->sortSourceParams == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pInfo->pSortInfo = generateSortByTsInfo(pInfo->base.matchInfo.pList, pInfo->base.cond.order);
  pInfo->pSortInputBlock = createOneDataBlock(pInfo->pResBlock, false);
  if (pInfo->pSortInfo == NULL || pInfo->pSortInputBlock == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }
  initLimitInfo(pTableScanNode->scan.node.pLimit, pTableScanNode->scan.node.pSlimit, &pInfo->limitInfo);

  int32_t  rowSize = pInfo->pResBlock->info.rowSize;
  uint32_t nCols = taosArrayGetSize(pInfo->pResBlock->pDataBlock);
  pInfo->bufPageSize = getProperSortPageSize(rowSize, nCols);

  setOperatorInfo(pOperator, "TableMergeScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_MERGE_SCAN, false, OP_NOT_OPENED,
                  pInfo, pTaskInfo);
  pOperator->exprSupp.numOfExprs = numOfCols;

  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, doTableMergeScan, NULL, destroyTableMergeScanOperatorInfo,
                                         optrDefaultBufFn, getTableMergeScanExplainExecInfo);
  pOperator->cost.openCost = 0;
  return pOperator;

_error:
  // a failing step may leave `code` unset (e.g. terrno == 0); report OOM in that case
  pTaskInfo->code = (code != TSDB_CODE_SUCCESS) ? code : TSDB_CODE_OUT_OF_MEMORY;
  if (pInfo != NULL) {
    // NOTE(review): relies on the destructor accepting a partially initialized,
    // zero-filled info struct, and on initQueryTableDataCond leaving the condition
    // in a state cleanupQueryTableDataCond can release after a failure - confirm
    destroyTableMergeScanOperatorInfo(pInfo);
  }
  if (pOperator != NULL) {
    // NOTE(review): expected to release exprSupp.pFilterInfo created above - confirm
    cleanupExprSupp(&pOperator->exprSupp);
    taosMemoryFree(pOperator);
  }
  return NULL;
}
S
shenglian zhou 已提交
3023 3024 3025 3026

// ====================================================================================================================
// TableCountScanOperator
static SSDataBlock* doTableCountScan(SOperatorInfo* pOperator);
S
slzhou 已提交
3027
static void         destoryTableCountScanOperator(void* param);
S
slzhou 已提交
3028 3029 3030 3031 3032 3033
static void         buildVnodeGroupedStbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
                                                   SSDataBlock* pRes, char* dbName, tb_uid_t stbUid);
static void         buildVnodeGroupedNtbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
                                                   SSDataBlock* pRes, char* dbName);
static void         buildVnodeFilteredTbCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                              STableCountScanSupp* pSupp, SSDataBlock* pRes, char* dbName);
L
Liu Jicong 已提交
3034 3035
static void         buildVnodeGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                                STableCountScanSupp* pSupp, SSDataBlock* pRes, int32_t vgId, char* dbName);
S
slzhou 已提交
3036 3037 3038 3039 3040 3041 3042
static SSDataBlock* buildVnodeDbTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                           STableCountScanSupp* pSupp, SSDataBlock* pRes);
static void         buildSysDbGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                                STableCountScanSupp* pSupp, SSDataBlock* pRes, size_t infodbTableNum,
                                                size_t perfdbTableNum);
static void         buildSysDbFilterTableCount(SOperatorInfo* pOperator, STableCountScanSupp* pSupp, SSDataBlock* pRes,
                                               size_t infodbTableNum, size_t perfdbTableNum);
S
slzhou 已提交
3043 3044 3045 3046 3047 3048 3049 3050 3051 3052 3053 3054 3055 3056 3057 3058 3059 3060 3061 3062 3063 3064 3065 3066 3067 3068 3069 3070 3071 3072 3073 3074 3075 3076 3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090 3091 3092 3093 3094 3095 3096 3097 3098 3099 3100 3101 3102 3103
static const char*  GROUP_TAG_DB_NAME = "db_name";
static const char*  GROUP_TAG_STABLE_NAME = "stable_name";

/*
 * Record in `supp` the output slot ids of the db_name / stable_name columns
 * found in `scanCols`. Every entry must be a target node wrapping a column
 * node; otherwise TSDB_CODE_QRY_SYS_ERROR is returned. A NULL list is accepted
 * and leaves `supp` untouched.
 */
int32_t tblCountScanGetGroupTagsSlotId(const SNodeList* scanCols, STableCountScanSupp* supp) {
  if (scanCols == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  SNode* pNode = NULL;
  FOREACH(pNode, scanCols) {
    if (nodeType(pNode) != QUERY_NODE_TARGET) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    STargetNode* pTarget = (STargetNode*)pNode;
    if (nodeType(pTarget->pExpr) != QUERY_NODE_COLUMN) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    SColumnNode* pCol = (SColumnNode*)(pTarget->pExpr);
    if (strcmp(pCol->colName, GROUP_TAG_DB_NAME) == 0) {
      supp->dbNameSlotId = pTarget->slotId;
    } else if (strcmp(pCol->colName, GROUP_TAG_STABLE_NAME) == 0) {
      supp->stbNameSlotId = pTarget->slotId;
    }
  }

  return TSDB_CODE_SUCCESS;
}

/*
 * Record in `supp` the output slot id of the table-count function found in
 * `pseudoCols`. Every entry must be a target node wrapping a function node;
 * otherwise TSDB_CODE_QRY_SYS_ERROR is returned. A NULL list is accepted and
 * leaves `supp` untouched.
 */
int32_t tblCountScanGetCountSlotId(const SNodeList* pseudoCols, STableCountScanSupp* supp) {
  if (pseudoCols == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  SNode* pNode = NULL;
  FOREACH(pNode, pseudoCols) {
    if (nodeType(pNode) != QUERY_NODE_TARGET) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    STargetNode* pTarget = (STargetNode*)pNode;
    if (nodeType(pTarget->pExpr) != QUERY_NODE_FUNCTION) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    SFunctionNode* pFunc = (SFunctionNode*)(pTarget->pExpr);
    if (pFunc->funcType == FUNCTION_TYPE_TABLE_COUNT) {
      supp->tbCountSlotId = pTarget->slotId;
    }
  }

  return TSDB_CODE_SUCCESS;
}

/*
 * Derive the scan inputs from the plan node.
 *
 * With group tags: sets supp->groupByDbName / groupByStbName for the tags that
 * are present; every tag must be a column node, otherwise
 * TSDB_CODE_QRY_SYS_ERROR is returned.
 * Without group tags: copies the database and table name of `tableName` into
 * the db/stable name filters of `supp`.
 */
int32_t tblCountScanGetInputs(SNodeList* groupTags, SName* tableName, STableCountScanSupp* supp) {
  if (groupTags == NULL) {
    tstrncpy(supp->dbNameFilter, tNameGetDbNameP(tableName), TSDB_DB_NAME_LEN);
    tstrncpy(supp->stbNameFilter, tNameGetTableName(tableName), TSDB_TABLE_NAME_LEN);
    return TSDB_CODE_SUCCESS;
  }

  SNode* pNode = NULL;
  FOREACH(pNode, groupTags) {
    if (nodeType(pNode) != QUERY_NODE_COLUMN) {
      return TSDB_CODE_QRY_SYS_ERROR;
    }

    SColumnNode* pCol = (SColumnNode*)pNode;
    if (strcmp(pCol->colName, GROUP_TAG_DB_NAME) == 0) {
      supp->groupByDbName = true;
    }
    if (strcmp(pCol->colName, GROUP_TAG_STABLE_NAME) == 0) {
      supp->groupByStbName = true;
    }
  }

  return TSDB_CODE_SUCCESS;
}

/*
 * Fill the table count scan support struct from the plan node pieces: the
 * group-by flags or name filters first, then the output slot ids (each -1 when
 * the corresponding column is not part of the output).
 *
 * Returns the code of the first step that fails (after logging it), or
 * TSDB_CODE_SUCCESS.
 */
int32_t getTableCountScanSupp(SNodeList* groupTags, SName* tableName, SNodeList* scanCols, SNodeList* pseudoCols,
                              STableCountScanSupp* supp, SExecTaskInfo* taskInfo) {
  int32_t code = tblCountScanGetInputs(groupTags, tableName, supp);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s get table count scan supp. get inputs error", GET_TASKID(taskInfo));
    return code;
  }

  // slots stay at -1 unless the lookups below find the matching output column
  supp->tbCountSlotId = -1;
  supp->stbNameSlotId = -1;
  supp->dbNameSlotId = -1;

  code = tblCountScanGetGroupTagsSlotId(scanCols, supp);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s get table count scan supp. get group tags slot id error", GET_TASKID(taskInfo));
    return code;
  }

  code = tblCountScanGetCountSlotId(pseudoCols, supp);
  if (code != TSDB_CODE_SUCCESS) {
    qError("%s get table count scan supp. get count error", GET_TASKID(taskInfo));
  }
  return code;
}
S
shenglian zhou 已提交
3134

S
slzhou 已提交
3135
SOperatorInfo* createTableCountScanOperatorInfo(SReadHandle* readHandle, STableCountScanPhysiNode* pTblCountScanNode,
S
shenglian zhou 已提交
3136 3137 3138
                                                SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_SUCCESS;

S
slzhou 已提交
3139
  SScanPhysiNode*              pScanNode = &pTblCountScanNode->scan;
S
slzhou 已提交
3140
  STableCountScanOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(STableCountScanOperatorInfo));
S
slzhou 已提交
3141
  SOperatorInfo*               pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
S
shenglian zhou 已提交
3142 3143 3144 3145 3146 3147 3148 3149 3150

  if (!pInfo || !pOperator) {
    goto _error;
  }

  pInfo->readHandle = *readHandle;

  SDataBlockDescNode* pDescNode = pScanNode->node.pOutputDataBlockDesc;
  initResultSizeInfo(&pOperator->resultInfo, 1);
3151
  pInfo->pRes = createDataBlockFromDescNode(pDescNode);
S
shenglian zhou 已提交
3152 3153
  blockDataEnsureCapacity(pInfo->pRes, pOperator->resultInfo.capacity);

S
slzhou 已提交
3154 3155 3156
  getTableCountScanSupp(pTblCountScanNode->pGroupTags, &pTblCountScanNode->scan.tableName,
                        pTblCountScanNode->scan.pScanCols, pTblCountScanNode->scan.pScanPseudoCols, &pInfo->supp,
                        pTaskInfo);
S
shenglian zhou 已提交
3157 3158 3159

  setOperatorInfo(pOperator, "TableCountScanOperator", QUERY_NODE_PHYSICAL_PLAN_TABLE_COUNT_SCAN, false, OP_NOT_OPENED,
                  pInfo, pTaskInfo);
L
Liu Jicong 已提交
3160 3161
  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, doTableCountScan, NULL, destoryTableCountScanOperator,
                                         optrDefaultBufFn, NULL);
S
shenglian zhou 已提交
3162 3163 3164 3165 3166 3167 3168 3169 3170 3171 3172
  return pOperator;

_error:
  if (pInfo != NULL) {
    destoryTableCountScanOperator(pInfo);
  }
  taosMemoryFreeClear(pOperator);
  pTaskInfo->code = code;
  return NULL;
}

S
slzhou 已提交
3173 3174 3175
/*
 * Write one result row (row 0) into `pRes`: the database name, the super table
 * name and the table count, each only when its slot id in `pSupp` is not -1.
 * An empty `stbName` is stored as NULL. Sets pRes->info.rows to 1.
 *
 * Names are copied with tstrncpy, i.e. truncated to fit the local var-string
 * buffers, and the stored var-string length is the length of what was actually
 * copied, so the length can never exceed the data in the buffer.
 */
void fillTableCountScanDataBlock(STableCountScanSupp* pSupp, char* dbName, char* stbName, int64_t count,
                                 SSDataBlock* pRes) {
  if (pSupp->dbNameSlotId != -1) {
    ASSERT(strlen(dbName));
    SColumnInfoData* colInfoData = taosArrayGet(pRes->pDataBlock, pSupp->dbNameSlotId);

    char varDbName[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    tstrncpy(varDataVal(varDbName), dbName, TSDB_DB_NAME_LEN);

    varDataSetLen(varDbName, strlen(varDataVal(varDbName)));
    colDataSetVal(colInfoData, 0, varDbName, false);
  }

  if (pSupp->stbNameSlotId != -1) {
    SColumnInfoData* colInfoData = taosArrayGet(pRes->pDataBlock, pSupp->stbNameSlotId);
    if (strlen(stbName) != 0) {
      char varStbName[TSDB_TABLE_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
      tstrncpy(varDataVal(varStbName), stbName, TSDB_TABLE_NAME_LEN);

      varDataSetLen(varStbName, strlen(varDataVal(varStbName)));
      colDataSetVal(colInfoData, 0, varStbName, false);
    } else {
      colDataSetNULL(colInfoData, 0);
    }
  }

  if (pSupp->tbCountSlotId != -1) {
    SColumnInfoData* colInfoData = taosArrayGet(pRes->pDataBlock, pSupp->tbCountSlotId);
    colDataSetVal(colInfoData, 0, (char*)&count, false);
  }
  pRes->info.rows = 1;
}

S
slzhou 已提交
3205
/*
 * Produce the table-count result for the system databases.
 *
 * Fetches the table counts reported by getInfosDbMeta() and getPerfDbMeta(),
 * then delegates to the grouped or the filtered builder depending on whether
 * the scan groups by db name / stable name.
 *
 * Returns pInfo->pRes when it holds at least one row, otherwise NULL.
 */
static SSDataBlock* buildSysDbTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo) {
  STableCountScanSupp* pSupp = &pInfo->supp;
  SSDataBlock*         pRes = pInfo->pRes;

  // Start from zero: the getters' results are not checked here, so the counts
  // must hold a defined value even if an out-parameter is left untouched.
  size_t infodbTableNum = 0;
  size_t perfdbTableNum = 0;
  getInfosDbMeta(NULL, &infodbTableNum);
  getPerfDbMeta(NULL, &perfdbTableNum);

  if (pSupp->groupByDbName || pSupp->groupByStbName) {
    buildSysDbGroupedTableCount(pOperator, pInfo, pSupp, pRes, infodbTableNum, perfdbTableNum);
  } else {
    buildSysDbFilterTableCount(pOperator, pSupp, pRes, infodbTableNum, perfdbTableNum);
  }

  return (pRes->info.rows > 0) ? pRes : NULL;
}

S
slzhou 已提交
3223 3224 3225 3226 3227 3228 3229 3230 3231 3232 3233 3234 3235 3236 3237 3238
/*
 * Non-grouped system-db count: emit at most one row chosen by the db-name filter.
 *
 *  - empty filter                      -> sum of both system db counts, empty db name
 *  - filter == TSDB_INFORMATION_SCHEMA_DB -> infodbTableNum
 *  - filter == TSDB_PERFORMANCE_SCHEMA_DB -> perfdbTableNum
 *  - any other filter                  -> no row
 *
 * The operator is marked completed in every case.
 */
static void buildSysDbFilterTableCount(SOperatorInfo* pOperator, STableCountScanSupp* pSupp, SSDataBlock* pRes,
                                       size_t infodbTableNum, size_t perfdbTableNum) {
  const char* filter = pSupp->dbNameFilter;

  if (filter[0] == '\0') {
    fillTableCountScanDataBlock(pSupp, "", "", infodbTableNum + perfdbTableNum, pRes);
  } else if (strcmp(filter, TSDB_INFORMATION_SCHEMA_DB) == 0) {
    fillTableCountScanDataBlock(pSupp, TSDB_INFORMATION_SCHEMA_DB, "", infodbTableNum, pRes);
  } else if (strcmp(filter, TSDB_PERFORMANCE_SCHEMA_DB) == 0) {
    fillTableCountScanDataBlock(pSupp, TSDB_PERFORMANCE_SCHEMA_DB, "", perfdbTableNum, pRes);
  }

  setOperatorCompleted(pOperator);
}

/*
 * Grouped system-db count: each call emits one group, selected by pInfo->currGrpIdx.
 *
 *  - index 0 -> TSDB_INFORMATION_SCHEMA_DB with infodbTableNum
 *  - index 1 -> TSDB_PERFORMANCE_SCHEMA_DB with perfdbTableNum
 *  - beyond  -> nothing is emitted and the operator is marked completed
 *
 * The group id is derived from the db name when grouping by db name, otherwise
 * from the empty string. currGrpIdx is advanced on every call.
 */
static void buildSysDbGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                        STableCountScanSupp* pSupp, SSDataBlock* pRes, size_t infodbTableNum,
                                        size_t perfdbTableNum) {
  char*  sysDbName = NULL;
  size_t tableNum = 0;

  switch (pInfo->currGrpIdx) {
    case 0:
      sysDbName = TSDB_INFORMATION_SCHEMA_DB;
      tableNum = infodbTableNum;
      break;
    case 1:
      sysDbName = TSDB_PERFORMANCE_SCHEMA_DB;
      tableNum = perfdbTableNum;
      break;
    default:
      break;
  }

  if (sysDbName == NULL) {
    // both system databases have already been reported
    setOperatorCompleted(pOperator);
  } else {
    uint64_t groupId = 0;
    if (pSupp->groupByDbName) {
      groupId = calcGroupId(sysDbName, strlen(sysDbName));
    } else {
      groupId = calcGroupId("", 0);
    }

    pRes->info.id.groupId = groupId;
    fillTableCountScanDataBlock(pSupp, sysDbName, "", tableNum, pRes);
  }

  pInfo->currGrpIdx++;
}

S
shenglian zhou 已提交
3264
/*
 * Fetch callback of the table-count scan operator.
 *
 * Clears the operator's result block, then returns NULL if the operator is
 * already done. Otherwise it dispatches on readHandle.mnd: a non-NULL handle
 * takes the system-db path, a NULL one the vnode path.
 */
static SSDataBlock* doTableCountScan(SOperatorInfo* pOperator) {
  STableCountScanOperatorInfo* pScanInfo = pOperator->info;
  SSDataBlock*                 pBlock = pScanInfo->pRes;

  // the block is reset before the status check, exactly once per call
  blockDataCleanup(pBlock);

  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  if (pScanInfo->readHandle.mnd == NULL) {
    return buildVnodeDbTableCount(pOperator, pScanInfo, &pScanInfo->supp, pBlock);
  }

  return buildSysDbTableCount(pOperator, pScanInfo);
}

/*
 * Produce the table-count result for the database served by this vnode.
 *
 * Resolves the db name from the vnode info, then delegates to the grouped or
 * the filtered builder. Returns pRes when it holds at least one row, else NULL.
 */
static SSDataBlock* buildVnodeDbTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                           STableCountScanSupp* pSupp, SSDataBlock* pRes) {
  char        dbName[TSDB_DB_NAME_LEN] = {0};
  const char* vnodeDbName = NULL;
  int32_t     vgId = 0;
  SName       name = {0};

  // NOTE(review): the name from vnodeGetInfo is parsed with T_NAME_ACCT | T_NAME_DB,
  // so it is presumably account-qualified; only the db part is kept. Return
  // values of the name helpers are not checked here.
  vnodeGetInfo(pInfo->readHandle.vnode, &vnodeDbName, &vgId);
  tNameFromString(&name, vnodeDbName, T_NAME_ACCT | T_NAME_DB);
  tNameGetDbName(&name, dbName);

  const bool grouped = pSupp->groupByDbName || pSupp->groupByStbName;
  if (!grouped) {
    buildVnodeFilteredTbCount(pOperator, pInfo, pSupp, pRes, dbName);
  } else {
    buildVnodeGroupedTableCount(pOperator, pInfo, pSupp, pRes, vgId, dbName);
  }

  if (pRes->info.rows > 0) {
    return pRes;
  }
  return NULL;
}

/*
 * Grouped vnode count: each call emits at most one group.
 *
 * When grouping by stable name, the super-table uid list is loaded on the
 * first call and cached in pInfo->stbUidList. Calls then walk that list one
 * super table at a time (pInfo->currGrpIdx), followed by one extra step for
 * the normal tables, after which the operator is marked completed.
 *
 * When grouping by db name only, a single row with the vnode's total table
 * count is emitted and the operator is marked completed.
 *
 * If the uid list cannot be allocated, the task code is set to
 * TSDB_CODE_OUT_OF_MEMORY and the operator is completed without output.
 */
static void buildVnodeGroupedTableCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                        STableCountScanSupp* pSupp, SSDataBlock* pRes, int32_t vgId, char* dbName) {
  if (pSupp->groupByStbName) {
    if (pInfo->stbUidList == NULL) {
      pInfo->stbUidList = taosArrayInit(16, sizeof(tb_uid_t));
      if (pInfo->stbUidList == NULL) {
        // Do not hand a NULL list to vnodeGetStbIdList; report the failure on the task instead.
        qError("vgId:%d, failed to allocate stb id list", vgId);
        pOperator->pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
        setOperatorCompleted(pOperator);
        return;
      }

      if (vnodeGetStbIdList(pInfo->readHandle.vnode, 0, pInfo->stbUidList) < 0) {
        // Kept as best effort: the scan continues with whatever ids were collected.
        qError("vgId:%d, failed to get stb id list error: %s", vgId, terrstr());
      }
    }

    // The list is not modified below, so its size is read once.
    size_t numOfStb = taosArrayGetSize(pInfo->stbUidList);

    if (pInfo->currGrpIdx < numOfStb) {
      tb_uid_t stbUid = *(tb_uid_t*)taosArrayGet(pInfo->stbUidList, pInfo->currGrpIdx);
      buildVnodeGroupedStbTableCount(pInfo, pSupp, pRes, dbName, stbUid);

      pInfo->currGrpIdx++;
    } else if (pInfo->currGrpIdx == numOfStb) {
      // one step past the last super table: report the normal tables
      buildVnodeGroupedNtbTableCount(pInfo, pSupp, pRes, dbName);

      pInfo->currGrpIdx++;
    } else {
      setOperatorCompleted(pOperator);
    }
  } else {
    uint64_t groupId = calcGroupId(dbName, strlen(dbName));
    pRes->info.id.groupId = groupId;
    int64_t dbTableCount = metaGetTbNum(pInfo->readHandle.meta);
    fillTableCountScanDataBlock(pSupp, dbName, "", dbTableCount, pRes);
    setOperatorCompleted(pOperator);
  }
}

/*
 * Non-grouped vnode count: emit exactly one row and mark the operator completed.
 *
 * Only when both the db-name filter and the stable-name filter are non-empty is
 * the count taken from that super table's stats (ctbNum). In every other case
 * the vnode's total table count from metaGetTbNum() is reported with an empty
 * stable name.
 */
static void buildVnodeFilteredTbCount(SOperatorInfo* pOperator, STableCountScanOperatorInfo* pInfo,
                                      STableCountScanSupp* pSupp, SSDataBlock* pRes, char* dbName) {
  const bool hasDbFilter = (pSupp->dbNameFilter[0] != '\0');
  const bool hasStbFilter = (pSupp->stbNameFilter[0] != '\0');

  if (hasDbFilter && hasStbFilter) {
    // stats stay zeroed if the lookup does not fill them in; results are not checked
    SMetaStbStats stbStats = {0};
    tb_uid_t      stbUid = metaGetTableEntryUidByName(pInfo->readHandle.meta, pSupp->stbNameFilter);
    metaGetStbStats(pInfo->readHandle.meta, stbUid, &stbStats);

    int64_t numOfChildTables = stbStats.ctbNum;
    fillTableCountScanDataBlock(pSupp, dbName, pSupp->stbNameFilter, numOfChildTables, pRes);
  } else {
    int64_t numOfTables = metaGetTbNum(pInfo->readHandle.meta);
    fillTableCountScanDataBlock(pSupp, dbName, "", numOfTables, pRes);
  }

  setOperatorCompleted(pOperator);
}

/*
 * Emit the group for normal tables (tables without a super table).
 *
 * The group key is "<dbName>." when grouping by db name, otherwise the empty
 * string. The group id is always written to pRes; a row is added only when
 * metaGetNtbNum() reports a non-zero count.
 */
static void buildVnodeGroupedNtbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
                                           SSDataBlock* pRes, char* dbName) {
  char groupKey[TSDB_TABLE_FNAME_LEN] = {0};
  if (pSupp->groupByDbName) {
    snprintf(groupKey, TSDB_TABLE_FNAME_LEN, "%s.%s", dbName, "");
  }

  pRes->info.id.groupId = calcGroupId(groupKey, strlen(groupKey));

  int64_t numOfNormalTables = metaGetNtbNum(pInfo->readHandle.meta);
  if (numOfNormalTables == 0) {
    return;
  }

  fillTableCountScanDataBlock(pSupp, dbName, "", numOfNormalTables, pRes);
}

/*
 * Emit the group for one super table identified by stbUid.
 *
 * The group key is "<dbName>.<stbName>" when grouping by db name, otherwise
 * just "<stbName>". The row carries the super table's name and the ctbNum
 * value from its stats. Lookup results are not checked: the name buffer and
 * the stats start zeroed.
 */
static void buildVnodeGroupedStbTableCount(STableCountScanOperatorInfo* pInfo, STableCountScanSupp* pSupp,
                                           SSDataBlock* pRes, char* dbName, tb_uid_t stbUid) {
  char superTableName[TSDB_TABLE_NAME_LEN] = {0};
  char groupKey[TSDB_TABLE_FNAME_LEN] = {0};

  metaGetTableSzNameByUid(pInfo->readHandle.meta, stbUid, superTableName);

  if (!pSupp->groupByDbName) {
    snprintf(groupKey, TSDB_TABLE_FNAME_LEN, "%s", superTableName);
  } else {
    snprintf(groupKey, TSDB_TABLE_FNAME_LEN, "%s.%s", dbName, superTableName);
  }
  pRes->info.id.groupId = calcGroupId(groupKey, strlen(groupKey));

  SMetaStbStats stbStats = {0};
  metaGetStbStats(pInfo->readHandle.meta, stbUid, &stbStats);

  int64_t numOfChildTables = stbStats.ctbNum;
  fillTableCountScanDataBlock(pSupp, dbName, superTableName, numOfChildTables, pRes);
}

static void destoryTableCountScanOperator(void* param) {
S
slzhou 已提交
3389
  STableCountScanOperatorInfo* pTableCountScanInfo = param;
S
shenglian zhou 已提交
3390 3391
  blockDataDestroy(pTableCountScanInfo->pRes);

S
slzhou 已提交
3392
  taosArrayDestroy(pTableCountScanInfo->stbUidList);
S
shenglian zhou 已提交
3393 3394
  taosMemoryFreeClear(param);
}