executil.c 64.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

16 17
#include "function.h"
#include "functionMgt.h"
dengyihao's avatar
dengyihao 已提交
18 19
#include "index.h"
#include "os.h"
20
#include "tdatablock.h"
21
#include "thash.h"
22
#include "tmsg.h"
23
#include "ttime.h"
24

25 26
#include "executil.h"
#include "executorimpl.h"
H
Haojun Liao 已提交
27
#include "tcompression.h"
H
Haojun Liao 已提交
28

H
Haojun Liao 已提交
29 30 31 32
// If the numOfOutputGroups is 1, the data blocks that belongs to different groups will be provided randomly
// The numOfOutputGroups is specified by physical plan. and will not be affect by numOfGroups
struct STableListInfo {
  bool      oneTableForEachGroup;
dengyihao's avatar
dengyihao 已提交
33 34
  int32_t   numOfOuputGroups;  // the data block will be generated one by one
  int32_t*  groupOffset;       // keep the offset value for each group in the tableList
H
Haojun Liao 已提交
35
  SArray*   pTableList;
dengyihao's avatar
dengyihao 已提交
36
  SHashObj* map;  // speedup acquire the tableQueryInfo by table uid
H
Haojun Liao 已提交
37 38 39 40 41 42 43 44 45
  uint64_t  suid;
};

// Walker context used by getColumn() while collecting the columns referenced by an expression list.
typedef struct tagFilterAssist {
  SHashObj* colHash;    // colId -> pointer of the first column node seen with that colId
  int32_t   index;      // next slot id to hand out; incremented for every newly seen colId
  SArray*   cInfoList;  // SColumnInfo of every distinct column, appended in slot-id order
} tagFilterAssist;

46
static int32_t removeInvalidUid(SArray* uids, SHashObj* tags);
47
static int32_t optimizeTbnameInCond(void* metaHandle, int64_t suid, SArray* pRes, SNode* pTagCond);
H
Haojun Liao 已提交
48
static int32_t optimizeTbnameInCondImpl(void* metaHandle, SArray* pExistedUidList, SNode* pTagCond);
49
static int32_t getTableList(void* metaHandle, void* pVnode, SScanPhysiNode* pScanNode, SNode* pTagCond,
50
                            SNode* pTagIndexCond, STableListInfo* pListInfo, const char* idstr);
H
Haojun Liao 已提交
51
static SSDataBlock* createTagValBlockForFilter(SArray* pColList, int32_t numOfTables, SArray* pUidTagList, void* metaHandle);
dengyihao's avatar
dengyihao 已提交
52

H
Haojun Liao 已提交
53 54
// Returns the limit stored in the given limit node, or -1 when no limit node is supplied.
static int64_t getLimit(const SNode* pLimit) {
  if (pLimit == NULL) {
    return -1;
  }

  return ((SLimitNode*)pLimit)->limit;
}
// Returns the offset stored in the given limit node, or -1 when no limit node is supplied.
static int64_t getOffset(const SNode* pLimit) {
  if (pLimit == NULL) {
    return -1;
  }

  return ((SLimitNode*)pLimit)->offset;
}
dengyihao's avatar
dengyihao 已提交
55

dengyihao's avatar
dengyihao 已提交
56 57
// Puts the result-row bookkeeping into its initial state: no rows, and no current page (-1).
void initResultRowInfo(SResultRowInfo* pResultRowInfo) {
  pResultRowInfo->cur.pageId = -1;
  pResultRowInfo->size = 0;
}

dengyihao's avatar
dengyihao 已提交
61
// Flags the result row as closed.
void closeResultRow(SResultRow* pResultRow) {
  pResultRow->closed = true;
}
62

63 64 65 66 67 68 69 70 71 72 73
/*
 * Returns a result row to its pristine state: no rows, not closed, no interpolation flags.
 * When entrySize is non-zero, the first entrySize bytes of the entry-info area are zeroed as well.
 */
void resetResultRow(SResultRow* pResultRow, size_t entrySize) {
  pResultRow->startInterp = false;
  pResultRow->endInterp = false;
  pResultRow->closed = false;
  pResultRow->numOfRows = 0;

  if (entrySize == 0) {
    return;
  }

  memset(pResultRow->pEntryInfo, 0, entrySize);
}

H
Haojun Liao 已提交
74
// TODO refactor: use macro
75
SResultRowEntryInfo* getResultEntryInfo(const SResultRow* pRow, int32_t index, const int32_t* offset) {
H
Haojun Liao 已提交
76
  assert(index >= 0 && offset != NULL);
dengyihao's avatar
dengyihao 已提交
77
  return (SResultRowEntryInfo*)((char*)pRow->pEntryInfo + offset[index]);
H
Haojun Liao 已提交
78 79
}

80 81 82
/*
 * Computes the number of bytes needed for one result row with numOfOutput output columns:
 * the row header, one entry info per column, the intermediate buffer of every function context,
 * and one bool per column.
 */
size_t getResultRowSize(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  int32_t totalBytes = sizeof(SResultRow) + (numOfOutput * sizeof(SResultRowEntryInfo));

  int32_t col = 0;
  while (col < numOfOutput) {
    totalBytes += pCtx[col].resDataInfo.interBufSize;
    ++col;
  }

  // expand the row size to mark if col is null for top/bottom result(saveTupleData)
  totalBytes += (numOfOutput * sizeof(bool));
  return totalBytes;
}

H
Haojun Liao 已提交
92
// Releases the position buffer and the row array held by pGroupResInfo and rewinds its cursor.
void cleanupGroupResInfo(SGroupResInfo* pGroupResInfo) {
  pGroupResInfo->index = 0;
  pGroupResInfo->pRows = taosArrayDestroy(pGroupResInfo->pRows);
  taosMemoryFreeClear(pGroupResInfo->pBuf);
}

5
54liuyao 已提交
98
int32_t resultrowComparAsc(const void* p1, const void* p2) {
dengyihao's avatar
dengyihao 已提交
99 100
  SResKeyPos* pp1 = *(SResKeyPos**)p1;
  SResKeyPos* pp2 = *(SResKeyPos**)p2;
101 102

  if (pp1->groupId == pp2->groupId) {
dengyihao's avatar
dengyihao 已提交
103 104
    int64_t pts1 = *(int64_t*)pp1->key;
    int64_t pts2 = *(int64_t*)pp2->key;
105 106 107 108

    if (pts1 == pts2) {
      return 0;
    } else {
dengyihao's avatar
dengyihao 已提交
109
      return pts1 < pts2 ? -1 : 1;
110 111
    }
  } else {
dengyihao's avatar
dengyihao 已提交
112
    return pp1->groupId < pp2->groupId ? -1 : 1;
113 114 115
  }
}

dengyihao's avatar
dengyihao 已提交
116
// Descending comparator: the ascending comparator with its operands swapped.
static int32_t resultrowComparDesc(const void* p1, const void* p2) {
  int32_t reversed = resultrowComparAsc(p2, p1);
  return reversed;
}
117

118
/*
 * (Re)builds the list of result-row positions of pGroupResInfo from the entries of pHashmap.
 *
 * Every hash entry is copied into one SResKeyPos record inside a single buffer (pBuf); pRows holds the
 * pointers to those records. Each hash key is read as a uint64 group id followed by the remaining key
 * bytes. When order is TSDB_ORDER_ASC or TSDB_ORDER_DESC the pointers are sorted accordingly; otherwise
 * they stay in hash iteration order.
 *
 * State left by a previous initialisation (pRows and pBuf) is released first. If an allocation fails,
 * terrno is set to TSDB_CODE_OUT_OF_MEMORY and the result info is left empty.
 */
void initGroupedResultInfo(SGroupResInfo* pGroupResInfo, SSHashObj* pHashmap, int32_t order) {
  if (pGroupResInfo->pRows != NULL) {
    taosArrayDestroy(pGroupResInfo->pRows);
    pGroupResInfo->pRows = NULL;
  }

  // the records referenced by the old pRows lived in pBuf, release it as well
  taosMemoryFreeClear(pGroupResInfo->pBuf);
  pGroupResInfo->index = 0;

  // extract the result rows information from the hash map
  int32_t size = tSimpleHashGetSize(pHashmap);

  pGroupResInfo->pRows = taosArrayInit(size, POINTER_BYTES);
  if (pGroupResInfo->pRows == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return;
  }

  void*   pData = NULL;
  size_t  keyLen = 0;
  int32_t iter = 0;
  int32_t bufLen = 0;

  // todo move away and record this during create window
  // first pass: total size of all records
  while ((pData = tSimpleHashIterate(pHashmap, pData, &iter)) != NULL) {
    tSimpleHashGetKey(pData, &keyLen);
    bufLen += keyLen + sizeof(SResultRowPosition);
  }

  if (bufLen > 0) {
    pGroupResInfo->pBuf = taosMemoryMalloc(bufLen);
    if (pGroupResInfo->pBuf == NULL) {
      pGroupResInfo->pRows = taosArrayDestroy(pGroupResInfo->pRows);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return;
    }
  }

  // second pass: fill the records and remember their addresses
  int32_t offset = 0;
  iter = 0;
  while ((pData = tSimpleHashIterate(pHashmap, pData, &iter)) != NULL) {
    void* key = tSimpleHashGetKey(pData, &keyLen);

    SResKeyPos* p = (SResKeyPos*)((char*)pGroupResInfo->pBuf + offset);

    p->groupId = *(uint64_t*)key;
    p->pos = *(SResultRowPosition*)pData;
    memcpy(p->key, (char*)key + sizeof(uint64_t), keyLen - sizeof(uint64_t));

    if (taosArrayPush(pGroupResInfo->pRows, &p) == NULL) {
      pGroupResInfo->pRows = taosArrayDestroy(pGroupResInfo->pRows);
      taosMemoryFreeClear(pGroupResInfo->pBuf);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return;
    }

    offset += keyLen + sizeof(struct SResultRowPosition);
  }

  if (order == TSDB_ORDER_ASC || order == TSDB_ORDER_DESC) {
    __compar_fn_t fn = (order == TSDB_ORDER_ASC) ? resultrowComparAsc : resultrowComparDesc;
    taosSort(pGroupResInfo->pRows->pData, taosArrayGetSize(pGroupResInfo->pRows), POINTER_BYTES, fn);
  }

  assert(pGroupResInfo->index <= getNumOfTotalRes(pGroupResInfo));
}

H
Haojun Liao 已提交
165 166
/*
 * Makes pArrayList the row list of pGroupResInfo and rewinds the cursor.
 * A previously installed list is destroyed together with its elements (each freed with taosMemoryFree).
 */
void initMultiResInfoFromArrayList(SGroupResInfo* pGroupResInfo, SArray* pArrayList) {
  SArray* pPrevRows = pGroupResInfo->pRows;
  if (pPrevRows != NULL) {
    taosArrayDestroyP(pPrevRows, taosMemoryFree);
  }

  pGroupResInfo->index = 0;
  pGroupResInfo->pRows = pArrayList;
  ASSERT(pGroupResInfo->index <= getNumOfTotalRes(pGroupResInfo));
}

175
// Tells whether the cursor of pGroupResInfo has not yet reached the end of its row list.
bool hasRemainResults(SGroupResInfo* pGroupResInfo) {
  SArray* pRows = pGroupResInfo->pRows;
  if (pRows == NULL) {
    return false;
  }

  return pGroupResInfo->index < taosArrayGetSize(pRows);
}

// Number of entries in the row list of pGroupResInfo; 0 when no list is installed.
int32_t getNumOfTotalRes(SGroupResInfo* pGroupResInfo) {
  SArray* pRows = pGroupResInfo->pRows;
  return (pRows == NULL) ? 0 : (int32_t)taosArrayGetSize(pRows);
}

191
/*
 * Converts a list of order-by expression nodes into an array of SBlockOrderInfo.
 * Each sort key's expression is read as a column node to obtain its slot id.
 * Returns NULL and sets terrno to TSDB_CODE_OUT_OF_MEMORY when the array cannot be created.
 */
SArray* createSortInfo(SNodeList* pNodeList) {
  size_t numOfCols = (pNodeList != NULL) ? LIST_LENGTH(pNodeList) : 0;

  SArray* pList = taosArrayInit(numOfCols, sizeof(SBlockOrderInfo));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  int32_t idx = 0;
  while (idx < numOfCols) {
    SOrderByExprNode* pSortKey = (SOrderByExprNode*)nodesListGetNode(pNodeList, idx);
    SColumnNode*      pColNode = (SColumnNode*)pSortKey->pExpr;

    SBlockOrderInfo bi = {0};
    bi.slotId = pColNode->slotId;
    bi.nullFirst = (pSortKey->nullOrder == NULL_ORDER_FIRST);
    if (pSortKey->order == ORDER_ASC) {
      bi.order = TSDB_ORDER_ASC;
    } else {
      bi.order = TSDB_ORDER_DESC;
    }

    taosArrayPush(pList, &bi);
    ++idx;
  }

  return pList;
}

H
Haojun Liao 已提交
220
/*
 * Creates an empty data block whose columns mirror the slots of the given block description node.
 *
 * The block id is taken from the node; type, calculation window and watermark are set to their
 * "invalid/unbounded" initial values. One column (type, bytes, slot id, scale, precision) is appended
 * per slot descriptor.
 *
 * Returns NULL and sets terrno to TSDB_CODE_OUT_OF_MEMORY when the block cannot be allocated.
 */
SSDataBlock* createDataBlockFromDescNode(SDataBlockDescNode* pNode) {
  SSDataBlock* pBlock = createDataBlock();
  if (pBlock == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pBlock->info.id.blockId = pNode->dataBlockId;
  pBlock->info.type = STREAM_INVALID;
  pBlock->info.calWin = (STimeWindow){.skey = INT64_MIN, .ekey = INT64_MAX};
  pBlock->info.watermark = INT64_MIN;

  int32_t numOfCols = LIST_LENGTH(pNode->pSlots);
  for (int32_t i = 0; i < numOfCols; ++i) {
    SSlotDescNode*  pDescNode = (SSlotDescNode*)nodesListGetNode(pNode->pSlots, i);
    SColumnInfoData idata =
        createColumnInfoData(pDescNode->dataType.type, pDescNode->dataType.bytes, pDescNode->slotId);
    idata.info.scale = pDescNode->dataType.scale;
    idata.info.precision = pDescNode->dataType.precision;

    blockDataAppendColInfo(pBlock, &idata);
  }

  return pBlock;
}

wmmhello's avatar
wmmhello 已提交
243 244
/*
 * Expression rewriter callback: replaces tag column nodes and tbname() function nodes by value nodes
 * filled from the table entry currently loaded in the meta reader passed as pContext.
 *
 *  - column node: the tag value of that column id is looked up in the child table's tags; a missing tag
 *    becomes a value node of type NULL, JSON and variable-length tags are copied into a new buffer,
 *    everything else is stored through nodesSetValueNodeValue().
 *  - tbname() function node: replaced by a var-string value node holding the table name.
 *  - any other node is left untouched.
 *
 * Returns DEAL_RES_ERROR when the value node or its data buffer cannot be allocated (the partially
 * built value node is destroyed and *pNode is left unchanged), DEAL_RES_CONTINUE otherwise.
 */
EDealRes doTranslateTagExpr(SNode** pNode, void* pContext) {
  SMetaReader* mr = (SMetaReader*)pContext;

  if (nodeType(*pNode) == QUERY_NODE_COLUMN) {
    SColumnNode* pSColumnNode = *(SColumnNode**)pNode;

    SValueNode* res = (SValueNode*)nodesMakeNode(QUERY_NODE_VALUE);
    if (NULL == res) {
      return DEAL_RES_ERROR;
    }

    res->translate = true;
    res->node.resType = pSColumnNode->node.resType;

    STagVal tagVal = {0};
    tagVal.cid = pSColumnNode->colId;
    const char* p = metaGetTableTagVal(mr->me.ctbEntry.pTags, pSColumnNode->node.resType.type, &tagVal);
    if (p == NULL) {
      res->node.resType.type = TSDB_DATA_TYPE_NULL;
    } else if (pSColumnNode->node.resType.type == TSDB_DATA_TYPE_JSON) {
      int32_t len = ((const STag*)p)->len;
      res->datum.p = taosMemoryCalloc(len + 1, 1);
      if (res->datum.p == NULL) {
        terrno = TSDB_CODE_OUT_OF_MEMORY;
        nodesDestroyNode((SNode*)res);
        return DEAL_RES_ERROR;
      }
      memcpy(res->datum.p, p, len);
    } else if (IS_VAR_DATA_TYPE(pSColumnNode->node.resType.type)) {
      res->datum.p = taosMemoryCalloc(tagVal.nData + VARSTR_HEADER_SIZE + 1, 1);
      if (res->datum.p == NULL) {
        terrno = TSDB_CODE_OUT_OF_MEMORY;
        nodesDestroyNode((SNode*)res);
        return DEAL_RES_ERROR;
      }
      memcpy(varDataVal(res->datum.p), tagVal.pData, tagVal.nData);
      varDataSetLen(res->datum.p, tagVal.nData);
    } else {
      nodesSetValueNodeValue(res, &(tagVal.i64));
    }

    // the value node takes the place of the column node
    nodesDestroyNode(*pNode);
    *pNode = (SNode*)res;
  } else if (nodeType(*pNode) == QUERY_NODE_FUNCTION) {
    SFunctionNode* pFuncNode = *(SFunctionNode**)pNode;
    if (pFuncNode->funcType == FUNCTION_TYPE_TBNAME) {
      SValueNode* res = (SValueNode*)nodesMakeNode(QUERY_NODE_VALUE);
      if (NULL == res) {
        return DEAL_RES_ERROR;
      }

      res->translate = true;
      res->node.resType = pFuncNode->node.resType;

      int32_t len = strlen(mr->me.name);
      res->datum.p = taosMemoryCalloc(len + VARSTR_HEADER_SIZE + 1, 1);
      if (res->datum.p == NULL) {
        terrno = TSDB_CODE_OUT_OF_MEMORY;
        nodesDestroyNode((SNode*)res);
        return DEAL_RES_ERROR;
      }
      memcpy(varDataVal(res->datum.p), mr->me.name, len);
      varDataSetLen(res->datum.p, len);

      nodesDestroyNode(*pNode);
      *pNode = (SNode*)res;
    }
  }

  return DEAL_RES_CONTINUE;
}

H
Haojun Liao 已提交
297
/*
 * Evaluates the tag condition pTagCond against the table identified by info->uid.
 *
 * The condition is cloned, its tag columns / tbname() calls are replaced by the table's actual values,
 * and the resulting constant expression is folded to a boolean, which is stored in *pQualified.
 *
 * Returns TSDB_CODE_SUCCESS with *pQualified == false when the table entry cannot be loaded.
 * Returns an error code (and sets terrno) with *pQualified == false when the condition cannot be cloned
 * or the constant calculation fails.
 */
int32_t isQualifiedTable(STableKeyInfo* info, SNode* pTagCond, void* metaHandle, bool* pQualified) {
  int32_t     code = TSDB_CODE_SUCCESS;
  SMetaReader mr = {0};

  metaReaderInit(&mr, metaHandle, 0);
  code = metaGetTableEntryByUidCache(&mr, info->uid);
  if (TSDB_CODE_SUCCESS != code) {
    // a table that cannot be found is simply not qualified; this is not reported as an error
    metaReaderClear(&mr);
    *pQualified = false;
    return TSDB_CODE_SUCCESS;
  }

  SNode* pTagCondTmp = nodesCloneNode(pTagCond);
  if (pTagCondTmp == NULL) {
    // a NULL clone is treated as an allocation failure
    metaReaderClear(&mr);
    *pQualified = false;
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return terrno;
  }

  nodesRewriteExprPostOrder(&pTagCondTmp, doTranslateTagExpr, &mr);
  metaReaderClear(&mr);

  SNode* pNew = NULL;
  code = scalarCalculateConstants(pTagCondTmp, &pNew);
  if (TSDB_CODE_SUCCESS != code) {
    terrno = code;
    nodesDestroyNode(pTagCondTmp);
    *pQualified = false;
    return code;
  }

  ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
  SValueNode* pValue = (SValueNode*)pNew;

  ASSERT(pValue->node.resType.type == TSDB_DATA_TYPE_BOOL);
  *pQualified = pValue->datum.b;

  nodesDestroyNode(pNew);
  return TSDB_CODE_SUCCESS;
}

wmmhello's avatar
wmmhello 已提交
335 336 337 338
/*
 * Expression rewriter callback that assigns slot ids to the columns referenced by an expression.
 *
 * Column nodes are used as they are; tbname() function nodes are first replaced by a synthetic column
 * node (colId -1, COLUMN_TYPE_TBNAME, varchar). Other nodes are skipped.
 * The first time a colId is seen it receives the next slot id of the tagFilterAssist context (pContext)
 * and its SColumnInfo is appended to cInfoList; later occurrences reuse the slot id recorded in colHash.
 */
static EDealRes getColumn(SNode** pNode, void* pContext) {
  SColumnNode* pColNode = NULL;

  switch (nodeType((*pNode))) {
    case QUERY_NODE_COLUMN:
      pColNode = *(SColumnNode**)pNode;
      break;

    case QUERY_NODE_FUNCTION: {
      SFunctionNode* pFunc = *(SFunctionNode**)(pNode);
      if (pFunc->funcType != FUNCTION_TYPE_TBNAME) {
        return DEAL_RES_CONTINUE;
      }

      pColNode = (SColumnNode*)nodesMakeNode(QUERY_NODE_COLUMN);
      if (NULL == pColNode) {
        return DEAL_RES_ERROR;
      }

      pColNode->colId = -1;
      pColNode->colType = COLUMN_TYPE_TBNAME;
      pColNode->node.resType.type = TSDB_DATA_TYPE_VARCHAR;
      pColNode->node.resType.bytes = TSDB_TABLE_FNAME_LEN - 1 + VARSTR_HEADER_SIZE;

      // the synthetic column node takes the place of the tbname() call
      nodesDestroyNode(*pNode);
      *pNode = (SNode*)pColNode;
      break;
    }

    default:
      return DEAL_RES_CONTINUE;
  }

  tagFilterAssist* pAssist = (tagFilterAssist*)pContext;
  void*            pSeen = taosHashGet(pAssist->colHash, &pColNode->colId, sizeof(pColNode->colId));
  if (pSeen != NULL) {
    // already registered: share the slot of the first occurrence
    SColumnNode* pFirst = *(SColumnNode**)pSeen;
    pColNode->slotId = pFirst->slotId;
    return DEAL_RES_CONTINUE;
  }

  // remember the node pointer under its column id
  taosHashPut(pAssist->colHash, &pColNode->colId, sizeof(pColNode->colId), pNode, sizeof((*pNode)));
  pColNode->slotId = pAssist->index++;

  SColumnInfo cInfo = {.colId = pColNode->colId,
                       .type = pColNode->node.resType.type,
                       .bytes = pColNode->node.resType.bytes};
#if TAG_FILTER_DEBUG
  qDebug("tagfilter build column info, slotId:%d, colId:%d, type:%d", pColNode->slotId, cInfo.colId, cInfo.type);
#endif
  taosArrayPush(pAssist->cInfoList, &cInfo);

  return DEAL_RES_CONTINUE;
}

/*
 * Allocates a column of the given data type with room for numOfRows rows and attaches it to pParam
 * (columnData, with colAlloced set to true).
 *
 * Returns TSDB_CODE_SUCCESS, or an error code (also stored in terrno) when the column descriptor or
 * its buffers cannot be allocated; on failure nothing is attached to pParam.
 */
static int32_t createResultData(SDataType* pType, int32_t numOfRows, SScalarParam* pParam) {
  SColumnInfoData* pColumnData = taosMemoryCalloc(1, sizeof(SColumnInfoData));
  if (pColumnData == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return terrno;
  }

  pColumnData->info.type = pType->type;
  pColumnData->info.bytes = pType->bytes;
  pColumnData->info.scale = pType->scale;
  pColumnData->info.precision = pType->precision;

  int32_t code = colInfoDataEnsureCapacity(pColumnData, numOfRows, true);
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    // release whatever buffers were attached before the failure, then the descriptor itself
    colDataDestroy(pColumnData);
    taosMemoryFree(pColumnData);
    return terrno;
  }

  pParam->columnData = pColumnData;
  pParam->colAlloced = true;
  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
403 404 405 406 407 408 409 410
// Element destructor: destroys the column data and then frees the column descriptor itself; NULL is ignored.
static void releaseColInfoData(void* pCol) {
  if (pCol == NULL) {
    return;
  }

  SColumnInfoData* pColumn = (SColumnInfoData*)pCol;
  colDataDestroy(pColumn);
  taosMemoryFree(pColumn);
}

H
Haojun Liao 已提交
411 412 413 414 415 416 417
// Element destructor for STUidTagInfo items: frees the tag value buffer if one is attached.
void freeItem(void* p) {
  STUidTagInfo* pItem = p;
  if (pItem->pTagVal == NULL) {
    return;
  }

  taosMemoryFree(pItem->pTagVal);
}

H
Haojun Liao 已提交
418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435
/*
 * Computes the group id of every table in pTableListInfo from the values of the group-by expressions.
 *
 * Steps:
 *  1. collect the columns referenced by `group` and assign them slot ids (getColumn);
 *  2. load the tags of all tables and build one data block holding the tag values;
 *  3. evaluate every group-by expression against that block (value nodes are skipped);
 *  4. for each table, serialise a null flag per evaluated expression plus the non-null values into a
 *     key buffer and hash it with calcGroupId(); the result is stored in the table's groupId.
 *
 * Returns TSDB_CODE_SUCCESS (also when the table list is empty), or an error code:
 * TSDB_CODE_OUT_OF_MEMORY on allocation failure, TSDB_CODE_OPS_NOT_SUPPORT for an unsupported node type,
 * TSDB_CODE_QRY_JSON_IN_GROUP_ERROR when a whole JSON object is used as group key, or the code reported
 * by one of the called helpers.
 */
int32_t getColInfoResultForGroupby(void* metaHandle, SNodeList* group, STableListInfo* pTableListInfo) {
  int32_t      code = TSDB_CODE_SUCCESS;
  SArray*      pBlockList = NULL;
  SSDataBlock* pResBlock = NULL;
  void*        keyBuf = NULL;
  SArray*      groupData = NULL;
  // released at the "end" label, so it must hold a defined value before the first "goto end"
  SArray*      pUidTagList = NULL;

  int32_t rows = taosArrayGetSize(pTableListInfo->pTableList);
  if (rows == 0) {
    return TSDB_CODE_SUCCESS;
  }

  tagFilterAssist ctx = {0};
  ctx.colHash = taosHashInit(4, taosGetDefaultHashFunction(TSDB_DATA_TYPE_SMALLINT), false, HASH_NO_LOCK);
  if (ctx.colHash == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  ctx.index = 0;
  ctx.cInfoList = taosArrayInit(4, sizeof(SColumnInfo));
  if (ctx.cInfoList == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  SNode* pNode = NULL;
  FOREACH(pNode, group) {
    nodesRewriteExprPostOrder(&pNode, getColumn, (void*)&ctx);
    REPLACE_NODE(pNode);
  }

  pUidTagList = taosArrayInit(8, sizeof(STUidTagInfo));
  if (pUidTagList == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  for (int32_t i = 0; i < rows; ++i) {
    STableKeyInfo* pkeyInfo = taosArrayGet(pTableListInfo->pTableList, i);
    STUidTagInfo   info = {.uid = pkeyInfo->uid};
    if (taosArrayPush(pUidTagList, &info) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto end;
    }
  }

  code = metaGetTableTags(metaHandle, pTableListInfo->suid, pUidTagList);
  if (code != TSDB_CODE_SUCCESS) {
    goto end;
  }

  int32_t numOfTables = taosArrayGetSize(pUidTagList);
  pResBlock = createTagValBlockForFilter(ctx.cInfoList, numOfTables, pUidTagList, metaHandle);
  if (pResBlock == NULL) {
    code = terrno;
    goto end;
  }

  pBlockList = taosArrayInit(2, POINTER_BYTES);
  if (pBlockList == NULL || taosArrayPush(pBlockList, &pResBlock) == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  groupData = taosArrayInit(2, POINTER_BYTES);
  if (groupData == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  FOREACH(pNode, group) {
    SScalarParam output = {0};

    switch (nodeType(pNode)) {
      case QUERY_NODE_VALUE:
        break;
      case QUERY_NODE_COLUMN:
      case QUERY_NODE_OPERATOR:
      case QUERY_NODE_FUNCTION: {
        SExprNode* expNode = (SExprNode*)pNode;
        code = createResultData(&expNode->resType, rows, &output);
        if (code != TSDB_CODE_SUCCESS) {
          goto end;
        }
        break;
      }

      default:
        code = TSDB_CODE_OPS_NOT_SUPPORT;
        goto end;
    }

    if (nodeType(pNode) == QUERY_NODE_COLUMN) {
      SColumnNode*     pSColumnNode = (SColumnNode*)pNode;
      SColumnInfoData* pColInfo = (SColumnInfoData*)taosArrayGet(pResBlock->pDataBlock, pSColumnNode->slotId);
      code = colDataAssign(output.columnData, pColInfo, rows, NULL);
    } else if (nodeType(pNode) == QUERY_NODE_VALUE) {
      // value nodes do not produce a result column
      continue;
    } else {
      code = scalarCalculate(pNode, pBlockList, &output);
    }

    if (code != TSDB_CODE_SUCCESS) {
      releaseColInfoData(output.columnData);
      goto end;
    }

    if (taosArrayPush(groupData, &output.columnData) == NULL) {
      // the column was not handed over to groupData, release it here
      releaseColInfoData(output.columnData);
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto end;
    }
  }

  // key layout: one null flag per group-by expression, followed by the values
  int32_t keyLen = 0;
  SNode*  node;
  FOREACH(node, group) {
    SExprNode* pExpr = (SExprNode*)node;
    keyLen += pExpr->resType.bytes;
  }

  int32_t nullFlagSize = sizeof(int8_t) * LIST_LENGTH(group);
  keyLen += nullFlagSize;

  keyBuf = taosMemoryCalloc(1, keyLen);
  if (keyBuf == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  int32_t numOfGroupCols = (int32_t)taosArrayGetSize(groupData);
  for (int i = 0; i < rows; i++) {
    STableKeyInfo* info = taosArrayGet(pTableListInfo->pTableList, i);

    char* isNull = (char*)keyBuf;
    char* pStart = (char*)keyBuf + nullFlagSize;
    for (int j = 0; j < numOfGroupCols; j++) {
      SColumnInfoData* pValue = (SColumnInfoData*)taosArrayGetP(groupData, j);

      if (colDataIsNull_s(pValue, i)) {
        isNull[j] = 1;
        continue;
      }

      isNull[j] = 0;
      char* data = colDataGetData(pValue, i);
      if (pValue->info.type == TSDB_DATA_TYPE_JSON) {
        if (tTagIsJson(data)) {
          code = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
          goto end;
        }
        if (tTagIsJsonNull(data)) {
          isNull[j] = 1;
          continue;
        }
        int32_t len = getJsonValueLen(data);
        memcpy(pStart, data, len);
        pStart += len;
      } else if (IS_VAR_DATA_TYPE(pValue->info.type)) {
        memcpy(pStart, data, varDataTLen(data));
        pStart += varDataTLen(data);
      } else {
        memcpy(pStart, data, pValue->info.bytes);
        pStart += pValue->info.bytes;
      }
    }

    int32_t len = (int32_t)(pStart - (char*)keyBuf);
    info->groupId = calcGroupId(keyBuf, len);
  }

end:
  taosMemoryFreeClear(keyBuf);
  taosHashCleanup(ctx.colHash);
  taosArrayDestroy(ctx.cInfoList);
  blockDataDestroy(pResBlock);
  taosArrayDestroy(pBlockList);
  taosArrayDestroyEx(pUidTagList, freeItem);
  taosArrayDestroyP(groupData, releaseColInfoData);
  return code;
}

H
Haojun Liao 已提交
586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638
// Comparator for arrays of C-string pointers: orders by strcmp() and normalises the result to -1, 0 or 1.
static int32_t nameComparFn(const void* p1, const void* p2) {
  const char* lhs = *(const char**)p1;
  const char* rhs = *(const char**)p2;

  int32_t diff = strcmp(lhs, rhs);
  if (diff > 0) {
    return 1;
  }

  return (diff < 0) ? -1 : 0;
}

static SArray* getTableNameList(const SNodeListNode* pList) {
  int32_t    len = LIST_LENGTH(pList->pNodeList);
  SListCell* cell = pList->pNodeList->pHead;

  SArray* pTbList = taosArrayInit(len, POINTER_BYTES);
  for (int i = 0; i < pList->pNodeList->length; i++) {
    SValueNode* valueNode = (SValueNode*)cell->pNode;
    if (!IS_VAR_DATA_TYPE(valueNode->node.resType.type)) {
      terrno = TSDB_CODE_INVALID_PARA;
      taosArrayDestroy(pTbList);
      return NULL;
    }

    char* name = varDataVal(valueNode->datum.p);
    taosArrayPush(pTbList, &name);
    cell = cell->pNext;
  }

  size_t numOfTables = taosArrayGetSize(pTbList);

  // order the name
  taosArraySort(pTbList, nameComparFn);

  // remove the duplicates
  SArray* pNewList = taosArrayInit(taosArrayGetSize(pTbList), sizeof(void*));
  taosArrayPush(pNewList, taosArrayGet(pTbList, 0));

  for (int32_t i = 1; i < numOfTables; ++i) {
    char** name = taosArrayGetLast(pNewList);
    char** nameInOldList = taosArrayGet(pTbList, i);
    if (strcmp(*name, *nameInOldList) == 0) {
      continue;
    }

    taosArrayPush(pNewList, nameInOldList);
  }

  taosArrayDestroy(pTbList);
  return pNewList;
}

dengyihao's avatar
dengyihao 已提交
639
// Comparator for uint64 table uids: returns -1, 0 or 1 for ascending order.
static int tableUidCompare(const void* a, const void* b) {
  const uint64_t u1 = *(const uint64_t*)a;
  const uint64_t u2 = *(const uint64_t*)b;

  if (u1 == u2) {
    return 0;
  }

  return u1 < u2 ? -1 : 1;
}
H
Haojun Liao 已提交
649

H
Haojun Liao 已提交
650
// Comparator for STUidTagInfo items: orders them by uid, ascending.
static int32_t filterTableInfoCompare(const void* a, const void* b) {
  const STUidTagInfo* pLeft = (const STUidTagInfo*)a;
  const STUidTagInfo* pRight = (const STUidTagInfo*)b;

  if (pLeft->uid != pRight->uid) {
    return (pLeft->uid < pRight->uid) ? -1 : 1;
  }

  return 0;
}

661
/*
 * Tries to resolve a "tbname IN (...)" condition directly into table uids appended to pRes.
 *
 * A plain operator node is handed to optimizeTbnameInCondImpl() and its result is returned as is.
 * For an AND condition the parameters are tried one by one until the first one that is such a tbname
 * condition; pRes is then sorted by uid, de-duplicated, and the tags of those tables are loaded with
 * metaGetTableTagsByUids(), whose result is returned.
 * In every other case -1 is returned.
 */
static int32_t optimizeTbnameInCond(void* metaHandle, int64_t suid, SArray* pRes, SNode* cond) {
  int32_t ntype = nodeType(cond);
  int32_t ret = -1;

  if (ntype == QUERY_NODE_OPERATOR) {
    ret = optimizeTbnameInCondImpl(metaHandle, pRes, cond);
  }

  bool isAndCond =
      (ntype == QUERY_NODE_LOGIC_CONDITION) && (((SLogicConditionNode*)cond)->condType == LOGIC_COND_TYPE_AND);
  if (!isAndCond) {
    return ret;
  }

  SLogicConditionNode* pLogic = (SLogicConditionNode*)cond;
  SNodeList*           pParams = (SNodeList*)pLogic->pParameterList;

  int32_t numOfParams = LIST_LENGTH(pParams);
  if (numOfParams <= 0) {
    return ret;
  }

  bool    hasTbnameCond = false;
  int32_t visited = 0;
  for (SListCell* cell = pParams->pHead; visited < numOfParams && cell != NULL; cell = cell->pNext, ++visited) {
    if (optimizeTbnameInCondImpl(metaHandle, pRes, cell->pNode) == 0) {
      hasTbnameCond = true;
      break;
    }
  }

  taosArraySort(pRes, filterTableInfoCompare);
  taosArrayRemoveDuplicate(pRes, filterTableInfoCompare, NULL);

  if (hasTbnameCond) {
    ret = metaGetTableTagsByUids(metaHandle, suid, pRes);
  }

  return ret;
}

703
#if 0
/*
 * handle invalid uid: keep only the entries of `uids` whose uid is present in `tags`
 */
static int32_t removeInvalidUid(SArray* uids, SHashObj* tags) {
  int32_t numOfUids = taosArrayGetSize(uids);
  if (numOfUids <= 0) {
    return 0;
  }

  SArray* pKept = taosArrayInit(numOfUids, sizeof(STUidTagInfo));

  for (int32_t idx = 0; idx < numOfUids; ++idx) {
    STUidTagInfo* pItem = taosArrayGet(uids, idx);
    if (taosHashGet(tags, &pItem->uid, sizeof(int64_t)) == NULL) {
      continue;
    }

    taosArrayPush(pKept, pItem);
  }

  // hand the filtered content over to the caller's array and drop the old content
  taosArraySwap(uids, pKept);
  taosArrayDestroy(pKept);
  return 0;
}

#endif

729
// only return uid that does not contained in pExistedUidList
H
Haojun Liao 已提交
730
static int32_t optimizeTbnameInCondImpl(void* metaHandle, SArray* pExistedUidList, SNode* pTagCond) {
dengyihao's avatar
dengyihao 已提交
731 732 733
  if (nodeType(pTagCond) != QUERY_NODE_OPERATOR) {
    return -1;
  }
734

dengyihao's avatar
dengyihao 已提交
735 736 737 738
  SOperatorNode* pNode = (SOperatorNode*)pTagCond;
  if (pNode->opType != OP_TYPE_IN) {
    return -1;
  }
739

dengyihao's avatar
dengyihao 已提交
740 741 742 743 744 745
  if ((pNode->pLeft != NULL && nodeType(pNode->pLeft) == QUERY_NODE_COLUMN &&
       ((SColumnNode*)pNode->pLeft)->colType == COLUMN_TYPE_TBNAME) &&
      (pNode->pRight != NULL && nodeType(pNode->pRight) == QUERY_NODE_NODE_LIST)) {
    SNodeListNode* pList = (SNodeListNode*)pNode->pRight;

    int32_t len = LIST_LENGTH(pList->pNodeList);
H
Haojun Liao 已提交
746 747
    if (len <= 0) {
      return -1;
dengyihao's avatar
dengyihao 已提交
748 749
    }

dengyihao's avatar
dengyihao 已提交
750 751 752
    SArray*   pTbList = getTableNameList(pList);
    int32_t   numOfTables = taosArrayGetSize(pTbList);
    SHashObj* uHash = NULL;
H
Haojun Liao 已提交
753

754 755 756 757
    size_t    numOfExisted = taosArrayGetSize(pExistedUidList);  // len > 0 means there already have uids
    if (numOfExisted > 0) {
      uHash = taosHashInit(numOfExisted / 0.7, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_NO_LOCK);
      for (int i = 0; i < numOfExisted; i++) {
758
        STUidTagInfo* pTInfo = taosArrayGet(pExistedUidList, i);
H
Haojun Liao 已提交
759
        taosHashPut(uHash, &pTInfo->uid, sizeof(uint64_t), &i, sizeof(i));
D
dapan1121 已提交
760 761
      }
    }
dengyihao's avatar
dengyihao 已提交
762

763 764
    for (int i = 0; i < numOfTables; i++) {
      char* name = taosArrayGetP(pTbList, i);
dengyihao's avatar
dengyihao 已提交
765 766 767

      uint64_t uid = 0;
      if (metaGetTableUidByName(metaHandle, name, &uid) == 0) {
dengyihao's avatar
dengyihao 已提交
768 769
        ETableType tbType = TSDB_TABLE_MAX;
        if (metaGetTableTypeByName(metaHandle, name, &tbType) == 0 && tbType == TSDB_CHILD_TABLE) {
D
dapan1121 已提交
770
          if (NULL == uHash || taosHashGet(uHash, &uid, sizeof(uid)) == NULL) {
771
            STUidTagInfo s = {.uid = uid, .name = name, .pTagVal = NULL};
H
Haojun Liao 已提交
772
            taosArrayPush(pExistedUidList, &s);
D
dapan1121 已提交
773
          }
dengyihao's avatar
dengyihao 已提交
774 775
        } else {
          taosArrayDestroy(pTbList);
D
dapan1121 已提交
776
          taosHashCleanup(uHash);
dengyihao's avatar
dengyihao 已提交
777 778
          return -1;
        }
dengyihao's avatar
dengyihao 已提交
779
      } else {
H
Haojun Liao 已提交
780
//        qWarn("failed to get tableIds from by table name: %s, reason: %s", name, tstrerror(terrno));
dengyihao's avatar
dengyihao 已提交
781 782 783
        terrno = 0;
      }
    }
784

D
dapan1121 已提交
785
    taosHashCleanup(uHash);
dengyihao's avatar
dengyihao 已提交
786
    taosArrayDestroy(pTbList);
dengyihao's avatar
dengyihao 已提交
787
    return 0;
dengyihao's avatar
dengyihao 已提交
788
  }
H
Haojun Liao 已提交
789

dengyihao's avatar
dengyihao 已提交
790
  return -1;
dengyihao's avatar
dengyihao 已提交
791
}
H
Haojun Liao 已提交
792

793 794 795 796 797 798 799 800 801 802 803 804 805 806 807 808
// Compute the MD5 digest of the message form of the tag condition and leave it in pContext.
// When pTagCond is NULL nothing is done and pContext is left exactly as the caller passed it.
// The return value of nodesNodeToMsg is not inspected.
static void genTagFilterDigest(const SNode* pTagCond, T_MD5_CTX* pContext) {
  if (NULL != pTagCond) {
    int32_t msgLen = 0;
    char*   pMsg = NULL;

    // the digest is taken over the buffer filled in by nodesNodeToMsg
    nodesNodeToMsg(pTagCond, &pMsg, &msgLen);

    tMD5Init(pContext);
    tMD5Update(pContext, (uint8_t*)pMsg, (uint32_t)msgLen);
    tMD5Final(pContext);

    taosMemoryFree(pMsg);
  }
}

H
Haojun Liao 已提交
809
// Build a data block with one row per entry of pUidTagList (numOfTables rows in total) and
// one column per SColumnInfo in pColList. A column whose colId is -1 receives the table
// name; every other column receives the tag value looked up in the entry's pTagVal.
//
// Returns the new block, or NULL with terrno set when an allocation fails. On failure the
// partially built block is destroyed here, so the caller has nothing to release.
static SSDataBlock* createTagValBlockForFilter(SArray* pColList, int32_t numOfTables, SArray* pUidTagList, void* metaHandle) {
  SSDataBlock* pResBlock = createDataBlock();
  if (pResBlock == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  for (int32_t i = 0; i < taosArrayGetSize(pColList); ++i) {
    SColumnInfoData colInfo = {0};
    colInfo.info = *(SColumnInfo*)taosArrayGet(pColList, i);
    blockDataAppendColInfo(pResBlock, &colInfo);
  }

  int32_t code = blockDataEnsureCapacity(pResBlock, numOfTables);
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    blockDataDestroy(pResBlock);  // do not leak the block on failure
    return NULL;
  }

  pResBlock->info.rows = numOfTables;

  int32_t numOfCols = taosArrayGetSize(pResBlock->pDataBlock);

  for (int32_t i = 0; i < numOfTables; i++) {
    STUidTagInfo* p1 = taosArrayGet(pUidTagList, i);

    for (int32_t j = 0; j < numOfCols; j++) {
      SColumnInfoData* pColInfo = (SColumnInfoData*)taosArrayGet(pResBlock->pDataBlock, j);

      if (pColInfo->info.colId == -1) {  // tbname
        char str[TSDB_TABLE_FNAME_LEN + VARSTR_HEADER_SIZE] = {0};
        if (p1->name != NULL) {
          STR_TO_VARSTR(str, p1->name);
        } else {  // name is not retrieved during filter
          metaGetTableNameByUid(metaHandle, p1->uid, str);
        }

        colDataAppend(pColInfo, i, str, false);
#if TAG_FILTER_DEBUG
        qDebug("tagfilter uid:%" PRIu64 ", tbname:%s", p1->uid, str + 2);
#endif
        continue;
      }

      // No tag payload for this table: the cell is NULL. Stop here so the NULL pointer is
      // never handed to metaGetTableTagVal and the cell is not appended a second time.
      if (p1->pTagVal == NULL) {
        colDataAppendNULL(pColInfo, i);
        continue;
      }

      STagVal tagVal = {0};
      tagVal.cid = pColInfo->info.colId;

      const char* p = metaGetTableTagVal(p1->pTagVal, pColInfo->info.type, &tagVal);

      if (p == NULL || (pColInfo->info.type == TSDB_DATA_TYPE_JSON && ((STag*)p)->nTag == 0)) {
        colDataAppendNULL(pColInfo, i);
      } else if (pColInfo->info.type == TSDB_DATA_TYPE_JSON) {
        colDataAppend(pColInfo, i, p, false);
      } else if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
        // Heap buffer instead of alloca: this runs once per (table, column) pair and alloca
        // memory is only released when the function returns, so the stack would keep growing.
        char* tmp = taosMemoryMalloc(tagVal.nData + VARSTR_HEADER_SIZE + 1);
        if (tmp == NULL) {
          terrno = TSDB_CODE_OUT_OF_MEMORY;
          blockDataDestroy(pResBlock);
          return NULL;
        }

        varDataSetLen(tmp, tagVal.nData);
        memcpy(tmp + VARSTR_HEADER_SIZE, tagVal.pData, tagVal.nData);
        tmp[VARSTR_HEADER_SIZE + tagVal.nData] = 0;  // terminator, only read by the debug log below
        colDataAppend(pColInfo, i, tmp, false);
#if TAG_FILTER_DEBUG
        qDebug("tagfilter varch:%s", tmp + 2);
#endif
        taosMemoryFree(tmp);
      } else {
        colDataAppend(pColInfo, i, (const char*)&tagVal.i64, false);
#if TAG_FILTER_DEBUG
        if (pColInfo->info.type == TSDB_DATA_TYPE_INT) {
          qDebug("tagfilter int:%d", *(int*)(&tagVal.i64));
        } else if (pColInfo->info.type == TSDB_DATA_TYPE_DOUBLE) {
          qDebug("tagfilter double:%f", *(double*)(&tagVal.i64));
        }
#endif
      }
    }
  }

  return pResBlock;
}

// Rebuild pUidList from the filter result: the list is cleared, then the uid of every entry
// of pUidTagList whose flag in pResultList is true is appended, in the original order.
// pResultList is indexed in parallel with pUidTagList.
static void doSetQualifiedUid(SArray* pUidList, const SArray* pUidTagList, bool* pResultList) {
  taosArrayClear(pUidList);

  int32_t total = taosArrayGetSize(pUidTagList);
  int32_t idx = 0;
  while (idx < total) {
    STUidTagInfo* pInfo = (STUidTagInfo*)taosArrayGet(pUidTagList, idx);
    uint64_t      uid = pInfo->uid;
    bool          qualified = pResultList[idx];

    qDebug("tagfilter get uid:%" PRId64 ", res:%d", uid, qualified);

    if (qualified) {
      taosArrayPush(pUidList, &uid);
    }

    ++idx;
  }
}

// Append one STUidTagInfo to pUidTagList for every uid stored in pUidList. Only the uid
// member is filled in; every other member of the new entry is zero.
static void copyExistedUids(SArray* pUidTagList, const SArray* pUidList) {
  int32_t total = taosArrayGetSize(pUidList);

  // an empty source list simply skips the loop
  for (int32_t idx = 0; idx < total; ++idx) {
    STUidTagInfo item = {0};
    item.uid = *(uint64_t*)taosArrayGet(pUidList, idx);
    taosArrayPush(pUidTagList, &item);
  }
}

// Filter the tables of the super table pListInfo->suid with the tag condition pTagCond and
// leave the uids that qualify in pUidList.
//
// On entry pUidList may already hold candidate uids; they seed the working list. If
// optimizeTbnameInCond returns 0, the working list it produced is copied to pUidList and no
// further evaluation happens. Otherwise the tags are loaded with metaGetTableTags, a tag
// value block is built, the condition is evaluated with scalarCalculate and pUidList is
// rebuilt from the boolean result column.
//
// Returns TSDB_CODE_SUCCESS (also when pTagCond is NULL, in which case pUidList is left
// untouched) or an error code; terrno is set to the same code on failure.
static int32_t doFilterByTagCond(STableListInfo* pListInfo, SArray* pUidList, SNode* pTagCond, void* metaHandle) {
  if (pTagCond == NULL) {
    return TSDB_CODE_SUCCESS;
  }

  terrno = TSDB_CODE_SUCCESS;

  // Everything released at the `end` label is declared and initialised before the first
  // `goto end`, so the cleanup code never sees an indeterminate pointer.
  int32_t      code = TSDB_CODE_SUCCESS;
  int32_t      numOfTables = 0;
  SArray*      pBlockList = NULL;
  SArray*      pUidTagList = NULL;
  SSDataBlock* pResBlock = NULL;
  SScalarParam output = {0};
  SDataType    type = {.type = TSDB_DATA_TYPE_BOOL, .bytes = sizeof(bool)};

  tagFilterAssist ctx = {0};
  ctx.colHash = taosHashInit(4, taosGetDefaultHashFunction(TSDB_DATA_TYPE_SMALLINT), false, HASH_NO_LOCK);
  if (ctx.colHash == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    terrno = code;
    goto end;
  }

  ctx.cInfoList = taosArrayInit(4, sizeof(SColumnInfo));
  if (ctx.cInfoList == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    terrno = code;
    goto end;
  }

  nodesRewriteExprPostOrder(&pTagCond, getColumn, (void*)&ctx);

  pUidTagList = taosArrayInit(10, sizeof(STUidTagInfo));
  if (pUidTagList == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    terrno = code;
    goto end;
  }

  copyExistedUids(pUidTagList, pUidList);

  int32_t filter = optimizeTbnameInCond(metaHandle, pListInfo->suid, pUidTagList, pTagCond);
  if (filter == 0) {  // tbname in filter is activated, do nothing and return
    taosArrayClear(pUidList);

    int32_t numOfRows = taosArrayGetSize(pUidTagList);
    taosArrayEnsureCap(pUidList, numOfRows);
    for (int32_t i = 0; i < numOfRows; ++i) {
      STUidTagInfo* pInfo = taosArrayGet(pUidTagList, i);
      taosArrayPush(pUidList, &pInfo->uid);
    }

    terrno = 0;
    goto end;
  } else {
    // here we retrieve all tags from the vnode table-meta store
    code = metaGetTableTags(metaHandle, pListInfo->suid, pUidTagList);
    if (code != TSDB_CODE_SUCCESS) {
      qError("failed to get table tags from meta, reason:%s, suid:%" PRIu64, tstrerror(code), pListInfo->suid);
      terrno = code;
      goto end;
    }
  }

  numOfTables = taosArrayGetSize(pUidTagList);
  if (numOfTables == 0) {
    goto end;
  }

  pResBlock = createTagValBlockForFilter(ctx.cInfoList, numOfTables, pUidTagList, metaHandle);
  if (pResBlock == NULL) {
    code = terrno;
    goto end;
  }

  pBlockList = taosArrayInit(2, POINTER_BYTES);
  if (pBlockList == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    terrno = code;
    goto end;
  }
  taosArrayPush(pBlockList, &pResBlock);

  code = createResultData(&type, numOfTables, &output);
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    goto end;
  }

  code = scalarCalculate(pTagCond, pBlockList, &output);
  if (code != TSDB_CODE_SUCCESS) {
    qError("failed to calculate scalar, reason:%s", tstrerror(code));
    terrno = code;
    goto end;
  }

  doSetQualifiedUid(pUidList, pUidTagList, (bool*)output.columnData->pData);

end:
  taosHashCleanup(ctx.colHash);
  taosArrayDestroy(ctx.cInfoList);
  blockDataDestroy(pResBlock);
  taosArrayDestroy(pBlockList);
  if (pUidTagList != NULL) {
    taosArrayDestroyEx(pUidTagList, freeItem);
  }

  colDataDestroy(output.columnData);
  taosMemoryFreeClear(output.columnData);
  return code;
}

1014
int32_t getTableList(void* metaHandle, void* pVnode, SScanPhysiNode* pScanNode, SNode* pTagCond, SNode* pTagIndexCond,
1015
                     STableListInfo* pListInfo, const char* idstr) {
1016
  int32_t code = TSDB_CODE_SUCCESS;
1017
  size_t  numOfTables = 0;
1018

D
dapan1121 已提交
1019
  pListInfo->suid = pScanNode->suid;
1020
  SArray* pUidList = taosArrayInit(8, sizeof(uint64_t));
dengyihao's avatar
dengyihao 已提交
1021

1022
  if (pScanNode->tableType != TSDB_SUPER_TABLE) {
1023 1024
    if (metaIsTableExist(metaHandle, pScanNode->uid)) {
      taosArrayPush(pUidList, &pScanNode->uid);
1025
    }
1026

1027
    code = doFilterByTagCond(pListInfo, pUidList, pTagCond, metaHandle);
1028
    if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
1029
      goto _end;
H
Haojun Liao 已提交
1030
    }
1031 1032
  } else {
    T_MD5_CTX context = {0};
H
Haojun Liao 已提交
1033

1034 1035 1036 1037 1038
    if (tsTagFilterCache) {
      // try to retrieve the result from meta cache
      genTagFilterDigest(pTagCond, &context);

      bool acquired = false;
1039
      metaGetCachedTableUidList(metaHandle, pScanNode->suid, context.digest, tListLen(context.digest), pUidList, &acquired);
1040
      if (acquired) {
1041
        qDebug("retrieve table uid list from cache, numOfTables:%d", (int32_t)taosArrayGetSize(pUidList));
1042 1043
        goto _end;
      }
wmmhello's avatar
wmmhello 已提交
1044 1045
    }

1046
    if (!pTagCond) {  // no tag filter condition exists, let's fetch all tables of this super table
1047
      ASSERT(pTagIndexCond == NULL);
1048
      vnodeGetCtbIdList(pVnode, pScanNode->suid, pUidList);
1049
    } else {
H
Haojun Liao 已提交
1050 1051
      // failed to find the result in the cache, let try to calculate the results
      if (pTagIndexCond) {
1052 1053 1054
        void* pIndex = tsdbGetIvtIdx(metaHandle);
        SIndexMetaArg metaArg = {
            .metaEx = metaHandle, .idx = tsdbGetIdx(metaHandle), .ivtIdx = pIndex, .suid = pScanNode->uid};
H
Haojun Liao 已提交
1055 1056

        SIdxFltStatus status = SFLT_NOT_INDEX;
1057
        code = doFilterTag(pTagIndexCond, &metaArg, pUidList, &status);
H
Haojun Liao 已提交
1058 1059
        if (code != 0 || status == SFLT_NOT_INDEX) {  // temporarily disable it for performance sake
//          qError("failed to get tableIds from index, reason:%s, suid:%" PRIu64, tstrerror(code), tableUid);
H
Haojun Liao 已提交
1060 1061
          code = TDB_CODE_SUCCESS;
        }
wmmhello's avatar
wmmhello 已提交
1062 1063
      }
    }
1064

1065
    code = doFilterByTagCond(pListInfo, pUidList, pTagCond, metaHandle);
1066
    if (code != TSDB_CODE_SUCCESS) {
H
Haojun Liao 已提交
1067
      goto _end;
wmmhello's avatar
wmmhello 已提交
1068 1069
    }

1070
    // let's add the filter results into meta-cache
1071
    numOfTables = taosArrayGetSize(pUidList);
1072

1073
    if (tsTagFilterCache) {
1074 1075 1076 1077 1078
      size_t size = numOfTables * sizeof(uint64_t) + sizeof(int32_t);
      char*  pPayload = taosMemoryMalloc(size);

      if (numOfTables > 0) {
        *(int32_t*)pPayload = numOfTables;
1079
        memcpy(pPayload + sizeof(int32_t), taosArrayGet(pUidList, 0), numOfTables * sizeof(uint64_t));
1080 1081
      }

1082
      metaUidFilterCachePut(metaHandle, pScanNode->suid, context.digest, tListLen(context.digest), pPayload, size, 1);
1083
      taosMemoryFree(pPayload);
1084
    }
wmmhello's avatar
wmmhello 已提交
1085 1086
  }

1087
_end:
1088
  numOfTables = taosArrayGetSize(pUidList);
H
Haojun Liao 已提交
1089
  for (int i = 0; i < numOfTables; i++) {
1090
    STableKeyInfo info = {.uid = *(uint64_t*)taosArrayGet(pUidList, i), .groupId = 0};
1091 1092

    void* p = taosArrayPush(pListInfo->pTableList, &info);
H
Haojun Liao 已提交
1093
    if (p == NULL) {
1094
      taosArrayDestroy(pUidList);
H
Haojun Liao 已提交
1095 1096 1097
      return TSDB_CODE_OUT_OF_MEMORY;
    }

1098
    qTrace("tagfilter get uid:%" PRIu64", %s", info.uid, idstr);
1099 1100
  }

1101
  taosArrayDestroy(pUidList);
1102 1103
  return code;
}
H
Haojun Liao 已提交
1104

1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117
// Size in bytes of the key buffer needed for the group expressions in pGroups: one int8_t
// per expression (getGroupIdFromTagsVal uses these leading bytes as null flags) plus the
// resType.bytes of every expression.
size_t getTableTagsBufLen(const SNodeList* pGroups) {
  size_t total = sizeof(int8_t) * LIST_LENGTH(pGroups);

  SNode* pItem;
  FOREACH(pItem, pGroups) {
    total += ((SExprNode*)pItem)->resType.bytes;
  }

  return total;
}

H
Haojun Liao 已提交
1118
// Compute the group id of table `uid` from the values of the group expressions in pGroupNode.
//
// The expressions are cloned, rewritten with doTranslateTagExpr against the table's meta
// entry and folded with scalarCalculateConstants. The results are packed into keyBuf:
// LIST_LENGTH(pGroupNode) null-flag bytes first, then the non-null values back to back.
// calcGroupId over the packed bytes yields *pGroupId.
//
// keyBuf is owned by the caller and is never freed here, on any path. Earlier revisions
// freed it on some (but not all) error paths, which left the caller unable to tell whether
// the buffer was still valid.
// NOTE(review): a caller that relied on the old free-on-error behaviour must now release
// keyBuf itself - confirm against the call sites.
//
// Returns TSDB_CODE_SUCCESS, TSDB_CODE_PAR_TABLE_NOT_EXIST when the table entry cannot be
// read, TSDB_CODE_QRY_JSON_IN_GROUP_ERROR (also stored in terrno) when tTagIsJson reports
// true for a JSON-typed group value, or the error of scalarCalculateConstants.
int32_t getGroupIdFromTagsVal(void* pMeta, uint64_t uid, SNodeList* pGroupNode, char* keyBuf, uint64_t* pGroupId) {
  SMetaReader mr = {0};
  metaReaderInit(&mr, pMeta, 0);
  if (metaGetTableEntryByUidCache(&mr, uid) != 0) {  // table not exist
    metaReaderClear(&mr);
    return TSDB_CODE_PAR_TABLE_NOT_EXIST;
  }

  int32_t    code = TSDB_CODE_SUCCESS;
  SNodeList* groupNew = nodesCloneList(pGroupNode);

  nodesRewriteExprsPostOrder(groupNew, doTranslateTagExpr, &mr);
  char* isNull = (char*)keyBuf;
  char* pStart = (char*)keyBuf + sizeof(int8_t) * LIST_LENGTH(pGroupNode);

  SNode*  pNode;
  int32_t index = 0;
  FOREACH(pNode, groupNew) {
    SNode* pNew = NULL;
    code = scalarCalculateConstants(pNode, &pNew);
    if (TSDB_CODE_SUCCESS != code) {
      goto _end;
    }
    REPLACE_NODE(pNew);

    ASSERT(nodeType(pNew) == QUERY_NODE_VALUE);
    SValueNode* pValue = (SValueNode*)pNew;

    if (pValue->node.resType.type == TSDB_DATA_TYPE_NULL || pValue->isNull) {
      isNull[index++] = 1;
      continue;
    }

    isNull[index++] = 0;
    char* data = nodesGetValueFromNode(pValue);
    if (pValue->node.resType.type == TSDB_DATA_TYPE_JSON) {
      if (tTagIsJson(data)) {
        terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
        code = terrno;
        goto _end;
      }
      int32_t len = getJsonValueLen(data);
      memcpy(pStart, data, len);
      pStart += len;
    } else if (IS_VAR_DATA_TYPE(pValue->node.resType.type)) {
      memcpy(pStart, data, varDataTLen(data));
      pStart += varDataTLen(data);
    } else {
      memcpy(pStart, data, pValue->node.resType.bytes);
      pStart += pValue->node.resType.bytes;
    }
  }

  *pGroupId = calcGroupId(keyBuf, (int32_t)(pStart - (char*)keyBuf));

_end:
  nodesDestroyList(groupNew);
  metaReaderClear(&mr);
  return code;
}

1184
// Convert a list of column nodes into a newly allocated array of SColumn, one element per
// node and in list order. Every node of pNodeList is treated as an SColumnNode.
// Returns NULL when pNodeList is NULL, and NULL with terrno = TSDB_CODE_OUT_OF_MEMORY when
// the array cannot be created.
SArray* extractPartitionColInfo(SNodeList* pNodeList) {
  if (NULL == pNodeList) {
    return NULL;
  }

  size_t  numOfCols = LIST_LENGTH(pNodeList);
  SArray* pColumns = taosArrayInit(numOfCols, sizeof(SColumn));
  if (NULL == pColumns) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  SNode* pItem = NULL;
  FOREACH(pItem, pNodeList) {
    SColumnNode* pColNode = (SColumnNode*)pItem;
    SDataType*   pType = &pColNode->node.resType;

    // todo extract method
    SColumn col = {0};
    col.slotId = pColNode->slotId;
    col.colId = pColNode->colId;
    col.type = pType->type;
    col.bytes = pType->bytes;
    col.precision = pType->precision;
    col.scale = pType->scale;

    taosArrayPush(pColumns, &col);
  }

  return pColumns;
}

H
Haojun Liao 已提交
1214 1215
// Build the column match list of a scan.
//
// Every target in pNodeList whose expression is a plain column yields one SColMatchItem
// (colId, source slot, destination slot, needOutput = true). The slot descriptors in
// pOutputNodeList then decide which items are really needed: an item whose destination
// slot is not flagged as output gets needOutput = false. *numOfOutputCols counts the slots
// flagged as output plus the slots whose id is not below the number of targets.
//
// On success pMatchInfo->pList receives the new list and pMatchInfo->matchType is `type`.
// Returns 0, or TSDB_CODE_OUT_OF_MEMORY when the list cannot be allocated (pMatchInfo->pList
// is not assigned in that case).
int32_t extractColMatchInfo(SNodeList* pNodeList, SDataBlockDescNode* pOutputNodeList, int32_t* numOfOutputCols,
                            int32_t type, SColMatchInfo* pMatchInfo) {
  size_t  numOfCols = LIST_LENGTH(pNodeList);
  int32_t code = 0;

  pMatchInfo->matchType = type;

  SArray* pList = taosArrayInit(numOfCols, sizeof(SColMatchItem));
  if (pList == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    return code;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);
    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

      SColMatchItem c = {.needOutput = true};
      c.colId = pColNode->colId;
      c.srcSlotId = pColNode->slotId;
      c.dstSlotId = pNode->slotId;
      taosArrayPush(pList, &c);
    }
  }

  // set the output flag for each column in SColMatchInfo, according to the output slot descriptors
  *numOfOutputCols = 0;
  int32_t num = LIST_LENGTH(pOutputNodeList->pSlots);
  int32_t numOfItems = taosArrayGetSize(pList);
  for (int32_t i = 0; i < num; ++i) {
    SSlotDescNode* pNode = (SSlotDescNode*)nodesListGetNode(pOutputNodeList->pSlots, i);

    // todo: add reserve flag check
    // it is a column reserved for the arithmetic expression calculation
    if (pNode->slotId >= numOfCols) {
      (*numOfOutputCols) += 1;
      continue;
    }

    // `info` stays NULL unless an item really targets this slot. Previously a failed search
    // left it pointing at the last item, which was then wrongly marked as not needed.
    SColMatchItem* info = NULL;
    for (int32_t j = 0; j < numOfItems; ++j) {
      SColMatchItem* pItem = taosArrayGet(pList, j);
      if (pItem->dstSlotId == pNode->slotId) {
        info = pItem;
        break;
      }
    }

    if (pNode->output) {
      (*numOfOutputCols) += 1;
    } else if (info != NULL) {
      // select distinct tbname from stb where tbname='abc';
      info->needOutput = false;
    }
  }

  pMatchInfo->pList = pList;
  return code;
}

1273 1274 1275 1276 1277 1278 1279 1280
static SResSchema createResSchema(int32_t type, int32_t bytes, int32_t slotId, int32_t scale, int32_t precision,
                                  const char* name) {
  SResSchema s = {0};
  s.scale = scale;
  s.type = type;
  s.bytes = bytes;
  s.slotId = slotId;
  s.precision = precision;
H
Haojun Liao 已提交
1281
  tstrncpy(s.name, name, tListLen(s.name));
1282 1283 1284

  return s;
}
1285

H
Haojun Liao 已提交
1286
// Allocate a zeroed SColumn and fill it from the given ids and data type.
// Returns NULL with terrno = TSDB_CODE_OUT_OF_MEMORY when the allocation fails; otherwise
// the caller receives the newly allocated column.
static SColumn* createColumn(int32_t blockId, int32_t slotId, int32_t colId, SDataType* pType, EColumnType colType) {
  SColumn* pColumn = taosMemoryCalloc(1, sizeof(SColumn));

  if (NULL != pColumn) {
    pColumn->slotId = slotId;
    pColumn->colId = colId;
    pColumn->bytes = pType->bytes;
    pColumn->type = pType->type;
    pColumn->scale = pType->scale;
    pColumn->precision = pType->precision;
    pColumn->dataBlockId = blockId;
    pColumn->colType = colType;
  } else {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
  }

  return pColumn;
}

1304
// Fill pExp from a single plan node. A tExprNode is allocated for pExp->pExpr, and the
// result schema of pExp->base is built from the node's result type with `slotId` as the
// destination slot. The rest depends on the node type:
//   column    - one parameter holding a newly created SColumn
//   value     - one parameter holding the value converted to a variant
//   function  - one parameter per function argument (column or value arguments are filled)
//   operator / case-when - one zeroed parameter, the node itself kept as the operator root
// Any other node type trips ASSERT(0).
// NOTE(review): none of the allocations below is checked and the function cannot report a
// failure through its void signature.
void createExprFromOneNode(SExprInfo* pExp, SNode* pNode, int16_t slotId) {
  tExprNode* pExprNode = taosMemoryCalloc(1, sizeof(tExprNode));
  pExp->pExpr = pExprNode;
  pExprNode->_function.num = 1;
  pExprNode->_function.functionId = -1;

  int32_t type = nodeType(pNode);
  switch (type) {
    case QUERY_NODE_COLUMN: {
      // it is a project query, or group by column
      SColumnNode* pColNode = (SColumnNode*)pNode;
      SDataType*   pType = &pColNode->node.resType;

      pExprNode->nodeType = QUERY_NODE_COLUMN;

      pExp->base.pParam = taosMemoryCalloc(1, sizeof(SFunctParam));
      pExp->base.numOfParams = 1;

      pExp->base.resSchema =
          createResSchema(pType->type, pType->bytes, slotId, pType->scale, pType->precision, pColNode->colName);
      pExp->base.pParam[0].pCol =
          createColumn(pColNode->dataBlockId, pColNode->slotId, pColNode->colId, pType, pColNode->colType);
      pExp->base.pParam[0].type = FUNC_PARAM_TYPE_COLUMN;
      break;
    }

    case QUERY_NODE_VALUE: {
      SValueNode* pValNode = (SValueNode*)pNode;
      SDataType*  pType = &pValNode->node.resType;

      pExprNode->nodeType = QUERY_NODE_VALUE;

      pExp->base.pParam = taosMemoryCalloc(1, sizeof(SFunctParam));
      pExp->base.numOfParams = 1;

      pExp->base.resSchema =
          createResSchema(pType->type, pType->bytes, slotId, pType->scale, pType->precision, pValNode->node.aliasName);
      pExp->base.pParam[0].type = FUNC_PARAM_TYPE_VALUE;
      nodesValueNodeToVariant(pValNode, &pExp->base.pParam[0].param);
      break;
    }

    case QUERY_NODE_FUNCTION: {
      SFunctionNode* pFuncNode = (SFunctionNode*)pNode;
      SDataType*     pType = &pFuncNode->node.resType;

      pExprNode->nodeType = QUERY_NODE_FUNCTION;

      pExp->base.resSchema =
          createResSchema(pType->type, pType->bytes, slotId, pType->scale, pType->precision, pFuncNode->node.aliasName);

      pExprNode->_function.functionId = pFuncNode->funcId;
      pExprNode->_function.pFunctNode = pFuncNode;
      pExprNode->_function.functionType = pFuncNode->funcType;

      tstrncpy(pExprNode->_function.functionName, pFuncNode->functionName, tListLen(pExprNode->_function.functionName));

#if 1
      // todo refactor: add the parameter for tbname function
      // a parameterless function named exactly "tbname" gets one BIGINT value parameter appended
      if (!pFuncNode->pParameterList && strcmp(pExprNode->_function.functionName, "tbname") == 0) {
        pFuncNode->pParameterList = nodesMakeList();
        ASSERT(LIST_LENGTH(pFuncNode->pParameterList) == 0);

        SValueNode* pDummy = (SValueNode*)nodesMakeNode(QUERY_NODE_VALUE);
        if (NULL != pDummy) {
          pDummy->node.resType = (SDataType){.bytes = sizeof(int64_t), .type = TSDB_DATA_TYPE_BIGINT};
          nodesListAppend(pFuncNode->pParameterList, (SNode*)pDummy);
        }  // todo handle error
      }
#endif

      int32_t numOfParam = LIST_LENGTH(pFuncNode->pParameterList);

      pExp->base.pParam = taosMemoryCalloc(numOfParam, sizeof(SFunctParam));
      pExp->base.numOfParams = numOfParam;

      for (int32_t k = 0; k < numOfParam; ++k) {
        SNode*       pArg = nodesListGetNode(pFuncNode->pParameterList, k);
        SFunctParam* pParam = &pExp->base.pParam[k];

        if (pArg->type == QUERY_NODE_COLUMN) {
          SColumnNode* pcn = (SColumnNode*)pArg;

          pParam->type = FUNC_PARAM_TYPE_COLUMN;
          pParam->pCol = createColumn(pcn->dataBlockId, pcn->slotId, pcn->colId, &pcn->node.resType, pcn->colType);
        } else if (pArg->type == QUERY_NODE_VALUE) {
          SValueNode* pvn = (SValueNode*)pArg;

          pParam->type = FUNC_PARAM_TYPE_VALUE;
          nodesValueNodeToVariant(pvn, &pParam->param);
        }
      }
      break;
    }

    case QUERY_NODE_OPERATOR: {
      SOperatorNode* pOpNode = (SOperatorNode*)pNode;
      SDataType*     pType = &pOpNode->node.resType;

      pExprNode->nodeType = QUERY_NODE_OPERATOR;

      pExp->base.pParam = taosMemoryCalloc(1, sizeof(SFunctParam));
      pExp->base.numOfParams = 1;

      pExp->base.resSchema =
          createResSchema(pType->type, pType->bytes, slotId, pType->scale, pType->precision, pOpNode->node.aliasName);
      pExprNode->_optrRoot.pRootNode = pNode;
      break;
    }

    case QUERY_NODE_CASE_WHEN: {
      SCaseWhenNode* pCaseNode = (SCaseWhenNode*)pNode;
      SDataType*     pType = &pCaseNode->node.resType;

      // a case-when expression is recorded with the operator node type
      pExprNode->nodeType = QUERY_NODE_OPERATOR;

      pExp->base.pParam = taosMemoryCalloc(1, sizeof(SFunctParam));
      pExp->base.numOfParams = 1;

      pExp->base.resSchema =
          createResSchema(pType->type, pType->bytes, slotId, pType->scale, pType->precision, pCaseNode->node.aliasName);
      pExprNode->_optrRoot.pRootNode = pNode;
      break;
    }

    default:
      ASSERT(0);
      break;
  }
}

1416 1417 1418 1419
// Fill pExp from a target node: its expression is converted with createExprFromOneNode and
// the target's slot id becomes the destination slot.
void createExprFromTargetNode(SExprInfo* pExp, STargetNode* pTargetNode) {
  SNode*  pTargetExpr = pTargetNode->pExpr;
  int16_t dstSlotId = pTargetNode->slotId;

  createExprFromOneNode(pExp, pTargetExpr, dstSlotId);
}

1420 1421 1422 1423 1424 1425 1426 1427
// Create the expression array for the targets in pNodeList followed by the targets in
// pGroupKeys (which may be NULL). Every list node is treated as an STargetNode.
//
// *numOfExprs receives the total number of expressions. Returns the newly allocated array,
// or NULL when there is nothing to create. On allocation failure NULL is returned with
// terrno = TSDB_CODE_OUT_OF_MEMORY and *numOfExprs reset to 0, so that a caller iterating
// over the count never touches the missing array.
SExprInfo* createExprInfo(SNodeList* pNodeList, SNodeList* pGroupKeys, int32_t* numOfExprs) {
  int32_t numOfFuncs = LIST_LENGTH(pNodeList);
  int32_t numOfGroupKeys = 0;
  if (pGroupKeys != NULL) {
    numOfGroupKeys = LIST_LENGTH(pGroupKeys);
  }

  *numOfExprs = numOfFuncs + numOfGroupKeys;
  if (*numOfExprs == 0) {
    return NULL;
  }

  SExprInfo* pExprs = taosMemoryCalloc(*numOfExprs, sizeof(SExprInfo));
  if (pExprs == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    *numOfExprs = 0;
    return NULL;
  }

  for (int32_t i = 0; i < (*numOfExprs); ++i) {
    STargetNode* pTargetNode = NULL;
    if (i < numOfFuncs) {
      pTargetNode = (STargetNode*)nodesListGetNode(pNodeList, i);
    } else {
      pTargetNode = (STargetNode*)nodesListGetNode(pGroupKeys, i - numOfFuncs);
    }

    SExprInfo* pExp = &pExprs[i];
    createExprFromTargetNode(pExp, pTargetNode);
  }

  return pExprs;
}

// set the output buffer for the selectivity + tag query
//
// Contexts whose function name is "_select_value" or "_group_key" are gathered into one
// pointer array. The array and its length are attached to the subsidiaries of the last
// context for which fmIsSelectFunc is true. If there is no such context, the array is freed.
// Returns TSDB_CODE_OUT_OF_MEMORY when the pointer array cannot be allocated, otherwise
// TSDB_CODE_SUCCESS.
static int32_t setSelectValueColumnInfo(SqlFunctionCtx* pCtx, int32_t numOfOutput) {
  SqlFunctionCtx** pValCtx = taosMemoryCalloc(numOfOutput, POINTER_BYTES);
  if (NULL == pValCtx) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t         numOfVals = 0;
  SqlFunctionCtx* pSelectCtx = NULL;

  for (int32_t k = 0; k < numOfOutput; ++k) {
    SqlFunctionCtx* pCur = &pCtx[k];
    const char*     pName = pCur->pExpr->pExpr->_function.functionName;

    bool isValueCol = (strcmp(pName, "_select_value") == 0) || (strcmp(pName, "_group_key") == 0);
    if (isValueCol) {
      pValCtx[numOfVals++] = pCur;
      continue;
    }

    if (fmIsSelectFunc(pCur->functionId)) {
      pSelectCtx = pCur;
    }
  }

  if (NULL == pSelectCtx) {
    taosMemoryFreeClear(pValCtx);
    return TSDB_CODE_SUCCESS;
  }

  pSelectCtx->subsidiaries.pCtx = pValCtx;
  pSelectCtx->subsidiaries.num = numOfVals;
  return TSDB_CODE_SUCCESS;
}

1478
// Create one SqlFunctionCtx per expression in pExprInfo (numOfOutput entries), plus the
// array of row entry offsets returned through *rowEntryInfoOffset. Entry i of the offset
// array is the sum, over the preceding contexts, of sizeof(SResultRowEntryInfo) and the
// context's intermediate buffer size.
//
// pCtx->param refers to the parameter array of the expression; it is not copied.
//
// Returns the context array, or NULL on allocation failure. On failure everything
// allocated here is released and *rowEntryInfoOffset is NULL.
SqlFunctionCtx* createSqlFunctionCtx(SExprInfo* pExprInfo, int32_t numOfOutput, int32_t** rowEntryInfoOffset) {
  SqlFunctionCtx* pFuncCtx = (SqlFunctionCtx*)taosMemoryCalloc(numOfOutput, sizeof(SqlFunctionCtx));
  if (pFuncCtx == NULL) {
    return NULL;
  }

  *rowEntryInfoOffset = taosMemoryCalloc(numOfOutput, sizeof(int32_t));
  if (*rowEntryInfoOffset == NULL) {
    taosMemoryFreeClear(pFuncCtx);
    return NULL;
  }

  for (int32_t i = 0; i < numOfOutput; ++i) {
    SExprInfo* pExpr = &pExprInfo[i];

    SExprBasicInfo* pFunct = &pExpr->base;
    SqlFunctionCtx* pCtx = &pFuncCtx[i];

    pCtx->functionId = -1;
    pCtx->pExpr = pExpr;

    if (pExpr->pExpr->nodeType == QUERY_NODE_FUNCTION) {
      SFuncExecEnv env = {0};
      pCtx->functionId = pExpr->pExpr->_function.pFunctNode->funcId;
      pCtx->isPseudoFunc = fmIsWindowPseudoColumnFunc(pCtx->functionId);
      pCtx->isNotNullFunc = fmIsNotNullOutputFunc(pCtx->functionId);

      if (fmIsAggFunc(pCtx->functionId) || fmIsIndefiniteRowsFunc(pCtx->functionId)) {
        bool isUdaf = fmIsUserDefinedFunc(pCtx->functionId);
        if (!isUdaf) {
          fmGetFuncExecFuncs(pCtx->functionId, &pCtx->fpSet);
        } else {
          char* udfName = pExpr->pExpr->_function.pFunctNode->functionName;
          pCtx->udfName = strdup(udfName);
          fmGetUdafExecFuncs(pCtx->functionId, &pCtx->fpSet);
        }
        pCtx->fpSet.getEnv(pExpr->pExpr->_function.pFunctNode, &env);
      } else {
        fmGetScalarFuncExecFuncs(pCtx->functionId, &pCtx->sfp);
        if (pCtx->sfp.getEnv != NULL) {
          pCtx->sfp.getEnv(pExpr->pExpr->_function.pFunctNode, &env);
        }
      }
      pCtx->resDataInfo.interBufSize = env.calcMemSize;
    } else if (pExpr->pExpr->nodeType == QUERY_NODE_COLUMN || pExpr->pExpr->nodeType == QUERY_NODE_OPERATOR ||
               pExpr->pExpr->nodeType == QUERY_NODE_VALUE) {
      // for simple column, the result buffer needs to hold at least one element.
      pCtx->resDataInfo.interBufSize = pFunct->resSchema.bytes;
    }

    pCtx->input.numOfInputCols = pFunct->numOfParams;
    pCtx->input.pData = taosMemoryCalloc(pFunct->numOfParams, POINTER_BYTES);
    pCtx->input.pColumnDataAgg = taosMemoryCalloc(pFunct->numOfParams, POINTER_BYTES);

    // A zero-sized allocation may legitimately return NULL, so NULL is only treated as a
    // failure when at least one parameter slot was requested.
    if (pFunct->numOfParams > 0 && (pCtx->input.pData == NULL || pCtx->input.pColumnDataAgg == NULL)) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }

    pCtx->pTsOutput = NULL;
    pCtx->resDataInfo.bytes = pFunct->resSchema.bytes;
    pCtx->resDataInfo.type = pFunct->resSchema.type;
    pCtx->order = TSDB_ORDER_ASC;
    pCtx->start.key = INT64_MIN;
    pCtx->end.key = INT64_MIN;
    pCtx->numOfParams = pExpr->base.numOfParams;
    pCtx->param = pFunct->pParam;
    pCtx->saveHandle.currentPage = -1;
  }

  for (int32_t i = 1; i < numOfOutput; ++i) {
    (*rowEntryInfoOffset)[i] = (int32_t)((*rowEntryInfoOffset)[i - 1] + sizeof(SResultRowEntryInfo) +
                                         pFuncCtx[i - 1].resDataInfo.interBufSize);
  }

  // without the subsidiary list a select function would silently lose its value columns,
  // so a failure here fails the whole creation
  int32_t code = setSelectValueColumnInfo(pFuncCtx, numOfOutput);
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    goto _error;
  }

  return pFuncCtx;

_error:
  // the context array was zero-allocated, so untouched entries hold NULL pointers
  for (int32_t i = 0; i < numOfOutput; ++i) {
    taosMemoryFree(pFuncCtx[i].input.pData);
    taosMemoryFree(pFuncCtx[i].input.pColumnDataAgg);
    taosMemoryFree(pFuncCtx[i].udfName);
  }

  taosMemoryFree(pFuncCtx);
  taosMemoryFree(*rowEntryInfoOffset);
  *rowEntryInfoOffset = NULL;
  return NULL;
}
1551 1552

// NOTE: sources columns are more than the destination SSDatablock columns.
1553 1554
// doFilter in table scan needs every column even its output is false
void relocateColumnData(SSDataBlock* pBlock, const SArray* pColMatchInfo, SArray* pCols, bool outputEveryColumn) {
1555 1556 1557 1558 1559
  size_t numOfSrcCols = taosArrayGetSize(pCols);

  int32_t i = 0, j = 0;
  while (i < numOfSrcCols && j < taosArrayGetSize(pColMatchInfo)) {
    SColumnInfoData* p = taosArrayGet(pCols, i);
H
Haojun Liao 已提交
1560
    SColMatchItem*   pmInfo = taosArrayGet(pColMatchInfo, j);
1561 1562

    if (p->info.colId == pmInfo->colId) {
H
Haojun Liao 已提交
1563
      SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, pmInfo->dstSlotId);
1564
      colDataAssign(pDst, p, pBlock->info.rows, &pBlock->info);
1565 1566 1567 1568 1569
      i++;
      j++;
    } else if (p->info.colId < pmInfo->colId) {
      i++;
    } else {
1570
      ASSERT(0);
1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588
    }
  }
}

// Build an SInterval from the interval/sliding settings stored in a table scan physical plan node.
// Fields of SInterval that are not listed below stay zero-initialized.
SInterval extractIntervalInfo(const STableScanPhysiNode* pTableScanNode) {
  SInterval info = {0};

  info.interval = pTableScanNode->interval;
  info.sliding = pTableScanNode->sliding;
  info.intervalUnit = pTableScanNode->intervalUnit;
  info.slidingUnit = pTableScanNode->slidingUnit;
  info.offset = pTableScanNode->offset;

  return info;
}

// Copy the slot id, column id and result data type description of a column node into an SColumn value.
// Any SColumn field that is not listed below is left zeroed.
SColumn extractColumnFromColumnNode(SColumnNode* pColNode) {
  SColumn col = {
      .slotId = pColNode->slotId,
      .colId = pColNode->colId,
      .type = pColNode->node.resType.type,
      .bytes = pColNode->node.resType.bytes,
      .scale = pColNode->node.resType.scale,
      .precision = pColNode->node.resType.precision,
  };

  return col;
}

// Fill a query condition object from a table scan physical plan node.
//
// Allocates pCond->colList and pCond->pSlotList sized for every scan column, then stores only the
// non-tag columns in them; pCond->numOfCols ends up as the number of columns actually stored.
// Returns TSDB_CODE_SUCCESS, or terrno (set to TSDB_CODE_OUT_OF_MEMORY) when either allocation fails,
// in which case both buffers are released. The buffers are released by cleanupQueryTableDataCond().
int32_t initQueryTableDataCond(SQueryTableDataCond* pCond, const STableScanPhysiNode* pTableScanNode) {
  pCond->order = (pTableScanNode->scanSeq[0] > 0) ? TSDB_ORDER_ASC : TSDB_ORDER_DESC;
  pCond->numOfCols = LIST_LENGTH(pTableScanNode->scan.pScanCols);

  pCond->colList = taosMemoryCalloc(pCond->numOfCols, sizeof(SColumnInfo));
  pCond->pSlotList = taosMemoryMalloc(sizeof(int32_t) * pCond->numOfCols);
  if (pCond->colList == NULL || pCond->pSlotList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFreeClear(pCond->colList);
    taosMemoryFreeClear(pCond->pSlotList);
    return terrno;
  }

  // TODO: get it from stable scan node
  pCond->twindows = pTableScanNode->scanRange;
  pCond->suid = pTableScanNode->scan.suid;
  pCond->type = TIMEWINDOW_RANGE_CONTAINED;
  pCond->startVersion = -1;
  pCond->endVersion = -1;

  // tag columns are skipped, so the output cursor may lag behind the scan column cursor
  int32_t numOfDataCols = 0;
  for (int32_t i = 0; i < pCond->numOfCols; ++i) {
    STargetNode* pTarget = (STargetNode*)nodesListGetNode(pTableScanNode->scan.pScanCols, i);
    SColumnNode* pColumn = (SColumnNode*)pTarget->pExpr;

    if (pColumn->colType != COLUMN_TYPE_TAG) {
      pCond->colList[numOfDataCols].colId = pColumn->colId;
      pCond->colList[numOfDataCols].type = pColumn->node.resType.type;
      pCond->colList[numOfDataCols].bytes = pColumn->node.resType.bytes;

      pCond->pSlotList[numOfDataCols] = pTarget->slotId;
      numOfDataCols += 1;
    }
  }

  pCond->numOfCols = numOfDataCols;
  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
1639 1640 1641 1642
// Release the column and slot arrays owned by a query condition object.
void cleanupQueryTableDataCond(SQueryTableDataCond* pCond) {
  taosMemoryFreeClear(pCond->pSlotList);
  taosMemoryFreeClear(pCond->colList);
}
1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655

int32_t convertFillType(int32_t mode) {
  int32_t type = TSDB_FILL_NONE;
  switch (mode) {
    case FILL_MODE_PREV:
      type = TSDB_FILL_PREV;
      break;
    case FILL_MODE_NONE:
      type = TSDB_FILL_NONE;
      break;
    case FILL_MODE_NULL:
      type = TSDB_FILL_NULL;
      break;
D
dapan1121 已提交
1656 1657 1658
    case FILL_MODE_NULL_F:
      type = TSDB_FILL_NULL_F;
      break;
1659 1660 1661 1662 1663 1664
    case FILL_MODE_NEXT:
      type = TSDB_FILL_NEXT;
      break;
    case FILL_MODE_VALUE:
      type = TSDB_FILL_SET_VALUE;
      break;
D
dapan1121 已提交
1665 1666 1667
    case FILL_MODE_VALUE_F:
      type = TSDB_FILL_SET_VALUE_F;
      break;
1668 1669 1670 1671 1672 1673 1674 1675 1676
    case FILL_MODE_LINEAR:
      type = TSDB_FILL_LINEAR;
      break;
    default:
      type = TSDB_FILL_NONE;
  }

  return type;
}
H
Haojun Liao 已提交
1677 1678 1679

// Compute the first time window for timestamp ts and store it in *w.
//
// Both scan directions start from the aligned window returned by getAlignQueryTimeWindow().
// For a descending scan the window start is then moved forward, one sliding step at a time,
// for as long as the next start is still strictly before ts. Only w->skey is adjusted here.
static void getInitialStartTimeWindow(SInterval* pInterval, TSKEY ts, STimeWindow* w, bool ascQuery) {
  *w = getAlignQueryTimeWindow(pInterval, pInterval->precision, ts);
  if (ascQuery) {
    return;
  }

  // moving towards the end: keep the last start position that is still before ts
  int64_t next = w->skey;
  while (next < ts) {
    next = taosTimeAdd(next, pInterval->sliding, pInterval->slidingUnit, pInterval->precision);
    if (next < ts) {
      w->skey = next;
    }
  }
}

// Compute the window that starts at ts truncated by taosTimeTruncate() and ends one unit before
// start + interval (the end key is inclusive).
static STimeWindow doCalculateTimeWindow(int64_t ts, SInterval* pInterval) {
  STimeWindow win = {0};

  win.skey = taosTimeTruncate(ts, pInterval, pInterval->precision);

  int64_t nextStart = taosTimeAdd(win.skey, pInterval->interval, pInterval->intervalUnit, pInterval->precision);
  win.ekey = nextStart - 1;

  return win;
}

1705
// Starting from *pWindow, shift the window by one sliding step at a time while it still covers ts,
// and return the last window that covered ts. An ascending scan shifts backwards in time (factor -1),
// any other order shifts forwards. If *pWindow does not cover ts it is returned unchanged.
STimeWindow getFirstQualifiedTimeWindow(int64_t ts, STimeWindow* pWindow, SInterval* pInterval, int32_t order) {
  int32_t direction = (order == TSDB_ORDER_ASC) ? -1 : 1;

  STimeWindow candidate = *pWindow;
  STimeWindow lastCovering = candidate;

  for (; candidate.skey <= ts && candidate.ekey >= ts;) {
    lastCovering = candidate;

    candidate.skey =
        taosTimeAdd(candidate.skey, direction * pInterval->sliding, pInterval->slidingUnit, pInterval->precision);
    candidate.ekey =
        taosTimeAdd(candidate.ekey, direction * pInterval->sliding, pInterval->slidingUnit, pInterval->precision);
  }

  return lastCovering;
}

// get the correct time window according to the handled timestamp
1720
// todo refactor
H
Haojun Liao 已提交
1721 1722 1723 1724 1725 1726 1727 1728 1729
STimeWindow getActiveTimeWindow(SDiskbasedBuf* pBuf, SResultRowInfo* pResultRowInfo, int64_t ts, SInterval* pInterval,
                                int32_t order) {
  STimeWindow w = {0};
  if (pResultRowInfo->cur.pageId == -1) {  // the first window, from the previous stored value
    getInitialStartTimeWindow(pInterval, ts, &w, (order == TSDB_ORDER_ASC));
    w.ekey = taosTimeAdd(w.skey, pInterval->interval, pInterval->intervalUnit, pInterval->precision) - 1;
    return w;
  }

1730 1731 1732 1733
  SResultRow* pRow = getResultRowByPos(pBuf, &pResultRowInfo->cur, false);
  if (pRow) {
    w = pRow->win;
  }
H
Haojun Liao 已提交
1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745
  // in case of typical time window, we can calculate time window directly.
  if (w.skey > ts || w.ekey < ts) {
    w = doCalculateTimeWindow(ts, pInterval);
  }

  if (pInterval->interval != pInterval->sliding) {
    // it is an sliding window query, in which sliding value is not equalled to
    // interval value, and we need to find the first qualified time window.
    w = getFirstQualifiedTimeWindow(ts, &w, pInterval, order);
  }

  return w;
1746 1747 1748 1749 1750 1751 1752
}

// True when any of limit, offset, slimit or soffset differs from -1.
bool hasLimitOffsetInfo(SLimitInfo* pLimitInfo) {
  bool noLimit = (pLimitInfo->limit.limit == -1) && (pLimitInfo->limit.offset == -1);
  bool noSlimit = (pLimitInfo->slimit.limit == -1) && (pLimitInfo->slimit.offset == -1);

  return !(noLimit && noSlimit);
}

1753 1754 1755 1756
// True when the slimit value or the soffset value differs from -1.
bool hasSlimitOffsetInfo(SLimitInfo* pLimitInfo) {
  if (pLimitInfo->slimit.limit != -1) {
    return true;
  }

  return pLimitInfo->slimit.offset != -1;
}

1757 1758 1759 1760 1761
// Initialize the limit/slimit settings of pLimitInfo from the LIMIT and SLIMIT plan nodes, and reset
// the remaining row offset and the remaining group offset to the configured offsets.
void initLimitInfo(const SNode* pLimit, const SNode* pSLimit, SLimitInfo* pLimitInfo) {
  pLimitInfo->limit = (SLimit){.limit = getLimit(pLimit), .offset = getOffset(pLimit)};
  pLimitInfo->slimit = (SLimit){.limit = getLimit(pSLimit), .offset = getOffset(pSLimit)};

  pLimitInfo->remainOffset = pLimitInfo->limit.offset;
  pLimitInfo->remainGroupOffset = pLimitInfo->slimit.offset;
}
H
Haojun Liao 已提交
1766

1767 1768 1769 1770 1771
// Prepare the limit bookkeeping for the next group: restore the remaining row offset to the
// configured offset and clear the count of rows already produced.
void resetLimitInfoForNextGroup(SLimitInfo* pLimitInfo) {
  pLimitInfo->remainOffset = pLimitInfo->limit.offset;
  pLimitInfo->numOfOutputRows = 0;
}

H
Haojun Liao 已提交
1772
uint64_t tableListGetSize(const STableListInfo* pTableList) {
1773
  ASSERT(taosArrayGetSize(pTableList->pTableList) == taosHashGetSize(pTableList->map));
H
Haojun Liao 已提交
1774 1775 1776
  return taosArrayGetSize(pTableList->pTableList);
}

dengyihao's avatar
dengyihao 已提交
1777
// Return the suid stored in the table list.
uint64_t tableListGetSuid(const STableListInfo* pTableList) {
  uint64_t suid = pTableList->suid;
  return suid;
}
H
Haojun Liao 已提交
1778 1779 1780 1781 1782 1783 1784 1785 1786

// Return the table entry stored at position index, or NULL when the list is empty or index lies
// outside [0, number of tables).
STableKeyInfo* tableListGetInfo(const STableListInfo* pTableList, int32_t index) {
  size_t numOfTables = taosArrayGetSize(pTableList->pTableList);

  // rejects the empty list as well as negative and too-large positions
  if (index < 0 || (size_t)index >= numOfTables) {
    return NULL;
  }

  return taosArrayGet(pTableList->pTableList, index);
}

H
Haojun Liao 已提交
1787 1788
uint64_t getTableGroupId(const STableListInfo* pTableList, uint64_t tableUid) {
  int32_t* slot = taosHashGet(pTableList->map, &tableUid, sizeof(tableUid));
1789
  ASSERT(pTableList->map != NULL && slot != NULL);
H
Haojun Liao 已提交
1790 1791

  STableKeyInfo* pKeyInfo = taosArrayGet(pTableList->pTableList, *slot);
1792
  ASSERT(pKeyInfo->uid == tableUid);
H
Haojun Liao 已提交
1793 1794 1795 1796

  return pKeyInfo->groupId;
}

H
Haojun Liao 已提交
1797
// TODO handle the group offset info, fix it, the rule of group output will be broken by this function
H
Haojun Liao 已提交
1798
int32_t tableListAddTableInfo(STableListInfo* pTableList, uint64_t uid, uint64_t gid) {
H
Haojun Liao 已提交
1799
  if (pTableList->map == NULL) {
1800
    ASSERT(taosArrayGetSize(pTableList->pTableList) == 0);
1801
    pTableList->map = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_ENTRY_LOCK);
H
Haojun Liao 已提交
1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813
  }

  STableKeyInfo keyInfo = {.uid = uid, .groupId = gid};
  taosArrayPush(pTableList->pTableList, &keyInfo);

  int32_t slot = (int32_t)taosArrayGetSize(pTableList->pTableList) - 1;
  taosHashPut(pTableList->map, &uid, sizeof(uid), &slot, sizeof(slot));

  qDebug("uid:%" PRIu64 ", groupId:%" PRIu64 " added into table list, slot:%d, total:%d", uid, gid, slot, slot + 1);
  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
1814
// Return the tables that belong to the output group with the given ordinal index.
//
// On success *pKeyInfo points at the first table entry of the group inside the table list and
// *size holds the number of entries in the group. Returns TSDB_CODE_INVALID_PARA when
// ordinalGroupIndex is outside [0, number of output groups).
int32_t tableListGetGroupList(const STableListInfo* pTableList, int32_t ordinalGroupIndex, STableKeyInfo** pKeyInfo,
                              int32_t* size) {
  int32_t numOfGroups = tableListGetOutputGroups(pTableList);
  int32_t numOfTables = tableListGetSize(pTableList);

  if (ordinalGroupIndex < 0 || ordinalGroupIndex >= numOfGroups) {
    return TSDB_CODE_INVALID_PARA;
  }

  // special case 1: only one group exists, it covers the whole list
  if (numOfGroups == 1) {
    *size = numOfTables;
    if (numOfTables == 0) {
      *pKeyInfo = NULL;
    } else {
      *pKeyInfo = taosArrayGet(pTableList->pTableList, 0);
    }
    return TSDB_CODE_SUCCESS;
  }

  // special case 2: one table exists for each group, the group index is the table position
  if (numOfGroups == numOfTables) {
    *size = 1;
    *pKeyInfo = taosArrayGet(pTableList->pTableList, ordinalGroupIndex);
    return TSDB_CODE_SUCCESS;
  }

  // general case: a group spans from its own offset up to the next group's offset,
  // and the last group runs to the end of the list
  int32_t begin = pTableList->groupOffset[ordinalGroupIndex];
  int32_t end = (ordinalGroupIndex < numOfGroups - 1) ? pTableList->groupOffset[ordinalGroupIndex + 1] : numOfTables;

  *size = end - begin;
  *pKeyInfo = taosArrayGet(pTableList->pTableList, begin);
  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
1846
// Return the number of output groups recorded in the table list.
int32_t tableListGetOutputGroups(const STableListInfo* pTableList) {
  int32_t numOfGroups = pTableList->numOfOuputGroups;
  return numOfGroups;
}
H
Haojun Liao 已提交
1847 1848 1849

// Return the oneTableForEachGroup flag recorded in the table list.
bool oneTableForEachGroup(const STableListInfo* pTableList) {
  bool flag = pTableList->oneTableForEachGroup;
  return flag;
}

H
Haojun Liao 已提交
1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861
STableListInfo* tableListCreate() {
  STableListInfo* pListInfo = taosMemoryCalloc(1, sizeof(STableListInfo));
  if (pListInfo == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pListInfo->pTableList = taosArrayInit(4, sizeof(STableKeyInfo));
  if (pListInfo->pTableList == NULL) {
    goto _error;
  }

1862
  pListInfo->map = taosHashInit(1024, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_ENTRY_LOCK);
H
Haojun Liao 已提交
1863 1864 1865 1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876
  if (pListInfo->map == NULL) {
    goto _error;
  }

  pListInfo->numOfOuputGroups = 1;
  return pListInfo;

_error:
  tableListDestroy(pListInfo);
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}

// Release a table list together with its table array, group offsets and uid map.
// Accepts NULL. Always returns NULL.
void* tableListDestroy(STableListInfo* pTableListInfo) {
  if (pTableListInfo != NULL) {
    taosArrayDestroy(pTableListInfo->pTableList);
    taosMemoryFreeClear(pTableListInfo->groupOffset);
    taosHashCleanup(pTableListInfo->map);

    taosMemoryFree(pTableListInfo);
  }

  return NULL;
}

// Empty a table list so that it can be reused: the table array and the uid map are cleared, the group
// offsets are released, and the grouping state goes back to a single output group.
// Accepts NULL.
void tableListClear(STableListInfo* pTableListInfo) {
  if (pTableListInfo == NULL) {
    return;
  }

  taosArrayClear(pTableListInfo->pTableList);
  taosHashClear(pTableListInfo->map);

  // The list object stays alive after this call, so the pointer must be reset together with the
  // free; otherwise a later tableListDestroy()/tableListClear() would free the same buffer again.
  taosMemoryFreeClear(pTableListInfo->groupOffset);

  pTableListInfo->numOfOuputGroups = 1;
  pTableListInfo->oneTableForEachGroup = false;
}

static int32_t orderbyGroupIdComparFn(const void* p1, const void* p2) {
dengyihao's avatar
dengyihao 已提交
1905 1906
  STableKeyInfo* pInfo1 = (STableKeyInfo*)p1;
  STableKeyInfo* pInfo2 = (STableKeyInfo*)p2;
H
Haojun Liao 已提交
1907 1908 1909 1910

  if (pInfo1->groupId == pInfo2->groupId) {
    return 0;
  } else {
dengyihao's avatar
dengyihao 已提交
1911
    return pInfo1->groupId < pInfo2->groupId ? -1 : 1;
H
Haojun Liao 已提交
1912 1913 1914 1915 1916 1917 1918 1919 1920 1921
  }
}

// Sort the table list by group id and record, for every group, the position of its first table.
//
// On success pTableListInfo->groupOffset holds one start offset per group and
// pTableListInfo->numOfOuputGroups holds the number of groups. An empty table list is left untouched.
// Returns TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when a temporary or the offset buffer cannot
// be allocated; in that case the group count and offsets are not modified.
static int32_t sortTableGroup(STableListInfo* pTableListInfo) {
  taosArraySort(pTableListInfo->pTableList, orderbyGroupIdComparFn);

  int32_t size = taosArrayGetSize(pTableListInfo->pTableList);
  if (size == 0) {
    // no table, hence no group boundary to record
    return TSDB_CODE_SUCCESS;
  }

  SArray* pList = taosArrayInit(4, sizeof(int32_t));
  if (pList == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  STableKeyInfo* pInfo = taosArrayGet(pTableListInfo->pTableList, 0);
  uint64_t       gid = pInfo->groupId;

  // the first group always starts at position 0
  int32_t start = 0;
  if (taosArrayPush(pList, &start) == NULL) {
    taosArrayDestroy(pList);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // every change of group id in the sorted list marks the start of a new group
  for (int32_t i = 1; i < size; ++i) {
    pInfo = taosArrayGet(pTableListInfo->pTableList, i);
    if (pInfo->groupId != gid) {
      if (taosArrayPush(pList, &i) == NULL) {
        taosArrayDestroy(pList);
        return TSDB_CODE_OUT_OF_MEMORY;
      }
      gid = pInfo->groupId;
    }
  }

  int32_t  numOfGroups = taosArrayGetSize(pList);
  int32_t* pOffsets = taosMemoryMalloc(sizeof(int32_t) * numOfGroups);
  if (pOffsets == NULL) {
    taosArrayDestroy(pList);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  memcpy(pOffsets, taosArrayGet(pList, 0), sizeof(int32_t) * numOfGroups);
  taosArrayDestroy(pList);

  // publish the result only after every allocation has succeeded
  pTableListInfo->numOfOuputGroups = numOfGroups;
  pTableListInfo->groupOffset = pOffsets;
  return TSDB_CODE_SUCCESS;
}

dengyihao's avatar
dengyihao 已提交
1947 1948
// Assign a group id to every table in the list and (re)build the uid -> list position map.
//
//   - no group expression, or grouping by table name: the group id is the table uid (by table name)
//     or 0 (no grouping); with groupSort and grouping by table name the list is sorted by group id
//     and every table forms its own output group, otherwise there is one output group;
//   - any other group expression: group ids come from getColInfoResultForGroupby(), and with
//     groupSort the list is sorted and split into groups by sortTableGroup().
// Returns the first failure code of the helpers, otherwise TSDB_CODE_SUCCESS.
int32_t buildGroupIdMapForAllTables(STableListInfo* pTableListInfo, SReadHandle* pHandle, SNodeList* group,
                                    bool groupSort) {
  int32_t code = TSDB_CODE_SUCCESS;
  ASSERT(pTableListInfo->map != NULL);

  bool   byTbname = groupbyTbname(group);
  size_t numOfTables = taosArrayGetSize(pTableListInfo->pTableList);

  if (group != NULL && !byTbname) {
    code = getColInfoResultForGroupby(pHandle->meta, group, pTableListInfo);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }

    if (groupSort) {
      code = sortTableGroup(pTableListInfo);
    }
  } else {
    for (int32_t i = 0; i < numOfTables; i++) {
      STableKeyInfo* pEntry = taosArrayGet(pTableListInfo->pTableList, i);
      if (byTbname) {
        pEntry->groupId = pEntry->uid;
      } else {
        pEntry->groupId = 0;
      }
    }

    pTableListInfo->oneTableForEachGroup = byTbname;

    if (groupSort && byTbname) {
      taosArraySort(pTableListInfo->pTableList, orderbyGroupIdComparFn);
      pTableListInfo->numOfOuputGroups = numOfTables;
    } else {
      pTableListInfo->numOfOuputGroups = 1;
    }
  }

  // add all table entry in the hash map; the stored value is the position in the (possibly sorted) list
  size_t numOfEntries = taosArrayGetSize(pTableListInfo->pTableList);
  for (int32_t i = 0; i < numOfEntries; ++i) {
    STableKeyInfo* pEntry = taosArrayGet(pTableListInfo->pTableList, i);
    taosHashPut(pTableListInfo->map, &pEntry->uid, sizeof(uint64_t), &i, sizeof(int32_t));
  }

  return code;
}

int32_t createScanTableListInfo(SScanPhysiNode* pScanNode, SNodeList* pGroupTags, bool groupSort, SReadHandle* pHandle,
                                STableListInfo* pTableListInfo, SNode* pTagCond, SNode* pTagIndexCond,
H
Haojun Liao 已提交
1991
                                SExecTaskInfo* pTaskInfo) {
dengyihao's avatar
dengyihao 已提交
1992
  int64_t     st = taosGetTimestampUs();
H
Haojun Liao 已提交
1993
  const char* idStr = GET_TASKID(pTaskInfo);
H
Haojun Liao 已提交
1994 1995 1996 1997 1998 1999

  if (pHandle == NULL) {
    qError("invalid handle, in creating operator tree, %s", idStr);
    return TSDB_CODE_INVALID_PARA;
  }

2000
  int32_t code = getTableList(pHandle->meta, pHandle->vnode, pScanNode, pTagCond, pTagIndexCond, pTableListInfo, idStr);
H
Haojun Liao 已提交
2001 2002 2003 2004 2005
  if (code != TSDB_CODE_SUCCESS) {
    qError("failed to getTableList, code: %s", tstrerror(code));
    return code;
  }

H
Haojun Liao 已提交
2006
  int32_t numOfTables = taosArrayGetSize(pTableListInfo->pTableList);
2007
  ASSERT(pTableListInfo->numOfOuputGroups == 1);
H
Haojun Liao 已提交
2008 2009

  int64_t st1 = taosGetTimestampUs();
H
Haojun Liao 已提交
2010
  pTaskInfo->cost.extractListTime = (st1 - st) / 1000.0;
H
Haojun Liao 已提交
2011 2012
  qDebug("extract queried table list completed, %d tables, elapsed time:%.2f ms %s", numOfTables,
         pTaskInfo->cost.extractListTime, idStr);
H
Haojun Liao 已提交
2013

H
Haojun Liao 已提交
2014
  if (numOfTables == 0) {
H
Haojun Liao 已提交
2015 2016 2017 2018
    qDebug("no table qualified for query, %s" PRIx64, idStr);
    return TSDB_CODE_SUCCESS;
  }

2019
  code = buildGroupIdMapForAllTables(pTableListInfo, pHandle, pGroupTags, groupSort);
H
Haojun Liao 已提交
2020 2021 2022 2023
  if (code != TSDB_CODE_SUCCESS) {
    return code;
  }

dengyihao's avatar
dengyihao 已提交
2024
  pTaskInfo->cost.groupIdMapTime = (taosGetTimestampUs() - st1) / 1000.0;
H
Haojun Liao 已提交
2025
  qDebug("generate group id map completed, elapsed time:%.2f ms %s", pTaskInfo->cost.groupIdMapTime, idStr);
H
Haojun Liao 已提交
2026 2027

  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
2028
}
H
Haojun Liao 已提交
2029 2030 2031 2032 2033 2034 2035 2036 2037

// Write the content of a data block to the debug log, tagged with flag.
// A NULL block or a block without rows only produces a short notice.
void printDataBlock(SSDataBlock* pBlock, const char* flag) {
  if (pBlock == NULL || pBlock->info.rows == 0) {
    qDebug("===stream===printDataBlock: Block is Null or Empty");
    return;
  }

  // presumably dumpBlockData() hands the text buffer back through pDump, since it is freed right after
  char* pDump = NULL;
  qDebug("%s", dumpBlockData(pBlock, flag, &pDump));
  taosMemoryFree(pDump);
}