groupoperator.c 47.6 KB
Newer Older
H
Haojun Liao 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

16
#include "filter.h"
H
Haojun Liao 已提交
17
#include "function.h"
18
#include "os.h"
H
Haojun Liao 已提交
19 20 21 22 23
#include "tname.h"

#include "tdatablock.h"
#include "tmsg.h"

24
#include "executorInt.h"
25 26
#include "operator.h"
#include "querytask.h"
H
Haojun Liao 已提交
27 28 29 30
#include "tcompare.h"
#include "thash.h"
#include "ttypes.h"

H
Haojun Liao 已提交
31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60
// Runtime state of the group-by aggregate operator. An instance is allocated in
// createGroupOperatorInfo() and released by destroyGroupOperatorInfo().
typedef struct SGroupbyOperatorInfo {
  SOptrBasicInfo binfo;          // basic operator info; holds the result block (pRes) and the result row info
  SAggSupporter  aggSup;         // aggregation support; holds the result buffer and the result row hash table
  SArray*        pGroupCols;     // group by columns, SArray<SColumn>
  SArray*        pGroupColVals;  // current group column values, SArray<SGroupKeys>
  bool           isInit;         // false until the keys of the first input row have been recorded
  char*          keyBuf;         // scratch buffer of groupKeyLen bytes in which the hash key is serialized
  int32_t        groupKeyLen;    // sum of the group column widths plus one null-flag byte per column
  SGroupResInfo  groupResInfo;   // state used while the grouped results are turned into output blocks
  SExprSupp      scalarSup;      // scalar expressions applied to every input block before grouping
} SGroupbyOperatorInfo;

// Runtime state of the partition operator. Input rows are copied into buffer pages, one page list
// per distinct group key, and later returned page by page in group order.
// The sort in partition may be needed later.
typedef struct SPartitionOperatorInfo {
  SOptrBasicInfo binfo;          // basic operator info; holds the result block (pRes)
  SArray*        pGroupCols;     // columns that make up the partition key
  SArray*        pGroupColVals;  // current group column values, SArray<SGroupKeys>
  char*          keyBuf;         // scratch buffer in which the group key of the current row is serialized
  int32_t        groupKeyLen;    // total group by column width
  SHashObj*      pGroupSet;      // serialized group key -> SDataGroupInfo of that group

  SDiskbasedBuf* pBuf;              // paged buffer that stores the partitioned rows
  int32_t        rowCapacity;       // maximum number of rows for each buffer page
  int32_t*       columnOffset;      // start position of each column's data inside a page
  SArray*        sortedGroupArray;  // SDataGroupInfo sorted by group id
  int32_t        groupIndex;        // index in sortedGroupArray of the group being returned, -1 before the first one
  int32_t        pageIndex;         // index in the current group's page list of the next page to return
  SExprSupp      scalarSup;         // scalar expressions applied to every input block before partitioning
} SPartitionOperatorInfo;

61
static void*    getCurrentDataGroupInfo(const SPartitionOperatorInfo* pInfo, SDataGroupInfo** pGroupInfo, int32_t len);
H
Haojun Liao 已提交
62
static int32_t* setupColumnOffset(const SSDataBlock* pBlock, int32_t rowCapacity);
63 64
static int32_t  setGroupResultOutputBuf(SOperatorInfo* pOperator, SOptrBasicInfo* binfo, int32_t numOfCols, char* pData,
                                        int16_t bytes, uint64_t groupId, SDiskbasedBuf* pBuf, SAggSupporter* pAggSup);
H
Haojun Liao 已提交
65
static SArray*  extractColumnInfo(SNodeList* pNodeList);
H
Haojun Liao 已提交
66

H
Haojun Liao 已提交
67
static void freeGroupKey(void* param) {
68
  SGroupKeys* pKey = (SGroupKeys*)param;
H
Haojun Liao 已提交
69 70 71
  taosMemoryFree(pKey->pData);
}

72
static void destroyGroupOperatorInfo(void* param) {
H
Haojun Liao 已提交
73
  SGroupbyOperatorInfo* pInfo = (SGroupbyOperatorInfo*)param;
74 75 76 77
  if (pInfo == NULL) {
    return;
  }

78
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
79 80
  taosMemoryFreeClear(pInfo->keyBuf);
  taosArrayDestroy(pInfo->pGroupCols);
H
Haojun Liao 已提交
81
  taosArrayDestroyEx(pInfo->pGroupColVals, freeGroupKey);
82
  cleanupExprSupp(&pInfo->scalarSup);
H
Haojun Liao 已提交
83 84 85

  cleanupGroupResInfo(&pInfo->groupResInfo);
  cleanupAggSup(&pInfo->aggSup);
D
dapan1121 已提交
86
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
87 88
}

wmmhello's avatar
wmmhello 已提交
89
// Prepares the per-group key storage of a group-by operator.
//
// pGroupColVals: out, receives a new SArray<SGroupKeys> with one entry per group column; every entry
//                owns a zeroed value buffer of the column width.
// keyLen:        in/out, the widths of all group columns plus one null-flag byte per column are ADDED
//                to *keyLen, so the caller has to pass in a zero-initialized value.
// keyBuf:        out, receives a zeroed buffer of *keyLen bytes used to serialize the hash key.
// pGroupColList: the group columns, SArray<SColumn>.
//
// Returns TSDB_CODE_SUCCESS or TSDB_CODE_OUT_OF_MEMORY. On failure the partially built *pGroupColVals
// is left in place; the caller is expected to release it (createGroupOperatorInfo does so through
// destroyGroupOperatorInfo).
static int32_t initGroupOptrInfo(SArray** pGroupColVals, int32_t* keyLen, char** keyBuf, const SArray* pGroupColList) {
  *pGroupColVals = taosArrayInit(4, sizeof(SGroupKeys));
  if ((*pGroupColVals) == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t numOfGroupCols = taosArrayGetSize(pGroupColList);
  for (int32_t i = 0; i < numOfGroupCols; ++i) {
    SColumn* pCol = (SColumn*)taosArrayGet(pGroupColList, i);
    (*keyLen) += pCol->bytes;  // actual data, the null flags are accounted for after the loop

    SGroupKeys key = {0};
    key.bytes = pCol->bytes;
    key.type = pCol->type;
    key.isNull = false;
    key.pData = taosMemoryCalloc(1, pCol->bytes);
    if (key.pData == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // the array only takes ownership of key.pData once the push succeeded
    if (taosArrayPush((*pGroupColVals), &key) == NULL) {
      taosMemoryFree(key.pData);
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  int32_t nullFlagSize = sizeof(int8_t) * numOfGroupCols;
  (*keyLen) += nullFlagSize;

  (*keyBuf) = taosMemoryCalloc(1, (*keyLen));
  if ((*keyBuf) == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  return TSDB_CODE_SUCCESS;
}

123 124
// Checks whether row `rowIndex` of pBlock carries the same group key as the one stored in pGroupColVals.
//
// pGroupCols:     the group columns, SArray<SColumn>
// pGroupColVals:  the recorded key values, SArray<SGroupKeys>, one entry per group column
// numOfGroupCols: number of leading group columns to compare
//
// Two NULL values are treated as equal, a NULL and a non-NULL value as different.
// Returns true if all compared columns match.
static bool groupKeyCompare(SArray* pGroupCols, SArray* pGroupColVals, SSDataBlock* pBlock, int32_t rowIndex,
                            int32_t numOfGroupCols) {
  SColumnDataAgg* pAgg = NULL;

  for (int32_t k = 0; k < numOfGroupCols; ++k) {
    SColumn*         pGroupCol = taosArrayGet(pGroupCols, k);
    SColumnInfoData* pSrcCol = taosArrayGet(pBlock->pDataBlock, pGroupCol->slotId);
    if (pBlock->pBlockAgg != NULL) {
      pAgg = pBlock->pBlockAgg[pGroupCol->slotId];  // TODO is agg data matched?
    }

    bool        rowIsNull = colDataIsNull(pSrcCol, pBlock->info.rows, rowIndex, pAgg);
    SGroupKeys* pSaved = taosArrayGet(pGroupColVals, k);

    if (rowIsNull || pSaved->isNull) {
      if (rowIsNull && pSaved->isNull) {
        continue;  // NULL matches NULL
      }
      return false;
    }

    char* pRowVal = colDataGetData(pSrcCol, rowIndex);
    bool  same = false;

    if (pSaved->type == TSDB_DATA_TYPE_JSON) {
      // the length is taken from the value of the current row
      int32_t jsonLen = getJsonValueLen(pRowVal);
      same = (memcmp(pSaved->pData, pRowVal, jsonLen) == 0);
    } else if (IS_VAR_DATA_TYPE(pSaved->type)) {
      int32_t payloadLen = varDataLen(pRowVal);
      same = (payloadLen == varDataLen(pSaved->pData) &&
              memcmp(varDataVal(pSaved->pData), varDataVal(pRowVal), payloadLen) == 0);
    } else {
      same = (memcmp(pSaved->pData, pRowVal, pSaved->bytes) == 0);
    }

    if (!same) {
      return false;
    }
  }

  return true;
}

wmmhello's avatar
wmmhello 已提交
171
// Copies the group key of row `rowIndex` of pBlock into pGroupColVals.
//
// pGroupCols:    the group columns, SArray<SColumn>
// pGroupColVals: destination, SArray<SGroupKeys>; entry i receives the value of group column i
//
// Group columns whose slot id does not address a column of pBlock are skipped.
// If tTagIsJson() reports true for the value of a json column, terrno is set to
// TSDB_CODE_QRY_JSON_IN_GROUP_ERROR and the function returns immediately; the remaining key
// entries are then left untouched, so callers have to check terrno.
static void recordNewGroupKeys(SArray* pGroupCols, SArray* pGroupColVals, SSDataBlock* pBlock, int32_t rowIndex) {
  SColumnDataAgg* pColAgg = NULL;

  int32_t numOfGroupCols = (int32_t)taosArrayGetSize(pGroupCols);
  size_t  numOfBlockCols = taosArrayGetSize(pBlock->pDataBlock);

  for (int32_t i = 0; i < numOfGroupCols; ++i) {
    SColumn* pCol = (SColumn*)taosArrayGet(pGroupCols, i);

    // valid range check, done before the slot id is used to index the block. todo: return error code.
    // A negative slot id turns into a huge unsigned value and is rejected as well.
    if ((size_t)pCol->slotId >= numOfBlockCols) {
      continue;
    }

    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, pCol->slotId);

    if (pBlock->pBlockAgg != NULL) {
      pColAgg = pBlock->pBlockAgg[pCol->slotId];  // TODO is agg data matched?
    }

    SGroupKeys* pkey = taosArrayGet(pGroupColVals, i);
    if (colDataIsNull(pColInfoData, pBlock->info.rows, rowIndex, pColAgg)) {
      pkey->isNull = true;
      continue;
    }

    pkey->isNull = false;
    char* val = colDataGetData(pColInfoData, rowIndex);
    if (pkey->type == TSDB_DATA_TYPE_JSON) {
      if (tTagIsJson(val)) {
        terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
        return;
      }
      int32_t dataLen = getJsonValueLen(val);
      memcpy(pkey->pData, val, dataLen);
    } else if (IS_VAR_DATA_TYPE(pkey->type)) {
      // verify the size before writing into the key buffer, not afterwards
      ASSERT(varDataTLen(val) <= pkey->bytes);
      memcpy(pkey->pData, val, varDataTLen(val));
    } else {
      memcpy(pkey->pData, val, pkey->bytes);
    }
  }
}

wmmhello's avatar
wmmhello 已提交
212
static int32_t buildGroupKeys(void* pKey, const SArray* pGroupColVals) {
H
Haojun Liao 已提交
213 214 215 216 217 218 219 220 221 222 223 224
  size_t numOfGroupCols = taosArrayGetSize(pGroupColVals);

  char* isNull = (char*)pKey;
  char* pStart = (char*)pKey + sizeof(int8_t) * numOfGroupCols;
  for (int32_t i = 0; i < numOfGroupCols; ++i) {
    SGroupKeys* pkey = taosArrayGet(pGroupColVals, i);
    if (pkey->isNull) {
      isNull[i] = 1;
      continue;
    }

    isNull[i] = 0;
wmmhello's avatar
wmmhello 已提交
225 226 227 228 229
    if (pkey->type == TSDB_DATA_TYPE_JSON) {
      int32_t dataLen = getJsonValueLen(pkey->pData);
      memcpy(pStart, (pkey->pData), dataLen);
      pStart += dataLen;
    } else if (IS_VAR_DATA_TYPE(pkey->type)) {
H
Haojun Liao 已提交
230 231
      varDataCopy(pStart, pkey->pData);
      pStart += varDataTLen(pkey->pData);
232
      ASSERT(varDataTLen(pkey->pData) <= pkey->bytes);
H
Haojun Liao 已提交
233 234 235 236 237 238
    } else {
      memcpy(pStart, pkey->pData, pkey->bytes);
      pStart += pkey->bytes;
    }
  }

239
  return (int32_t)(pStart - (char*)pKey);
H
Haojun Liao 已提交
240 241 242 243 244
}

// Assign the group keys or user input constant values if required.
// For every output whose functionId is -1, the value of its first input column at row `rowIndex`
// is copied into the result cell (or the result is flagged as NULL) and the result count is set to 1.
//
// pCtx:        the function contexts, numOfOutput entries
// totalRows:   number of rows in the input block
// rowIndex:    row that supplies the values
static void doAssignGroupKeys(SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t totalRows, int32_t rowIndex) {
  for (int32_t k = 0; k < numOfOutput; ++k) {
    SqlFunctionCtx* pCur = &pCtx[k];
    if (pCur->functionId != -1) {
      continue;
    }

    // select count(*),key from t group by key.
    SResultRowEntryInfo* pEntry = GET_RES_INFO(pCur);
    SColumnInfoData*     pInputCol = pCur->input.pData[0];

    // todo OPT all/all not NULL
    if (colDataIsNull(pInputCol, totalRows, rowIndex, NULL)) {
      pEntry->isNullRes = 1;  // it is a NULL value
    } else {
      char* pTarget = GET_ROWCELL_INTERBUF(pEntry);
      char* pSource = colDataGetData(pInputCol, rowIndex);

      if (pInputCol->info.type == TSDB_DATA_TYPE_JSON) {
        int32_t jsonLen = getJsonValueLen(pSource);
        memcpy(pTarget, pSource, jsonLen);
      } else if (IS_VAR_DATA_TYPE(pInputCol->info.type)) {
        varDataCopy(pTarget, pSource);
      } else {
        memcpy(pTarget, pSource, pInputCol->info.bytes);
      }
    }

    pEntry->numOfRes = 1;
  }
}

// Records the group key of row `rowIndex` as the current group key of the operator. If recording
// fails (group by on a json object), the task is aborted through a long jump with terrno as code.
static void recordGroupKeysOrAbort(SOperatorInfo* pOperator, SSDataBlock* pBlock, int32_t rowIndex) {
  SGroupbyOperatorInfo* pInfo = pOperator->info;

  // only a failure of the call below may trigger the abort, so start from a clean state
  terrno = TSDB_CODE_SUCCESS;
  recordNewGroupKeys(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, rowIndex);
  if (terrno != TSDB_CODE_SUCCESS) {  // group by json error
    T_LONG_JMP(pOperator->pTaskInfo->env, terrno);
  }
}

// Applies the aggregate functions to the rows [startRow, startRow + numOfRows) of pBlock, which all
// belong to the group whose key is currently recorded in the operator. The task is aborted through
// a long jump with TSDB_CODE_APP_ERROR if the result row of the group cannot be set up.
static void aggregateCurrentGroup(SOperatorInfo* pOperator, SSDataBlock* pBlock, int32_t startRow, int32_t numOfRows) {
  SExecTaskInfo*        pTaskInfo = pOperator->pTaskInfo;
  SGroupbyOperatorInfo* pInfo = pOperator->info;
  SqlFunctionCtx*       pCtx = pOperator->exprSupp.pCtx;
  int32_t               numOfExprs = pOperator->exprSupp.numOfExprs;

  int32_t len = buildGroupKeys(pInfo->keyBuf, pInfo->pGroupColVals);
  int32_t ret = setGroupResultOutputBuf(pOperator, &(pInfo->binfo), numOfExprs, pInfo->keyBuf, len,
                                        pBlock->info.id.groupId, pInfo->aggSup.pResultBuf, &pInfo->aggSup);
  if (ret != TSDB_CODE_SUCCESS) {  // null data, too many state code
    T_LONG_JMP(pTaskInfo->env, TSDB_CODE_APP_ERROR);
  }

  applyAggFunctionOnPartialTuples(pTaskInfo, pCtx, NULL, startRow, numOfRows, pBlock->info.rows, numOfExprs);

  // assign the group keys or user input constant values if required
  doAssignGroupKeys(pCtx, numOfExprs, pBlock->info.rows, startRow);
}

// Aggregates one input block. Consecutive rows with the same group key are collected into a run
// and the aggregate functions are applied once per run.
//
// The key recorded in pInfo->pGroupColVals survives between calls, so the first rows of a block can
// continue the group of the last rows of the previous block. Errors abort the task through a long
// jump on pTaskInfo->env.
static void doHashGroupbyAgg(SOperatorInfo* pOperator, SSDataBlock* pBlock) {
  SGroupbyOperatorInfo* pInfo = pOperator->info;
  int32_t               numOfGroupCols = taosArrayGetSize(pInfo->pGroupCols);

  terrno = TSDB_CODE_SUCCESS;

  int32_t num = 0;  // number of rows in the run that ends right before row j
  for (int32_t j = 0; j < pBlock->info.rows; ++j) {
    // Compare with the previous row of this column, and do not set the output buffer again if they are identical.
    if (!pInfo->isInit) {
      recordGroupKeysOrAbort(pOperator, pBlock, j);
      pInfo->isInit = true;
      num++;
      continue;
    }

    if (groupKeyCompare(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, j, numOfGroupCols)) {
      num++;
      continue;
    }

    // The first row of a new block does not belong to the previously existing group
    if (j == 0) {
      num++;
      recordGroupKeysOrAbort(pOperator, pBlock, j);
      continue;
    }

    // row j starts a new group: flush the run that ends at row j - 1, then switch to the new key
    aggregateCurrentGroup(pOperator, pBlock, j - num, num);
    recordGroupKeysOrAbort(pOperator, pBlock, j);
    num = 1;
  }

  if (num > 0) {
    // flush the run that reaches the end of the block
    aggregateCurrentGroup(pOperator, pBlock, pBlock->info.rows - num, num);
  }
}

347 348 349 350
// Produces the next non-empty result block of the group-by operator.
// Result blocks are built and filtered until one of them has rows or no results remain; in the
// latter case the operator is marked as completed.
// Returns the result block, or NULL if the final block has no rows.
static SSDataBlock* buildGroupResultDataBlock(SOperatorInfo* pOperator) {
  SGroupbyOperatorInfo* pGroupby = pOperator->info;
  SSDataBlock*          pOut = pGroupby->binfo.pRes;

  bool stop = false;
  do {
    doBuildResultDatablock(pOperator, &pGroupby->binfo, &pGroupby->groupResInfo, pGroupby->aggSup.pResultBuf);
    doFilter(pOut, pOperator->exprSupp.pFilterInfo, NULL);

    if (hasRemainResults(&pGroupby->groupResInfo)) {
      // the filter may have removed every row, in that case try the next batch
      stop = (pOut->info.rows > 0);
    } else {
      setOperatorCompleted(pOperator);
      stop = true;
    }
  } while (!stop);

  pOperator->resultInfo.totalRows += pOut->info.rows;
  if (pOut->info.rows == 0) {
    return NULL;
  }

  return pOut;
}

369
// getNext function of the group-by operator.
// On the first call all blocks of the downstream operator are consumed and aggregated; that call
// and all following ones return the grouped results block by block.
// Returns NULL once the operator is done. Errors abort the task through a long jump.
static SSDataBlock* hashGroupbyAggregate(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  if (pOperator->status == OP_RES_TO_RETURN) {
    // the input has been consumed already, only results are left to hand out
    return buildGroupResultDataBlock(pOperator);
  }

  SExecTaskInfo*        pTask = pOperator->pTaskInfo;
  SGroupbyOperatorInfo* pGroupby = pOperator->info;
  SOperatorInfo*        pChild = pOperator->pDownstream[0];

  int32_t order = TSDB_ORDER_ASC;
  int32_t scanFlag = MAIN_SCAN;
  int64_t startUs = taosGetTimestampUs();

  SSDataBlock* pInput = NULL;
  while ((pInput = pChild->fpSet.getNextFn(pChild)) != NULL) {
    int32_t code = getTableScanInfo(pOperator, &order, &scanFlag, false);
    if (code != TSDB_CODE_SUCCESS) {
      T_LONG_JMP(pTask->env, code);
    }

    // the pDataBlock are always the same one, no need to call this again
    setInputDataBlock(&pOperator->exprSupp, pInput, order, scanFlag, true);

    // there is an scalar expression that needs to be calculated right before apply the group aggregation.
    if (pGroupby->scalarSup.pExprInfo != NULL) {
      pTask->code = projectApplyFunctions(pGroupby->scalarSup.pExprInfo, pInput, pInput, pGroupby->scalarSup.pCtx,
                                          pGroupby->scalarSup.numOfExprs, NULL);
      if (pTask->code != TSDB_CODE_SUCCESS) {
        T_LONG_JMP(pTask->env, pTask->code);
      }
    }

    doHashGroupbyAgg(pOperator, pInput);
  }

  pOperator->status = OP_RES_TO_RETURN;

  initGroupedResultInfo(&pGroupby->groupResInfo, pGroupby->aggSup.pResultRowHashTable, 0);

  // time spent on consuming the input, converted from microseconds to milliseconds
  pOperator->cost.openCost = (taosGetTimestampUs() - startUs) / 1000.0;
  return buildGroupResultDataBlock(pOperator);
}

5
54liuyao 已提交
435
// Creates the group-by aggregate operator for the given aggregate plan node.
//
// downstream: the operator that supplies the input blocks
// pAggNode:   the physical plan node (group keys, aggregate functions, optional scalar expressions
//             and filter conditions)
// pTaskInfo:  the task the operator belongs to
//
// Returns the new operator, or NULL on failure; in that case the error code is stored in
// pTaskInfo->code and everything allocated for the operator info is released.
SOperatorInfo* createGroupOperatorInfo(SOperatorInfo* downstream, SAggPhysiNode* pAggNode, SExecTaskInfo* pTaskInfo) {
  int32_t               code = TSDB_CODE_SUCCESS;
  SGroupbyOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SGroupbyOperatorInfo));
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  SSDataBlock* pResBlock = createDataBlockFromDescNode(pAggNode->node.pOutputDataBlockDesc);
  if (pResBlock == NULL) {
    // without a result block the capacity setup below would dereference NULL
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }
  initBasicInfo(&pInfo->binfo, pResBlock);

  int32_t    numOfScalarExpr = 0;
  SExprInfo* pScalarExprInfo = NULL;
  if (pAggNode->pExprs != NULL) {
    pScalarExprInfo = createExprInfo(pAggNode->pExprs, NULL, &numOfScalarExpr);
  }

  pInfo->pGroupCols = extractColumnInfo(pAggNode->pGroupKeys);
  code = initExprSupp(&pInfo->scalarSup, pScalarExprInfo, numOfScalarExpr);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initResultSizeInfo(&pOperator->resultInfo, 4096);
  code = blockDataEnsureCapacity(pInfo->binfo.pRes, pOperator->resultInfo.capacity);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  code = initGroupOptrInfo(&pInfo->pGroupColVals, &pInfo->groupKeyLen, &pInfo->keyBuf, pInfo->pGroupCols);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  int32_t    num = 0;
  SExprInfo* pExprInfo = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &num);
  code = initAggSup(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, num, pInfo->groupKeyLen, pTaskInfo->id.str,
                    pTaskInfo->streamInfo.pState);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  code = filterInitFromNode((SNode*)pAggNode->node.pConditions, &pOperator->exprSupp.pFilterInfo, 0);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  initResultRowInfo(&pInfo->binfo.resultRowInfo);
  setOperatorInfo(pOperator, "GroupbyAggOperator", 0, true, OP_NOT_OPENED, pInfo, pTaskInfo);

  pInfo->binfo.mergeResultBlock = pAggNode->mergeDataBlock;

  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, hashGroupbyAggregate, NULL, destroyGroupOperatorInfo,
                                         optrDefaultBufFn, NULL);
  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  pTaskInfo->code = code;
  if (pInfo != NULL) {
    destroyGroupOperatorInfo(pInfo);
  }
  // NOTE(review): resources attached to pOperator->exprSupp by initAggSup/filterInitFromNode are
  // not released on this path - confirm whether cleanupExprSupp() may be called here.
  taosMemoryFreeClear(pOperator);
  return NULL;
}

H
Haojun Liao 已提交
503 504
// Distributes the rows of pBlock to the buffer pages of their groups.
//
// For every row the group key is recorded and serialized, the current page of the group is
// fetched, and the value of every output expression's input column is appended to that page.
//
// Page layout as used here: the page starts with an int32_t row counter; the data of column i
// starts at pInfo->columnOffset[i] and consists of
//   - var-length types: rowCapacity int32_t offsets (-1 for NULL), an int32_t content length, the payload
//   - other types:      a null bitmap for rowCapacity rows, an int32_t content length, the payload
//
// Errors abort the task through a long jump on pTaskInfo->env with terrno as code.
static void doHashPartition(SOperatorInfo* pOperator, SSDataBlock* pBlock) {
  SPartitionOperatorInfo* pInfo = pOperator->info;
  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;

  for (int32_t j = 0; j < pBlock->info.rows; ++j) {
    recordNewGroupKeys(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, j);
    // fail fast: after a failure the recorded keys are stale and the row would be stored in the
    // wrong group. The caller resets terrno before this function is invoked.
    if (terrno != TSDB_CODE_SUCCESS) {  // group by json error
      T_LONG_JMP(pTaskInfo->env, terrno);
    }

    int32_t len = buildGroupKeys(pInfo->keyBuf, pInfo->pGroupColVals);

    SDataGroupInfo* pGroupInfo = NULL;
    void*           pPage = getCurrentDataGroupInfo(pInfo, &pGroupInfo, len);
    if (pPage == NULL) {
      T_LONG_JMP(pTaskInfo->env, terrno);
    }

    pGroupInfo->numOfRows += 1;

    // group id, calculated once per group
    if (pGroupInfo->groupId == 0) {
      pGroupInfo->groupId = calcGroupId(pInfo->keyBuf, len);
    }

    // number of rows stored in the page so far
    int32_t* rows = (int32_t*)pPage;

    size_t numOfCols = pOperator->exprSupp.numOfExprs;
    for (int32_t i = 0; i < numOfCols; ++i) {
      SExprInfo* pExpr = &pOperator->exprSupp.pExprInfo[i];
      int32_t    slotId = pExpr->base.pParam[0].pCol->slotId;

      SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);

      int32_t bytes = pColInfoData->info.bytes;
      int32_t startOffset = pInfo->columnOffset[i];

      int32_t* columnLen = NULL;
      int32_t  contentLen = 0;

      if (IS_VAR_DATA_TYPE(pColInfoData->info.type)) {
        int32_t* offset = (int32_t*)((char*)pPage + startOffset);
        columnLen = (int32_t*)((char*)pPage + startOffset + sizeof(int32_t) * pInfo->rowCapacity);
        char* data = (char*)((char*)columnLen + sizeof(int32_t));

        if (colDataIsNull_s(pColInfoData, j)) {
          offset[(*rows)] = -1;
          contentLen = 0;
        } else if (pColInfoData->info.type == TSDB_DATA_TYPE_JSON) {
          offset[*rows] = (*columnLen);
          char*   src = colDataGetData(pColInfoData, j);
          int32_t dataLen = getJsonValueLen(src);

          memcpy(data + (*columnLen), src, dataLen);
          int32_t v = (data + (*columnLen) + dataLen - (char*)pPage);
          ASSERT(v > 0);

          contentLen = dataLen;
        } else {
          offset[*rows] = (*columnLen);
          char* src = colDataGetData(pColInfoData, j);
          memcpy(data + (*columnLen), src, varDataTLen(src));
          int32_t v = (data + (*columnLen) + varDataTLen(src) - (char*)pPage);
          ASSERT(v > 0);

          contentLen = varDataTLen(src);
        }
      } else {
        char* bitmap = (char*)pPage + startOffset;
        columnLen = (int32_t*)((char*)pPage + startOffset + BitmapLen(pInfo->rowCapacity));
        char* data = (char*)columnLen + sizeof(int32_t);

        bool isNull = colDataIsNull_f(pColInfoData->nullbitmap, j);
        if (isNull) {
          colDataSetNull_f(bitmap, (*rows));
        } else {
          memcpy(data + (*columnLen), colDataGetData(pColInfoData, j), bytes);
          ASSERT((data + (*columnLen) + bytes - (char*)pPage) <= getBufPageSize(pInfo->pBuf));
        }
        // a NULL value still occupies a slot of the column width
        contentLen = bytes;
      }

      (*columnLen) += contentLen;
    }

    (*rows) += 1;

    setBufPageDirty(pPage, true);
    releaseBufPage(pInfo->pBuf, pPage);
  }
}

// Returns the buffer page to which the next row of the group identified by the key in
// pInfo->keyBuf has to be appended.
//
// For an unknown key a new group with a first page is created. For a known key the last page of
// the group is returned, unless it already holds pInfo->rowCapacity rows, in which case a new page
// is appended to the group.
//
// pInfo:      the partition operator state; pInfo->keyBuf holds the serialized group key
// pGroupInfo: out, receives the group entry stored in pInfo->pGroupSet; only set on success
// len:        length of the serialized group key in bytes
//
// Returns the page, which the caller has to release, or NULL on failure with terrno set.
void* getCurrentDataGroupInfo(const SPartitionOperatorInfo* pInfo, SDataGroupInfo** pGroupInfo, int32_t len) {
  SDataGroupInfo* p = taosHashGet(pInfo->pGroupSet, pInfo->keyBuf, len);

  void* pPage = NULL;
  if (p == NULL) {  // it is a new group
    SDataGroupInfo gi = {0};
    gi.pPageList = taosArrayInit(100, sizeof(int32_t));
    if (gi.pPageList == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return NULL;
    }

    if (taosHashPut(pInfo->pGroupSet, pInfo->keyBuf, len, &gi, sizeof(SDataGroupInfo)) != 0) {
      // the hash table did not take over the page list
      taosArrayDestroy(gi.pPageList);
      if (terrno == TSDB_CODE_SUCCESS) {
        terrno = TSDB_CODE_OUT_OF_MEMORY;
      }
      return NULL;
    }

    // continue with the copy that lives inside the hash table
    p = taosHashGet(pInfo->pGroupSet, pInfo->keyBuf, len);
    if (p == NULL) {
      terrno = TSDB_CODE_APP_ERROR;
      return NULL;
    }

    int32_t pageId = 0;
    pPage = getNewBufPage(pInfo->pBuf, &pageId);
    if (pPage == NULL) {
      qError("failed to get new buffer, code:%s", tstrerror(terrno));
      return pPage;
    }

    if (taosArrayPush(p->pPageList, &pageId) == NULL) {
      releaseBufPage(pInfo->pBuf, pPage);
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return NULL;
    }

    *(int32_t*)pPage = 0;  // the new page holds no rows yet
  } else {
    int32_t* curId = taosArrayGetLast(p->pPageList);
    pPage = getBufPage(pInfo->pBuf, *curId);
    if (pPage == NULL) {
      qError("failed to get buffer, code:%s", tstrerror(terrno));
      return pPage;
    }

    int32_t* rows = (int32_t*)pPage;
    if (*rows >= pInfo->rowCapacity) {
      // the last page is full, release it
      releaseBufPage(pInfo->pBuf, pPage);

      // add a new page for current group
      int32_t pageId = 0;
      pPage = getNewBufPage(pInfo->pBuf, &pageId);
      if (pPage == NULL) {
        qError("failed to get new buffer, code:%s", tstrerror(terrno));
        return NULL;
      }

      if (taosArrayPush(p->pPageList, &pageId) == NULL) {
        releaseBufPage(pInfo->pBuf, pPage);
        terrno = TSDB_CODE_OUT_OF_MEMORY;
        return NULL;
      }

      memset(pPage, 0, getBufPageSize(pInfo->pBuf));
    }
  }

  *pGroupInfo = p;
  return pPage;
}

// Derives a 64-bit group id from a serialized group key.
// pData: the key bytes
// len:   number of key bytes
// Returns the first 8 bytes of the MD5 digest of the key.
uint64_t calcGroupId(char* pData, int32_t len) {
  T_MD5_CTX md5;

  tMD5Init(&md5);
  tMD5Update(&md5, (uint8_t*)pData, len);
  tMD5Final(&md5);

  // NOTE: only extract the initial 8 bytes of the final MD5 digest
  uint64_t groupId = 0;
  memcpy(&groupId, md5.digest, sizeof(uint64_t));

  return groupId;
}

H
Haojun Liao 已提交
653
int32_t* setupColumnOffset(const SSDataBlock* pBlock, int32_t rowCapacity) {
654
  size_t   numOfCols = taosArrayGetSize(pBlock->pDataBlock);
655
  int32_t* offset = taosMemoryCalloc(numOfCols, sizeof(int32_t));
H
Haojun Liao 已提交
656

657 658
  offset[0] = sizeof(int32_t) +
              sizeof(uint64_t);  // the number of rows in current page, ref to SSDataBlock paged serialization format
H
Haojun Liao 已提交
659

660
  for (int32_t i = 0; i < numOfCols - 1; ++i) {
H
Haojun Liao 已提交
661 662 663 664
    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, i);

    int32_t bytes = pColInfoData->info.bytes;
    int32_t payloadLen = bytes * rowCapacity;
665

H
Haojun Liao 已提交
666 667 668 669 670 671 672 673 674 675 676 677
    if (IS_VAR_DATA_TYPE(pColInfoData->info.type)) {
      // offset segment + content length + payload
      offset[i + 1] = rowCapacity * sizeof(int32_t) + sizeof(int32_t) + payloadLen + offset[i];
    } else {
      // bitmap + content length + payload
      offset[i + 1] = BitmapLen(rowCapacity) + sizeof(int32_t) + payloadLen + offset[i];
    }
  }

  return offset;
}

5
54liuyao 已提交
678
// Drops all partitioned data: destroys the page list of every group in the sorted group array,
// empties that array and clears the paged buffer.
static void clearPartitionOperator(SPartitionOperatorInfo* pInfo) {
  SArray* pGroups = pInfo->sortedGroupArray;

  for (int32_t idx = 0, total = taosArrayGetSize(pGroups); idx < total; ++idx) {
    SDataGroupInfo* pGroup = taosArrayGet(pGroups, idx);
    taosArrayDestroy(pGroup->pPageList);
  }

  taosArrayClear(pGroups);
  clearDiskbasedBuf(pInfo->pBuf);
}

688 689 690
static int compareDataGroupInfo(const void* group1, const void* group2) {
  const SDataGroupInfo* pGroupInfo1 = group1;
  const SDataGroupInfo* pGroupInfo2 = group2;
691 692 693 694 695

  if (pGroupInfo1->groupId == pGroupInfo2->groupId) {
    return 0;
  }

696
  return (pGroupInfo1->groupId < pGroupInfo2->groupId) ? -1 : 1;
697 698
}

H
Haojun Liao 已提交
699 700
// Returns the next page of partitioned data as a result block.
// The pages of one group are returned one after another; when a group is exhausted the next group
// of the sorted group array follows. After the last group the operator is marked as completed, the
// partition data is cleared and NULL is returned.
// A page that cannot be loaded aborts the task through a long jump with terrno as code.
static SSDataBlock* buildPartitionResult(SOperatorInfo* pOperator) {
  SPartitionOperatorInfo* pPart = pOperator->info;
  SExecTaskInfo*          pTask = pOperator->pTaskInfo;

  SDataGroupInfo* pGroup = NULL;
  bool            moveToNextGroup = true;  // also true while no group has been selected yet
  if (pPart->groupIndex != -1) {
    pGroup = taosArrayGet(pPart->sortedGroupArray, pPart->groupIndex);
    moveToNextGroup = (pPart->pageIndex >= taosArrayGetSize(pGroup->pPageList));
  }

  if (moveToNextGroup) {
    // try next group data
    ++pPart->groupIndex;
    if (pPart->groupIndex >= taosArrayGetSize(pPart->sortedGroupArray)) {
      setOperatorCompleted(pOperator);
      clearPartitionOperator(pPart);
      return NULL;
    }

    pGroup = taosArrayGet(pPart->sortedGroupArray, pPart->groupIndex);
    pPart->pageIndex = 0;
  }

  int32_t* pPageId = taosArrayGet(pGroup->pPageList, pPart->pageIndex);
  void*    pPage = getBufPage(pPart->pBuf, *pPageId);
  if (pPage == NULL) {
    qError("failed to get buffer, code:%s, %s", tstrerror(terrno), GET_TASKID(pTask));
    T_LONG_JMP(pTask->env, terrno);
  }

  SSDataBlock* pOut = pPart->binfo.pRes;

  // load the page content into the result block
  blockDataEnsureCapacity(pOut, pPart->rowCapacity);
  blockDataFromBuf1(pOut, pPage, pPart->rowCapacity);

  pPart->pageIndex += 1;
  releaseBufPage(pPart->pBuf, pPage);

  pOut->info.dataLoad = 1;
  blockDataUpdateTsWindow(pOut, 0);
  pOut->info.id.groupId = pGroup->groupId;

  pOperator->resultInfo.totalRows += pOut->info.rows;
  return pOut;
}

739
// getNext entry point of the (blocking) partition operator.
// First call: drains the downstream operator, hashes every block into per-group
// page lists (doHashPartition), sorts the groups by group id and switches the
// operator to OP_RES_TO_RETURN. This and all later calls return one buffered page
// per call through buildPartitionResult(); NULL is returned once done.
// Failures are reported by long-jumping to pTaskInfo->env.
static SSDataBlock* hashPartition(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;
  SPartitionOperatorInfo* pInfo = pOperator->info;
  SSDataBlock*            pRes = pInfo->binfo.pRes;

  if (pOperator->status == OP_RES_TO_RETURN) {
    blockDataCleanup(pRes);
    return buildPartitionResult(pOperator);
  }

  int64_t        st = taosGetTimestampUs();
  SOperatorInfo* downstream = pOperator->pDownstream[0];

  while (1) {
    SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
    if (pBlock == NULL) {
      break;
    }

    // scalar expressions, if any, must be evaluated before the rows are partitioned
    if (pInfo->scalarSup.pExprInfo != NULL) {
      pTaskInfo->code = projectApplyFunctions(pInfo->scalarSup.pExprInfo, pBlock, pBlock, pInfo->scalarSup.pCtx,
                                              pInfo->scalarSup.numOfExprs, NULL);
      if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
        T_LONG_JMP(pTaskInfo->env, pTaskInfo->code);
      }
    }

    // doHashPartition reports problems through terrno only
    terrno = TSDB_CODE_SUCCESS;
    doHashPartition(pOperator, pBlock);
    if (terrno != TSDB_CODE_SUCCESS) {  // group by json error
      T_LONG_JMP(pTaskInfo->env, terrno);
    }
  }

  SArray* groupArray = taosArrayInit(taosHashGetSize(pInfo->pGroupSet), sizeof(SDataGroupInfo));
  if (groupArray == NULL) {
    // Without this check the groups would be dropped silently and the query would
    // return an empty result. The page lists are still owned by pGroupSet here, so
    // the operator destructor releases them.
    pTaskInfo->code = TSDB_CODE_OUT_OF_MEMORY;
    T_LONG_JMP(pTaskInfo->env, pTaskInfo->code);
  }

  // move the group descriptors from the hash table into a sortable array
  void* pGroupIter = taosHashIterate(pInfo->pGroupSet, NULL);
  while (pGroupIter != NULL) {
    SDataGroupInfo* pGroupInfo = pGroupIter;
    taosArrayPush(groupArray, pGroupInfo);
    pGroupIter = taosHashIterate(pInfo->pGroupSet, pGroupIter);
  }

  taosArraySort(groupArray, compareDataGroupInfo);
  pInfo->sortedGroupArray = groupArray;
  pInfo->groupIndex = -1;  // no group opened yet, see buildPartitionResult()
  taosHashClear(pInfo->pGroupSet);

  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;

  pOperator->status = OP_RES_TO_RETURN;
  blockDataEnsureCapacity(pRes, 4096);
  return buildPartitionResult(pOperator);
}

800
static void destroyPartitionOperatorInfo(void* param) {
H
Haojun Liao 已提交
801
  SPartitionOperatorInfo* pInfo = (SPartitionOperatorInfo*)param;
802
  cleanupBasicInfo(&pInfo->binfo);
H
Haojun Liao 已提交
803
  taosArrayDestroy(pInfo->pGroupCols);
804

805
  for (int i = 0; i < taosArrayGetSize(pInfo->pGroupColVals); i++) {
wmmhello's avatar
wmmhello 已提交
806 807 808
    SGroupKeys key = *(SGroupKeys*)taosArrayGet(pInfo->pGroupColVals, i);
    taosMemoryFree(key.pData);
  }
809

H
Haojun Liao 已提交
810
  taosArrayDestroy(pInfo->pGroupColVals);
H
Haojun Liao 已提交
811
  taosMemoryFree(pInfo->keyBuf);
dengyihao's avatar
dengyihao 已提交
812 813 814 815 816 817

  int32_t size = taosArrayGetSize(pInfo->sortedGroupArray);
  for (int32_t i = 0; i < size; i++) {
    SDataGroupInfo* pGp = taosArrayGet(pInfo->sortedGroupArray, i);
    taosArrayDestroy(pGp->pPageList);
  }
818
  taosArrayDestroy(pInfo->sortedGroupArray);
D
dapan1121 已提交
819 820 821 822 823 824 825 826

  void* pGroupIter = taosHashIterate(pInfo->pGroupSet, NULL);
  while (pGroupIter != NULL) {
    SDataGroupInfo* pGroupInfo = pGroupIter;
    taosArrayDestroy(pGroupInfo->pPageList);
    pGroupIter = taosHashIterate(pInfo->pGroupSet, pGroupIter);
  }

wmmhello's avatar
wmmhello 已提交
827
  taosHashCleanup(pInfo->pGroupSet);
H
Haojun Liao 已提交
828
  taosMemoryFree(pInfo->columnOffset);
829

830
  cleanupExprSupp(&pInfo->scalarSup);
H
Haojun Liao 已提交
831
  destroyDiskbasedBuf(pInfo->pBuf);
D
dapan1121 已提交
832
  taosMemoryFreeClear(param);
H
Haojun Liao 已提交
833 834
}

835 836
// Create the blocking "partition by" operator.
//   downstream - the single input operator
//   pPartNode  - physical plan node (partition keys, optional scalar expressions,
//                targets and output block description)
//   pTaskInfo  - owning task; pTaskInfo->code receives the error code on failure
// Returns the new operator, or NULL on failure (terrno and pTaskInfo->code are set
// and everything allocated here is released).
SOperatorInfo* createPartitionOperatorInfo(SOperatorInfo* downstream, SPartitionPhysiNode* pPartNode,
                                           SExecTaskInfo* pTaskInfo) {
  int32_t code = TSDB_CODE_SUCCESS;

  SPartitionOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SPartitionOperatorInfo));
  SOperatorInfo*          pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pInfo->pGroupCols = extractPartitionColInfo(pPartNode->pPartitionKeys);

  // optional scalar expressions evaluated on every input block before partitioning
  if (pPartNode->pExprs != NULL) {
    int32_t    num = 0;
    SExprInfo* pExprInfo1 = createExprInfo(pPartNode->pExprs, NULL, &num);
    code = initExprSupp(&pInfo->scalarSup, pExprInfo1, num);
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
  }

  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pInfo->pGroupSet = taosHashInit(100, hashFn, false, HASH_NO_LOCK);
  if (pInfo->pGroupSet == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  uint32_t defaultPgsz = 0;
  uint32_t defaultBufsz = 0;

  pInfo->binfo.pRes = createDataBlockFromDescNode(pPartNode->node.pOutputDataBlockDesc);
  if (pInfo->binfo.pRes == NULL) {
    // pRes is dereferenced right below; same check as in the stream partition operator
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }
  getBufferPgSize(pInfo->binfo.pRes->info.rowSize, &defaultPgsz, &defaultBufsz);

  if (!osTempSpaceAvailable()) {
    code = TSDB_CODE_NO_DISKSPACE;
    terrno = code;  // terrstr() below reports terrno
    qError("Create partition operator info failed since %s, tempDir:%s", terrstr(), tsTempDir);
    goto _error;
  }

  code = createDiskbasedBuf(&pInfo->pBuf, defaultPgsz, defaultBufsz, pTaskInfo->id.str, tsTempDir);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  pInfo->rowCapacity = blockDataGetCapacityInRow(pInfo->binfo.pRes, getBufPageSize(pInfo->pBuf));
  pInfo->columnOffset = setupColumnOffset(pInfo->binfo.pRes, pInfo->rowCapacity);
  code = initGroupOptrInfo(&pInfo->pGroupColVals, &pInfo->groupKeyLen, &pInfo->keyBuf, pInfo->pGroupCols);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  // The target expressions are created only after every pInfo-related step has
  // succeeded, so the earlier error paths have nothing extra to release.
  int32_t    numOfCols = 0;
  SExprInfo* pExprInfo = createExprInfo(pPartNode->pTargets, NULL, &numOfCols);

  setOperatorInfo(pOperator, "PartitionOperator", QUERY_NODE_PHYSICAL_PLAN_PARTITION, false, OP_NOT_OPENED, pInfo,
                  pTaskInfo);
  pOperator->exprSupp.numOfExprs = numOfCols;
  pOperator->exprSupp.pExprInfo = pExprInfo;

  pOperator->fpSet =
      createOperatorFpSet(optrDummyOpenFn, hashPartition, NULL, destroyPartitionOperatorInfo, optrDefaultBufFn, NULL);

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  return pOperator;

_error:
  terrno = code;
  pTaskInfo->code = code;
  if (pInfo != NULL) {
    destroyPartitionOperatorInfo(pInfo);
  }
  if (pOperator != NULL) {
    // releases the target expressions if they were already attached; a no-op on
    // the still zero-initialized supporter otherwise
    cleanupExprSupp(&pOperator->exprSupp);
  }
  taosMemoryFreeClear(pOperator);
  return NULL;
}

922 923 924
// Look up (or create) the result row for the group key pData/bytes of group
// groupId and bind the operator's function contexts to it.
// Always returns TSDB_CODE_SUCCESS.
int32_t setGroupResultOutputBuf(SOperatorInfo* pOperator, SOptrBasicInfo* binfo, int32_t numOfCols, char* pData,
                                int16_t bytes, uint64_t groupId, SDiskbasedBuf* pBuf, SAggSupporter* pAggSup) {
  SExprSupp*      pSup = &pOperator->exprSupp;
  SqlFunctionCtx* pFuncCtx = pSup->pCtx;

  SResultRow* pRow = doSetResultOutBufByKey(pBuf, &binfo->resultRowInfo, pData, bytes, true, groupId,
                                            pOperator->pTaskInfo, false, pAggSup, false);

  setResultRowInitCtx(pRow, pFuncCtx, numOfCols, pSup->rowEntryInfoOffset);
  return TSDB_CODE_SUCCESS;
}
934 935 936

// Compute the group id of row rowId in pBlock.
// When pExprSup carries scalar expressions they are applied to pBlock in place
// first; a failure there is only logged and the computation continues.
uint64_t calGroupIdByData(SPartitionBySupporter* pParSup, SExprSupp* pExprSup, SSDataBlock* pBlock, int32_t rowId) {
  if (pExprSup->pExprInfo != NULL) {
    int32_t ret =
        projectApplyFunctions(pExprSup->pExprInfo, pBlock, pBlock, pExprSup->pCtx, pExprSup->numOfExprs, NULL);
    if (ret != TSDB_CODE_SUCCESS) {
      qError("calaculate group id error, code:%d", ret);
    }
  }

  // capture the key values of the row, serialize them and hash the serialized key
  recordNewGroupKeys(pParSup->pGroupCols, pParSup->pGroupColVals, pBlock, rowId);
  int32_t keyLen = buildGroupKeys(pParSup->keyBuf, pParSup->pGroupColVals);
  return calcGroupId(pParSup->keyBuf, keyLen);
}

949
// True while the partition iterator still points at a partition that has not been returned.
static bool hasRemainPartion(SStreamPartitionOperatorInfo* pInfo) {
  if (pInfo->parIte == NULL) {
    return false;
  }
  return true;
}
5
54liuyao 已提交
950
// True while the table-name iterator still points at a partition that has not been visited.
static bool hasRemainTbName(SStreamPartitionOperatorInfo* pInfo) {
  if (pInfo->pTbNameIte == NULL) {
    return false;
  }
  return true;
}
951 952 953

// Build the result block for the partition pInfo->parIte currently points at:
// copies the rows recorded in the partition's rowIds from the cached input block
// into pInfo->binfo.pRes, stamps the block with the partition's group id (and its
// sub-table name when one is registered) and advances the iterator.
// Must only be called while hasRemainPartion(pInfo) holds.
static SSDataBlock* buildStreamPartitionResult(SOperatorInfo* pOperator) {
  SStreamPartitionOperatorInfo* pInfo = pOperator->info;
  SSDataBlock*                  pDest = pInfo->binfo.pRes;
  ASSERT(hasRemainPartion(pInfo));
  SPartitionDataInfo* pParInfo = (SPartitionDataInfo*)pInfo->parIte;
  blockDataCleanup(pDest);
  int32_t rows = taosArrayGetSize(pParInfo->rowIds);

  // The result block is only pre-sized when the operator is created; make sure it
  // can hold every row of this partition before writing into its columns.
  blockDataEnsureCapacity(pDest, rows);

  SSDataBlock* pSrc = pInfo->pInputDataBlock;
  for (int32_t i = 0; i < rows; i++) {
    int32_t rowIndex = *(int32_t*)taosArrayGet(pParInfo->rowIds, i);
    for (int32_t j = 0; j < pOperator->exprSupp.numOfExprs; j++) {
      // output column j is fed from the input slot referenced by target expression j
      int32_t          slotId = pOperator->exprSupp.pExprInfo[j].base.pParam[0].pCol->slotId;
      SColumnInfoData* pSrcCol = taosArrayGet(pSrc->pDataBlock, slotId);
      SColumnInfoData* pDestCol = taosArrayGet(pDest->pDataBlock, j);
      bool             isNull = colDataIsNull(pSrcCol, pSrc->info.rows, rowIndex, NULL);
      char*            pSrcData = colDataGetData(pSrcCol, rowIndex);
      colDataSetVal(pDestCol, pDest->info.rows, pSrcData, isNull);
    }
    pDest->info.rows++;
  }

  pDest->info.parTbName[0] = 0;
  if (pInfo->tbnameCalSup.numOfExprs > 0) {
    void* tbname = NULL;
    if (streamStateGetParName(pOperator->pTaskInfo->streamInfo.pState, pParInfo->groupId, &tbname) == 0) {
      memcpy(pDest->info.parTbName, tbname, TSDB_TABLE_NAME_LEN);
      streamFreeVal(tbname);
    }
  }

  // the row ids are consumed; clear the pointer so the list is not released twice
  taosArrayDestroy(pParInfo->rowIds);
  pParInfo->rowIds = NULL;
  pDest->info.dataLoad = 1;

  blockDataUpdateTsWindow(pDest, pInfo->tsColIndex);
  pDest->info.id.groupId = pParInfo->groupId;
  pOperator->resultInfo.totalRows += pDest->info.rows;
  pInfo->parIte = taosHashIterate(pInfo->pPartitions, pInfo->parIte);
  ASSERT(pDest->info.rows > 0);
  printDataBlock(pDest, "stream partitionby");
  return pDest;
}

5
54liuyao 已提交
993
// Append one "create child table" row for group groupId to pDestBlock, unless a
// sub-table name is already registered for that group in pState.
//  - name already registered: it is copied into pSrcBlock->info.parTbName and
//    nothing is appended.
//  - otherwise: row rowId of pSrcBlock is copied into a temporary one-row block,
//    the table-name / tag expressions are evaluated on it into pDestBlock, the
//    group id column is filled and pDestBlock gains exactly one row.
void appendCreateTableRow(SStreamState* pState, SExprSupp* pTableSup, SExprSupp* pTagSup, uint64_t groupId,
                          SSDataBlock* pSrcBlock, int32_t rowId, SSDataBlock* pDestBlock) {
  void* pValue = NULL;
  if (streamStateGetParName(pState, groupId, &pValue) == 0) {
    memcpy(pSrcBlock->info.parTbName, pValue, TSDB_TABLE_NAME_LEN);
    streamStateReleaseBuf(pState, NULL, pValue);
    return;
  }

  SSDataBlock* pOneRow = blockCopyOneRow(pSrcBlock, rowId);
  memset(pOneRow->info.parTbName, 0, TSDB_TABLE_NAME_LEN);
  pOneRow->info.id.groupId = groupId;

  // note: the computed name is written into the source block's parTbName
  char* tbName = pSrcBlock->info.parTbName;
  if (pTableSup->numOfExprs > 0) {
    projectApplyFunctions(pTableSup->pExprInfo, pDestBlock, pOneRow, pTableSup->pCtx, pTableSup->numOfExprs, NULL);
    SColumnInfoData* pNameCol = taosArrayGet(pDestBlock->pDataBlock, UD_TABLE_NAME_COLUMN_INDEX);
    memset(tbName, 0, TSDB_TABLE_NAME_LEN);

    int32_t nameLen = 0;
    if (colDataIsNull_s(pNameCol, pDestBlock->info.rows - 1)) {
      nameLen = 1;
      tbName[0] = 0;
    } else {
      // clamp the computed name so the terminating zero always fits
      void* pData = colDataGetData(pNameCol, pDestBlock->info.rows - 1);
      nameLen = TMIN(varDataLen(pData), TSDB_TABLE_NAME_LEN - 1);
      memcpy(tbName, varDataVal(pData), nameLen);
      streamStatePutParName(pState, groupId, tbName);
    }

    memcpy(pOneRow->info.parTbName, tbName, nameLen);
    // take back the row count so the next step writes into the same row
    pDestBlock->info.rows--;
  } else {
    void* pTbNameCol = taosArrayGet(pDestBlock->pDataBlock, UD_TABLE_NAME_COLUMN_INDEX);
    colDataSetNULL(pTbNameCol, pDestBlock->info.rows);
    tbName[0] = 0;
  }

  if (pTagSup->numOfExprs > 0) {
    projectApplyFunctions(pTagSup->pExprInfo, pDestBlock, pOneRow, pTagSup->pCtx, pTagSup->numOfExprs, NULL);
    pDestBlock->info.rows--;
  } else {
    memcpy(pDestBlock->info.parTbName, pOneRow->info.parTbName, TSDB_TABLE_NAME_LEN);
  }

  // finally the group id column; only now the row is counted
  void* pGpIdCol = taosArrayGet(pDestBlock->pDataBlock, UD_GROUPID_COLUMN_INDEX);
  colDataAppend(pGpIdCol, pDestBlock->info.rows, (const char*)&groupId, false);
  pDestBlock->info.rows++;
  blockDataDestroy(pOneRow);

  streamStateReleaseBuf(pState, NULL, pValue);
}

// Produce the "create child table" block for the partition pTbNameIte points at
// and advance that iterator by one partition.
// Returns NULL when neither a sub-table name nor tag expressions are configured,
// when there are no partitions, or when no row was appended.
static SSDataBlock* buildStreamCreateTableResult(SOperatorInfo* pOperator) {
  SStreamPartitionOperatorInfo* pInfo = pOperator->info;

  bool nothingToCreate = (pInfo->tbnameCalSup.numOfExprs == 0 && pInfo->tagCalSup.numOfExprs == 0);
  if (nothingToCreate || taosHashGetSize(pInfo->pPartitions) == 0) {
    return NULL;
  }

  SSDataBlock* pCreateRes = pInfo->pCreateTbRes;
  blockDataCleanup(pCreateRes);
  blockDataEnsureCapacity(pCreateRes, taosHashGetSize(pInfo->pPartitions));
  SSDataBlock* pInput = pInfo->pInputDataBlock;

  if (pInfo->pTbNameIte != NULL) {
    SPartitionDataInfo* pPart = (SPartitionDataInfo*)pInfo->pTbNameIte;
    // the first row of the partition represents the whole group
    int32_t firstRow = *(int32_t*)taosArrayGet(pPart->rowIds, 0);
    appendCreateTableRow(pOperator->pTaskInfo->streamInfo.pState, &pInfo->tbnameCalSup, &pInfo->tagCalSup,
                         pPart->groupId, pInput, firstRow, pCreateRes);
    pInfo->pTbNameIte = taosHashIterate(pInfo->pPartitions, pInfo->pTbNameIte);
  }

  if (pInfo->pCreateTbRes->info.rows > 0) {
    return pInfo->pCreateTbRes;
  }
  return NULL;
}

1060 1061 1062 1063
// Split the rows of pBlock into partitions: for every row the group key is built
// and the row index is appended to the row-id list of the matching entry in
// pInfo->pPartitions (a new entry is created on first sight of a key).
// pBlock is remembered as the operator's current input block.
static void doStreamHashPartitionImpl(SStreamPartitionOperatorInfo* pInfo, SSDataBlock* pBlock) {
  SPartitionBySupporter* pSup = &pInfo->partitionSup;

  pInfo->pInputDataBlock = pBlock;
  for (int32_t i = 0; i < pBlock->info.rows; ++i) {
    recordNewGroupKeys(pSup->pGroupCols, pSup->pGroupColVals, pBlock, i);
    int32_t keyLen = buildGroupKeys(pSup->keyBuf, pSup->pGroupColVals);

    SPartitionDataInfo* pExisting = (SPartitionDataInfo*)taosHashGet(pInfo->pPartitions, pSup->keyBuf, keyLen);
    if (pExisting != NULL) {
      taosArrayPush(pExisting->rowIds, &i);
      continue;
    }

    // first row of a new partition
    SPartitionDataInfo fresh = {0};
    fresh.groupId = calcGroupId(pSup->keyBuf, keyLen);
    fresh.rowIds = taosArrayInit(64, sizeof(int32_t));
    taosArrayPush(fresh.rowIds, &i);
    taosHashPut(pInfo->pPartitions, pSup->keyBuf, keyLen, &fresh, sizeof(SPartitionDataInfo));
  }
}

// getNext entry point of the stream partition operator.
// Per call it returns, in this order of preference:
//   1. a pending "create child table" block,
//   2. the result block of the next pending partition,
//   3. otherwise it fetches one block from downstream, partitions it and starts
//      returning from 1. again.
// Delete blocks are forwarded as STREAM_DELETE_RESULT; blocks of the remaining
// non-data types are passed through unchanged. Returns NULL when downstream is
// exhausted. A failing scalar expression aborts the task via long jump.
static SSDataBlock* doStreamHashPartition(SOperatorInfo* pOperator) {
  if (pOperator->status == OP_EXEC_DONE) {
    return NULL;
  }

  SExecTaskInfo*                pTaskInfo = pOperator->pTaskInfo;
  SStreamPartitionOperatorInfo* pInfo = pOperator->info;
  SSDataBlock*                  pCtRes = NULL;

  if (hasRemainTbName(pInfo)) {
    pCtRes = buildStreamCreateTableResult(pOperator);
    if (pCtRes != NULL) {
      return pCtRes;
    }
  }

  if (hasRemainPartion(pInfo)) {
    return buildStreamPartitionResult(pOperator);
  }

  int64_t        st = taosGetTimestampUs();
  SOperatorInfo* downstream = pOperator->pDownstream[0];

  pInfo->pInputDataBlock = NULL;
  SSDataBlock* pBlock = downstream->fpSet.getNextFn(downstream);
  if (pBlock == NULL) {
    setOperatorCompleted(pOperator);
    return NULL;
  }
  printDataBlock(pBlock, "stream partitionby recv");

  switch (pBlock->info.type) {
    case STREAM_NORMAL:
    case STREAM_PULL_DATA:
    case STREAM_INVALID:
      // data blocks: the result block inherits the input type
      pInfo->binfo.pRes->info.type = pBlock->info.type;
      break;
    case STREAM_DELETE_DATA: {
      copyDataBlock(pInfo->pDelRes, pBlock);
      pInfo->pDelRes->info.type = STREAM_DELETE_RESULT;
      printDataBlock(pInfo->pDelRes, "stream partitionby delete");
      return pInfo->pDelRes;
    }
    default:
      ASSERTS(pBlock->info.type == STREAM_CREATE_CHILD_TABLE || pBlock->info.type == STREAM_RETRIEVE, "invalid SSDataBlock type");
      return pBlock;
  }

  // Scalar expressions must be evaluated before the rows are partitioned. The
  // partition keys are taken from the processed block, so a failure here must not
  // be ignored.
  if (pInfo->scalarSup.pExprInfo != NULL) {
    pTaskInfo->code = projectApplyFunctions(pInfo->scalarSup.pExprInfo, pBlock, pBlock, pInfo->scalarSup.pCtx,
                                            pInfo->scalarSup.numOfExprs, NULL);
    if (pTaskInfo->code != TSDB_CODE_SUCCESS) {
      T_LONG_JMP(pTaskInfo->env, pTaskInfo->code);
    }
  }

  taosHashClear(pInfo->pPartitions);
  doStreamHashPartitionImpl(pInfo, pBlock);

  pOperator->cost.openCost = (taosGetTimestampUs() - st) / 1000.0;

  // both iterators start at the first partition of the freshly filled table
  pInfo->parIte = taosHashIterate(pInfo->pPartitions, NULL);
  pInfo->pTbNameIte = taosHashIterate(pInfo->pPartitions, NULL);
  pCtRes = buildStreamCreateTableResult(pOperator);
  if (pCtRes != NULL) {
    return pCtRes;
  }
  return buildStreamPartitionResult(pOperator);
}

static void destroyStreamPartitionOperatorInfo(void* param) {
  SStreamPartitionOperatorInfo* pInfo = (SStreamPartitionOperatorInfo*)param;
  cleanupBasicInfo(&pInfo->binfo);
  taosArrayDestroy(pInfo->partitionSup.pGroupCols);

1150
  for (int i = 0; i < taosArrayGetSize(pInfo->partitionSup.pGroupColVals); i++) {
1151 1152 1153 1154 1155 1156 1157
    SGroupKeys key = *(SGroupKeys*)taosArrayGet(pInfo->partitionSup.pGroupColVals, i);
    taosMemoryFree(key.pData);
  }
  taosArrayDestroy(pInfo->partitionSup.pGroupColVals);

  taosMemoryFree(pInfo->partitionSup.keyBuf);
  cleanupExprSupp(&pInfo->scalarSup);
L
Liu Jicong 已提交
1158 1159
  cleanupExprSupp(&pInfo->tbnameCalSup);
  cleanupExprSupp(&pInfo->tagCalSup);
1160
  blockDataDestroy(pInfo->pDelRes);
1161
  taosHashCleanup(pInfo->pPartitions);
5
54liuyao 已提交
1162
  blockDataDestroy(pInfo->pCreateTbRes);
1163 1164 1165 1166 1167 1168 1169 1170 1171 1172
  taosMemoryFreeClear(param);
}

// Hand the partition settings over to the downstream operator when it is a stream
// scan: the scan receives a copy of *pParSup and a pointer to pExpr, and an update
// info object is created for it unless update checking is ignored or one already
// exists. Any other downstream operator type is left untouched.
void initParDownStream(SOperatorInfo* downstream, SPartitionBySupporter* pParSup, SExprSupp* pExpr) {
  if (downstream->operatorType == QUERY_NODE_PHYSICAL_PLAN_STREAM_SCAN) {
    SStreamScanInfo* pScan = downstream->info;
    pScan->partitionSup = *pParSup;
    pScan->pPartScalarSup = pExpr;

    if (!(pScan->igCheckUpdate || pScan->pUpdateInfo)) {
      pScan->pUpdateInfo = updateInfoInit(60000, TSDB_TIME_PRECISION_MILLI, 0);
    }
  }
}

5
54liuyao 已提交
1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217
// Allocate the block that carries "create child table" requests
// (type STREAM_CREATE_CHILD_TABLE). Column layout, in this order:
//   - sub-table name (VARCHAR; width of the table-name expression result, or 1
//     when no such expression exists),
//   - group id (UBIGINT, 8 bytes),
//   - one column per tag expression.
// Only the column descriptions are set up here; no column data is allocated.
// Returns NULL with terrno = TSDB_CODE_OUT_OF_MEMORY if an allocation fails.
SSDataBlock* buildCreateTableBlock(SExprSupp* tbName, SExprSupp* tag) {
  SSDataBlock* pBlock = taosMemoryCalloc(1, sizeof(SSDataBlock));
  if (pBlock == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pBlock->info.hasVarCol = false;
  pBlock->info.id.groupId = 0;
  pBlock->info.rows = 0;
  pBlock->info.type = STREAM_CREATE_CHILD_TABLE;
  pBlock->info.watermark = INT64_MIN;

  pBlock->pDataBlock = taosArrayInit(4, sizeof(SColumnInfoData));
  if (pBlock->pDataBlock == NULL) {
    taosMemoryFree(pBlock);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // sub table name
  SColumnInfoData infoData = {0};
  infoData.info.type = TSDB_DATA_TYPE_VARCHAR;
  if (tbName->numOfExprs > 0) {
    infoData.info.bytes = tbName->pExprInfo->base.resSchema.bytes;
  } else {
    infoData.info.bytes = 1;
  }
  pBlock->info.rowSize += infoData.info.bytes;
  taosArrayPush(pBlock->pDataBlock, &infoData);

  // group id
  SColumnInfoData gpIdData = {0};
  gpIdData.info.type = TSDB_DATA_TYPE_UBIGINT;
  gpIdData.info.bytes = 8;
  pBlock->info.rowSize += gpIdData.info.bytes;
  taosArrayPush(pBlock->pDataBlock, &gpIdData);

  // tag info
  for (int32_t i = 0; i < tag->numOfExprs; i++) {
    SColumnInfoData tagCol = {0};
    tagCol.info.type = tag->pExprInfo[i].base.resSchema.type;
    tagCol.info.bytes = tag->pExprInfo[i].base.resSchema.bytes;
    tagCol.info.precision = tag->pExprInfo[i].base.resSchema.precision;
    taosArrayPush(pBlock->pDataBlock, &tagCol);
    pBlock->info.rowSize += tagCol.info.bytes;
  }

  return pBlock;
}

L
liuyao 已提交
1218 1219 1220 1221 1222
// Free callback for entries of the partition hash table: releases the row-id list
// of the SPartitionDataInfo stored at ptr.
void freePartItem(void* ptr) {
  taosArrayDestroy(((SPartitionDataInfo*)ptr)->rowIds);
}

1223 1224
// Create the stream "partition by" operator.
//   downstream - the single input operator; when it is a stream scan it is also
//                given the partition settings (see initParDownStream)
//   pPartNode  - physical plan node (partition keys, optional scalar expressions,
//                optional sub-table name expression and tag expressions, targets)
//   pTaskInfo  - owning task; pTaskInfo->code receives the error code on failure
// Returns the new operator, or NULL on failure after releasing everything that
// was allocated here.
SOperatorInfo* createStreamPartitionOperatorInfo(SOperatorInfo* downstream, SStreamPartitionPhysiNode* pPartNode,
                                                 SExecTaskInfo* pTaskInfo) {
  int32_t                       code = TSDB_CODE_SUCCESS;
  SStreamPartitionOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SStreamPartitionOperatorInfo));
  SOperatorInfo*                pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
  if (pInfo == NULL || pOperator == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pInfo->partitionSup.pGroupCols = extractPartitionColInfo(pPartNode->part.pPartitionKeys);

  // optional scalar expressions evaluated on every input block before partitioning
  if (pPartNode->part.pExprs != NULL) {
    int32_t    num = 0;
    SExprInfo* pCalExprInfo = createExprInfo(pPartNode->part.pExprs, NULL, &num);
    code = initExprSupp(&pInfo->scalarSup, pCalExprInfo, num);
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
  }

  // optional expression that computes the sub-table name of a partition
  pInfo->tbnameCalSup.numOfExprs = 0;
  if (pPartNode->pSubtable != NULL) {
    SExprInfo* pSubTableExpr = taosMemoryCalloc(1, sizeof(SExprInfo));
    if (pSubTableExpr == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }
    // attached right away so the error path releases it together with pInfo
    pInfo->tbnameCalSup.pExprInfo = pSubTableExpr;
    createExprFromOneNode(pSubTableExpr, pPartNode->pSubtable, 0);
    code = initExprSupp(&pInfo->tbnameCalSup, pSubTableExpr, 1);
    if (code != TSDB_CODE_SUCCESS) {
      goto _error;
    }
  }

  // optional expressions that compute the tag values of a partition
  pInfo->tagCalSup.numOfExprs = 0;
  if (pPartNode->pTags != NULL) {
    int32_t    numOfTags = 0;
    SExprInfo* pTagExpr = createExpr(pPartNode->pTags, &numOfTags);
    if (pTagExpr == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }
    if (initExprSupp(&pInfo->tagCalSup, pTagExpr, numOfTags) != 0) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }
  }

  if (pInfo->tbnameCalSup.numOfExprs != 0 || pInfo->tagCalSup.numOfExprs != 0) {
    pInfo->pCreateTbRes = buildCreateTableBlock(&pInfo->tbnameCalSup, &pInfo->tagCalSup);
    if (pInfo->pCreateTbRes == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _error;
    }
  } else {
    pInfo->pCreateTbRes = NULL;
  }

  int32_t keyLen = 0;
  code = initGroupOptrInfo(&pInfo->partitionSup.pGroupColVals, &keyLen, &pInfo->partitionSup.keyBuf,
                           pInfo->partitionSup.pGroupCols);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }
  pInfo->partitionSup.needCalc = true;

  pInfo->binfo.pRes = createDataBlockFromDescNode(pPartNode->part.node.pOutputDataBlockDesc);
  if (pInfo->binfo.pRes == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  blockDataEnsureCapacity(pInfo->binfo.pRes, 4096);

  pInfo->parIte = NULL;
  pInfo->pTbNameIte = NULL;
  pInfo->pInputDataBlock = NULL;

  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
  pInfo->pPartitions = taosHashInit(1024, hashFn, false, HASH_NO_LOCK);
  if (pInfo->pPartitions == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }
  taosHashSetFreeFp(pInfo->pPartitions, freePartItem);

  pInfo->tsColIndex = 0;
  pInfo->pDelRes = createSpecialDataBlock(STREAM_DELETE_RESULT);
  if (pInfo->pDelRes == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  int32_t    numOfCols = 0;
  SExprInfo* pExprInfo = createExprInfo(pPartNode->part.pTargets, NULL, &numOfCols);

  setOperatorInfo(pOperator, "StreamPartitionOperator", QUERY_NODE_PHYSICAL_PLAN_STREAM_PARTITION, false, OP_NOT_OPENED,
                  pInfo, pTaskInfo);
  pOperator->exprSupp.numOfExprs = numOfCols;
  pOperator->exprSupp.pExprInfo = pExprInfo;
  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, doStreamHashPartition, NULL,
                                         destroyStreamPartitionOperatorInfo, optrDefaultBufFn, NULL);

  code = appendDownstream(pOperator, &downstream, 1);
  if (code != TSDB_CODE_SUCCESS) {
    goto _error;
  }

  // Done last: the downstream scan keeps pointers into pInfo, so it is only wired
  // up once nothing can fail (and pInfo can no longer be destroyed) in here.
  initParDownStream(downstream, &pInfo->partitionSup, &pInfo->scalarSup);
  return pOperator;

_error:
  pTaskInfo->code = code;
  if (pInfo != NULL) {
    destroyStreamPartitionOperatorInfo(pInfo);
  }
  if (pOperator != NULL) {
    // releases the target expressions if they were already attached; a no-op on
    // the still zero-initialized supporter otherwise
    cleanupExprSupp(&pOperator->exprSupp);
  }
  taosMemoryFreeClear(pOperator);
  return NULL;
}
H
Haojun Liao 已提交
1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353 1354 1355 1356 1357

// Build an SArray<SColumn> describing the targets in pNodeList.
// Targets whose expression is a column node or a value node contribute one entry
// each; targets of any other expression kind are skipped.
// Returns NULL with terrno = TSDB_CODE_OUT_OF_MEMORY if the array cannot be
// allocated. The caller owns the returned array.
SArray* extractColumnInfo(SNodeList* pNodeList) {
  int32_t numOfCols = LIST_LENGTH(pNodeList);
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
  if (pList == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  for (int32_t i = 0; i < numOfCols; ++i) {
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);

    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;

      SColumn c = extractColumnFromColumnNode(pColNode);
      taosArrayPush(pList, &c);
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
      SColumn     c = {0};
      // a constant has no column of its own; the target slot doubles as column id
      c.slotId = pNode->slotId;
      c.colId = pNode->slotId;
      // The data type comes from the result type, like bytes/scale/precision below.
      // NOTE(review): node.type (used here before) appears to be the node-kind tag
      // rather than a data type - confirm against the node header.
      c.type = pValNode->node.resType.type;
      c.bytes = pValNode->node.resType.bytes;
      c.scale = pValNode->node.resType.scale;
      c.precision = pValNode->node.resType.precision;

      taosArrayPush(pList, &c);
    }
  }

  return pList;
}