executorimpl.h 31.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
H
Hongze Cheng 已提交
15
// clang-format off
16 17 18
#ifndef TDENGINE_EXECUTORIMPL_H
#define TDENGINE_EXECUTORIMPL_H

19 20 21 22
#ifdef __cplusplus
extern "C" {
#endif

23
#include "os.h"
S
common  
Shengliang Guan 已提交
24
#include "tcommon.h"
25
#include "tlosertree.h"
dengyihao's avatar
dengyihao 已提交
26
#include "tsort.h"
27 28 29
#include "ttszip.h"
#include "tvariant.h"

H
Haojun Liao 已提交
30
#include "dataSinkMgt.h"
31
#include "executil.h"
H
Haojun Liao 已提交
32
#include "executor.h"
H
Haojun Liao 已提交
33
#include "planner.h"
D
dapan1121 已提交
34
#include "scalar.h"
35 36
#include "taosdef.h"
#include "tarray.h"
H
Haojun Liao 已提交
37
#include "thash.h"
38
#include "tlockfree.h"
D
dapan1121 已提交
39
#include "tmsg.h"
dengyihao's avatar
dengyihao 已提交
40
#include "tpagedbuf.h"
5
54liuyao 已提交
41
#include "tstreamUpdate.h"
H
Haojun Liao 已提交
42

H
Hongze Cheng 已提交
43
#include "vnode.h"
44
#include "executorInt.h"
H
Hongze Cheng 已提交
45

46 47
// Signature of a block search routine: takes a raw data buffer, an element count,
// a 64-bit key and an order value, and returns an int32_t.
// NOTE(review): the meaning of the return value (index vs. status) is not visible here - confirm.
typedef int32_t (*__block_search_fn_t)(char* data, int32_t num, int64_t key, int32_t order);

dengyihao's avatar
dengyihao 已提交
48 49
// True when the `code` field of the object pointed to by _q equals TSDB_CODE_TSC_QUERY_CANCELLED.
#define IS_QUERY_KILLED(_q)   (TSDB_CODE_TSC_QUERY_CANCELLED == (_q)->code)
// Non-zero when p and s share at least one set bit (a bit-overlap test, not strict equality).
#define Q_STATUS_EQUAL(p, s)  (0u != ((p) & (s)))
50 51
#define QUERY_IS_ASC_QUERY(q) (GET_FORWARD_DIRECTION_FACTOR((q)->order.order) == QUERY_ASC_FORWARD_STEP)

52
#define GET_TABLEGROUP(q, _index) ((SArray*)taosArrayGetP((q)->tableqinfoGroupInfo.pGroupList, (_index)))
53

54
// Evaluates to 1 when `size` is strictly greater than the global tsCompressColData, otherwise 0.
#define NEEDTO_COMPRESS_QUERY(size) ((size) > tsCompressColData ? 1 : 0)
55 56

// Task execution status flags; each enumerator occupies a distinct bit.
enum {
  // when this task starts to execute, this status will be set
  TASK_NOT_COMPLETED = 0x1u,

  /* Task is over
   * 1. this status is used in one-row result query processing, e.g., count/sum/first/last/avg, etc.
   * 2. for all data within the queried time window, it is also denoted as query_completed
   */
  TASK_COMPLETED = 0x2u,

  /* the result has not been completely returned to the client; this status is
   * usually used in case of an interval query with the interpolation option
   */
  TASK_OVER = 0x4u,
};

typedef struct SResultRowCell {
dengyihao's avatar
dengyihao 已提交
73
  uint64_t           groupId;
H
Haojun Liao 已提交
74
  SResultRowPosition pos;
75 76 77 78 79 80
} SResultRowCell;

/**
 * If the number of generated results is greater than this value,
 * the query will be halted and the results returned to the client immediately.
 */
dengyihao's avatar
dengyihao 已提交
81 82 83 84 85
// Bookkeeping for the size of generated results and the output buffer limits.
typedef struct SResultInfo {  // TODO refactor
  int64_t totalRows;          // total generated result size in rows
  int64_t totalBytes;         // total results in bytes.
  int32_t capacity;           // capacity of current result output buffer
  int32_t threshold;          // result size threshold in rows.
} SResultInfo;
87 88

typedef struct STableQueryInfo {
89 90
  TSKEY              lastKey;     // last check ts, todo remove it later
  SResultRowPosition pos;       // current active time window
91
//  SVariant       tag;
92 93 94 95 96 97 98 99 100 101
} STableQueryInfo;

// Kinds of profiling events that can be recorded for a query.
typedef enum {
  QUERY_PROF_BEFORE_OPERATOR_EXEC = 0,
  QUERY_PROF_AFTER_OPERATOR_EXEC  = 1,
  QUERY_PROF_QUERY_ABORT          = 2
} EQueryProfEventType;

// One profiling event: its type, its time, and an event-specific payload.
typedef struct {
  EQueryProfEventType eventType;
  int64_t             eventTime;

  // Anonymous union: only the member matching eventType is meaningful.
  union {
    uint8_t operatorType;  // for operator event
    int32_t abortCode;     // for query abort event
  };
} SQueryProfEvent;

// Accumulated profiling figures for one operator type.
// NOTE(review): presumably the value type stored in STaskCostInfo.operatorProfResults - confirm.
typedef struct {
  uint8_t operatorType;
  int64_t sumSelfTime;
  int64_t sumRunTimes;
} SOperatorProfResult;

H
Haojun Liao 已提交
116 117 118 119 120
// A limit/offset pair, both stored as signed 64-bit values.
typedef struct SLimit {
  int64_t limit;
  int64_t offset;
} SLimit;

121 122 123 124 125 126 127 128 129 130 131
// Counters kept while reading file blocks (rows, blocks by outcome, elapsed time).
// NOTE(review): the unit of elapsedTime is not visible in this header - confirm.
typedef struct SFileBlockLoadRecorder {
  uint64_t totalRows;
  uint64_t totalCheckedRows;
  uint32_t totalBlocks;
  uint32_t loadBlocks;
  uint32_t loadBlockStatis;
  uint32_t skipBlocks;
  uint32_t filterOutBlocks;
  uint64_t elapsedTime;
} SFileBlockLoadRecorder;

H
Haojun Liao 已提交
132
typedef struct STaskCostInfo {
133 134 135 136 137 138 139 140 141 142 143 144
  int64_t created;
  int64_t start;
  int64_t end;

  uint64_t loadStatisTime;
  uint64_t loadFileBlockTime;
  uint64_t loadDataInCacheTime;
  uint64_t loadStatisSize;
  uint64_t loadFileBlockSize;
  uint64_t loadDataInCacheSize;

  uint64_t loadDataTime;
145 146

  SFileBlockLoadRecorder* pRecoder;
147
  uint64_t elapsedTime;
148

149 150 151 152 153 154 155 156
  uint64_t firstStageMergeTime;
  uint64_t winInfoSize;
  uint64_t tableInfoSize;
  uint64_t hashSize;
  uint64_t numOfTimeWindows;

  SArray*   queryProfEvents;      // SArray<SQueryProfEvent>
  SHashObj* operatorProfResults;  // map<operator_type, SQueryProfEvent>
H
Haojun Liao 已提交
157
} STaskCostInfo;
158

H
Haojun Liao 已提交
159 160
// Cost counters kept per operator.
// NOTE(review): units are not visible in this header - confirm.
typedef struct SOperatorCostInfo {
  uint64_t openCost;
  uint64_t totalCost;
} SOperatorCostInfo;

164 165
// The basic query information extracted from the SQueryInfo tree to support the
// execution of query in a data node.
H
Haojun Liao 已提交
166
typedef struct STaskAttr {
dengyihao's avatar
dengyihao 已提交
167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187
  SLimit      limit;
  SLimit      slimit;
  bool        stableQuery;        // super table query or not
  bool        topBotQuery;        // TODO used bitwise flag
  bool        groupbyColumn;      // denote if this is a groupby normal column query
  bool        timeWindowInterpo;  // if the time window start/end required interpolation
  bool        tsCompQuery;        // is tscomp query
  bool        diffQuery;          // is diff query
  bool        pointInterpQuery;   // point interpolation query
  int32_t     havingNum;          // having expr number
  int16_t     numOfCols;
  int16_t     numOfTags;
  STimeWindow window;
  SInterval   interval;
  int16_t     precision;
  int16_t     numOfOutput;
  int16_t     fillType;
  int32_t     resultRowSize;
  int32_t     tagLen;  // tag value length of current query

  SExprInfo*      pExpr1;
188 189 190
  SColumnInfo*    tagColList;
  int32_t         numOfFilterCols;
  int64_t*        fillVal;
191 192 193
  void*           tsdb;
  STableGroupInfo tableGroupInfo;  // table <tid, last_key> list  SArray<STableKeyInfo>
  int32_t         vgId;
H
Haojun Liao 已提交
194
} STaskAttr;
195 196

struct SOperatorInfo;
197 198
struct SAggSupporter;
struct SOptrBasicInfo;
199

dengyihao's avatar
dengyihao 已提交
200 201 202 203
// Encode callback: receives the operator, its aggregate supporter and basic info, and
// reports a buffer and its length through the `result` / `length` out-parameters.
// NOTE(review): ownership of *result is not visible here - confirm who frees it.
typedef void (*__optr_encode_fn_t)(struct SOperatorInfo* pOperator, struct SAggSupporter* pSup,
                                   struct SOptrBasicInfo* pInfo, char** result, int32_t* length);
// Decode callback: receives the same context plus a buffer of `length` bytes and returns a bool.
// NOTE(review): presumably true means success - confirm.
typedef bool (*__optr_decode_fn_t)(struct SOperatorInfo* pOperator, struct SAggSupporter* pSup,
                                   struct SOptrBasicInfo* pInfo, char* result, int32_t length);
204

205
typedef int32_t (*__optr_open_fn_t)(struct SOperatorInfo* pOptr);
206
typedef SSDataBlock* (*__optr_fn_t)(struct SOperatorInfo* pOptr);
H
Haojun Liao 已提交
207
typedef void (*__optr_close_fn_t)(void* param, int32_t num);
dengyihao's avatar
dengyihao 已提交
208
typedef int32_t (*__optr_get_explain_fn_t)(struct SOperatorInfo* pOptr, void** pOptrExplain);
H
Haojun Liao 已提交
209

H
Haojun Liao 已提交
210
// Identifiers attached to a task.
typedef struct STaskIdInfo {
  uint64_t queryId;  // this is also a request id
  uint64_t subplanId;
  uint64_t templateId;
  char*    str;
} STaskIdInfo;

217
typedef struct SExecTaskInfo {
dengyihao's avatar
dengyihao 已提交
218 219 220 221 222 223 224 225 226 227 228
  STaskIdInfo      id;
  uint32_t         status;
  STimeWindow      window;
  STaskCostInfo    cost;
  int64_t          owner;  // if it is in execution
  int32_t          code;
  uint64_t         totalRows;            // total number of rows
  STableGroupInfo  tableqinfoGroupInfo;  // this is a group array list, including SArray<STableQueryInfo*> structure
  char*            sql;                  // query sql string
  jmp_buf          env;                  // jump to this position when error happens.
  EOPTR_EXEC_MODEL execModel;            // operator execution model [batch model|stream model]
229
  struct SOperatorInfo* pRoot;
230
} SExecTaskInfo;
H
Haojun Liao 已提交
231

H
Haojun Liao 已提交
232
typedef struct STaskRuntimeEnv {
H
Haojun Liao 已提交
233 234 235 236 237 238 239 240
  STaskAttr*      pQueryAttr;
  uint32_t        status;  // query status
  uint8_t         scanFlag;  // denotes reversed scan of data or not
  SDiskbasedBuf*  pResultBuf;           // query result buffer based on blocked-wised disk file
  SHashObj*       pResultRowHashTable;  // quick locate the window object for each result
  SHashObj*       pResultRowListSet;    // used to check if current ResultRowInfo has ResultRow object or not
  SArray*         pResultRowArrayList;  // The array list that contains the Result rows
  char*           keyBuf;               // window key buffer
H
Haojun Liao 已提交
241
  // The window result objects pool, all the resultRow Objects are allocated and managed by this object.
dengyihao's avatar
dengyihao 已提交
242 243 244
  char**    prevRow;
  STSBuf*   pTsBuf;      // timestamp filter list
  STSCursor cur;
245

dengyihao's avatar
dengyihao 已提交
246
  char*                          tagVal;  // tag value of current data block
247 248
  STableGroupInfo tableqinfoGroupInfo;  // this is a group array list, including SArray<STableQueryInfo*> structure
  struct SOperatorInfo* proot;
dengyihao's avatar
dengyihao 已提交
249 250
  SGroupResInfo         groupResInfo;
  int64_t               currentOffset;  // dynamic offset value
251

252
  STableQueryInfo* current;
253
  SResultInfo      resultInfo;
254
  struct SUdfInfo* pUdfInfo;
H
Haojun Liao 已提交
255
} STaskRuntimeEnv;
256 257

// Operator status values. OP_RES_TO_RETURN and OP_EXEC_DONE both contain the
// OP_OPENED bit, so OPTR_IS_OPENED() also holds for them.
enum {
  OP_NOT_OPENED = 0x0,
  OP_OPENED = 0x1,
  OP_RES_TO_RETURN = 0x5,  // 0x4 | OP_OPENED
  OP_EXEC_DONE = 0x9,      // 0x8 | OP_OPENED
};

264 265 266 267 268 269 270 271 272 273 274
// The set of callbacks that implements one operator.
typedef struct SOperatorFpSet {
  __optr_open_fn_t        _openFn;          // DO NOT invoke this function directly
  __optr_fn_t             getNextFn;
  __optr_fn_t             getStreamResFn;  // execute the aggregate in the stream model, todo remove it
  __optr_fn_t             cleanupFn;       // call this function to release the allocated resources ASAP
  __optr_close_fn_t       closeFn;
  __optr_encode_fn_t      encodeResultRow;
  __optr_decode_fn_t      decodeResultRow;
  __optr_get_explain_fn_t getExplainFn;
} SOperatorFpSet;

275
typedef struct SOperatorInfo {
D
dapan1121 已提交
276
  uint8_t                 operatorType;
277
  bool                    blocking;      // block operator or not
D
dapan1121 已提交
278
  uint8_t                 status;        // denote if current operator is completed
279
  int32_t                 numOfExprs;   // number of columns of the current operator results
D
dapan1121 已提交
280 281 282 283 284 285 286 287
  char*                   name;          // name, used to show the query execution plan
  void*                   info;          // extension attribution
  SExprInfo*              pExpr;
  SExecTaskInfo*          pTaskInfo;
  SOperatorCostInfo       cost;
  SResultInfo             resultInfo;
  struct SOperatorInfo**  pDownstream;      // downstram pointer list
  int32_t                 numOfDownstream;  // number of downstream. The value is always ONE expect for join operator
288
  SOperatorFpSet          fpSet;
289 290 291 292 293
} SOperatorInfo;

typedef struct {
  int32_t      numOfTags;
  int32_t      numOfCols;
294
  SColumnInfo* colList;
295 296
} SQueriedTableInfo;

297 298
// State of one exchange data source. The values are sequential (1, 2, 3), not bit flags.
typedef enum {
  EX_SOURCE_DATA_NOT_READY = 0x1,
  EX_SOURCE_DATA_READY     = 0x2,
  EX_SOURCE_DATA_EXHAUSTED = 0x3,
} EX_SOURCE_STATUS;
302 303

typedef struct SSourceDataInfo {
dengyihao's avatar
dengyihao 已提交
304
  struct SExchangeInfo* pEx;
305
  int32_t               index;
dengyihao's avatar
dengyihao 已提交
306
  SRetrieveTableRsp*    pRsp;
307
  uint64_t              totalRows;
H
Haojun Liao 已提交
308
  int32_t               code;
309
  EX_SOURCE_STATUS      status;
310 311
} SSourceDataInfo;

H
Haojun Liao 已提交
312
// Totals accumulated while loading data from remote nodes.
typedef struct SLoadRemoteDataInfo {
  uint64_t totalSize;     // total load bytes from remote
  uint64_t totalRows;     // total number of rows
  uint64_t totalElapsed;  // total elapsed time
} SLoadRemoteDataInfo;

318
typedef struct SExchangeInfo {
dengyihao's avatar
dengyihao 已提交
319 320 321 322 323 324 325
  SArray*             pSources;
  SArray*             pSourceDataInfo;
  tsem_t              ready;
  void*               pTransporter;
  SSDataBlock*        pResult;
  bool                seqLoadData;  // sequential load data or not, false by default
  int32_t             current;
H
Haojun Liao 已提交
326
  SLoadRemoteDataInfo loadInfo;
327 328
} SExchangeInfo;

329 330 331
// Values for SColMatchInfo.matchType: pick the source column by column id or by slot id.
#define COL_MATCH_FROM_COL_ID  0x1
#define COL_MATCH_FROM_SLOT_ID 0x2

H
Haojun Liao 已提交
332
// Describes how one source column maps to a target slot.
typedef struct SColMatchInfo {
  int32_t srcSlotId;     // source slot id
  int32_t colId;
  int32_t targetSlotId;
  bool    output;
  int32_t matchType;     // determinate the source according to col id or slot id
} SColMatchInfo;

340 341 342 343 344
// A pair of scan counters.
// NOTE(review): presumably the number of ascending and descending scans - confirm.
typedef struct SScanInfo {
  int32_t numOfAsc;
  int32_t numOfDesc;
} SScanInfo;

345
typedef struct STableScanInfo {
H
Haojun Liao 已提交
346
  void*           dataReader;
347
  SFileBlockLoadRecorder readRecorder;
348
  int64_t         numOfRows;
349
  int64_t         elapsedTime;
350
//  int32_t         prevGroupId;  // previous table group id
351
  SScanInfo       scanInfo;
352 353 354
  int32_t         scanTimes;
  SNode*          pFilterNode;  // filter info, which is push down by optimizer
  SqlFunctionCtx* pCtx;         // which belongs to the direct upstream operator operator query context
355 356 357
  SResultRowInfo* pResultRowInfo;
  int32_t*        rowCellInfoOffset;
  SExprInfo*      pExpr;
358
  SSDataBlock*    pResBlock;
H
Haojun Liao 已提交
359
  SArray*         pColMatchInfo;
360
  int32_t         numOfOutput;
361

362
  SQueryTableDataCond cond;
363
  int32_t         scanFlag;     // table scan flag to denote if it is a repeat/reverse/main scan
364
  int32_t         dataBlockLoadFlag;
365
  double          sampleRatio;  // data block sample ratio, 1 by default
366
  SInterval       interval;     // if the upstream is an interval operator, the interval info is also kept here to get the time window to check if current data block needs to be loaded.
367 368 369
} STableScanInfo;

typedef struct STagScanInfo {
370 371 372 373 374 375
  SColumnInfo     *pCols;
  SSDataBlock     *pRes;
  SArray          *pColMatchInfo;
  int32_t          curPos;
  SReadHandle      readHandle;
  STableGroupInfo *pTableGroups;
376 377
} STagScanInfo;

H
Haojun Liao 已提交
378
typedef struct SStreamBlockScanInfo {
dengyihao's avatar
dengyihao 已提交
379 380 381 382 383 384 385 386 387
  SArray*      pBlockLists;      // multiple SSDatablock.
  SSDataBlock* pRes;             // result SSDataBlock
  int32_t      blockType;        // current block type
  int32_t      validBlockIndex;  // Is current data has returned?
  SColumnInfo* pCols;            // the output column info
  uint64_t     numOfRows;        // total scanned rows
  uint64_t     numOfExec;        // execution times
  void*        readerHandle;     // stream block reader handle
  SArray*      pColMatchInfo;    //
5
54liuyao 已提交
388
  SNode*       pCondition;
5
54liuyao 已提交
389 390 391
  SArray*      tsArray;
  SUpdateInfo*  pUpdateInfo;
  int32_t      primaryTsIndex;    // primary time stamp slot id
H
Haojun Liao 已提交
392 393
} SStreamBlockScanInfo;

394
typedef struct SSysTableScanInfo {
395
  SReadHandle readHandle;
396

dengyihao's avatar
dengyihao 已提交
397 398 399 400
  SRetrieveMetaTableRsp* pRsp;
  SRetrieveTableReq      req;
  SEpSet                 epSet;
  tsem_t                 ready;
H
Haojun Liao 已提交
401

H
Haojun Liao 已提交
402 403 404
  int32_t             accountId;
  bool                showRewrite;
  SNode*              pCondition;  // db_name filter condition, to discard data that are not in current database
H
Hongze Cheng 已提交
405
  SMTbCursor*         pCur;        // cursor for iterate the local table meta store.
H
Haojun Liao 已提交
406
  SArray*             scanCols;    // SArray<int16_t> scan column id list
H
Haojun Liao 已提交
407
  SName               name;
dengyihao's avatar
dengyihao 已提交
408
  SSDataBlock*        pRes;
H
Haojun Liao 已提交
409
  int64_t             numOfBlocks;  // extract basic running information.
H
Haojun Liao 已提交
410
  SLoadRemoteDataInfo loadInfo;
411 412
} SSysTableScanInfo;

413
typedef struct SOptrBasicInfo {
dengyihao's avatar
dengyihao 已提交
414 415 416 417
  SResultRowInfo  resultRowInfo;
  int32_t*        rowCellInfoOffset;  // offset value for each row result cell info
  SqlFunctionCtx* pCtx;
  SSDataBlock*    pRes;
418 419
} SOptrBasicInfo;

dengyihao's avatar
dengyihao 已提交
420
// TODO move resultRowSize together with SOptrBasicInfo::rowCellInfoOffset
421
typedef struct SAggSupporter {
dengyihao's avatar
dengyihao 已提交
422 423 424
  SHashObj*      pResultRowHashTable;  // quick locate the window object for each result
  char*          keyBuf;               // window key buffer
  SDiskbasedBuf* pResultBuf;           // query result buffer based on blocked-wised disk file
425
  int32_t        resultRowSize;        // the result buffer size for each result row, with the meta data size for each row
426 427
} SAggSupporter;

428 429 430
typedef struct STimeWindowSupp {
  int8_t           calTrigger;
  int64_t          waterMark;
dengyihao's avatar
dengyihao 已提交
431
  SColumnInfoData  timeWindowData;     // query time window info for scalar function execution.
432 433
} STimeWindowAggSupp;

434
typedef struct SIntervalAggOperatorInfo {
435 436 437 438 439 440 441 442 443 444 445 446 447
  SOptrBasicInfo     binfo;              // basic info
  SGroupResInfo      groupResInfo;       // multiple results build supporter
  SInterval          interval;           // interval info
  int32_t            primaryTsIndex;     // primary time stamp slot id from result of downstream operator.
  STimeWindow        win;                // query time range
  bool               timeWindowInterpo;  // interpolation needed or not
  char**             pRow;               // previous row/tuple of already processed datablock
  SAggSupporter      aggSup;             // aggregate supporter
  STableQueryInfo*   pCurrent;           // current tableQueryInfo struct
  int32_t            order;              // current SSDataBlock scan order
  EOPTR_EXEC_MODEL   execModel;          // operator execution model [batch model|stream model]
  SArray*            pUpdatedWindow;     // updated time window due to the input data block from the downstream operator.
  STimeWindowAggSupp twAggSup;
448
  struct SFillInfo*  pFillInfo;          // fill info
5
54liuyao 已提交
449
  bool               invertible;
450
} SIntervalAggOperatorInfo;
451 452

typedef struct SAggOperatorInfo {
H
Haojun Liao 已提交
453 454 455
  SOptrBasicInfo     binfo;
  SAggSupporter      aggSup;
  STableQueryInfo   *current;
H
Haojun Liao 已提交
456
  uint64_t           groupId;
H
Haojun Liao 已提交
457 458
  SGroupResInfo      groupResInfo;
  STableQueryInfo   *pTableQueryInfo;
459 460 461 462 463

  SExprInfo         *pScalarExprInfo;
  int32_t            numOfScalarExpr;      // the number of scalar expression before the aggregate function can be applied
  SqlFunctionCtx    *pScalarCtx;                 // scalar function requried sql function struct.
  int32_t           *rowCellInfoOffset;  // offset value for each row result cell info
464 465 466
} SAggOperatorInfo;

typedef struct SProjectOperatorInfo {
467 468 469 470 471 472 473 474 475 476 477 478 479
  SOptrBasicInfo     binfo;
  SAggSupporter      aggSup;
  SSDataBlock*       existDataBlock;
  SArray*            pPseudoColInfo;
  SLimit             limit;
  SLimit             slimit;

  uint64_t           groupId;
  int64_t            curSOffset;
  int64_t            curGroupOutput;

  int64_t            curOffset;
  int64_t            curOutput;
480 481 482
} SProjectOperatorInfo;

typedef struct SFillOperatorInfo {
483 484 485 486 487 488
  struct SFillInfo* pFillInfo;
  SSDataBlock*      pRes;
  int64_t           totalInputRows;
  void**            p;
  SSDataBlock*      existNewGroupBlock;
  bool              multigroupResult;
489 490 491
} SFillOperatorInfo;

typedef struct SGroupbyOperatorInfo {
dengyihao's avatar
dengyihao 已提交
492
  SOptrBasicInfo  binfo;
493
  SArray*         pGroupCols;     // group by columns, SArray<SColumn>
dengyihao's avatar
dengyihao 已提交
494 495 496 497 498 499 500 501 502 503
  SArray*         pGroupColVals;  // current group column values, SArray<SGroupKeys>
  SNode*          pCondition;
  bool            isInit;       // denote if current val is initialized or not
  char*           keyBuf;       // group by keys for hash
  int32_t         groupKeyLen;  // total group by column width
  SGroupResInfo   groupResInfo;
  SAggSupporter   aggSup;
  SExprInfo*      pScalarExprInfo;
  int32_t         numOfScalarExpr;  // the number of scalar expression in group operator
  SqlFunctionCtx* pScalarFuncCtx;
504
  int32_t*        rowCellInfoOffset;  // offset value for each row result cell info
505 506
} SGroupbyOperatorInfo;

H
Haojun Liao 已提交
507
typedef struct SDataGroupInfo {
508 509 510
  uint64_t        groupId;
  int64_t         numOfRows;
  SArray*         pPageList;
H
Haojun Liao 已提交
511 512 513 514
} SDataGroupInfo;

// The sort in partition may be needed later.
typedef struct SPartitionOperatorInfo {
dengyihao's avatar
dengyihao 已提交
515 516 517 518 519 520 521 522 523 524
  SOptrBasicInfo binfo;
  SArray*        pGroupCols;
  SArray*        pGroupColVals;  // current group column values, SArray<SGroupKeys>
  char*          keyBuf;         // group by keys for hash
  int32_t        groupKeyLen;    // total group by column width
  SHashObj*      pGroupSet;      // quick locate the window object for each result

  SDiskbasedBuf* pBuf;          // query result buffer based on blocked-wised disk file
  int32_t        rowCapacity;   // maximum number of rows for each buffer page
  int32_t*       columnOffset;  // start position for each column data
525 526
  void*          pGroupIter;  // group iterator
  int32_t        pageIndex;   // page index of current group
H
Haojun Liao 已提交
527
} SPartitionOperatorInfo;
528

529
typedef struct SWindowRowsSup {
dengyihao's avatar
dengyihao 已提交
530 531 532 533
  STimeWindow win;
  TSKEY       prevTs;
  int32_t     startRowIndex;
  int32_t     numOfRows;
534 535
} SWindowRowsSup;

H
Haojun Liao 已提交
536
typedef struct SSessionAggOperatorInfo {
537 538 539 540 541 542
  SOptrBasicInfo     binfo;
  SAggSupporter      aggSup;
  SGroupResInfo      groupResInfo;
  SWindowRowsSup     winSup;
  bool               reptScan;        // next round scan
  int64_t            gap;             // session window gap
543
  int32_t            tsSlotId;        // primary timestamp slot id
544
  STimeWindowAggSupp twAggSup;
H
Haojun Liao 已提交
545
} SSessionAggOperatorInfo;
546

547
typedef struct STimeSliceOperatorInfo {
dengyihao's avatar
dengyihao 已提交
548 549 550
  SOptrBasicInfo binfo;
  SInterval      interval;
  SGroupResInfo  groupResInfo;  // multiple results build supporter
551 552
} STimeSliceOperatorInfo;

553
typedef struct SStateWindowOperatorInfo {
554 555 556 557 558 559 560
  SOptrBasicInfo     binfo;
  SAggSupporter      aggSup;
  SGroupResInfo      groupResInfo;
  SWindowRowsSup     winSup;
  int32_t            colIndex;  // start row index
  bool               hasKey;
  SStateKeys         stateKey;
561
  int32_t            tsSlotId;  // primary timestamp column slot id
562
  STimeWindowAggSupp twAggSup;
dengyihao's avatar
dengyihao 已提交
563
  //  bool             reptScan;
564 565
} SStateWindowOperatorInfo;

566
typedef struct SSortedMergeOperatorInfo {
567

568 569 570 571 572 573 574 575 576 577 578 579 580
  SOptrBasicInfo   binfo;
  SArray*          pSortInfo;
  int32_t          numOfSources;
  SSortHandle     *pSortHandle;
  int32_t          bufPageSize;
  uint32_t         sortBufSize;  // max buffer size for in-memory sort
  int32_t          resultRowFactor;
  bool             hasGroupVal;
  SDiskbasedBuf   *pTupleStore;  // keep the final results
  int32_t          numOfResPerPage;
  char**           groupVal;
  SArray          *groupInfo;
  SAggSupporter    aggSup;
581
} SSortedMergeOperatorInfo;
H
Haojun Liao 已提交
582

H
Haojun Liao 已提交
583
typedef struct SSortOperatorInfo {
584
  SOptrBasicInfo binfo;
dengyihao's avatar
dengyihao 已提交
585 586 587
  uint32_t     sortBufSize;  // max buffer size for in-memory sort
  SArray*      pSortInfo;
  SSortHandle* pSortHandle;
588
  SArray*      pColMatchInfo;  // for index map from table scan output
dengyihao's avatar
dengyihao 已提交
589
  int32_t      bufPageSize;
H
Haojun Liao 已提交
590

H
Haojun Liao 已提交
591
  // TODO extact struct
dengyihao's avatar
dengyihao 已提交
592 593 594 595 596
  int64_t  startTs;       // sort start time
  uint64_t sortElapsed;   // sort elapsed time, time to flush to disk not included.
  uint64_t totalSize;     // total load bytes from remote
  uint64_t totalRows;     // total number of rows
  uint64_t totalElapsed;  // total elapsed time
H
Haojun Liao 已提交
597
} SSortOperatorInfo;
598

dengyihao's avatar
dengyihao 已提交
599 600 601
// State of a tag filter operator; currently holds only the basic operator info.
typedef struct STagFilterOperatorInfo {
  SOptrBasicInfo binfo;
} STagFilterOperatorInfo;
602

603 604 605 606 607 608 609 610 611 612 613 614 615 616
// State of a join operator: the result block, and for each of the left and
// right inputs a data block, a position and a column descriptor.
typedef struct SJoinOperatorInfo {
  SSDataBlock       *pRes;
  int32_t            joinType;

  SSDataBlock       *pLeft;
  int32_t            leftPos;
  SColumnInfo        leftCol;

  SSDataBlock       *pRight;
  int32_t            rightPos;
  SColumnInfo        rightCol;
  SNode             *pOnCondition;
} SJoinOperatorInfo;

617 618 619
// True when the OP_OPENED bit is set in the operator's status.
#define OPTR_IS_OPENED(_optr)  (OP_OPENED == ((_optr)->status & OP_OPENED))
// Sets the OP_OPENED bit in the operator's status, leaving the other bits untouched.
#define OPTR_SET_OPENED(_optr) ((_optr)->status |= OP_OPENED)

620 621 622 623
// Returns an SOperatorFpSet by value, built from the given callbacks.
// NOTE(review): the parameters follow the member order of SOperatorFpSet, so they
// presumably map one-to-one onto its fields - confirm against the definition.
SOperatorFpSet createOperatorFpSet(__optr_open_fn_t openFn, __optr_fn_t nextFn, __optr_fn_t streamFn,
    __optr_fn_t cleanup, __optr_close_fn_t closeFn, __optr_encode_fn_t encode,
    __optr_decode_fn_t decode, __optr_get_explain_fn_t explain);

H
Haojun Liao 已提交
624
int32_t operatorDummyOpenFn(SOperatorInfo* pOperator);
dengyihao's avatar
dengyihao 已提交
625
void    operatorDummyCloseFn(void* param, int32_t numOfCols);
H
Haojun Liao 已提交
626 627
int32_t appendDownstream(SOperatorInfo* p, SOperatorInfo** pDownstream, int32_t num);
int32_t initAggInfo(SOptrBasicInfo* pBasicInfo, SAggSupporter* pAggSup, SExprInfo* pExprInfo, int32_t numOfCols,
628 629
                    SSDataBlock* pResultBlock, size_t keyBufSize, const char* pkey);
void    initResultSizeInfo(SOperatorInfo* pOperator, int32_t numOfRows);
630 631
void doBuildResultDatablock(SOptrBasicInfo *pbInfo, SGroupResInfo* pGroupResInfo, SExprInfo* pExprInfo, SDiskbasedBuf* pBuf);

dengyihao's avatar
dengyihao 已提交
632 633 634 635 636 637 638 639 640 641
void    finalizeMultiTupleQueryResult(SqlFunctionCtx* pCtx, int32_t numOfOutput, SDiskbasedBuf* pBuf,
                                      SResultRowInfo* pResultRowInfo, int32_t* rowCellInfoOffset);
void    doApplyFunctions(SqlFunctionCtx* pCtx, STimeWindow* pWin, SColumnInfoData* pTimeWindowData, int32_t offset,
                         int32_t forwardStep, TSKEY* tsCol, int32_t numOfTotal, int32_t numOfOutput, int32_t order);
int32_t setGroupResultOutputBuf(SOptrBasicInfo* binfo, int32_t numOfCols, char* pData, int16_t type, int16_t bytes,
                                int32_t groupId, SDiskbasedBuf* pBuf, SExecTaskInfo* pTaskInfo, SAggSupporter* pAggSup);
void    doDestroyBasicInfo(SOptrBasicInfo* pInfo, int32_t numOfOutput);
int32_t setSDataBlockFromFetchRsp(SSDataBlock* pRes, SLoadRemoteDataInfo* pLoadInfo, int32_t numOfRows, char* pData,
                                  int32_t compLen, int32_t numOfOutput, int64_t startTs, uint64_t* total,
                                  SArray* pColList);
642
void    getAlignQueryTimeWindow(SInterval* pInterval, int32_t precision, int64_t key, STimeWindow* win);
643
int32_t getTableScanOrder(SOperatorInfo* pOperator);
644

dengyihao's avatar
dengyihao 已提交
645 646
void    doSetOperatorCompleted(SOperatorInfo* pOperator);
void    doFilter(const SNode* pFilterNode, SSDataBlock* pBlock);
647
SqlFunctionCtx* createSqlFunctionCtx(SExprInfo* pExprInfo, int32_t numOfOutput, int32_t** rowCellInfoOffset);
648
void    relocateColumnData(SSDataBlock* pBlock, const SArray* pColMatchInfo, SArray* pCols);
649 650
void    initExecTimeWindowInfo(SColumnInfoData* pColData, STimeWindow* pQueryWindow);
void    cleanupAggSup(SAggSupporter* pAggSup);
651 652 653
void    destroyBasicOperatorInfo(void* param, int32_t numOfOutput);
void    appendOneRowToDataBlock(SSDataBlock* pBlock, STupleHandle* pTupleHandle);

654
SSDataBlock* getSortedBlockData(SSortHandle* pHandle, SSDataBlock* pDataBlock, int32_t capacity, SArray* pColMatchInfo);
655
SSDataBlock* loadNextDataBlock(void* param);
656

657
// Prototype only. NOTE(review): presumably points the numOfOutput contexts in pCtx at the
// cells of pResult using rowCellInfoOffset -- inferred from parameter names; confirm.
void setResultRowInitCtx(SResultRow* pResult, SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t* rowCellInfoOffset);
// Prototype only. Returns an SResultRow pointer.
// NOTE(review): presumably looks up or creates the result row keyed by (pData, bytes,
// groupId); NULL-on-failure behaviour is not visible here -- confirm.
SResultRow* doSetResultOutBufByKey(SDiskbasedBuf* pResultBuf, SResultRowInfo* pResultRowInfo,
                                   char* pData, int16_t bytes, bool masterscan, uint64_t groupId,
                                   SExecTaskInfo* pTaskInfo, bool isIntervalQuery, SAggSupporter* pSup);
// Prototype only. Returns an SOperatorInfo pointer; pDataReader is an untyped void*.
// NOTE(review): presumably constructs a table-scan operator; ownership of the result and
// the failure return value are not visible here -- confirm.
SOperatorInfo* createTableScanOperatorInfo(void* pDataReader, SQueryTableDataCond* pCond, int32_t numOfOutput, int32_t dataLoadFlag, const uint8_t* scanInfo,
                                           SArray* pColMatchInfo, SSDataBlock* pResBlock, SNode* pCondition, SInterval* pInterval, double sampleRatio, SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an SOperatorInfo pointer.
// NOTE(review): presumably constructs an aggregate operator on top of `downstream`;
// ownership and failure behaviour are not visible here -- confirm.
SOperatorInfo* createAggregateOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols, SSDataBlock* pResultBlock, SExprInfo* pScalarExprInfo,
                                           int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo, const STableGroupInfo* pTableGroupInfo);
// Prototype only. Returns an SOperatorInfo pointer.
// NOTE(review): presumably constructs a projection operator with the given limit and
// slimit settings -- inferred from the name; confirm.
SOperatorInfo* createProjectOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t num, SSDataBlock* pResBlock, SLimit* pLimit, SLimit* pSlimit, SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an SOperatorInfo pointer.
// NOTE(review): presumably constructs a sort operator ordered by pSortInfo -- confirm.
SOperatorInfo *createSortOperatorInfo(SOperatorInfo* downstream, SSDataBlock* pResBlock, SArray* pSortInfo, SExprInfo* pExprInfo, int32_t numOfCols,
                                      SArray* pIndexMap, SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an SOperatorInfo pointer; `downstream` is an SOperatorInfo**
// accompanied by numOfDownstream.
// NOTE(review): presumably constructs an operator merging several sorted inputs -- confirm.
SOperatorInfo* createSortedMergeOperatorInfo(SOperatorInfo** downstream, int32_t numOfDownstream, SExprInfo* pExprInfo, int32_t num, SArray* pSortInfo, SArray* pGroupInfo, SExecTaskInfo* pTaskInfo);
SOperatorInfo* createSysTableScanOperatorInfo(void* pSysTableReadHandle, SSDataBlock* pResBlock, const SName* pName,
dengyihao's avatar
dengyihao 已提交
676 677 678
                                              SNode* pCondition, SEpSet epset, SArray* colList,
                                              SExecTaskInfo* pTaskInfo, bool showRewrite, int32_t accountId);
SOperatorInfo* createIntervalOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
679
                                          SSDataBlock* pResBlock, SInterval* pInterval, int32_t primaryTsSlotId,
680
                                          STimeWindowAggSupp *pTwAggSupp, const STableGroupInfo* pTableGroupInfo, SExecTaskInfo* pTaskInfo);
681
SOperatorInfo* createStreamIntervalOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
682

683 684
                                                SSDataBlock* pResBlock, SInterval* pInterval, int32_t primaryTsSlotId,
                                                STimeWindowAggSupp *pTwAggSupp, const STableGroupInfo* pTableGroupInfo, SExecTaskInfo* pTaskInfo);
dengyihao's avatar
dengyihao 已提交
685
SOperatorInfo* createSessionAggOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
686 687
                                            SSDataBlock* pResBlock, int64_t gap, int32_t tsSlotId, STimeWindowAggSupp* pTwAggSupp,
                                            SExecTaskInfo* pTaskInfo);
dengyihao's avatar
dengyihao 已提交
688 689 690 691
// Prototype only. Returns an SOperatorInfo pointer.
// NOTE(review): presumably constructs a group-by operator over the columns in
// pGroupColList -- inferred from parameter names; confirm.
SOperatorInfo* createGroupOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
                                       SSDataBlock* pResultBlock, SArray* pGroupColList, SNode* pCondition,
                                       SExprInfo* pScalarExprInfo, int32_t numOfScalarExpr, SExecTaskInfo* pTaskInfo,
                                       const STableGroupInfo* pTableGroupInfo);
// Prototype only. Returns an SOperatorInfo pointer; dataReader is an untyped void*.
// NOTE(review): presumably constructs an operator that scans data-block metadata -- confirm.
SOperatorInfo* createDataBlockInfoScanOperator(void* dataReader, SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an SOperatorInfo pointer; streamReadHandle is an untyped void*.
// NOTE(review): presumably constructs a scan operator for stream input restricted to
// pTableIdList and filtered by pConditions -- inferred from parameter names; confirm.
SOperatorInfo* createStreamScanOperatorInfo(void* streamReadHandle, SSDataBlock* pResBlock, SArray* pColList,
                                            SArray* pTableIdList, SExecTaskInfo* pTaskInfo, SNode* pConditions);
SOperatorInfo* createFillOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExpr, int32_t numOfCols,
697
                                      SInterval* pInterval, STimeWindow* pWindow, SSDataBlock* pResBlock, int32_t fillType, SNodeListNode* fillVal,
dengyihao's avatar
dengyihao 已提交
698 699
                                      bool multigroupResult, SExecTaskInfo* pTaskInfo);
SOperatorInfo* createStatewindowOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExpr, int32_t numOfCols,
700
                                             SSDataBlock* pResBlock, STimeWindowAggSupp *pTwAggSupp, int32_t tsSlotId, SExecTaskInfo* pTaskInfo);
H
Haojun Liao 已提交
701

dengyihao's avatar
dengyihao 已提交
702 703 704
// Prototype only. Returns an SOperatorInfo pointer.
// NOTE(review): presumably constructs a partition operator over the columns in
// pGroupColList -- inferred from parameter names; confirm.
SOperatorInfo* createPartitionOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
                                           SSDataBlock* pResultBlock, SArray* pGroupColList, SExecTaskInfo* pTaskInfo,
                                           const STableGroupInfo* pTableGroupInfo);
// Prototype only. Returns an SOperatorInfo pointer.
// NOTE(review): presumably constructs a time-slice operator -- confirm against the definition.
SOperatorInfo* createTimeSliceOperatorInfo(SOperatorInfo* downstream, SExprInfo* pExprInfo, int32_t numOfCols,
                                           SSDataBlock* pResultBlock, SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an SOperatorInfo pointer; pDownstream is an SOperatorInfo**
// accompanied by numOfDownstream.
// NOTE(review): presumably constructs a merge-join operator with join condition
// pOnCondition -- inferred from the name; confirm.
SOperatorInfo* createMergeJoinOperatorInfo(SOperatorInfo** pDownstream, int32_t numOfDownstream, SExprInfo* pExprInfo, int32_t numOfCols, SSDataBlock* pResBlock, SNode* pOnCondition, SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an SOperatorInfo pointer. Unlike several sibling factories,
// pTableGroupInfo is not const-qualified here.
// NOTE(review): presumably constructs an operator that scans tag values -- confirm.
SOperatorInfo* createTagScanOperatorInfo(SReadHandle* pReadHandle, SExprInfo* pExpr, int32_t numOfOutput, SSDataBlock* pResBlock, SArray* pColMatchInfo, STableGroupInfo* pTableGroupInfo, SExecTaskInfo* pTaskInfo);
// Disabled declarations: the #if 0 guard excludes them from compilation.
// NOTE(review): both take STaskRuntimeEnv*, which no enabled prototype in this part of
// the header uses -- they look like leftovers; confirm before re-enabling or deleting.
#if 0
SOperatorInfo* createTableSeqScanOperatorInfo(void* pTsdbReadHandle, STaskRuntimeEnv* pRuntimeEnv);
SOperatorInfo* createMultiTableTimeIntervalOperatorInfo(STaskRuntimeEnv* pRuntimeEnv, SOperatorInfo* downstream,
                                                        SExprInfo* pExpr, int32_t numOfOutput);
#endif
// Prototype only. Returns an int32_t; the meaning of the value is not visible from here.
// NOTE(review): presumably evaluates the numOfOutput expressions in pExpr/pCtx over
// pSrcBlock and writes into pResult -- inferred from parameter names; confirm.
int32_t projectApplyFunctions(SExprInfo* pExpr, SSDataBlock* pResult, SSDataBlock* pSrcBlock, SqlFunctionCtx* pCtx,
                              int32_t numOfOutput, SArray* pPseudoList);
// Prototype only. NOTE(review): presumably binds pBlock as the input of the function
// contexts in pCtx for pOperator; the effect of createDummyCol is not visible here -- confirm.
void setInputDataBlock(SOperatorInfo* pOperator, SqlFunctionCtx* pCtx, SSDataBlock* pBlock, int32_t order, bool createDummyCol);
// Prototype only. NOTE(review): "Coloum" is presumably a misspelling of "Column"; the
// name is part of the public interface and is kept as-is. Presumably copies the
// timestamp column into pRes -- confirm against the definition.
void copyTsColoum(SSDataBlock* pRes, SqlFunctionCtx* pCtx, int32_t numOfOutput);
// Prototype only. Returns an STableQueryInfo pointer; `win` is passed by value and `buf`
// is an untyped void*.
// NOTE(review): whether the result is placed inside `buf` or separately allocated is not
// visible here -- confirm ownership against the definition.
STableQueryInfo* createTableQueryInfo(void* buf, STimeWindow win);
// Prototype only. Returns bool.
// NOTE(review): presumably true when pTaskInfo has been marked as killed -- confirm.
bool    isTaskKilled(SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an int32_t; the meaning of the value is not visible from here.
// NOTE(review): presumably checks whether buffer capacity is available for numOfTables
// tables -- inferred from the name; confirm.
int32_t checkForQueryBuf(size_t numOfTables);
// Prototype only. NOTE(review): presumably marks pTaskInfo as killed -- confirm.
void setTaskKilled(SExecTaskInfo* pTaskInfo);
// Prototype only. NOTE(review): presumably records a profiling event of kind eventType
// for operatorInfo -- inferred from the name; confirm.
void publishOperatorProfEvent(SOperatorInfo* operatorInfo, EQueryProfEventType eventType);
// Prototype only. NOTE(review): presumably records that the task aborted with `code` --
// inferred from the name; confirm.
void publishQueryAbortEvent(SExecTaskInfo* pTaskInfo, int32_t code);
// Prototype only. NOTE(review): presumably reports or collects cost statistics for
// pTaskInfo -- inferred from the name; confirm.
void queryCostStatis(SExecTaskInfo* pTaskInfo);
// Prototype only. NOTE(review): presumably tears down pTaskInfo; whether the struct itself
// is freed is not visible here -- confirm.
void    doDestroyTask(SExecTaskInfo* pTaskInfo);
// Prototype only. Returns an int32_t; by its name the value is a duration in seconds
// (NOTE(review): confirm unit and meaning against the definition).
// Declared with (void): in C an empty () leaves the parameters unspecified, so calls
// passing arguments would not be diagnosed. (void) is also valid in C++.
int32_t getMaximumIdleDurationSec(void);
// File-scope forward declaration of the tag. If the tag were first introduced inside the
// parameter list below, it would be scoped to that prototype only and be incompatible
// with any later `struct SUdfInfo`. Redundant but harmless when a prior declaration exists.
struct SUdfInfo;
// Prototype only. NOTE(review): presumably invokes the user-defined function described by
// pUdfInfo for the context at index idx; the valid values of `type` are not visible here.
void    doInvokeUdf(struct SUdfInfo* pUdfInfo, SqlFunctionCtx* pCtx, int32_t idx, int32_t type);
// Prototype only. NOTE(review): presumably stores `status` on pTaskInfo; the valid status
// values are not visible here -- confirm.
void    setTaskStatus(SExecTaskInfo* pTaskInfo, int8_t status);
// Prototype only. Returns an int32_t; pTaskInfo is an SExecTaskInfo**.
// NOTE(review): presumably builds a task from pPlan and stores it in *pTaskInfo, returning
// a status code -- ownership and error values must be confirmed against the definition.
int32_t createExecTaskInfoImpl(SSubplan* pPlan, SExecTaskInfo** pTaskInfo, SReadHandle* pHandle, uint64_t taskId,
                               EOPTR_EXEC_MODEL model);
// Prototype only. Returns an int32_t; pRes, capacity and resNum are all passed by pointer.
// NOTE(review): presumably fills (and possibly grows) the *pRes array with explain info
// for operatorInfo, updating *capacity and *resNum -- confirm against the definition.
int32_t getOperatorExplainExecInfo(SOperatorInfo* operatorInfo, SExplainExecInfo** pRes, int32_t* capacity,
                                   int32_t* resNum);

// Prototype only. Returns bool; `result` is a char* with an accompanying `length`.
// NOTE(review): presumably restores aggregate state from a `length`-byte buffer, with the
// return value signalling success -- confirm against the definition.
bool aggDecodeResultRow(SOperatorInfo* pOperator, SAggSupporter* pSup, SOptrBasicInfo* pInfo, char* result,
                        int32_t length);
// Prototype only. `result` is a char** and `length` an int32_t*.
// NOTE(review): presumably serializes aggregate state into a buffer returned through
// *result with its size in *length; who frees the buffer is not visible here -- confirm.
void aggEncodeResultRow(SOperatorInfo* pOperator, SAggSupporter* pSup, SOptrBasicInfo* pInfo, char** result,
                        int32_t* length);
// Closes the extern "C" block opened near the top of this header (C++ builds only).
#ifdef __cplusplus
}
#endif

#endif  // TDENGINE_EXECUTORIMPL_H