qExecutor.h 15.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
H
Haojun Liao 已提交
15 16
#ifndef TDENGINE_QEXECUTOR_H
#define TDENGINE_QEXECUTOR_H
17 18 19 20

#include "os.h"

#include "hash.h"
H
Haojun Liao 已提交
21
#include "qAggMain.h"
H
Haojun Liao 已提交
22 23
#include "qFill.h"
#include "qResultbuf.h"
24
#include "qSqlparser.h"
H
Haojun Liao 已提交
25
#include "qTsbuf.h"
26
#include "query.h"
27
#include "taosdef.h"
H
Haojun Liao 已提交
28
#include "tarray.h"
B
Bomin Zhang 已提交
29
#include "tlockfree.h"
H
Haojun Liao 已提交
30
#include "tsdb.h"
31 32

struct SColumnFilterElem;

/*
 * Signature of a column filter callback. A pointer of this type is stored in
 * SColumnFilterElem.fp. The callback receives the filter element, two value
 * buffers and a type code, and returns a bool.
 * NOTE(review): the exact meaning of val1/val2 and of the return value is
 * defined by the implementations, which are not visible in this header.
 */
typedef bool (*__filter_func_t)(struct SColumnFilterElem* pFilter, const char* val1, const char* val2, int16_t type);

/*
 * Signature of a block search routine taking a data buffer, an element count,
 * a 64-bit key and an order flag, and returning an int32_t.
 * NOTE(review): presumably returns a position inside `data` -- confirm against
 * the implementations.
 */
typedef int32_t (*__block_search_fn_t)(char* data, int32_t num, int64_t key, int32_t order);
35

H
Haojun Liao 已提交
36 37 38 39 40 41
/* True when the `code` member of the pointed-to object equals TSDB_CODE_TSC_QUERY_CANCELLED. */
#define IS_QUERY_KILLED(_qi) ((_qi)->code == TSDB_CODE_TSC_QUERY_CANCELLED)

/* True when `st` and `mask` share at least one set bit (a bit test, not a strict equality test). */
#define Q_STATUS_EQUAL(st, mask) (((st) & (mask)) != 0u)

/* True when the forward direction factor of the query's order equals QUERY_ASC_FORWARD_STEP. */
#define QUERY_IS_ASC_QUERY(_qry) (GET_FORWARD_DIRECTION_FACTOR((_qry)->order.order) == QUERY_ASC_FORWARD_STEP)

/* Fetches entry `_idx` of tableqinfoGroupInfo.pGroupList via taosArrayGetP, cast to SArray*. */
#define GET_TABLEGROUP(_env, _idx) ((SArray*) taosArrayGetP((_env)->tableqinfoGroupInfo.pGroupList, (_idx)))

H
Haojun Liao 已提交
42 43
/* Yields 0 when (_r)->outputBuf is NULL, otherwise (_r)->outputBuf->info.rows. The argument is evaluated twice. */
#define GET_NUM_OF_RESULTS(_r) ((NULL == (_r)->outputBuf) ? 0 : (_r)->outputBuf->info.rows)

H
Haojun Liao 已提交
44 45 46 47 48 49 50 51
/* Query status flags. Each value occupies a distinct bit. */
enum {
  // set when the query starts to execute
  QUERY_NOT_COMPLETED = 0x1u,

  /* The query is over.
   * 1. This status is used in one-row result queries, e.g. count/sum/first/last/avg, etc.
   * 2. It is also set when all data within the queried time window has been processed.
   */
  QUERY_COMPLETED = 0x2u,

  /* The result has not yet been completely returned to the client. This status
   * is usually used for interval queries with the interpolation option.
   */
  QUERY_OVER = 0x4u,
};

H
Haojun Liao 已提交
60
typedef struct SResultRowPool {
61 62 63 64 65 66 67 68 69 70
  int32_t elemSize;
  int32_t blockSize;
  int32_t numOfElemPerBlock;

  struct {
    int32_t blockIndex;
    int32_t pos;
  } position;

  SArray* pData;    // SArray<void*>
H
Haojun Liao 已提交
71
} SResultRowPool;
72

73
typedef struct SSqlGroupbyExpr {
H
Haojun Liao 已提交
74 75 76 77 78
  int16_t tableIndex;
  SArray* columnInfo;  // SArray<SColIndex>, group by columns information
  int16_t numOfGroupCols;
  int16_t orderIndex;  // order by column index
  int16_t orderType;   // order by type: asc/desc
79 80
} SSqlGroupbyExpr;

H
Haojun Liao 已提交
81
typedef struct SResultRow {
82
  int32_t       pageId;      // pageId & rowId is the position of current result in disk-based output buffer
H
Haojun Liao 已提交
83
  int32_t       offset:29;    // row index in buffer page
84 85 86 87
  bool          startInterp; // the time window start timestamp has done the interpolation already.
  bool          endInterp;   // the time window end timestamp has done the interpolation already.
  bool          closed;      // this result status: closed or opened
  uint32_t      numOfRows;   // number of rows of current time window
H
Haojun Liao 已提交
88
  SResultRowCellInfo*  pCellInfo;  // For each result column, there is a resultInfo
D
dapan1121 已提交
89 90
  STimeWindow win; 
  char* key;                 // start key of current result row
H
Haojun Liao 已提交
91
} SResultRow;
92

93
typedef struct SGroupResInfo {
H
Haojun Liao 已提交
94 95
  int32_t totalGroup;
  int32_t currentGroup;
96 97 98 99
  int32_t index;
  SArray* pRows;      // SArray<SResultRow*>
} SGroupResInfo;

H
Haojun Liao 已提交
100 101 102 103
/**
 * Bookkeeping for the result rows produced for one response.
 *
 * If the number of generated results is greater than `threshold`, the query
 * is halted and the results are returned to the client immediately.
 */
typedef struct SRspResultInfo {
  int64_t total;      // total generated result size in rows
  int32_t capacity;   // capacity of current result output buffer
  int32_t threshold;  // result size threshold in rows.
} SRspResultInfo;
109

H
Haojun Liao 已提交
110
typedef struct SResultRowInfo {
H
Haojun Liao 已提交
111 112 113 114 115 116
  SResultRow** pResult;    // result list
  int16_t      type:8;     // data type for hash key
  int32_t      size:24;    // number of result set
  int32_t      capacity;   // max capacity
  int32_t      curIndex;   // current start active index
  int64_t      prevSKey;   // previous (not completed) sliding window start key
H
Haojun Liao 已提交
117
} SResultRowInfo;
118 119 120 121 122 123 124 125

/* One filter on a column: the filter description together with the callback that evaluates it. */
typedef struct SColumnFilterElem {
  int16_t           bytes;  // column length
  __filter_func_t   fp;     // filter callback, see __filter_func_t
  SColumnFilterInfo filterInfo;
} SColumnFilterElem;

typedef struct SSingleColumnFilterInfo {
H
Haojun Liao 已提交
126
  void*              pData;
127
  int32_t            numOfFilters;
H
Haojun Liao 已提交
128
  SColumnInfo        info;
129 130 131
  SColumnFilterElem* pFilters;
} SSingleColumnFilterInfo;

H
Haojun Liao 已提交
132
typedef struct STableQueryInfo {
H
hjxilinx 已提交
133
  TSKEY       lastKey;
H
Haojun Liao 已提交
134
  int32_t     groupIndex;     // group id in table list
135
  tVariant    tag;
H
hjxilinx 已提交
136
  STimeWindow win;
137
  STSCursor   cur;
H
Haojun Liao 已提交
138
  void*       pTable;         // for retrieve the page id list
H
Haojun Liao 已提交
139
  SResultRowInfo resInfo;
140 141
} STableQueryInfo;

H
Haojun Liao 已提交
142 143 144 145 146 147 148 149 150
/*
 * Cost counters collected for one query (embedded as SQInfo.summary).
 * NOTE(review): units of the *Time and *Size counters are not stated in this
 * header -- confirm against the code that updates them.
 */
typedef struct SQueryCostInfo {
  uint64_t loadStatisTime;
  uint64_t loadFileBlockTime;
  uint64_t loadDataInCacheTime;
  uint64_t loadStatisSize;
  uint64_t loadFileBlockSize;
  uint64_t loadDataInCacheSize;

  uint64_t loadDataTime;
  uint64_t totalRows;
  uint64_t totalCheckedRows;
  uint32_t totalBlocks;
  uint32_t loadBlocks;
  uint32_t loadBlockStatis;
  uint32_t discardBlocks;
  uint64_t elapsedTime;
  uint64_t firstStageMergeTime;
  uint64_t winInfoSize;
  uint64_t tableInfoSize;
  uint64_t hashSize;
  uint64_t numOfTimeWindows;
} SQueryCostInfo;
H
hjxilinx 已提交
164

H
Haojun Liao 已提交
165 166 167 168 169
/*
 * Extra state for ordered projection queries. SQuery.prjInfo describes it as
 * the limit value for each vgroup, only available in global order projection
 * queries.
 */
typedef struct {
  int64_t vgroupLimit;
  int64_t ts;
} SOrderedPrjQueryInfo;

170 171 172 173 174
/* One intermediate result entry; SQueryRuntimeEnv.prevResult is an SArray of these. */
typedef struct {
  char*   tags;
  SArray* pResult;  // SArray<SStddevInterResult>
} SInterResult;

H
Haojun Liao 已提交
175 176 177 178 179 180
/*
 * A block of data passed between operators: this is the type returned by
 * __operator_fn_t callbacks.
 * NOTE(review): the element type of pDataBlock is not stated in this header.
 */
typedef struct SSDataBlock {
  SDataStatis *pBlockStatis;
  SArray      *pDataBlock;
  SDataBlockInfo info;
} SSDataBlock;

181
typedef struct SQuery {
H
Haojun Liao 已提交
182 183
  SLimitVal        limit;

H
Haojun Liao 已提交
184 185 186 187 188 189 190 191
  bool             stableQuery;      // super table query or not
  bool             topBotQuery;      // TODO used bitwise flag
  bool             groupbyColumn;    // denote if this is a groupby normal column query
  bool             hasTagResults;    // if there are tag values in final result or not
  bool             timeWindowInterpo;// if the time window start/end required interpolation
  bool             queryBlockDist;    // if query data block distribution
  bool             stabledev;        // super table stddev query
  int32_t          interBufSize;     // intermediate buffer sizse
H
Haojun Liao 已提交
192

D
dapan1121 已提交
193 194
  int32_t          havingNum;        // having expr number

H
Haojun Liao 已提交
195
  SOrderVal        order;
H
Haojun Liao 已提交
196 197
  int16_t          numOfCols;
  int16_t          numOfTags;
H
Haojun Liao 已提交
198

H
Haojun Liao 已提交
199
  STimeWindow      window;
200
  SInterval        interval;
201
  SSessionWindow   sw;
202
  int16_t          precision;
H
Haojun Liao 已提交
203 204
  int16_t          numOfOutput;
  int16_t          fillType;
205 206 207 208
  int16_t          checkResultBuf;   // check if the buffer is full during scan each block

  int32_t          srcRowSize;       // todo extract struct
  int32_t          resultRowSize;
H
Haojun Liao 已提交
209
  int32_t          intermediateResultRowSize; // intermediate result row size, in case of top-k query.
210 211
  int32_t          maxSrcColumnSize;
  int32_t          tagLen;           // tag value length of current query
H
Haojun Liao 已提交
212
  SSqlGroupbyExpr* pGroupbyExpr;
H
Haojun Liao 已提交
213
  SExprInfo*       pExpr1;
H
Haojun Liao 已提交
214 215
  SExprInfo*       pExpr2;
  int32_t          numOfExpr2;
H
Haojun Liao 已提交
216 217 218 219
  SColumnInfo*     colList;
  SColumnInfo*     tagColList;
  int32_t          numOfFilterCols;
  int64_t*         fillVal;
220
  SOrderedPrjQueryInfo prjInfo;        // limit value for each vgroup, only available in global order projection query.
221
  SSingleColumnFilterInfo* pFilterInfo;
H
Haojun Liao 已提交
222

H
Haojun Liao 已提交
223
  STableQueryInfo* current;
H
Haojun Liao 已提交
224 225
  void*            tsdb;
  SMemRef          memRef;
H
Haojun Liao 已提交
226
  STableGroupInfo  tableGroupInfo;       // table <tid, last_key> list  SArray<STableKeyInfo>
H
Haojun Liao 已提交
227
  int32_t          vgId;
228 229
} SQuery;

H
Haojun Liao 已提交
230
/* Operator execution callback (stored in SOperatorInfo.exec): takes an opaque parameter and returns a data block pointer. */
typedef SSDataBlock* (*__operator_fn_t)(void* param);

/*
 * Operator cleanup callback (stored in SOperatorInfo.cleanup).
 * NOTE(review): the meaning of `num` is not visible in this header.
 */
typedef void (*__optr_cleanup_fn_t)(void* param, int32_t num);

struct SOperatorInfo;
H
Haojun Liao 已提交
234

235
typedef struct SQueryRuntimeEnv {
H
Haojun Liao 已提交
236 237
  jmp_buf               env;
  SQuery*               pQuery;
H
Haojun Liao 已提交
238
  uint32_t              status;           // query status
H
Haojun Liao 已提交
239
  void*                 qinfo;
H
Haojun Liao 已提交
240
  uint8_t               scanFlag;         // denotes reversed scan of data or not
H
Haojun Liao 已提交
241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258
  void*                 pQueryHandle;

  int32_t               prevGroupId;      // previous executed group id
  SDiskbasedResultBuf*  pResultBuf;       // query result buffer based on blocked-wised disk file
  SHashObj*             pResultRowHashTable; // quick locate the window object for each result
  char*                 keyBuf;           // window key buffer
  SResultRowPool*       pool;             // window result object pool
  char**                prevRow;

  SArray*               prevResult;       // intermediate result, SArray<SInterResult>
  STSBuf*               pTsBuf;           // timestamp filter list
  STSCursor             cur;

  char*                 tagVal;           // tag value of current data block
  SArithmeticSupport   *sasArray;

  SSDataBlock          *outputBuf;
  STableGroupInfo       tableqinfoGroupInfo;  // this is a group array list, including SArray<STableQueryInfo*> structure
H
Haojun Liao 已提交
259 260 261 262
  struct SOperatorInfo *proot;
  struct SOperatorInfo *pTableScanner;   // table scan operator
  SGroupResInfo         groupResInfo;
  int64_t               currentOffset;   // dynamic offset value
H
Haojun Liao 已提交
263

H
Haojun Liao 已提交
264
  SRspResultInfo        resultInfo;
H
Haojun Liao 已提交
265
  SHashObj             *pTableRetrieveTsMap;
266 267
} SQueryRuntimeEnv;

H
Haojun Liao 已提交
268 269 270 271 272 273
/*
 * Operator execution states.
 * NOTE(review): presumably the values stored in SOperatorInfo.status -- confirm.
 */
enum {
  OP_IN_EXECUTING   = 1,
  OP_RES_TO_RETURN  = 2,
  OP_EXEC_DONE      = 3,
};

H
Haojun Liao 已提交
274 275 276 277 278
/*
 * Identifiers for the kinds of query operators.
 * NOTE(review): presumably the values stored in SOperatorInfo.operatorType -- confirm.
 */
enum OPERATOR_TYPE_E {
  OP_TableScan         = 1,
  OP_DataBlocksOptScan = 2,
  OP_TableSeqScan      = 3,
  OP_TagScan           = 4,
  OP_TableBlockInfoScan= 5,
  OP_Aggregate         = 6,
  OP_Arithmetic        = 7,
  OP_Groupby           = 8,
  OP_Limit             = 9,
  OP_Offset            = 10,
  OP_TimeWindow        = 11,
  OP_SessionWindow     = 12,
  OP_Fill              = 13,
  OP_MultiTableAggregate     = 14,
  OP_MultiTableTimeInterval  = 15,
  OP_Having            = 16,
};

H
Haojun Liao 已提交
293
typedef struct SOperatorInfo {
H
Haojun Liao 已提交
294 295 296 297 298 299 300 301
  uint8_t               operatorType;
  bool                  blockingOptr;  // block operator or not
  uint8_t               status;        // denote if current operator is completed
  int32_t               numOfOutput;   // number of columns of the current operator results
  char                 *name;          // name, used to show the query execution plan
  void                 *info;          // extension attribution
  SExprInfo            *pExpr;
  SQueryRuntimeEnv     *pRuntimeEnv;
H
Haojun Liao 已提交
302

H
Haojun Liao 已提交
303
  struct SOperatorInfo *upstream;
H
Haojun Liao 已提交
304
  __operator_fn_t       exec;
H
Haojun Liao 已提交
305
  __optr_cleanup_fn_t   cleanup;
H
Haojun Liao 已提交
306 307
} SOperatorInfo;

308 309 310 311 312
/*
 * Readiness of a query result.
 * NOTE(review): presumably the values stored in SQInfo.dataReady -- confirm.
 */
enum {
  QUERY_RESULT_NOT_READY = 1,
  QUERY_RESULT_READY     = 2,
};

313
typedef struct SQInfo {
H
Haojun Liao 已提交
314
  void*            signature;
D
fix bug  
dapan1121 已提交
315
  uint64_t         qId;
H
Haojun Liao 已提交
316 317
  int32_t          code;        // error code to returned to client
  int64_t          owner;       // if it is in execution
H
Haojun Liao 已提交
318

319
  SQueryRuntimeEnv runtimeEnv;
H
Haojun Liao 已提交
320
  SQuery           query;
321
  void*            pBuf;        // allocated buffer for STableQueryInfo, sizeof(STableQueryInfo)*numOfTables;
H
Haojun Liao 已提交
322

323
  pthread_mutex_t  lock;        // used to synchronize the rsp/query threads
H
Haojun Liao 已提交
324
  tsem_t           ready;
325 326
  int32_t          dataReady;   // denote if query result is ready or not
  void*            rspContext;  // response context
327
  int64_t          startExecTs; // start to exec timestamp
328
  char*            sql;         // query sql string
H
Haojun Liao 已提交
329
  SQueryCostInfo   summary;
330 331
} SQInfo;

H
Haojun Liao 已提交
332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347
/*
 * Bundle of query parameters passed to convertQueryMsg(), initQInfo() and
 * freeParam() (see their declarations in this header).
 * NOTE(review): ownership of the pointed-to buffers is not visible here;
 * presumably released by freeParam() -- confirm.
 */
typedef struct SQueryParam {
  char            *sql;
  char            *tagCond;
  char            *tbnameCond;
  char            *prevResult;
  SArray          *pTableIdList;
  SSqlFuncMsg    **pExprMsg;
  SSqlFuncMsg    **pSecExprMsg;
  SExprInfo       *pExprs;
  SExprInfo       *pSecExprs;

  SColIndex       *pGroupColIndex;
  SColumnInfo     *pTagColumnInfo;
  SSqlGroupbyExpr *pGroupbyExpr;
} SQueryParam;

H
Haojun Liao 已提交
348
typedef struct STableScanInfo {
H
Haojun Liao 已提交
349 350 351 352 353 354 355 356 357 358 359 360
  void           *pQueryHandle;
  int32_t         numOfBlocks;
  int32_t         numOfSkipped;
  int32_t         numOfBlockStatis;
  int64_t         numOfRows;
                 
  int32_t         order;        // scan order
  int32_t         times;        // repeat counts
  int32_t         current;
  int32_t         reverseTimes; // 0 by default

  SQLFunctionCtx *pCtx;         // next operator query context
H
Haojun Liao 已提交
361
  SResultRowInfo *pResultRowInfo;
H
Haojun Liao 已提交
362 363
  int32_t        *rowCellInfoOffset;
  SExprInfo      *pExpr;
H
Haojun Liao 已提交
364 365
  SSDataBlock     block;
  bool            loadExternalRows; // load external rows (prev & next rows)
H
Haojun Liao 已提交
366
  int32_t         numOfOutput;
H
Haojun Liao 已提交
367
  int64_t         elapsedTime;
H
Haojun Liao 已提交
368

H
Haojun Liao 已提交
369
  int32_t         tableIndex;
H
Haojun Liao 已提交
370 371
} STableScanInfo;

372 373 374
/*
 * State of a tag scan operator.
 * NOTE(review): totalTables/currentIndex presumably track progress over the
 * table list -- confirm against the operator implementation.
 */
typedef struct STagScanInfo {
  SColumnInfo* pCols;
  SSDataBlock* pRes;
  int32_t      totalTables;
  int32_t      currentIndex;
} STagScanInfo;

H
Haojun Liao 已提交
379
typedef struct SOptrBasicInfo {
H
Haojun Liao 已提交
380
  SResultRowInfo    resultRowInfo;
H
Haojun Liao 已提交
381
  int32_t          *rowCellInfoOffset;  // offset value for each row result cell info
H
Haojun Liao 已提交
382
  SQLFunctionCtx   *pCtx;
H
Haojun Liao 已提交
383
  SSDataBlock      *pRes;
H
Haojun Liao 已提交
384 385
} SOptrBasicInfo;

H
Haojun Liao 已提交
386 387 388 389 390 391
/* STableIntervalOperatorInfo is an alias of struct SOptrBasicInfo; it adds no fields of its own. */
typedef struct SOptrBasicInfo STableIntervalOperatorInfo;

/* State of an aggregate operator: the common operator info plus a seed value. */
typedef struct SAggOperatorInfo {
  SOptrBasicInfo binfo;
  uint32_t       seed;   // NOTE(review): purpose of the seed is not visible in this header
} SAggOperatorInfo;
H
Haojun Liao 已提交
392

H
Haojun Liao 已提交
393
typedef struct SArithOperatorInfo {
H
Haojun Liao 已提交
394 395
  SOptrBasicInfo binfo;
  int32_t        bufCapacity;
H
Haojun Liao 已提交
396
  uint32_t       seed;
H
Haojun Liao 已提交
397 398
} SArithOperatorInfo;

H
Haojun Liao 已提交
399 400 401 402 403 404 405 406 407
/*
 * State of a limit operator.
 * NOTE(review): presumably `total` counts rows emitted so far against `limit` -- confirm.
 */
typedef struct SLimitOperatorInfo {
  int64_t limit;
  int64_t total;
} SLimitOperatorInfo;

/* State of an offset operator: a single 64-bit offset value. */
typedef struct SOffsetOperatorInfo {
  int64_t offset;
} SOffsetOperatorInfo;

D
dapan1121 已提交
408 409 410 411 412
/*
 * State of a having operator.
 * NOTE(review): the element type of `fp` is not stated in this header.
 */
typedef struct SHavingOperatorInfo {  
  SArray* fp;
} SHavingOperatorInfo;


H
Haojun Liao 已提交
413
typedef struct SFillOperatorInfo {
H
Haojun Liao 已提交
414
  SFillInfo   *pFillInfo;
H
Haojun Liao 已提交
415 416
  SSDataBlock *pRes;
  int64_t      totalInputRows;
H
Haojun Liao 已提交
417 418
} SFillOperatorInfo;

H
Haojun Liao 已提交
419 420 421
/* State of a group-by operator: the common operator info, a column index and the previous group-by value. */
typedef struct SGroupbyOperatorInfo {
  SOptrBasicInfo binfo;
  int32_t        colIndex;
  char          *prevData;   // previous group by value
} SGroupbyOperatorInfo;
H
Haojun Liao 已提交
424

425 426 427 428 429 430 431 432
/* State of a session-window operator: the common operator info plus the window currently being accumulated. */
typedef struct SSWindowOperatorInfo {
  SOptrBasicInfo binfo;
  STimeWindow    curWindow;  // current time window
  TSKEY          prevTs;     // previous timestamp
  int32_t        numOfRows;  // number of rows
  int32_t        start;      // start row index
} SSWindowOperatorInfo;

H
Haojun Liao 已提交
433 434 435 436
/*
 * Query message conversion and expression construction. The definitions live
 * outside this header.
 * NOTE(review): the int32_t results are presumably error codes -- confirm
 * against the implementations.
 */
void freeParam(SQueryParam *param);
int32_t convertQueryMsg(SQueryTableMsg *pQueryMsg, SQueryParam* param);
int32_t createQueryFuncExprFromMsg(SQueryTableMsg *pQueryMsg, int32_t numOfOutput, SExprInfo **pExprInfo, SSqlFuncMsg **pExprMsg,
                                   SColumnInfo* pTagCols);
int32_t createIndirectQueryFuncExprFromMsg(SQueryTableMsg *pQueryMsg, int32_t numOfOutput, SExprInfo **pExprInfo,
                                           SSqlFuncMsg **pExprMsg, SExprInfo *prevExpr);

H
Haojun Liao 已提交
440 441
SSqlGroupbyExpr *createGroupbyExprFromMsg(SQueryTableMsg *pQueryMsg, SColIndex *pColIndex, int32_t *code);
SQInfo *createQInfoImpl(SQueryTableMsg *pQueryMsg, SSqlGroupbyExpr *pGroupbyExpr, SExprInfo *pExprs,
D
fix bug  
dapan1121 已提交
442
                        SExprInfo *pSecExprs, STableGroupInfo *pTableGroupInfo, SColumnInfo* pTagCols, bool stableQuery, char* sql, uint64_t *qId);
H
Haojun Liao 已提交
443 444 445 446 447 448
int32_t initQInfo(SQueryTableMsg *pQueryMsg, void *tsdb, int32_t vgId, SQInfo *pQInfo, SQueryParam* param, bool isSTable);
void freeColumnFilterInfo(SColumnFilterInfo* pFilter, int32_t numOfFilters);

bool isQueryKilled(SQInfo *pQInfo);
int32_t checkForQueryBuf(size_t numOfTables);
bool doBuildResCheck(SQInfo* pQInfo);
H
Haojun Liao 已提交
449
void setQueryStatus(SQueryRuntimeEnv *pRuntimeEnv, int8_t status);
H
Haojun Liao 已提交
450 451 452 453 454 455 456 457 458 459 460 461 462

/* Predicates on a query / query handle. Definitions live outside this header. */
bool onlyQueryTags(SQuery* pQuery);
bool isValidQInfo(void *param);

/* NOTE(review): presumably writes the query result into `data` and returns an error code -- confirm. */
int32_t doDumpQueryResult(SQInfo *pQInfo, char *data);

/* Result sizing, kill request, cost reporting and teardown for a query handle. */
size_t getResultSize(SQInfo *pQInfo, int64_t *numOfRows);
void setQueryKilled(SQInfo *pQInfo);
void queryCostStatis(SQInfo *pQInfo);
void freeQInfo(SQInfo *pQInfo);

/*
 * Takes no arguments and returns an int32_t; per its name, the maximum idle
 * duration in seconds (the definition lives outside this header).
 * Declared with (void) so that the declaration is a real prototype: before
 * C23 an empty parameter list leaves the arguments unchecked.
 */
int32_t getMaximumIdleDurationSec(void);

H
Haojun Liao 已提交
463
#endif  // TDENGINE_QEXECUTOR_H