tsdb.h 12.1 KB
Newer Older
H
more  
Hongze Cheng 已提交
1 2 3
/**************************************
 * FOR OUTSIDE USAGE
 **************************************/
H
Hongze Cheng 已提交
4 5 6 7 8 9 10
#if !defined(_TD_TSDB_H_)
#define _TD_TSDB_H_

#include <pthread.h>
#include <stdbool.h>
#include <stdint.h>

H
more  
hzcheng 已提交
11
// #include "cache.h"
H
Hongze Cheng 已提交
12 13 14 15 16 17 18 19 20
#include "schema.h"

#define TSDB_VERSION_MAJOR 1
#define TSDB_VERSION_MINOR 0

typedef void    tsdb_repo_t;  // opaque repository handle: void hides implementation details from outside
typedef int32_t table_id_t;   // table ID type in this repository
typedef int16_t tsdb_id_t;    // TSDB repository ID

H
more  
hzcheng 已提交
21 22 23 24 25 26 27 28 29 30 31 32 33 34 35
// Submit message: fixed header followed by a variable-length payload.
// NOTE(review): the payload presumably carries numOfTables per-table
// SSubmitBlock entries -- confirm against the code that builds the message.
typedef struct {
  int32_t numOfTables;  // number of tables covered by this message
  char    data[];       // flexible array member: payload bytes following the header
} SSubmitMsg;

// Submit message for one table: fixed header followed by the row data.
typedef struct {
  table_id_t tableId;       // table ID to insert
  int32_t    sversion;      // data schema version
  int32_t    numOfRows;     // number of rows data
  int64_t    uid;           // table UID to insert
  char       data[];        // flexible array member: row payload (layout not defined in this header)
} SSubmitBlock;

H
Hongze Cheng 已提交
36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71
// Retention policy.
typedef struct {
  // TODO: describe the meaning and the unit of each keep level.
  // NOTE(review): presumably three retention tiers -- confirm with the implementation.
  int32_t keep1;
  int32_t keep2;
  int32_t keep3;
} SRetentionPolicy;

// Data sharding policy.
typedef struct {
  // TODO: describe how data is split across files.
  int32_t daysPerFile;  // presumably the number of days of data stored per file -- confirm
} SDataShardPolicy;

// Rows-per-file-block policy.
typedef struct {
  // TODO: describe how the bounds are enforced.
  int32_t minRowsPerFileBlock;  // lower bound on rows in one file block
  int32_t maxRowsPerFileBlock;  // upper bound on rows in one file block
} SBlockRowsPolicy;

// Table identifier pair.
// Applications that manipulate a table must provide both uid and tableId:
// tableId is used for quick table access, uid is used for verification.
typedef struct {
  int64_t    uid;      // the unique table ID
  table_id_t tableId;  // the table ID in the repository.
} STableId;

// The TSDB repository configuration.
// Passed to tsdbCreateRepo()/tsdbConfigRepo(); the caller keeps ownership of the struct.
typedef struct {
  char *           rootDir;  // TSDB repository root directory, TODO: need to adjust here
  tsdb_id_t        tsdbId;   // TSDB repository ID
  int32_t          maxTables;  // maximum number of tables this repository can have
  SDataShardPolicy dataShardPolicy;  // data sharding configuration
  SBlockRowsPolicy blockRowsPolicy;  // rows-per-file-block configuration
  // Retention configuration.
  // NOTE(review): the field name is misspelled ("Plicy"); it is kept as-is because
  // renaming it would break existing users of this struct.
  SRetentionPolicy retentionPlicy;
  void *           cachePool;  // the cache pool the repository uses
} STSDBCfg;

// The TSDB repository information, as reported by tsdbGetStatus().
typedef struct STSDBRepoInfo {
  STSDBCfg tsdbCfg;            // configuration of the repository
  int64_t  version;            // version of the repository
  int64_t  tsdbTotalDataSize;  // the original inserted data size
  int64_t  tsdbTotalDiskSize;  // the total disk size taken by this TSDB repository
  // TODO: Other information to add
} STSDBRepoInfo;

// The table (meter) configuration, used to create or alter a table.
typedef struct {
  char *     tableName;
  int64_t    uid;      // uid given by upper layer
  table_id_t tableId;  // table ID allocated from upper layer

  char *stableName;  // if not NULL, the table is created from a super table; the caller must make
                     // sure the super table exists in this TSDB.
  int64_t stableUid;   // NOTE(review): presumably the uid of the super table named above -- confirm

  int32_t  numOfCols;  // number of columns. For a table created from a super table, the tag schema is not included
  SSchema *schema;     // If numOfCols == schema->numOfCols, it is a normal table, stableName = NULL
                       // If numOfCols < schema->numOfCols, it is a table created from super table
                       // assert(numOfCols <= schema->numOfCols);

  char *tagValues;  // NULL if it is normal table
                    // otherwise, it contains the tag values.
} STableCfg;

// The table (meter) information report structure, as returned by tsdbGetTableInfo().
typedef struct {
  STableCfg tableCfg;            // configuration of the table
  int64_t   version;
  int64_t   tableTotalDataSize; // In bytes
  int64_t   tableTotalDiskSize; // In bytes
} STableInfo;

/**
 * Create a new TSDB repository.
 * @param pCfg the TSDB repository configuration; the upper layer owns and frees the pointer
 * @param error the error number to set when a failure occurs
 *
 * @return a TSDB repository handle on success; NULL on failure, with the error number set
 */
tsdb_repo_t *tsdbCreateRepo(STSDBCfg *pCfg, int32_t *error);

/**
 * Close the repository and free all resources taken by it.
 * @param pRepo the TSDB repository handle. The interface frees the handle too, so the upper
 *              layer must NOT free the repo handle again.
 * @param error the error number to set when a failure occurs
 *
 * @return 0 on success; -1 on failure, with the error number set
 */
int32_t tsdbDropRepo(tsdb_repo_t *pRepo, int32_t *error);

/**
 * Open an existing TSDB storage repository.
 * @param tsdbDir the root directory of the existing TSDB repository
 * @param error the error number to set when a failure occurs
 *
 * @return a TSDB repository handle on success; NULL on failure, with the error number set
 */
tsdb_repo_t *tsdbOpenRepo(char *tsdbDir, int32_t *error);

/**
 * Close a TSDB repository. Only memory resources are freed; the files are kept.
 * @param pRepo the opened TSDB repository handle. The interface frees the handle too, so the upper
 *              layer must NOT free the repo handle again.
 * @param error the error number to set when a failure occurs
 *
 * @return 0 on success; -1 on failure, with the error number set
 */
int32_t tsdbCloseRepo(tsdb_repo_t *pRepo, int32_t *error);

/**
 * Change the configuration of a repository.
 * NOTE(review): no repository handle is passed; presumably the target repository is
 * identified through the fields of pCfg -- confirm with the implementation.
 * @param pCfg the repository configuration; the upper layer owns and frees the pointer
 * @param error the error number to set when a failure occurs
 *
 * @return 0 on success; -1 on failure, with the error number set
 */
int32_t tsdbConfigRepo(STSDBCfg *pCfg, int32_t *error);

/**
 * Get the TSDB repository information, including some statistics.
 * @param pRepo the TSDB repository handle
 * @param error the error number to set when a failure occurs
 *
 * @return an info struct handle on success; NULL on failure, with the error number set.
 *         The upper layer must free the returned info handle itself, otherwise memory leaks.
 */
STSDBRepoInfo *tsdbGetStatus(tsdb_repo_t *pRepo, int32_t *error);

// -- For table manipulation

/**
 * Create (tsdbCreateTable) or alter (tsdbAlterTable) a table in a TSDB repository.
 * Both functions share the same parameters and return convention.
 * @param pRepo the TSDB repository handle
 * @param pCfg the table configuration; the upper layer owns and frees the pointer
 * @param error the error number to set when a failure occurs
 *
 * @return 0 on success; -1 on failure, with the error number set
 */
int32_t tsdbCreateTable(tsdb_repo_t *pRepo, STableCfg *pCfg, int32_t *error);
int32_t tsdbAlterTable(tsdb_repo_t *pRepo, STableCfg *pCfg, int32_t *error);

/**
 * Drop a table in a repository and free all the resources it takes.
 * @param pRepo the TSDB repository handle
 * @param tid the ID (uid + tableId) of the table to drop
 * @param error the error number to set when a failure occurs
 *
 * @return 0 on success; -1 on failure, with the error number set
 */
int32_t tsdbDropTable(tsdb_repo_t *pRepo, STableId tid, int32_t *error);

/**
 * Get the information of a table in the repository.
 * @param pRepo the TSDB repository handle
 * @param tid the ID (uid + tableId) of the table to look up
 * @param error the error number to set when a failure occurs
 *
 * @return a table information handle on success; NULL on failure, with the error number set.
 *         NOTE(review): ownership of the returned handle is not stated here -- confirm who frees it.
 */
STableInfo *tsdbGetTableInfo(tsdb_repo_t *pRepo, STableId tid, int32_t *error);

// -- FOR INSERT DATA
/**
 * Insert data into a table in a repository.
 * @param pRepo the TSDB repository handle
 * @param tid the ID (uid + tableId) of the table to insert into
 * @param pData the data to insert (TODO: give a more specific description of the layout)
 * @param error the error number to set when a failure occurs
 *
 * @return the number of points inserted; -1 on failure, with the error number set
 */
int32_t tsdbInsertData(tsdb_repo_t *pRepo, STableId tid, char *pData, int32_t *error);

// -- FOR QUERY TIME SERIES DATA

typedef void tsdb_query_handle_t; // opaque query handle: void hides implementation details

// Time window.
// NOTE(review): skey/ekey are presumably the start and end timestamps of the window;
// unit and inclusiveness are not stated in this header -- confirm.
typedef struct STimeWindow {
  int64_t skey;
  int64_t ekey;
} STimeWindow;

H
more  
hzcheng 已提交
223 224 225
// Column filter information; placeholder with no members defined yet.
// NOTE(review): a struct without members is not valid ISO C (it is accepted as a GNU
// extension) -- define the members before building with a strictly conforming compiler.
typedef struct {
} SColumnFilterInfo;

H
Hongze Cheng 已提交
226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257
// Query condition used to build the vnode iterator.
typedef struct STSDBQueryCond {
  STimeWindow       twindow;        // time window of the query
  int32_t           order;          // desc/asc order to iterate the data block
  SColumnFilterInfo colFilterInfo;  // column filter (currently an empty placeholder type)
} STSDBQueryCond;

// Summary information of one data block, as returned by tsdbRetrieveDataBlockInfo().
typedef struct SBlockInfo {
  STimeWindow window;  // time window (skey/ekey) of the block

  int32_t numOfRows;  // number of rows in the block
  int32_t numOfCols;  // number of columns in the block

  STableId tableId;  // NOTE(review): presumably the table the block belongs to -- confirm
} SBlockInfo;

// TODO: move this data struct out of the module
// Data buffer descriptor.
// NOTE(review): whether num counts bytes or elements is not visible in this header -- confirm.
typedef struct SData {
  int32_t num;
  char *  data;
} SData;

// A data block, as returned by tsdbRetrieveDataBlock().
typedef struct SDataBlock {
  int32_t numOfCols;  // number of columns
  SData **pData;      // NOTE(review): presumably one SData pointer per column (numOfCols entries) -- confirm
} SDataBlock;

// A list of table IDs.
typedef struct STableIDList {
  STableId *tableIds;  // table ID entries
  int32_t   num;       // NOTE(review): presumably the number of entries in tableIds -- confirm
} STableIDList;

H
more  
hzcheng 已提交
258 259 260 261
// Pre-calculated block statistics (see tsdbRetrieveDataBlockStatisInfo); placeholder with
// no members defined yet.
// NOTE(review): a struct without members is not valid ISO C (it is accepted as a GNU
// extension) -- define the members before building with a strictly conforming compiler.
typedef struct {

} SFields;

H
Hongze Cheng 已提交
262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357
/**
 * Get the data block iterator, positioned according to the query condition.
 * @param pRepo       the TSDB repository to query on
 * @param pCond       query condition; only includes the filter on the primary timestamp
 * @param pTableList  table sid list
 * @return a query handle (the failure value is not documented here -- TODO confirm)
 */
tsdb_query_handle_t *tsdbQueryFromTableID(tsdb_repo_t *pRepo, STSDBQueryCond *pCond, const STableIDList *pTableList);

/**
 *  Get an iterator for super tables whose tag values satisfy the tag filter info.
 *
 *  NOTE: the tagFilterStr is a binary expression for the tag filter, such as ((tag_col = 5) and (tag_col2 > 7))
 *  The filter string is sent from the client directly.
 *  The tag filter expression is built from the string inside the iterator generating function.
 *
 * @param pRepo         the repository to query on
 * @param pCond         query condition
 * @param stableId      super table sid (NOTE(review): declared as int16_t rather than table_id_t -- confirm intended)
 * @param pTagFilterStr tag filter info
 * @return a query handle (the failure value is not documented here -- TODO confirm)
 */
tsdb_query_handle_t *tsdbQueryFromTagConds(tsdb_repo_t *pRepo, STSDBQueryCond *pCond, int16_t stableId, const char *pTagFilterStr);

/**
 *  Reset the iterator to the start (or end) position of the current query.
 *
 * @param pQueryHandle the query handle to reset
 * @param position  the position the iterator traverses from (TSDB_POS_START|TSDB_POS_END)
 *                  NOTE(review): these constants are not declared in the visible part of this header.
 * @return an int32_t status (value convention not documented here -- TODO confirm)
 */
int32_t tsdbResetQuery(tsdb_query_handle_t *pQueryHandle, int16_t position);

/**
 *  Move to the next block.
 * @param pQueryHandle the query handle to advance
 * @return presumably true when the iterator has moved to a next block, false otherwise -- TODO confirm
 */
bool tsdbIterNext(tsdb_query_handle_t *pQueryHandle);

/**
 * Get current data block information.
 *
 * After calling the next function, only the information of the block is available:
 * the number of rows, the number of columns and the skey/ekey. Note that this is not
 * the SCompBlockInfo: SCompBlockInfo is the complete data block information, whereas
 * what the iterator returns is not.
 * The query processing engine decides on its own whether it needs the block info,
 * the pre-calculated data, or the complete data.
 *
 * @param pQueryHandle the query handle
 * @return the information of the current data block
 */
SBlockInfo tsdbRetrieveDataBlockInfo(tsdb_query_handle_t *pQueryHandle);

/**
 * Get the pre-calculated information w.r.t. the current data block.
 * If the block is incomplete, or if it is a cache block, there is no pre-calculated information.
 *
 * In case of a data block in cache, the pBlockStatis will always be NULL.
 * If a block is not completely loaded from disk, the pBlockStatis will be NULL.
 * NOTE(review): pBlockStatis is passed by value as SFields*, so the callee cannot set the
 * caller's pointer to NULL -- confirm how "no statistics" is actually reported.
 *
 * @param pQueryHandle the query handle
 * @param pBlockStatis the pre-calculated value for the current data block
 * @return if the block is a cache block, always return 0 (other return values are not documented here)
 */
int32_t tsdbRetrieveDataBlockStatisInfo(tsdb_query_handle_t *pQueryHandle, SFields *pBlockStatis);

/**
 * Return the data loaded into the buffer. It may be disk data or in-memory data; this is
 * transparent to the caller. Even for disk data, the result only holds the rows of the disk
 * block that satisfy the query time range, not a complete disk data block.
 *
 * The query condition on the primary timestamp is passed to the iterator when it is constructed,
 * so the returned data block always satisfies the time window condition,
 * which means the SData data block is not actually the complete disk data block.
 *
 * @param pQueryHandle the query handle
 * @return the current data block (ownership of the returned pointer is not documented here -- TODO confirm)
 */
SDataBlock *tsdbRetrieveDataBlock(tsdb_query_handle_t *pQueryHandle);

/**
 * Get the qualified tables for a (super) table query.
 * Used to handle the super table projection queries, the last_row query, the group by on normal columns query,
 * the interpolation query, and the timestamp-comp query for join processing.
 *
 * @param pQueryHandle the query handle
 * @return table sid list. The caller is responsible for releasing the sid list.
 */
STableIDList *tsdbGetTableList(tsdb_query_handle_t *pQueryHandle);

/**
 * Get the qualified table sids for a super table according to the tag query expression.
 * @param stableId  super table sid
 * @param pTagCond  tag query condition
 *
 * @return table sid list (ownership of the returned list is not documented here -- TODO confirm)
 */
STableIDList *tsdbQueryTableList(int16_t stableId, const char *pTagCond);

#endif  // _TD_TSDB_H_