tdataformat.h 12.1 KB
Newer Older
H
more  
hzcheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
H
hzcheng 已提交
15
#ifndef _TD_DATA_FORMAT_H_
H
more  
Hongze Cheng 已提交
16 17 18
#define _TD_DATA_FORMAT_H_

#include <stdint.h>
H
hzcheng 已提交
19
#include <stdlib.h>
H
hzcheng 已提交
20
#include <string.h>
H
more  
Hongze Cheng 已提交
21

H
Hongze Cheng 已提交
22
#include "talgo.h"
H
hzcheng 已提交
23
#include "taosdef.h"
H
TD-166  
hzcheng 已提交
24
#include "tutil.h"
H
hzcheng 已提交
25

H
more  
hzcheng 已提交
26 27 28
#ifdef __cplusplus
extern "C" {
#endif
H
hzcheng 已提交
29

30 31
/*
 * Store the NUL-terminated C string `str` into the var-length buffer `x`:
 * the VarDataLenT header at the start of `x` is set to strlen(str) and exactly
 * that many bytes are copied to varDataVal(x). No terminating NUL is written.
 *
 * memcpy is used for the copy because the length is already known; strncpy
 * bounded by the source length copies the same bytes.
 *
 * `x` and `str` are each evaluated twice, so pass side-effect-free expressions.
 * NOTE(review): the expansion still ends with ';' so existing call sites are
 * unaffected; as a consequence it cannot be the unbraced body of an if/else.
 */
#define STR_TO_VARSTR(x, str)                        \
  do {                                               \
    VarDataLenT vsLen_ = (VarDataLenT)strlen((str)); \
    *(VarDataLenT *)(x) = vsLen_;                    \
    memcpy(varDataVal(x), (str), vsLen_);            \
  } while (0);
33 34

/*
 * Copy at most `_maxs` bytes of the C string `str` into varDataVal(x) and set
 * the length header of `x` (via varDataSetLen) to the number of bytes that
 * precede the first NUL in the copied data, or to `_maxs` when the copy was
 * truncated before a NUL.
 *
 * Like the stpncpy-based form it replaces, the destination is zero-padded up
 * to `_maxs` bytes when `str` is shorter. strncpy + memchr are ISO C, so the
 * macro no longer depends on POSIX stpncpy, and `x` may be any object pointer
 * type (the old `_e - (x)` subtraction required `char *`).
 * NOTE(review): assumes varDataVal(x) is `x` advanced by VARSTR_HEADER_SIZE,
 * which is what the previous length computation relied on - confirm.
 *
 * `_maxs` is evaluated once; `x` is evaluated twice.
 */
#define STR_WITH_MAXSIZE_TO_VARSTR(x, str, _maxs)                            \
  do {                                                                       \
    char *      vsDst_ = (char *)varDataVal(x);                              \
    size_t      vsMax_ = (size_t)(_maxs);                                    \
    const char *vsNul_;                                                      \
    strncpy(vsDst_, (str), vsMax_);                                          \
    vsNul_ = (const char *)memchr(vsDst_, '\0', vsMax_);                     \
    varDataSetLen(x, (vsNul_ != NULL) ? (size_t)(vsNul_ - vsDst_) : vsMax_); \
  } while (0)

/*
 * Store `_size` in the VarDataLenT header at the start of `x` and strncpy
 * `_size` bytes from `str` to varDataVal(x). strncpy semantics apply: copying
 * stops at the first NUL in `str` and the rest of the `_size` bytes is
 * zero-filled; no NUL is appended when `str` has `_size` or more characters.
 *
 * `_size` is evaluated exactly once (it used to be expanded twice, which
 * misbehaved for arguments with side effects); `x` is evaluated twice.
 * NOTE(review): the expansion still ends with ';' so existing call sites are
 * unaffected; as a consequence it cannot be the unbraced body of an if/else.
 */
#define STR_WITH_SIZE_TO_VARSTR(x, str, _size)  \
  do {                                          \
    size_t vsSize_ = (size_t)(_size);           \
    *(VarDataLenT *)(x) = (VarDataLenT)vsSize_; \
    strncpy(varDataVal(x), (str), vsSize_);     \
  } while (0);

H
hzcheng 已提交
44 45 46 47 48
// ----------------- TSDB COLUMN DEFINITION
/* Description of a single column inside a table schema (STSchema). */
typedef struct {
  int8_t  type;    // Column type
  int16_t colId;   // column ID
  int32_t bytes;   // column bytes
  int32_t offset;  // point offset in SDataRow after the header part
} STColumn;

/*
 * Field accessors for a column descriptor. `col` is a pointer to a structure
 * with `type`, `colId`, `bytes` and `offset` members (STColumn in this file).
 * The getters expand to lvalues; the setters expand to assignment expressions
 * whose value is the value stored.
 */
#define colType(col)   ((col)->type)
#define colColId(col)  ((col)->colId)
#define colBytes(col)  ((col)->bytes)
#define colOffset(col) ((col)->offset)

#define colSetType(col, t)    ((col)->type = (t))
#define colSetColId(col, id)  ((col)->colId = (id))
#define colSetBytes(col, b)   ((col)->bytes = (b))
#define colSetOffset(col, o)  ((col)->offset = (o))

// ----------------- TSDB SCHEMA DEFINITION
typedef struct {
H
TD-166  
hzcheng 已提交
64
  int      totalCols;  // Total columns allocated
H
hzcheng 已提交
65
  int      numOfCols;  // Number of columns appended
H
TD-166  
hzcheng 已提交
66 67
  int      tlen;       // maximum length of a SDataRow without the header part
  int      flen;       // First part length in a SDataRow after the header part
H
hzcheng 已提交
68 69 70 71
  STColumn columns[];
} STSchema;

/*
 * Field accessors for a schema pointer `s` (STSchema *). All of them expand
 * to lvalues except schemaColAt, which yields a pointer to the i-th entry of
 * `columns`. No bounds checking is performed.
 */
#define schemaNCols(s) ((s)->numOfCols)
#define schemaTotalCols(s) ((s)->totalCols)
#define schemaTLen(s) ((s)->tlen)
#define schemaFLen(s) ((s)->flen)
// `i` is parenthesised so that index expressions with low-precedence
// operators (e.g. `cond ? a : b`) are applied as a whole.
#define schemaColAt(s, i) ((s)->columns + (i))

/*
 * Schema API. Only the declarations live in this header; the notes below are
 * limited to what the signatures show.
 * NOTE(review): ownership and error conventions (NULL / negative return) are
 * not visible here - confirm against the implementation.
 *
 *  tdNewSchema           - returns a schema pointer for `nCols` columns.
 *  tdFreeSchema          - releases a schema by passing it to tfree().
 *  tdSchemaAddCol        - adds a column described by (type, colId, bytes).
 *  tdDupSchema           - returns a schema pointer derived from `pSchema`.
 *  tdGetSchemaEncodeSize - returns an int size for `pSchema`.
 *  tdEncodeSchema        - encodes `pSchema` at `dst`; returns a pointer
 *                          (presumably past the encoded bytes - confirm).
 *  tdDecodeSchema        - decodes a schema starting at `*psrc`; takes
 *                          `void **`, so presumably advances `*psrc` - confirm.
 */
STSchema *tdNewSchema(int32_t nCols);
#define   tdFreeSchema(s) tfree((s))
int       tdSchemaAddCol(STSchema *pSchema, int8_t type, int16_t colId, int32_t bytes);
STSchema *tdDupSchema(STSchema *pSchema);
int       tdGetSchemaEncodeSize(STSchema *pSchema);
void *    tdEncodeSchema(void *dst, STSchema *pSchema);
STSchema *tdDecodeSchema(void **psrc);
H
hzcheng 已提交
84

H
more  
Hongze Cheng 已提交
85 86
// ----------------- Data row structure

H
hzcheng 已提交
87
/* A data row, the format is like below:
 * |<------------------------------------- len ---------------------------------->|
 * |<--Head ->|<---------   flen -------------->|                                 |
 * +----------+---------------------------------+---------------------------------+
 * | int32_t  |                                 |                                 |
 * +----------+---------------------------------+---------------------------------+
 * |   len    |           First part            |             Second part         |
 * +----------+---------------------------------+---------------------------------+
 *
 * The row is handled as an opaque pointer; use the dataRow* macros and the
 * td*DataRow functions declared in this header to access it.
 */
typedef void *SDataRow;

H
TD-166  
hzcheng 已提交
98
/* Size in bytes of the int32_t length header at the start of every SDataRow. */
#define TD_DATA_ROW_HEAD_SIZE (sizeof(int32_t))

/*
 * Accessors for a data row `r` (SDataRow):
 *  dataRowLen      - lvalue for the int32_t length stored at the start of r.
 *  dataRowTuple    - pointer to the first byte after the header.
 *  dataRowKey      - lvalue for the TSKEY stored right after the header.
 *  dataRowSetLen   - assigns the length header.
 *  dataRowCpy      - memcpy of dataRowLen(r) bytes from r to dst (r is
 *                    evaluated twice).
 *  dataRowMaxBytesFromSchema - schemaTLen(s) plus the header size.
 */
#define dataRowLen(r) (*(int32_t *)(r))
#define dataRowTuple(r) POINTER_SHIFT(r, TD_DATA_ROW_HEAD_SIZE)
#define dataRowKey(r) (*(TSKEY *)(dataRowTuple(r)))
#define dataRowSetLen(r, l) (dataRowLen(r) = (l))
#define dataRowCpy(dst, r) memcpy((dst), (r), dataRowLen(r))
#define dataRowMaxBytesFromSchema(s) (schemaTLen(s) + TD_DATA_ROW_HEAD_SIZE)
H
hzcheng 已提交
106

H
hzcheng 已提交
107
/*
 * Data row API (declarations only; implementations are outside this header).
 * NOTE(review): allocation ownership and failure behaviour are not visible
 * here - confirm against the implementation before relying on them.
 *
 *  tdNewDataRowFromSchema - returns a row for `pSchema`.
 *  tdFreeDataRow          - releases `row`.
 *  tdInitDataRow          - initialises an existing `row` for `pSchema`.
 *  tdDataRowDup           - returns a row derived from `row`.
 */
SDataRow tdNewDataRowFromSchema(STSchema *pSchema);
void     tdFreeDataRow(SDataRow row);
void     tdInitDataRow(SDataRow row, STSchema *pSchema);
SDataRow tdDataRowDup(SDataRow row);
H
more  
Hongze Cheng 已提交
111

112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131
/*
 * Write one column value into `row`.
 *
 * row    - destination data row
 * value  - value to store; must not be NULL (asserted)
 * type   - column type; selects the storage strategy below
 * bytes  - not used by this function
 * offset - column offset after the row header (the header size is added here)
 *
 * BINARY / NCHAR: the current row length is recorded in the column's slot,
 * the varDataTLen(value) bytes of `value` are copied to the current end of
 * the row, and the row length grows by that amount.
 * Any other type: TYPE_BYTES[type] bytes are copied straight into the slot.
 *
 * Always returns 0.
 */
static FORCE_INLINE int tdAppendColVal(SDataRow row, void *value, int8_t type, int32_t bytes, int32_t offset) {
  ASSERT(value != NULL);

  int32_t slotOffset = offset + TD_DATA_ROW_HEAD_SIZE;
  void *  pSlot = POINTER_SHIFT(row, slotOffset);

  if (type == TSDB_DATA_TYPE_BINARY || type == TSDB_DATA_TYPE_NCHAR) {
    // Variable-length value: the slot holds where the payload starts.
    char *pTail = (char *)POINTER_SHIFT(row, dataRowLen(row));

    *(VarDataOffsetT *)pSlot = dataRowLen(row);
    memcpy(pTail, value, varDataTLen(value));
    dataRowLen(row) += varDataTLen(value);
  } else {
    // Fixed-width value: stored in place.
    memcpy(pSlot, value, TYPE_BYTES[type]);
  }

  return 0;
}

H
TD-166  
hzcheng 已提交
132
// NOTE: offset here including the header size
H
TD-166  
hzcheng 已提交
133 134 135 136
static FORCE_INLINE void *tdGetRowDataOfCol(SDataRow row, int8_t type, int32_t offset) {
  switch (type) {
    case TSDB_DATA_TYPE_BINARY:
    case TSDB_DATA_TYPE_NCHAR:
H
hzcheng 已提交
137
      return POINTER_SHIFT(row, *(VarDataOffsetT *)POINTER_SHIFT(row, offset));
H
TD-166  
hzcheng 已提交
138
    default:
H
hzcheng 已提交
139
      return POINTER_SHIFT(row, offset);
H
TD-166  
hzcheng 已提交
140 141 142
  }
}

H
TD-34  
hzcheng 已提交
143 144
// ----------------- Data column structure
typedef struct SDataCol {
H
TD-166  
hzcheng 已提交
145 146 147
  int8_t          type;       // column type
  int16_t         colId;      // column ID
  int             bytes;      // column data bytes defined
H
TD-166  
hzcheng 已提交
148
  int             offset;     // data offset in a SDataRow (including the header size)
H
TD-166  
hzcheng 已提交
149 150 151 152
  int             spaceSize;  // Total space size for this column
  int             len;        // column data length
  VarDataOffsetT *dataOff;    // For binary and nchar data, the offset in the data column
  void *          pData;      // Actual data pointer
H
TD-34  
hzcheng 已提交
153 154
} SDataCol;

H
TD-166  
hzcheng 已提交
155 156 157
/* Reset a column to "no data" by zeroing its `len`; no other field is touched. */
static FORCE_INLINE void dataColReset(SDataCol *pDataCol) {
  pDataCol->len = 0;
}

/*
 * Data column API (declarations only; implementations are outside this
 * header). NOTE(review): the descriptions are limited to what the signatures
 * show - confirm details against the implementation.
 *
 *  dataColInit        - initialise `pDataCol` from column definition `pCol`,
 *                       using `*pBuf` and a capacity of `maxPoints`.
 *  dataColAppendVal   - append `value` to a column currently holding
 *                       `numOfRows` rows.
 *  dataColPopPoints   - remove `pointsToPop` points from a column holding
 *                       `numOfRows` rows.
 *  dataColSetOffset   - set up the offsets for `nEle` elements.
 *  isNEleNull         - test whether `nEle` elements of the column are null.
 *  dataColSetNEleNull - set `nEle` elements of the column to null.
 */
void dataColInit(SDataCol *pDataCol, STColumn *pCol, void **pBuf, int maxPoints);
void dataColAppendVal(SDataCol *pCol, void *value, int numOfRows, int maxPoints);
void dataColPopPoints(SDataCol *pCol, int pointsToPop, int numOfRows);
void dataColSetOffset(SDataCol *pCol, int nEle);

bool isNEleNull(SDataCol *pCol, int nEle);
void dataColSetNEleNull(SDataCol *pCol, int nEle, int maxPoints);
H
TD-166  
hzcheng 已提交
164 165 166

/*
 * Get the data pointer from a column-wised data.
 *
 * BINARY / NCHAR: pData shifted by the offset stored in dataOff[row].
 * Any other type: pData shifted by TYPE_BYTES[type] * row.
 * `row` is not range-checked.
 */
static FORCE_INLINE void *tdGetColDataOfRow(SDataCol *pCol, int row) {
  switch (pCol->type) {
    case TSDB_DATA_TYPE_BINARY:
    case TSDB_DATA_TYPE_NCHAR:
      return POINTER_SHIFT(pCol->pData, pCol->dataOff[row]);

    default:
      return POINTER_SHIFT(pCol->pData, TYPE_BYTES[pCol->type] * row);
  }
}

H
TD-166  
hzcheng 已提交
179
/*
 * Number of bytes occupied by the first `rows` elements of a column.
 * `rows` must be positive (asserted).
 *
 * BINARY / NCHAR: offset of the last of those elements plus its
 * varDataTLen().
 * Any other type: TYPE_BYTES[type] * rows.
 */
static FORCE_INLINE int32_t dataColGetNEleLen(SDataCol *pDataCol, int rows) {
  ASSERT(rows > 0);

  switch (pDataCol->type) {
    case TSDB_DATA_TYPE_BINARY:
    case TSDB_DATA_TYPE_NCHAR:
      return pDataCol->dataOff[rows - 1] + varDataTLen(tdGetColDataOfRow(pDataCol, rows - 1));
    default:
      return TYPE_BYTES[pDataCol->type] * rows;
  }
}


H
TD-34  
hzcheng 已提交
193
typedef struct {
H
TD-34  
hzcheng 已提交
194 195 196
  int      maxRowSize;
  int      maxCols;    // max number of columns
  int      maxPoints;  // max number of points
H
TD-166  
hzcheng 已提交
197
  int      bufSize;
H
TD-166  
hzcheng 已提交
198

H
Haojun Liao 已提交
199
  int      numOfRows;
H
TD-34  
hzcheng 已提交
200
  int      numOfCols;  // Total number of cols
H
TD-34  
hzcheng 已提交
201
  int      sversion;   // TODO: set sversion
H
TD-34  
hzcheng 已提交
202 203 204 205
  void *   buf;
  SDataCol cols[];
} SDataCols;

H
TD-34  
hzcheng 已提交
206
/*
 * Key accessors for an SDataCols pointer. The key column is cols[0] and its
 * pData is read as an array of TSKEY.
 *  keyCol           - pointer to the key column.
 *  dataColsKeyAt    - lvalue for the idx-th key (no bounds check).
 *  dataColsKeyFirst - the key at index 0.
 *  dataColsKeyLast  - the key at index numOfRows - 1, or 0 when numOfRows is 0.
 * `pCols` is parenthesised everywhere so arguments such as `&cols` expand
 * correctly.
 */
#define keyCol(pCols) (&((pCols)->cols[0]))  // Key column
#define dataColsKeyAt(pCols, idx) (((TSKEY *)(keyCol(pCols)->pData))[(idx)])
#define dataColsKeyFirst(pCols) dataColsKeyAt(pCols, 0)
#define dataColsKeyLast(pCols) (((pCols)->numOfRows == 0) ? 0 : dataColsKeyAt(pCols, (pCols)->numOfRows - 1))
H
TD-34  
hzcheng 已提交
210

H
TD-166  
hzcheng 已提交
211
SDataCols *tdNewDataCols(int maxRowSize, int maxCols, int maxRows);
H
TD-34  
hzcheng 已提交
212
void       tdResetDataCols(SDataCols *pCols);
H
TD-34  
hzcheng 已提交
213
void       tdInitDataCols(SDataCols *pCols, STSchema *pSchema);
H
TD-100  
hzcheng 已提交
214
SDataCols *tdDupDataCols(SDataCols *pCols, bool keepData);
H
TD-34  
hzcheng 已提交
215
void       tdFreeDataCols(SDataCols *pCols);
H
TD-34  
hzcheng 已提交
216
void       tdAppendDataRowToDataCol(SDataRow row, SDataCols *pCols);
H
hjxilinx 已提交
217
void       tdPopDataColsPoints(SDataCols *pCols, int pointsToPop); //!!!!
H
hzcheng 已提交
218
int        tdMergeDataCols(SDataCols *target, SDataCols *src, int rowsToMerge);
H
TD-100  
hzcheng 已提交
219
void       tdMergeTwoDataCols(SDataCols *target, SDataCols *src1, int *iter1, SDataCols *src2, int *iter2, int tRows);
H
more  
Hongze Cheng 已提交
220

T
Tao Liu 已提交
221

H
Hongze Cheng 已提交
222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269
// ----------------- K-V data row structure
/*
 * Layout of a key-value data row:
 *
 * +----------+----------+---------------------------------+---------------------------------+
 * |  int16_t |  int16_t |                                 |                                 |
 * +----------+----------+---------------------------------+---------------------------------+
 * |    len   |   ncols  |           cols index            |             data part           |
 * +----------+----------+---------------------------------+---------------------------------+
 *
 * The row itself is passed around as an opaque pointer.
 */
typedef void *SKVDataRow;

/* One entry of the "cols index" area of a K-V data row. */
typedef struct {
  int16_t colId;   // column ID of this entry
  int16_t offset;  // offset of the value, applied to kvDataRowValues() by kvDataRowColVal()
} SColIdx;

/*
 * Size in bytes of the K-V row header (len + ncols, both int16_t).
 * Parenthesised so the constant can be used inside larger expressions
 * (e.g. `n / TD_KV_DATA_ROW_HEAD_SIZE`) without precedence surprises.
 */
#define TD_KV_DATA_ROW_HEAD_SIZE (2 * sizeof(int16_t))

/*
 * Accessors for a K-V data row `r` (SKVDataRow):
 *  kvDataRowLen      - lvalue for the int16_t length at the start of r.
 *  kvDataRowNCols    - lvalue for the int16_t column count that follows it.
 *  kvDataRowColIdx   - pointer to the first SColIdx entry (after the header).
 *  kvDataRowValues   - pointer to the data part (after ncols index entries).
 *  kvDataRowCpy      - memcpy of kvDataRowLen(r) bytes from r to dst.
 *  kvDataRowColVal   - data part shifted by colIdx->offset.
 *  kvDataRowSetLen / kvDataRowSetNCols - assign the header fields.
 *  kvDataRowColIdxAt - pointer to the i-th SColIdx entry (no bounds check).
 * Every expansion is a single parenthesised or call expression, so results
 * can be used directly with `->`, arithmetic or as sub-expressions.
 */
#define kvDataRowLen(r) (*(int16_t *)(r))
#define kvDataRowNCols(r) (*(int16_t *)POINTER_SHIFT(r, sizeof(int16_t)))
#define kvDataRowColIdx(r) ((SColIdx *)POINTER_SHIFT(r, TD_KV_DATA_ROW_HEAD_SIZE))
#define kvDataRowValues(r) POINTER_SHIFT(r, TD_KV_DATA_ROW_HEAD_SIZE + sizeof(SColIdx) * kvDataRowNCols(r))
#define kvDataRowCpy(dst, r) memcpy((dst), (r), kvDataRowLen(r))
#define kvDataRowColVal(r, colIdx) POINTER_SHIFT(kvDataRowValues(r), (colIdx)->offset)
#define kvDataRowSetLen(r, len) (kvDataRowLen(r) = (len))
#define kvDataRowSetNCols(r, n) (kvDataRowNCols(r) = (n))
#define kvDataRowColIdxAt(r, i) (kvDataRowColIdx(r) + (i))

/*
 * K-V data row API (declarations only; implementations are outside this
 * header). NOTE(review): the descriptions are limited to what the signatures
 * show - ownership and failure behaviour must be confirmed.
 *
 *  tdKVDataRowDup      - returns a K-V row derived from `row`.
 *  tdSetKVRowDataOfCol - sets the value of column `colId` (of `type`) to
 *                        `value`; returns a K-V row, which may or may not be
 *                        the `row` passed in - confirm.
 *  tdEncodeKVDataRow   - encodes `row` at `buf`; returns a pointer
 *                        (presumably past the encoded bytes - confirm).
 *  tdDecodeKVDataRow   - decodes from `buf` into `*row`; returns a pointer
 *                        (presumably past the consumed bytes - confirm).
 */
SKVDataRow tdKVDataRowDup(SKVDataRow row);
SKVDataRow tdSetKVRowDataOfCol(SKVDataRow row, int16_t colId, int8_t type, void *value);
void *     tdEncodeKVDataRow(void *buf, SKVDataRow row);
void *     tdDecodeKVDataRow(void *buf, SKVDataRow *row);

/*
 * Comparison callback used when searching the column index of a K-V row.
 *
 * key1 - points to the int16_t column ID being looked up
 * key2 - points to an SColIdx entry
 *
 * Returns 1, -1 or 0 when the looked-up ID is greater than, less than or
 * equal to the entry's colId.
 */
static FORCE_INLINE int comparTagId(const void *key1, const void *key2) {
  int16_t wantedId = *(int16_t *)key1;
  int16_t entryId = ((SColIdx *)key2)->colId;

  if (wantedId > entryId) return 1;
  if (wantedId < entryId) return -1;
  return 0;
}

/*
 * Look up the value of column `colId` in a K-V data row.
 *
 * The row's SColIdx entries are searched with taosbsearch() using
 * comparTagId and the TD_EQ flag. Returns NULL when no entry is found,
 * otherwise the address of the value inside the row's data part.
 */
static FORCE_INLINE void *tdGetKVRowDataOfCol(SKVDataRow row, int16_t colId) {
  SColIdx *pIdx =
      (SColIdx *)taosbsearch(&colId, kvDataRowColIdx(row), kvDataRowNCols(row), sizeof(SColIdx), comparTagId, TD_EQ);

  return (pIdx == NULL) ? NULL : kvDataRowColVal(row, pIdx);
}

T
Tao Liu 已提交
270 271 272
// ----------------- Tag row structure

/* A tag row, the format is like below:
 *
 * +---------+---------+---------+---------+---------+-----+---------+---------+
 * | STagRow | STagCol | STagCol | STagCol | STagCol | ... | STagCol | STagCol |
 * +---------+---------+---------+---------+---------+-----+---------+---------+
 *
 * pData
 * +---------+---------+---------+---------+-----+---------+
 * | value 1 | value 2 | value 3 | value 4 | ... | value n |
 * +---------+---------+---------+---------+-----+---------+
 */
T
Tao Liu 已提交
283

T
Tao Liu 已提交
284 285 286 287 288 289 290 291 292 293 294

/* Size in bytes of the int16_t stored at the start of a tag row. */
#define TD_TAG_ROW_HEAD_SIZE (sizeof(int16_t))

/* Lvalue for the int16_t stored at the very start of `r`. */
#define tagRowNum(r) (((int16_t *)(r))[0])
/* Pointer to the first byte after that int16_t. */
#define tagRowArray(r) POINTER_SHIFT(r, TD_TAG_ROW_HEAD_SIZE)

/* Descriptor of one tag column inside a tag row (STagRow.tagCols). */
typedef struct {
  int16_t  colId;  // column ID
  int16_t  colType;
  uint16_t offset;  // to store value for numeric col or offset for binary/Nchar
} STagCol;

typedef struct {
H
Hongze Cheng 已提交
301 302 303 304 305
  int32_t  len;
  void *   pData;  // Space to store the tag value
  uint16_t dataLen;
  int16_t  ncols;  // Total columns allocated
  STagCol  tagCols[];
T
Tao Liu 已提交
306 307
} STagRow;

T
Tao Liu 已提交
308 309
/*
 * sizeof(STagCol) plus the `colLen` member of `r`.
 * NOTE(review): STagCol as declared in this header has no `colLen` member, so
 * this macro only compiles for some other type that provides one - it looks
 * stale; confirm whether it is still used. The argument is parenthesised so
 * expressions such as `*p` expand correctly.
 */
#define tagColSize(r) (sizeof(STagCol) + (r).colLen)

H
Hongze Cheng 已提交
310 311 312 313 314 315 316 317 318 319
/*
 * Tag row API (declarations only; implementations are outside this header).
 * Tag rows are passed through the generic SDataRow pointer type.
 * NOTE(review): return conventions and ownership are not visible here -
 * confirm against the implementation.
 */
int       tdSetTagCol(SDataRow row, void *value, int16_t len, int8_t type,
                      int16_t colId);                   // insert tag value and update all the information
int       tdDeleteTagCol(SDataRow row, int16_t colId);  // delete tag value and update all the information
// NOTE(review): the original comment read "if find tag, 0, else return -1", which does not match the
// `void *` return type; presumably the tag value (or NULL) is returned and `*type` receives its type - confirm.
void *    tdQueryTagByID(SDataRow row, int16_t colId, int16_t *type);
int       tdAppendTagColVal(SDataRow row, void *value, int8_t type, int32_t bytes, int16_t colId);
SDataRow  tdTagRowDup(SDataRow row);
void      tdFreeTagRow(SDataRow row);
SDataRow  tdTagRowDecode(SDataRow row);
int       tdTagRowCpy(SDataRow dst, SDataRow src);
void *    tdNewTagRowFromSchema(STSchema *pSchema, int16_t numofTags);
STSchema *tdGetSchemaFromData(SDataRow *row);
T
Tao Liu 已提交
321

H
more  
hzcheng 已提交
322 323 324 325
#ifdef __cplusplus
}
#endif

H
hzcheng 已提交
326
#endif  // _TD_DATA_FORMAT_H_