/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
#ifndef TDENGINE_TEXTBUFFER_H
#define TDENGINE_TEXTBUFFER_H

#ifdef __cplusplus
extern "C" {
#endif

#include "os.h"
#include "taosmsg.h"
#include "tutil.h"
/* Size-related constants used by the external buffer declarations below. */
#define DEFAULT_PAGE_SIZE 16384  // 16k, larger than the SHistoInfo
#define MIN_BUFFER_SIZE (1 << 19)  // 524288; NOTE(review): presumably a lower bound in bytes -- confirm against users
#define MAX_TMPFILE_PATH_LENGTH PATH_MAX  // same limit as the platform's PATH_MAX
#define INITIAL_ALLOCATION_BUFFER_SIZE 64  // NOTE(review): unit (bytes vs. entries) is not visible here -- confirm
/* Describes how successive flushes to disk relate to one another. */
typedef enum EXT_BUFFER_FLUSH_MODEL {
  /*
   * all data that has been flushed to disk belongs to the same group,
   * which means all data on disk is sorted, or the order does not matter in this case
   */
  SINGLE_APPEND_MODEL,

  /*
   * each flush operation to disk is completely independent of any other flush operation.
   * we simply merge several sets of data into one file, to reduce the number of flat files
   * on disk. So in this case, we need to keep the flush-out information in the tFlushoutInfo
   * structure.
   */
  MULTIPLE_APPEND_MODEL,
} EXT_BUFFER_FLUSH_MODEL;

/* Flush-out information: a starting page id plus a page count. */
typedef struct tFlushoutInfo {
  uint32_t startPageId;  // NOTE(review): presumably the id of the first page of this flush-out -- confirm
  uint32_t numOfPages;   // number of pages
} tFlushoutInfo;

/* Holder for tFlushoutInfo record(s) together with two size counters. */
typedef struct tFlushoutData {
  uint32_t       nAllocSize;     // NOTE(review): presumably the allocated capacity of pFlushoutInfo -- confirm
  uint32_t       nLength;        // NOTE(review): presumably the number of records in use -- confirm
  tFlushoutInfo *pFlushoutInfo;  // pointer to the tFlushoutInfo record(s)
} tFlushoutData;

typedef struct SFileInfo {
H
hzcheng 已提交
59
  uint32_t      nFileSize;  // in pages
H
hjxilinx 已提交
60
  uint32_t      pageSize;
H
hzcheng 已提交
61 62
  uint32_t      numOfElemsInFile;
  tFlushoutData flushoutData;
H
hjxilinx 已提交
63
} SFileInfo;
/* A page: an element count followed by the payload bytes. */
typedef struct tFilePage {
  uint64_t numOfElems;  // number of elements
  char     data[];      // flexible array member: payload storage must be allocated past the struct
} tFilePage;

/* Singly linked list node that carries one tFilePage. */
typedef struct tFilePagesItem {
  struct tFilePagesItem *pNext;  // next node in the list
  // tFilePage ends in a flexible array member, so item must stay the last field;
  // embedding such a struct is a compiler extension, not standard C.
  tFilePage              item;
} tFilePagesItem;

/* A column schema extended with an offset. */
typedef struct SSchemaEx {
  struct SSchema field;
  int16_t        offset;  // NOTE(review): presumably the value returned by getColumnModelOffset() -- confirm
} SSchemaEx;
typedef struct SColumnModel {
  int32_t    capacity;
  int32_t    numOfCols;
  int16_t    rowSize;
S
slguan 已提交
84
  SSchemaEx *pFields;
H
hjxilinx 已提交
85
} SColumnModel;
/* Column order information: a column count followed by a trailing int16_t array. */
typedef struct SColumnOrderInfo {
  int32_t numOfCols;
  int16_t pData[];  // flexible array member; NOTE(review): presumably numOfCols entries -- confirm
} SColumnOrderInfo;
typedef struct tOrderDescriptor {
H
hjxilinx 已提交
93 94 95
  SColumnModel *   pColumnModel;
  int32_t          tsOrder;  // timestamp order type if exists
  SColumnOrderInfo orderIdx;
H
hzcheng 已提交
96 97 98
} tOrderDescriptor;

typedef struct tExtMemBuffer {
H
hjxilinx 已提交
99
  int32_t inMemCapacity;
H
hzcheng 已提交
100
  int32_t nElemSize;
H
hjxilinx 已提交
101 102
  int32_t pageSize;
  int32_t numOfTotalElems;
H
hzcheng 已提交
103 104
  int32_t numOfElemsInBuffer;
  int32_t numOfElemsPerPage;
H
hjxilinx 已提交
105
  int16_t numOfInMemPages;
H
hzcheng 已提交
106 107 108 109

  tFilePagesItem *pHead;
  tFilePagesItem *pTail;

H
hjxilinx 已提交
110 111 112
  char *    path;
  FILE *    file;
  SFileInfo fileMeta;
H
hzcheng 已提交
113

H
hjxilinx 已提交
114
  SColumnModel *         pColumnModel;
H
hzcheng 已提交
115 116 117
  EXT_BUFFER_FLUSH_MODEL flushModel;
} tExtMemBuffer;

/* Tag schema: schema pointer, column count and a trailing array of column offsets. */
typedef struct tTagSchema {
  struct SSchema *pSchema;
  int32_t         numOfCols;
  int32_t         colOffset[];  // flexible array member; NOTE(review): entry count is not visible here -- confirm
} tTagSchema;

typedef struct tSidSet {
  int32_t            numOfSids;
  int32_t            numOfSubSet;
H
hjxilinx 已提交
127
  STableIdInfo     **pTableIdList;
S
slguan 已提交
128
  int32_t *          starterPos;  // position of each subgroup, generated according to
S
slguan 已提交
129 130
  SColumnModel      *pColumnModel;
  SColumnOrderInfo   orderIdx;
S
slguan 已提交
131 132
} tSidSet;

/**
 *
 * @param inMemSize
 * @param elemSize
 * @param pModel
 * @return
H
hzcheng 已提交
139
 */
H
hjxilinx 已提交
140
tExtMemBuffer *createExtMemBuffer(int32_t inMemSize, int32_t elemSize, SColumnModel *pModel);
/**
 *
 * @param pMemBuffer
 * @return
H
hzcheng 已提交
146
 */
H
hjxilinx 已提交
147
void *destoryExtMemBuffer(tExtMemBuffer *pMemBuffer);
/**
 * Put rows into the buffer.
 *
 * @param pMemBuffer  buffer that receives the data
 * @param data        input data pointer
 * @param numOfRows   number of rows in data
 * @return            number of pages in memory
 */
int16_t tExtMemBufferPut(tExtMemBuffer *pMemBuffer, void *data, int32_t numOfRows);

/**
 * Flush the buffer.
 * NOTE(review): presumably writes the in-memory pages to the buffer's file -- confirm against the implementation.
 *
 * @param pMemBuffer  buffer to flush
 * @return            NOTE(review): presumably true on success -- confirm
 */
bool tExtMemBufferFlush(tExtMemBuffer *pMemBuffer);

/**
 * Remove all data that has been put into the buffer, both the part held in
 * the buffer and the part held in the ext-buffer (disk).
 *
 * @param pMemBuffer  buffer to clear
 */
void tExtMemBufferClear(tExtMemBuffer *pMemBuffer);

/*
 * this function should be removed.
 * since the flush-to-disk operation is transparent to the client, this structure should provide
 * stream operations for the data, with an internal cursor pointing to the data.
 *
 * NOTE(review): flushIdx and pageIdx presumably select a flush-out and a page within it; pFilePage
 * presumably receives the loaded page -- confirm against the implementation.
 */
bool tExtMemBufferLoadData(tExtMemBuffer *pMemBuffer, tFilePage *pFilePage, int32_t flushIdx, int32_t pageIdx);

/**
 *
 * @param pMemBuffer
 * @return
 */
H
hzcheng 已提交
184 185
bool tExtMemBufferIsAllDataInMem(tExtMemBuffer *pMemBuffer);

/**
 *
 * @param fields
 * @param numOfCols
 * @param blockCapacity
 * @return
 */
S
slguan 已提交
193
SColumnModel *createColumnModel(SSchema *fields, int32_t numOfCols, int32_t blockCapacity);
/**
 * Clone a column model.
 *
 * @param pSrc  column model to clone
 * @return      the clone; NOTE(review): presumably released with destroyColumnModel() -- confirm
 */
SColumnModel *cloneColumnModel(SColumnModel *pSrc);

/**
 * Destroy a column model.
 *
 * @param pModel  column model to destroy
 */
void destroyColumnModel(SColumnModel *pModel);

/*
 * compress data into a consecutive block without holes in the data
 *
 * NOTE(review): maxElemsCapacity is presumably the row capacity that inputBuffer was laid out for -- confirm
 */
void tColModelCompact(SColumnModel *pModel, tFilePage *inputBuffer, int32_t maxElemsCapacity);

void     tColModelErase(SColumnModel *pModel, tFilePage *inputBuffer, int32_t maxCapacity, int32_t s, int32_t e);
S
slguan 已提交
214
SSchema *getColumnModelSchema(SColumnModel *pColumnModel, int32_t index);
H
hzcheng 已提交
215

H
hjxilinx 已提交
216
int16_t getColumnModelOffset(SColumnModel *pColumnModel, int32_t index);
/* Per-column information passed to tColModelDisplayEx(). */
typedef struct SSrcColumnInfo {
  int32_t functionId;  // NOTE(review): presumably identifies the function applied to the column -- confirm
  int32_t type;        // NOTE(review): presumably the column data type -- confirm
} SSrcColumnInfo;

/*
 * display data in column format model for debug purpose only
 */
H
hjxilinx 已提交
226
void tColModelDisplay(SColumnModel *pModel, void *pData, int32_t numOfRows, int32_t maxCount);
H
hzcheng 已提交
227

H
hjxilinx 已提交
228
void tColModelDisplayEx(SColumnModel *pModel, void *pData, int32_t numOfRows, int32_t maxCount, SSrcColumnInfo *pInfo);
tOrderDescriptor *tOrderDesCreate(const int32_t *orderColIdx, int32_t numOfOrderCols, SColumnModel *pModel,
                                  int32_t tsOrderType);
H
hzcheng 已提交
232 233 234

void tOrderDescDestroy(tOrderDescriptor *pDesc);

H
hjxilinx 已提交
235
void tColModelAppend(SColumnModel *dstModel, tFilePage *dstPage, void *srcData, int32_t srcStartRows,
H
hzcheng 已提交
236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256
                     int32_t numOfRowsToWrite, int32_t srcCapacity);

/*
 * Comparator signature taking two row indexes (idx1, idx2) into the same data block.
 * Note that this type returns int while compare_sa()/compare_sd() are declared to return int32_t.
 */
typedef int (*__col_compar_fn_t)(tOrderDescriptor *pDesc, int32_t numOfRows, int32_t idx1, int32_t idx2, char *data);

/* NOTE(review): presumably sorts rows start..end of data according to pDesc and orderType -- confirm */
void tColDataQSort(tOrderDescriptor *pDesc, int32_t numOfRows, int32_t start, int32_t end, char *data,
                   int32_t orderType);

/* NOTE(review): the "_sa"/"_sd" suffixes presumably mean ascending/descending within one data block -- confirm */
int32_t compare_sa(tOrderDescriptor *pDesc, int32_t numOfRows, int32_t idx1, int32_t idx2, char *data);

int32_t compare_sd(tOrderDescriptor *pDesc, int32_t numOfRows, int32_t idx1, int32_t idx2, char *data);

/* Compare row s1 of data1 with row s2 of data2; NOTE(review): "_a"/"_d" presumably ascending/descending -- confirm */
int32_t compare_a(tOrderDescriptor *pDesc, int32_t numOfRow1, int32_t s1, char *data1, int32_t numOfRow2, int32_t s2,
                  char *data2);

int32_t compare_d(tOrderDescriptor *pDesc, int32_t numOfRow1, int32_t s1, char *data1, int32_t numOfRow2, int32_t s2,
                  char *data2);

#ifdef __cplusplus
}
#endif

#endif  // TDENGINE_TEXTBUFFER_H