tsdbReaderWriter.c 41.1 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "tsdb.h"

H
Hongze Cheng 已提交
18
// SDelFWriter ====================================================
H
Hongze Cheng 已提交
19 20
// Create a writer for a del file and reserve room for its header.
//
// Allocates the writer, opens the file named by tsdbDelFileName() with
// TD_FILE_WRITE | TD_FILE_CREATE, and writes TSDB_FHDR_SIZE zero bytes as a
// placeholder header.
//
// ppWriter: receives the new writer on success, NULL on failure.
// pFile:    del file descriptor; copied into the writer.
// pTsdb:    owning tsdb instance (also used for logging).
//
// Returns 0 on success, otherwise an error code. On failure everything
// acquired inside this function (file handle, writer memory) is released.
int32_t tsdbDelFWriterOpen(SDelFWriter **ppWriter, SDelFile *pFile, STsdb *pTsdb) {
  int32_t      code = 0;
  char         fname[TSDB_FILENAME_LEN];
  char         hdr[TSDB_FHDR_SIZE] = {0};
  SDelFWriter *pDelFWriter = NULL;
  int64_t      n;

  // alloc
  pDelFWriter = (SDelFWriter *)taosMemoryCalloc(1, sizeof(*pDelFWriter));
  if (pDelFWriter == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }
  pDelFWriter->pTsdb = pTsdb;
  pDelFWriter->fDel = *pFile;

  // open
  tsdbDelFileName(pTsdb, pFile, fname);
  pDelFWriter->pWriteH = taosOpenFile(fname, TD_FILE_WRITE | TD_FILE_CREATE);
  if (pDelFWriter->pWriteH == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // placeholder header
  n = taosWriteFile(pDelFWriter->pWriteH, hdr, TSDB_FHDR_SIZE);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  pDelFWriter->fDel.size = TSDB_FHDR_SIZE;
  pDelFWriter->fDel.offset = 0;

  *ppWriter = pDelFWriter;
  return code;

_err:
  tsdbError("vgId:%d, failed to open del file writer since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  // code is already captured, so cleanup may clobber errno freely
  if (pDelFWriter != NULL) {
    if (pDelFWriter->pWriteH != NULL) {
      taosCloseFile(&pDelFWriter->pWriteH);
    }
    taosMemoryFree(pDelFWriter);
  }
  *ppWriter = NULL;
  return code;
}

H
Hongze Cheng 已提交
61 62 63
// Close a del file writer: optionally fsync, close the file handle, free the
// writer's buffers and the writer itself, then set *ppWriter to NULL.
//
// ppWriter: must point at a non-NULL writer (it is dereferenced unconditionally).
// sync:     non-zero to fsync the file before closing.
//
// Returns 0 on success. If fsync or close fails, the error code is returned
// and the writer is left as-is (not freed, *ppWriter not cleared).
int32_t tsdbDelFWriterClose(SDelFWriter **ppWriter, int8_t sync) {
  SDelFWriter *pDelFWriter = *ppWriter;
  STsdb       *pOwner = pDelFWriter->pTsdb;
  int32_t      code = 0;

  if (sync) {
    if (taosFsyncFile(pDelFWriter->pWriteH) < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }
  }

  if (taosCloseFile(&pDelFWriter->pWriteH) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // release every scratch buffer owned by the writer
  for (int32_t i = 0; i < sizeof(pDelFWriter->aBuf) / sizeof(uint8_t *); i++) {
    tFree(pDelFWriter->aBuf[i]);
  }
  taosMemoryFree(pDelFWriter);
  *ppWriter = NULL;

  return code;

_err:
  tsdbError("vgId:%d, failed to close del file writer since %s", TD_VID(pOwner->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
91 92 93 94
// Encode every entry of aDelData into one record and append it to the del file.
//
// The record is built in pWriter->aBuf[0] as: TSDB_FILE_DLMT (u32), the encoded
// entries, then sizeof(TSCKSUM) trailing bytes that taosCalcChecksumAppend()
// is given the whole buffer to fill.
//
// On success pDelIdx->offset / pDelIdx->size describe where the record was
// written and pWriter->fDel.size is advanced by the record size.
// Returns 0 on success, otherwise an error code.
int32_t tsdbWriteDelData(SDelFWriter *pWriter, SArray *aDelData, SDelIdx *pDelIdx) {
  int32_t  code = 0;
  int32_t  nDelData = taosArrayGetSize(aDelData);
  int64_t  size = sizeof(uint32_t);
  int64_t  n = 0;
  uint8_t *pBuf = NULL;

  // first pass: a NULL destination yields only the encoded length
  for (int32_t i = 0; i < nDelData; i++) {
    size += tPutDelData(NULL, taosArrayGet(aDelData, i));
  }
  size += sizeof(TSCKSUM);

  code = tRealloc(&pWriter->aBuf[0], size);
  if (code) goto _err;
  pBuf = pWriter->aBuf[0];

  // second pass: actually encode
  n += tPutU32(pBuf + n, TSDB_FILE_DLMT);
  for (int32_t i = 0; i < nDelData; i++) {
    n += tPutDelData(pBuf + n, taosArrayGet(aDelData, i));
  }
  taosCalcChecksumAppend(0, pBuf, size);

  ASSERT(n + sizeof(TSCKSUM) == size);

  // flush to file
  n = taosWriteFile(pWriter->pWriteH, pBuf, size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  ASSERT(n == size);

  // the record starts where the file previously ended
  pDelIdx->offset = pWriter->fDel.size;
  pDelIdx->size = size;
  pWriter->fDel.size += size;

  return code;

_err:
  tsdbError("vgId:%d, failed to write del data since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
138
// Encode every entry of aDelIdx into one record and append it to the del file.
//
// Record layout in pWriter->aBuf[0]: TSDB_FILE_DLMT (u32), the encoded index
// entries, then sizeof(TSCKSUM) trailing bytes that taosCalcChecksumAppend()
// is given the whole buffer to fill.
//
// On success pWriter->fDel.offset is set to the start of the record and
// pWriter->fDel.size is advanced by the record size.
// Returns 0 on success, otherwise an error code.
int32_t tsdbWriteDelIdx(SDelFWriter *pWriter, SArray *aDelIdx) {
  int32_t code = 0;
  int64_t size;
  int64_t n;

  // prepare: a NULL destination yields only the encoded length
  size = sizeof(uint32_t);
  for (int32_t iDelIdx = 0; iDelIdx < taosArrayGetSize(aDelIdx); iDelIdx++) {
    size += tPutDelIdx(NULL, taosArrayGet(aDelIdx, iDelIdx));
  }
  size += sizeof(TSCKSUM);

  // alloc
  code = tRealloc(&pWriter->aBuf[0], size);
  if (code) goto _err;

  // build
  n = 0;
  n += tPutU32(pWriter->aBuf[0] + n, TSDB_FILE_DLMT);
  for (int32_t iDelIdx = 0; iDelIdx < taosArrayGetSize(aDelIdx); iDelIdx++) {
    n += tPutDelIdx(pWriter->aBuf[0] + n, taosArrayGet(aDelIdx, iDelIdx));
  }
  taosCalcChecksumAppend(0, pWriter->aBuf[0], size);

  ASSERT(n + sizeof(TSCKSUM) == size);

  // write
  n = taosWriteFile(pWriter->pWriteH, pWriter->aBuf[0], size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // same full-write expectation as tsdbWriteDelData: the size bookkeeping
  // below is only valid if the whole record reached the file
  ASSERT(n == size);

  // update
  pWriter->fDel.offset = pWriter->fDel.size;
  pWriter->fDel.size += size;

  return code;

_err:
  tsdbError("vgId:%d, write del idx failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
183 184 185 186 187
// Rewrite the TSDB_FHDR_SIZE-byte header at the start of the del file from
// the writer's current fDel state.
//
// The header buffer is zero-filled, tPutDelFile() encodes pWriter->fDel into
// it, and taosCalcChecksumAppend() is run over the whole buffer before it is
// written at file offset 0.
// Returns 0 on success, otherwise an error code.
int32_t tsdbUpdateDelFileHdr(SDelFWriter *pWriter) {
  int32_t code = 0;
  char    hdr[TSDB_FHDR_SIZE] = {0};
  int64_t size = TSDB_FHDR_SIZE;

  // build the header image
  tPutDelFile(hdr, &pWriter->fDel);
  taosCalcChecksumAppend(0, hdr, size);

  // rewind to the start of the file
  if (taosLSeekFile(pWriter->pWriteH, 0, SEEK_SET) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // overwrite the header in place
  if (taosWriteFile(pWriter->pWriteH, hdr, size) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  return code;

_err:
  tsdbError("vgId:%d, update del file hdr failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}

// SDelFReader ====================================================
struct SDelFReader {
H
Hongze Cheng 已提交
216
  STsdb    *pTsdb;
H
Hongze Cheng 已提交
217
  SDelFile  fDel;
H
Hongze Cheng 已提交
218
  TdFilePtr pReadH;
H
Hongze Cheng 已提交
219

H
Hongze Cheng 已提交
220
  uint8_t *aBuf[1];
H
refact  
Hongze Cheng 已提交
221
};
H
Hongze Cheng 已提交
222

H
Hongze Cheng 已提交
223
// Open a del file for reading.
//
// ppReader: receives the new reader on success, NULL on failure.
// pFile:    del file descriptor; copied into the reader.
// pTsdb:    owning tsdb instance (also used for logging).
//
// Returns 0 on success, otherwise an error code. The reader memory is
// released if the file cannot be opened.
int32_t tsdbDelFReaderOpen(SDelFReader **ppReader, SDelFile *pFile, STsdb *pTsdb) {
  int32_t      code = 0;
  char         fname[TSDB_FILENAME_LEN];
  SDelFReader *pDelFReader;

  // alloc
  pDelFReader = (SDelFReader *)taosMemoryCalloc(1, sizeof(*pDelFReader));
  if (pDelFReader == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }

  // open impl
  pDelFReader->pTsdb = pTsdb;
  pDelFReader->fDel = *pFile;

  tsdbDelFileName(pTsdb, pFile, fname);
  pDelFReader->pReadH = taosOpenFile(fname, TD_FILE_READ);
  if (pDelFReader->pReadH == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    taosMemoryFree(pDelFReader);
    goto _err;
  }

  *ppReader = pDelFReader;
  return code;

_err:
  tsdbError("vgId:%d, del file reader open failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  *ppReader = NULL;
  return code;
}

H
Hongze Cheng 已提交
258 259 260
// Close a del file reader and set *ppReader to NULL.
//
// A NULL *ppReader is accepted and treated as already closed.
// Returns 0 on success. If closing the file handle fails, the error code is
// returned and the reader is left as-is (not freed, *ppReader not cleared).
int32_t tsdbDelFReaderClose(SDelFReader **ppReader) {
  SDelFReader *pDelFReader = *ppReader;

  if (pDelFReader == NULL) {
    *ppReader = NULL;
    return 0;
  }

  if (taosCloseFile(&pDelFReader->pReadH) < 0) {
    return TAOS_SYSTEM_ERROR(errno);
  }

  // release every scratch buffer, then the reader itself
  for (int32_t i = 0; i < sizeof(pDelFReader->aBuf) / sizeof(uint8_t *); i++) {
    tFree(pDelFReader->aBuf[i]);
  }
  taosMemoryFree(pDelFReader);

  *ppReader = NULL;
  return 0;
}

H
Hongze Cheng 已提交
278 279 280 281 282
// Read the del-data record described by pDelIdx and decode it into aDelData.
//
// aDelData is cleared first. The record (pDelIdx->size bytes at
// pDelIdx->offset) is read into pReader->aBuf[0], checked with
// taosCheckChecksumWhole(), and decoded as: a u32 delimiter followed by
// SDelData entries up to the trailing sizeof(TSCKSUM) bytes.
//
// Returns 0 on success; TSDB_CODE_FILE_CORRUPTED on a short read or checksum
// mismatch; TSDB_CODE_OUT_OF_MEMORY if the array cannot grow; otherwise a
// system error code.
int32_t tsdbReadDelData(SDelFReader *pReader, SDelIdx *pDelIdx, SArray *aDelData) {
  int32_t  code = 0;
  int64_t  offset = pDelIdx->offset;
  int64_t  size = pDelIdx->size;
  int64_t  n;
  uint32_t delimiter;

  taosArrayClear(aDelData);

  // seek
  if (taosLSeekFile(pReader->pReadH, offset, SEEK_SET) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // alloc
  code = tRealloc(&pReader->aBuf[0], size);
  if (code) goto _err;

  // read
  n = taosReadFile(pReader->pReadH, pReader->aBuf[0], size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  } else if (n < size) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // check
  if (!taosCheckChecksumWhole(pReader->aBuf[0], size)) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // decode
  n = 0;
  n += tGetU32(pReader->aBuf[0] + n, &delimiter);
  // the writer always starts a record with TSDB_FILE_DLMT; check it the same
  // way the other readers in this file do
  ASSERT(delimiter == TSDB_FILE_DLMT);

  while (n < size - sizeof(TSCKSUM)) {
    SDelData delData;
    n += tGetDelData(pReader->aBuf[0] + n, &delData);

    if (taosArrayPush(aDelData, &delData) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
  }

  ASSERT(n == size - sizeof(TSCKSUM));

  return code;

_err:
  tsdbError("vgId:%d, read del data failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
336 337 338 339 340
// Read the del-index record of the del file and decode it into aDelIdx.
//
// aDelIdx is cleared first. The record spans from pReader->fDel.offset to
// pReader->fDel.size; it is read into pReader->aBuf[0], checked with
// taosCheckChecksumWhole(), and decoded as: a u32 delimiter followed by
// SDelIdx entries up to the trailing sizeof(TSCKSUM) bytes.
//
// Returns 0 on success; TSDB_CODE_FILE_CORRUPTED on a short read or checksum
// mismatch; TSDB_CODE_OUT_OF_MEMORY if the array cannot grow; otherwise a
// system error code.
int32_t tsdbReadDelIdx(SDelFReader *pReader, SArray *aDelIdx) {
  int32_t  code = 0;
  int64_t  n;  // 64-bit: holds the read length and is compared against the 64-bit size
  int64_t  offset = pReader->fDel.offset;
  int64_t  size = pReader->fDel.size - offset;
  uint32_t delimiter;

  taosArrayClear(aDelIdx);

  // seek
  if (taosLSeekFile(pReader->pReadH, offset, SEEK_SET) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // alloc
  code = tRealloc(&pReader->aBuf[0], size);
  if (code) goto _err;

  // read
  n = taosReadFile(pReader->pReadH, pReader->aBuf[0], size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  } else if (n < size) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // check
  if (!taosCheckChecksumWhole(pReader->aBuf[0], size)) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // decode
  n = 0;
  n += tGetU32(pReader->aBuf[0] + n, &delimiter);
  ASSERT(delimiter == TSDB_FILE_DLMT);

  while (n < size - sizeof(TSCKSUM)) {
    SDelIdx delIdx;

    n += tGetDelIdx(pReader->aBuf[0] + n, &delIdx);

    if (taosArrayPush(aDelIdx, &delIdx) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
  }

  ASSERT(n == size - sizeof(TSCKSUM));

  return code;

_err:
  tsdbError("vgId:%d, read del idx failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

// SDataFReader ====================================================
// Open all files of a data file set for reading.
//
// Opens, in order, the head file, the data file, the sma file and each of
// the pSet->nSstF sst files, storing the handles in the new reader.
//
// ppReader: receives the new reader on success, NULL on failure.
// pTsdb:    owning tsdb instance (also used for logging).
// pSet:     file set to open; the reader keeps this pointer (no copy is made).
//
// Returns 0 on success, otherwise an error code. On failure every handle
// opened so far is closed and the reader memory is released.
int32_t tsdbDataFReaderOpen(SDataFReader **ppReader, STsdb *pTsdb, SDFileSet *pSet) {
  int32_t       code = 0;
  SDataFReader *pReader = NULL;
  char          fname[TSDB_FILENAME_LEN];

  // alloc (zero-filled, so unopened handles stay NULL for the cleanup path)
  pReader = (SDataFReader *)taosMemoryCalloc(1, sizeof(*pReader));
  if (pReader == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }
  pReader->pTsdb = pTsdb;
  pReader->pSet = pSet;

  // open impl
  // head
  tsdbHeadFileName(pTsdb, pSet->diskId, pSet->fid, pSet->pHeadF, fname);
  pReader->pHeadFD = taosOpenFile(fname, TD_FILE_READ);
  if (pReader->pHeadFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // data
  tsdbDataFileName(pTsdb, pSet->diskId, pSet->fid, pSet->pDataF, fname);
  pReader->pDataFD = taosOpenFile(fname, TD_FILE_READ);
  if (pReader->pDataFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // sma
  tsdbSmaFileName(pTsdb, pSet->diskId, pSet->fid, pSet->pSmaF, fname);
  pReader->pSmaFD = taosOpenFile(fname, TD_FILE_READ);
  if (pReader->pSmaFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // sst
  for (int32_t iSst = 0; iSst < pSet->nSstF; iSst++) {
    tsdbSstFileName(pTsdb, pSet->diskId, pSet->fid, pSet->aSstF[iSst], fname);
    pReader->aLastFD[iSst] = taosOpenFile(fname, TD_FILE_READ);
    if (pReader->aLastFD[iSst] == NULL) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }
  }

  *ppReader = pReader;
  return code;

_err:
  tsdbError("vgId:%d, tsdb data file reader open failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  // code is already captured; release whatever was acquired before the failure
  if (pReader != NULL) {
    if (pReader->pHeadFD != NULL) taosCloseFile(&pReader->pHeadFD);
    if (pReader->pDataFD != NULL) taosCloseFile(&pReader->pDataFD);
    if (pReader->pSmaFD != NULL) taosCloseFile(&pReader->pSmaFD);
    for (int32_t iSst = 0; iSst < pSet->nSstF; iSst++) {
      if (pReader->aLastFD[iSst] != NULL) taosCloseFile(&pReader->aLastFD[iSst]);
    }
    taosMemoryFree(pReader);
  }
  *ppReader = NULL;
  return code;
}

H
Hongze Cheng 已提交
455
// Close a data file reader: close the head, data, sma and sst file handles,
// free the scratch buffers and the reader, then set *ppReader to NULL.
//
// A NULL *ppReader is accepted and treated as already closed.
// Returns 0 on success. If any close fails, the error code is returned
// immediately and the reader is left as-is (not freed, *ppReader not cleared).
int32_t tsdbDataFReaderClose(SDataFReader **ppReader) {
  int32_t       code = 0;
  SDataFReader *pDataFReader = *ppReader;

  if (pDataFReader == NULL) {
    *ppReader = NULL;
    return code;
  }

  // head file
  if (taosCloseFile(&pDataFReader->pHeadFD) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // data file
  if (taosCloseFile(&pDataFReader->pDataFD) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // sma file
  if (taosCloseFile(&pDataFReader->pSmaFD) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // sst files
  for (int32_t i = 0; i < pDataFReader->pSet->nSstF; i++) {
    if (taosCloseFile(&pDataFReader->aLastFD[i]) < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }
  }

  // scratch buffers, then the reader itself
  for (int32_t i = 0; i < sizeof(pDataFReader->aBuf) / sizeof(uint8_t *); i++) {
    tFree(pDataFReader->aBuf[i]);
  }
  taosMemoryFree(pDataFReader);

  *ppReader = NULL;
  return code;

_err:
  tsdbError("vgId:%d, data file reader close failed since %s", TD_VID(pDataFReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
499 500 501
// Read the block-index record of the head file and decode it into aBlockIdx.
//
// aBlockIdx is cleared first. The record spans from pHeadF->offset to
// pHeadF->size; a zero-length record leaves the array empty and returns 0.
// Otherwise it is read into pReader->aBuf[0], checked with
// taosCheckChecksumWhole(), and decoded as: a u32 delimiter followed by
// SBlockIdx entries up to the trailing sizeof(TSCKSUM) bytes.
//
// Returns 0 on success; TSDB_CODE_FILE_CORRUPTED on a short read or checksum
// mismatch; TSDB_CODE_OUT_OF_MEMORY if the array cannot grow; otherwise a
// system error code.
int32_t tsdbReadBlockIdx(SDataFReader *pReader, SArray *aBlockIdx) {
  int32_t  code = 0;
  int64_t  offset = pReader->pSet->pHeadF->offset;
  int64_t  size = pReader->pSet->pHeadF->size - offset;
  int64_t  nDecoded;
  int64_t  nRead;
  uint32_t delimiter;

  taosArrayClear(aBlockIdx);
  if (size == 0) {
    return code;  // nothing stored
  }

  // make room for the whole record
  code = tRealloc(&pReader->aBuf[0], size);
  if (code) goto _err;

  // position at the record
  if (taosLSeekFile(pReader->pHeadFD, offset, SEEK_SET) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // pull it in; anything short of the full record means a damaged file
  nRead = taosReadFile(pReader->pHeadFD, pReader->aBuf[0], size);
  if (nRead < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  if (nRead < size) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // verify checksum
  if (!taosCheckChecksumWhole(pReader->aBuf[0], size)) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // decode: delimiter first, then entries
  nDecoded = tGetU32(pReader->aBuf[0], &delimiter);
  ASSERT(delimiter == TSDB_FILE_DLMT);

  while (nDecoded < size - sizeof(TSCKSUM)) {
    SBlockIdx blockIdx;
    nDecoded += tGetBlockIdx(pReader->aBuf[0] + nDecoded, &blockIdx);

    if (taosArrayPush(aBlockIdx, &blockIdx) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
  }

  ASSERT(nDecoded + sizeof(TSCKSUM) == size);

  return code;

_err:
  tsdbError("vgId:%d, read block idx failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
562
// Read the sst-block index record of sst file iSst and decode it into aSstBlk.
//
// aSstBlk is cleared first. The record spans from aSstF[iSst]->offset to
// aSstF[iSst]->size; a zero-length record leaves the array empty and returns
// 0. Otherwise it is read into pReader->aBuf[0], checked with
// taosCheckChecksumWhole(), and decoded as: a u32 delimiter followed by
// SSstBlk entries up to the trailing sizeof(TSCKSUM) bytes.
//
// iSst is used as an index without any range check here.
//
// Returns 0 on success; TSDB_CODE_FILE_CORRUPTED on a short read or checksum
// mismatch; TSDB_CODE_OUT_OF_MEMORY if the array cannot grow; otherwise a
// system error code.
int32_t tsdbReadSstBlk(SDataFReader *pReader, int32_t iSst, SArray *aSstBlk) {
  int32_t  code = 0;
  int64_t  offset = pReader->pSet->aSstF[iSst]->offset;
  int64_t  size = pReader->pSet->aSstF[iSst]->size - offset;
  int64_t  nDecoded;
  int64_t  nRead;
  uint32_t delimiter;

  taosArrayClear(aSstBlk);
  if (size == 0) {
    return code;  // nothing stored
  }

  // make room for the whole record
  code = tRealloc(&pReader->aBuf[0], size);
  if (code) goto _err;

  // position at the record
  if (taosLSeekFile(pReader->aLastFD[iSst], offset, SEEK_SET) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // pull it in; anything short of the full record means a damaged file
  nRead = taosReadFile(pReader->aLastFD[iSst], pReader->aBuf[0], size);
  if (nRead < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  if (nRead < size) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // verify checksum
  if (!taosCheckChecksumWhole(pReader->aBuf[0], size)) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // decode: delimiter first, then entries
  nDecoded = tGetU32(pReader->aBuf[0], &delimiter);
  ASSERT(delimiter == TSDB_FILE_DLMT);

  while (nDecoded < size - sizeof(TSCKSUM)) {
    SSstBlk sstBlk;
    nDecoded += tGetSstBlk(pReader->aBuf[0] + nDecoded, &sstBlk);

    if (taosArrayPush(aSstBlk, &sstBlk) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
  }

  ASSERT(nDecoded + sizeof(TSCKSUM) == size);

  return code;

_err:
  tsdbError("vgId:%d read blockl failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
625 626 627 628 629 630
// Read the record described by pBlockIdx from the head file and decode it
// into the map mBlock.
//
// The record (pBlockIdx->size bytes at pBlockIdx->offset) is read into
// pReader->aBuf[0], checked with taosCheckChecksumWhole(), and decoded as:
// a u32 delimiter, the map data, then sizeof(TSCKSUM) trailing bytes.
//
// Returns 0 on success; TSDB_CODE_FILE_CORRUPTED on a short read or checksum
// mismatch; TSDB_CODE_OUT_OF_MEMORY when tGetMapData() reports a negative
// result; otherwise a system error code.
int32_t tsdbReadBlock(SDataFReader *pReader, SBlockIdx *pBlockIdx, SMapData *mBlock) {
  int32_t  code = 0;
  int64_t  offset = pBlockIdx->offset;
  int64_t  size = pBlockIdx->size;
  int64_t  nRead;
  int64_t  nDecoded = 0;
  int64_t  nMap;
  uint32_t delimiter;

  // make room for the whole record
  code = tRealloc(&pReader->aBuf[0], size);
  if (code) goto _err;

  // position at the record
  if (taosLSeekFile(pReader->pHeadFD, offset, SEEK_SET) < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // pull it in; anything short of the full record means a damaged file
  nRead = taosReadFile(pReader->pHeadFD, pReader->aBuf[0], size);
  if (nRead < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  if (nRead < size) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // verify checksum
  if (!taosCheckChecksumWhole(pReader->aBuf[0], size)) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // decode: delimiter, then the map payload
  nDecoded += tGetU32(pReader->aBuf[0] + nDecoded, &delimiter);
  ASSERT(delimiter == TSDB_FILE_DLMT);

  nMap = tGetMapData(pReader->aBuf[0] + nDecoded, mBlock);
  if (nMap < 0) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }
  nDecoded += nMap;
  ASSERT(nDecoded + sizeof(TSCKSUM) == size);

  return code;

_err:
  tsdbError("vgId:%d, read block failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
680
// Read the SMA record of a data block from the sma file and decode it into
// aColumnDataAgg.
//
// The record location comes from pDataBlk->smaInfo (size must be > 0). The
// array is cleared, then smaInfo.size + sizeof(TSCKSUM) bytes are read into
// pReader->aBuf[0], checked with taosCheckChecksumWhole(), and decoded as
// consecutive SColumnDataAgg entries covering smaInfo.size bytes.
//
// Returns 0 on success; TSDB_CODE_FILE_CORRUPTED when the seek lands before
// the requested offset, on a short read, or on checksum mismatch;
// TSDB_CODE_OUT_OF_MEMORY if the array cannot grow; otherwise a system error
// code.
int32_t tsdbReadBlockSma(SDataFReader *pReader, SDataBlk *pDataBlk, SArray *aColumnDataAgg) {
  int32_t   code = 0;
  SSmaInfo *pSmaInfo = &pDataBlk->smaInfo;
  int32_t   size;
  int64_t   n;

  ASSERT(pSmaInfo->size > 0);

  taosArrayClear(aColumnDataAgg);

  // payload plus trailing checksum
  size = pSmaInfo->size + sizeof(TSCKSUM);
  code = tRealloc(&pReader->aBuf[0], size);
  if (code) goto _err;

  // position at the record
  n = taosLSeekFile(pReader->pSmaFD, pSmaInfo->offset, SEEK_SET);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  if (n < pSmaInfo->offset) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // pull it in; anything short of the full record means a damaged file
  n = taosReadFile(pReader->pSmaFD, pReader->aBuf[0], size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  if (n < size) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // verify checksum
  if (!taosCheckChecksumWhole(pReader->aBuf[0], size)) {
    code = TSDB_CODE_FILE_CORRUPTED;
    goto _err;
  }

  // decode entries until the payload is consumed
  for (n = 0; n < pSmaInfo->size;) {
    SColumnDataAgg agg;

    n += tGetColumnDataAgg(pReader->aBuf[0] + n, &agg);
    if (taosArrayPush(aColumnDataAgg, &agg) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
  }

  return code;

_err:
  tsdbError("vgId:%d tsdb read block sma failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
738 739
// Read one on-disk block described by pBlkInfo and decode it into pBlockData.
//
// Steps:
//   1. clear pBlockData;
//   2. read the key part (pBlkInfo->szKey bytes at pBlkInfo->offset) and
//      decode the disk data header, then the uid (only when hdr.uid == 0),
//      version and TSKEY columns;
//   3. if pBlockData->aIdx is non-empty, read the SBlockCol list
//      (hdr.szBlkCol bytes) and, for each requested column, either fill
//      hdr.nRow NONE values (column absent on disk), fill hdr.nRow NULL
//      values (flag == HAS_NULL), or read and decompress the column payload.
//
// fromLast: non-zero reads from pReader->aLastFD[0], zero from pReader->pDataFD.
//           NOTE: the sst file index is fixed at 0 here (marked "todo" in the
//           original code).
//
// Returns 0 on success, otherwise the error code of the failing step.
static int32_t tsdbReadBlockDataImpl(SDataFReader *pReader, SBlockInfo *pBlkInfo, int8_t fromLast,
                                     SBlockData *pBlockData) {
  int32_t      code = 0;
  TdFilePtr    pFD;
  SDiskDataHdr hdr;
  uint8_t     *pCur;
  SBlockCol    blockCol = {.cid = 0};
  SBlockCol   *pBlockCol = &blockCol;
  int32_t      nColBytes = 0;  // bytes of the SBlockCol list consumed so far

  tBlockDataClear(pBlockData);

  pFD = fromLast ? pReader->aLastFD[0] : pReader->pDataFD;  // (todo)

  // ---- key part: header + uid + version + tskey
  code = tsdbReadAndCheck(pFD, pBlkInfo->offset, &pReader->aBuf[0], pBlkInfo->szKey, 1);
  if (code) goto _err;

  pCur = pReader->aBuf[0] + tGetDiskDataHdr(pReader->aBuf[0], &hdr);

  ASSERT(hdr.delimiter == TSDB_FILE_DLMT);
  ASSERT(pBlockData->suid == hdr.suid);
  ASSERT(pBlockData->uid == hdr.uid);

  pBlockData->nRow = hdr.nRow;

  // uid column is stored only when the header carries no single uid
  if (hdr.uid == 0) {
    ASSERT(hdr.szUid);
    code = tsdbDecmprData(pCur, hdr.szUid, TSDB_DATA_TYPE_BIGINT, hdr.cmprAlg, (uint8_t **)&pBlockData->aUid,
                          sizeof(int64_t) * hdr.nRow, &pReader->aBuf[1]);
    if (code) goto _err;
  } else {
    ASSERT(!hdr.szUid);
  }
  pCur += hdr.szUid;

  // version column
  code = tsdbDecmprData(pCur, hdr.szVer, TSDB_DATA_TYPE_BIGINT, hdr.cmprAlg, (uint8_t **)&pBlockData->aVersion,
                        sizeof(int64_t) * hdr.nRow, &pReader->aBuf[1]);
  if (code) goto _err;
  pCur += hdr.szVer;

  // timestamp column
  code = tsdbDecmprData(pCur, hdr.szKey, TSDB_DATA_TYPE_TIMESTAMP, hdr.cmprAlg, (uint8_t **)&pBlockData->aTSKEY,
                        sizeof(TSKEY) * hdr.nRow, &pReader->aBuf[1]);
  if (code) goto _err;
  pCur += hdr.szKey;

  ASSERT(pCur - pReader->aBuf[0] == pBlkInfo->szKey - sizeof(TSCKSUM));

  // ---- column part
  if (taosArrayGetSize(pBlockData->aIdx) == 0) goto _exit;

  if (hdr.szBlkCol > 0) {
    // the SBlockCol list follows the key part; aBuf[0] is reused for it
    int64_t colListOffset = pBlkInfo->offset + pBlkInfo->szKey;
    code = tsdbReadAndCheck(pFD, colListOffset, &pReader->aBuf[0], hdr.szBlkCol + sizeof(TSCKSUM), 1);
    if (code) goto _err;
  }

  for (int32_t iCol = 0; iCol < taosArrayGetSize(pBlockData->aIdx); iCol++) {
    SColData *pColData = tBlockDataGetColDataByIdx(pBlockData, iCol);

    // advance through the on-disk column list until reaching a cid >= the
    // requested one, or running out of entries (pBlockCol becomes NULL)
    while (pBlockCol && pBlockCol->cid < pColData->cid) {
      if (nColBytes < hdr.szBlkCol) {
        nColBytes += tGetBlockCol(pReader->aBuf[0] + nColBytes, pBlockCol);
      } else {
        ASSERT(nColBytes == hdr.szBlkCol);
        pBlockCol = NULL;
      }
    }

    // column not present on disk: every row is NONE
    if (pBlockCol == NULL || pBlockCol->cid > pColData->cid) {
      for (int32_t iRow = 0; iRow < hdr.nRow; iRow++) {
        code = tColDataAppendValue(pColData, &COL_VAL_NONE(pColData->cid, pColData->type));
        if (code) goto _err;
      }
      continue;
    }

    ASSERT(pBlockCol->type == pColData->type);
    ASSERT(pBlockCol->flag && pBlockCol->flag != HAS_NONE);

    // column holds only NULLs: nothing stored, every row is NULL
    if (pBlockCol->flag == HAS_NULL) {
      for (int32_t iRow = 0; iRow < hdr.nRow; iRow++) {
        code = tColDataAppendValue(pColData, &COL_VAL_NULL(pBlockCol->cid, pBlockCol->type));
        if (code) goto _err;
      }
      continue;
    }

    // column has stored data: payload sits after key part + column list (+ its checksum)
    int64_t colOffset = pBlkInfo->offset + pBlkInfo->szKey + hdr.szBlkCol + sizeof(TSCKSUM) + pBlockCol->offset;
    int32_t colSize = pBlockCol->szBitmap + pBlockCol->szOffset + pBlockCol->szValue + sizeof(TSCKSUM);

    code = tsdbReadAndCheck(pFD, colOffset, &pReader->aBuf[1], colSize, 0);
    if (code) goto _err;

    code = tsdbDecmprColData(pReader->aBuf[1], pBlockCol, hdr.cmprAlg, hdr.nRow, pColData, &pReader->aBuf[2]);
    if (code) goto _err;
  }

_exit:
  return code;

_err:
  tsdbError("vgId:%d tsdb read block data impl failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
846
// Read a data block, merging all of its sub-blocks, into pBlockData.
//
// Sub-block 0 is read directly into pBlockData. For each further sub-block,
// the sub-block is read into a temporary, the current pBlockData is copied
// into a second temporary, and the two are merged back into pBlockData.
//
// Returns 0 on success, otherwise the error code of the failing step. Both
// temporaries are destroyed on every path that created them.
int32_t tsdbReadDataBlock(SDataFReader *pReader, SDataBlk *pDataBlk, SBlockData *pBlockData) {
  int32_t code = 0;

  code = tsdbReadBlockDataImpl(pReader, &pDataBlk->aSubBlock[0], 0, pBlockData);
  if (code) goto _err;

  if (pDataBlk->nSubBlock > 1) {
    SBlockData bData1;
    SBlockData bData2;

    // create
    code = tBlockDataCreate(&bData1);
    if (code) goto _err;
    code = tBlockDataCreate(&bData2);
    if (code) {
      // bData1 was created successfully and must not be leaked
      tBlockDataDestroy(&bData1, 1);
      goto _err;
    }

    // init
    tBlockDataInitEx(&bData1, pBlockData);
    tBlockDataInitEx(&bData2, pBlockData);

    for (int32_t iSubBlock = 1; iSubBlock < pDataBlk->nSubBlock; iSubBlock++) {
      // next sub-block -> bData1
      code = tsdbReadBlockDataImpl(pReader, &pDataBlk->aSubBlock[iSubBlock], 0, &bData1);
      if (code) break;

      // accumulated result so far -> bData2
      code = tBlockDataCopy(pBlockData, &bData2);
      if (code) break;

      // bData1 + bData2 -> pBlockData
      code = tBlockDataMerge(&bData1, &bData2, pBlockData);
      if (code) break;
    }

    // single cleanup point for success and failure alike
    tBlockDataDestroy(&bData1, 1);
    tBlockDataDestroy(&bData2, 1);
    if (code) goto _err;
  }

  return code;

_err:
  tsdbError("vgId:%d tsdb read data block failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
900
// Read the sst block described by pSstBlk->bInfo into pBlockData by
// delegating to tsdbReadBlockDataImpl() with fromLast = 1.
//
// NOTE(review): iSst is not used in this function; with fromLast = 1 the
// impl reads from pReader->aLastFD[0] — confirm this is intended.
//
// Returns 0 on success, otherwise the error code from the impl.
int32_t tsdbReadSstBlock(SDataFReader *pReader, int32_t iSst, SSstBlk *pSstBlk, SBlockData *pBlockData) {
  int32_t code = tsdbReadBlockDataImpl(pReader, &pSstBlk->bInfo, 1, pBlockData);

  if (code) {
    tsdbError("vgId:%d tsdb read last block failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
  }
  return code;
}
H
Hongze Cheng 已提交
912

H
Hongze Cheng 已提交
913
// Read a whole sst block from sst file iSst and decompress it into pBlockData.
//
// pSstBlk->bInfo.szBlock bytes at pSstBlk->bInfo.offset are read from
// pReader->aLastFD[iSst] into pReader->aBuf[0] via tsdbReadAndCheck(), then
// passed to tDecmprBlockData() with pReader->aBuf[1] as its extra buffer.
//
// Returns 0 on success, otherwise the error code of the failing step
// (nothing is logged here).
int32_t tsdbReadSstBlockEx(SDataFReader *pReader, int32_t iSst, SSstBlk *pSstBlk, SBlockData *pBlockData) {
  int32_t code;

  // fetch the raw block
  code = tsdbReadAndCheck(pReader->aLastFD[iSst], pSstBlk->bInfo.offset, &pReader->aBuf[0], pSstBlk->bInfo.szBlock, 0);
  if (code) {
    return code;
  }

  // decompress into the caller's block data
  return tDecmprBlockData(pReader->aBuf[0], pSstBlk->bInfo.szBlock, pBlockData, &pReader->aBuf[1]);
}

H
Hongze Cheng 已提交
928 929
// SDataFWriter ====================================================
// Create an SDataFWriter for the file set described by pSet and open the
// files it writes to.
//
// File handling:
//   - head file: always created/truncated; a zeroed TSDB_FHDR_SIZE placeholder
//     header is written and fHead.size is advanced by TSDB_FHDR_SIZE.
//   - data / sma files: created/truncated with a placeholder header when the
//     recorded size is 0; otherwise opened for writing and positioned at the
//     end (the end offset is asserted to equal the recorded size).
//   - sst file: only the last one (index nSstF - 1) is opened; it is asserted
//     to have size 0, is created/truncated, and gets a placeholder header.
//
// On success *ppWriter receives the new writer and 0 is returned.
// On failure the error is logged, every file handle opened so far is closed,
// the writer is freed, *ppWriter is set to NULL, and a non-zero code is
// returned. Files already created on disk are not removed.
int32_t tsdbDataFWriterOpen(SDataFWriter **ppWriter, STsdb *pTsdb, SDFileSet *pSet) {
  int32_t       code = 0;
  int32_t       flag;
  int64_t       n;
  SDataFWriter *pWriter = NULL;
  char          fname[TSDB_FILENAME_LEN];
  char          hdr[TSDB_FHDR_SIZE] = {0};

  // alloc (calloc leaves every file handle NULL, which the _err path relies on)
  pWriter = taosMemoryCalloc(1, sizeof(*pWriter));
  if (pWriter == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }
  pWriter->pTsdb = pTsdb;
  pWriter->wSet = (SDFileSet){
      .diskId = pSet->diskId,
      .fid = pSet->fid,
      .pHeadF = &pWriter->fHead,
      .pDataF = &pWriter->fData,
      .pSmaF = &pWriter->fSma,
      .nSstF = pSet->nSstF  //
  };
  pWriter->fHead = *pSet->pHeadF;
  pWriter->fData = *pSet->pDataF;
  pWriter->fSma = *pSet->pSmaF;
  for (int8_t iSst = 0; iSst < pSet->nSstF; iSst++) {
    pWriter->wSet.aSstF[iSst] = &pWriter->fSst[iSst];
    pWriter->fSst[iSst] = *pSet->aSstF[iSst];
  }

  // head
  flag = TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC;
  tsdbHeadFileName(pTsdb, pWriter->wSet.diskId, pWriter->wSet.fid, &pWriter->fHead, fname);
  pWriter->pHeadFD = taosOpenFile(fname, flag);
  if (pWriter->pHeadFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  n = taosWriteFile(pWriter->pHeadFD, hdr, TSDB_FHDR_SIZE);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  ASSERT(n == TSDB_FHDR_SIZE);

  pWriter->fHead.size += TSDB_FHDR_SIZE;

  // data
  if (pWriter->fData.size == 0) {
    flag = TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC;
  } else {
    flag = TD_FILE_WRITE;
  }
  tsdbDataFileName(pTsdb, pWriter->wSet.diskId, pWriter->wSet.fid, &pWriter->fData, fname);
  pWriter->pDataFD = taosOpenFile(fname, flag);
  if (pWriter->pDataFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  if (pWriter->fData.size == 0) {
    n = taosWriteFile(pWriter->pDataFD, hdr, TSDB_FHDR_SIZE);
    if (n < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    pWriter->fData.size += TSDB_FHDR_SIZE;
  } else {
    n = taosLSeekFile(pWriter->pDataFD, 0, SEEK_END);
    if (n < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    ASSERT(n == pWriter->fData.size);
  }

  // sma
  if (pWriter->fSma.size == 0) {
    flag = TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC;
  } else {
    flag = TD_FILE_WRITE;
  }
  tsdbSmaFileName(pTsdb, pWriter->wSet.diskId, pWriter->wSet.fid, &pWriter->fSma, fname);
  pWriter->pSmaFD = taosOpenFile(fname, flag);
  if (pWriter->pSmaFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  if (pWriter->fSma.size == 0) {
    n = taosWriteFile(pWriter->pSmaFD, hdr, TSDB_FHDR_SIZE);
    if (n < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    pWriter->fSma.size += TSDB_FHDR_SIZE;
  } else {
    n = taosLSeekFile(pWriter->pSmaFD, 0, SEEK_END);
    if (n < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    ASSERT(n == pWriter->fSma.size);
  }

  // sst
  ASSERT(pWriter->fSst[pSet->nSstF - 1].size == 0);
  flag = TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC;
  tsdbSstFileName(pTsdb, pWriter->wSet.diskId, pWriter->wSet.fid, &pWriter->fSst[pSet->nSstF - 1], fname);
  pWriter->pLastFD = taosOpenFile(fname, flag);
  if (pWriter->pLastFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  n = taosWriteFile(pWriter->pLastFD, hdr, TSDB_FHDR_SIZE);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  pWriter->fSst[pWriter->wSet.nSstF - 1].size += TSDB_FHDR_SIZE;

  *ppWriter = pWriter;
  return code;

_err:
  // `code` was captured before any cleanup call could disturb errno.
  tsdbError("vgId:%d, tsdb data file writer open failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  if (pWriter != NULL) {
    // Best-effort release: close whatever was opened, then drop the writer so
    // a failed open does not leak handles or memory.
    if (pWriter->pHeadFD != NULL) taosCloseFile(&pWriter->pHeadFD);
    if (pWriter->pDataFD != NULL) taosCloseFile(&pWriter->pDataFD);
    if (pWriter->pSmaFD != NULL) taosCloseFile(&pWriter->pSmaFD);
    if (pWriter->pLastFD != NULL) taosCloseFile(&pWriter->pLastFD);
    taosMemoryFree(pWriter);
  }
  *ppWriter = NULL;
  return code;
}

H
Hongze Cheng 已提交
1064
// Close the writer referenced by *ppWriter and release it.
//
// When sync is non-zero the head, data, sma and last handles are fsync'ed
// (in that order) before anything is closed. The same four handles are then
// closed in the same order, the writer's aBuf entries are freed, the writer
// itself is freed and *ppWriter is set to NULL.
//
// A NULL *ppWriter is a no-op that returns 0.
//
// NOTE(review): the first fsync/close failure logs and returns immediately;
// the remaining handles, the buffers and the writer are left untouched and
// *ppWriter is NOT cleared in that case.
int32_t tsdbDataFWriterClose(SDataFWriter **ppWriter, int8_t sync) {
  int32_t       code = 0;
  STsdb        *pTsdb = NULL;
  SDataFWriter *pWriter = *ppWriter;
  TdFilePtr    *apFD[4];
  int32_t       nFD = (int32_t)(sizeof(apFD) / sizeof(apFD[0]));

  if (pWriter == NULL) {
    *ppWriter = NULL;
    return code;
  }

  pTsdb = pWriter->pTsdb;

  // processing order: head, data, sma, last
  apFD[0] = &pWriter->pHeadFD;
  apFD[1] = &pWriter->pDataFD;
  apFD[2] = &pWriter->pSmaFD;
  apFD[3] = &pWriter->pLastFD;

  if (sync) {
    for (int32_t iFD = 0; iFD < nFD; iFD++) {
      if (taosFsyncFile(*apFD[iFD]) < 0) {
        code = TAOS_SYSTEM_ERROR(errno);
        goto _err;
      }
    }
  }

  for (int32_t iFD = 0; iFD < nFD; iFD++) {
    if (taosCloseFile(apFD[iFD]) < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }
  }

  for (int32_t iBuf = 0; iBuf < sizeof(pWriter->aBuf) / sizeof(uint8_t *); iBuf++) {
    tFree(pWriter->aBuf[iBuf]);
  }
  taosMemoryFree(pWriter);

  *ppWriter = NULL;
  return code;

_err:
  tsdbError("vgId:%d, data file writer close failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1126
int32_t tsdbUpdateDFileSetHeader(SDataFWriter *pWriter) {
H
Hongze Cheng 已提交
1127
  int32_t code = 0;
H
Hongze Cheng 已提交
1128 1129
  int64_t n;
  char    hdr[TSDB_FHDR_SIZE];
H
Hongze Cheng 已提交
1130 1131

  // head ==============
H
Hongze Cheng 已提交
1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146
  memset(hdr, 0, TSDB_FHDR_SIZE);
  tPutHeadFile(hdr, &pWriter->fHead);
  taosCalcChecksumAppend(0, hdr, TSDB_FHDR_SIZE);

  n = taosLSeekFile(pWriter->pHeadFD, 0, SEEK_SET);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  n = taosWriteFile(pWriter->pHeadFD, hdr, TSDB_FHDR_SIZE);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
H
Hongze Cheng 已提交
1147 1148

  // data ==============
H
Hongze Cheng 已提交
1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163
  memset(hdr, 0, TSDB_FHDR_SIZE);
  tPutDataFile(hdr, &pWriter->fData);
  taosCalcChecksumAppend(0, hdr, TSDB_FHDR_SIZE);

  n = taosLSeekFile(pWriter->pDataFD, 0, SEEK_SET);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  n = taosWriteFile(pWriter->pDataFD, hdr, TSDB_FHDR_SIZE);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
H
Hongze Cheng 已提交
1164

H
Hongze Cheng 已提交
1165
  // sma ==============
H
Hongze Cheng 已提交
1166
  memset(hdr, 0, TSDB_FHDR_SIZE);
H
Hongze Cheng 已提交
1167
  tPutSmaFile(hdr, &pWriter->fSma);
H
Hongze Cheng 已提交
1168 1169
  taosCalcChecksumAppend(0, hdr, TSDB_FHDR_SIZE);

H
Hongze Cheng 已提交
1170
  n = taosLSeekFile(pWriter->pSmaFD, 0, SEEK_SET);
H
Hongze Cheng 已提交
1171 1172 1173 1174 1175
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

H
Hongze Cheng 已提交
1176
  n = taosWriteFile(pWriter->pSmaFD, hdr, TSDB_FHDR_SIZE);
H
Hongze Cheng 已提交
1177 1178 1179 1180
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
H
Hongze Cheng 已提交
1181

H
Hongze Cheng 已提交
1182
  // sst ==============
H
Hongze Cheng 已提交
1183
  memset(hdr, 0, TSDB_FHDR_SIZE);
H
Hongze Cheng 已提交
1184
  tPutSstFile(hdr, &pWriter->fSst[pWriter->wSet.nSstF - 1]);
H
Hongze Cheng 已提交
1185 1186
  taosCalcChecksumAppend(0, hdr, TSDB_FHDR_SIZE);

H
Hongze Cheng 已提交
1187
  n = taosLSeekFile(pWriter->pLastFD, 0, SEEK_SET);
H
Hongze Cheng 已提交
1188 1189 1190 1191 1192
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

H
Hongze Cheng 已提交
1193
  n = taosWriteFile(pWriter->pLastFD, hdr, TSDB_FHDR_SIZE);
H
Hongze Cheng 已提交
1194 1195 1196 1197
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
H
Hongze Cheng 已提交
1198 1199 1200 1201

  return code;

_err:
S
Shengliang Guan 已提交
1202
  tsdbError("vgId:%d, update DFileSet header failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
H
Hongze Cheng 已提交
1203 1204 1205
  return code;
}

H
Hongze Cheng 已提交
1206
// Serialize every SBlockIdx in aBlockIdx and append the result to the head
// file.
//
// Layout written: TSDB_FILE_DLMT (u32) | encoded block indexes | checksum.
// The encoding is staged in pWriter->aBuf[0].
//
// On success pHeadFile->offset is set to the position where the section
// starts and pHeadFile->size grows by the number of bytes written. When the
// array is empty nothing is written and offset is simply set to the current
// size.
//
// Returns 0 on success, or a non-zero code (logged) if the buffer cannot be
// grown or the write fails.
int32_t tsdbWriteBlockIdx(SDataFWriter *pWriter, SArray *aBlockIdx) {
  int32_t    code = 0;
  SHeadFile *pHeadFile = &pWriter->fHead;
  int64_t    size = 0;
  int64_t    n;
  // Taken once as int32_t: it is compared against int32_t loop counters and
  // printed with "%d" below, so the argument type must match the conversion.
  int32_t    nBlockIdx = (int32_t)taosArrayGetSize(aBlockIdx);

  // check
  if (nBlockIdx == 0) {
    pHeadFile->offset = pHeadFile->size;
    goto _exit;
  }

  // prepare
  size = sizeof(uint32_t);
  for (int32_t iBlockIdx = 0; iBlockIdx < nBlockIdx; iBlockIdx++) {
    size += tPutBlockIdx(NULL, taosArrayGet(aBlockIdx, iBlockIdx));
  }
  size += sizeof(TSCKSUM);

  // alloc
  code = tRealloc(&pWriter->aBuf[0], size);
  if (code) goto _err;

  // build
  n = tPutU32(pWriter->aBuf[0], TSDB_FILE_DLMT);
  for (int32_t iBlockIdx = 0; iBlockIdx < nBlockIdx; iBlockIdx++) {
    n += tPutBlockIdx(pWriter->aBuf[0] + n, taosArrayGet(aBlockIdx, iBlockIdx));
  }
  taosCalcChecksumAppend(0, pWriter->aBuf[0], size);

  ASSERT(n + sizeof(TSCKSUM) == size);

  // write
  n = taosWriteFile(pWriter->pHeadFD, pWriter->aBuf[0], size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // update
  pHeadFile->offset = pHeadFile->size;
  pHeadFile->size += size;

_exit:
  tsdbTrace("vgId:%d write block idx, offset:%" PRId64 " size:%" PRId64 " nBlockIdx:%d", TD_VID(pWriter->pTsdb->pVnode),
            pHeadFile->offset, size, nBlockIdx);
  return code;

_err:
  tsdbError("vgId:%d, write block idx failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1260 1261 1262 1263 1264
// Serialize mBlock and append it to the head file.
//
// Layout written: TSDB_FILE_DLMT (u32) | encoded map data | checksum, staged
// in pWriter->aBuf[0]. mBlock must contain at least one item (asserted).
//
// On success pBlockIdx->offset / pBlockIdx->size record where the section
// landed in the head file and how long it is, and the head file's tracked
// size grows by the same amount.
//
// Returns 0 on success, or a non-zero code (logged) if the buffer cannot be
// grown or the write fails.
int32_t tsdbWriteBlock(SDataFWriter *pWriter, SMapData *mBlock, SBlockIdx *pBlockIdx) {
  SHeadFile *pHead = &pWriter->fHead;
  int32_t    code = 0;
  int64_t    nTotal;
  int64_t    nDone;

  ASSERT(mBlock->nItem > 0);

  // size the staging buffer
  nTotal = sizeof(uint32_t) + tPutMapData(NULL, mBlock) + sizeof(TSCKSUM);
  code = tRealloc(&pWriter->aBuf[0], nTotal);
  if (code) goto _err;

  // encode: delimiter first, then the map, then the trailing checksum
  nDone = tPutU32(pWriter->aBuf[0], TSDB_FILE_DLMT);
  nDone += tPutMapData(pWriter->aBuf[0] + nDone, mBlock);
  taosCalcChecksumAppend(0, pWriter->aBuf[0], nTotal);

  ASSERT(nDone + sizeof(TSCKSUM) == nTotal);

  // flush to the head file
  nDone = taosWriteFile(pWriter->pHeadFD, pWriter->aBuf[0], nTotal);
  if (nDone < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // bookkeeping
  pBlockIdx->offset = pHead->size;
  pBlockIdx->size = nTotal;
  pHead->size += nTotal;

  tsdbTrace("vgId:%d, write block, file ID:%d commit ID:%d suid:%" PRId64 " uid:%" PRId64 " offset:%" PRId64
            " size:%" PRId64 " nItem:%d",
            TD_VID(pWriter->pTsdb->pVnode), pWriter->wSet.fid, pHead->commitID, pBlockIdx->suid, pBlockIdx->uid,
            pBlockIdx->offset, pBlockIdx->size, mBlock->nItem);
  return code;

_err:
  tsdbError("vgId:%d, write block failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1304
// Serialize every SSstBlk in aSstBlk and append the result to the last sst
// file of the writer (index nSstF - 1).
//
// Layout written: TSDB_FILE_DLMT (u32) | encoded sst blocks | checksum,
// staged in pWriter->aBuf[0].
//
// On success pSstFile->offset is set to where the section starts and
// pSstFile->size grows by the number of bytes written. When the array is
// empty nothing is written and offset is simply set to the current size.
//
// Returns 0 on success, or a non-zero code (logged) if the buffer cannot be
// grown or the write fails.
int32_t tsdbWriteSstBlk(SDataFWriter *pWriter, SArray *aSstBlk) {
  int32_t   code = 0;
  SSstFile *pSstFile = &pWriter->fSst[pWriter->wSet.nSstF - 1];
  // Must start at 0: the empty-array path jumps straight to _exit, where
  // `size` is passed to tsdbTrace.
  int64_t   size = 0;
  int64_t   n;
  int32_t   nSstBlk = (int32_t)taosArrayGetSize(aSstBlk);

  // check
  if (nSstBlk == 0) {
    pSstFile->offset = pSstFile->size;
    goto _exit;
  }

  // size
  size = sizeof(uint32_t);  // TSDB_FILE_DLMT
  for (int32_t iBlockL = 0; iBlockL < nSstBlk; iBlockL++) {
    size += tPutSstBlk(NULL, taosArrayGet(aSstBlk, iBlockL));
  }
  size += sizeof(TSCKSUM);

  // alloc
  code = tRealloc(&pWriter->aBuf[0], size);
  if (code) goto _err;

  // encode
  n = 0;
  n += tPutU32(pWriter->aBuf[0] + n, TSDB_FILE_DLMT);
  for (int32_t iBlockL = 0; iBlockL < nSstBlk; iBlockL++) {
    n += tPutSstBlk(pWriter->aBuf[0] + n, taosArrayGet(aSstBlk, iBlockL));
  }
  taosCalcChecksumAppend(0, pWriter->aBuf[0], size);

  ASSERT(n + sizeof(TSCKSUM) == size);

  // write
  n = taosWriteFile(pWriter->pLastFD, pWriter->aBuf[0], size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // update
  pSstFile->offset = pSstFile->size;
  pSstFile->size += size;

_exit:
  tsdbTrace("vgId:%d tsdb write blockl, loffset:%" PRId64 " size:%" PRId64, TD_VID(pWriter->pTsdb->pVnode),
            pSstFile->offset, size);
  return code;

_err:
  tsdbError("vgId:%d tsdb write blockl failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1358
// Fold the rows of pBlockData into the summary fields of pDataBlk.
//
//   - minKey is lowered to the first row's key if that key compares smaller.
//   - maxKey is raised to the last row's key if that key compares larger.
//   - hasDup is set when two adjacent rows share the same timestamp.
//   - minVer / maxVer are widened to cover every row's version.
//   - nRow is increased by the number of rows in pBlockData.
//
// Only the first and last rows are compared against minKey / maxKey.
static void tsdbUpdateBlockInfo(SBlockData *pBlockData, SDataBlk *pDataBlk) {
  for (int32_t iRow = 0; iRow < pBlockData->nRow; iRow++) {
    TSDBKEY rowKey = {.ts = pBlockData->aTSKEY[iRow], .version = pBlockData->aVersion[iRow]};

    if (iRow > 0) {
      // same timestamp as the previous row => duplicate timestamps present
      if (pBlockData->aTSKEY[iRow] == pBlockData->aTSKEY[iRow - 1]) {
        pDataBlk->hasDup = 1;
      }
    } else if (tsdbKeyCmprFn(&pDataBlk->minKey, &rowKey) > 0) {
      pDataBlk->minKey = rowKey;
    }

    if (iRow == pBlockData->nRow - 1) {
      if (tsdbKeyCmprFn(&pDataBlk->maxKey, &rowKey) < 0) {
        pDataBlk->maxKey = rowKey;
      }
    }

    pDataBlk->minVer = TMIN(pDataBlk->minVer, rowKey.version);
    pDataBlk->maxVer = TMAX(pDataBlk->maxVer, rowKey.version);
  }

  pDataBlk->nRow += pBlockData->nRow;
}
H
Hongze Cheng 已提交
1381

H
Hongze Cheng 已提交
1382 1383
// Compute the per-column aggregates of pBlockData and append them to the sma
// file.
//
// Columns with smaOn unset, or of a variable-length type, are skipped. For
// every other column tsdbCalcColDataSMA() fills an SColumnDataAgg that is
// encoded back-to-back into pWriter->aBuf[0]. If at least one aggregate was
// encoded, a checksum is appended and the buffer is written to the sma file.
//
// pSmaInfo->size ends up as the encoded length without the checksum;
// pSmaInfo->offset is the position in the sma file where the record starts.
// Both are 0 when nothing was written. The writer's tracked sma size grows by
// the encoded length plus the checksum.
//
// Returns 0 on success, or a non-zero code (logged) on allocation or write
// failure.
static int32_t tsdbWriteBlockSma(SDataFWriter *pWriter, SBlockData *pBlockData, SSmaInfo *pSmaInfo) {
  int32_t code = 0;

  pSmaInfo->offset = 0;
  pSmaInfo->size = 0;

  // encode one aggregate per eligible column
  for (int32_t iColData = 0; iColData < taosArrayGetSize(pBlockData->aIdx); iColData++) {
    SColData *pColData = tBlockDataGetColDataByIdx(pBlockData, iColData);

    if (pColData->smaOn && !IS_VAR_DATA_TYPE(pColData->type)) {
      SColumnDataAgg sma;
      tsdbCalcColDataSMA(pColData, &sma);

      code = tRealloc(&pWriter->aBuf[0], pSmaInfo->size + tPutColumnDataAgg(NULL, &sma));
      if (code) goto _err;
      pSmaInfo->size += tPutColumnDataAgg(pWriter->aBuf[0] + pSmaInfo->size, &sma);
    }
  }

  // nothing encoded => nothing to write
  if (!pSmaInfo->size) {
    return code;
  }

  // write: payload followed by its checksum
  int32_t size = pSmaInfo->size + sizeof(TSCKSUM);

  code = tRealloc(&pWriter->aBuf[0], size);
  if (code) goto _err;

  taosCalcChecksumAppend(0, pWriter->aBuf[0], size);

  int64_t n = taosWriteFile(pWriter->pSmaFD, pWriter->aBuf[0], size);
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  pSmaInfo->offset = pWriter->fSma.size;
  pWriter->fSma.size += size;

  return code;

_err:
  tsdbError("vgId:%d tsdb write block sma failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}
H
Hongze Cheng 已提交
1427

H
Hongze Cheng 已提交
1428
// Compress pBlockData and append it to either the last sst file (toLast != 0)
// or the data file (toLast == 0); optionally write its SMA record as well.
//
// tCmprBlockData() fills pWriter->aBuf[0..3] and reports each length in
// aBufN[0..3]. The pieces are written in the order 3, 2, 1, 0; pieces 1 and 0
// are skipped when their length is 0. szKey is aBufN[3] + aBufN[2] and
// szBlock is the sum of all four lengths.
//
// pBlkInfo->offset is the target file's tracked size before the write; that
// tracked size grows by szBlock afterwards. If pSmaInfo is non-NULL,
// tsdbWriteBlockSma() is called after the block has been written.
//
// pBlockData must hold at least one row (asserted).
// Returns 0 on success, or a non-zero code (logged) on failure.
int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, SBlockInfo *pBlkInfo, SSmaInfo *pSmaInfo,
                           int8_t cmprAlg, int8_t toLast) {
  int32_t   code = 0;
  int32_t   aBufN[4] = {0};
  TdFilePtr pFD;
  int64_t   n;

  ASSERT(pBlockData->nRow > 0);

  if (toLast) {
    pBlkInfo->offset = pWriter->fSst[pWriter->wSet.nSstF - 1].size;
  } else {
    pBlkInfo->offset = pWriter->fData.size;
  }
  pBlkInfo->szBlock = 0;
  pBlkInfo->szKey = 0;

  code = tCmprBlockData(pBlockData, cmprAlg, NULL, NULL, pWriter->aBuf, aBufN);
  if (code) goto _err;

  // write =================
  if (toLast) {
    pFD = pWriter->pLastFD;
  } else {
    pFD = pWriter->pDataFD;
  }

  pBlkInfo->szKey = aBufN[3] + aBufN[2];
  pBlkInfo->szBlock = aBufN[0] + aBufN[1] + aBufN[2] + aBufN[3];

  for (int32_t iBuf = 3; iBuf >= 0; iBuf--) {
    // pieces 3 and 2 are always written; 1 and 0 only when non-empty
    if (iBuf < 2 && aBufN[iBuf] == 0) continue;

    n = taosWriteFile(pFD, pWriter->aBuf[iBuf], aBufN[iBuf]);
    if (n < 0) {
      code = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }
  }

  // update info
  if (toLast) {
    pWriter->fSst[pWriter->wSet.nSstF - 1].size += pBlkInfo->szBlock;
  } else {
    pWriter->fData.size += pBlkInfo->szBlock;
  }

  // ================= SMA ====================
  if (pSmaInfo) {
    code = tsdbWriteBlockSma(pWriter, pBlockData, pSmaInfo);
    if (code) goto _err;
  }

  tsdbTrace("vgId:%d tsdb write block data, suid:%" PRId64 " uid:%" PRId64 " nRow:%d, offset:%" PRId64 " size:%d",
            TD_VID(pWriter->pTsdb->pVnode), pBlockData->suid, pBlockData->uid, pBlockData->nRow, pBlkInfo->offset,
            pBlkInfo->szBlock);
  return code;

_err:
  tsdbError("vgId:%d tsdb write block data failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
  return code;
}
H
Hongze Cheng 已提交
1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509

int32_t tsdbDFileSetCopy(STsdb *pTsdb, SDFileSet *pSetFrom, SDFileSet *pSetTo) {
  int32_t   code = 0;
  int64_t   n;
  int64_t   size;
  TdFilePtr pOutFD = NULL;  // TODO
  TdFilePtr PInFD = NULL;   // TODO
  char      fNameFrom[TSDB_FILENAME_LEN];
  char      fNameTo[TSDB_FILENAME_LEN];

  // head
H
Hongze Cheng 已提交
1510 1511
  tsdbHeadFileName(pTsdb, pSetFrom->diskId, pSetFrom->fid, pSetFrom->pHeadF, fNameFrom);
  tsdbHeadFileName(pTsdb, pSetTo->diskId, pSetTo->fid, pSetTo->pHeadF, fNameTo);
H
Hongze Cheng 已提交
1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524

  pOutFD = taosOpenFile(fNameTo, TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC);
  if (pOutFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  PInFD = taosOpenFile(fNameFrom, TD_FILE_READ);
  if (PInFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

H
Hongze Cheng 已提交
1525
  n = taosFSendFile(pOutFD, PInFD, 0, pSetFrom->pHeadF->size);
H
Hongze Cheng 已提交
1526 1527 1528 1529 1530 1531 1532 1533
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  taosCloseFile(&pOutFD);
  taosCloseFile(&PInFD);

  // data
H
Hongze Cheng 已提交
1534 1535
  tsdbDataFileName(pTsdb, pSetFrom->diskId, pSetFrom->fid, pSetFrom->pDataF, fNameFrom);
  tsdbDataFileName(pTsdb, pSetTo->diskId, pSetTo->fid, pSetTo->pDataF, fNameTo);
H
Hongze Cheng 已提交
1536 1537 1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548

  pOutFD = taosOpenFile(fNameTo, TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC);
  if (pOutFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  PInFD = taosOpenFile(fNameFrom, TD_FILE_READ);
  if (PInFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

H
Hongze Cheng 已提交
1549
  n = taosFSendFile(pOutFD, PInFD, 0, pSetFrom->pDataF->size);
H
Hongze Cheng 已提交
1550 1551 1552 1553 1554 1555 1556
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  taosCloseFile(&pOutFD);
  taosCloseFile(&PInFD);

H
Hongze Cheng 已提交
1557
  // sst
H
Hongze Cheng 已提交
1558 1559
  tsdbSstFileName(pTsdb, pSetFrom->diskId, pSetFrom->fid, pSetFrom->aSstF[0], fNameFrom);
  tsdbSstFileName(pTsdb, pSetTo->diskId, pSetTo->fid, pSetTo->aSstF[0], fNameTo);
H
Hongze Cheng 已提交
1560

H
Hongze Cheng 已提交
1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572
  pOutFD = taosOpenFile(fNameTo, TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC);
  if (pOutFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  PInFD = taosOpenFile(fNameFrom, TD_FILE_READ);
  if (PInFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

H
Hongze Cheng 已提交
1573
  n = taosFSendFile(pOutFD, PInFD, 0, pSetFrom->aSstF[0]->size);
H
Hongze Cheng 已提交
1574 1575 1576 1577 1578 1579 1580 1581
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  taosCloseFile(&pOutFD);
  taosCloseFile(&PInFD);

  // sma
H
Hongze Cheng 已提交
1582 1583
  tsdbSmaFileName(pTsdb, pSetFrom->diskId, pSetFrom->fid, pSetFrom->pSmaF, fNameFrom);
  tsdbSmaFileName(pTsdb, pSetTo->diskId, pSetTo->fid, pSetTo->pSmaF, fNameTo);
H
Hongze Cheng 已提交
1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596

  pOutFD = taosOpenFile(fNameTo, TD_FILE_WRITE | TD_FILE_CREATE | TD_FILE_TRUNC);
  if (pOutFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  PInFD = taosOpenFile(fNameFrom, TD_FILE_READ);
  if (PInFD == NULL) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

H
Hongze Cheng 已提交
1597
  n = taosFSendFile(pOutFD, PInFD, 0, pSetFrom->pSmaF->size);
H
Hongze Cheng 已提交
1598 1599 1600 1601 1602 1603 1604 1605 1606 1607
  if (n < 0) {
    code = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }
  taosCloseFile(&pOutFD);
  taosCloseFile(&PInFD);

  return code;

_err:
S
Shengliang Guan 已提交
1608
  tsdbError("vgId:%d, tsdb DFileSet copy failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
H
Hongze Cheng 已提交
1609
  return code;
H
Hongze Cheng 已提交
1610
}