tsdbCommit.c 41.6 KB
Newer Older
H
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

H
Hongze Cheng 已提交
16
#include "tsdb.h"
H
Hongze Cheng 已提交
17 18 19 20 21
// Cached schema slot: remembers which (suid, uid) the schema in pTSchema was
// loaded for, so the schema-update helpers can skip a reload on a match.
typedef struct {
  int64_t   suid;      // super-table uid of the cached schema (the update helpers compare it against 0)
  int64_t   uid;       // table uid of the cached schema
  STSchema *pTSchema;  // cached schema; tested for NULL before the cache is consulted
} SSkmInfo;
H
Hongze Cheng 已提交
22

H
Hongze Cheng 已提交
23 24 25 26 27 28
// A row plus the identifiers of the table it belongs to; used as the cursor
// over rows read back from the existing "last" blocks.
typedef struct {
  int64_t suid;  // copied from the block data the row was read from
  int64_t uid;   // table uid of the row
  TSDBROW row;   // the row itself
} SRowInfo;

H
Hongze Cheng 已提交
29
typedef struct {
H
Hongze Cheng 已提交
30
  STsdb *pTsdb;
H
Hongze Cheng 已提交
31
  /* commit data */
H
Hongze Cheng 已提交
32
  int64_t commitID;
H
Hongze Cheng 已提交
33 34
  int32_t minutes;
  int8_t  precision;
H
Hongze Cheng 已提交
35 36
  int32_t minRow;
  int32_t maxRow;
H
Hongze Cheng 已提交
37
  int8_t  cmprAlg;
H
Hongze Cheng 已提交
38
  STsdbFS fs;
H
Hongze Cheng 已提交
39
  // --------------
H
Hongze Cheng 已提交
40
  TSKEY   nextKey;  // reset by each table commit
H
Hongze Cheng 已提交
41 42 43
  int32_t commitFid;
  TSKEY   minKey;
  TSKEY   maxKey;
H
Hongze Cheng 已提交
44
  // commit file data
H
Hongze Cheng 已提交
45 46
  struct {
    SDataFReader *pReader;
H
Hongze Cheng 已提交
47 48 49 50 51 52 53 54 55 56 57 58
    // data
    SArray    *aBlockIdx;  // SArray<SBlockIdx>
    int32_t    iBlockIdx;
    SBlockIdx *pBlockIdx;
    SMapData   mBlock;  // SMapData<SBlock>
    SBlockData bData;
    // last
    SArray    *aBlockL;  // SArray<SBlockL>
    int32_t    iBlockL;
    SBlockL   *pBlockL;
    SBlockData bDatal;
    int32_t    iRow;
H
Hongze Cheng 已提交
59 60
    SRowInfo  *pRowInfo;
    SRowInfo   rowInfo;
H
Hongze Cheng 已提交
61 62 63 64
  } dReader;
  struct {
    SDataFWriter *pWriter;
    SArray       *aBlockIdx;  // SArray<SBlockIdx>
H
Hongze Cheng 已提交
65
    SArray       *aBlockL;    // SArray<SBlockL>
H
Hongze Cheng 已提交
66 67
    SMapData      mBlock;     // SMapData<SBlock>
    SBlockData    bData;
H
Hongze Cheng 已提交
68
    SBlockData    bDatal;
H
Hongze Cheng 已提交
69 70 71
  } dWriter;
  SSkmInfo skmTable;
  SSkmInfo skmRow;
H
Hongze Cheng 已提交
72
  /* commit del */
H
Hongze Cheng 已提交
73 74
  SDelFReader *pDelFReader;
  SDelFWriter *pDelFWriter;
H
Hongze Cheng 已提交
75 76 77
  SArray      *aDelIdx;   // SArray<SDelIdx>
  SArray      *aDelIdxN;  // SArray<SDelIdx>
  SArray      *aDelData;  // SArray<SDelData>
H
Hongze Cheng 已提交
78
} SCommitter;
H
refact  
Hongze Cheng 已提交
79

H
Hongze Cheng 已提交
80 81 82 83 84
// Commit phases driven by tsdbCommit(): start, data, deletes, end.
// tsdbEndCommit() receives the error code of the run (0 on success).
static int32_t tsdbStartCommit(STsdb *pTsdb, SCommitter *pCommitter);
static int32_t tsdbCommitData(SCommitter *pCommitter);
static int32_t tsdbCommitDel(SCommitter *pCommitter);
static int32_t tsdbCommitCache(SCommitter *pCommitter);
static int32_t tsdbEndCommit(SCommitter *pCommitter, int32_t eno);
H
refact  
Hongze Cheng 已提交
85

H
refact  
Hongze Cheng 已提交
86
// Create a fresh memtable and install it as pTsdb->mem under the write lock.
// Returns 0 on success (or when pTsdb is NULL), otherwise the failing step's
// error code; lock failures are mapped through TAOS_SYSTEM_ERROR().
int32_t tsdbBegin(STsdb *pTsdb) {
  if (pTsdb == NULL) return 0;

  SMemTable *pNewMem;
  int32_t    code = tsdbMemTableCreate(pTsdb, &pNewMem);
  bool       failed = (code != 0);

  if (!failed) {
    // lock
    code = taosThreadRwlockWrlock(&pTsdb->rwLock);
    failed = (code != 0);

    if (failed) {
      code = TAOS_SYSTEM_ERROR(code);
    } else {
      pTsdb->mem = pNewMem;

      // unlock
      code = taosThreadRwlockUnlock(&pTsdb->rwLock);
      failed = (code != 0);
      if (failed) {
        code = TAOS_SYSTEM_ERROR(code);
      }
    }
  }

  if (failed) {
    tsdbError("vgId:%d, tsdb begin failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  }
  return code;
}

H
more  
Hongze Cheng 已提交
118
// Commit the current memtable of pTsdb.
//
// If the memtable holds neither rows nor deletes it is detached and
// unreferenced without running the commit phases. Otherwise the phases run in
// order: start -> data -> del -> end. On any failure tsdbEndCommit() is called
// with the error code and that code is returned.
//
// Returns 0 on success or when pTsdb is NULL.
int32_t tsdbCommit(STsdb *pTsdb) {
  if (!pTsdb) return 0;

  int32_t code = 0;
  // Zero-initialized because the error path below passes &commith to
  // tsdbEndCommit() even when tsdbStartCommit() is the step that failed.
  // NOTE(review): tsdbStartCommit() may clear the struct itself -- not visible here.
  SCommitter commith = {0};
  SMemTable *pMemTable = pTsdb->mem;

  // check: nothing to commit
  if (pMemTable->nRow == 0 && pMemTable->nDel == 0) {
    taosThreadRwlockWrlock(&pTsdb->rwLock);
    pTsdb->mem = NULL;
    taosThreadRwlockUnlock(&pTsdb->rwLock);

    tsdbUnrefMemTable(pMemTable);
    goto _exit;
  }

  // start commit
  code = tsdbStartCommit(pTsdb, &commith);
  if (code) goto _err;

  // commit impl
  code = tsdbCommitData(&commith);
  if (code) goto _err;

  code = tsdbCommitDel(&commith);
  if (code) goto _err;

  // end commit
  code = tsdbEndCommit(&commith, 0);
  if (code) goto _err;

_exit:
  return code;

_err:
  tsdbEndCommit(&commith, code);
  tsdbError("vgId:%d, failed to commit since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
159
// Prepare the delete-commit phase: allocate the three working arrays, load the
// index of the existing del file (if the file system has one) and open a writer
// for the new del file.
//
// Returns 0 on success. On failure the arrays allocated here are released and
// their pointers reset to NULL, and the error code is returned.
// NOTE(review): a reader opened before a later failure is still left open here;
// confirm whether the caller's error path is expected to close it.
static int32_t tsdbCommitDelStart(SCommitter *pCommitter) {
  int32_t code = 0;
  STsdb  *pTsdb = pCommitter->pTsdb;

  // Known state first, so the failure path only destroys what this call created.
  pCommitter->aDelIdx = NULL;
  pCommitter->aDelData = NULL;
  pCommitter->aDelIdxN = NULL;

  pCommitter->aDelIdx = taosArrayInit(0, sizeof(SDelIdx));
  if (pCommitter->aDelIdx == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }

  pCommitter->aDelData = taosArrayInit(0, sizeof(SDelData));
  if (pCommitter->aDelData == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }

  pCommitter->aDelIdxN = taosArrayInit(0, sizeof(SDelIdx));
  if (pCommitter->aDelIdxN == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }

  // existing del file: open it and read its index
  SDelFile *pDelFileR = pCommitter->fs.pDelFile;
  if (pDelFileR) {
    code = tsdbDelFReaderOpen(&pCommitter->pDelFReader, pDelFileR, pTsdb, NULL);
    if (code) goto _err;

    code = tsdbReadDelIdx(pCommitter->pDelFReader, pCommitter->aDelIdx, NULL);
    if (code) goto _err;
  }

  // prepare new
  SDelFile wDelFile = {.commitID = pCommitter->commitID, .size = 0, .offset = 0};
  code = tsdbDelFWriterOpen(&pCommitter->pDelFWriter, &wDelFile, pTsdb);
  if (code) goto _err;

  tsdbDebug("vgId:%d, commit del start", TD_VID(pTsdb->pVnode));
  return code;

_err:
  if (pCommitter->aDelIdx) {
    taosArrayDestroy(pCommitter->aDelIdx);
    pCommitter->aDelIdx = NULL;
  }
  if (pCommitter->aDelData) {
    taosArrayDestroy(pCommitter->aDelData);
    pCommitter->aDelData = NULL;
  }
  if (pCommitter->aDelIdxN) {
    taosArrayDestroy(pCommitter->aDelIdxN);
    pCommitter->aDelIdxN = NULL;
  }
  tsdbError("vgId:%d, commit del start failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
205
// Write the delete records of one table into the new del file.
//
// pTbData  - in-memory table data (may be NULL); its pHead list holds new deletes.
// pDelIdx  - index entry of the table in the existing del file (may be NULL).
//
// Records from the existing file (if any) are loaded into aDelData, the
// in-memory records are appended, the combined list is written, and the
// resulting index entry is appended to aDelIdxN. Returns 0 or an error code.
static int32_t tsdbCommitTableDel(SCommitter *pCommitter, STbData *pTbData, SDelIdx *pDelIdx) {
  int32_t   code = 0;
  tb_uid_t  suid;
  tb_uid_t  uid;
  SDelData *pMemHead = NULL;  // head of the in-memory delete list, NULL if there is none

  if (pTbData) {
    suid = pTbData->suid;
    uid = pTbData->uid;
    pMemHead = pTbData->pHead;
  }

  if (pDelIdx == NULL) {
    taosArrayClear(pCommitter->aDelData);

    // neither on-disk nor in-memory deletes for this table
    if (pMemHead == NULL) return code;
  } else {
    // the on-disk index entry takes precedence for the identifiers
    suid = pDelIdx->suid;
    uid = pDelIdx->uid;

    code = tsdbReadDelData(pCommitter->pDelFReader, pDelIdx, pCommitter->aDelData, NULL);
    if (code) goto _err;
  }

  SDelIdx delIdx = {.suid = suid, .uid = uid};

  // memory
  for (SDelData *pItem = pMemHead; pItem != NULL; pItem = pItem->pNext) {
    if (taosArrayPush(pCommitter->aDelData, pItem) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
  }

  // write
  code = tsdbWriteDelData(pCommitter->pDelFWriter, pCommitter->aDelData, NULL, &delIdx);
  if (code) goto _err;

  // put delIdx
  if (taosArrayPush(pCommitter->aDelIdxN, &delIdx) == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }

  return code;

_err:
  tsdbError("vgId:%d, commit table del failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
261 262
// Finish the delete-commit phase: write the new del index, update the file
// header, register the new del file in the committer's file-system view, close
// the writer (and the reader, if one was opened), then release the working arrays.
//
// Returns 0 on success or the first error code encountered.
// NOTE(review): on the error path the arrays and open handles are not released
// here; confirm where that cleanup is expected to happen.
static int32_t tsdbCommitDelEnd(SCommitter *pCommitter) {
  int32_t code = 0;
  STsdb  *pTsdb = pCommitter->pTsdb;

  code = tsdbWriteDelIdx(pCommitter->pDelFWriter, pCommitter->aDelIdxN, NULL);
  if (code) goto _err;

  code = tsdbUpdateDelFileHdr(pCommitter->pDelFWriter);
  if (code) goto _err;

  code = tsdbFSUpsertDelFile(&pCommitter->fs, &pCommitter->pDelFWriter->fDel);
  if (code) goto _err;

  code = tsdbDelFWriterClose(&pCommitter->pDelFWriter, 1);
  if (code) goto _err;

  if (pCommitter->pDelFReader) {
    code = tsdbDelFReaderClose(&pCommitter->pDelFReader);
    if (code) goto _err;
  }

  // release the working arrays and drop the now-stale pointers
  taosArrayDestroy(pCommitter->aDelIdx);
  pCommitter->aDelIdx = NULL;
  taosArrayDestroy(pCommitter->aDelData);
  pCommitter->aDelData = NULL;
  taosArrayDestroy(pCommitter->aDelIdxN);
  pCommitter->aDelIdxN = NULL;

  return code;

_err:
  tsdbError("vgId:%d, commit del end failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
293
// Advance the "last block" row cursor of the reader by one row.
//
// While the current last block still has rows, the cursor moves within it.
// Otherwise the next entry of aBlockL is read into bDatal and the cursor is
// placed on its first row. When no entry is left, dReader.pRowInfo is set to
// NULL. Returns 0 on success or the error code of tsdbReadLastBlock().
static int32_t tsdbCommitterNextLastRow(SCommitter *pCommitter) {
  ASSERT(pCommitter->dReader.pReader);
  ASSERT(pCommitter->dReader.pRowInfo);

  SBlockData *pLastData = &pCommitter->dReader.bDatal;
  SRowInfo   *pInfo = pCommitter->dReader.pRowInfo;

  pCommitter->dReader.iRow += 1;

  if (pCommitter->dReader.iRow >= pLastData->nRow) {
    // current block exhausted: move on to the next last block, if any
    pCommitter->dReader.iBlockL += 1;
    if (pCommitter->dReader.iBlockL >= taosArrayGetSize(pCommitter->dReader.aBlockL)) {
      pCommitter->dReader.pRowInfo = NULL;
      return 0;
    }

    pCommitter->dReader.pBlockL = (SBlockL *)taosArrayGet(pCommitter->dReader.aBlockL, pCommitter->dReader.iBlockL);

    int32_t code = tsdbReadLastBlock(pCommitter->dReader.pReader, pCommitter->dReader.pBlockL, pLastData, NULL, NULL);
    if (code) return code;

    pCommitter->dReader.iRow = 0;
    pInfo->suid = pLastData->suid;  // suid only changes when a new block is loaded
  }

  // publish the row under the cursor; a non-zero block uid applies to every row,
  // otherwise the per-row uid array is used
  const int32_t iCur = pCommitter->dReader.iRow;
  if (pLastData->uid) {
    pInfo->uid = pLastData->uid;
  } else {
    pInfo->uid = pLastData->aUid[iCur];
  }
  pInfo->row = tsdbRowFromBlockData(pLastData, iCur);

  return 0;
}

H
Hongze Cheng 已提交
332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353
// Move the reader to the next SBlockIdx entry and load its block map into
// dReader.mBlock. When no entry is left, dReader.pBlockIdx is set to NULL.
// Returns 0 on success or the error code of tsdbReadBlock().
static int32_t tsdbCommitterNextTableData(SCommitter *pCommitter) {
  ASSERT(pCommitter->dReader.pBlockIdx);

  pCommitter->dReader.iBlockIdx++;

  if (pCommitter->dReader.iBlockIdx >= taosArrayGetSize(pCommitter->dReader.aBlockIdx)) {
    pCommitter->dReader.pBlockIdx = NULL;
    return 0;
  }

  pCommitter->dReader.pBlockIdx =
      (SBlockIdx *)taosArrayGet(pCommitter->dReader.aBlockIdx, pCommitter->dReader.iBlockIdx);

  int32_t code =
      tsdbReadBlock(pCommitter->dReader.pReader, pCommitter->dReader.pBlockIdx, &pCommitter->dReader.mBlock, NULL);
  if (code == 0) {
    ASSERT(pCommitter->dReader.mBlock.nItem > 0);
  }

  return code;
}

H
Hongze Cheng 已提交
354 355 356 357
// Set up reader and writer state for committing one file set.
//
// The file id is derived from nextKey, and minKey/maxKey are set to that file's
// key range. If the file system already has a set with this fid, a reader is
// opened on it and positioned on its first table block index and first last-row.
// Otherwise the reader cursors are set to NULL and a disk is allocated for the
// new set. A writer is then opened and the writer buffers are reset.
// Returns 0 on success or the first error code encountered.
static int32_t tsdbCommitFileDataStart(SCommitter *pCommitter) {
  int32_t code = 0;
  STsdb  *pTsdb = pCommitter->pTsdb;

  // memory
  pCommitter->commitFid = tsdbKeyFid(pCommitter->nextKey, pCommitter->minutes, pCommitter->precision);
  tsdbFidKeyRange(pCommitter->commitFid, pCommitter->minutes, pCommitter->precision, &pCommitter->minKey,
                  &pCommitter->maxKey);
  pCommitter->nextKey = TSKEY_MAX;

  // Descriptors of the files to write. Head and last files always start empty
  // under the new commit id; data and sma files depend on whether a set exists.
  SHeadFile fHead = {.commitID = pCommitter->commitID, .offset = 0, .size = 0, .loffset = 0};
  SDataFile fData;
  SLastFile fLast = {.commitID = pCommitter->commitID, .size = 0};
  SSmaFile  fSma;
  SDFileSet wSet = {.fid = pCommitter->commitFid, .pHeadF = &fHead, .pDataF = &fData, .pLastF = &fLast, .pSmaF = &fSma};

  // look up an existing file set with the same fid
  SDFileSet  searchKey = {.fid = pCommitter->commitFid};
  SDFileSet *pRSet = (SDFileSet *)taosArraySearch(pCommitter->fs.aDFileSet, &searchKey, tDFileSetCmprFn, TD_EQ);

  if (pRSet == NULL) {
    // nothing to merge with
    pCommitter->dReader.pBlockIdx = NULL;
    pCommitter->dReader.pRowInfo = NULL;

    // NOTE(review): the results of tfsAllocDisk()/tfsMkdirRecurAt() are not
    // checked; confirm whether a failure here should abort the commit.
    SDiskID did = {0};
    tfsAllocDisk(pTsdb->pVnode->pTfs, 0, &did);
    tfsMkdirRecurAt(pTsdb->pVnode->pTfs, pTsdb->path, did);

    wSet.diskId = did;
    fData = (SDataFile){.commitID = pCommitter->commitID, .size = 0};
    fSma = (SSmaFile){.commitID = pCommitter->commitID, .size = 0};
  } else {
    // Reader
    code = tsdbDataFReaderOpen(&pCommitter->dReader.pReader, pTsdb, pRSet);
    if (code) goto _err;

    // data: load the block index and position on its first entry
    code = tsdbReadBlockIdx(pCommitter->dReader.pReader, pCommitter->dReader.aBlockIdx, NULL);
    if (code) goto _err;

    pCommitter->dReader.iBlockIdx = 0;
    if (pCommitter->dReader.iBlockIdx >= taosArrayGetSize(pCommitter->dReader.aBlockIdx)) {
      pCommitter->dReader.pBlockIdx = NULL;
    } else {
      pCommitter->dReader.pBlockIdx =
          (SBlockIdx *)taosArrayGet(pCommitter->dReader.aBlockIdx, pCommitter->dReader.iBlockIdx);

      code =
          tsdbReadBlock(pCommitter->dReader.pReader, pCommitter->dReader.pBlockIdx, &pCommitter->dReader.mBlock, NULL);
      if (code) goto _err;
    }
    tBlockDataReset(&pCommitter->dReader.bData);

    // last: load the last-block list and position on its first row
    code = tsdbReadBlockL(pCommitter->dReader.pReader, pCommitter->dReader.aBlockL, NULL);
    if (code) goto _err;

    // both cursors start at -1 so that the first "next" lands on block 0 / row 0
    pCommitter->dReader.iBlockL = -1;
    pCommitter->dReader.iRow = -1;
    pCommitter->dReader.pRowInfo = &pCommitter->dReader.rowInfo;
    tBlockDataReset(&pCommitter->dReader.bDatal);
    code = tsdbCommitterNextLastRow(pCommitter);
    if (code) goto _err;

    // the new set stays on the same disk and carries over the data and sma files
    wSet.diskId = pRSet->diskId;
    fData = *pRSet->pDataF;
    fSma = *pRSet->pSmaF;
  }

  // Writer
  code = tsdbDataFWriterOpen(&pCommitter->dWriter.pWriter, pTsdb, &wSet);
  if (code) goto _err;

  taosArrayClear(pCommitter->dWriter.aBlockIdx);
  taosArrayClear(pCommitter->dWriter.aBlockL);
  tMapDataReset(&pCommitter->dWriter.mBlock);
  tBlockDataReset(&pCommitter->dWriter.bData);
  tBlockDataReset(&pCommitter->dWriter.bDatal);

  return code;

_err:
  tsdbError("vgId:%d, commit file data start failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463
// Make sure pCommitter->skmTable holds the schema for (suid, uid, sver).
//
// The cached schema is reused when the suid matches, the version matches, and
// -- only when suid is 0 -- the uid matches as well. Otherwise the cached schema
// is destroyed and a new one is fetched through metaGetTbTSchemaEx().
//
// Returns 0 on success or the error code of metaGetTbTSchemaEx().
static int32_t tsdbCommitterUpdateTableSchema(SCommitter *pCommitter, int64_t suid, int64_t uid, int32_t sver) {
  SSkmInfo *pSkm = &pCommitter->skmTable;

  if (pSkm->pTSchema != NULL && pSkm->suid == suid && (suid != 0 || pSkm->uid == uid) &&
      sver == pSkm->pTSchema->version) {
    return 0;  // cache hit
  }

  pSkm->suid = suid;
  pSkm->uid = uid;

  // Drop the stale schema and clear the pointer before reloading, so a failed
  // fetch cannot leave a dangling pointer for the next call to use or free.
  tTSchemaDestroy(pSkm->pTSchema);
  pSkm->pTSchema = NULL;

  return metaGetTbTSchemaEx(pCommitter->pTsdb->pVnode->pMeta, suid, uid, sver, &pSkm->pTSchema);
}

// Make sure pCommitter->skmRow holds the schema for (suid, uid, sver).
//
// The cached schema is reused when the suid matches, the version matches, and
// -- only when suid is 0 -- the uid matches as well. Otherwise the cached schema
// is destroyed and a new one is fetched through metaGetTbTSchemaEx().
//
// Returns 0 on success or the error code of metaGetTbTSchemaEx().
static int32_t tsdbCommitterUpdateRowSchema(SCommitter *pCommitter, int64_t suid, int64_t uid, int32_t sver) {
  SSkmInfo *pSkm = &pCommitter->skmRow;

  if (pSkm->pTSchema != NULL && pSkm->suid == suid && (suid != 0 || pSkm->uid == uid) &&
      sver == pSkm->pTSchema->version) {
    return 0;  // cache hit
  }

  pSkm->suid = suid;
  pSkm->uid = uid;

  // Drop the stale schema and clear the pointer before reloading, so a failed
  // fetch cannot leave a dangling pointer for the next call to use or free.
  tTSchemaDestroy(pSkm->pTSchema);
  pSkm->pTSchema = NULL;

  return metaGetTbTSchemaEx(pCommitter->pTsdb->pVnode->pMeta, suid, uid, sver, &pSkm->pTSchema);
}

H
Hongze Cheng 已提交
496
// Flush the rows buffered in dWriter.bData as one (sub-)block.
//
// pBlock - existing block to extend with a new sub-block, or NULL to start a
//          brand-new block.
//
// Block statistics (row count, min/max key, min/max version, duplicate-timestamp
// flag) are updated from the buffered rows, the rows are written, the block
// descriptor is appended to dWriter.mBlock, and the buffer is cleared.
// Returns 0 on success or the first error code encountered.
static int32_t tsdbCommitDataBlock(SCommitter *pCommitter, SBlock *pBlock) {
  int32_t     code = 0;
  SBlockData *pRows = &pCommitter->dWriter.bData;
  SBlock      blk;

  ASSERT(pRows->nRow > 0);

  if (pBlock == NULL) {
    tBlockReset(&blk);  // as a new block
  } else {
    blk = *pBlock;  // as a subblock
  }

  // statistic
  blk.nRow += pRows->nRow;

  if (pRows->nRow > 0) {
    // only the first row can lower the min key and only the last can raise the max key
    TSDBKEY headKey = {.ts = pRows->aTSKEY[0], .version = pRows->aVersion[0]};
    if (tsdbKeyCmprFn(&blk.minKey, &headKey) > 0) {
      blk.minKey = headKey;
    }

    TSDBKEY tailKey = {.ts = pRows->aTSKEY[pRows->nRow - 1], .version = pRows->aVersion[pRows->nRow - 1]};
    if (tsdbKeyCmprFn(&blk.maxKey, &tailKey) < 0) {
      blk.maxKey = tailKey;
    }
  }

  for (int32_t i = 0; i < pRows->nRow; i++) {
    if (i > 0 && pRows->aTSKEY[i] == pRows->aTSKEY[i - 1]) {
      blk.hasDup = 1;
    }

    blk.minVer = TMIN(blk.minVer, pRows->aVersion[i]);
    blk.maxVer = TMAX(blk.maxVer, pRows->aVersion[i]);
  }

  // write
  // NOTE(review): smaInfo is passed only for a first sub-block that HAS duplicate
  // timestamps; confirm this polarity of hasDup is the intended one.
  blk.nSubBlock++;
  code = tsdbWriteBlockData(pCommitter->dWriter.pWriter, pRows, &blk.aSubBlock[blk.nSubBlock - 1],
                            ((blk.nSubBlock == 1) && blk.hasDup) ? &blk.smaInfo : NULL, pCommitter->cmprAlg, 0, NULL);
  if (code) goto _err;

  // put SBlock
  code = tMapDataPutItem(&pCommitter->dWriter.mBlock, &blk, tPutBlock);
  if (code) goto _err;

  // clear
  tBlockDataClearData(pRows);

  return code;

_err:
  tsdbError("vgId:%d tsdb commit data block failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

// Flush the rows buffered in dWriter.bDatal as one "last" block.
//
// Fills an SBlockL descriptor (suid, row count, version range, uid range),
// writes the rows, appends the descriptor to dWriter.aBlockL and clears the
// buffer. Returns 0 on success or the first error code encountered.
static int32_t tsdbCommitLastBlock(SCommitter *pCommitter) {
  int32_t code = 0;
  // Zero-initialized so that any member not assigned below is not copied into
  // aBlockL with an indeterminate value.
  SBlockL     blockL = {0};
  SBlockData *pBlockData = &pCommitter->dWriter.bDatal;

  ASSERT(pBlockData->nRow > 0);

  // statistic
  blockL.suid = pBlockData->suid;
  blockL.nRow = pBlockData->nRow;
  blockL.minVer = VERSION_MAX;
  blockL.maxVer = VERSION_MIN;
  for (int32_t iRow = 0; iRow < pBlockData->nRow; iRow++) {
    blockL.minVer = TMIN(blockL.minVer, pBlockData->aVersion[iRow]);
    blockL.maxVer = TMAX(blockL.maxVer, pBlockData->aVersion[iRow]);
  }
  // a non-zero block uid applies to every row; otherwise take the first and
  // last entries of the per-row uid array
  blockL.minUid = pBlockData->uid ? pBlockData->uid : pBlockData->aUid[0];
  blockL.maxUid = pBlockData->uid ? pBlockData->uid : pBlockData->aUid[pBlockData->nRow - 1];

  // write
  code = tsdbWriteBlockData(pCommitter->dWriter.pWriter, pBlockData, &blockL.bInfo, NULL, pCommitter->cmprAlg, 1, NULL);
  if (code) goto _err;

  // push SBlockL
  if (taosArrayPush(pCommitter->dWriter.aBlockL, &blockL) == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }

  // clear
  tBlockDataClearData(pBlockData);

  return code;

_err:
  tsdbError("vgId:%d tsdb commit last block failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
592
// Merge the rows of an existing data block with in-memory rows of the same table.
//
// The block is read into dReader.bData and merged, in tsdbRowCmprFn() order,
// with the rows delivered by pIter into dWriter.bData. The output is flushed as
// a new block whenever it reaches maxRow * 4 / 5 rows, and once more at the end
// if rows remain. The loop runs until the on-disk block is exhausted; memory
// rows still pending at that point are left in pIter.
// Returns 0 on success or the first error code encountered.
static int32_t tsdbMergeCommitData(SCommitter *pCommitter, STbDataIter *pIter, SBlock *pBlock) {
  int32_t     code = 0;
  STbData    *pTbData = pIter->pTbData;
  SBlockData *pDiskData = &pCommitter->dReader.bData;
  SBlockData *pOutData = &pCommitter->dWriter.bData;

  code = tsdbReadDataBlock(pCommitter->dReader.pReader, pBlock, pDiskData, NULL, NULL);
  if (code) goto _err;

  tBlockDataClearData(pOutData);

  int32_t  iDisk = 0;
  TSDBROW *pMemRow = tsdbTbDataIterGet(pIter);
  TSDBROW  diskRow = tsdbRowFromBlockData(pDiskData, iDisk);
  TSDBROW *pDiskRow = &diskRow;

  while (pDiskRow != NULL) {
    // with no memory row left, the on-disk row is always taken next
    int32_t c = (pMemRow != NULL) ? tsdbRowCmprFn(pMemRow, pDiskRow) : 1;

    if (c < 0) {
      // memory row comes first
      code = tsdbCommitterUpdateRowSchema(pCommitter, pTbData->suid, pTbData->uid, TSDBROW_SVERSION(pMemRow));
      if (code) goto _err;

      code = tBlockDataAppendRow(pOutData, pMemRow, pCommitter->skmRow.pTSchema, pTbData->uid);
      if (code) goto _err;

      tsdbTbDataIterNext(pIter);
      pMemRow = tsdbTbDataIterGet(pIter);
    } else if (c > 0) {
      // on-disk row comes first
      code = tBlockDataAppendRow(pOutData, pDiskRow, NULL, pTbData->uid);
      if (code) goto _err;

      iDisk++;
      if (iDisk < pDiskData->nRow) {
        diskRow = tsdbRowFromBlockData(pDiskData, iDisk);
      } else {
        pDiskRow = NULL;
      }
    } else {
      // equal rows are not expected here
      ASSERT(0);
    }

    // check
    if (pOutData->nRow >= pCommitter->maxRow * 4 / 5) {
      code = tsdbCommitDataBlock(pCommitter, NULL);
      if (code) goto _err;
    }
  }

  // flush the tail
  if (pOutData->nRow > 0) {
    code = tsdbCommitDataBlock(pCommitter, NULL);
    if (code) goto _err;
  }

  return code;

_err:
  tsdbError("vgId:%d, tsdb merge commit data failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
672 673 674
// Commit in-memory rows of one table as new data blocks.
//
// Rows are taken from pIter and appended to dWriter.bData until the iterator is
// exhausted or the next row's key is >= toKey. The row under the iterator on
// entry is appended without being compared against toKey. The buffer is flushed
// whenever it reaches maxRow * 4 / 5 rows and once more when the input ends
// with rows still buffered. Returns 0 on success or the first error code.
static int32_t tsdbCommitTableMemData(SCommitter *pCommitter, STbDataIter *pIter, TSDBKEY toKey) {
  int32_t     code = 0;
  STbData    *pTbData = pIter->pTbData;
  SBlockData *pOut = &pCommitter->dWriter.bData;

  tBlockDataClearData(pOut);

  TSDBROW *pRow = tsdbTbDataIterGet(pIter);
  for (;;) {
    bool flush;

    if (pRow != NULL) {
      // update schema
      code = tsdbCommitterUpdateRowSchema(pCommitter, pTbData->suid, pTbData->uid, TSDBROW_SVERSION(pRow));
      if (code) goto _err;

      // append
      code = tBlockDataAppendRow(pOut, pRow, pCommitter->skmRow.pTSchema, pTbData->uid);
      if (code) goto _err;

      // advance; a row at or beyond toKey ends the input
      tsdbTbDataIterNext(pIter);
      pRow = tsdbTbDataIterGet(pIter);
      if (pRow != NULL) {
        TSDBKEY rowKey = TSDBROW_KEY(pRow);
        if (tsdbKeyCmprFn(&rowKey, &toKey) >= 0) {
          pRow = NULL;
        }
      }

      flush = (pOut->nRow >= pCommitter->maxRow * 4 / 5);
    } else if (pOut->nRow > 0) {
      // input ended with rows still buffered
      flush = true;
    } else {
      break;
    }

    if (flush) {
      code = tsdbCommitDataBlock(pCommitter, NULL);
      if (code) goto _err;
    }
  }

  return code;

_err:
  tsdbError("vgId:%d, tsdb commit table mem data failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
719 720
// Count how many rows, starting at the current position of pIter, have a key
// strictly less than `key`. The count is done on a copy of the iterator, so the
// caller's iterator is not advanced.
//
// A row whose key equals `key` is not expected (asserted). It also ends the
// count, so a build without assertions cannot spin on it forever.
static int32_t tsdbGetNumOfRowsLessThan(STbDataIter *pIter, TSDBKEY key) {
  int32_t     nRow = 0;
  STbDataIter iter = *pIter;

  for (TSDBROW *pRow = tsdbTbDataIterGet(&iter); pRow != NULL; pRow = tsdbTbDataIterGet(&iter)) {
    TSDBKEY rowKey = TSDBROW_KEY(pRow);
    int32_t c = tsdbKeyCmprFn(&rowKey, &key);

    if (c >= 0) {
      ASSERT(c != 0);
      break;
    }

    nRow++;
    tsdbTbDataIterNext(&iter);
  }

  return nRow;
}

// Append in-memory rows to an existing block as an additional sub-block.
//
// Rows are taken from pIter until the iterator is exhausted or the next row's
// key is greater than pBlock->maxKey. The row under the iterator on entry is
// taken without that comparison. The collected rows are then written through
// tsdbCommitDataBlock() with pBlock as the base.
// Returns 0 on success or the first error code encountered.
static int32_t tsdbMergeAsSubBlock(SCommitter *pCommitter, STbDataIter *pIter, SBlock *pBlock) {
  int32_t     code = 0;
  STbData    *pTbData = pIter->pTbData;
  SBlockData *pOut = &pCommitter->dWriter.bData;

  tBlockDataClearData(pOut);

  for (TSDBROW *pRow = tsdbTbDataIterGet(pIter); pRow != NULL;) {
    code = tsdbCommitterUpdateRowSchema(pCommitter, pTbData->suid, pTbData->uid, TSDBROW_SVERSION(pRow));
    if (code) goto _err;

    code = tBlockDataAppendRow(pOut, pRow, pCommitter->skmRow.pTSchema, pTbData->uid);
    if (code) goto _err;

    // advance; stop once the next row lies beyond the block's key range
    tsdbTbDataIterNext(pIter);
    pRow = tsdbTbDataIterGet(pIter);
    if (pRow != NULL) {
      TSDBKEY rowKey = TSDBROW_KEY(pRow);
      if (tsdbKeyCmprFn(&rowKey, &pBlock->maxKey) > 0) {
        pRow = NULL;
      }
    }
  }

  ASSERT(pOut->nRow > 0 && pBlock->nRow + pOut->nRow <= pCommitter->maxRow);

  code = tsdbCommitDataBlock(pCommitter, pBlock);
  if (code) goto _err;

  return code;

_err:
  tsdbError("vgId:%d, tsdb merge as subblock failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
779 780 781 782
/*
 * Commit what is left of one table for the current file set: the remaining
 * in-memory rows with ts <= pCommitter->maxKey, merged with the rows of the
 * same table that the reader currently exposes from the old .last data
 * (pCommitter->dReader.pRowInfo / bDatal).
 *
 * The total number of rows to write (nRow) is computed up front. While rows
 * remain, each round picks a destination:
 *   - nRow <  minRow : rows go to the .last write buffer (dWriter.bDatal)
 *   - nRow >= minRow : rows go to the .data write buffer (dWriter.bData),
 *                      which is committed when nRow hits 0 or the buffer holds
 *                      at least maxRow * 4 / 5 rows
 *
 * pCommitter  commit context
 * pIter       iterator over the table's in-memory rows, advanced as rows are
 *             consumed
 *
 * Returns 0 on success, otherwise the code of the helper that failed.
 */
static int32_t tsdbMergeCommitLast(SCommitter *pCommitter, STbDataIter *pIter) {
  int32_t  code = 0;
  STbData *pTbData = pIter->pTbData;
  // in-memory rows of this table that still belong to the current file set
  int32_t  nRow = tsdbGetNumOfRowsLessThan(pIter, (TSDBKEY){.ts = pCommitter->maxKey + 1, .version = VERSION_MIN});

  // add the rows of this table that are pending in the old .last block
  if (pCommitter->dReader.pRowInfo) {
    if (pCommitter->dReader.pRowInfo->suid) {
      for (int32_t iRow = pCommitter->dReader.iRow; iRow < pCommitter->dReader.bDatal.nRow; iRow++) {
        if (pTbData->uid != pCommitter->dReader.bDatal.aUid[iRow]) break;
        nRow++;
      }
    } else if (pCommitter->dReader.pRowInfo->uid == pTbData->uid) {
      // Only count the block when it belongs to this table. Rows of another
      // table are never consumed below (pRowInfo is dropped on uid mismatch),
      // so counting them would keep nRow from ever reaching 0.
      ASSERT(pCommitter->dReader.iRow == 0);
      nRow += pCommitter->dReader.bDatal.nRow;
    }
  }

  if (nRow == 0) goto _exit;

  // memory side: ignore rows that belong to a later file set
  TSDBROW *pRow = tsdbTbDataIterGet(pIter);
  if (pRow && TSDBROW_TS(pRow) > pCommitter->maxKey) {
    pRow = NULL;
  }

  // disk side: ignore .last rows that belong to another table
  SRowInfo *pRowInfo = pCommitter->dReader.pRowInfo;
  if (pRowInfo && pRowInfo->uid != pTbData->uid) {
    pRowInfo = NULL;
  }

  while (nRow) {
    SBlockData *pBlockData;
    int8_t      toData;

    if (nRow < pCommitter->minRow) {  // to .last
      toData = 0;
      pBlockData = &pCommitter->dWriter.bDatal;

      // commit and reset block data schema if need
      if (pBlockData->nRow > 0) {
        if (pBlockData->suid != pTbData->suid || pBlockData->suid == 0) {
          code = tsdbCommitLastBlock(pCommitter);
          if (code) goto _err;

          tBlockDataReset(pBlockData);
        }
      }

      // set block data schema if need
      if (pBlockData->suid == 0 && pBlockData->uid == 0) {
        code = tBlockDataSetSchema(pBlockData, pCommitter->skmTable.pTSchema, pTbData->suid,
                                   pTbData->suid ? 0 : pTbData->uid);
        if (code) goto _err;
      }

      // flush first if the pending rows would not fit into the buffer
      if (pBlockData->nRow + nRow > pCommitter->maxRow) {
        code = tsdbCommitLastBlock(pCommitter);
        if (code) goto _err;
      }
    } else {  // to .data
      toData = 1;
      pBlockData = &pCommitter->dWriter.bData;
      ASSERT(pBlockData->nRow == 0);
    }

    // both sides have rows: take the smaller one first
    while (pRow && pRowInfo) {
      int32_t c = tsdbRowCmprFn(pRow, &pRowInfo->row);
      if (c < 0) {
        code = tsdbCommitterUpdateRowSchema(pCommitter, pTbData->suid, pTbData->uid, TSDBROW_SVERSION(pRow));
        if (code) goto _err;

        code = tBlockDataAppendRow(pBlockData, pRow, pCommitter->skmRow.pTSchema, pTbData->uid);
        if (code) goto _err;

        tsdbTbDataIterNext(pIter);
        pRow = tsdbTbDataIterGet(pIter);
        if (pRow && TSDBROW_TS(pRow) > pCommitter->maxKey) {
          pRow = NULL;
        }
      } else if (c > 0) {
        code = tBlockDataAppendRow(pBlockData, &pRowInfo->row, NULL, pTbData->uid);
        if (code) goto _err;

        code = tsdbCommitterNextLastRow(pCommitter);
        if (code) goto _err;

        pRowInfo = pCommitter->dReader.pRowInfo;
        if (pRowInfo && pRowInfo->uid != pTbData->uid) {
          pRowInfo = NULL;
        }
      } else {
        // equal rows on both sides are not expected here
        ASSERT(0);
      }

      nRow--;
      if (toData) {
        if (nRow == 0 || pBlockData->nRow >= pCommitter->maxRow * 4 / 5) {
          code = tsdbCommitDataBlock(pCommitter, NULL);
          if (code) goto _err;
          goto _outer_break;
        }
      }
    }

    // only in-memory rows left
    while (pRow) {
      code = tsdbCommitterUpdateRowSchema(pCommitter, pTbData->suid, pTbData->uid, TSDBROW_SVERSION(pRow));
      if (code) goto _err;

      code = tBlockDataAppendRow(pBlockData, pRow, pCommitter->skmRow.pTSchema, pTbData->uid);
      if (code) goto _err;

      tsdbTbDataIterNext(pIter);
      pRow = tsdbTbDataIterGet(pIter);
      if (pRow && TSDBROW_TS(pRow) > pCommitter->maxKey) {
        pRow = NULL;
      }

      nRow--;
      if (toData) {
        if (nRow == 0 || pBlockData->nRow >= pCommitter->maxRow * 4 / 5) {
          code = tsdbCommitDataBlock(pCommitter, NULL);
          if (code) goto _err;
          goto _outer_break;
        }
      }
    }

    // only old .last rows left
    while (pRowInfo) {
      code = tBlockDataAppendRow(pBlockData, &pRowInfo->row, NULL, pTbData->uid);
      if (code) goto _err;

      code = tsdbCommitterNextLastRow(pCommitter);
      if (code) goto _err;

      pRowInfo = pCommitter->dReader.pRowInfo;
      if (pRowInfo && pRowInfo->uid != pTbData->uid) {
        pRowInfo = NULL;
      }

      nRow--;
      if (toData) {
        if (nRow == 0 || pBlockData->nRow >= pCommitter->maxRow * 4 / 5) {
          code = tsdbCommitDataBlock(pCommitter, NULL);
          if (code) goto _err;
          goto _outer_break;
        }
      }
    }

  _outer_break:
    ASSERT(nRow >= 0);
  }

_exit:
  return code;

_err:
  tsdbError("vgId:%d tsdb merge commit last failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
939 940 941 942
/*
 * Commit one table's in-memory rows for the current file set
 * ([pCommitter->minKey, pCommitter->maxKey]).
 *
 * Steps:
 *   1. walk the table's existing blocks (dReader.mBlock, only when the
 *      reader's current block index is for this table) together with the
 *      in-memory rows: blocks that sort before the next row are carried over
 *      unchanged, rows that sort before the block are written by
 *      tsdbCommitTableMemData(), and overlapping ranges are merged;
 *   2. carry over any remaining existing blocks;
 *   3. hand the remaining rows to tsdbMergeCommitLast();
 *   4. if any block was produced, write the table's block map and record its
 *      SBlockIdx in dWriter.aBlockIdx.
 *
 * On the way out (success, or nothing to commit) pCommitter->nextKey is
 * lowered to the timestamp of the first in-memory row that was not consumed.
 *
 * pCommitter  commit context
 * pTbData     in-memory data of the table to commit
 *
 * Returns 0 on success, otherwise the code of the helper that failed.
 */
static int32_t tsdbCommitTableData(SCommitter *pCommitter, STbData *pTbData) {
  int32_t code = 0;

  // the reader must not be positioned before this table
  ASSERT(pCommitter->dReader.pBlockIdx == NULL || tTABLEIDCmprFn(pCommitter->dReader.pBlockIdx, pTbData) >= 0);
  ASSERT(pCommitter->dReader.pRowInfo == NULL || tTABLEIDCmprFn(pCommitter->dReader.pRowInfo, pTbData) >= 0);

  // merge commit table data
  STbDataIter  iter = {0};
  STbDataIter *pIter = &iter;
  TSDBROW     *pRow;

  tsdbTbDataIterOpen(pTbData, &(TSDBKEY){.ts = pCommitter->minKey, .version = VERSION_MIN}, 0, pIter);
  pRow = tsdbTbDataIterGet(pIter);
  if (pRow && TSDBROW_TS(pRow) > pCommitter->maxKey) {
    pRow = NULL;
  }

  // nothing in memory for this file set
  if (pRow == NULL) goto _exit;

  int32_t iBlock = 0;
  SBlock  block;
  SBlock *pBlock = &block;
  if (pCommitter->dReader.pBlockIdx && tTABLEIDCmprFn(pTbData, pCommitter->dReader.pBlockIdx) == 0) {
    tMapDataGetItemByIdx(&pCommitter->dReader.mBlock, iBlock, pBlock, tGetBlock);
  } else {
    // the table has no existing blocks in this file set
    pBlock = NULL;
  }

  code = tsdbCommitterUpdateTableSchema(pCommitter, pTbData->suid, pTbData->uid, pTbData->maxSkmVer);
  if (code) goto _err;

  tMapDataReset(&pCommitter->dWriter.mBlock);
  code = tBlockDataSetSchema(&pCommitter->dWriter.bData, pCommitter->skmTable.pTSchema, pTbData->suid, pTbData->uid);
  if (code) goto _err;

  // .data merge
  while (pBlock && pRow) {
    // compare the block's key range with the single key of the next row
    int32_t c = tBlockCmprFn(pBlock, &(SBlock){.minKey = TSDBROW_KEY(pRow), .maxKey = TSDBROW_KEY(pRow)});
    if (c < 0) {  // disk
      code = tMapDataPutItem(&pCommitter->dWriter.mBlock, pBlock, tPutBlock);
      if (code) goto _err;

      // next
      iBlock++;
      if (iBlock < pCommitter->dReader.mBlock.nItem) {
        tMapDataGetItemByIdx(&pCommitter->dReader.mBlock, iBlock, pBlock, tGetBlock);
      } else {
        pBlock = NULL;
      }
    } else if (c > 0) {  // memory
      code = tsdbCommitTableMemData(pCommitter, pIter, pBlock->minKey);
      if (code) goto _err;

      // next
      pRow = tsdbTbDataIterGet(pIter);
      if (pRow && TSDBROW_TS(pRow) > pCommitter->maxKey) {
        pRow = NULL;
      }
    } else {  // merge
      int32_t nOvlp = tsdbGetNumOfRowsLessThan(pIter, pBlock->maxKey);

      ASSERT(nOvlp > 0);

      // small overlaps are attached to the block, otherwise it is rewritten
      if (pBlock->nRow + nOvlp <= pCommitter->maxRow && pBlock->nSubBlock < TSDB_MAX_SUBBLOCKS) {
        code = tsdbMergeAsSubBlock(pCommitter, pIter, pBlock);
        if (code) goto _err;
      } else {
        code = tsdbMergeCommitData(pCommitter, pIter, pBlock);
        if (code) goto _err;
      }

      // next
      pRow = tsdbTbDataIterGet(pIter);
      if (pRow && TSDBROW_TS(pRow) > pCommitter->maxKey) {
        pRow = NULL;
      }
      iBlock++;
      if (iBlock < pCommitter->dReader.mBlock.nItem) {
        tMapDataGetItemByIdx(&pCommitter->dReader.mBlock, iBlock, pBlock, tGetBlock);
      } else {
        pBlock = NULL;
      }
    }
  }

  // carry over the remaining existing blocks unchanged
  while (pBlock) {
    code = tMapDataPutItem(&pCommitter->dWriter.mBlock, pBlock, tPutBlock);
    if (code) goto _err;

    // next
    iBlock++;
    if (iBlock < pCommitter->dReader.mBlock.nItem) {
      tMapDataGetItemByIdx(&pCommitter->dReader.mBlock, iBlock, pBlock, tGetBlock);
    } else {
      pBlock = NULL;
    }
  }

  // .data append and .last merge
  code = tsdbMergeCommitLast(pCommitter, pIter);
  if (code) goto _err;

  // end
  if (pCommitter->dWriter.mBlock.nItem > 0) {
    SBlockIdx blockIdx = {.suid = pTbData->suid, .uid = pTbData->uid};
    code = tsdbWriteBlock(pCommitter->dWriter.pWriter, &pCommitter->dWriter.mBlock, NULL, &blockIdx);
    if (code) goto _err;

    if (taosArrayPush(pCommitter->dWriter.aBlockIdx, &blockIdx) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
  }

_exit:
  // remember the earliest row left for a later file set
  pRow = tsdbTbDataIterGet(pIter);
  if (pRow) {
    pCommitter->nextKey = TMIN(pCommitter->nextKey, TSDBROW_TS(pRow));
  }

  return code;

_err:
  tsdbError("vgId:%d tsdb commit table data failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1066 1067 1068
/*
 * Finish writing the current file set: write the block index and the .last
 * block list collected in dWriter, update the file set header, upsert the
 * written file set into the committer's file-system copy (pCommitter->fs),
 * then close the writer (second argument 1, "close and sync") and, if one is
 * open, the reader.
 *
 * pCommitter  commit context
 *
 * Returns 0 on success, otherwise the code of the helper that failed.
 */
static int32_t tsdbCommitFileDataEnd(SCommitter *pCommitter) {
  int32_t code = 0;

  // write aBlockIdx
  code = tsdbWriteBlockIdx(pCommitter->dWriter.pWriter, pCommitter->dWriter.aBlockIdx, NULL);
  if (code) goto _err;

  // write aBlockL
  code = tsdbWriteBlockL(pCommitter->dWriter.pWriter, pCommitter->dWriter.aBlockL, NULL);
  if (code) goto _err;

  // update file header
  code = tsdbUpdateDFileSetHeader(pCommitter->dWriter.pWriter);
  if (code) goto _err;

  // upsert SDFileSet
  code = tsdbFSUpsertFSet(&pCommitter->fs, &pCommitter->dWriter.pWriter->wSet);
  if (code) goto _err;

  // close and sync
  code = tsdbDataFWriterClose(&pCommitter->dWriter.pWriter, 1);
  if (code) goto _err;

  // a reader only exists when the file set was already on disk
  if (pCommitter->dReader.pReader) {
    code = tsdbDataFReaderClose(&pCommitter->dReader.pReader);
    if (code) goto _err;
  }

  return code;

_err:
  tsdbError("vgId:%d, commit file data end failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1102 1103 1104
/*
 * Carry over, from the old file set to the new one, the data of every table
 * that sorts strictly before toTable.
 *
 *   .data : while the reader's current block index is before toTable, its
 *           block map (dReader.mBlock) is written as-is and the reader is
 *           advanced to the next table.
 *   .last : while the reader's current .last row is before toTable, all rows
 *           of that row's table are appended to the .last write buffer
 *           (dWriter.bDatal). The buffer is committed first when it holds a
 *           different/normal table's schema or when the rows would not fit.
 *
 * pCommitter  commit context
 * toTable     (suid, uid) upper bound, exclusive
 *
 * Returns 0 on success, otherwise the code of the helper that failed.
 */
static int32_t tsdbMoveCommitData(SCommitter *pCommitter, TABLEID toTable) {
  int32_t code = 0;

  // .data
  while (true) {
    if (pCommitter->dReader.pBlockIdx == NULL || tTABLEIDCmprFn(pCommitter->dReader.pBlockIdx, &toTable) >= 0) break;

    SBlockIdx blockIdx = *pCommitter->dReader.pBlockIdx;
    code = tsdbWriteBlock(pCommitter->dWriter.pWriter, &pCommitter->dReader.mBlock, NULL, &blockIdx);
    if (code) goto _err;

    if (taosArrayPush(pCommitter->dWriter.aBlockIdx, &blockIdx) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }

    code = tsdbCommitterNextTableData(pCommitter);
    if (code) goto _err;
  }

  // .last
  while (true) {
    if (pCommitter->dReader.pRowInfo == NULL || tTABLEIDCmprFn(pCommitter->dReader.pRowInfo, &toTable) >= 0) break;

    SBlockData *pBlockDataR = &pCommitter->dReader.bDatal;
    SBlockData *pBlockDataW = &pCommitter->dWriter.bDatal;
    tb_uid_t    suid = pCommitter->dReader.pRowInfo->suid;
    tb_uid_t    uid = pCommitter->dReader.pRowInfo->uid;

    // a block carries exactly one of suid / uid
    ASSERT((pBlockDataR->suid && !pBlockDataR->uid) || (!pBlockDataR->suid && pBlockDataR->uid));
    ASSERT(pBlockDataR->nRow > 0);

    // commit and reset block data schema if need
    if (pBlockDataW->nRow > 0) {
      if (pBlockDataW->suid != suid || pBlockDataW->suid == 0) {
        code = tsdbCommitLastBlock(pCommitter);
        if (code) goto _err;

        tBlockDataReset(pBlockDataW);
      }
    }

    // set block data schema if need
    if (pBlockDataW->suid == 0 && pBlockDataW->uid == 0) {
      code = tsdbCommitterUpdateTableSchema(pCommitter, suid, uid, 1 /*TODO*/);
      if (code) goto _err;

      code = tBlockDataSetSchema(pBlockDataW, pCommitter->skmTable.pTSchema, suid, suid ? 0 : uid);
      if (code) goto _err;
    }

    // check if it can make sure that one table data in one block
    int32_t nRow = 0;
    if (pBlockDataR->suid) {
      // count the consecutive rows of this table from the read position
      for (int32_t iRow = pCommitter->dReader.iRow; (iRow < pBlockDataR->nRow) && (pBlockDataR->aUid[iRow] == uid);
           iRow++) {
        nRow++;
      }
    } else {
      ASSERT(pCommitter->dReader.iRow == 0);
      nRow = pBlockDataR->nRow;
    }

    ASSERT(nRow > 0 && nRow < pCommitter->minRow);

    // flush first if the table's rows would not fit into the buffer
    if (pBlockDataW->nRow + nRow > pCommitter->maxRow) {
      ASSERT(pBlockDataW->nRow > 0);

      code = tsdbCommitLastBlock(pCommitter);
      if (code) goto _err;
    }

    // pRowInfo is re-read every round: tsdbCommitterNextLastRow() advances it
    while (nRow > 0) {
      code = tBlockDataAppendRow(pBlockDataW, &pCommitter->dReader.pRowInfo->row, NULL, uid);
      if (code) goto _err;

      code = tsdbCommitterNextLastRow(pCommitter);
      if (code) goto _err;

      nRow--;
    }
  }

  return code;

_err:
  tsdbError("vgId:%d tsdb move commit data failed since %s", TD_VID(pCommitter->pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1192
/*
 * Commit one file set. After tsdbCommitFileDataStart() the tables of the
 * immutable memtable (pTsdb->imem) are visited in array order; for each one
 * the old data of all tables sorting before it is carried over
 * (tsdbMoveCommitData) and then the table itself is committed
 * (tsdbCommitTableData). Finally the remaining old data is carried over, a
 * non-empty .last write buffer is committed and the file set is finished with
 * tsdbCommitFileDataEnd().
 *
 * On failure the reader and the writer are closed (writer with second
 * argument 0) before the error is returned.
 *
 * pCommitter  commit context
 *
 * Returns 0 on success, otherwise the code of the helper that failed.
 */
static int32_t tsdbCommitFileData(SCommitter *pCommitter) {
  int32_t    code = 0;
  STsdb     *pTsdb = pCommitter->pTsdb;
  SMemTable *pMemTable = pTsdb->imem;

  // commit file data start
  code = tsdbCommitFileDataStart(pCommitter);
  if (code) goto _err;

  // commit file data impl
  for (int32_t iTbData = 0; iTbData < taosArrayGetSize(pMemTable->aTbData); iTbData++) {
    STbData *pTbData = (STbData *)taosArrayGetP(pMemTable->aTbData, iTbData);

    // move commit until current (suid, uid)
    code = tsdbMoveCommitData(pCommitter, *(TABLEID *)pTbData);
    if (code) goto _err;

    // commit current table data
    code = tsdbCommitTableData(pCommitter, pTbData);
    if (code) goto _err;
  }

  // move whatever old data is left: the bound is above every table id
  code = tsdbMoveCommitData(pCommitter, (TABLEID){.suid = INT64_MAX, .uid = INT64_MAX});
  if (code) goto _err;

  if (pCommitter->dWriter.bDatal.nRow > 0) {
    code = tsdbCommitLastBlock(pCommitter);
    if (code) goto _err;
  }

  // commit file data end
  code = tsdbCommitFileDataEnd(pCommitter);
  if (code) goto _err;

  return code;

_err:
  tsdbError("vgId:%d, commit file data failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  tsdbDataFReaderClose(&pCommitter->dReader.pReader);
  tsdbDataFWriterClose(&pCommitter->dWriter.pWriter, 0);
  return code;
}

H
Hongze Cheng 已提交
1235 1236
// ----------------------------------------------------------------------------
/*
 * Begin a commit: zero the committer, turn the active memtable into the
 * immutable one (pTsdb->mem -> pTsdb->imem) under the write lock, copy the
 * commit parameters from the tsdb/vnode configuration and take a copy of the
 * current file-system state into pCommitter->fs.
 *
 * pTsdb       tsdb instance; must have a memtable and no pending imem
 * pCommitter  commit context to initialize (fully overwritten)
 *
 * Returns 0 on success, otherwise the code returned by tsdbFSCopy().
 */
static int32_t tsdbStartCommit(STsdb *pTsdb, SCommitter *pCommitter) {
  int32_t code = 0;

  memset(pCommitter, 0, sizeof(*pCommitter));
  ASSERT(pTsdb->mem && pTsdb->imem == NULL);

  // swap the memtable under the write lock
  taosThreadRwlockWrlock(&pTsdb->rwLock);
  pTsdb->imem = pTsdb->mem;
  pTsdb->mem = NULL;
  taosThreadRwlockUnlock(&pTsdb->rwLock);

  pCommitter->pTsdb = pTsdb;
  pCommitter->commitID = pTsdb->pVnode->state.commitID;
  pCommitter->minutes = pTsdb->keepCfg.days;
  pCommitter->precision = pTsdb->keepCfg.precision;
  pCommitter->minRow = pTsdb->pVnode->config.tsdbCfg.minRows;
  pCommitter->maxRow = pTsdb->pVnode->config.tsdbCfg.maxRows;
  pCommitter->cmprAlg = pTsdb->pVnode->config.tsdbCfg.compression;

  code = tsdbFSCopy(pTsdb, &pCommitter->fs);
  if (code) goto _err;

  return code;

_err:
  tsdbError("vgId:%d, tsdb start commit failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1265 1266 1267
/*
 * Allocate the reader-side and writer-side containers used while committing
 * data: the block index arrays, the .last block arrays and the four block
 * data buffers (bData / bDatal for reader and writer).
 *
 * Nothing is released here on failure; tsdbCommitData() calls
 * tsdbCommitDataEnd() on its error path.
 *
 * pCommitter  commit context
 *
 * Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY when an array cannot be
 * created, or the code returned by tBlockDataInit().
 */
static int32_t tsdbCommitDataStart(SCommitter *pCommitter) {
  int32_t code = 0;

  // Reader
  pCommitter->dReader.aBlockIdx = taosArrayInit(0, sizeof(SBlockIdx));
  if (pCommitter->dReader.aBlockIdx == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  code = tBlockDataInit(&pCommitter->dReader.bData);
  if (code) goto _exit;

  pCommitter->dReader.aBlockL = taosArrayInit(0, sizeof(SBlockL));
  if (pCommitter->dReader.aBlockL == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  code = tBlockDataInit(&pCommitter->dReader.bDatal);
  if (code) goto _exit;

  // Writer
  pCommitter->dWriter.aBlockIdx = taosArrayInit(0, sizeof(SBlockIdx));
  if (pCommitter->dWriter.aBlockIdx == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  pCommitter->dWriter.aBlockL = taosArrayInit(0, sizeof(SBlockL));
  if (pCommitter->dWriter.aBlockL == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  code = tBlockDataInit(&pCommitter->dWriter.bData);
  if (code) goto _exit;

  code = tBlockDataInit(&pCommitter->dWriter.bDatal);
  if (code) goto _exit;

_exit:
  return code;
}

/*
 * Release the containers created by tsdbCommitDataStart(), the reader and
 * writer block maps, and the two cached schemas (skmTable / skmRow).
 *
 * pCommitter  commit context
 */
static void tsdbCommitDataEnd(SCommitter *pCommitter) {
  // Reader
  taosArrayDestroy(pCommitter->dReader.aBlockIdx);
  tMapDataClear(&pCommitter->dReader.mBlock);
  tBlockDataClear(&pCommitter->dReader.bData, 1);
  taosArrayDestroy(pCommitter->dReader.aBlockL);
  tBlockDataClear(&pCommitter->dReader.bDatal, 1);

  // Writer
  taosArrayDestroy(pCommitter->dWriter.aBlockIdx);
  taosArrayDestroy(pCommitter->dWriter.aBlockL);
  tMapDataClear(&pCommitter->dWriter.mBlock);
  tBlockDataClear(&pCommitter->dWriter.bData, 1);
  tBlockDataClear(&pCommitter->dWriter.bDatal, 1);

  // cached schemas
  tTSchemaDestroy(pCommitter->skmTable.pTSchema);
  tTSchemaDestroy(pCommitter->skmRow.pTSchema);
}

H
Hongze Cheng 已提交
1328 1329 1330 1331
/*
 * Commit the time-series rows of the immutable memtable (pTsdb->imem).
 *
 * Does nothing but log when the memtable holds no rows. Otherwise the commit
 * buffers are set up, tsdbCommitFileData() is called repeatedly, starting at
 * the memtable's minKey, until pCommitter->nextKey reaches TSKEY_MAX, and the
 * buffers are released again (also on failure).
 *
 * NOTE(review): the loop relies on tsdbCommitFileData() advancing nextKey;
 * where it is reset is not visible in this function - confirm in
 * tsdbCommitFileDataStart().
 *
 * pCommitter  commit context
 *
 * Returns 0 on success, otherwise the code of the helper that failed.
 */
static int32_t tsdbCommitData(SCommitter *pCommitter) {
  int32_t    code = 0;
  STsdb     *pTsdb = pCommitter->pTsdb;
  SMemTable *pMemTable = pTsdb->imem;

  // check
  if (pMemTable->nRow == 0) goto _exit;

  // start ====================
  code = tsdbCommitDataStart(pCommitter);
  if (code) goto _err;

  // impl ====================
  pCommitter->nextKey = pMemTable->minKey;
  while (pCommitter->nextKey < TSKEY_MAX) {
    code = tsdbCommitFileData(pCommitter);
    if (code) goto _err;
  }

  // end ====================
  tsdbCommitDataEnd(pCommitter);

_exit:
  tsdbDebug("vgId:%d, commit data done, nRow:%" PRId64, TD_VID(pTsdb->pVnode), pMemTable->nRow);
  return code;

_err:
  // also releases whatever tsdbCommitDataStart() managed to allocate
  tsdbCommitDataEnd(pCommitter);
  tsdbError("vgId:%d, commit data failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}
H
Hongze Cheng 已提交
1359

H
Hongze Cheng 已提交
1360 1361 1362 1363
/*
 * Commit the delete records of the immutable memtable (pTsdb->imem).
 *
 * Does nothing but log when the memtable holds no deletes. Otherwise the
 * memtable's table list (aTbData) and the existing delete index
 * (pCommitter->aDelIdx) are walked in parallel, ordered by tTABLEIDCmprFn():
 *   - table only in memory     -> tsdbCommitTableDel(pTbData, NULL)
 *   - table only in the index  -> tsdbCommitTableDel(NULL, pDelIdx)
 *   - table in both            -> tsdbCommitTableDel(pTbData, pDelIdx)
 *
 * pCommitter  commit context
 *
 * Returns 0 on success, otherwise the code of the helper that failed.
 */
static int32_t tsdbCommitDel(SCommitter *pCommitter) {
  int32_t    code = 0;
  STsdb     *pTsdb = pCommitter->pTsdb;
  SMemTable *pMemTable = pTsdb->imem;

  if (pMemTable->nDel == 0) {
    goto _exit;
  }

  // start
  code = tsdbCommitDelStart(pCommitter);
  if (code) {
    goto _err;
  }

  // impl
  int32_t  iDelIdx = 0;
  int32_t  nDelIdx = taosArrayGetSize(pCommitter->aDelIdx);
  int32_t  iTbData = 0;
  int32_t  nTbData = taosArrayGetSize(pMemTable->aTbData);
  STbData *pTbData;
  SDelIdx *pDelIdx;

  ASSERT(nTbData > 0);

  pTbData = (STbData *)taosArrayGetP(pMemTable->aTbData, iTbData);
  pDelIdx = (iDelIdx < nDelIdx) ? (SDelIdx *)taosArrayGet(pCommitter->aDelIdx, iDelIdx) : NULL;
  while (true) {
    if (pTbData == NULL && pDelIdx == NULL) break;

    // pick the side(s) holding the smallest table id
    if (pTbData && pDelIdx) {
      int32_t c = tTABLEIDCmprFn(pTbData, pDelIdx);

      if (c == 0) {
        goto _commit_mem_and_disk_del;
      } else if (c < 0) {
        goto _commit_mem_del;
      } else {
        goto _commit_disk_del;
      }
    } else if (pTbData) {
      goto _commit_mem_del;
    } else {
      goto _commit_disk_del;
    }

  _commit_mem_del:
    code = tsdbCommitTableDel(pCommitter, pTbData, NULL);
    if (code) goto _err;

    iTbData++;
    pTbData = (iTbData < nTbData) ? (STbData *)taosArrayGetP(pMemTable->aTbData, iTbData) : NULL;
    continue;

  _commit_disk_del:
    code = tsdbCommitTableDel(pCommitter, NULL, pDelIdx);
    if (code) goto _err;

    iDelIdx++;
    pDelIdx = (iDelIdx < nDelIdx) ? (SDelIdx *)taosArrayGet(pCommitter->aDelIdx, iDelIdx) : NULL;
    continue;

  _commit_mem_and_disk_del:
    code = tsdbCommitTableDel(pCommitter, pTbData, pDelIdx);
    if (code) goto _err;

    iTbData++;
    pTbData = (iTbData < nTbData) ? (STbData *)taosArrayGetP(pMemTable->aTbData, iTbData) : NULL;
    iDelIdx++;
    pDelIdx = (iDelIdx < nDelIdx) ? (SDelIdx *)taosArrayGet(pCommitter->aDelIdx, iDelIdx) : NULL;
    continue;
  }

  // end
  code = tsdbCommitDelEnd(pCommitter);
  if (code) {
    goto _err;
  }

_exit:
  tsdbDebug("vgId:%d, commit del done, nDel:%" PRId64, TD_VID(pTsdb->pVnode), pMemTable->nDel);
  return code;

_err:
  tsdbError("vgId:%d, commit del failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
1448
/*
 * Finish a commit: run the first commit phase on the committer's file-system
 * copy (tsdbFSCommit1), then, under the write lock, run the second phase
 * (tsdbFSCommit2) and detach the immutable memtable from the tsdb. After the
 * lock is released the memtable reference is dropped and the file-system copy
 * is destroyed.
 *
 * pCommitter  commit context
 * eno         error number of the preceding commit steps; only 0 is supported
 *             (asserted)
 *
 * Returns 0 on success, otherwise the code of the failing commit phase. On
 * failure the memtable stays attached and pCommitter->fs is not destroyed.
 */
static int32_t tsdbEndCommit(SCommitter *pCommitter, int32_t eno) {
  int32_t    code = 0;
  STsdb     *pTsdb = pCommitter->pTsdb;
  SMemTable *pMemTable = pTsdb->imem;

  ASSERT(eno == 0);

  code = tsdbFSCommit1(pTsdb, &pCommitter->fs);
  if (code) goto _err;

  // lock
  taosThreadRwlockWrlock(&pTsdb->rwLock);

  // commit or rollback
  code = tsdbFSCommit2(pTsdb, &pCommitter->fs);
  if (code) {
    taosThreadRwlockUnlock(&pTsdb->rwLock);
    goto _err;
  }

  pTsdb->imem = NULL;

  // unlock
  taosThreadRwlockUnlock(&pTsdb->rwLock);

  // pMemTable was captured above, before imem was cleared
  tsdbUnrefMemTable(pMemTable);
  tsdbFSDestroy(&pCommitter->fs);

  tsdbInfo("vgId:%d, tsdb end commit", TD_VID(pTsdb->pVnode));
  return code;

_err:
  tsdbError("vgId:%d, tsdb end commit failed since %s", TD_VID(pTsdb->pVnode), tstrerror(code));
  return code;
}