tsdbCompact.c 19.1 KB
Newer Older
H
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "tsdb.h"

H
Hongze Cheng 已提交
18 19 20 21
// Iterator type codes stored in STsdbDataIter.flag.
// These are plain values rather than bit masks: TSDB_ITER_TYPE_MEM is 0, so it can
// only be recognised with an equality test, never with a bitwise AND.
#define TSDB_ITER_TYPE_MEM 0x0
#define TSDB_ITER_TYPE_DAT 0x1
#define TSDB_ITER_TYPE_STT 0x2

H
Hongze Cheng 已提交
22 23
// Type-specific state for a TSDB_ITER_TYPE_MEM iterator; no fields are defined yet.
// tsdbMemDIterOpen reserves sizeof(SMemDIter) bytes behind the STsdbDataIter header.
typedef struct {
} SMemDIter;
H
Hongze Cheng 已提交
24 25

typedef struct {
H
Hongze Cheng 已提交
26 27 28 29 30 31 32
  SDataFReader *pReader;
  SArray       *aBlockIdx;  // SArray<SBlockIdx>
  SMapData      mDataBlk;   // SMapData<SDataBlk>
  SBlockData    bData;
  int32_t       iBlockIdx;
  int32_t       iDataBlk;
  int32_t       iRow;
H
Hongze Cheng 已提交
33 34 35
} SDataDIter;

typedef struct {
H
Hongze Cheng 已提交
36 37 38 39 40 41
  SDataFReader *pReader;
  int32_t       iStt;
  SArray       *aSttBlk;  // SArray<SSttBlk>
  SBlockData    bData;
  int32_t       iSttBlk;
  int32_t       iRow;
H
Hongze Cheng 已提交
42 43
} SSttDIter;

H
Hongze Cheng 已提交
44 45 46
typedef struct STsdbDataIter {
  struct STsdbDataIter *next;

H
Hongze Cheng 已提交
47 48 49 50
  int32_t     flag;
  SRowInfo    rowInfo;
  SRBTreeNode n;
  char        handle[];
H
Hongze Cheng 已提交
51 52
} STsdbDataIter;

H
Hongze Cheng 已提交
53 54
// Recover the STsdbDataIter that embeds the tree node N (N must point at the iterator's `n` member).
// N is parenthesised so that an expression argument is cast as a whole before the offset is subtracted.
#define TSDB_DATA_ITER_FROM_RBTN(N) ((STsdbDataIter *)((char *)(N) - offsetof(STsdbDataIter, n)))

H
Hongze Cheng 已提交
55
typedef struct {
H
Hongze Cheng 已提交
56 57
  STsdb         *pTsdb;
  int64_t        cid;
H
Hongze Cheng 已提交
58 59 60
  int32_t        maxRows;
  int32_t        minRows;
  STsdbFS        fs;
H
Hongze Cheng 已提交
61 62 63 64 65
  int32_t        fid;
  SDFileSet     *pDFileSet;
  SDataFReader  *pReader;
  STsdbDataIter *iterList;  // list of iterators
  SRBTree        rtree;
H
Hongze Cheng 已提交
66
  STsdbDataIter *pIter;
H
Hongze Cheng 已提交
67
  SBlockData     bData;
H
Hongze Cheng 已提交
68
  SSkmInfo       tbSkm;
H
Hongze Cheng 已提交
69 70
} STsdbCompactor;

H
Hongze Cheng 已提交
71 72
// Compaction flag bit. Not referenced by the code visible here; presumably meant for the
// `flag` argument of tsdbCompact -- TODO confirm.
#define TSDB_FLG_DEEP_COMPACT 0x1

H
Hongze Cheng 已提交
73
// ITER =========================
H
Hongze Cheng 已提交
74
// Forward declaration: tsdbDataDIterOpen and tsdbSttDIterOpen call this before its definition.
static int32_t tsdbDataIterNext(STsdbDataIter *pIter, TABLEID *pExcludeTableId);
H
Hongze Cheng 已提交
75

H
Hongze Cheng 已提交
76 77 78 79 80 81 82
static int32_t tsdbDataIterCmprFn(const SRBTreeNode *n1, const SRBTreeNode *n2) {
  const STsdbDataIter *pIter1 = (STsdbDataIter *)((char *)n1 - offsetof(STsdbDataIter, n));
  const STsdbDataIter *pIter2 = (STsdbDataIter *)((char *)n2 - offsetof(STsdbDataIter, n));

  return tRowInfoCmprFn(&pIter1->rowInfo, &pIter2->rowInfo);
}

H
Hongze Cheng 已提交
83
// Allocate a zero-filled iterator with room for an SMemDIter behind the header.
// The flag field is left at 0 by the calloc, which equals TSDB_ITER_TYPE_MEM.
// Returns 0 and stores the iterator in *ppIter, or returns TSDB_CODE_OUT_OF_MEMORY
// and stores NULL.
static int32_t tsdbMemDIterOpen(STsdbDataIter **ppIter) {
  STsdbDataIter *pMemIter = (STsdbDataIter *)taosMemoryCalloc(1, sizeof(STsdbDataIter) + sizeof(SMemDIter));
  if (pMemIter == NULL) {
    *ppIter = NULL;
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // TODO

  *ppIter = pMemIter;
  return 0;
}

/*
 * Open an iterator of type TSDB_ITER_TYPE_DAT on `pReader`.
 *
 * On success *ppIter receives the new iterator. When tsdbReadBlockIdx yields no
 * entries, *ppIter is set to NULL and 0 is returned. On failure *ppIter is NULL and
 * the error code is returned. In the last two cases everything allocated here is
 * released again.
 *
 * All cleanup goes through one `_exit` label; no jump enters a nested block and
 * pDataDIter is initialised before any goto can reach the cleanup code.
 */
static int32_t tsdbDataDIterOpen(SDataFReader *pReader, STsdbDataIter **ppIter) {
  int32_t     code = 0;
  int32_t     lino = 0;
  int32_t     isEmpty = 0;  // set when the block index holds nothing to iterate over
  SDataDIter *pDataDIter = NULL;

  STsdbDataIter *pIter = (STsdbDataIter *)taosMemoryCalloc(1, sizeof(*pIter) + sizeof(SDataDIter));
  if (NULL == pIter) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }
  pIter->flag = TSDB_ITER_TYPE_DAT;

  pDataDIter = (SDataDIter *)pIter->handle;
  pDataDIter->pReader = pReader;
  pDataDIter->aBlockIdx = taosArrayInit(0, sizeof(SBlockIdx));
  if (pDataDIter->aBlockIdx == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  code = tsdbReadBlockIdx(pReader, pDataDIter->aBlockIdx);
  TSDB_CHECK_CODE(code, lino, _exit);

  if (taosArrayGetSize(pDataDIter->aBlockIdx) == 0) {
    // not an error: discard the iterator and report "no iterator" with code 0
    isEmpty = 1;
    goto _exit;
  }

  // TODO
  code = tBlockDataCreate(&pDataDIter->bData);
  TSDB_CHECK_CODE(code, lino, _exit);

  pDataDIter->iBlockIdx = -1;
  pDataDIter->iDataBlk = 0;
  pDataDIter->iRow = 0;

  // position the iterator on its first row
  code = tsdbDataIterNext(pIter, NULL);
  TSDB_CHECK_CODE(code, lino, _exit);

_exit:
  if (code || isEmpty) {
    if (pIter) {
      tBlockDataDestroy(&pDataDIter->bData, 1);
      tMapDataClear(&pDataDIter->mDataBlk);
      taosArrayDestroy(pDataDIter->aBlockIdx);
      taosMemoryFree(pIter);
    }
    *ppIter = NULL;
  } else {
    *ppIter = pIter;
  }
  return code;
}

H
Hongze Cheng 已提交
155
/*
 * Open an iterator of type TSDB_ITER_TYPE_STT on `pReader`, using index `iStt`.
 *
 * On success *ppIter receives the new iterator, already positioned on its first row.
 * When tsdbReadSttBlk yields no entries, *ppIter is set to NULL and 0 is returned.
 * On failure *ppIter is NULL and the error code is returned. In the last two cases
 * everything allocated here is released again.
 *
 * All cleanup goes through one `_exit` label; no jump enters a nested block and
 * pSttDIter is initialised before any goto can reach the cleanup code.
 */
static int32_t tsdbSttDIterOpen(SDataFReader *pReader, int32_t iStt, STsdbDataIter **ppIter) {
  int32_t    code = 0;
  int32_t    lino = 0;
  int32_t    isEmpty = 0;  // set when there are no blocks to iterate over
  SSttDIter *pSttDIter = NULL;

  STsdbDataIter *pIter = (STsdbDataIter *)taosMemoryCalloc(1, sizeof(*pIter) + sizeof(SSttDIter));
  if (pIter == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }
  pIter->flag = TSDB_ITER_TYPE_STT;

  pSttDIter = (SSttDIter *)pIter->handle;
  pSttDIter->pReader = pReader;
  pSttDIter->iStt = iStt;
  pSttDIter->aSttBlk = taosArrayInit(0, sizeof(SSttBlk));
  if (pSttDIter->aSttBlk == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  code = tsdbReadSttBlk(pReader, pSttDIter->iStt, pSttDIter->aSttBlk);
  TSDB_CHECK_CODE(code, lino, _exit);

  if (taosArrayGetSize(pSttDIter->aSttBlk) == 0) {
    // not an error: discard the iterator and report "no iterator" with code 0
    isEmpty = 1;
    goto _exit;
  }

  code = tBlockDataCreate(&pSttDIter->bData);
  TSDB_CHECK_CODE(code, lino, _exit);

  // both cursors start before the first element; tsdbDataIterNext pre-increments them
  pSttDIter->iSttBlk = -1;
  pSttDIter->iRow = -1;

  code = tsdbDataIterNext(pIter, NULL);
  TSDB_CHECK_CODE(code, lino, _exit);

_exit:
  if (code || isEmpty) {
    if (pIter) {
      tBlockDataDestroy(&pSttDIter->bData, 1);
      taosArrayDestroy(pSttDIter->aSttBlk);
      taosMemoryFree(pIter);
    }
    *ppIter = NULL;
  } else {
    *ppIter = pIter;
  }
  return code;
}

// Release an iterator. Not implemented yet: the body only trips ASSERT(0).
static void tsdbDataIterClose(STsdbDataIter *pIter) {
  // TODO
  ASSERT(0);
}

H
Hongze Cheng 已提交
209
/*
 * Advance `pIter` to its next row and publish it in pIter->rowInfo.
 *
 * pExcludeTableId, when non-NULL, names rows to skip:
 *   - uid != 0: skip rows whose uid matches;
 *   - uid == 0: skip every row whose suid matches.
 *
 * When the iterator is exhausted, rowInfo.suid and rowInfo.uid are both set to 0.
 * Returns 0 on success or the error code of a failed block read.
 *
 * The iterator type is dispatched by value. TSDB_ITER_TYPE_MEM is 0, so testing it
 * with a bitwise AND can never match. Only the STT type is implemented; the MEM and
 * DAT types still trip ASSERT(0).
 */
static int32_t tsdbDataIterNext(STsdbDataIter *pIter, TABLEID *pExcludeTableId) {
  int32_t code = 0;
  int32_t lino = 0;

  switch (pIter->flag) {
    case TSDB_ITER_TYPE_MEM:
      // TODO
      ASSERT(0);
      break;

    case TSDB_ITER_TYPE_DAT:
      // TODO
      ASSERT(0);
      break;

    case TSDB_ITER_TYPE_STT: {
      SSttDIter *pSttDIter = (SSttDIter *)pIter->handle;

      for (;;) {
        if (++pSttDIter->iRow >= pSttDIter->bData.nRow) {
          // current block is used up: load the next block that is not excluded as a whole
          for (;;) {
            if (++pSttDIter->iSttBlk < taosArrayGetSize(pSttDIter->aSttBlk)) {
              SSttBlk *pSttBlk = (SSttBlk *)taosArrayGet(pSttDIter->aSttBlk, pSttDIter->iSttBlk);

              // check exclusion
              if (pExcludeTableId) {
                if (pExcludeTableId->uid) {  // exclude (suid, uid)
                  if (pSttBlk->minUid == pExcludeTableId->uid && pSttBlk->maxUid == pExcludeTableId->uid) continue;
                } else {  // exclude (suid, *)
                  if (pSttBlk->suid == pExcludeTableId->suid) continue;
                }
              }

              code = tsdbReadSttBlockEx(pSttDIter->pReader, pSttDIter->iStt, pSttBlk, &pSttDIter->bData);
              TSDB_CHECK_CODE(code, lino, _exit);

              pIter->rowInfo.suid = pSttBlk->suid;
              pSttDIter->iRow = 0;
              break;
            } else {
              // iter end, all set 0 and exit
              pIter->rowInfo.suid = 0;
              pIter->rowInfo.uid = 0;
              goto _exit;
            }
          }
        }

        // bData.uid is non-zero when the whole block belongs to one table; otherwise use the per-row uid
        pIter->rowInfo.uid = pSttDIter->bData.uid ? pSttDIter->bData.uid : pSttDIter->bData.aUid[pSttDIter->iRow];
        pIter->rowInfo.row = tsdbRowFromBlockData(&pSttDIter->bData, pSttDIter->iRow);

        // check exclusion
        if (pExcludeTableId) {
          if (pExcludeTableId->uid) {  // exclude (suid, uid)
            if (pIter->rowInfo.uid == pExcludeTableId->uid) continue;
          } else {  // exclude (suid, *)
            if (pIter->rowInfo.suid == pExcludeTableId->suid) continue;
          }
        }

        break;
      }
    } break;

    default:
      ASSERT(0);
      break;
  }

_exit:
  return code;
}
H
Hongze Cheng 已提交
273 274

// COMPACT =========================
H
Hongze Cheng 已提交
275
/*
 * Prepare `pCompactor` for a compaction run over `pTsdb`: record the TSDB handle and
 * the row limits from the vnode config, copy the file system state, reset the file-set
 * cursor to INT32_MIN and create the output block buffer.
 * Returns 0 on success; on failure the error is logged and its code returned.
 */
static int32_t tsdbBeginCompact(STsdb *pTsdb, STsdbCompactor *pCompactor) {
  int32_t code = 0;
  int32_t lino = 0;

  pCompactor->pTsdb = pTsdb;
  // pCompactor->cid = 0; (TODO)
  pCompactor->maxRows = pTsdb->pVnode->config.tsdbCfg.maxRows;
  pCompactor->minRows = pTsdb->pVnode->config.tsdbCfg.minRows;

  code = tsdbFSCopy(pTsdb, &pCompactor->fs);
  TSDB_CHECK_CODE(code, lino, _exit);

  // tsdbOpenCompactor searches for the first file set with a fid greater than this
  pCompactor->fid = INT32_MIN;

  code = tBlockDataCreate(&pCompactor->bData);
  TSDB_CHECK_CODE(code, lino, _exit);

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino, tstrerror(code));
  }
  return code;
}

H
Hongze Cheng 已提交
299
// Commit the result of a compaction run. Not implemented yet: currently always returns 0.
static int32_t tsdbCommitCompact(STsdbCompactor *pCompactor) {
  int32_t code = 0;
  int32_t lino = 0;
  STsdb  *pTsdb = pCompactor->pTsdb;

  // TODO

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino, tstrerror(code));
  }
  return code;
}

H
Hongze Cheng 已提交
314
// Roll back a failed compaction run. Not implemented yet: currently always returns 0.
static int32_t tsdbAbortCompact(STsdbCompactor *pCompactor) {
  int32_t code = 0;
  int32_t lino = 0;
  STsdb  *pTsdb = pCompactor->pTsdb;

  // TODO

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino, tstrerror(code));
  }
  return code;
}

H
Hongze Cheng 已提交
329
// Deep compaction of the compactor's current file set. So far it only opens a data
// file reader on pCompactor->pDFileSet and stores it in pCompactor->pReader.
// Returns 0 on success; on failure the error is logged and its code returned.
static int32_t tsdbDeepCompact(STsdbCompactor *pCompactor) {
  int32_t code = 0;
  int32_t lino = 0;
  STsdb  *pTsdb = pCompactor->pTsdb;

  code = tsdbDataFReaderOpen(&pCompactor->pReader, pTsdb, pCompactor->pDFileSet);
  TSDB_CHECK_CODE(code, lino, _exit);

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino, tstrerror(code));
  }
  return code;
}

H
Hongze Cheng 已提交
345
// Shallow compaction of the compactor's current file set. Not implemented yet:
// currently always returns 0.
static int32_t tsdbShallowCompact(STsdbCompactor *pCompactor) {
  int32_t code = 0;
  int32_t lino = 0;
  STsdb  *pTsdb = pCompactor->pTsdb;

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino, tstrerror(code));
  }
  return code;
}

H
Hongze Cheng 已提交
358
/*
 * Move the compactor to the next row in merge order.
 *
 * pCompactor->pIter is the iterator that owns the current row and is kept OUTSIDE of
 * rtree; every other live iterator sits in rtree ordered by its current row.
 *
 *   1. If there is a current iterator, advance it. When it is exhausted it is dropped.
 *      When its new row sorts after the tree minimum it is put back into the tree.
 *   2. If there is no current iterator, pop the tree minimum and make it current.
 *      If that row belongs to the excluded table, loop so step 1 advances past it.
 *
 * pExcludeTableId follows the convention of tsdbDataIterNext (uid != 0: one table,
 * uid == 0: every table under suid). On return pCompactor->pIter is NULL when no
 * rows are left.
 */
static int32_t tsdbCompactNextRowImpl(STsdbCompactor *pCompactor, TABLEID *pExcludeTableId) {
  int32_t code = 0;
  int32_t lino = 0;

  for (;;) {
    STsdbDataIter *pCurr = pCompactor->pIter;

    if (pCurr != NULL) {
      code = tsdbDataIterNext(pCurr, pExcludeTableId);
      TSDB_CHECK_CODE(code, lino, _exit);

      if (pCurr->rowInfo.suid == 0 && pCurr->rowInfo.uid == 0) {
        // iterator exhausted
        pCompactor->pIter = NULL;
      } else {
        SRBTreeNode *pMinNode = tRBTreeMin(&pCompactor->rtree);
        if (pMinNode != NULL) {
          STsdbDataIter *pMinIter = TSDB_DATA_ITER_FROM_RBTN(pMinNode);

          int32_t c = tRowInfoCmprFn(&pCurr->rowInfo, &pMinIter->rowInfo);
          ASSERT(c);  // two iterators are never expected to compare equal

          if (c > 0) {
            // another iterator holds a smaller row: park the current one in the tree
            tRBTreePut(&pCompactor->rtree, &pCurr->n);
            pCompactor->pIter = NULL;
          }
        }
      }
    }

    if (pCompactor->pIter == NULL) {
      SRBTreeNode *pHead = tRBTreeMin(&pCompactor->rtree);
      if (pHead != NULL) {
        pCompactor->pIter = TSDB_DATA_ITER_FROM_RBTN(pHead);
        tRBTreeDrop(&pCompactor->rtree, pHead);

        if (pExcludeTableId != NULL) {
          const SRowInfo *pHeadRow = &pCompactor->pIter->rowInfo;
          if (pExcludeTableId->uid) {
            if (pHeadRow->uid == pExcludeTableId->uid) continue;
          } else {
            if (pHeadRow->suid == pExcludeTableId->suid) continue;
          }
        }
      }
    }

    break;
  }

_exit:
  return code;
}

/*
 * Advance the compactor to the next row whose table still exists in the meta store,
 * and keep pCompactor->tbSkm (suid, uid, schema) in sync with that row's table.
 *
 * Rows of tables that metaGetInfo cannot find are skipped by passing an exclusion id
 * to tsdbCompactNextRowImpl:
 *   - super table missing      -> exclude (suid, *)
 *   - child/normal table missing -> exclude (suid, uid)
 *
 * On return pCompactor->pIter is NULL when the file set has no more rows.
 * Returns 0 on success; on failure the error is logged and its code returned.
 */
static int32_t tsdbCompactNextRow(STsdbCompactor *pCompactor) {
  int32_t code = 0;
  int32_t lino = 0;

  TABLEID  excludeTableId;
  TABLEID *pExcludeTableId = NULL;

  for (;;) {
    code = tsdbCompactNextRowImpl(pCompactor, pExcludeTableId);
    TSDB_CHECK_CODE(code, lino, _exit);

    // iter end, just break out
    if (pCompactor->pIter == NULL) break;

    SRowInfo *pRowInfo = &pCompactor->pIter->rowInfo;

    // Same table as the previous row: it is already known to exist
    if (pRowInfo->uid == pCompactor->tbSkm.uid) break;

    SMetaInfo info;
    if (pRowInfo->suid) {  // child table

      // check if super table exists
      if (pRowInfo->suid != pCompactor->tbSkm.suid) {
        // Look up the SUPER table here. Looking up the child uid would make a single
        // dropped child table exclude every row of a super table that still exists.
        if (metaGetInfo(pCompactor->pTsdb->pVnode->pMeta, pRowInfo->suid, &info, NULL) != TSDB_CODE_SUCCESS) {
          excludeTableId.suid = pRowInfo->suid;
          excludeTableId.uid = 0;
          pExcludeTableId = &excludeTableId;
          continue;
        }

        // super table exists: switch the cached schema over to it
        pCompactor->tbSkm.suid = pRowInfo->suid;
        pCompactor->tbSkm.uid = 0;
        tDestroyTSchema(pCompactor->tbSkm.pTSchema);
        pCompactor->tbSkm.pTSchema = metaGetTbTSchema(pCompactor->pTsdb->pVnode->pMeta, pRowInfo->suid, -1, 1);
        if (pCompactor->tbSkm.pTSchema == NULL) {
          code = TSDB_CODE_OUT_OF_MEMORY;
          TSDB_CHECK_CODE(code, lino, _exit);
        }
      }

      // check if table exists
      if (metaGetInfo(pCompactor->pTsdb->pVnode->pMeta, pRowInfo->uid, &info, NULL) != TSDB_CODE_SUCCESS) {
        excludeTableId.suid = pRowInfo->suid;
        excludeTableId.uid = pRowInfo->uid;
        pExcludeTableId = &excludeTableId;
        continue;
      }

      // table exists
      pCompactor->tbSkm.uid = pRowInfo->uid;
    } else {  // normal table
      // check if table exists
      if (metaGetInfo(pCompactor->pTsdb->pVnode->pMeta, pRowInfo->uid, &info, NULL) != TSDB_CODE_SUCCESS) {
        excludeTableId.suid = pRowInfo->suid;
        excludeTableId.uid = pRowInfo->uid;
        pExcludeTableId = &excludeTableId;
        continue;
      }

      // table exists
      pCompactor->tbSkm.suid = pRowInfo->suid;
      pCompactor->tbSkm.uid = pRowInfo->uid;
      tDestroyTSchema(pCompactor->tbSkm.pTSchema);

      // suid is 0 in this branch, so the schema must be fetched by the table's own uid
      pCompactor->tbSkm.pTSchema = metaGetTbTSchema(pCompactor->pTsdb->pVnode->pMeta, pRowInfo->uid, -1, 1);
      if (pCompactor->tbSkm.pTSchema == NULL) {
        code = TSDB_CODE_OUT_OF_MEMORY;
        TSDB_CHECK_CODE(code, lino, _exit);
      }
    }

    break;
  }

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pCompactor->pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }
  return code;
}

H
Hongze Cheng 已提交
495
/*
 * Hand out the compactor's current row and the schema cached for its table.
 * If no iterator is current, tsdbCompactNextRow is called first to fetch one.
 * *ppRowInfo and *ppTSchema are both set to NULL when no rows are left.
 * Returns 0, or the error code of tsdbCompactNextRow (outputs are then untouched).
 */
static int32_t tsdbCompactGetRow(STsdbCompactor *pCompactor, SRowInfo **ppRowInfo, STSchema **ppTSchema) {
  int32_t        code = 0;
  int32_t        lino = 0;
  STsdbDataIter *pCurr = NULL;

  if (pCompactor->pIter == NULL) {
    code = tsdbCompactNextRow(pCompactor);
    TSDB_CHECK_CODE(code, lino, _exit);
  }

  pCurr = pCompactor->pIter;
  if (pCurr == NULL) {
    *ppRowInfo = NULL;
    *ppTSchema = NULL;
    goto _exit;
  }

  // the cached schema info must describe the table of the current row
  ASSERT(pCurr->rowInfo.suid == pCompactor->tbSkm.suid);
  ASSERT(pCurr->rowInfo.uid == pCompactor->tbSkm.uid);
  *ppRowInfo = &pCurr->rowInfo;
  *ppTSchema = pCompactor->tbSkm.pTSchema;

_exit:
  return code;
}

H
Hongze Cheng 已提交
518
/*
 * Select the next file set to compact and open its iterators.
 *
 * The next file set is the first one in fs.aDFileSet whose fid is greater than
 * pCompactor->fid. If none is found, pCompactor->pDFileSet is left NULL and the
 * function returns 0 without touching anything else. Otherwise a reader is opened,
 * one DAT iterator and one STT iterator per stt file are created, and every
 * iterator that was actually created is linked into iterList and inserted into rtree.
 * Returns 0 on success; on failure the error is logged and its code returned.
 */
static int32_t tsdbOpenCompactor(STsdbCompactor *pCompactor) {
  int32_t        code = 0;
  int32_t        lino = 0;
  STsdb         *pTsdb = pCompactor->pTsdb;
  STsdbDataIter *pNewIter = NULL;
  SDFileSet      searchKey = {.fid = pCompactor->fid};

  // next compact file
  pCompactor->pDFileSet =
      (SDFileSet *)taosArraySearch(pCompactor->fs.aDFileSet, &searchKey, tDFileSetCmprFn, TD_GT);
  if (pCompactor->pDFileSet == NULL) goto _exit;

  pCompactor->fid = pCompactor->pDFileSet->fid;

  code = tsdbDataFReaderOpen(&pCompactor->pReader, pTsdb, pCompactor->pDFileSet);
  TSDB_CHECK_CODE(code, lino, _exit);

  // open iters
  pCompactor->iterList = NULL;
  tRBTreeCreate(&pCompactor->rtree, tsdbDataIterCmprFn);

  code = tsdbDataDIterOpen(pCompactor->pReader, &pNewIter);
  TSDB_CHECK_CODE(code, lino, _exit);

  if (pNewIter != NULL) {  // NULL means there was nothing to iterate over
    pNewIter->next = pCompactor->iterList;
    pCompactor->iterList = pNewIter;
    tRBTreePut(&pCompactor->rtree, &pNewIter->n);
  }

  for (int32_t iStt = 0; iStt < pCompactor->pReader->pSet->nSttF; iStt++) {
    code = tsdbSttDIterOpen(pCompactor->pReader, iStt, &pNewIter);
    TSDB_CHECK_CODE(code, lino, _exit);

    if (pNewIter != NULL) {
      pNewIter->next = pCompactor->iterList;
      pCompactor->iterList = pNewIter;
      tRBTreePut(&pCompactor->rtree, &pNewIter->n);
    }
  }

  // no current row yet; the first tsdbCompactGetRow call pulls it from rtree
  pCompactor->pIter = NULL;
  tBlockDataReset(&pCompactor->bData);

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino, tstrerror(code));
  } else {
    tsdbDebug("vgId:%d %s done", TD_VID(pTsdb->pVnode), __func__);
  }
  return code;
}
H
Hongze Cheng 已提交
570

H
Hongze Cheng 已提交
571 572
// Close every iterator on pCompactor->iterList. The rest of the teardown is not
// implemented yet and trips ASSERT(0).
static void tsdbCloseCompactor(STsdbCompactor *pCompactor) {
  STsdb         *pTsdb = pCompactor->pTsdb;
  STsdbDataIter *pCursor = pCompactor->iterList;

  while (pCursor) {
    // read the link first: the node is handed to the close routine
    STsdbDataIter *pFollowing = pCursor->next;
    tsdbDataIterClose(pCursor);
    pCursor = pFollowing;
  }

  // TODO
  ASSERT(0);

  tsdbDebug("vgId:%d %s done", TD_VID(pTsdb->pVnode), __func__);
}
H
Hongze Cheng 已提交
586

H
Hongze Cheng 已提交
587 588 589 590 591 592 593
/*
 * Compact the data files of `pTsdb`, one file set at a time.
 *
 * For every file set the rows are pulled in merge order through tsdbCompactGetRow /
 * tsdbCompactNextRow and gathered into pCompactor->bData. The buffer is restarted
 * whenever the super table or normal table changes, and cleared once it reaches
 * maxRows. Writing the gathered blocks out is still TODO.
 *
 * `flag` is not used by the current implementation.
 *
 * Returns 0 on success. On failure the run is aborted and the error code returned.
 * A failure of the final commit is returned as well instead of being dropped.
 */
int32_t tsdbCompact(STsdb *pTsdb, int32_t flag) {
  int32_t code = 0;
  int32_t lino = 0;

  // Check if can do compact (TODO)

  // Do compact
  STsdbCompactor *pCompactor = &(STsdbCompactor){0};

  code = tsdbBeginCompact(pTsdb, pCompactor);
  TSDB_CHECK_CODE(code, lino, _exit);

  while (true) {
    code = tsdbOpenCompactor(pCompactor);
    TSDB_CHECK_CODE(code, lino, _exit);

    // no further file set to process
    if (pCompactor->pDFileSet == NULL) break;

    // loop to merge row by row
    SRowInfo *pRowInfo = NULL;
    STSchema *pTSchema = NULL;
    int64_t   nRow = 0;
    for (;;) {
      code = tsdbCompactGetRow(pCompactor, &pRowInfo, &pTSchema);
      TSDB_CHECK_CODE(code, lino, _exit);

      if (pRowInfo == NULL) break;

      nRow++;

      if (pCompactor->bData.suid == 0 && pCompactor->bData.uid == 0) {  // init the block data if not initialized yet
        code = tBlockDataInit(&pCompactor->bData, &(TABLEID){.suid = pRowInfo->suid, .uid = pRowInfo->uid}, pTSchema,
                              NULL, 0);
        TSDB_CHECK_CODE(code, lino, _exit);
      } else {
        if (pCompactor->bData.suid != pRowInfo->suid) {  // not same super table
          if (pCompactor->bData.nRow < pCompactor->minRows) {
            // TODO: write block data to .stt file, need to check if nRow is 0
            tBlockDataClear(&pCompactor->bData);
          } else {
            // TODO: write block data to .data file, need to check if nRow is 0
            tBlockDataClear(&pCompactor->bData);
          }

          code = tBlockDataInit(&pCompactor->bData, &(TABLEID){.suid = pRowInfo->suid, .uid = pRowInfo->uid}, pTSchema,
                                NULL, 0);
          TSDB_CHECK_CODE(code, lino, _exit);
        } else if (pCompactor->bData.uid != pRowInfo->uid) {
          if (pRowInfo->suid) {  // different child table
            if (pCompactor->bData.nRow > pCompactor->minRows) {
              // TODO
            }
          } else {  // different normal table
            if (pCompactor->bData.nRow < pCompactor->minRows) {
              // TODO: write data to .stt file, need to check if nRow is 0
              tBlockDataClear(&pCompactor->bData);
            } else {
              // TODO: write data to .data file, need to check if nRow is 0
              tBlockDataClear(&pCompactor->bData);
            }

            code = tBlockDataInit(&pCompactor->bData, &(TABLEID){.suid = pRowInfo->suid, .uid = pRowInfo->uid},
                                  pTSchema, NULL, 0);
            TSDB_CHECK_CODE(code, lino, _exit);
          }
        }
      }

      // append row to block data
      code = tBlockDataAppendRow(&pCompactor->bData, &pRowInfo->row, pTSchema, pRowInfo->uid);
      TSDB_CHECK_CODE(code, lino, _exit);

      // check if block data is full
      if (pCompactor->bData.nRow >= pCompactor->maxRows) {
        tBlockDataClear(&pCompactor->bData);
      }

      // iterate to next row
      code = tsdbCompactNextRow(pCompactor);
      TSDB_CHECK_CODE(code, lino, _exit);
    }

    tsdbCloseCompactor(pCompactor);
  }

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino, tstrerror(code));
    // keep the original error; the abort result is intentionally not propagated
    tsdbAbortCompact(pCompactor);
  } else {
    // a failed commit must not be reported as a successful compaction
    code = tsdbCommitCompact(pCompactor);
  }
  return code;
}