tsdbUtil.c 51.6 KB
Newer Older
H
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

16
#include "tdataformat.h"
H
Hongze Cheng 已提交
17 18
#include "tsdb.h"

H
Hongze Cheng 已提交
19
// SMapData =======================================================================
H
Hongze Cheng 已提交
20 21 22 23
// Mark the map as empty by zeroing its item count and data length.
// The aOffset and pData buffers themselves are not touched.
void tMapDataReset(SMapData *pMapData) {
  pMapData->nData = 0;
  pMapData->nItem = 0;
}
H
Hongze Cheng 已提交
24

H
Hongze Cheng 已提交
25
// Release the offset array and the data buffer with tFree and null both
// pointers. nItem and nData are not modified here.
void tMapDataClear(SMapData *pMapData) {
  tFree((uint8_t *)pMapData->aOffset);
  tFree(pMapData->pData);

  pMapData->aOffset = NULL;
  pMapData->pData = NULL;
}

H
Hongze Cheng 已提交
32 33 34 35 36 37 38 39 40
// Append one item to the map.
//
// tPutItemFn is called twice: first with a NULL destination, whose return
// value is added to the data length, and then with the destination inside
// pData to write the item.
//
// Returns 0 on success, or the non-zero code returned by tRealloc. The new
// counts are committed only after both buffers have been grown, so on failure
// nItem/nData still describe the content that was there before the call.
int32_t tMapDataPutItem(SMapData *pMapData, void *pItem, int32_t (*tPutItemFn)(uint8_t *, void *)) {
  int32_t code = 0;
  int32_t offset = pMapData->nData;  // the new item starts where the old data ends
  int32_t iItem = pMapData->nItem;   // slot of the new item in aOffset
  int32_t nItemNew = iItem + 1;
  int32_t nDataNew = offset + tPutItemFn(NULL, pItem);

  // alloc
  code = tRealloc((uint8_t **)&pMapData->aOffset, sizeof(int32_t) * nItemNew);
  if (code) goto _exit;
  code = tRealloc(&pMapData->pData, nDataNew);
  if (code) goto _exit;

  // put
  pMapData->aOffset[iItem] = offset;
  tPutItemFn(pMapData->pData + offset, pItem);

  // commit
  pMapData->nItem = nItemNew;
  pMapData->nData = nDataNew;

_exit:
  return code;
}

H
Hongze Cheng 已提交
54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
// Copy the content of pFrom (offset array, data bytes, counts) into pTo.
//
// pTo's buffers are grown with tRealloc as needed. Returns 0 on success or the
// non-zero tRealloc code. pTo's counts are updated only after both allocations
// succeed, so a failed copy does not leave pTo claiming more items/bytes than
// before the call.
int32_t tMapDataCopy(SMapData *pFrom, SMapData *pTo) {
  int32_t code = 0;

  code = tRealloc((uint8_t **)&pTo->aOffset, sizeof(int32_t) * pFrom->nItem);
  if (code) goto _exit;
  code = tRealloc(&pTo->pData, pFrom->nData);
  if (code) goto _exit;

  // Skip empty copies: the buffers may be NULL when nothing was ever stored,
  // and memcpy requires valid pointers even for a zero length.
  if (pFrom->nItem > 0) {
    memcpy(pTo->aOffset, pFrom->aOffset, sizeof(int32_t) * pFrom->nItem);
  }
  if (pFrom->nData > 0) {
    memcpy(pTo->pData, pFrom->pData, pFrom->nData);
  }

  pTo->nItem = pFrom->nItem;
  pTo->nData = pFrom->nData;

_exit:
  return code;
}

H
Hongze Cheng 已提交
70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97
// Binary-search the map for pSearchItem.
//
// Each probed item is decoded into pItem via tMapDataGetItemByIdx/tGetItemFn
// and compared with tItemCmprFn(pSearchItem, pItem). The search assumes the
// items are stored in the order defined by tItemCmprFn.
//
// Returns 0 when an item comparing equal is found (pItem then holds it), or
// TSDB_CODE_NOT_FOUND otherwise (pItem then holds the last probed item, or is
// untouched if the map is empty).
int32_t tMapDataSearch(SMapData *pMapData, void *pSearchItem, int32_t (*tGetItemFn)(uint8_t *, void *),
                       int32_t (*tItemCmprFn)(const void *, const void *), void *pItem) {
  int32_t lidx = 0;
  int32_t ridx = pMapData->nItem - 1;

  while (lidx <= ridx) {
    // lidx + (ridx - lidx) / 2 cannot overflow, unlike (lidx + ridx) / 2
    int32_t midx = lidx + (ridx - lidx) / 2;

    tMapDataGetItemByIdx(pMapData, midx, pItem, tGetItemFn);

    int32_t c = tItemCmprFn(pSearchItem, pItem);
    if (c == 0) {
      return 0;
    } else if (c < 0) {
      ridx = midx - 1;
    } else {
      lidx = midx + 1;
    }
  }

  return TSDB_CODE_NOT_FOUND;
}
H
Hongze Cheng 已提交
98

H
Hongze Cheng 已提交
99 100 101
// Decode the idx-th item of the map into pItem using tGetItemFn.
// idx must satisfy 0 <= idx < nItem (asserted).
void tMapDataGetItemByIdx(SMapData *pMapData, int32_t idx, void *pItem, int32_t (*tGetItemFn)(uint8_t *, void *)) {
  ASSERT(idx >= 0 && idx < pMapData->nItem);

  // aOffset[idx] is the start of the item's encoding inside pData
  uint8_t *pEncoded = pMapData->pData + pMapData->aOffset[idx];
  tGetItemFn(pEncoded, pItem);
}

// Serialize a map: nItem, then (only when nItem is non-zero) each offset as a
// delta from the previous one, nData, and the raw data bytes.
//
// p may be NULL; then nothing is copied and NULL is handed to tPutI32v
// (presumably a size-only pass — confirm against tPutI32v).
// Returns the accumulated length.
int32_t tPutMapData(uint8_t *p, SMapData *pMapData) {
  int32_t nBytes = 0;

  nBytes += tPutI32v(p ? p + nBytes : p, pMapData->nItem);
  if (pMapData->nItem == 0) {
    return nBytes;
  }

  int32_t prevOffset = 0;
  for (int32_t i = 0; i < pMapData->nItem; i++) {
    nBytes += tPutI32v(p ? p + nBytes : p, pMapData->aOffset[i] - prevOffset);
    prevOffset = pMapData->aOffset[i];
  }

  nBytes += tPutI32v(p ? p + nBytes : p, pMapData->nData);
  if (p) {
    memcpy(p + nBytes, pMapData->pData, pMapData->nData);
  }
  nBytes += pMapData->nData;

  return nBytes;
}

// Deserialize a map from p (the layout written by tPutMapData): nItem, then,
// when nItem is non-zero, the delta-encoded offsets, nData and the data bytes.
//
// The map is reset first and its buffers are grown with tRealloc as needed.
// Returns the accumulated length consumed from p, or -1 if an allocation
// fails. On failure the map is reset again so it never reports items or bytes
// it has no storage for.
int32_t tGetMapData(uint8_t *p, SMapData *pMapData) {
  int32_t n = 0;

  tMapDataReset(pMapData);

  n += tGetI32v(p + n, &pMapData->nItem);
  if (pMapData->nItem) {
    if (tRealloc((uint8_t **)&pMapData->aOffset, sizeof(int32_t) * pMapData->nItem)) goto _err;

    // offsets are stored as deltas; rebuild the absolute values
    int32_t lOffset = 0;
    for (int32_t iItem = 0; iItem < pMapData->nItem; iItem++) {
      n += tGetI32v(p + n, &pMapData->aOffset[iItem]);
      pMapData->aOffset[iItem] += lOffset;
      lOffset = pMapData->aOffset[iItem];
    }

    n += tGetI32v(p + n, &pMapData->nData);
    if (tRealloc(&pMapData->pData, pMapData->nData)) goto _err;
    memcpy(pMapData->pData, p + n, pMapData->nData);
    n += pMapData->nData;
  }

  return n;

_err:
  tMapDataReset(pMapData);
  return -1;
}

H
Hongze Cheng 已提交
151
// TABLEID =======================================================================
H
Hongze Cheng 已提交
152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170
// Three-way comparison of two TABLEID values: by suid first, then by uid.
// Returns -1, 0 or 1.
int32_t tTABLEIDCmprFn(const void *p1, const void *p2) {
  const TABLEID *lhs = (const TABLEID *)p1;
  const TABLEID *rhs = (const TABLEID *)p2;

  if (lhs->suid < rhs->suid) return -1;
  if (lhs->suid > rhs->suid) return 1;

  if (lhs->uid < rhs->uid) return -1;
  if (lhs->uid > rhs->uid) return 1;

  return 0;
}

H
Hongze Cheng 已提交
171
// SBlockIdx ======================================================
H
Hongze Cheng 已提交
172 173 174 175 176 177 178 179
int32_t tPutBlockIdx(uint8_t *p, void *ph) {
  int32_t    n = 0;
  SBlockIdx *pBlockIdx = (SBlockIdx *)ph;

  n += tPutI64(p ? p + n : p, pBlockIdx->suid);
  n += tPutI64(p ? p + n : p, pBlockIdx->uid);
  n += tPutI64v(p ? p + n : p, pBlockIdx->offset);
  n += tPutI64v(p ? p + n : p, pBlockIdx->size);
H
Hongze Cheng 已提交
180 181 182 183

  return n;
}

H
Hongze Cheng 已提交
184 185 186
int32_t tGetBlockIdx(uint8_t *p, void *ph) {
  int32_t    n = 0;
  SBlockIdx *pBlockIdx = (SBlockIdx *)ph;
H
Hongze Cheng 已提交
187

H
Hongze Cheng 已提交
188 189 190 191
  n += tGetI64(p + n, &pBlockIdx->suid);
  n += tGetI64(p + n, &pBlockIdx->uid);
  n += tGetI64v(p + n, &pBlockIdx->offset);
  n += tGetI64v(p + n, &pBlockIdx->size);
H
Hongze Cheng 已提交
192 193 194 195

  return n;
}

196
int32_t tCmprBlockIdx(void const *lhs, void const *rhs) {
M
Minglei Jin 已提交
197 198
  SBlockIdx *lBlockIdx = (SBlockIdx *)lhs;
  SBlockIdx *rBlockIdx = (SBlockIdx *)rhs;
199

M
Minglei Jin 已提交
200
  if (lBlockIdx->suid < rBlockIdx->suid) {
201
    return -1;
M
Minglei Jin 已提交
202
  } else if (lBlockIdx->suid > rBlockIdx->suid) {
203 204 205
    return 1;
  }

M
Minglei Jin 已提交
206
  if (lBlockIdx->uid < rBlockIdx->uid) {
207
    return -1;
M
Minglei Jin 已提交
208
  } else if (lBlockIdx->uid > rBlockIdx->uid) {
209 210 211 212 213 214
    return 1;
  }

  return 0;
}

215 216
int32_t tCmprBlockL(void const *lhs, void const *rhs) {
  SBlockIdx *lBlockIdx = (SBlockIdx *)lhs;
H
Hongze Cheng 已提交
217
  SSttBlk   *rBlockL = (SSttBlk *)rhs;
218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233

  if (lBlockIdx->suid < rBlockL->suid) {
    return -1;
  } else if (lBlockIdx->suid > rBlockL->suid) {
    return 1;
  }

  if (lBlockIdx->uid < rBlockL->minUid) {
    return -1;
  } else if (lBlockIdx->uid > rBlockL->maxUid) {
    return 1;
  }

  return 0;
}

H
Hongze Cheng 已提交
234
// SDataBlk ======================================================
H
Hongze Cheng 已提交
235
// Reset a data block descriptor: min fields start at their MAX sentinel and
// max fields at their MIN sentinel; every other field is zero-initialized.
void tDataBlkReset(SDataBlk *pDataBlk) {
  SDataBlk blank = {
      .minKey = TSDBKEY_MAX,
      .maxKey = TSDBKEY_MIN,
      .minVer = VERSION_MAX,
      .maxVer = VERSION_MIN,
  };

  *pDataBlk = blank;
}

H
Hongze Cheng 已提交
239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255
int32_t tPutDataBlk(uint8_t *p, void *ph) {
  int32_t   n = 0;
  SDataBlk *pDataBlk = (SDataBlk *)ph;

  n += tPutI64v(p ? p + n : p, pDataBlk->minKey.version);
  n += tPutI64v(p ? p + n : p, pDataBlk->minKey.ts);
  n += tPutI64v(p ? p + n : p, pDataBlk->maxKey.version);
  n += tPutI64v(p ? p + n : p, pDataBlk->maxKey.ts);
  n += tPutI64v(p ? p + n : p, pDataBlk->minVer);
  n += tPutI64v(p ? p + n : p, pDataBlk->maxVer);
  n += tPutI32v(p ? p + n : p, pDataBlk->nRow);
  n += tPutI8(p ? p + n : p, pDataBlk->hasDup);
  n += tPutI8(p ? p + n : p, pDataBlk->nSubBlock);
  for (int8_t iSubBlock = 0; iSubBlock < pDataBlk->nSubBlock; iSubBlock++) {
    n += tPutI64v(p ? p + n : p, pDataBlk->aSubBlock[iSubBlock].offset);
    n += tPutI32v(p ? p + n : p, pDataBlk->aSubBlock[iSubBlock].szBlock);
    n += tPutI32v(p ? p + n : p, pDataBlk->aSubBlock[iSubBlock].szKey);
H
Hongze Cheng 已提交
256
  }
H
Hongze Cheng 已提交
257 258 259
  if (pDataBlk->nSubBlock == 1 && !pDataBlk->hasDup) {
    n += tPutI64v(p ? p + n : p, pDataBlk->smaInfo.offset);
    n += tPutI32v(p ? p + n : p, pDataBlk->smaInfo.size);
H
Hongze Cheng 已提交
260 261
  }

H
Hongze Cheng 已提交
262 263 264
  return n;
}

H
Hongze Cheng 已提交
265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281
int32_t tGetDataBlk(uint8_t *p, void *ph) {
  int32_t   n = 0;
  SDataBlk *pDataBlk = (SDataBlk *)ph;

  n += tGetI64v(p + n, &pDataBlk->minKey.version);
  n += tGetI64v(p + n, &pDataBlk->minKey.ts);
  n += tGetI64v(p + n, &pDataBlk->maxKey.version);
  n += tGetI64v(p + n, &pDataBlk->maxKey.ts);
  n += tGetI64v(p + n, &pDataBlk->minVer);
  n += tGetI64v(p + n, &pDataBlk->maxVer);
  n += tGetI32v(p + n, &pDataBlk->nRow);
  n += tGetI8(p + n, &pDataBlk->hasDup);
  n += tGetI8(p + n, &pDataBlk->nSubBlock);
  for (int8_t iSubBlock = 0; iSubBlock < pDataBlk->nSubBlock; iSubBlock++) {
    n += tGetI64v(p + n, &pDataBlk->aSubBlock[iSubBlock].offset);
    n += tGetI32v(p + n, &pDataBlk->aSubBlock[iSubBlock].szBlock);
    n += tGetI32v(p + n, &pDataBlk->aSubBlock[iSubBlock].szKey);
H
Hongze Cheng 已提交
282
  }
H
Hongze Cheng 已提交
283 284 285
  if (pDataBlk->nSubBlock == 1 && !pDataBlk->hasDup) {
    n += tGetI64v(p + n, &pDataBlk->smaInfo.offset);
    n += tGetI32v(p + n, &pDataBlk->smaInfo.size);
H
Hongze Cheng 已提交
286
  } else {
H
Hongze Cheng 已提交
287 288
    pDataBlk->smaInfo.offset = 0;
    pDataBlk->smaInfo.size = 0;
H
Hongze Cheng 已提交
289 290
  }

H
Hongze Cheng 已提交
291 292 293
  return n;
}

H
Hongze Cheng 已提交
294
int32_t tDataBlkCmprFn(const void *p1, const void *p2) {
H
Hongze Cheng 已提交
295 296
  SDataBlk *pBlock1 = (SDataBlk *)p1;
  SDataBlk *pBlock2 = (SDataBlk *)p2;
H
Hongze Cheng 已提交
297

H
Hongze Cheng 已提交
298
  if (tsdbKeyCmprFn(&pBlock1->maxKey, &pBlock2->minKey) < 0) {
H
Hongze Cheng 已提交
299
    return -1;
H
Hongze Cheng 已提交
300
  } else if (tsdbKeyCmprFn(&pBlock1->minKey, &pBlock2->maxKey) > 0) {
H
Hongze Cheng 已提交
301
    return 1;
H
Hongze Cheng 已提交
302 303 304 305 306
  }

  return 0;
}

H
Hongze Cheng 已提交
307
// True only when the block has at most one sub-block, hasDup is zero, and
// smaInfo.size is positive.
bool tDataBlkHasSma(SDataBlk *pDataBlk) {
  return (pDataBlk->nSubBlock <= 1) && !pDataBlk->hasDup && (pDataBlk->smaInfo.size > 0);
}
H
Hongze Cheng 已提交
313

H
Hongze Cheng 已提交
314 315
// SSttBlk ======================================================
int32_t tPutSttBlk(uint8_t *p, void *ph) {
H
Hongze Cheng 已提交
316
  int32_t  n = 0;
H
Hongze Cheng 已提交
317 318 319 320 321 322 323 324 325 326 327 328 329
  SSttBlk *pSttBlk = (SSttBlk *)ph;

  n += tPutI64(p ? p + n : p, pSttBlk->suid);
  n += tPutI64(p ? p + n : p, pSttBlk->minUid);
  n += tPutI64(p ? p + n : p, pSttBlk->maxUid);
  n += tPutI64v(p ? p + n : p, pSttBlk->minKey);
  n += tPutI64v(p ? p + n : p, pSttBlk->maxKey);
  n += tPutI64v(p ? p + n : p, pSttBlk->minVer);
  n += tPutI64v(p ? p + n : p, pSttBlk->maxVer);
  n += tPutI32v(p ? p + n : p, pSttBlk->nRow);
  n += tPutI64v(p ? p + n : p, pSttBlk->bInfo.offset);
  n += tPutI32v(p ? p + n : p, pSttBlk->bInfo.szBlock);
  n += tPutI32v(p ? p + n : p, pSttBlk->bInfo.szKey);
H
Hongze Cheng 已提交
330 331 332 333

  return n;
}

H
Hongze Cheng 已提交
334
int32_t tGetSttBlk(uint8_t *p, void *ph) {
H
Hongze Cheng 已提交
335
  int32_t  n = 0;
H
Hongze Cheng 已提交
336 337 338 339 340 341 342 343 344 345 346 347 348
  SSttBlk *pSttBlk = (SSttBlk *)ph;

  n += tGetI64(p + n, &pSttBlk->suid);
  n += tGetI64(p + n, &pSttBlk->minUid);
  n += tGetI64(p + n, &pSttBlk->maxUid);
  n += tGetI64v(p + n, &pSttBlk->minKey);
  n += tGetI64v(p + n, &pSttBlk->maxKey);
  n += tGetI64v(p + n, &pSttBlk->minVer);
  n += tGetI64v(p + n, &pSttBlk->maxVer);
  n += tGetI32v(p + n, &pSttBlk->nRow);
  n += tGetI64v(p + n, &pSttBlk->bInfo.offset);
  n += tGetI32v(p + n, &pSttBlk->bInfo.szBlock);
  n += tGetI32v(p + n, &pSttBlk->bInfo.szKey);
H
Hongze Cheng 已提交
349 350 351

  return n;
}
H
Hongze Cheng 已提交
352

H
Hongze Cheng 已提交
353 354 355 356 357 358 359 360 361
// SBlockCol ======================================================
int32_t tPutBlockCol(uint8_t *p, void *ph) {
  int32_t    n = 0;
  SBlockCol *pBlockCol = (SBlockCol *)ph;

  ASSERT(pBlockCol->flag && (pBlockCol->flag != HAS_NONE));

  n += tPutI16v(p ? p + n : p, pBlockCol->cid);
  n += tPutI8(p ? p + n : p, pBlockCol->type);
H
Hongze Cheng 已提交
362
  n += tPutI8(p ? p + n : p, pBlockCol->smaOn);
H
Hongze Cheng 已提交
363
  n += tPutI8(p ? p + n : p, pBlockCol->flag);
H
Hongze Cheng 已提交
364
  n += tPutI32v(p ? p + n : p, pBlockCol->szOrigin);
H
Hongze Cheng 已提交
365 366

  if (pBlockCol->flag != HAS_NULL) {
H
Hongze Cheng 已提交
367 368 369 370 371 372 373 374 375 376 377 378
    if (pBlockCol->flag != HAS_VALUE) {
      n += tPutI32v(p ? p + n : p, pBlockCol->szBitmap);
    }

    if (IS_VAR_DATA_TYPE(pBlockCol->type)) {
      n += tPutI32v(p ? p + n : p, pBlockCol->szOffset);
    }

    if (pBlockCol->flag != (HAS_NULL | HAS_NONE)) {
      n += tPutI32v(p ? p + n : p, pBlockCol->szValue);
    }

H
Hongze Cheng 已提交
379
    n += tPutI32v(p ? p + n : p, pBlockCol->offset);
H
Hongze Cheng 已提交
380 381
  }

H
Hongze Cheng 已提交
382
_exit:
H
Hongze Cheng 已提交
383 384 385 386 387 388 389 390 391
  return n;
}

int32_t tGetBlockCol(uint8_t *p, void *ph) {
  int32_t    n = 0;
  SBlockCol *pBlockCol = (SBlockCol *)ph;

  n += tGetI16v(p + n, &pBlockCol->cid);
  n += tGetI8(p + n, &pBlockCol->type);
H
Hongze Cheng 已提交
392
  n += tGetI8(p + n, &pBlockCol->smaOn);
H
Hongze Cheng 已提交
393
  n += tGetI8(p + n, &pBlockCol->flag);
H
Hongze Cheng 已提交
394
  n += tGetI32v(p + n, &pBlockCol->szOrigin);
H
Hongze Cheng 已提交
395 396 397

  ASSERT(pBlockCol->flag && (pBlockCol->flag != HAS_NONE));

H
Hongze Cheng 已提交
398 399 400 401 402
  pBlockCol->szBitmap = 0;
  pBlockCol->szOffset = 0;
  pBlockCol->szValue = 0;
  pBlockCol->offset = 0;

H
Hongze Cheng 已提交
403
  if (pBlockCol->flag != HAS_NULL) {
H
Hongze Cheng 已提交
404 405 406 407 408 409 410 411 412 413 414 415
    if (pBlockCol->flag != HAS_VALUE) {
      n += tGetI32v(p + n, &pBlockCol->szBitmap);
    }

    if (IS_VAR_DATA_TYPE(pBlockCol->type)) {
      n += tGetI32v(p + n, &pBlockCol->szOffset);
    }

    if (pBlockCol->flag != (HAS_NULL | HAS_NONE)) {
      n += tGetI32v(p + n, &pBlockCol->szValue);
    }

H
Hongze Cheng 已提交
416
    n += tGetI32v(p + n, &pBlockCol->offset);
H
Hongze Cheng 已提交
417 418 419 420 421
  }

  return n;
}

H
Hongze Cheng 已提交
422 423 424 425 426 427 428 429 430 431
int32_t tBlockColCmprFn(const void *p1, const void *p2) {
  if (((SBlockCol *)p1)->cid < ((SBlockCol *)p2)->cid) {
    return -1;
  } else if (((SBlockCol *)p1)->cid > ((SBlockCol *)p2)->cid) {
    return 1;
  }

  return 0;
}

H
Hongze Cheng 已提交
432
// SDelIdx ======================================================
433
int32_t tCmprDelIdx(void const *lhs, void const *rhs) {
M
Minglei Jin 已提交
434 435
  SDelIdx *lDelIdx = (SDelIdx *)lhs;
  SDelIdx *rDelIdx = (SDelIdx *)rhs;
436

M
Minglei Jin 已提交
437
  if (lDelIdx->suid < rDelIdx->suid) {
438
    return -1;
M
Minglei Jin 已提交
439
  } else if (lDelIdx->suid > rDelIdx->suid) {
440 441 442
    return 1;
  }

M
Minglei Jin 已提交
443
  if (lDelIdx->uid < rDelIdx->uid) {
444
    return -1;
M
Minglei Jin 已提交
445
  } else if (lDelIdx->uid > rDelIdx->uid) {
446 447 448 449 450 451
    return 1;
  }

  return 0;
}

H
Hongze Cheng 已提交
452 453 454 455 456 457 458 459
int32_t tPutDelIdx(uint8_t *p, void *ph) {
  SDelIdx *pDelIdx = (SDelIdx *)ph;
  int32_t  n = 0;

  n += tPutI64(p ? p + n : p, pDelIdx->suid);
  n += tPutI64(p ? p + n : p, pDelIdx->uid);
  n += tPutI64v(p ? p + n : p, pDelIdx->offset);
  n += tPutI64v(p ? p + n : p, pDelIdx->size);
H
Hongze Cheng 已提交
460 461 462 463

  return n;
}

H
Hongze Cheng 已提交
464 465 466
int32_t tGetDelIdx(uint8_t *p, void *ph) {
  SDelIdx *pDelIdx = (SDelIdx *)ph;
  int32_t  n = 0;
H
Hongze Cheng 已提交
467

H
Hongze Cheng 已提交
468 469 470 471
  n += tGetI64(p + n, &pDelIdx->suid);
  n += tGetI64(p + n, &pDelIdx->uid);
  n += tGetI64v(p + n, &pDelIdx->offset);
  n += tGetI64v(p + n, &pDelIdx->size);
H
Hongze Cheng 已提交
472 473 474 475

  return n;
}

H
Hongze Cheng 已提交
476
// SDelData ======================================================
H
Hongze Cheng 已提交
477 478 479 480 481 482 483
int32_t tPutDelData(uint8_t *p, void *ph) {
  SDelData *pDelData = (SDelData *)ph;
  int32_t   n = 0;

  n += tPutI64v(p ? p + n : p, pDelData->version);
  n += tPutI64(p ? p + n : p, pDelData->sKey);
  n += tPutI64(p ? p + n : p, pDelData->eKey);
H
Hongze Cheng 已提交
484 485 486 487

  return n;
}

H
Hongze Cheng 已提交
488 489 490
int32_t tGetDelData(uint8_t *p, void *ph) {
  SDelData *pDelData = (SDelData *)ph;
  int32_t   n = 0;
H
Hongze Cheng 已提交
491

H
Hongze Cheng 已提交
492 493 494
  n += tGetI64v(p + n, &pDelData->version);
  n += tGetI64(p + n, &pDelData->sKey);
  n += tGetI64(p + n, &pDelData->eKey);
H
Hongze Cheng 已提交
495 496

  return n;
H
Hongze Cheng 已提交
497 498
}

H
Hongze Cheng 已提交
499 500 501 502 503 504
// Map a timestamp key to a file id: the key is divided by the ticks-per-minute
// of the given precision and then by `minutes`.
// Negative keys use (key + 1) / ... - 1 so that they round toward negative
// infinity rather than toward zero.
int32_t tsdbKeyFid(TSKEY key, int32_t minutes, int8_t precision) {
  if (key >= 0) {
    return (int)((key / tsTickPerMin[precision] / minutes));
  }

  return (int)((key + 1) / tsTickPerMin[precision] / minutes - 1);
}

H
Hongze Cheng 已提交
507 508 509 510 511
// Compute the inclusive key range [*minKey, *maxKey] covered by file id `fid`,
// where each file spans `minutes` minutes at the given precision.
//
// fid is widened to 64 bits before multiplying so that fid * minutes is never
// evaluated in 32-bit arithmetic (the element type of tsTickPerMin is not
// visible here; the cast makes the result independent of it).
void tsdbFidKeyRange(int32_t fid, int32_t minutes, int8_t precision, TSKEY *minKey, TSKEY *maxKey) {
  *minKey = (int64_t)fid * minutes * tsTickPerMin[precision];
  *maxKey = *minKey + minutes * tsTickPerMin[precision] - 1;
}

H
Hongze Cheng 已提交
512 513 514 515
// Classify a file id against the three keep thresholds of pKeepCfg.
//
// `now` is scaled to the configured precision (x1000 / x1000000 / x1000000000
// for milli / micro / nano; any other precision asserts). For each of keep0,
// keep1 and keep2 the boundary file id is computed from
// now - keepN * ticks-per-minute.
// Returns 0, 1 or 2 for the first boundary that fid is at or above, or -1 when
// fid is below all three.
int32_t tsdbFidLevel(int32_t fid, STsdbKeepCfg *pKeepCfg, int64_t now) {
  int32_t aFid[3];
  TSKEY   key;

  if (pKeepCfg->precision == TSDB_TIME_PRECISION_MILLI) {
    now *= 1000;
  } else if (pKeepCfg->precision == TSDB_TIME_PRECISION_MICRO) {
    now *= 1000000l;
  } else if (pKeepCfg->precision == TSDB_TIME_PRECISION_NANO) {
    now *= 1000000000l;
  } else {
    ASSERT(0);
  }

  key = now - pKeepCfg->keep0 * tsTickPerMin[pKeepCfg->precision];
  aFid[0] = tsdbKeyFid(key, pKeepCfg->days, pKeepCfg->precision);

  key = now - pKeepCfg->keep1 * tsTickPerMin[pKeepCfg->precision];
  aFid[1] = tsdbKeyFid(key, pKeepCfg->days, pKeepCfg->precision);

  key = now - pKeepCfg->keep2 * tsTickPerMin[pKeepCfg->precision];
  aFid[2] = tsdbKeyFid(key, pKeepCfg->days, pKeepCfg->precision);

  for (int32_t level = 0; level < 3; level++) {
    if (fid >= aFid[level]) {
      return level;
    }
  }

  return -1;
}
H
Hongze Cheng 已提交
543

H
Hongze Cheng 已提交
544 545
// TSDBROW ======================================================
// Fetch the value of schema column iCol (must be > 0, asserted) from a row.
//
// type 0 rows are read through tTSRowGetVal. type 1 rows look the column up in
// the row's block data by column id; if the block has no such column, *pColVal
// is set to COL_VAL_NONE for that column. Any other row type asserts.
void tsdbRowGetColVal(TSDBROW *pRow, STSchema *pTSchema, int32_t iCol, SColVal *pColVal) {
  STColumn *pTColumn = &pTSchema->columns[iCol];

  ASSERT(iCol > 0);

  if (pRow->type == 0) {
    tTSRowGetVal(pRow->pTSRow, pTSchema, iCol, pColVal);
  } else if (pRow->type == 1) {
    SColData *pColData;

    tBlockDataGetColData(pRow->pBlockData, pTColumn->colId, &pColData);

    if (pColData) {
      tColDataGetValue(pColData, pRow->iRow, pColVal);
    } else {
      *pColVal = COL_VAL_NONE(pTColumn->colId, pTColumn->type);
    }
  } else {
    ASSERT(0);
  }
}

H
Hongze Cheng 已提交
568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587
// Encode a row as its version (tPutI64) followed by the raw bytes of
// pRow->pTSRow (pTSRow->len bytes). The row bytes are copied only when p is
// non-NULL. Returns the version's encoded length plus pTSRow->len.
int32_t tPutTSDBRow(uint8_t *p, TSDBROW *pRow) {
  int32_t nBytes = 0;

  nBytes += tPutI64(p, pRow->version);
  if (p) {
    memcpy(p + nBytes, pRow->pTSRow, pRow->pTSRow->len);
  }
  nBytes += pRow->pTSRow->len;

  return nBytes;
}

// Decode a row written by tPutTSDBRow. The version is read with tGetI64 and
// pRow->pTSRow is pointed directly into the buffer p (no copy is made), so the
// row is only valid while p is.
// Returns the version's encoded length plus pTSRow->len.
int32_t tGetTSDBRow(uint8_t *p, TSDBROW *pRow) {
  int32_t nBytes = 0;

  nBytes += tGetI64(p, &pRow->version);
  pRow->pTSRow = (STSRow *)(p + nBytes);
  nBytes += pRow->pTSRow->len;

  return nBytes;
}

H
Hongze Cheng 已提交
588 589 590 591
int32_t tsdbRowCmprFn(const void *p1, const void *p2) {
  return tsdbKeyCmprFn(&TSDBROW_KEY((TSDBROW *)p1), &TSDBROW_KEY((TSDBROW *)p2));
}

H
Hongze Cheng 已提交
592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615
// SRowIter ======================================================
// Prepare an iterator over the column values of pRow.
// type 0 rows require a schema (asserted) and start at index 1; type 1 rows
// ignore the schema and start at index 0. Any other row type asserts.
void tRowIterInit(SRowIter *pIter, TSDBROW *pRow, STSchema *pTSchema) {
  pIter->pRow = pRow;

  switch (pRow->type) {
    case 0:
      ASSERT(pTSchema);
      pIter->pTSchema = pTSchema;
      pIter->i = 1;
      break;
    case 1:
      pIter->pTSchema = NULL;
      pIter->i = 0;
      break;
    default:
      ASSERT(0);
      break;
  }
}

// Advance the iterator and return a pointer to the next column value, which is
// stored in pIter->colVal and overwritten by the following call.
// Returns NULL once the columns are exhausted: the schema's numOfCols for
// type 0 rows, or the size of the block data's aIdx array otherwise.
SColVal *tRowIterNext(SRowIter *pIter) {
  SColVal *pNext = NULL;

  if (pIter->pRow->type == 0) {
    if (pIter->i < pIter->pTSchema->numOfCols) {
      tsdbRowGetColVal(pIter->pRow, pIter->pTSchema, pIter->i, &pIter->colVal);
      pIter->i++;
      pNext = &pIter->colVal;
    }
  } else if (pIter->i < taosArrayGetSize(pIter->pRow->pBlockData->aIdx)) {
    SColData *pColData = tBlockDataGetColDataByIdx(pIter->pRow->pBlockData, pIter->i);

    tColDataGetValue(pColData, pIter->pRow->iRow, &pIter->colVal);
    pIter->i++;
    pNext = &pIter->colVal;
  }

  return pNext;
}

H
Hongze Cheng 已提交
629
// SRowMerger ======================================================
630 631 632 633 634 635

// Initialize a merger whose result layout is pResTSchema from a first row
// pRow that is described by pTSchema.
//
// The merger's array receives one SColVal per result column: the timestamp
// first, then, for each result column, the row's value when pTSchema has a
// column with the same colId, or a NONE placeholder otherwise. Both schemas
// are walked in parallel and are assumed to be ordered by colId.
//
// Returns 0 on success or TSDB_CODE_OUT_OF_MEMORY when the array cannot be
// created or grown; every push is checked, including the NONE placeholders.
// pMerger->pArray is not released on failure here.
int32_t tRowMergerInit2(SRowMerger *pMerger, STSchema *pResTSchema, TSDBROW *pRow, STSchema *pTSchema) {
  int32_t   code = 0;
  TSDBKEY   key = TSDBROW_KEY(pRow);
  SColVal  *pColVal = &(SColVal){0};
  STColumn *pTColumn;
  int32_t   iCol, jCol = 0;  // iCol walks pResTSchema, jCol walks pTSchema

  pMerger->pTSchema = pResTSchema;
  pMerger->version = key.version;

  pMerger->pArray = taosArrayInit(pResTSchema->numOfCols, sizeof(SColVal));
  if (pMerger->pArray == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  // ts
  pTColumn = &pTSchema->columns[jCol++];

  ASSERT(pTColumn->type == TSDB_DATA_TYPE_TIMESTAMP);

  *pColVal = COL_VAL_VALUE(pTColumn->colId, pTColumn->type, (SValue){.ts = key.ts});
  if (taosArrayPush(pMerger->pArray, pColVal) == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  // other
  iCol = 1;
  while (jCol < pTSchema->numOfCols && iCol < pResTSchema->numOfCols) {
    pTColumn = &pResTSchema->columns[iCol];

    if (pTSchema->columns[jCol].colId < pTColumn->colId) {
      // row column is not part of the result schema: skip it
      ++jCol;
      continue;
    }

    if (pTSchema->columns[jCol].colId > pTColumn->colId) {
      // result column is missing from the row: fill with NONE
      *pColVal = COL_VAL_NONE(pTColumn->colId, pTColumn->type);
    } else {
      tsdbRowGetColVal(pRow, pTSchema, jCol++, pColVal);
    }

    if (taosArrayPush(pMerger->pArray, pColVal) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _exit;
    }
    ++iCol;
  }

  // result columns beyond the end of the row schema are NONE
  for (; iCol < pResTSchema->numOfCols; ++iCol) {
    pTColumn = &pResTSchema->columns[iCol];
    *pColVal = COL_VAL_NONE(pTColumn->colId, pTColumn->type);
    if (taosArrayPush(pMerger->pArray, pColVal) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _exit;
    }
  }

_exit:
  return code;
}

// Merge another row, described by pTSchema, into a merger whose result layout
// is pMerger->pTSchema. The row must have the same timestamp as the merger's
// first column (asserted).
//
// Both schemas are walked in parallel by colId. For columns present in both:
//   - a row with a higher version than the merger overwrites the stored value
//     unless the row's value is NONE;
//   - a row with a lower version only fills stored values that are NONE;
//   - an equal version asserts.
// Afterwards the merger's version is set to the row's version.
// Always returns 0.
int32_t tRowMergerAdd(SRowMerger *pMerger, TSDBROW *pRow, STSchema *pTSchema) {
  int32_t   code = 0;
  TSDBKEY   key = TSDBROW_KEY(pRow);
  SColVal  *pColVal = &(SColVal){0};
  STColumn *pTColumn;
  int32_t   iCol = 1;  // walks pMerger->pTSchema
  int32_t   jCol = 1;  // walks pTSchema

  ASSERT(((SColVal *)pMerger->pArray->pData)->value.ts == key.ts);

  while (iCol < pMerger->pTSchema->numOfCols && jCol < pTSchema->numOfCols) {
    pTColumn = &pMerger->pTSchema->columns[iCol];

    if (pTSchema->columns[jCol].colId < pTColumn->colId) {
      // row column is not part of the result schema: skip it
      ++jCol;
      continue;
    }
    if (pTSchema->columns[jCol].colId > pTColumn->colId) {
      // result column is missing from the row: nothing to merge
      ++iCol;
      continue;
    }

    tsdbRowGetColVal(pRow, pTSchema, jCol++, pColVal);

    if (key.version > pMerger->version) {
      if (!pColVal->isNone) {
        taosArraySet(pMerger->pArray, iCol, pColVal);
      }
    } else if (key.version < pMerger->version) {
      SColVal *tColVal = (SColVal *)taosArrayGet(pMerger->pArray, iCol);
      if (tColVal->isNone && !pColVal->isNone) {
        taosArraySet(pMerger->pArray, iCol, pColVal);
      }
    } else {
      ASSERT(0);
    }

    ++iCol;
  }

  pMerger->version = key.version;

  return code;
}

H
Hongze Cheng 已提交
727 728
// Initialize a merger from a first row, using pTSchema for both the row and
// the result layout. The merger's array receives the timestamp followed by the
// row's value for every other schema column.
// Returns 0 on success or TSDB_CODE_OUT_OF_MEMORY when the array cannot be
// created or grown. pMerger->pArray is not released on failure here.
int32_t tRowMergerInit(SRowMerger *pMerger, TSDBROW *pRow, STSchema *pTSchema) {
  TSDBKEY   key = TSDBROW_KEY(pRow);
  SColVal   colVal = {0};
  STColumn *pTsColumn;

  pMerger->pTSchema = pTSchema;
  pMerger->version = key.version;

  pMerger->pArray = taosArrayInit(pTSchema->numOfCols, sizeof(SColVal));
  if (pMerger->pArray == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // timestamp column comes first
  pTsColumn = &pTSchema->columns[0];

  ASSERT(pTsColumn->type == TSDB_DATA_TYPE_TIMESTAMP);

  colVal = COL_VAL_VALUE(pTsColumn->colId, pTsColumn->type, (SValue){.ts = key.ts});
  if (taosArrayPush(pMerger->pArray, &colVal) == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  // remaining columns in schema order
  for (int16_t iCol = 1; iCol < pTSchema->numOfCols; iCol++) {
    tsdbRowGetColVal(pRow, pTSchema, iCol, &colVal);
    if (taosArrayPush(pMerger->pArray, &colVal) == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  return 0;
}

// Destroy the merger's column value array. The pArray pointer itself is not
// reset.
void tRowMergerClear(SRowMerger *pMerger) {
  taosArrayDestroy(pMerger->pArray);
}

// Merge another row into the merger, where the row uses the merger's own
// schema. The row must have the same timestamp as the merger's first column
// (asserted).
//
// For every non-timestamp column:
//   - a row with a higher version than the merger overwrites the stored value
//     unless the row's value is NONE;
//   - a row with a lower version only fills stored values that are NONE;
//   - an equal version asserts.
// Afterwards the merger's version is set to the row's version.
// Always returns 0.
int32_t tRowMerge(SRowMerger *pMerger, TSDBROW *pRow) {
  int32_t  code = 0;
  TSDBKEY  key = TSDBROW_KEY(pRow);
  SColVal *pColVal = &(SColVal){0};

  ASSERT(((SColVal *)pMerger->pArray->pData)->value.ts == key.ts);

  for (int32_t iCol = 1; iCol < pMerger->pTSchema->numOfCols; iCol++) {
    tsdbRowGetColVal(pRow, pMerger->pTSchema, iCol, pColVal);

    if (key.version > pMerger->version) {
      if (!pColVal->isNone) {
        taosArraySet(pMerger->pArray, iCol, pColVal);
      }
    } else if (key.version < pMerger->version) {
      SColVal *tColVal = (SColVal *)taosArrayGet(pMerger->pArray, iCol);
      if (tColVal->isNone && !pColVal->isNone) {
        taosArraySet(pMerger->pArray, iCol, pColVal);
      }
    } else {
      ASSERT(0);
    }
  }

  pMerger->version = key.version;

  return code;
}

// Build a row from the merged column values via tdSTSRowNew, storing it in
// *ppRow. Returns tdSTSRowNew's result code.
int32_t tRowMergerGetRow(SRowMerger *pMerger, STSRow **ppRow) {
  int32_t code = tdSTSRowNew(pMerger->pArray, pMerger->pTSchema, ppRow);

  return code;
}

H
Hongze Cheng 已提交
806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908
// delete skyline ======================================================
// Merge two skylines (arrays of TSDBKEY ordered by ts) into aSkyline, which is
// cleared first. Both inputs must be non-empty (asserted).
//
// While both inputs have points left, the one with the smaller ts is consumed
// (both on a tie) and one point is emitted at that ts whose version is the
// maximum of the versions most recently consumed from each input. Once one
// input is exhausted, the rest of the other is copied unchanged.
// Returns 0 on success or TSDB_CODE_OUT_OF_MEMORY if a push fails.
static int32_t tsdbMergeSkyline(SArray *aSkyline1, SArray *aSkyline2, SArray *aSkyline) {
  int32_t code = 0;
  int32_t n1 = taosArrayGetSize(aSkyline1);
  int32_t n2 = taosArrayGetSize(aSkyline2);
  int32_t i1 = 0;
  int32_t i2 = 0;
  int64_t curVer1 = 0;  // version of the last point consumed from aSkyline1
  int64_t curVer2 = 0;  // version of the last point consumed from aSkyline2
  TSDBKEY merged;

  ASSERT(n1 > 0 && n2 > 0);

  taosArrayClear(aSkyline);

  while (i1 < n1 && i2 < n2) {
    TSDBKEY *pKey1 = (TSDBKEY *)taosArrayGet(aSkyline1, i1);
    TSDBKEY *pKey2 = (TSDBKEY *)taosArrayGet(aSkyline2, i2);

    if (pKey1->ts < pKey2->ts) {
      curVer1 = pKey1->version;
      i1++;
    } else if (pKey1->ts > pKey2->ts) {
      curVer2 = pKey2->version;
      i2++;
    } else {
      curVer1 = pKey1->version;
      curVer2 = pKey2->version;
      i1++;
      i2++;
    }

    merged.ts = TMIN(pKey1->ts, pKey2->ts);
    merged.version = TMAX(curVer1, curVer2);
    if (taosArrayPush(aSkyline, &merged) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _exit;
    }
  }

  // leftover points of the first skyline
  for (; i1 < n1; i1++) {
    TSDBKEY *pKey1 = (TSDBKEY *)taosArrayGet(aSkyline1, i1);
    merged.ts = pKey1->ts;
    merged.version = pKey1->version;
    if (taosArrayPush(aSkyline, &merged) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _exit;
    }
  }

  // leftover points of the second skyline
  for (; i2 < n2; i2++) {
    TSDBKEY *pKey2 = (TSDBKEY *)taosArrayGet(aSkyline2, i2);
    merged.ts = pKey2->ts;
    merged.version = pKey2->version;
    if (taosArrayPush(aSkyline, &merged) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _exit;
    }
  }

_exit:
  return code;
}
// Build the delete skyline for aDelData[sidx..eidx] (inclusive) into aSkyline,
// which is cleared first.
//
// A single delete record yields two points: (sKey, version) and (eKey, 0).
// Larger ranges are split in the middle, built recursively into two temporary
// arrays, and combined with tsdbMergeSkyline.
//
// Returns 0 on success or TSDB_CODE_OUT_OF_MEMORY when an array cannot be
// created or grown (including the two pushes of the single-record case), or
// the error of a recursive call / merge.
int32_t tsdbBuildDeleteSkyline(SArray *aDelData, int32_t sidx, int32_t eidx, SArray *aSkyline) {
  int32_t   code = 0;
  SDelData *pDelData;
  int32_t   midx;

  taosArrayClear(aSkyline);
  if (sidx == eidx) {
    pDelData = (SDelData *)taosArrayGet(aDelData, sidx);
    if (taosArrayPush(aSkyline, &(TSDBKEY){.ts = pDelData->sKey, .version = pDelData->version}) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _exit;
    }
    if (taosArrayPush(aSkyline, &(TSDBKEY){.ts = pDelData->eKey, .version = 0}) == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _exit;
    }
  } else {
    SArray *aSkyline1 = NULL;
    SArray *aSkyline2 = NULL;

    aSkyline1 = taosArrayInit(0, sizeof(TSDBKEY));
    aSkyline2 = taosArrayInit(0, sizeof(TSDBKEY));
    if (aSkyline1 == NULL || aSkyline2 == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _clear;
    }

    midx = (sidx + eidx) / 2;

    code = tsdbBuildDeleteSkyline(aDelData, sidx, midx, aSkyline1);
    if (code) goto _clear;

    code = tsdbBuildDeleteSkyline(aDelData, midx + 1, eidx, aSkyline2);
    if (code) goto _clear;

    code = tsdbMergeSkyline(aSkyline1, aSkyline2, aSkyline);

  _clear:
    taosArrayDestroy(aSkyline1);
    taosArrayDestroy(aSkyline2);
  }

_exit:
  return code;
}

H
Hongze Cheng 已提交
912
// SBlockData ======================================================
H
Hongze Cheng 已提交
913
// Puts pBlockData into its initial empty state: zero ids and row count, no
// per-row buffers, and two freshly created empty arrays (aIdx holding int32_t
// entries, aColData holding SColData entries).
//
// Returns 0 on success or TSDB_CODE_OUT_OF_MEMORY if either array cannot be
// created. On failure both array pointers are left NULL so the struct never
// carries a dangling or uninitialized pointer.
int32_t tBlockDataCreate(SBlockData *pBlockData) {
  pBlockData->suid = 0;
  pBlockData->uid = 0;
  pBlockData->nRow = 0;
  pBlockData->aUid = NULL;
  pBlockData->aVersion = NULL;
  pBlockData->aTSKEY = NULL;
  pBlockData->aIdx = NULL;
  pBlockData->aColData = NULL;

  pBlockData->aIdx = taosArrayInit(0, sizeof(int32_t));
  if (pBlockData->aIdx == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  pBlockData->aColData = taosArrayInit(0, sizeof(SColData));
  if (pBlockData->aColData == NULL) {
    // Undo the first allocation and forget the pointer so nobody frees it again.
    taosArrayDestroy(pBlockData->aIdx);
    pBlockData->aIdx = NULL;
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  return 0;
}

H
Hongze Cheng 已提交
938
// Releases the per-row buffers and both arrays owned by pBlockData, then sets
// each released pointer to NULL. When deepClear is non-zero, tColDataDestroy is
// supplied as the element callback while aColData is destroyed; otherwise no
// element callback is supplied.
void tBlockDataDestroy(SBlockData *pBlockData, int8_t deepClear) {
  // per-row buffers
  tFree((uint8_t *)pBlockData->aUid);
  pBlockData->aUid = NULL;

  tFree((uint8_t *)pBlockData->aVersion);
  pBlockData->aVersion = NULL;

  tFree((uint8_t *)pBlockData->aTSKEY);
  pBlockData->aTSKEY = NULL;

  // column index
  taosArrayDestroy(pBlockData->aIdx);
  pBlockData->aIdx = NULL;

  // column storage
  if (deepClear) {
    taosArrayDestroyEx(pBlockData->aColData, tColDataDestroy);
  } else {
    taosArrayDestroyEx(pBlockData->aColData, NULL);
  }
  pBlockData->aColData = NULL;
}

H
Hongze Cheng 已提交
951 952 953 954 955 956 957
// Binds pBlockData to the table identified by (suid, uid) and rebuilds its
// column list from pTSchema. At least one of suid / uid must be non-zero.
//
// The row count is reset and aIdx is emptied; then one SColData is registered
// for every schema column except column 0 (presumably the primary timestamp,
// which the block keeps in aTSKEY -- confirm against the schema definition).
// Each column's SMA switch is 1 when the schema column has COL_SMA_ON set.
//
// Returns 0, or the error code from tBlockDataAddColData().
int32_t tBlockDataInit(SBlockData *pBlockData, int64_t suid, int64_t uid, STSchema *pTSchema) {
  ASSERT(suid || uid);

  pBlockData->suid = suid;
  pBlockData->uid = uid;
  pBlockData->nRow = 0;
  taosArrayClear(pBlockData->aIdx);

  // Block column i is built from schema column i + 1.
  for (int32_t iColData = 0; iColData + 1 < pTSchema->numOfCols; iColData++) {
    STColumn *pSchemaCol = &pTSchema->columns[iColData + 1];
    SColData *pColData;

    int32_t code = tBlockDataAddColData(pBlockData, iColData, &pColData);
    if (code) return code;

    tColDataInit(pColData, pSchemaCol->colId, pSchemaCol->type, (pSchemaCol->flags & COL_SMA_ON) ? 1 : 0);
  }

  return 0;
}

H
Hongze Cheng 已提交
975
// Initializes pBlockData as an empty block with the same table ids and the same
// column layout (cid, type, smaOn per column) as pBlockDataFrom. No row data is
// copied. pBlockDataFrom must have a non-zero suid or uid.
//
// Returns 0, or the error code from tBlockDataAddColData().
int32_t tBlockDataInitEx(SBlockData *pBlockData, SBlockData *pBlockDataFrom) {
  ASSERT(pBlockDataFrom->suid || pBlockDataFrom->uid);

  pBlockData->suid = pBlockDataFrom->suid;
  pBlockData->uid = pBlockDataFrom->uid;
  pBlockData->nRow = 0;
  taosArrayClear(pBlockData->aIdx);

  int32_t iColData = 0;
  while (iColData < taosArrayGetSize(pBlockDataFrom->aIdx)) {
    SColData *pTemplate = tBlockDataGetColDataByIdx(pBlockDataFrom, iColData);
    SColData *pColData;

    int32_t code = tBlockDataAddColData(pBlockData, iColData, &pColData);
    if (code) return code;

    tColDataInit(pColData, pTemplate->cid, pTemplate->type, pTemplate->smaOn);
    iColData++;
  }

  return 0;
}

H
Hongze Cheng 已提交
999 1000 1001 1002 1003 1004 1005 1006
// Returns pBlockData to the unbound state: no active columns, no rows, and
// both table ids zero. Allocated buffers and the aColData array are kept.
void tBlockDataReset(SBlockData *pBlockData) {
  taosArrayClear(pBlockData->aIdx);
  pBlockData->nRow = 0;
  pBlockData->uid = 0;
  pBlockData->suid = 0;
}

// Drops all rows from a bound block (suid or uid must be non-zero) while
// keeping its column layout: the row count becomes 0 and tColDataClear() is
// applied to every active column.
void tBlockDataClear(SBlockData *pBlockData) {
  ASSERT(pBlockData->suid || pBlockData->uid);

  pBlockData->nRow = 0;

  int32_t iColData = 0;
  while (iColData < taosArrayGetSize(pBlockData->aIdx)) {
    SColData *pActive = tBlockDataGetColDataByIdx(pBlockData, iColData);
    tColDataClear(pActive);
    iColData++;
  }
}

H
Hongze Cheng 已提交
1016 1017
// Activates one more column in pBlockData and places it at position iColData
// of the column index (aIdx).
//
// The backing SColData slot is the element of aColData whose index equals the
// current number of active columns; a zeroed slot is appended to aColData only
// when no such element exists yet, so previously allocated slots are reused.
//
// On success *ppColData points at the slot and 0 is returned. On allocation
// failure *ppColData is set to NULL and TSDB_CODE_OUT_OF_MEMORY is returned.
int32_t tBlockDataAddColData(SBlockData *pBlockData, int32_t iColData, SColData **ppColData) {
  int32_t slot = taosArrayGetSize(pBlockData->aIdx);

  // Grow the slot pool only if the slot we need is not there already.
  if (slot >= taosArrayGetSize(pBlockData->aColData) &&
      taosArrayPush(pBlockData->aColData, &((SColData){0})) == NULL) {
    *ppColData = NULL;
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  SColData *pSlot = (SColData *)taosArrayGet(pBlockData->aColData, slot);

  // Record the slot number at the requested position of the index.
  if (taosArrayInsert(pBlockData->aIdx, iColData, &slot) == NULL) {
    *ppColData = NULL;
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  *ppColData = pSlot;
  return 0;
}
H
Hongze Cheng 已提交
1041

H
Hongze Cheng 已提交
1042
// Appends pRow as the next row of pBlockData.
//
//   uid       stored in aUid only when the block's own uid is 0; it must then be
//             non-zero
//   pTSchema  forwarded to tRowIterInit() to iterate the row's column values
//
// The row's version and timestamp go to aVersion / aTSKEY. Then the row's
// values and the block's active columns are walked in step by column id: a
// block column with a matching value receives it, a block column the row has
// no value for receives a NONE value, and row values whose id precedes the
// current block column are skipped.
//
// Returns 0 and increments nRow on success. On failure the error code is
// returned and nRow is unchanged; data already written for this row is not
// rolled back.
int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTSchema, int64_t uid) {
  int32_t code;

  ASSERT(pBlockData->suid || pBlockData->uid);

  // uid
  if (pBlockData->uid == 0) {
    ASSERT(uid);
    code = tRealloc((uint8_t **)&pBlockData->aUid, sizeof(int64_t) * (pBlockData->nRow + 1));
    if (code) return code;
    pBlockData->aUid[pBlockData->nRow] = uid;
  }

  // version
  code = tRealloc((uint8_t **)&pBlockData->aVersion, sizeof(int64_t) * (pBlockData->nRow + 1));
  if (code) return code;
  pBlockData->aVersion[pBlockData->nRow] = TSDBROW_VERSION(pRow);

  // timestamp
  code = tRealloc((uint8_t **)&pBlockData->aTSKEY, sizeof(TSKEY) * (pBlockData->nRow + 1));
  if (code) return code;
  pBlockData->aTSKEY[pBlockData->nRow] = TSDBROW_TS(pRow);

  // remaining columns
  SRowIter rowIter = {0};
  tRowIterInit(&rowIter, pRow, pTSchema);
  SColVal *pVal = tRowIterNext(&rowIter);

  int32_t iColData = 0;
  while (iColData < taosArrayGetSize(pBlockData->aIdx)) {
    SColData *pColData = tBlockDataGetColDataByIdx(pBlockData, iColData);

    // Skip row values that belong to columns the block does not carry.
    while (pVal && pVal->cid < pColData->cid) {
      pVal = tRowIterNext(&rowIter);
    }

    if (pVal != NULL && pVal->cid <= pColData->cid) {
      code = tColDataAppendValue(pColData, pVal);
      if (code) return code;
      pVal = tRowIterNext(&rowIter);
    } else {
      // The row has nothing for this column.
      code = tColDataAppendValue(pColData, &COL_VAL_NONE(pColData->cid, pColData->type));
      if (code) return code;
    }

    iColData++;
  }

  pBlockData->nRow++;
  return code;
}
H
Hongze Cheng 已提交
1093

H
Hongze Cheng 已提交
1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112
// Makes sure every column of pBlockDataFrom also exists in pBlockData.
//
// Both column lists are walked in step by column id. A column of
// pBlockDataFrom that pBlockData lacks is inserted at the matching position,
// initialized with the source column's cid / type / smaOn, and padded with one
// NONE value per existing row. Columns that exist only in pBlockData are left
// as they are.
//
// Returns 0, or the first error from tBlockDataAddColData() /
// tColDataAppendValue().
int32_t tBlockDataCorrectSchema(SBlockData *pBlockData, SBlockData *pBlockDataFrom) {
  int32_t iColData = 0;  // cursor into pBlockData's columns, never moves backwards

  for (int32_t iColDataFrom = 0; iColDataFrom < taosArrayGetSize(pBlockDataFrom->aIdx); iColDataFrom++) {
    SColData *pWanted = tBlockDataGetColDataByIdx(pBlockDataFrom, iColDataFrom);

    // Step over destination columns that sort before the wanted one.
    while (iColData < taosArrayGetSize(pBlockData->aIdx) &&
           tBlockDataGetColDataByIdx(pBlockData, iColData)->cid < pWanted->cid) {
      iColData++;
    }

    bool present = iColData < taosArrayGetSize(pBlockData->aIdx) &&
                   tBlockDataGetColDataByIdx(pBlockData, iColData)->cid == pWanted->cid;

    if (!present) {
      SColData *pAdded;
      int32_t   code = tBlockDataAddColData(pBlockData, iColData, &pAdded);
      if (code) return code;

      tColDataInit(pAdded, pWanted->cid, pWanted->type, pWanted->smaOn);

      // Back-fill the new column so it has as many values as the block has rows.
      for (int32_t iRow = 0; iRow < pBlockData->nRow; iRow++) {
        code = tColDataAppendValue(pAdded, &COL_VAL_NONE(pAdded->cid, pAdded->type));
        if (code) return code;
      }
    }

    // Move past the column that now matches pWanted.
    iColData++;
  }

  return 0;
}

H
Hongze Cheng 已提交
1134 1135 1136
int32_t tBlockDataMerge(SBlockData *pBlockData1, SBlockData *pBlockData2, SBlockData *pBlockData) {
  int32_t code = 0;

H
Hongze Cheng 已提交
1137 1138 1139 1140
  ASSERT(pBlockData->suid == pBlockData1->suid);
  ASSERT(pBlockData->uid == pBlockData1->uid);
  ASSERT(pBlockData1->nRow > 0);
  ASSERT(pBlockData2->nRow > 0);
H
Hongze Cheng 已提交
1141

H
Hongze Cheng 已提交
1142
  tBlockDataClear(pBlockData);
H
Hongze Cheng 已提交
1143

H
Hongze Cheng 已提交
1144 1145 1146 1147
  TSDBROW  row1 = tsdbRowFromBlockData(pBlockData1, 0);
  TSDBROW  row2 = tsdbRowFromBlockData(pBlockData2, 0);
  TSDBROW *pRow1 = &row1;
  TSDBROW *pRow2 = &row2;
H
Hongze Cheng 已提交
1148

H
Hongze Cheng 已提交
1149 1150
  while (pRow1 && pRow2) {
    int32_t c = tsdbRowCmprFn(pRow1, pRow2);
H
Hongze Cheng 已提交
1151 1152

    if (c < 0) {
H
Hongze Cheng 已提交
1153 1154
      code = tBlockDataAppendRow(pBlockData, pRow1, NULL,
                                 pBlockData1->uid ? pBlockData1->uid : pBlockData1->aUid[pRow1->iRow]);
H
Hongze Cheng 已提交
1155
      if (code) goto _exit;
H
Hongze Cheng 已提交
1156 1157 1158 1159 1160 1161 1162

      pRow1->iRow++;
      if (pRow1->iRow < pBlockData1->nRow) {
        *pRow1 = tsdbRowFromBlockData(pBlockData1, pRow1->iRow);
      } else {
        pRow1 = NULL;
      }
H
Hongze Cheng 已提交
1163
    } else if (c > 0) {
H
Hongze Cheng 已提交
1164 1165
      code = tBlockDataAppendRow(pBlockData, pRow2, NULL,
                                 pBlockData2->uid ? pBlockData2->uid : pBlockData2->aUid[pRow2->iRow]);
H
Hongze Cheng 已提交
1166
      if (code) goto _exit;
H
Hongze Cheng 已提交
1167 1168 1169 1170 1171 1172 1173

      pRow2->iRow++;
      if (pRow2->iRow < pBlockData2->nRow) {
        *pRow2 = tsdbRowFromBlockData(pBlockData2, pRow2->iRow);
      } else {
        pRow2 = NULL;
      }
H
Hongze Cheng 已提交
1174 1175 1176 1177 1178
    } else {
      ASSERT(0);
    }
  }

H
Hongze Cheng 已提交
1179 1180 1181
  while (pRow1) {
    code = tBlockDataAppendRow(pBlockData, pRow1, NULL,
                               pBlockData1->uid ? pBlockData1->uid : pBlockData1->aUid[pRow1->iRow]);
H
Hongze Cheng 已提交
1182
    if (code) goto _exit;
H
Hongze Cheng 已提交
1183 1184 1185 1186 1187 1188 1189

    pRow1->iRow++;
    if (pRow1->iRow < pBlockData1->nRow) {
      *pRow1 = tsdbRowFromBlockData(pBlockData1, pRow1->iRow);
    } else {
      pRow1 = NULL;
    }
H
Hongze Cheng 已提交
1190 1191
  }

H
Hongze Cheng 已提交
1192 1193 1194
  while (pRow2) {
    code = tBlockDataAppendRow(pBlockData, pRow2, NULL,
                               pBlockData2->uid ? pBlockData2->uid : pBlockData2->aUid[pRow2->iRow]);
H
Hongze Cheng 已提交
1195
    if (code) goto _exit;
H
Hongze Cheng 已提交
1196 1197 1198 1199 1200 1201 1202

    pRow2->iRow++;
    if (pRow2->iRow < pBlockData2->nRow) {
      *pRow2 = tsdbRowFromBlockData(pBlockData2, pRow2->iRow);
    } else {
      pRow2 = NULL;
    }
H
Hongze Cheng 已提交
1203 1204 1205 1206 1207 1208
  }

_exit:
  return code;
}

H
Hongze Cheng 已提交
1209 1210 1211 1212 1213 1214 1215 1216
// Copies all rows of pSrc into pDest.
//
// pDest is cleared first. It must already have the same suid, uid and number
// of active columns as pSrc, and each column pair must agree on cid and type
// (all asserted). The uid array is copied only when pSrc->uid is 0; version
// and timestamp arrays are always copied, followed by every column via
// tColDataCopy().
//
// Returns 0, or the first error from tRealloc() / tColDataCopy().
int32_t tBlockDataCopy(SBlockData *pSrc, SBlockData *pDest) {
  int32_t code;

  tBlockDataClear(pDest);

  ASSERT(pDest->suid == pSrc->suid);
  ASSERT(pDest->uid == pSrc->uid);
  ASSERT(taosArrayGetSize(pSrc->aIdx) == taosArrayGetSize(pDest->aIdx));

  pDest->nRow = pSrc->nRow;

  // per-row uid, present only for blocks without a block-level uid
  if (pSrc->uid == 0) {
    code = tRealloc((uint8_t **)&pDest->aUid, sizeof(int64_t) * pDest->nRow);
    if (code) return code;
    memcpy(pDest->aUid, pSrc->aUid, sizeof(int64_t) * pDest->nRow);
  }

  // version
  code = tRealloc((uint8_t **)&pDest->aVersion, sizeof(int64_t) * pDest->nRow);
  if (code) return code;
  memcpy(pDest->aVersion, pSrc->aVersion, sizeof(int64_t) * pDest->nRow);

  // timestamp
  code = tRealloc((uint8_t **)&pDest->aTSKEY, sizeof(TSKEY) * pDest->nRow);
  if (code) return code;
  memcpy(pDest->aTSKEY, pSrc->aTSKEY, sizeof(TSKEY) * pDest->nRow);

  // columns
  int32_t iColData = 0;
  while (iColData < taosArrayGetSize(pSrc->aIdx)) {
    SColData *pFrom = tBlockDataGetColDataByIdx(pSrc, iColData);
    SColData *pTo = tBlockDataGetColDataByIdx(pDest, iColData);

    ASSERT(pFrom->cid == pTo->cid);
    ASSERT(pFrom->type == pTo->type);

    code = tColDataCopy(pFrom, pTo);
    if (code) return code;

    iColData++;
  }

  return 0;
}
H
Hongze Cheng 已提交
1248

H
Hongze Cheng 已提交
1249 1250 1251 1252 1253
// Returns the idx-th active column of pBlockData. aIdx[idx] holds the position
// of that column inside aColData. idx must be within [0, number of active
// columns); this is asserted.
SColData *tBlockDataGetColDataByIdx(SBlockData *pBlockData, int32_t idx) {
  ASSERT(idx >= 0 && idx < taosArrayGetSize(pBlockData->aIdx));

  int32_t *pSlot = (int32_t *)taosArrayGet(pBlockData->aIdx, idx);
  return (SColData *)taosArrayGet(pBlockData->aColData, *pSlot);
}

H
Hongze Cheng 已提交
1254 1255
// Looks up the active column with column id `cid` by binary search over the
// active columns (which therefore must be ordered by ascending cid).
// *ppColData receives the column, or NULL when no column has that id.
// cid must not be PRIMARYKEY_TIMESTAMP_COL_ID (asserted).
void tBlockDataGetColData(SBlockData *pBlockData, int16_t cid, SColData **ppColData) {
  ASSERT(cid != PRIMARYKEY_TIMESTAMP_COL_ID);

  SColData *pFound = NULL;
  int32_t   lo = 0;
  int32_t   hi = taosArrayGetSize(pBlockData->aIdx) - 1;

  while (lo <= hi && pFound == NULL) {
    int32_t   mid = (lo + hi) / 2;
    SColData *pProbe = tBlockDataGetColDataByIdx(pBlockData, mid);

    if (pProbe->cid < cid) {
      lo = mid + 1;
    } else if (pProbe->cid > cid) {
      hi = mid - 1;
    } else {
      pFound = pProbe;
    }
  }

  *ppColData = pFound;
}

H
Hongze Cheng 已提交
1277 1278
// Encodes pBlockData with compression algorithm cmprAlg into four pieces held
// in the caller's buffers, and optionally concatenates them into *ppOut.
//
//   aBuf[0] / aBufN[0]  compressed column payloads
//   aBuf[1] / aBufN[1]  encoded SBlockCol descriptors
//   aBuf[2] / aBufN[2]  compressed uid (only when the block uid is 0),
//                       version and timestamp arrays, in that order
//   aBuf[3] / aBufN[3]  encoded SDiskDataHdr
//
// While the columns are being compressed aBuf[2] doubles as the scratch buffer
// handed to tsdbCmprColData(), and aBuf[3] is the scratch buffer handed to
// tsdbCmprData() before the header is finally written into it.
//
// Columns whose flag is HAS_NONE are omitted entirely; columns whose flag is
// HAS_NULL get a descriptor but no payload.
//
// When ppOut is non-NULL, *ppOut is resized and filled with
// header + keys + descriptors + payloads and *szOut receives the total size.
//
// Returns 0, or the first error reported by a helper.
int32_t tCmprBlockData(SBlockData *pBlockData, int8_t cmprAlg, uint8_t **ppOut, int32_t *szOut, uint8_t *aBuf[],
                       int32_t aBufN[]) {
  int32_t      code = 0;
  SDiskDataHdr hdr = {.delimiter = TSDB_FILE_DLMT,
                      .fmtVer = 0,
                      .suid = pBlockData->suid,
                      .uid = pBlockData->uid,
                      .nRow = pBlockData->nRow,
                      .cmprAlg = cmprAlg};

  // ---- column payloads and their SBlockCol descriptors
  aBufN[0] = 0;
  for (int32_t iCol = 0; iCol < taosArrayGetSize(pBlockData->aIdx); iCol++) {
    SColData *pCol = tBlockDataGetColDataByIdx(pBlockData, iCol);

    ASSERT(pCol->flag);
    if (pCol->flag == HAS_NONE) continue;

    SBlockCol blockCol = {.cid = pCol->cid,
                          .type = pCol->type,
                          .smaOn = pCol->smaOn,
                          .flag = pCol->flag,
                          .szOrigin = pCol->nData};

    if (pCol->flag != HAS_NULL) {
      code = tsdbCmprColData(pCol, cmprAlg, &blockCol, &aBuf[0], aBufN[0], &aBuf[2]);
      if (code) return code;

      // The payload was written at the current end of aBuf[0].
      blockCol.offset = aBufN[0];
      aBufN[0] += blockCol.szBitmap + blockCol.szOffset + blockCol.szValue;
    }

    int32_t szDesc = tPutBlockCol(NULL, &blockCol);
    code = tRealloc(&aBuf[1], hdr.szBlkCol + szDesc);
    if (code) return code;
    hdr.szBlkCol += tPutBlockCol(aBuf[1] + hdr.szBlkCol, &blockCol);
  }
  aBufN[1] = hdr.szBlkCol;

  // ---- uid + version + tskey
  aBufN[2] = 0;
  if (pBlockData->uid == 0) {
    code = tsdbCmprData((uint8_t *)pBlockData->aUid, sizeof(int64_t) * pBlockData->nRow, TSDB_DATA_TYPE_BIGINT, cmprAlg,
                        &aBuf[2], aBufN[2], &hdr.szUid, &aBuf[3]);
    if (code) return code;
  }
  aBufN[2] += hdr.szUid;

  code = tsdbCmprData((uint8_t *)pBlockData->aVersion, sizeof(int64_t) * pBlockData->nRow, TSDB_DATA_TYPE_BIGINT,
                      cmprAlg, &aBuf[2], aBufN[2], &hdr.szVer, &aBuf[3]);
  if (code) return code;
  aBufN[2] += hdr.szVer;

  code = tsdbCmprData((uint8_t *)pBlockData->aTSKEY, sizeof(TSKEY) * pBlockData->nRow, TSDB_DATA_TYPE_TIMESTAMP,
                      cmprAlg, &aBuf[2], aBufN[2], &hdr.szKey, &aBuf[3]);
  if (code) return code;
  aBufN[2] += hdr.szKey;

  // ---- header (written last because it records the sizes computed above)
  aBufN[3] = tPutDiskDataHdr(NULL, &hdr);
  code = tRealloc(&aBuf[3], aBufN[3]);
  if (code) return code;
  tPutDiskDataHdr(aBuf[3], &hdr);

  // ---- optional single-buffer output
  if (ppOut) {
    *szOut = aBufN[0] + aBufN[1] + aBufN[2] + aBufN[3];
    code = tRealloc(ppOut, *szOut);
    if (code) return code;

    uint8_t *pDst = *ppOut;

    memcpy(pDst, aBuf[3], aBufN[3]);
    pDst += aBufN[3];

    memcpy(pDst, aBuf[2], aBufN[2]);
    pDst += aBufN[2];

    if (aBufN[1]) {
      memcpy(pDst, aBuf[1], aBufN[1]);
      pDst += aBufN[1];
    }

    if (aBufN[0]) {
      memcpy(pDst, aBuf[0], aBufN[0]);
    }
  }

  return code;
}

H
Hongze Cheng 已提交
1365
// Decodes a block from pIn into pBlockData (which is reset first).
//
// The input is read in this order: SDiskDataHdr, compressed uid array (present
// only when hdr.uid is 0), compressed version array, compressed timestamp
// array, hdr.szBlkCol bytes of SBlockCol descriptors, then the column
// payloads, each located at its descriptor's offset past the descriptors.
// A column whose descriptor flag is HAS_NULL has no payload and is rebuilt as
// hdr.nRow NULL values.
//
// aBuf[0] is passed to the decompression helpers as their scratch buffer.
// szIn is not consulted by this function.
//
// Returns 0, or the first error reported by a helper.
int32_t tDecmprBlockData(uint8_t *pIn, int32_t szIn, SBlockData *pBlockData, uint8_t *aBuf[]) {
  int32_t code = 0;

  tBlockDataReset(pBlockData);

  // SDiskDataHdr
  SDiskDataHdr hdr = {0};
  uint8_t     *pCur = pIn;

  pCur += tGetDiskDataHdr(pCur, &hdr);
  ASSERT(hdr.delimiter == TSDB_FILE_DLMT);

  pBlockData->suid = hdr.suid;
  pBlockData->uid = hdr.uid;
  pBlockData->nRow = hdr.nRow;

  // uid
  if (hdr.uid != 0) {
    ASSERT(!hdr.szUid);
  } else {
    ASSERT(hdr.szUid);
    code = tsdbDecmprData(pCur, hdr.szUid, TSDB_DATA_TYPE_BIGINT, hdr.cmprAlg, (uint8_t **)&pBlockData->aUid,
                          sizeof(int64_t) * hdr.nRow, &aBuf[0]);
    if (code) return code;
  }
  pCur += hdr.szUid;

  // version
  code = tsdbDecmprData(pCur, hdr.szVer, TSDB_DATA_TYPE_BIGINT, hdr.cmprAlg, (uint8_t **)&pBlockData->aVersion,
                        sizeof(int64_t) * hdr.nRow, &aBuf[0]);
  if (code) return code;
  pCur += hdr.szVer;

  // TSKEY
  code = tsdbDecmprData(pCur, hdr.szKey, TSDB_DATA_TYPE_TIMESTAMP, hdr.cmprAlg, (uint8_t **)&pBlockData->aTSKEY,
                        sizeof(TSKEY) * hdr.nRow, &aBuf[0]);
  if (code) return code;
  pCur += hdr.szKey;

  // columns: pCur now points at the first SBlockCol descriptor
  if (hdr.szBlkCol == 0) return code;

  for (int32_t nRead = 0; nRead < hdr.szBlkCol;) {
    SBlockCol blockCol = {0};
    nRead += tGetBlockCol(pCur + nRead, &blockCol);
    ASSERT(nRead <= hdr.szBlkCol);

    // Append the column after the ones decoded so far.
    SColData *pColData;
    code = tBlockDataAddColData(pBlockData, taosArrayGetSize(pBlockData->aIdx), &pColData);
    if (code) return code;

    tColDataInit(pColData, blockCol.cid, blockCol.type, blockCol.smaOn);

    if (blockCol.flag != HAS_NULL) {
      code = tsdbDecmprColData(pCur + hdr.szBlkCol + blockCol.offset, &blockCol, hdr.cmprAlg, hdr.nRow, pColData,
                               &aBuf[0]);
      if (code) return code;
    } else {
      for (int32_t iRow = 0; iRow < hdr.nRow; iRow++) {
        code = tColDataAppendValue(pColData, &COL_VAL_NULL(blockCol.cid, blockCol.type));
        if (code) return code;
      }
    }
  }

  return code;
}

H
Hongze Cheng 已提交
1434 1435 1436 1437 1438 1439
// SDiskDataHdr ==============================
int32_t tPutDiskDataHdr(uint8_t *p, void *ph) {
  int32_t       n = 0;
  SDiskDataHdr *pHdr = (SDiskDataHdr *)ph;

  n += tPutU32(p ? p + n : p, pHdr->delimiter);
H
Hongze Cheng 已提交
1440
  n += tPutU32v(p ? p + n : p, pHdr->fmtVer);
H
Hongze Cheng 已提交
1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457
  n += tPutI64(p ? p + n : p, pHdr->suid);
  n += tPutI64(p ? p + n : p, pHdr->uid);
  n += tPutI32v(p ? p + n : p, pHdr->szUid);
  n += tPutI32v(p ? p + n : p, pHdr->szVer);
  n += tPutI32v(p ? p + n : p, pHdr->szKey);
  n += tPutI32v(p ? p + n : p, pHdr->szBlkCol);
  n += tPutI32v(p ? p + n : p, pHdr->nRow);
  n += tPutI8(p ? p + n : p, pHdr->cmprAlg);

  return n;
}

int32_t tGetDiskDataHdr(uint8_t *p, void *ph) {
  int32_t       n = 0;
  SDiskDataHdr *pHdr = (SDiskDataHdr *)ph;

  n += tGetU32(p + n, &pHdr->delimiter);
H
Hongze Cheng 已提交
1458
  n += tGetU32v(p + n, &pHdr->fmtVer);
H
Hongze Cheng 已提交
1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470
  n += tGetI64(p + n, &pHdr->suid);
  n += tGetI64(p + n, &pHdr->uid);
  n += tGetI32v(p + n, &pHdr->szUid);
  n += tGetI32v(p + n, &pHdr->szVer);
  n += tGetI32v(p + n, &pHdr->szKey);
  n += tGetI32v(p + n, &pHdr->szBlkCol);
  n += tGetI32v(p + n, &pHdr->nRow);
  n += tGetI8(p + n, &pHdr->cmprAlg);

  return n;
}

H
Hongze Cheng 已提交
1471
// ALGORITHM ==============================
H
Hongze Cheng 已提交
1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495
// Encodes *pColAgg at p and returns the encoded size in bytes. With p == NULL
// nothing is written and only the size is computed.
// Field order: colId, numOfNull, sum, max, min.
int32_t tPutColumnDataAgg(uint8_t *p, SColumnDataAgg *pColAgg) {
  int32_t nBytes = 0;

  nBytes += tPutI16v(p ? p + nBytes : NULL, pColAgg->colId);
  nBytes += tPutI16v(p ? p + nBytes : NULL, pColAgg->numOfNull);
  nBytes += tPutI64(p ? p + nBytes : NULL, pColAgg->sum);
  nBytes += tPutI64(p ? p + nBytes : NULL, pColAgg->max);
  nBytes += tPutI64(p ? p + nBytes : NULL, pColAgg->min);

  return nBytes;
}

// Decodes a SColumnDataAgg from p into *pColAgg and returns the number of
// bytes consumed. Fields are read in the order tPutColumnDataAgg() writes them.
int32_t tGetColumnDataAgg(uint8_t *p, SColumnDataAgg *pColAgg) {
  uint8_t *pCur = p;

  pCur += tGetI16v(pCur, &pColAgg->colId);
  pCur += tGetI16v(pCur, &pColAgg->numOfNull);
  pCur += tGetI64(pCur, &pColAgg->sum);
  pCur += tGetI64(pCur, &pColAgg->max);
  pCur += tGetI64(pCur, &pColAgg->min);

  return (int32_t)(pCur - p);
}

H
Hongze Cheng 已提交
1496 1497 1498 1499
// Folds a value that fits a signed 64-bit integer into the running min / max
// of pColAgg. *pMinSet / *pMaxSet record whether min / max hold a real sample.
static void tsdbSmaMinMaxI64(SColumnDataAgg *pColAgg, int64_t val, bool *pMinSet, bool *pMaxSet) {
  if (!*pMinSet || pColAgg->min > val) {
    pColAgg->min = val;
    *pMinSet = true;
  }
  if (!*pMaxSet || pColAgg->max < val) {
    pColAgg->max = val;
    *pMaxSet = true;
  }
}

// Same as tsdbSmaMinMaxI64() for an unsigned 64-bit value: comparisons are
// done as unsigned, and the result is stored in the int64_t min / max fields.
static void tsdbSmaMinMaxU64(SColumnDataAgg *pColAgg, uint64_t val, bool *pMinSet, bool *pMaxSet) {
  if (!*pMinSet || (uint64_t)pColAgg->min > val) {
    pColAgg->min = (int64_t)val;
    *pMinSet = true;
  }
  if (!*pMaxSet || (uint64_t)pColAgg->max < val) {
    pColAgg->max = (int64_t)val;
    *pMaxSet = true;
  }
}

// Folds a floating-point value into sum / min / max. For FLOAT and DOUBLE
// columns those three fields hold the bit pattern of a double; memcpy is used
// to move the bits in and out so the access does not break strict aliasing.
static void tsdbSmaAccumDouble(SColumnDataAgg *pColAgg, double val, bool *pMinSet, bool *pMaxSet) {
  double sum;
  double min;
  double max;

  memcpy(&sum, &pColAgg->sum, sizeof(sum));
  memcpy(&min, &pColAgg->min, sizeof(min));
  memcpy(&max, &pColAgg->max, sizeof(max));

  sum += val;
  if (!*pMinSet || min > val) {
    min = val;
    *pMinSet = true;
  }
  if (!*pMaxSet || max < val) {
    max = val;
    *pMaxSet = true;
  }

  memcpy(&pColAgg->sum, &sum, sizeof(sum));
  memcpy(&pColAgg->min, &min, sizeof(min));
  memcpy(&pColAgg->max, &max, sizeof(max));
}

// Computes the per-column aggregate (SMA) of pColData into pColAgg.
//
//   colId      the column's cid
//   numOfNull  number of values that are NONE or NULL
//   sum        sum of the remaining values (integer and floating-point types;
//              not maintained for TIMESTAMP)
//   min / max  smallest / largest remaining value
//
// For FLOAT and DOUBLE columns sum / min / max carry the bits of a double.
// Types without numeric aggregates (NULL, BOOL, VARCHAR, NCHAR, JSON,
// VARBINARY, DECIMAL, BLOB, MEDIUMBLOB) only contribute to numOfNull.
// An unknown type trips ASSERT(0).
void tsdbCalcColDataSMA(SColData *pColData, SColumnDataAgg *pColAgg) {
  SColVal colVal;
  bool    minAssigned = false;
  bool    maxAssigned = false;

  // memset followed by a field store (rather than a struct assignment) also
  // zeroes any padding bytes the struct may contain.
  memset(pColAgg, 0, sizeof(*pColAgg));
  pColAgg->colId = pColData->cid;

  for (int32_t iVal = 0; iVal < pColData->nVal; iVal++) {
    tColDataGetValue(pColData, iVal, &colVal);

    if (colVal.isNone || colVal.isNull) {
      pColAgg->numOfNull++;
      continue;
    }

    switch (pColData->type) {
      case TSDB_DATA_TYPE_TINYINT:
        pColAgg->sum += colVal.value.i8;
        tsdbSmaMinMaxI64(pColAgg, colVal.value.i8, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_SMALLINT:
        pColAgg->sum += colVal.value.i16;
        tsdbSmaMinMaxI64(pColAgg, colVal.value.i16, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_INT:
        pColAgg->sum += colVal.value.i32;
        tsdbSmaMinMaxI64(pColAgg, colVal.value.i32, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_BIGINT:
        pColAgg->sum += colVal.value.i64;
        tsdbSmaMinMaxI64(pColAgg, colVal.value.i64, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_TIMESTAMP:
        // min / max only: timestamps are not summed
        tsdbSmaMinMaxI64(pColAgg, colVal.value.i64, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_UTINYINT:
        pColAgg->sum += colVal.value.u8;
        tsdbSmaMinMaxI64(pColAgg, colVal.value.u8, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_USMALLINT:
        pColAgg->sum += colVal.value.u16;
        tsdbSmaMinMaxI64(pColAgg, colVal.value.u16, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_UINT:
        // The max update here used to be guarded by !minAssigned by mistake.
        pColAgg->sum += colVal.value.u32;
        tsdbSmaMinMaxI64(pColAgg, colVal.value.u32, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_UBIGINT:
        pColAgg->sum += colVal.value.u64;
        tsdbSmaMinMaxU64(pColAgg, colVal.value.u64, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_FLOAT:
        tsdbSmaAccumDouble(pColAgg, colVal.value.f, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_DOUBLE:
        tsdbSmaAccumDouble(pColAgg, colVal.value.d, &minAssigned, &maxAssigned);
        break;
      case TSDB_DATA_TYPE_NULL:
      case TSDB_DATA_TYPE_BOOL:
      case TSDB_DATA_TYPE_VARCHAR:
      case TSDB_DATA_TYPE_NCHAR:
      case TSDB_DATA_TYPE_JSON:
      case TSDB_DATA_TYPE_VARBINARY:
      case TSDB_DATA_TYPE_DECIMAL:
      case TSDB_DATA_TYPE_BLOB:
      case TSDB_DATA_TYPE_MEDIUMBLOB:
        // no numeric aggregate for these types
        break;
      default:
        ASSERT(0);
    }
  }
}
H
Hongze Cheng 已提交
1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703

// Compresses szIn bytes at pIn (elements of data type `type`) and appends the
// result to *ppOut starting at byte offset nOut; *ppOut is grown as needed.
// *szOut receives the number of bytes appended.
//
//   NO_COMPRESSION  the input is copied verbatim
//   otherwise       the type's compFunc is used, with room for
//                   szIn + COMP_OVERFLOW_BYTES bytes of output
//
// ppBuf supplies a scratch buffer. It is mandatory (asserted) and resized only
// for TWO_STAGE_COMP; for other algorithms it may be NULL, in which case a NULL
// scratch pointer is passed to compFunc.
//
// szIn must be positive and ppOut non-NULL (asserted).
// Returns 0, a tRealloc() error, or TSDB_CODE_COMPRESS_ERROR when compFunc
// reports a non-positive size.
int32_t tsdbCmprData(uint8_t *pIn, int32_t szIn, int8_t type, int8_t cmprAlg, uint8_t **ppOut, int32_t nOut,
                     int32_t *szOut, uint8_t **ppBuf) {
  int32_t code = 0;

  ASSERT(szIn > 0 && ppOut);

  if (cmprAlg == NO_COMPRESSION) {
    code = tRealloc(ppOut, nOut + szIn);
    if (code) goto _exit;

    memcpy(*ppOut + nOut, pIn, szIn);
    *szOut = szIn;
  } else {
    int32_t size = szIn + COMP_OVERFLOW_BYTES;

    code = tRealloc(ppOut, nOut + size);
    if (code) goto _exit;

    if (cmprAlg == TWO_STAGE_COMP) {
      ASSERT(ppBuf);
      code = tRealloc(ppBuf, size);
      if (code) goto _exit;
    }

    // ppBuf is only guaranteed for TWO_STAGE_COMP, so do not dereference it blindly.
    uint8_t *pScratch = ppBuf ? *ppBuf : NULL;

    *szOut = tDataTypes[type].compFunc(pIn, szIn, szIn / tDataTypes[type].bytes, *ppOut + nOut, size, cmprAlg,
                                       pScratch, size);
    if (*szOut <= 0) {
      code = TSDB_CODE_COMPRESS_ERROR;
      goto _exit;
    }
  }

_exit:
  return code;
}

H
Hongze Cheng 已提交
1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733
/**
 * Decompress a buffer (or copy it verbatim) into *ppOut.
 *
 * @param pIn     compressed input bytes
 * @param szIn    number of input bytes
 * @param type    data type; used as an index into tDataTypes[] to pick the decompressor
 * @param cmprAlg NO_COMPRESSION copies the input; any other value runs tDataTypes[type].decompFunc
 * @param ppOut   output buffer; resized with tRealloc to szOut bytes
 * @param szOut   expected size of the decompressed data in bytes
 * @param ppBuf   scratch buffer; must be non-NULL for TWO_STAGE_COMP, may be NULL otherwise
 * @return 0 on success, the tRealloc error code, or TSDB_CODE_COMPRESS_ERROR when the
 *         decompressor reports a size <= 0
 */
int32_t tsdbDecmprData(uint8_t *pIn, int32_t szIn, int8_t type, int8_t cmprAlg, uint8_t **ppOut, int32_t szOut,
                       uint8_t **ppBuf) {
  int32_t code = 0;

  code = tRealloc(ppOut, szOut);
  if (code) goto _exit;

  if (cmprAlg == NO_COMPRESSION) {
    ASSERT(szIn == szOut);
    memcpy(*ppOut, pIn, szOut);
  } else {
    if (cmprAlg == TWO_STAGE_COMP) {
      // Same precondition tsdbCmprData checks before resizing the scratch buffer.
      ASSERT(ppBuf);
      code = tRealloc(ppBuf, szOut + COMP_OVERFLOW_BYTES);
      if (code) goto _exit;
    }

    // The scratch buffer is only resized for TWO_STAGE_COMP; tolerate a NULL ppBuf for
    // the other algorithms rather than dereferencing it unconditionally.
    uint8_t *pBuf = ppBuf ? *ppBuf : NULL;

    int32_t size = tDataTypes[type].decompFunc(pIn, szIn, szOut / tDataTypes[type].bytes, *ppOut, szOut, cmprAlg,
                                               pBuf, szOut + COMP_OVERFLOW_BYTES);
    if (size <= 0) {
      code = TSDB_CODE_COMPRESS_ERROR;
      goto _exit;
    }

    ASSERT(size == szOut);
  }

_exit:
  return code;
}

H
Hongze Cheng 已提交
1734
/**
 * Compress the sections of one column (bitmap, offsets, values) back to back into
 * *ppOut starting at offset nOut, recording each section's compressed size in pBlockCol.
 *
 * Sections are written in the order bitmap -> offset -> value. A section that is not
 * written keeps a recorded size of 0.
 *
 * @param pColData  column to compress; its flag must be non-zero and neither HAS_NONE nor HAS_NULL
 * @param cmprAlg   compression algorithm forwarded to tsdbCmprData
 * @param pBlockCol receives szBitmap, szOffset and szValue
 * @param ppOut     output buffer, forwarded to tsdbCmprData
 * @param nOut      offset in *ppOut at which the first section is written
 * @param ppBuf     scratch buffer, forwarded to tsdbCmprData
 * @return 0 on success, otherwise the first non-zero code returned by tsdbCmprData
 */
int32_t tsdbCmprColData(SColData *pColData, int8_t cmprAlg, SBlockCol *pBlockCol, uint8_t **ppOut, int32_t nOut,
                        uint8_t **ppBuf) {
  int32_t code = 0;
  int32_t nWritten = 0;  // bytes emitted after nOut by the sections handled so far

  ASSERT(pColData->flag && (pColData->flag != HAS_NONE) && (pColData->flag != HAS_NULL));

  pBlockCol->szBitmap = 0;
  pBlockCol->szOffset = 0;
  pBlockCol->szValue = 0;

  // bitmap section: present unless every row carries a value
  if (pColData->flag != HAS_VALUE) {
    int32_t szBitMap = (pColData->flag == (HAS_VALUE | HAS_NULL | HAS_NONE)) ? (BIT2_SIZE(pColData->nVal))
                                                                             : (BIT1_SIZE(pColData->nVal));

    code = tsdbCmprData(pColData->pBitMap, szBitMap, TSDB_DATA_TYPE_TINYINT, cmprAlg, ppOut, nOut + nWritten,
                        &pBlockCol->szBitmap, ppBuf);
    if (code) return code;
  }
  nWritten += pBlockCol->szBitmap;

  // offset section: only for variable-length types, one int32_t per row
  if (IS_VAR_DATA_TYPE(pColData->type)) {
    code = tsdbCmprData((uint8_t *)pColData->aOffset, sizeof(int32_t) * pColData->nVal, TSDB_DATA_TYPE_INT, cmprAlg,
                        ppOut, nOut + nWritten, &pBlockCol->szOffset, ppBuf);
    if (code) return code;
  }
  nWritten += pBlockCol->szOffset;

  // value section: skipped when the flag is exactly HAS_NULL | HAS_NONE or there is no data
  if ((pColData->flag != (HAS_NULL | HAS_NONE)) && pColData->nData) {
    code = tsdbCmprData((uint8_t *)pColData->pData, pColData->nData, pColData->type, cmprAlg, ppOut, nOut + nWritten,
                        &pBlockCol->szValue, ppBuf);
  }

  return code;
}
H
Hongze Cheng 已提交
1779 1780 1781 1782 1783

/**
 * Decompress one column from pIn into pColData, reading the sections in the order
 * bitmap -> offset -> value with the compressed sizes recorded in pBlockCol.
 *
 * Before decompressing, smaOn and flag are copied from pBlockCol, nVal is set from the
 * argument, and nData is set to pBlockCol->szOrigin (used as the decompressed size of
 * the value section). A section whose recorded size is 0 is skipped.
 *
 * @param pIn       start of the compressed column data
 * @param pBlockCol column descriptor; its cid and type are asserted to match pColData
 * @param cmprAlg   compression algorithm forwarded to tsdbDecmprData
 * @param nVal      number of rows in the column
 * @param pColData  destination column; pBitMap, aOffset and pData are filled via tsdbDecmprData
 * @param ppBuf     scratch buffer, forwarded to tsdbDecmprData
 * @return 0 on success, otherwise the first non-zero code returned by tsdbDecmprData
 */
int32_t tsdbDecmprColData(uint8_t *pIn, SBlockCol *pBlockCol, int8_t cmprAlg, int32_t nVal, SColData *pColData,
                          uint8_t **ppBuf) {
  int32_t code = 0;

  ASSERT(pColData->cid == pBlockCol->cid);
  ASSERT(pColData->type == pBlockCol->type);

  pColData->smaOn = pBlockCol->smaOn;
  pColData->flag = pBlockCol->flag;
  pColData->nVal = nVal;
  pColData->nData = pBlockCol->szOrigin;

  uint8_t *pCursor = pIn;  // start of the next compressed section

  // bitmap section
  if (pBlockCol->szBitmap) {
    int32_t szBitMap = (pColData->flag == (HAS_VALUE | HAS_NULL | HAS_NONE)) ? (BIT2_SIZE(pColData->nVal))
                                                                             : (BIT1_SIZE(pColData->nVal));

    code = tsdbDecmprData(pCursor, pBlockCol->szBitmap, TSDB_DATA_TYPE_TINYINT, cmprAlg, &pColData->pBitMap, szBitMap,
                          ppBuf);
    if (code) return code;
  }
  pCursor += pBlockCol->szBitmap;

  // offset section: one int32_t per row
  if (pBlockCol->szOffset) {
    code = tsdbDecmprData(pCursor, pBlockCol->szOffset, TSDB_DATA_TYPE_INT, cmprAlg, (uint8_t **)&pColData->aOffset,
                          sizeof(int32_t) * pColData->nVal, ppBuf);
    if (code) return code;
  }
  pCursor += pBlockCol->szOffset;

  // value section
  if (pBlockCol->szValue) {
    code = tsdbDecmprData(pCursor, pBlockCol->szValue, pColData->type, cmprAlg, &pColData->pData, pColData->nData,
                          ppBuf);
  }

  return code;
}