tdatablock.c 46.0 KB
Newer Older
S
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#define _DEFAULT_SOURCE
H
Haojun Liao 已提交
17
#include "tdatablock.h"
S
compare  
Shengliang Guan 已提交
18
#include "tcompare.h"
19
#include "tglobal.h"
20
#include "tlog.h"
21

L
Liu Jicong 已提交
22
/**
 * Split an endpoint string of the form "fqdn[:port]" into FQDN and port.
 *
 * The string is copied into pEp->fqdn and cut at the first ':'; the text
 * after the ':' is parsed with atoi() as the port. When no port is present,
 * or it parses as 0, the global tsServerPort is used instead.
 *
 * @param ep   endpoint string to parse.
 * @param pEp  output endpoint; its fqdn and port fields are overwritten.
 * @return always 0.
 */
int32_t taosGetFqdnPortFromEp(const char* ep, SEp* pEp) {
  pEp->port = 0;

  // Bounded copy, same pattern as addEpIntoEpSet(): an over-long endpoint
  // string is truncated instead of overflowing the fqdn buffer.
  // NOTE(review): relies on SEp::fqdn being a fixed-size array, as tListLen() requires.
  tstrncpy(pEp->fqdn, ep, tListLen(pEp->fqdn));

  char* temp = strchr(pEp->fqdn, ':');
  if (temp) {
    *temp = 0;  // terminate the FQDN at the separator
    pEp->port = atoi(temp + 1);
  }

  if (pEp->port == 0) {
    pEp->port = tsServerPort;
  }

  return 0;
}

L
Liu Jicong 已提交
39
/**
 * Append one endpoint (fqdn, port) at the end of an endpoint set.
 *
 * Nothing happens when pEpSet or fqdn is NULL, or when fqdn is an empty string.
 * NOTE(review): numOfEps is not checked against the capacity of eps[] here.
 */
void addEpIntoEpSet(SEpSet* pEpSet, const char* fqdn, uint16_t port) {
  if (pEpSet == NULL || fqdn == NULL || fqdn[0] == '\0') {
    return;
  }

  int32_t slot = pEpSet->numOfEps;

  // the fqdn is truncated to the size of the destination buffer if necessary
  tstrncpy(pEpSet->eps[slot].fqdn, fqdn, tListLen(pEpSet->eps[slot].fqdn));
  pEpSet->eps[slot].port = port;

  pEpSet->numOfEps += 1;
}

L
Liu Jicong 已提交
50
bool isEpsetEqual(const SEpSet* s1, const SEpSet* s2) {
51 52 53 54 55
  if (s1->numOfEps != s2->numOfEps || s1->inUse != s2->inUse) {
    return false;
  }

  for (int32_t i = 0; i < s1->numOfEps; i++) {
L
Liu Jicong 已提交
56
    if (s1->eps[i].port != s2->eps[i].port || strncmp(s1->eps[i].fqdn, s2->eps[i].fqdn, TSDB_FQDN_LEN) != 0)
57 58 59 60 61
      return false;
  }
  return true;
}

L
Liu Jicong 已提交
62
/**
 * Overwrite the endpoint set held by pEpSet with a copy of *pNewEpSet.
 * The assignment is bracketed by taosCorBeginWrite()/taosCorEndWrite() on
 * pEpSet->version.
 */
void updateEpSet_s(SCorEpSet* pEpSet, SEpSet* pNewEpSet) {
  taosCorBeginWrite(&pEpSet->version);

  pEpSet->epSet = *pNewEpSet;  // whole-struct copy

  taosCorEndWrite(&pEpSet->version);
}

L
Liu Jicong 已提交
68
/**
 * Return a by-value copy of the endpoint set held by pEpSet.
 * The copy is bracketed by taosCorBeginRead()/taosCorEndRead() on
 * pEpSet->version.
 */
SEpSet getEpSet_s(SCorEpSet* pEpSet) {
  SEpSet snapshot = {0};

  taosCorBeginRead(&pEpSet->version);
  snapshot = pEpSet->epSet;
  taosCorEndRead(&pEpSet->version);

  return snapshot;
}

77
int32_t colDataGetLength(const SColumnInfoData* pColumnInfoData, int32_t numOfRows) {
H
Haojun Liao 已提交
78 79 80 81
  ASSERT(pColumnInfoData != NULL);
  if (IS_VAR_DATA_TYPE(pColumnInfoData->info.type)) {
    return pColumnInfoData->varmeta.length;
  } else {
82 83 84 85 86
    if (pColumnInfoData->info.type == TSDB_DATA_TYPE_NULL) {
      return 0;
    } else {
      return pColumnInfoData->info.bytes * numOfRows;
    }
H
Haojun Liao 已提交
87 88 89
  }
}

H
Haojun Liao 已提交
90 91 92 93 94 95 96 97
/**
 * Size in bytes of a column including its per-row meta data.
 *
 * @return for variable-length types: varmeta.length plus one int32_t offset per row;
 *         for other types: info.bytes * numOfRows plus BitmapLen(numOfRows).
 */
int32_t colDataGetFullLength(const SColumnInfoData* pColumnInfoData, int32_t numOfRows) {
  if (IS_VAR_DATA_TYPE(pColumnInfoData->info.type)) {
    // payload + offset array
    return pColumnInfoData->varmeta.length + sizeof(int32_t) * numOfRows;
  }

  // payload + null bitmap
  return pColumnInfoData->info.bytes * numOfRows + BitmapLen(numOfRows);
}

H
Haojun Liao 已提交
98 99 100 101
/**
 * Placeholder: this function currently has an empty body.
 */
void colDataTrim(SColumnInfoData* pColumnInfoData) {
  (void)pColumnInfoData;  // TODO: not implemented yet
}

102 103 104 105
/**
 * Store one value (or a NULL marker) in row `currentRow` of a column.
 *
 * - NULL value: variable-length columns get offset -1 for the row, other
 *   columns get the row's bit set in the null bitmap; hasNull becomes true.
 * - Variable-length value: the bytes are appended at the end of pData (which
 *   is grown on demand) and the row's offset points at them.
 * - Fixed-length value: info.bytes bytes are copied into the row's slot.
 *
 * @param pColumnInfoData  destination column; must not be NULL.
 * @param currentRow       row index to write.
 * @param pData            source value; not read when isNull is true.
 * @param isNull           whether the row is NULL.
 * @return 0 on success, TSDB_CODE_OUT_OF_MEMORY if the data buffer cannot grow.
 */
int32_t colDataAppend(SColumnInfoData* pColumnInfoData, uint32_t currentRow, const char* pData, bool isNull) {
  ASSERT(pColumnInfoData != NULL);

  if (isNull) {
    // Each NULL value of a variable-length column still owns a slot in the offset array.
    if (IS_VAR_DATA_TYPE(pColumnInfoData->info.type)) {
      pColumnInfoData->varmeta.offset[currentRow] = -1;
    } else {
      colDataSetNull_f(pColumnInfoData->nullbitmap, currentRow);
    }

    pColumnInfoData->hasNull = true;
    return 0;
  }

  int32_t colType = pColumnInfoData->info.type;
  if (IS_VAR_DATA_TYPE(colType)) {
    int32_t valueLen = varDataTLen(pData);

    if (colType == TSDB_DATA_TYPE_JSON) {
      // For JSON the first byte is compared against type tags and selects
      // the length of what follows; one extra byte accounts for that tag.
      if (*pData == TSDB_DATA_TYPE_NULL) {
        valueLen = 0;
      } else if (*pData == TSDB_DATA_TYPE_NCHAR) {
        valueLen = varDataTLen(pData + CHAR_BYTES);
      } else if (*pData == TSDB_DATA_TYPE_BIGINT || *pData == TSDB_DATA_TYPE_DOUBLE) {
        valueLen = LONG_BYTES;
      } else if (*pData == TSDB_DATA_TYPE_BOOL) {
        valueLen = CHAR_BYTES;
      }

      valueLen += CHAR_BYTES;
    }

    SVarColAttr* pMeta = &pColumnInfoData->varmeta;
    if (pMeta->allocLen < pMeta->length + valueLen) {
      // grow by a factor of 1.5, starting from at least 8 bytes
      uint32_t capacity = pMeta->allocLen;
      if (capacity <= 1) {
        capacity = 8;
      }

      while (capacity < pMeta->length + valueLen) {
        capacity = capacity * 1.5;
      }

      char* pGrown = taosMemoryRealloc(pColumnInfoData->pData, capacity);
      if (pGrown == NULL) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      pColumnInfoData->pData = pGrown;
      pMeta->allocLen = capacity;
    }

    // the new value starts at the current end of the payload
    uint32_t writePos = pMeta->length;
    pMeta->offset[currentRow] = writePos;

    memcpy(pColumnInfoData->pData + writePos, pData, valueLen);
    pMeta->length += valueLen;
    return 0;
  }

  memcpy(pColumnInfoData->pData + pColumnInfoData->info.bytes * currentRow, pData, pColumnInfoData->info.bytes);
  return 0;
}

L
Liu Jicong 已提交
165 166
/**
 * Append the null bitmap of pSource (numOfRow2 rows) behind the first
 * numOfRow1 rows of the null bitmap of pColumnInfoData. The destination
 * bitmap is grown (and the new tail zeroed) when the merged row count needs
 * more bytes than numOfRow1 rows do.
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when the destination
 *         bitmap cannot be grown; in that case the destination is not modified.
 */
static int32_t doBitmapMerge(SColumnInfoData* pColumnInfoData, int32_t numOfRow1, const SColumnInfoData* pSource,
                             int32_t numOfRow2) {
  if (numOfRow2 <= 0) {
    return TSDB_CODE_SUCCESS;
  }

  uint32_t total = numOfRow1 + numOfRow2;

  if (BitmapLen(numOfRow1) < BitmapLen(total)) {
    char* tmp = taosMemoryRealloc(pColumnInfoData->nullbitmap, BitmapLen(total));
    if (tmp == NULL) {
      // the old bitmap is still owned by pColumnInfoData; report instead of writing through NULL
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    // zero the newly added bytes so that source bits can be OR-ed into them below
    uint32_t extend = BitmapLen(total) - BitmapLen(numOfRow1);
    memset(tmp + BitmapLen(numOfRow1), 0, extend);
    pColumnInfoData->nullbitmap = tmp;
  }

  uint32_t remindBits = BitPos(numOfRow1);
  uint32_t shiftBits = 8 - remindBits;

  if (remindBits == 0) {  // no need to shift bits of bitmap: plain byte copy
    memcpy(pColumnInfoData->nullbitmap + BitmapLen(numOfRow1), pSource->nullbitmap, BitmapLen(numOfRow2));
    return TSDB_CODE_SUCCESS;
  }

  // The first source byte is shifted right and OR-ed into the last byte used by the destination.
  uint8_t* p = (uint8_t*)pSource->nullbitmap;
  pColumnInfoData->nullbitmap[BitmapLen(numOfRow1) - 1] |= (p[0] >> remindBits);

  if (BitmapLen(numOfRow1) == BitmapLen(total)) {
    return TSDB_CODE_SUCCESS;  // everything fitted into the existing last byte
  }

  int32_t len = BitmapLen(numOfRow2);
  int32_t i = 0;

  uint8_t* start = (uint8_t*)&pColumnInfoData->nullbitmap[BitmapLen(numOfRow1)];
  int32_t  overCount = BitmapLen(total) - BitmapLen(numOfRow1);
  while (i < len) {  // size limit of pSource->nullbitmap
    if (i >= 1) {
      start[i - 1] |= (p[i] >> remindBits);  // part of source byte i that belongs to the previous destination byte
    }

    if (i >= overCount) {  // size limit of pColumnInfoData->nullbitmap
      return TSDB_CODE_SUCCESS;
    }

    start[i] |= (p[i] << shiftBits);  // remaining bits of source byte i
    i += 1;
  }

  return TSDB_CODE_SUCCESS;
}

/**
 * Append numOfRow2 rows of pSource behind the numOfRow1 rows already stored
 * in pColumnInfoData. Both columns must have the same type.
 *
 * Variable-length columns: the offset array is grown and the source offsets
 * are rebased by the current payload length (NULL rows keep -1), then the
 * source payload is appended. Other columns: the null bitmaps are merged and
 * the fixed-size values are appended.
 *
 * @return numOfRow1 + numOfRow2 on success (numOfRow1 when numOfRow2 is 0);
 *         an out-of-memory error code when a buffer cannot be grown.
 */
int32_t colDataMergeCol(SColumnInfoData* pColumnInfoData, uint32_t numOfRow1, const SColumnInfoData* pSource,
                        uint32_t numOfRow2) {
  ASSERT(pColumnInfoData != NULL && pSource != NULL && pColumnInfoData->info.type == pSource->info.type);

  if (numOfRow2 == 0) {
    return numOfRow1;
  }

  if (pSource->hasNull) {
    pColumnInfoData->hasNull = pSource->hasNull;
  }

  if (IS_VAR_DATA_TYPE(pColumnInfoData->info.type)) {
    // grow the offset array to hold the offsets of all merged rows
    char* p = taosMemoryRealloc(pColumnInfoData->varmeta.offset, sizeof(int32_t) * (numOfRow1 + numOfRow2));
    if (p == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pColumnInfoData->varmeta.offset = (int32_t*)p;
    for (int32_t i = 0; i < numOfRow2; ++i) {
      if (pSource->varmeta.offset[i] == -1) {
        pColumnInfoData->varmeta.offset[i + numOfRow1] = -1;
      } else {
        // source offsets are relative to the source payload; rebase them onto the end of ours
        pColumnInfoData->varmeta.offset[i + numOfRow1] = pSource->varmeta.offset[i] + pColumnInfoData->varmeta.length;
      }
    }

    // copy data
    uint32_t len = pSource->varmeta.length;
    uint32_t oldLen = pColumnInfoData->varmeta.length;
    if (pColumnInfoData->varmeta.allocLen < len + oldLen) {
      char* tmp = taosMemoryRealloc(pColumnInfoData->pData, len + oldLen);
      if (tmp == NULL) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      pColumnInfoData->pData = tmp;
      pColumnInfoData->varmeta.allocLen = len + oldLen;
    }

    memcpy(pColumnInfoData->pData + oldLen, pSource->pData, len);
    pColumnInfoData->varmeta.length = len + oldLen;
  } else {
    int32_t code = doBitmapMerge(pColumnInfoData, numOfRow1, pSource, numOfRow2);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }

    int32_t newSize = (numOfRow1 + numOfRow2) * pColumnInfoData->info.bytes;
    char*   tmp = taosMemoryRealloc(pColumnInfoData->pData, newSize);
    if (tmp == NULL) {
      return TSDB_CODE_VND_OUT_OF_MEMORY;
    }

    pColumnInfoData->pData = tmp;
    int32_t offset = pColumnInfoData->info.bytes * numOfRow1;
    memcpy(pColumnInfoData->pData + offset, pSource->pData, pSource->info.bytes * numOfRow2);
  }

  return numOfRow1 + numOfRow2;
}

272 273 274 275 276 277 278 279
/**
 * Overwrite the content of pColumnInfoData with the first numOfRows rows of
 * pSource. Both columns must have the same type. The destination buffers are
 * reallocated as needed; hasNull and info are copied from the source.
 *
 * @return 0 on success (also when numOfRows is 0, in which case nothing is
 *         copied), TSDB_CODE_OUT_OF_MEMORY when a buffer cannot be resized.
 */
int32_t colDataAssign(SColumnInfoData* pColumnInfoData, const SColumnInfoData* pSource, int32_t numOfRows) {
  ASSERT(pColumnInfoData != NULL && pSource != NULL && pColumnInfoData->info.type == pSource->info.type);
  if (numOfRows == 0) {
    return numOfRows;
  }

  if (IS_VAR_DATA_TYPE(pColumnInfoData->info.type)) {
    // offset array: exactly one int32_t per row
    char* pOffsets = taosMemoryRealloc(pColumnInfoData->varmeta.offset, sizeof(int32_t) * numOfRows);
    if (pOffsets == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pColumnInfoData->varmeta.offset = (int32_t*)pOffsets;
    memcpy(pColumnInfoData->varmeta.offset, pSource->varmeta.offset, sizeof(int32_t) * numOfRows);

    // payload: grow only when the current allocation is too small
    if (pColumnInfoData->varmeta.allocLen < pSource->varmeta.length) {
      char* pPayload = taosMemoryRealloc(pColumnInfoData->pData, pSource->varmeta.length);
      if (pPayload == NULL) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      pColumnInfoData->pData = pPayload;
      pColumnInfoData->varmeta.allocLen = pSource->varmeta.length;
    }

    memcpy(pColumnInfoData->pData, pSource->pData, pSource->varmeta.length);
    pColumnInfoData->varmeta.length = pSource->varmeta.length;
  } else {
    // null bitmap
    char* pBitmap = taosMemoryRealloc(pColumnInfoData->nullbitmap, BitmapLen(numOfRows));
    if (pBitmap == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pColumnInfoData->nullbitmap = pBitmap;
    memcpy(pColumnInfoData->nullbitmap, pSource->nullbitmap, BitmapLen(numOfRows));

    // fixed-size values
    int32_t newSize = numOfRows * pColumnInfoData->info.bytes;
    char*   pValues = taosMemoryRealloc(pColumnInfoData->pData, newSize);
    if (pValues == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pColumnInfoData->pData = pValues;
    memcpy(pColumnInfoData->pData, pSource->pData, pSource->info.bytes * numOfRows);
  }

  pColumnInfoData->hasNull = pSource->hasNull;
  pColumnInfoData->info = pSource->info;
  return 0;
}

H
Haojun Liao 已提交
324
size_t blockDataGetNumOfCols(const SSDataBlock* pBlock) {
H
Haojun Liao 已提交
325
  ASSERT(pBlock && pBlock->info.numOfCols == taosArrayGetSize(pBlock->pDataBlock));
326 327 328
  return pBlock->info.numOfCols;
}

L
Liu Jicong 已提交
329
/** Number of rows of a data block, as recorded in info.rows. */
size_t blockDataGetNumOfRows(const SSDataBlock* pBlock) {
  return pBlock->info.rows;
}
330

H
Haojun Liao 已提交
331
/**
 * Refresh info.window of a block from its first column: skey is taken from
 * the first row and ekey from the last row.
 *
 * Nothing is changed when the block is NULL, has no rows, or when the first
 * column is not of type TSDB_DATA_TYPE_TIMESTAMP.
 *
 * @return -1 when the block has rows but no columns, 0 otherwise.
 */
int32_t blockDataUpdateTsWindow(SSDataBlock* pDataBlock) {
  if (pDataBlock == NULL || pDataBlock->info.rows <= 0) {
    return 0;
  }

  if (pDataBlock->info.numOfCols <= 0) {
    return -1;
  }

  SColumnInfoData* pFirstCol = taosArrayGet(pDataBlock->pDataBlock, 0);
  if (pFirstCol->info.type == TSDB_DATA_TYPE_TIMESTAMP) {
    pDataBlock->info.window.skey = *(TSKEY*)colDataGetData(pFirstCol, 0);
    pDataBlock->info.window.ekey = *(TSKEY*)colDataGetData(pFirstCol, (pDataBlock->info.rows - 1));
  }

  return 0;
}

350
// if pIndexMap = NULL, merger one column by on column
351
int32_t blockDataMerge(SSDataBlock* pDest, const SSDataBlock* pSrc, SArray* pIndexMap) {
wmmhello's avatar
wmmhello 已提交
352
  assert(pSrc != NULL && pDest != NULL);
H
Haojun Liao 已提交
353

wmmhello's avatar
wmmhello 已提交
354
  int32_t numOfCols = pDest->info.numOfCols;
L
Liu Jicong 已提交
355
  for (int32_t i = 0; i < numOfCols; ++i) {
356
    int32_t mapIndex = i;
L
Liu Jicong 已提交
357
    if (pIndexMap) {
358 359
      mapIndex = *(int32_t*)taosArrayGet(pIndexMap, i);
    }
H
Haojun Liao 已提交
360
    SColumnInfoData* pCol2 = taosArrayGet(pDest->pDataBlock, i);
361
    SColumnInfoData* pCol1 = taosArrayGet(pSrc->pDataBlock, mapIndex);
H
Haojun Liao 已提交
362

363 364
    uint32_t oldLen = colDataGetLength(pCol2, pDest->info.rows);
    uint32_t newLen = colDataGetLength(pCol1, pSrc->info.rows);
H
Haojun Liao 已提交
365 366

    int32_t newSize = oldLen + newLen;
wafwerar's avatar
wafwerar 已提交
367
    char*   tmp = taosMemoryRealloc(pCol2->pData, newSize);
H
Haojun Liao 已提交
368 369 370 371 372 373 374 375 376 377 378 379 380 381 382
    if (tmp != NULL) {
      pCol2->pData = tmp;
      colDataMergeCol(pCol2, pDest->info.rows, pCol1, pSrc->info.rows);
    } else {
      return TSDB_CODE_VND_OUT_OF_MEMORY;
    }
  }

  pDest->info.rows += pSrc->info.rows;
  return TSDB_CODE_SUCCESS;
}

size_t blockDataGetSize(const SSDataBlock* pBlock) {
  assert(pBlock != NULL);

L
Liu Jicong 已提交
383
  size_t  total = 0;
H
Haojun Liao 已提交
384
  int32_t numOfCols = pBlock->info.numOfCols;
H
Haojun Liao 已提交
385

L
Liu Jicong 已提交
386
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
387
    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, i);
H
Haojun Liao 已提交
388
    total += colDataGetFullLength(pColInfoData, pBlock->info.rows);
H
Haojun Liao 已提交
389 390 391 392 393 394 395
  }

  return total;
}

// the number of tuples can be fit in one page.
// Actual data rows pluses the corresponding meta data must fit in one memory buffer of the given page size.
L
Liu Jicong 已提交
396 397
int32_t blockDataSplitRows(SSDataBlock* pBlock, bool hasVarCol, int32_t startIndex, int32_t* stopIndex,
                           int32_t pageSize) {
H
Haojun Liao 已提交
398 399 400 401 402
  ASSERT(pBlock != NULL && stopIndex != NULL);

  int32_t numOfCols = pBlock->info.numOfCols;
  int32_t numOfRows = pBlock->info.rows;

H
Haojun Liao 已提交
403 404
  int32_t bitmapChar = 1;

L
Liu Jicong 已提交
405
  size_t headerSize = sizeof(int32_t);
406
  size_t colHeaderSize = sizeof(int32_t) * numOfCols;
L
Liu Jicong 已提交
407
  size_t payloadSize = pageSize - (headerSize + colHeaderSize);
408

H
Haojun Liao 已提交
409
  // TODO speedup by checking if the whole page can fit in firstly.
H
Haojun Liao 已提交
410
  if (!hasVarCol) {
L
Liu Jicong 已提交
411
    size_t  rowSize = blockDataGetRowSize(pBlock);
412 413
    int32_t capacity = payloadSize / (rowSize + numOfCols * bitmapChar / 8.0);
    ASSERT(capacity > 0);
414

415
    *stopIndex = startIndex + capacity - 1;
H
Haojun Liao 已提交
416 417 418
    if (*stopIndex >= numOfRows) {
      *stopIndex = numOfRows - 1;
    }
419

H
Haojun Liao 已提交
420
    return TSDB_CODE_SUCCESS;
421
  }
wmmhello's avatar
wmmhello 已提交
422 423 424 425 426 427
  // iterate the rows that can be fit in this buffer page
  int32_t size = (headerSize + colHeaderSize);
  for (int32_t j = startIndex; j < numOfRows; ++j) {
    for (int32_t i = 0; i < numOfCols; ++i) {
      SColumnInfoData* pColInfoData = TARRAY_GET_ELEM(pBlock->pDataBlock, i);
      if (IS_VAR_DATA_TYPE(pColInfoData->info.type)) {
428
        if (pColInfoData->varmeta.offset[j] != -1) {
wmmhello's avatar
wmmhello 已提交
429 430
          char* p = colDataGetData(pColInfoData, j);
          size += varDataTLen(p);
H
Haojun Liao 已提交
431 432
        }

wmmhello's avatar
wmmhello 已提交
433
        size += sizeof(pColInfoData->varmeta.offset[0]);
434
      } else {
wmmhello's avatar
wmmhello 已提交
435
        size += pColInfoData->info.bytes;
H
Haojun Liao 已提交
436

wmmhello's avatar
wmmhello 已提交
437 438 439
        if (((j - startIndex) & 0x07) == 0) {
          size += 1;  // the space for null bitmap
        }
H
Haojun Liao 已提交
440 441 442
      }
    }

wmmhello's avatar
wmmhello 已提交
443
    if (size > pageSize) {  // pageSize must be able to hold one row
wmmhello's avatar
wmmhello 已提交
444
      *stopIndex = j - 1;
wmmhello's avatar
wmmhello 已提交
445
      ASSERT(*stopIndex >= startIndex);
wmmhello's avatar
wmmhello 已提交
446 447 448

      return TSDB_CODE_SUCCESS;
    }
H
Haojun Liao 已提交
449
  }
wmmhello's avatar
wmmhello 已提交
450 451 452 453

  // all fit in
  *stopIndex = numOfRows - 1;
  return TSDB_CODE_SUCCESS;
H
Haojun Liao 已提交
454 455
}

456 457 458 459 460
/**
 * Create a new block holding a copy of rows
 * [startIndex, startIndex + rowCount) of pBlock.
 *
 * The new block gets a copy of pBlock->info (with rows set to rowCount) and
 * one freshly allocated column per source column.
 *
 * @param pBlock      source block.
 * @param startIndex  first row to copy; must be >= 0.
 * @param rowCount    number of rows to copy; must be >= 0 and
 *                    startIndex + rowCount must not exceed pBlock->info.rows.
 * @return the new block, or NULL on invalid arguments or when the block or
 *         its column array cannot be allocated.
 *
 * NOTE(review): the per-column buffers allocated below are still not checked
 * for allocation failure.
 */
SSDataBlock* blockDataExtractBlock(SSDataBlock* pBlock, int32_t startIndex, int32_t rowCount) {
  if (pBlock == NULL || startIndex < 0 || rowCount < 0 || rowCount > pBlock->info.rows ||
      rowCount + startIndex > pBlock->info.rows) {
    return NULL;
  }

  SSDataBlock* pDst = taosMemoryCalloc(1, sizeof(SSDataBlock));
  if (pDst == NULL) {
    return NULL;
  }

  pDst->info = pBlock->info;

  pDst->info.rows = 0;
  pDst->pDataBlock = taosArrayInit(pBlock->info.numOfCols, sizeof(SColumnInfoData));
  if (pDst->pDataBlock == NULL) {
    taosMemoryFreeClear(pDst);
    return NULL;
  }

  // first pass: create empty destination columns with room for rowCount rows
  for (int32_t i = 0; i < pBlock->info.numOfCols; ++i) {
    SColumnInfoData  colInfo = {0};
    SColumnInfoData* pSrcCol = taosArrayGet(pBlock->pDataBlock, i);
    colInfo.info = pSrcCol->info;

    if (IS_VAR_DATA_TYPE(pSrcCol->info.type)) {
      // the payload buffer of a variable-length column is grown by colDataAppend()
      SVarColAttr* pAttr = &colInfo.varmeta;
      pAttr->offset = taosMemoryCalloc(rowCount, sizeof(int32_t));
    } else {
      colInfo.nullbitmap = taosMemoryCalloc(1, BitmapLen(rowCount));
      colInfo.pData = taosMemoryCalloc(rowCount, colInfo.info.bytes);
    }

    taosArrayPush(pDst->pDataBlock, &colInfo);
  }

  // second pass: copy the requested rows value by value
  for (int32_t i = 0; i < pBlock->info.numOfCols; ++i) {
    SColumnInfoData* pColData = taosArrayGet(pBlock->pDataBlock, i);
    SColumnInfoData* pDstCol = taosArrayGet(pDst->pDataBlock, i);

    for (int32_t j = startIndex; j < (startIndex + rowCount); ++j) {
      // pBlockAgg may be absent (blocks created by this function never set it),
      // so do not index it unconditionally.
      bool isNull;
      if (pBlock->pBlockAgg == NULL) {
        isNull = colDataIsNull(pColData, pBlock->info.rows, j, NULL);
      } else {
        isNull = colDataIsNull(pColData, pBlock->info.rows, j, pBlock->pBlockAgg[i]);
      }

      char* p = colDataGetData(pColData, j);

      colDataAppend(pDstCol, j - startIndex, p, isNull);
    }
  }

  pDst->info.rows = rowCount;
  return pDst;
}

H
Haojun Liao 已提交
503 504
/**
 *
505 506 507 508 509
 * +------------------+---------------------------------------------+
 * |the number of rows|                    column #1                |
 * |    (4 bytes)     |------------+-----------------------+--------+
 * |                  | null bitmap| column length(4bytes) | values |
 * +------------------+------------+-----------------------+--------+
H
Haojun Liao 已提交
510 511 512 513
 * @param buf
 * @param pBlock
 * @return
 */
514
int32_t blockDataToBuf(char* buf, const SSDataBlock* pBlock) {
H
Haojun Liao 已提交
515 516 517
  ASSERT(pBlock != NULL);

  // write the number of rows
L
Liu Jicong 已提交
518
  *(uint32_t*)buf = pBlock->info.rows;
H
Haojun Liao 已提交
519 520 521 522 523 524

  int32_t numOfCols = pBlock->info.numOfCols;
  int32_t numOfRows = pBlock->info.rows;

  char* pStart = buf + sizeof(uint32_t);

L
Liu Jicong 已提交
525
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
526 527 528 529 530 531 532 533 534
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, i);
    if (IS_VAR_DATA_TYPE(pCol->info.type)) {
      memcpy(pStart, pCol->varmeta.offset, numOfRows * sizeof(int32_t));
      pStart += numOfRows * sizeof(int32_t);
    } else {
      memcpy(pStart, pCol->nullbitmap, BitmapLen(numOfRows));
      pStart += BitmapLen(pBlock->info.rows);
    }

535
    uint32_t dataSize = colDataGetLength(pCol, numOfRows);
536

L
Liu Jicong 已提交
537
    *(int32_t*)pStart = dataSize;
538 539
    pStart += sizeof(int32_t);

H
Haojun Liao 已提交
540 541 542 543 544 545 546
    memcpy(pStart, pCol->pData, dataSize);
    pStart += dataSize;
  }

  return 0;
}

547
/**
 * Load the content of a block from a buffer laid out as: row count (4 bytes),
 * then per column the offsets or null bitmap, a 4-byte payload length and the
 * payload. The column types and count are taken from pBlock itself.
 *
 * For variable-length columns the offset array is reallocated to the new row
 * count and the payload buffer is grown when too small. For other columns the
 * existing nullbitmap and pData buffers are written as they are.
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when a buffer cannot
 *         be resized.
 */
int32_t blockDataFromBuf(SSDataBlock* pBlock, const char* buf) {
  pBlock->info.rows = *(int32_t*)buf;

  int32_t     numOfCols = pBlock->info.numOfCols;
  const char* pCursor = buf + sizeof(uint32_t);

  for (int32_t col = 0; col < numOfCols; ++col) {
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, col);

    if (IS_VAR_DATA_TYPE(pCol->info.type)) {
      // the previously allocated offset array may be too small for this row count
      size_t offsetBytes = pBlock->info.rows * sizeof(int32_t);
      char*  pOffsets = taosMemoryRealloc(pCol->varmeta.offset, offsetBytes);
      if (pOffsets == NULL) {
        return TSDB_CODE_OUT_OF_MEMORY;
      }

      pCol->varmeta.offset = (int32_t*)pOffsets;
      memcpy(pCol->varmeta.offset, pCursor, offsetBytes);
      pCursor += offsetBytes;
    } else {
      memcpy(pCol->nullbitmap, pCursor, BitmapLen(pBlock->info.rows));
      pCursor += BitmapLen(pBlock->info.rows);
    }

    int32_t colLength = *(int32_t*)pCursor;
    pCursor += sizeof(int32_t);

    if (IS_VAR_DATA_TYPE(pCol->info.type)) {
      if (pCol->varmeta.allocLen < colLength) {
        char* pPayload = taosMemoryRealloc(pCol->pData, colLength);
        if (pPayload == NULL) {
          return TSDB_CODE_OUT_OF_MEMORY;
        }

        pCol->pData = pPayload;
        pCol->varmeta.allocLen = colLength;
      }

      pCol->varmeta.length = colLength;
      ASSERT(pCol->varmeta.length <= pCol->varmeta.allocLen);
    }

    memcpy(pCol->pData, pCursor, colLength);
    pCursor += colLength;
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631
/**
 * Variant of blockDataFromBuf() for buffers whose per-column sections are
 * sized by `capacity` rows rather than by the stored row count: the offsets
 * or null bitmap span `capacity` rows, and after the payload the read
 * position advances by info.bytes * capacity.
 *
 * The offset array, null bitmap and fixed-size pData buffers are written as
 * they are; only the payload buffer of variable-length columns is grown.
 *
 * @return TSDB_CODE_SUCCESS, or TSDB_CODE_OUT_OF_MEMORY when a payload buffer
 *         cannot be grown.
 */
int32_t blockDataFromBuf1(SSDataBlock* pBlock, const char* buf, size_t capacity) {
  pBlock->info.rows = *(int32_t*)buf;

  int32_t     numOfCols = pBlock->info.numOfCols;
  const char* pCursor = buf + sizeof(uint32_t);

  for (int32_t col = 0; col < numOfCols; ++col) {
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, col);

    if (IS_VAR_DATA_TYPE(pCol->info.type)) {
      size_t offsetBytes = capacity * sizeof(int32_t);
      memcpy(pCol->varmeta.offset, pCursor, offsetBytes);
      pCursor += offsetBytes;
    } else {
      memcpy(pCol->nullbitmap, pCursor, BitmapLen(capacity));
      pCursor += BitmapLen(capacity);
    }

    int32_t colLength = *(int32_t*)pCursor;
    pCursor += sizeof(int32_t);

    if (IS_VAR_DATA_TYPE(pCol->info.type)) {
      if (pCol->varmeta.allocLen < colLength) {
        char* pPayload = taosMemoryRealloc(pCol->pData, colLength);
        if (pPayload == NULL) {
          return TSDB_CODE_OUT_OF_MEMORY;
        }

        pCol->pData = pPayload;
        pCol->varmeta.allocLen = colLength;
      }

      pCol->varmeta.length = colLength;
      ASSERT(pCol->varmeta.length <= pCol->varmeta.allocLen);
    }

    memcpy(pCol->pData, pCursor, colLength);

    // the value area is skipped by its reserved size, not by colLength
    pCursor += pCol->info.bytes * capacity;
  }

  return TSDB_CODE_SUCCESS;
}

638
/**
 * Row size of a block: the sum of info.bytes over all columns.
 * The value is computed on the first call (while info.rowSize is 0) and
 * cached in pBlock->info.rowSize.
 */
size_t blockDataGetRowSize(SSDataBlock* pBlock) {
  ASSERT(pBlock != NULL);

  if (pBlock->info.rowSize != 0) {
    return pBlock->info.rowSize;  // already cached
  }

  size_t bytesPerRow = 0;
  size_t numOfCols = pBlock->info.numOfCols;

  for (int32_t i = 0; i < numOfCols; ++i) {
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, i);
    bytesPerRow += pCol->info.bytes;
  }

  pBlock->info.rowSize = bytesPerRow;
  return pBlock->info.rowSize;
}

H
Haojun Liao 已提交
655 656 657 658 659 660
/**
 * @refitem blockDataToBuf for the meta size
 * @param pBlock
 * @return
 */
size_t blockDataGetSerialMetaSize(const SSDataBlock* pBlock) {
661 662
  // | total rows/total length | block group id | each column length |
  return sizeof(int32_t) + sizeof(uint64_t) + pBlock->info.numOfCols * sizeof(int32_t);
H
Haojun Liao 已提交
663 664 665 666 667 668 669
}

double blockDataGetSerialRowSize(const SSDataBlock* pBlock) {
  ASSERT(pBlock != NULL);
  double rowSize = 0;

  size_t numOfCols = pBlock->info.numOfCols;
L
Liu Jicong 已提交
670
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
671 672 673 674 675 676
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, i);
    rowSize += pColInfo->info.bytes;

    if (IS_VAR_DATA_TYPE(pColInfo->info.type)) {
      rowSize += sizeof(int32_t);
    } else {
L
Liu Jicong 已提交
677
      rowSize += 1 / 8.0;  // one bit for each record
H
Haojun Liao 已提交
678 679 680 681 682 683
    }
  }

  return rowSize;
}

H
Haojun Liao 已提交
684
typedef struct SSDataBlockSortHelper {
L
Liu Jicong 已提交
685 686
  SArray*      orderInfo;  // SArray<SBlockOrderInfo>
  SSDataBlock* pDataBlock;
H
Haojun Liao 已提交
687 688 689
} SSDataBlockSortHelper;

int32_t dataBlockCompar(const void* p1, const void* p2, const void* param) {
L
Liu Jicong 已提交
690
  const SSDataBlockSortHelper* pHelper = (const SSDataBlockSortHelper*)param;
H
Haojun Liao 已提交
691 692 693

  SSDataBlock* pDataBlock = pHelper->pDataBlock;

L
Liu Jicong 已提交
694 695
  int32_t left = *(int32_t*)p1;
  int32_t right = *(int32_t*)p2;
H
Haojun Liao 已提交
696 697

  SArray* pInfo = pHelper->orderInfo;
698

L
Liu Jicong 已提交
699
  for (int32_t i = 0; i < pInfo->size; ++i) {
H
Haojun Liao 已提交
700
    SBlockOrderInfo* pOrder = TARRAY_GET_ELEM(pInfo, i);
L
Liu Jicong 已提交
701
    SColumnInfoData* pColInfoData = pOrder->pColData;  // TARRAY_GET_ELEM(pDataBlock->pDataBlock, pOrder->colIndex);
H
Haojun Liao 已提交
702

703
    if (pColInfoData->hasNull) {
704 705
      bool leftNull = colDataIsNull(pColInfoData, pDataBlock->info.rows, left, NULL);
      bool rightNull = colDataIsNull(pColInfoData, pDataBlock->info.rows, right, NULL);
706
      if (leftNull && rightNull) {
L
Liu Jicong 已提交
707
        continue;  // continue to next slot
708
      }
H
Haojun Liao 已提交
709

710
      if (rightNull) {
H
Haojun Liao 已提交
711
        return pOrder->nullFirst ? 1 : -1;
712
      }
H
Haojun Liao 已提交
713

714
      if (leftNull) {
H
Haojun Liao 已提交
715
        return pOrder->nullFirst ? -1 : 1;
716
      }
H
Haojun Liao 已提交
717 718
    }

L
Liu Jicong 已提交
719
    void* left1 = colDataGetData(pColInfoData, left);
720
    void* right1 = colDataGetData(pColInfoData, right);
H
Haojun Liao 已提交
721

722
    __compar_fn_t fn = getKeyComparFunc(pColInfoData->info.type, pOrder->order);
723

724 725 726 727 728
    int ret = fn(left1, right1);
    if (ret == 0) {
      continue;
    } else {
      return ret;
H
Haojun Liao 已提交
729 730 731 732 733 734
    }
  }

  return 0;
}

L
Liu Jicong 已提交
735 736
/**
 * Copy row `tupleIndex` of every column of pSrcBlock into row `numOfRows` of
 * the matching column in pDstCols.
 *
 * @param pDstCols    destination columns, one per column of pSrcBlock.
 * @param numOfRows   destination row index.
 * @param pSrcBlock   source block.
 * @param tupleIndex  source row index.
 * @return TSDB_CODE_SUCCESS, or the first error returned by colDataAppend().
 */
static int32_t doAssignOneTuple(SColumnInfoData* pDstCols, int32_t numOfRows, const SSDataBlock* pSrcBlock,
                                int32_t tupleIndex) {
  int32_t numOfCols = pSrcBlock->info.numOfCols;

  for (int32_t i = 0; i < numOfCols; ++i) {
    SColumnInfoData* pDst = &pDstCols[i];
    SColumnInfoData* pSrc = taosArrayGet(pSrcBlock->pDataBlock, i);

    // The null check is only needed for columns flagged as containing NULLs.
    // pBlockAgg may be absent, so do not index it unconditionally.
    bool isNull = false;
    if (pSrc->hasNull) {
      if (pSrcBlock->pBlockAgg == NULL) {
        isNull = colDataIsNull(pSrc, pSrcBlock->info.rows, tupleIndex, NULL);
      } else {
        isNull = colDataIsNull(pSrc, pSrcBlock->info.rows, tupleIndex, pSrcBlock->pBlockAgg[i]);
      }
    }

    int32_t code = 0;
    if (isNull) {
      code = colDataAppend(pDst, numOfRows, NULL, true);
    } else {
      char* p = colDataGetData(pSrc, tupleIndex);
      code = colDataAppend(pDst, numOfRows, p, false);
    }

    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
761
/**
 * Fill the helper columns pCols with the rows of pDataBlock rearranged by
 * `index`: destination row j receives source row index[j].
 *
 * Variable-length columns: the whole payload is copied unchanged and only the
 * offset array is permuted. Other columns: each value is copied into its new
 * slot, or the destination null bit is set when the source row is NULL.
 *
 * @param pCols       destination columns, one per column of pDataBlock, with
 *                    buffers already allocated.
 * @param pDataBlock  source block.
 * @param index       source row index for each destination row.
 * @return TSDB_CODE_SUCCESS.
 */
static int32_t blockDataAssign(SColumnInfoData* pCols, const SSDataBlock* pDataBlock, int32_t* index) {
#if 0
  // disabled alternative: copy tuple by tuple
  for (int32_t i = 0; i < pDataBlock->info.rows; ++i) {
    int32_t code = doAssignOneTuple(pCols, i, pDataBlock, index[i]);
    if (code != TSDB_CODE_SUCCESS) {
      return code;
    }
  }
#else
  int32_t numOfCols = pDataBlock->info.numOfCols;
  int32_t numOfRows = pDataBlock->info.rows;

  for (int32_t col = 0; col < numOfCols; ++col) {
    SColumnInfoData* pDst = &pCols[col];
    SColumnInfoData* pSrc = taosArrayGet(pDataBlock->pDataBlock, col);

    if (IS_VAR_DATA_TYPE(pSrc->info.type)) {
      memcpy(pDst->pData, pSrc->pData, pSrc->varmeta.length);
      pDst->varmeta.length = pSrc->varmeta.length;

      for (int32_t row = 0; row < numOfRows; ++row) {
        pDst->varmeta.offset[row] = pSrc->varmeta.offset[index[row]];
      }
    } else {
      for (int32_t row = 0; row < numOfRows; ++row) {
        if (colDataIsNull_f(pSrc->nullbitmap, index[row])) {
          colDataSetNull_f(pDst->nullbitmap, row);
        } else {
          memcpy(pDst->pData + row * pDst->info.bytes, pSrc->pData + index[row] * pDst->info.bytes, pDst->info.bytes);
        }
      }
    }
  }
#endif
  return TSDB_CODE_SUCCESS;
}

static SColumnInfoData* createHelpColInfoData(const SSDataBlock* pDataBlock) {
  int32_t rows = pDataBlock->info.rows;
  int32_t numOfCols = pDataBlock->info.numOfCols;

wafwerar's avatar
wafwerar 已提交
799
  SColumnInfoData* pCols = taosMemoryCalloc(numOfCols, sizeof(SColumnInfoData));
H
Haojun Liao 已提交
800 801 802 803
  if (pCols == NULL) {
    return NULL;
  }

L
Liu Jicong 已提交
804
  for (int32_t i = 0; i < numOfCols; ++i) {
H
Haojun Liao 已提交
805 806 807 808
    SColumnInfoData* pColInfoData = taosArrayGet(pDataBlock->pDataBlock, i);
    pCols[i].info = pColInfoData->info;

    if (IS_VAR_DATA_TYPE(pCols[i].info.type)) {
wafwerar's avatar
wafwerar 已提交
809 810
      pCols[i].varmeta.offset = taosMemoryCalloc(rows, sizeof(int32_t));
      pCols[i].pData = taosMemoryCalloc(1, pColInfoData->varmeta.length);
H
Haojun Liao 已提交
811 812 813

      pCols[i].varmeta.length = pColInfoData->varmeta.length;
      pCols[i].varmeta.allocLen = pCols[i].varmeta.length;
H
Haojun Liao 已提交
814
    } else {
wafwerar's avatar
wafwerar 已提交
815 816
      pCols[i].nullbitmap = taosMemoryCalloc(1, BitmapLen(rows));
      pCols[i].pData = taosMemoryCalloc(rows, pCols[i].info.bytes);
H
Haojun Liao 已提交
817 818 819 820 821 822
    }
  }

  return pCols;
}

H
Haojun Liao 已提交
823
/**
 * Move the buffers held by the scratch columns pCols into pDataBlock.
 *
 * For every column the block's previous buffers are freed and replaced by the scratch buffers;
 * afterwards the scratch array itself (but not the buffers it handed over) is released.
 *
 * @param pDataBlock  block that receives the buffers
 * @param pCols       scratch columns, one per column of pDataBlock; freed by this call
 */
static void copyBackToBlock(SSDataBlock* pDataBlock, SColumnInfoData* pCols) {
  const int32_t colCount = pDataBlock->info.numOfCols;

  for (int32_t c = 0; c < colCount; ++c) {
    SColumnInfoData* pTarget = taosArrayGet(pDataBlock->pDataBlock, c);
    SColumnInfoData* pScratch = &pCols[c];

    pTarget->info = pScratch->info;

    // Swap the per-type metadata first: the null bitmap for fixed-length columns,
    // the offset table (with its lengths) for variable-length ones.
    if (!IS_VAR_DATA_TYPE(pTarget->info.type)) {
      taosMemoryFreeClear(pTarget->nullbitmap);
      pTarget->nullbitmap = pScratch->nullbitmap;
    } else {
      taosMemoryFreeClear(pTarget->varmeta.offset);
      pTarget->varmeta = pScratch->varmeta;
    }

    // Then swap the value buffer.
    taosMemoryFreeClear(pTarget->pData);
    pTarget->pData = pScratch->pData;
  }

  taosMemoryFreeClear(pCols);
}

/**
 * Build the identity permutation 0, 1, ..., rows - 1.
 *
 * @param rows  number of entries
 * @return      newly allocated array, or NULL when the allocation fails
 */
static int32_t* createTupleIndex(size_t rows) {
  int32_t* index = taosMemoryCalloc(rows, sizeof(int32_t));

  if (index != NULL) {
    int32_t pos = 0;
    while (pos < rows) {
      index[pos] = pos;
      ++pos;
    }
  }

  return index;
}

wafwerar's avatar
wafwerar 已提交
858
// Release an index array through taosMemoryFreeClear. `index` is a by-value parameter, so the
// caller's own pointer is left unchanged and must not be used afterwards.
static void destroyTupleIndex(int32_t* index) { taosMemoryFreeClear(index); }
H
Haojun Liao 已提交
859

H
Haojun Liao 已提交
860
/**
 * Sort the rows of pDataBlock in place.
 *
 * @param pDataBlock  block to sort; must not be NULL
 * @param pOrderInfo  array of SBlockOrderInfo describing the sort columns; must not be NULL.
 *                    The pColData member of every entry is overwritten on the general path.
 * @return            TSDB_CODE_SUCCESS, or an error code (also stored in terrno) when a scratch
 *                    allocation or the row re-assignment fails; the block is left unmodified in
 *                    that case.
 */
int32_t blockDataSort(SSDataBlock* pDataBlock, SArray* pOrderInfo) {
  ASSERT(pDataBlock != NULL && pOrderInfo != NULL);
  if (pDataBlock->info.rows <= 1) {
    return TSDB_CODE_SUCCESS;
  }

  uint32_t rows = pDataBlock->info.rows;

  bool sortColumnHasNull = false;
  bool varTypeSort = false;

  for (int32_t i = 0; i < taosArrayGetSize(pOrderInfo); ++i) {
    SBlockOrderInfo* pInfo = taosArrayGet(pOrderInfo, i);

    SColumnInfoData* pColInfoData = taosArrayGet(pDataBlock->pDataBlock, pInfo->slotId);
    if (pColInfoData->hasNull) {
      sortColumnHasNull = true;
    }

    if (IS_VAR_DATA_TYPE(pColInfoData->info.type)) {
      varTypeSort = true;
    }
  }

  // Fast path: a block consisting of one fixed-length, NULL-free column sorted by that single
  // key can be sorted directly on its value buffer.
  if (taosArrayGetSize(pOrderInfo) == 1 && (!sortColumnHasNull) && pDataBlock->info.numOfCols == 1 &&
      (!varTypeSort)) {
    SColumnInfoData* pColInfoData = taosArrayGet(pDataBlock->pDataBlock, 0);
    SBlockOrderInfo* pOrder = taosArrayGet(pOrderInfo, 0);

    int64_t p0 = taosGetTimestampUs();

    __compar_fn_t fn = getKeyComparFunc(pColInfoData->info.type, pOrder->order);
    qsort(pColInfoData->pData, pDataBlock->info.rows, pColInfoData->info.bytes, fn);

    int64_t p1 = taosGetTimestampUs();
    uDebug("blockDataSort easy cost:%" PRId64 ", rows:%d\n", p1 - p0, pDataBlock->info.rows);

    return TSDB_CODE_SUCCESS;
  }

  // General path: sort a row-index permutation, materialise the permuted rows into scratch
  // columns, then swap the scratch buffers into the block.
  int32_t* index = createTupleIndex(rows);
  if (index == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return terrno;
  }

  int64_t p0 = taosGetTimestampUs();

  SSDataBlockSortHelper helper = {.pDataBlock = pDataBlock, .orderInfo = pOrderInfo};
  for (int32_t i = 0; i < taosArrayGetSize(helper.orderInfo); ++i) {
    struct SBlockOrderInfo* pInfo = taosArrayGet(helper.orderInfo, i);
    pInfo->pColData = taosArrayGet(pDataBlock->pDataBlock, pInfo->slotId);
  }

  taosqsort(index, rows, sizeof(int32_t), &helper, dataBlockCompar);

  int64_t p1 = taosGetTimestampUs();

  SColumnInfoData* pCols = createHelpColInfoData(pDataBlock);
  if (pCols == NULL) {
    destroyTupleIndex(index);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return terrno;
  }

  int64_t p2 = taosGetTimestampUs();

  int32_t code = blockDataAssign(pCols, pDataBlock, index);
  if (code != TSDB_CODE_SUCCESS) {
    // The scratch columns were never handed to the block, so they are released here.
    for (int32_t i = 0; i < pDataBlock->info.numOfCols; ++i) {
      if (IS_VAR_DATA_TYPE(pCols[i].info.type)) {
        taosMemoryFree(pCols[i].varmeta.offset);
      } else {
        taosMemoryFree(pCols[i].nullbitmap);
      }
      taosMemoryFree(pCols[i].pData);
    }
    taosMemoryFree(pCols);
    destroyTupleIndex(index);

    terrno = code;
    return code;
  }

  int64_t p3 = taosGetTimestampUs();

  copyBackToBlock(pDataBlock, pCols);
  int64_t p4 = taosGetTimestampUs();

  uDebug("blockDataSort complex sort:%" PRId64 ", create:%" PRId64 ", assign:%" PRId64 ", copyback:%" PRId64
         ", rows:%d\n",
         p1 - p0, p2 - p1, p3 - p2, p4 - p3, rows);
  destroyTupleIndex(index);

  return TSDB_CODE_SUCCESS;
}
947

H
Haojun Liao 已提交
948 949
// Sort entry used by the experimental *_rv sort routines: the original row position plus one
// sort-key slot that is viewed either as a pointer, a 64-bit integer or a double.
typedef struct SHelper {
  int32_t index;  // position of the row before sorting
  union {
    char*   pData;  // key accessed through a pointer (this is what dataBlockCompar_rv reads)
    int64_t i64;    // key stored inline as an integer
    double  d64;    // key stored inline as a double
  };
} SHelper;

/**
 * Build one SHelper per row whose pData points at that row's packed sort keys.
 *
 * The keys of all sort columns are copied back to back (in pOrderInfo order) into a key area
 * that lives in the same allocation as the returned array, directly behind the numOfRows
 * helpers. Releasing the returned pointer therefore releases the keys as well.
 *
 * As a side effect the pColData member of every SBlockOrderInfo entry is set to the matching
 * column of pBlock.
 *
 * NOTE(review): keys are copied as `info.bytes` raw bytes from `pData + bytes * row`, which only
 * matches fixed-length columns; variable-length sort columns are not supported here.
 *
 * @param numOfRows   number of rows to index
 * @param pOrderInfo  array of SBlockOrderInfo
 * @param pBlock      block providing the sort columns
 * @return            array of numOfRows helpers, or NULL when the allocation fails
 */
SHelper* createTupleIndex_rv(int32_t numOfRows, SArray* pOrderInfo, SSDataBlock* pBlock) {
  int32_t sortValLengthPerRow = 0;
  int32_t numOfCols = taosArrayGetSize(pOrderInfo);

  for (int32_t i = 0; i < numOfCols; ++i) {
    SBlockOrderInfo* pInfo = taosArrayGet(pOrderInfo, i);
    SColumnInfoData* pColInfo = taosArrayGet(pBlock->pDataBlock, pInfo->slotId);
    pInfo->pColData = pColInfo;
    sortValLengthPerRow += pColInfo->info.bytes;
  }

  // One allocation: [numOfRows helpers][numOfRows * sortValLengthPerRow key bytes].
  size_t helperBytes = (size_t)numOfRows * sizeof(SHelper);
  size_t keyBytes = (size_t)numOfRows * (size_t)sortValLengthPerRow;

  SHelper* phelper = taosMemoryCalloc(1, helperBytes + keyBytes);
  if (phelper == NULL) {
    return NULL;
  }

  char* buf = (char*)phelper + helperBytes;
  for (int32_t i = 0; i < numOfRows; ++i) {
    phelper[i].index = i;
    phelper[i].pData = buf + (size_t)sortValLengthPerRow * i;
  }

  int32_t offset = 0;
  for (int32_t i = 0; i < numOfCols; ++i) {
    SBlockOrderInfo* pInfo = taosArrayGet(pOrderInfo, i);
    int32_t          bytes = pInfo->pColData->info.bytes;

    // Copy the key bytes instead of storing into the i64 member: i64 shares storage with pData,
    // so writing it would destroy the pointer the comparator dereferences.
    for (int32_t j = 0; j < numOfRows; ++j) {
      memcpy(phelper[j].pData + offset, pInfo->pColData->pData + (size_t)bytes * j, bytes);
    }

    offset += bytes;
  }

  return phelper;
}

/**
 * Comparator for two SHelper entries used by the experimental *_rv sort.
 *
 * Only the int32_t found at the start of each entry's pData is compared, always in ascending
 * order. `param` is accepted for the comparator signature but is not consulted.
 *
 * TODO: multi-column keys, NULL ordering, descending order and non-INT types are not handled.
 *
 * @return -1, 0 or 1 when the left key is smaller than, equal to or greater than the right key
 */
int32_t dataBlockCompar_rv(const void* p1, const void* p2, const void* param) {
  (void)param;

  const SHelper* lhs = (const SHelper*)p1;
  const SHelper* rhs = (const SHelper*)p2;

  const int32_t lhsKey = *(int32_t*)lhs->pData;
  const int32_t rhsKey = *(int32_t*)rhs->pData;

  if (lhsKey < rhsKey) {
    return -1;
  }

  return (lhsKey == rhsKey) ? 0 : 1;
}

L
Liu Jicong 已提交
1051
// Placeholder: performs no work, ignores both arguments and always returns 0.
int32_t varColSort(SColumnInfoData* pColumnInfoData, SBlockOrderInfo* pOrder) { return 0; }
H
Haojun Liao 已提交
1052 1053

/**
 * Experimental variant of blockDataSort that sorts SHelper entries carrying the sort keys.
 *
 * The sorted helper order is converted into a row permutation, the rows are materialised into
 * scratch columns in that order and the scratch buffers are swapped into the block.
 *
 * @param pDataBlock  block to sort in place
 * @param pOrderInfo  array of SBlockOrderInfo describing the sort columns
 * @param nullFirst   currently not consulted by this implementation
 * @return            TSDB_CODE_SUCCESS, or an error code (also stored in terrno) on failure, in
 *                    which case the block is left unmodified
 */
int32_t blockDataSort_rv(SSDataBlock* pDataBlock, SArray* pOrderInfo, bool nullFirst) {
  // Nothing to reorder; also avoids zero-sized scratch allocations.
  if (pDataBlock->info.rows <= 1) {
    return TSDB_CODE_SUCCESS;
  }

  int64_t p0 = taosGetTimestampUs();

  SSDataBlockSortHelper helper = {.pDataBlock = pDataBlock, .orderInfo = pOrderInfo};

  uint32_t rows = pDataBlock->info.rows;
  SHelper* index = createTupleIndex_rv(rows, helper.orderInfo, pDataBlock);
  if (index == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return terrno;
  }

  taosqsort(index, rows, sizeof(SHelper), &helper, dataBlockCompar_rv);

  int64_t p1 = taosGetTimestampUs();

  // Flatten the sorted helpers into the plain permutation expected by blockDataAssign.
  int32_t*         order = taosMemoryCalloc(rows, sizeof(int32_t));
  SColumnInfoData* pCols = (order != NULL) ? createHelpColInfoData(pDataBlock) : NULL;
  if (order == NULL || pCols == NULL) {
    taosMemoryFree(order);
    taosMemoryFree(index);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return terrno;
  }

  for (uint32_t i = 0; i < rows; ++i) {
    order[i] = index[i].index;
  }

  int64_t p2 = taosGetTimestampUs();

  // Without this step the zero-filled scratch buffers would replace the block's data.
  int32_t code = blockDataAssign(pCols, pDataBlock, order);
  if (code != TSDB_CODE_SUCCESS) {
    for (int32_t i = 0; i < pDataBlock->info.numOfCols; ++i) {
      if (IS_VAR_DATA_TYPE(pCols[i].info.type)) {
        taosMemoryFree(pCols[i].varmeta.offset);
      } else {
        taosMemoryFree(pCols[i].nullbitmap);
      }
      taosMemoryFree(pCols[i].pData);
    }
    taosMemoryFree(pCols);
    taosMemoryFree(order);
    taosMemoryFree(index);

    terrno = code;
    return code;
  }

  int64_t p3 = taosGetTimestampUs();

  copyBackToBlock(pDataBlock, pCols);
  int64_t p4 = taosGetTimestampUs();

  uDebug("sort:%" PRId64 ", create:%" PRId64 ", assign:%" PRId64 ", copyback:%" PRId64 ", rows:%d\n", p1 - p0, p2 - p1,
         p3 - p2, p4 - p3, rows);

  taosMemoryFree(order);
  taosMemoryFree(index);
  return 0;
}

1094
/**
 * Reset a block to "no rows" without releasing its buffers: the row count becomes 0 and every
 * column is passed to colInfoDataCleanup together with the block's recorded capacity.
 */
void blockDataCleanup(SSDataBlock* pDataBlock) {
  pDataBlock->info.rows = 0;

  int32_t col = 0;
  while (col < pDataBlock->info.numOfCols) {
    SColumnInfoData* pCol = taosArrayGet(pDataBlock->pDataBlock, col);
    colInfoDataCleanup(pCol, pDataBlock->info.capacity);
    col += 1;
  }
}

1102 1103
/**
 * Resize the buffers of one column so that they can hold numOfRows rows.
 *
 * Variable-length columns get their offset table resized; fixed-length columns get their null
 * bitmap and value buffer resized. Newly added offset entries and bitmap bytes are zeroed.
 * Nothing happens when numOfRows is 0 or does not exceed existRows.
 *
 * @param pColumn    column to resize
 * @param existRows  number of rows already stored in the column
 * @param numOfRows  requested capacity in rows
 * @return           TSDB_CODE_SUCCESS or TSDB_CODE_OUT_OF_MEMORY; on failure the buffers that
 *                   were not yet resized keep their previous size
 */
int32_t colInfoDataEnsureCapacity(SColumnInfoData* pColumn, size_t existRows, uint32_t numOfRows) {
  if (0 == numOfRows || numOfRows <= existRows) {
    return TSDB_CODE_SUCCESS;
  }

  if (IS_VAR_DATA_TYPE(pColumn->info.type)) {
    char* tmp = taosMemoryRealloc(pColumn->varmeta.offset, sizeof(int32_t) * numOfRows);
    if (tmp == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pColumn->varmeta.offset = (int32_t*)tmp;
    memset(&pColumn->varmeta.offset[existRows], 0, sizeof(int32_t) * (numOfRows - existRows));
  } else {
    char* tmp = taosMemoryRealloc(pColumn->nullbitmap, BitmapLen(numOfRows));
    if (tmp == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    int32_t oldLen = BitmapLen(existRows);
    pColumn->nullbitmap = tmp;
    memset(&pColumn->nullbitmap[oldLen], 0, BitmapLen(numOfRows) - oldLen);

    // NULL-typed columns carry a bitmap only.
    if (pColumn->info.type == TSDB_DATA_TYPE_NULL) {
      return TSDB_CODE_SUCCESS;
    }

    assert(pColumn->info.bytes);

    // Widen before multiplying so that a large row count cannot wrap a 32-bit product.
    tmp = taosMemoryRealloc(pColumn->pData, (size_t)numOfRows * pColumn->info.bytes);
    if (tmp == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }

    pColumn->pData = tmp;
  }

  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
1141
/**
 * Reset the bookkeeping of one column without releasing its buffers.
 *
 * Variable-length columns have their payload length set to 0; fixed-length columns have the
 * null bitmap covering numOfRows rows cleared. A column whose bitmap was never allocated is
 * left untouched.
 *
 * @param pColumn    column to reset
 * @param numOfRows  number of rows the null bitmap is cleared for
 */
void colInfoDataCleanup(SColumnInfoData* pColumn, uint32_t numOfRows) {
  if (IS_VAR_DATA_TYPE(pColumn->info.type)) {
    pColumn->varmeta.length = 0;
  } else if (pColumn->nullbitmap != NULL) {
    memset(pColumn->nullbitmap, 0, BitmapLen(numOfRows));
  }
}

D
dapan1121 已提交
1149 1150
/**
 * Record numOfRows as the block's capacity and resize every column accordingly.
 *
 * A request for 0 rows is a no-op. The capacity field is written before the columns are
 * resized, and resizing stops at the first column that fails.
 *
 * @return TSDB_CODE_SUCCESS, or the error code reported by colInfoDataEnsureCapacity
 */
int32_t blockDataEnsureCapacity(SSDataBlock* pDataBlock, uint32_t numOfRows) {
  if (numOfRows == 0) {
    return TSDB_CODE_SUCCESS;
  }

  pDataBlock->info.capacity = numOfRows;

  const int32_t colCount = pDataBlock->info.numOfCols;
  for (int32_t col = 0; col < colCount; ++col) {
    SColumnInfoData* pCol = taosArrayGet(pDataBlock->pDataBlock, col);

    int32_t status = colInfoDataEnsureCapacity(pCol, pDataBlock->info.rows, numOfRows);
    if (status != 0) {
      return status;
    }
  }

  return TSDB_CODE_SUCCESS;
}

/**
 * Destroy a block: its contents are released through blockDestroyInner and then the block
 * structure itself is freed. Passing NULL is allowed.
 *
 * @return always NULL
 */
void* blockDataDestroy(SSDataBlock* pBlock) {
  if (pBlock != NULL) {
    blockDestroyInner(pBlock);
    taosMemoryFreeClear(pBlock);
  }

  return NULL;
}
1177

1178
SSDataBlock* createOneDataBlock(const SSDataBlock* pDataBlock, bool copyData) {
L
Liu Jicong 已提交
1179
  if (pDataBlock == NULL) {
1180 1181
    return NULL;
  }
1182

1183 1184
  int32_t numOfCols = pDataBlock->info.numOfCols;

wafwerar's avatar
wafwerar 已提交
1185
  SSDataBlock* pBlock = taosMemoryCalloc(1, sizeof(SSDataBlock));
1186
  pBlock->pDataBlock = taosArrayInit(numOfCols, sizeof(SColumnInfoData));
1187

1188
  pBlock->info.numOfCols = numOfCols;
1189
  pBlock->info.hasVarCol = pDataBlock->info.hasVarCol;
L
Liu Jicong 已提交
1190
  pBlock->info.rowSize = pDataBlock->info.rows;
1191

L
Liu Jicong 已提交
1192
  for (int32_t i = 0; i < numOfCols; ++i) {
1193 1194 1195 1196 1197 1198
    SColumnInfoData  colInfo = {0};
    SColumnInfoData* p = taosArrayGet(pDataBlock->pDataBlock, i);
    colInfo.info = p->info;
    taosArrayPush(pBlock->pDataBlock, &colInfo);
  }

1199 1200 1201 1202 1203
  if (copyData) {
    for (int32_t i = 0; i < numOfCols; ++i) {
      SColumnInfoData* pDst = taosArrayGet(pBlock->pDataBlock, i);
      SColumnInfoData* pSrc = taosArrayGet(pDataBlock->pDataBlock, i);

1204
      int32_t code = colInfoDataEnsureCapacity(pDst, 0, pDataBlock->info.rows);
1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215
      if (code != TSDB_CODE_SUCCESS) {
        return NULL;
      }

      colDataAssign(pDst, pSrc, pDataBlock->info.rows);
    }

    pBlock->info.rows = pDataBlock->info.rows;
    pBlock->info.capacity = pDataBlock->info.rows;
  }

1216 1217 1218 1219
  return pBlock;
}

/**
 * Number of rows of pBlock that fit into a page of pageSize bytes: the space left after the
 * serialized meta data divided by the serialized size of one row, truncated to an int32_t.
 */
size_t blockDataGetCapacityInRow(const SSDataBlock* pBlock, size_t pageSize) {
  return (int32_t)((pageSize - blockDataGetSerialMetaSize(pBlock)) /
                   blockDataGetSerialRowSize(pBlock));
}
H
Haojun Liao 已提交
1222

1223 1224
/**
 * Free the buffers owned by a column: the offset table of a variable-length column or the null
 * bitmap of a fixed-length one, followed by the value buffer. The SColumnInfoData structure
 * itself is not freed.
 */
void colDataDestroy(SColumnInfoData* pColData) {
  void* pMeta = IS_VAR_DATA_TYPE(pColData->info.type) ? (void*)pColData->varmeta.offset
                                                     : (void*)pColData->nullbitmap;

  taosMemoryFree(pMeta);
  taosMemoryFree(pColData->pData);
}

H
Haojun Liao 已提交
1233 1234 1235 1236
/**
 * Drop the first n bits of a bitmap in place, moving the remaining bits to the front.
 *
 * Bits move towards the most significant bit of lower-addressed bytes, i.e. bit k of the result
 * is bit k + n of the input when bits are counted from the MSB of byte 0. The shift is split
 * into a whole-byte part (n / 8) and a sub-byte part (n % 8); both are applied. Bytes that are
 * no longer covered by the remaining `total - n` bits are cleared.
 *
 * @param nullBitmap  bitmap holding at least BitmapLen(total) bytes
 * @param n           number of leading bits to drop; callers pass n < total
 * @param total       number of valid bits before the shift
 */
static void doShiftBitmap(char* nullBitmap, size_t n, size_t total) {
  const size_t len = BitmapLen(total);
  const size_t newLen = BitmapLen(total - n);

  const size_t   byteShift = n / 8;
  const uint32_t bitShift = (uint32_t)(n % 8);

  uint8_t* p = (uint8_t*)nullBitmap;

  if (bitShift == 0) {
    memmove(p, p + byteShift, newLen);
  } else {
    // Output byte i combines the low bits of source byte i + byteShift with the high bits of
    // its successor. Sources are always at or ahead of the write position, so in-place is safe.
    for (size_t i = 0; i < newLen; ++i) {
      const size_t src = i + byteShift;

      uint8_t v = (uint8_t)(p[src] << bitShift);
      if (src + 1 < len) {
        v |= (uint8_t)(p[src + 1] >> (8 - bitShift));
      }

      p[i] = v;
    }
  }

  // Clear the bytes behind the new end so stale flags cannot leak into rows written later.
  if (newLen < len) {
    memset(p + newLen, 0, len - newLen);
  }
}

/**
 * Remove the first n rows of a column that currently holds `total` rows.
 *
 * Variable-length columns: the offset table is shifted by n entries and the n vacated entries
 * at the end are zeroed; the payload buffer is not moved. Fixed-length columns: the value
 * buffer and the null bitmap are shifted by n rows.
 *
 * @param pColInfoData  column to trim
 * @param n             number of leading rows to drop; callers pass n < total
 * @param total         number of rows before trimming
 */
static void colDataTrimFirstNRows(SColumnInfoData* pColInfoData, size_t n, size_t total) {
  if (IS_VAR_DATA_TYPE(pColInfoData->info.type)) {
    // Sizes are in bytes: each offset entry is an int32_t.
    memmove(pColInfoData->varmeta.offset, &pColInfoData->varmeta.offset[n], (total - n) * sizeof(int32_t));
    memset(&pColInfoData->varmeta.offset[total - n], 0, n * sizeof(int32_t));
  } else {
    int32_t bytes = pColInfoData->info.bytes;
    memmove(pColInfoData->pData, ((char*)pColInfoData->pData + n * bytes), (total - n) * bytes);
    doShiftBitmap(pColInfoData->nullbitmap, n, total);
  }
}

L
Liu Jicong 已提交
1271
/**
 * Drop the first n rows of a block.
 *
 * n == 0 is a no-op. When n covers all rows the block is reset through blockDataCleanup;
 * otherwise every column is trimmed and the row count reduced by n.
 *
 * @return always TSDB_CODE_SUCCESS
 */
int32_t blockDataTrimFirstNRows(SSDataBlock* pBlock, size_t n) {
  if (n == 0) {
    return TSDB_CODE_SUCCESS;
  }

  if (pBlock->info.rows <= n) {
    blockDataCleanup(pBlock);
    return TSDB_CODE_SUCCESS;
  }

  int32_t col = 0;
  while (col < pBlock->info.numOfCols) {
    colDataTrimFirstNRows(taosArrayGet(pBlock->pDataBlock, col), n, pBlock->info.rows);
    ++col;
  }

  pBlock->info.rows -= n;
  return TSDB_CODE_SUCCESS;
}

H
Haojun Liao 已提交
1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314
int32_t tEncodeDataBlock(void** buf, const SSDataBlock* pBlock) {
  int64_t tbUid = pBlock->info.uid;
  int16_t numOfCols = pBlock->info.numOfCols;
  int16_t hasVarCol = pBlock->info.hasVarCol;
  int32_t rows = pBlock->info.rows;
  int32_t sz = taosArrayGetSize(pBlock->pDataBlock);

  int32_t tlen = 0;
  tlen += taosEncodeFixedI64(buf, tbUid);
  tlen += taosEncodeFixedI16(buf, numOfCols);
  tlen += taosEncodeFixedI16(buf, hasVarCol);
  tlen += taosEncodeFixedI32(buf, rows);
  tlen += taosEncodeFixedI32(buf, sz);
  for (int32_t i = 0; i < sz; i++) {
    SColumnInfoData* pColData = (SColumnInfoData*)taosArrayGet(pBlock->pDataBlock, i);
    tlen += taosEncodeFixedI16(buf, pColData->info.colId);
    tlen += taosEncodeFixedI16(buf, pColData->info.type);
    tlen += taosEncodeFixedI32(buf, pColData->info.bytes);

    if (IS_VAR_DATA_TYPE(pColData->info.type)) {
      tlen += taosEncodeBinary(buf, pColData->varmeta.offset, sizeof(int32_t) * rows);
    } else {
      tlen += taosEncodeBinary(buf, pColData->nullbitmap, BitmapLen(rows));
    }

    int32_t len = colDataGetLength(pColData, rows);
X
Xiaoyu Wang 已提交
1315
    tlen += taosEncodeFixedI32(buf, len);
H
Haojun Liao 已提交
1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339 1340 1341 1342 1343 1344 1345 1346 1347 1348 1349 1350

    tlen += taosEncodeBinary(buf, pColData->pData, len);
  }
  return tlen;
}

/**
 * Deserialize one block written by tEncodeDataBlock.
 *
 * pBlock->pDataBlock is replaced by a freshly initialised array with one SColumnInfoData per
 * encoded column; the per-column buffers are produced by taosDecodeBinary.
 *
 * @param buf     position in the encoded stream
 * @param pBlock  block to fill
 * @return        position in the stream directly behind the decoded block
 */
void* tDecodeDataBlock(const void* buf, SSDataBlock* pBlock) {
  int32_t sz;

  buf = taosDecodeFixedI64(buf, &pBlock->info.uid);
  buf = taosDecodeFixedI16(buf, &pBlock->info.numOfCols);
  buf = taosDecodeFixedI16(buf, &pBlock->info.hasVarCol);
  buf = taosDecodeFixedI32(buf, &pBlock->info.rows);
  buf = taosDecodeFixedI32(buf, &sz);
  pBlock->pDataBlock = taosArrayInit(sz, sizeof(SColumnInfoData));
  for (int32_t i = 0; i < sz; i++) {
    SColumnInfoData data = {0};
    buf = taosDecodeFixedI16(buf, &data.info.colId);
    buf = taosDecodeFixedI16(buf, &data.info.type);
    buf = taosDecodeFixedI32(buf, &data.info.bytes);

    const bool isVarType = IS_VAR_DATA_TYPE(data.info.type);
    if (isVarType) {
      buf = taosDecodeBinary(buf, (void**)&data.varmeta.offset, pBlock->info.rows * sizeof(int32_t));
    } else {
      buf = taosDecodeBinary(buf, (void**)&data.nullbitmap, BitmapLen(pBlock->info.rows));
    }

    int32_t len = 0;
    buf = taosDecodeFixedI32(buf, &len);
    buf = taosDecodeBinary(buf, (void**)&data.pData, len);

    if (isVarType) {
      // The payload length is the number of bytes decoded into pData (what the encoder wrote
      // as the length prefix), not the size of the offset table.
      data.varmeta.length = len;
      data.varmeta.allocLen = len;
    }

    taosArrayPush(pBlock->pDataBlock, &data);
  }
  return (void*)buf;
}
L
Liu Jicong 已提交
1352 1353 1354 1355 1356 1357 1358 1359 1360 1361 1362 1363 1364 1365

int32_t tEncodeDataBlocks(void** buf, const SArray* blocks) {
  int32_t tlen = 0;
  int32_t sz = taosArrayGetSize(blocks);
  tlen += taosEncodeFixedI32(buf, sz);

  for (int32_t i = 0; i < sz; i++) {
    SSDataBlock* pBlock = taosArrayGet(blocks, i);
    tlen += tEncodeDataBlock(buf, pBlock);
  }

  return tlen;
}

L
Liu Jicong 已提交
1366
/**
 * Deserialize an array of blocks written by tEncodeDataBlocks.
 *
 * @param buf     position in the encoded stream
 * @param blocks  receives a newly initialised array of SSDataBlock (stored by value)
 * @return        position in the stream directly behind the last decoded block
 */
void* tDecodeDataBlocks(const void* buf, SArray** blocks) {
  int32_t blockCount;
  buf = taosDecodeFixedI32(buf, &blockCount);

  *blocks = taosArrayInit(blockCount, sizeof(SSDataBlock));

  for (int32_t b = 0; b < blockCount; ++b) {
    SSDataBlock decoded = {0};
    buf = tDecodeDataBlock(buf, &decoded);
    taosArrayPush(*blocks, &decoded);
  }

  return (void*)buf;
}
L
Liu Jicong 已提交
1378 1379 1380 1381 1382 1383 1384 1385 1386 1387 1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414

/**
 * Format a timestamp as "YYYY-MM-DD HH:MM:SS.fraction" in local time.
 *
 * @param buf        output buffer; up to 35 bytes are produced by strftime and the fraction is
 *                   appended behind them
 * @param val        timestamp in units given by `precision`
 * @param precision  TSDB_TIME_PRECISION_NANO (9 fraction digits), TSDB_TIME_PRECISION_MICRO (6),
 *                   anything else is treated as milliseconds (3)
 * @return           buf
 */
static char* formatTimestamp(char* buf, int64_t val, int precision) {
  // Number of timestamp units per second for the requested precision.
  int32_t unitsPerSec = 1000;
  if (precision == TSDB_TIME_PRECISION_NANO) {
    unitsPerSec = 1000000000;
  } else if (precision == TSDB_TIME_PRECISION_MICRO) {
    unitsPerSec = 1000000;
  }

  time_t  tt = (time_t)(val / unitsPerSec);
  int32_t ms = val % unitsPerSec;

  /* Clamping negative seconds to 0 on every platform was disabled because it broke test cases
     such as select_with_tags.sim; on Windows a negative value may crash the local-time
     conversion, so the clamp is kept there until a better solution is found. */
#ifdef WINDOWS
  if (tt < 0) tt = 0;
#endif

  // Borrow one second so that the fractional part is never negative.
  if (tt <= 0 && ms < 0) {
    tt--;
    ms += unitsPerSec;
  }

  struct tm* ptm = taosLocalTime(&tt, NULL);
  size_t     pos = strftime(buf, 35, "%Y-%m-%d %H:%M:%S", ptm);

  char* fraction = buf + pos;
  if (precision == TSDB_TIME_PRECISION_NANO) {
    sprintf(fraction, ".%09d", ms);
  } else if (precision == TSDB_TIME_PRECISION_MICRO) {
    sprintf(fraction, ".%06d", ms);
  } else {
    sprintf(fraction, ".%03d", ms);
  }

  return buf;
}
H
Haojun Liao 已提交
1428

L
Liu Jicong 已提交
1429
void blockDebugShowData(const SArray* dataBlocks) {
L
Liu Jicong 已提交
1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448
  char    pBuf[128];
  int32_t sz = taosArrayGetSize(dataBlocks);
  for (int32_t i = 0; i < sz; i++) {
    SSDataBlock* pDataBlock = taosArrayGet(dataBlocks, i);
    int32_t      colNum = pDataBlock->info.numOfCols;
    int32_t      rows = pDataBlock->info.rows;
    for (int32_t j = 0; j < rows; j++) {
      printf("|");
      for (int32_t k = 0; k < colNum; k++) {
        SColumnInfoData* pColInfoData = taosArrayGet(pDataBlock->pDataBlock, k);
        void*            var = POINTER_SHIFT(pColInfoData->pData, j * pColInfoData->info.bytes);
        switch (pColInfoData->info.type) {
          case TSDB_DATA_TYPE_TIMESTAMP:
            formatTimestamp(pBuf, *(uint64_t*)var, TSDB_TIME_PRECISION_MILLI);
            printf(" %25s |", pBuf);
            break;
          case TSDB_DATA_TYPE_INT:
            printf(" %15d |", *(int32_t*)var);
            break;
L
Liu Jicong 已提交
1449 1450 1451
          case TSDB_DATA_TYPE_UINT:
            printf(" %15u |", *(uint32_t*)var);
            break;
L
Liu Jicong 已提交
1452 1453 1454
          case TSDB_DATA_TYPE_BIGINT:
            printf(" %15ld |", *(int64_t*)var);
            break;
L
Liu Jicong 已提交
1455 1456 1457
          case TSDB_DATA_TYPE_UBIGINT:
            printf(" %15lu |", *(uint64_t*)var);
            break;
L
Liu Jicong 已提交
1458 1459 1460 1461 1462 1463 1464
        }
      }
      printf("\n");
    }
  }
}

L
Liu Jicong 已提交
1465 1466 1467 1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528
SSubmitReq* tdBlockToSubmit(const SArray* pBlocks, const STSchema* pTSchema) {
  SSubmitReq* ret = NULL;

  // cal size
  int32_t cap = sizeof(SSubmitReq);
  int32_t sz = taosArrayGetSize(pBlocks);
  for (int32_t i = 0; i < sz; i++) {
    SSDataBlock* pDataBlock = taosArrayGet(pBlocks, i);
    int32_t      rows = pDataBlock->info.rows;
    // TODO min
    int32_t rowSize = pDataBlock->info.rowSize;
    int32_t maxLen = TD_ROW_MAX_BYTES_FROM_SCHEMA(pTSchema);
    cap += sizeof(SSubmitBlk) + rows * maxLen;
  }

  // assign data
  ret = taosMemoryCalloc(1, cap);
  ret->version = htonl(1);
  ret->length = htonl(cap - sizeof(SSubmitReq));
  ret->numOfBlocks = htonl(sz);

  void* submitBlk = POINTER_SHIFT(ret, sizeof(SSubmitReq));
  for (int32_t i = 0; i < sz; i++) {
    SSDataBlock* pDataBlock = taosArrayGet(pBlocks, i);

    SSubmitBlk* blkHead = submitBlk;
    blkHead->numOfRows = htons(pDataBlock->info.rows);
    blkHead->schemaLen = 0;
    blkHead->sversion = htonl(pTSchema->version);
    // TODO
    blkHead->suid = 0;
    blkHead->uid = htobe64(pDataBlock->info.uid);

    int32_t rows = pDataBlock->info.rows;
    int32_t maxLen = TD_ROW_MAX_BYTES_FROM_SCHEMA(pTSchema);
    /*blkHead->dataLen = htonl(rows * maxLen);*/
    blkHead->dataLen = 0;

    void*   blockData = POINTER_SHIFT(submitBlk, sizeof(SSubmitBlk));
    STSRow* rowData = blockData;

    for (int32_t j = 0; j < pDataBlock->info.rows; j++) {
      SRowBuilder rb = {0};
      tdSRowInit(&rb, pTSchema->version);
      tdSRowSetTpInfo(&rb, pTSchema->numOfCols, pTSchema->flen);
      tdSRowResetBuf(&rb, rowData);

      for (int32_t k = 0; k < pTSchema->numOfCols; k++) {
        const STColumn*  pColumn = &pTSchema->columns[k];
        SColumnInfoData* pColData = taosArrayGet(pDataBlock->pDataBlock, k);
        void*            data = colDataGetData(pColData, j);
        tdAppendColValToRow(&rb, pColumn->colId, pColumn->type, TD_VTYPE_NORM, data, true, pColumn->offset, k);
      }
      int32_t rowLen = TD_ROW_LEN(rowData);
      rowData = POINTER_SHIFT(rowData, rowLen);
      blkHead->dataLen += rowLen;
    }
    int32_t len = blkHead->dataLen;
    blkHead->dataLen = htonl(len);
    blkHead = POINTER_SHIFT(blkHead, len);
  }

  return ret;
}