“3ab9b88dd769d011cd1a88f93e8a38aa037f2641”上不存在“...mgmt/mgmt_snode/git@gitcode.net:taosdata/tdengine.git”
提交 ed6276bd 编写于 作者: M Minglei Jin

Merge branch 'feat/tsdb_refact' of https://github.com/taosdata/TDengine into feat/tsdb_refact

...@@ -24,3 +24,4 @@ if(${BUILD_WITH_TRAFT}) ...@@ -24,3 +24,4 @@ if(${BUILD_WITH_TRAFT})
endif(${BUILD_WITH_TRAFT}) endif(${BUILD_WITH_TRAFT})
add_subdirectory(tdev) add_subdirectory(tdev)
add_subdirectory(lz4)
add_executable(lz4_test "")
target_sources(lz4_test
PRIVATE
"main.c"
)
target_link_libraries(lz4_test lz4_static)
\ No newline at end of file
#include <stdio.h>
#include "lz4.h"
int main(int argc, char const *argv[]) {
printf("%d\n", LZ4_compressBound(1024));
return 0;
}
...@@ -101,17 +101,17 @@ typedef struct SColumnInfoData { ...@@ -101,17 +101,17 @@ typedef struct SColumnInfoData {
} SColumnInfoData; } SColumnInfoData;
typedef struct SQueryTableDataCond { typedef struct SQueryTableDataCond {
// STimeWindow twindow;
uint64_t suid; uint64_t suid;
int32_t order; // desc|asc order to iterate the data block int32_t order; // desc|asc order to iterate the data block
int32_t numOfCols; int32_t numOfCols;
SColumnInfo* colList; SColumnInfo* colList;
bool loadExternalRows; // load external rows or not int32_t type; // data block load type:
int32_t type; // data block load type:
int32_t numOfTWindows; int32_t numOfTWindows;
STimeWindow* twindows; STimeWindow* twindows;
int64_t startVersion; int32_t numOfTables; // number of tables
int64_t endVersion; uint64_t* uidList; // table uid list
int64_t startVersion; // start version
int64_t endVersion; // end version
} SQueryTableDataCond; } SQueryTableDataCond;
void* blockDataDestroy(SSDataBlock* pBlock); void* blockDataDestroy(SSDataBlock* pBlock);
......
...@@ -116,12 +116,11 @@ int32_t metaTbCursorNext(SMTbCursor *pTbCur); ...@@ -116,12 +116,11 @@ int32_t metaTbCursorNext(SMTbCursor *pTbCur);
// typedef struct STsdb STsdb; // typedef struct STsdb STsdb;
typedef struct STsdbReader STsdbReader; typedef struct STsdbReader STsdbReader;
#define BLOCK_LOAD_OFFSET_SEQ_ORDER 1 #define BLOCK_LOAD_OFFSET_ORDER 1
#define BLOCK_LOAD_TABLE_SEQ_ORDER 2 #define BLOCK_LOAD_TABLESEQ_ORDER 2
#define BLOCK_LOAD_TABLE_RR_ORDER 3 #define BLOCK_LOAD_EXTERN_ORDER 3
int32_t tsdbReaderOpen(SVnode *pVnode, SQueryTableDataCond *pCond, STableListInfo *tableInfoGroup, uint64_t qId, int32_t tsdbReaderOpen(SVnode* pVnode, SQueryTableDataCond* pCond, STableListInfo* pTableList, uint64_t qId, uint64_t taskId, STsdbReader** ppReader);
uint64_t taskId, STsdbReader **ppReader);
void tsdbReaderClose(STsdbReader *pReader); void tsdbReaderClose(STsdbReader *pReader);
bool tsdbNextDataBlock(STsdbReader *pReader); bool tsdbNextDataBlock(STsdbReader *pReader);
void tsdbRetrieveDataBlockInfo(STsdbReader *pReader, SDataBlockInfo *pDataBlockInfo); void tsdbRetrieveDataBlockInfo(STsdbReader *pReader, SDataBlockInfo *pDataBlockInfo);
......
...@@ -86,8 +86,8 @@ typedef struct STsdbFSState STsdbFSState; ...@@ -86,8 +86,8 @@ typedef struct STsdbFSState STsdbFSState;
#define TSDBROW_VERSION(ROW) (((ROW)->type == 0) ? (ROW)->version : (ROW)->pBlockData->aVersion[(ROW)->iRow]) #define TSDBROW_VERSION(ROW) (((ROW)->type == 0) ? (ROW)->version : (ROW)->pBlockData->aVersion[(ROW)->iRow])
#define TSDBROW_SVERSION(ROW) TD_ROW_SVER((ROW)->pTSRow) #define TSDBROW_SVERSION(ROW) TD_ROW_SVER((ROW)->pTSRow)
#define TSDBROW_KEY(ROW) ((TSDBKEY){.version = TSDBROW_VERSION(ROW), .ts = TSDBROW_TS(ROW)}) #define TSDBROW_KEY(ROW) ((TSDBKEY){.version = TSDBROW_VERSION(ROW), .ts = TSDBROW_TS(ROW)})
#define tsdbRowFromTSRow(VERSION, TSROW) ((TSDBROW){.type = 0, .version = (VERSION), .pTSRow = (TSROW)}); #define tsdbRowFromTSRow(VERSION, TSROW) ((TSDBROW){.type = 0, .version = (VERSION), .pTSRow = (TSROW)})
#define tsdbRowFromBlockData(BLOCKDATA, IROW) ((TSDBROW){.type = 1, .pBlockData = (BLOCKDATA), .iRow = (IROW)}); #define tsdbRowFromBlockData(BLOCKDATA, IROW) ((TSDBROW){.type = 1, .pBlockData = (BLOCKDATA), .iRow = (IROW)})
void tsdbRowGetColVal(TSDBROW *pRow, STSchema *pTSchema, int32_t iCol, SColVal *pColVal); void tsdbRowGetColVal(TSDBROW *pRow, STSchema *pTSchema, int32_t iCol, SColVal *pColVal);
int32_t tPutTSDBRow(uint8_t *p, TSDBROW *pRow); int32_t tPutTSDBRow(uint8_t *p, TSDBROW *pRow);
int32_t tGetTSDBRow(uint8_t *p, TSDBROW *pRow); int32_t tGetTSDBRow(uint8_t *p, TSDBROW *pRow);
...@@ -132,6 +132,7 @@ int32_t tCmprBlockIdx(void const *lhs, void const *rhs); ...@@ -132,6 +132,7 @@ int32_t tCmprBlockIdx(void const *lhs, void const *rhs);
void tColDataReset(SColData *pColData, int16_t cid, int8_t type); void tColDataReset(SColData *pColData, int16_t cid, int8_t type);
void tColDataClear(void *ph); void tColDataClear(void *ph);
int32_t tColDataAppendValue(SColData *pColData, SColVal *pColVal); int32_t tColDataAppendValue(SColData *pColData, SColVal *pColVal);
int32_t tColDataCopy(SColData *pColDataSrc, SColData *pColDataDest);
int32_t tColDataGetValue(SColData *pColData, int32_t iRow, SColVal *pColVal); int32_t tColDataGetValue(SColData *pColData, int32_t iRow, SColVal *pColVal);
int32_t tColDataPCmprFn(const void *p1, const void *p2); int32_t tColDataPCmprFn(const void *p1, const void *p2);
// SBlockData // SBlockData
...@@ -140,7 +141,10 @@ int32_t tColDataPCmprFn(const void *p1, const void *p2); ...@@ -140,7 +141,10 @@ int32_t tColDataPCmprFn(const void *p1, const void *p2);
int32_t tBlockDataInit(SBlockData *pBlockData); int32_t tBlockDataInit(SBlockData *pBlockData);
void tBlockDataReset(SBlockData *pBlockData); void tBlockDataReset(SBlockData *pBlockData);
void tBlockDataClear(SBlockData *pBlockData); void tBlockDataClear(SBlockData *pBlockData);
int32_t tBlockDataAddColData(SBlockData *pBlockData, int32_t iColData, SColData **ppColData);
int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTSchema); int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTSchema);
int32_t tBlockDataMerge(SBlockData *pBlockData1, SBlockData *pBlockData2, SBlockData *pBlockData);
int32_t tBlockDataCopy(SBlockData *pBlockDataSrc, SBlockData *pBlockDataDest);
// SDelIdx // SDelIdx
int32_t tPutDelIdx(uint8_t *p, void *ph); int32_t tPutDelIdx(uint8_t *p, void *ph);
int32_t tGetDelIdx(uint8_t *p, void *ph); int32_t tGetDelIdx(uint8_t *p, void *ph);
...@@ -179,6 +183,9 @@ bool tsdbTbDataIterNext(STbDataIter *pIter); ...@@ -179,6 +183,9 @@ bool tsdbTbDataIterNext(STbDataIter *pIter);
// tsdbFile.c ============================================================================================== // tsdbFile.c ==============================================================================================
typedef enum { TSDB_HEAD_FILE = 0, TSDB_DATA_FILE, TSDB_LAST_FILE, TSDB_SMA_FILE } EDataFileT; typedef enum { TSDB_HEAD_FILE = 0, TSDB_DATA_FILE, TSDB_LAST_FILE, TSDB_SMA_FILE } EDataFileT;
void tsdbDataFileName(STsdb *pTsdb, SDFileSet *pDFileSet, EDataFileT ftype, char fname[]); void tsdbDataFileName(STsdb *pTsdb, SDFileSet *pDFileSet, EDataFileT ftype, char fname[]);
bool tsdbFileIsSame(SDFileSet *pDFileSet1, SDFileSet *pDFileSet2, EDataFileT ftype);
int32_t tsdbUpdateDFileHdr(TdFilePtr pFD, SDFileSet *pSet, EDataFileT ftype);
int32_t tsdbDFileRollback(STsdb *pTsdb, SDFileSet *pSet, EDataFileT ftype);
int32_t tPutDataFileHdr(uint8_t *p, SDFileSet *pSet, EDataFileT ftype); int32_t tPutDataFileHdr(uint8_t *p, SDFileSet *pSet, EDataFileT ftype);
int32_t tPutDelFile(uint8_t *p, SDelFile *pDelFile); int32_t tPutDelFile(uint8_t *p, SDelFile *pDelFile);
int32_t tGetDelFile(uint8_t *p, SDelFile *pDelFile); int32_t tGetDelFile(uint8_t *p, SDelFile *pDelFile);
...@@ -201,7 +208,7 @@ SDFileSet *tsdbFSStateGetDFileSet(STsdbFSState *pState, int32_t fid); ...@@ -201,7 +208,7 @@ SDFileSet *tsdbFSStateGetDFileSet(STsdbFSState *pState, int32_t fid);
// SDataFWriter // SDataFWriter
int32_t tsdbDataFWriterOpen(SDataFWriter **ppWriter, STsdb *pTsdb, SDFileSet *pSet); int32_t tsdbDataFWriterOpen(SDataFWriter **ppWriter, STsdb *pTsdb, SDFileSet *pSet);
int32_t tsdbDataFWriterClose(SDataFWriter **ppWriter, int8_t sync); int32_t tsdbDataFWriterClose(SDataFWriter **ppWriter, int8_t sync);
int32_t tsdbUpdateDFileSetHeader(SDataFWriter *pWriter, uint8_t **ppBuf); int32_t tsdbUpdateDFileSetHeader(SDataFWriter *pWriter);
int32_t tsdbWriteBlockIdx(SDataFWriter *pWriter, SMapData *pMapData, uint8_t **ppBuf); int32_t tsdbWriteBlockIdx(SDataFWriter *pWriter, SMapData *pMapData, uint8_t **ppBuf);
int32_t tsdbWriteBlock(SDataFWriter *pWriter, SMapData *pMapData, uint8_t **ppBuf, SBlockIdx *pBlockIdx); int32_t tsdbWriteBlock(SDataFWriter *pWriter, SMapData *pMapData, uint8_t **ppBuf, SBlockIdx *pBlockIdx);
int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_t **ppBuf1, uint8_t **ppBuf2, int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_t **ppBuf1, uint8_t **ppBuf2,
...@@ -364,15 +371,18 @@ typedef struct { ...@@ -364,15 +371,18 @@ typedef struct {
int8_t type; int8_t type;
int8_t flag; // HAS_NONE|HAS_NULL|HAS_VALUE int8_t flag; // HAS_NONE|HAS_NULL|HAS_VALUE
int64_t offset; int64_t offset;
int64_t size; int64_t bsize; // bitmap size
int64_t csize; // compressed column value size
int64_t osize; // original column value size (only save for variant data type)
} SBlockCol; } SBlockCol;
typedef struct { typedef struct {
int64_t nRow; int64_t nRow;
int8_t cmprAlg; int8_t cmprAlg;
int64_t offset; int64_t offset;
int64_t ksize; int64_t vsize; // VERSION size
int64_t bsize; int64_t ksize; // TSKEY size
int64_t bsize; // total block size
SMapData mBlockCol; // SMapData<SBlockCol> SMapData mBlockCol; // SMapData<SBlockCol>
} SSubBlock; } SSubBlock;
...@@ -408,7 +418,6 @@ struct SColData { ...@@ -408,7 +418,6 @@ struct SColData {
int32_t *aOffset; int32_t *aOffset;
int32_t nData; int32_t nData;
uint8_t *pData; uint8_t *pData;
uint8_t *pBuf;
}; };
struct SBlockData { struct SBlockData {
......
...@@ -782,7 +782,13 @@ static int32_t tsdbCommitDiskData(SCommitter *pCommitter, SBlockIdx *oBlockIdx) ...@@ -782,7 +782,13 @@ static int32_t tsdbCommitDiskData(SCommitter *pCommitter, SBlockIdx *oBlockIdx)
if (code) goto _err; if (code) goto _err;
tBlockReset(pBlockN); tBlockReset(pBlockN);
pBlockN->last = 1; pBlockN->minKey = pBlockO->minKey;
pBlockN->maxKey = pBlockO->maxKey;
pBlockN->minVersion = pBlockO->minVersion;
pBlockN->maxVersion = pBlockO->maxVersion;
pBlockN->nRow = pBlockO->nRow;
pBlockN->last = pBlockO->last;
pBlockN->hasDup = pBlockO->hasDup;
code = tsdbWriteBlockData(pCommitter->pWriter, pBlockDataO, NULL, NULL, pBlockIdx, pBlockN, pCommitter->cmprAlg); code = tsdbWriteBlockData(pCommitter->pWriter, pBlockDataO, NULL, NULL, pBlockIdx, pBlockN, pCommitter->cmprAlg);
if (code) goto _err; if (code) goto _err;
...@@ -964,7 +970,7 @@ static int32_t tsdbCommitFileDataEnd(SCommitter *pCommitter) { ...@@ -964,7 +970,7 @@ static int32_t tsdbCommitFileDataEnd(SCommitter *pCommitter) {
if (code) goto _err; if (code) goto _err;
// update file header // update file header
code = tsdbUpdateDFileSetHeader(pCommitter->pWriter, NULL); code = tsdbUpdateDFileSetHeader(pCommitter->pWriter);
if (code) goto _err; if (code) goto _err;
// upsert SDFileSet // upsert SDFileSet
......
...@@ -171,7 +171,71 @@ _err: ...@@ -171,7 +171,71 @@ _err:
static int32_t tsdbApplyDFileSetChange(STsdbFS *pFS, SDFileSet *pFrom, SDFileSet *pTo) { static int32_t tsdbApplyDFileSetChange(STsdbFS *pFS, SDFileSet *pFrom, SDFileSet *pTo) {
int32_t code = 0; int32_t code = 0;
// TODO char fname[TSDB_FILENAME_LEN];
if (pFrom && pTo) {
// head
if (tsdbFileIsSame(pFrom, pTo, TSDB_HEAD_FILE)) {
ASSERT(0);
} else {
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_HEAD_FILE, fname);
taosRemoveFile(fname);
}
// data
if (tsdbFileIsSame(pFrom, pTo, TSDB_DATA_FILE)) {
if (pFrom->fData.size > pTo->fData.size) {
code = tsdbDFileRollback(pFS->pTsdb, pTo, TSDB_DATA_FILE);
if (code) goto _err;
}
} else {
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_DATA_FILE, fname);
taosRemoveFile(fname);
}
// last
if (tsdbFileIsSame(pFrom, pTo, TSDB_LAST_FILE)) {
if (pFrom->fLast.size > pTo->fLast.size) {
code = tsdbDFileRollback(pFS->pTsdb, pTo, TSDB_LAST_FILE);
if (code) goto _err;
}
} else {
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_LAST_FILE, fname);
taosRemoveFile(fname);
}
// sma
if (tsdbFileIsSame(pFrom, pTo, TSDB_SMA_FILE)) {
if (pFrom->fSma.size > pTo->fSma.size) {
code = tsdbDFileRollback(pFS->pTsdb, pTo, TSDB_SMA_FILE);
if (code) goto _err;
}
} else {
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_SMA_FILE, fname);
taosRemoveFile(fname);
}
} else if (pFrom) {
// head
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_HEAD_FILE, fname);
taosRemoveFile(fname);
// data
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_DATA_FILE, fname);
taosRemoveFile(fname);
// last
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_LAST_FILE, fname);
taosRemoveFile(fname);
// fsm
tsdbDataFileName(pFS->pTsdb, pFrom, TSDB_SMA_FILE, fname);
taosRemoveFile(fname);
}
return code;
_err:
tsdbError("vgId:%d tsdb apply disk file set change failed since %s", TD_VID(pFS->pTsdb->pVnode), tstrerror(code));
return code; return code;
} }
......
...@@ -120,6 +120,107 @@ void tsdbDataFileName(STsdb *pTsdb, SDFileSet *pDFileSet, EDataFileT ftype, char ...@@ -120,6 +120,107 @@ void tsdbDataFileName(STsdb *pTsdb, SDFileSet *pDFileSet, EDataFileT ftype, char
} }
} }
bool tsdbFileIsSame(SDFileSet *pDFileSet1, SDFileSet *pDFileSet2, EDataFileT ftype) {
if (pDFileSet1->diskId.level != pDFileSet2->diskId.level || pDFileSet1->diskId.id != pDFileSet2->diskId.id) {
return false;
}
switch (ftype) {
case TSDB_HEAD_FILE:
return pDFileSet1->fHead.commitID == pDFileSet2->fHead.commitID;
case TSDB_DATA_FILE:
return pDFileSet1->fData.commitID == pDFileSet2->fData.commitID;
case TSDB_LAST_FILE:
return pDFileSet1->fLast.commitID == pDFileSet2->fLast.commitID;
case TSDB_SMA_FILE:
return pDFileSet1->fSma.commitID == pDFileSet2->fSma.commitID;
default:
ASSERT(0);
break;
}
}
int32_t tsdbUpdateDFileHdr(TdFilePtr pFD, SDFileSet *pSet, EDataFileT ftype) {
int32_t code = 0;
int64_t n;
char hdr[TSDB_FHDR_SIZE];
memset(hdr, 0, TSDB_FHDR_SIZE);
tPutDataFileHdr(hdr, pSet, ftype);
taosCalcChecksumAppend(0, hdr, TSDB_FHDR_SIZE);
n = taosLSeekFile(pFD, 0, SEEK_SET);
if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _exit;
}
n = taosWriteFile(pFD, hdr, TSDB_FHDR_SIZE);
if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _exit;
}
_exit:
return code;
}
int32_t tsdbDFileRollback(STsdb *pTsdb, SDFileSet *pSet, EDataFileT ftype) {
int32_t code = 0;
int64_t size;
TdFilePtr pFD;
char fname[TSDB_FILENAME_LEN];
tsdbDataFileName(pTsdb, pSet, ftype, fname);
// open
pFD = taosOpenFile(fname, TD_FILE_WRITE);
if (pFD == NULL) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// truncate
switch (ftype) {
case TSDB_HEAD_FILE:
size = pSet->fHead.size;
break;
case TSDB_DATA_FILE:
size = pSet->fData.size;
break;
case TSDB_LAST_FILE:
size = pSet->fLast.size;
break;
case TSDB_SMA_FILE:
size = pSet->fSma.size;
break;
default:
ASSERT(0);
}
if (taosFtruncateFile(pFD, size) < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// update header
code = tsdbUpdateDFileHdr(pFD, pSet, ftype);
if (code) goto _err;
// sync
if (taosFsyncFile(pFD) < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// close
taosCloseFile(&pFD);
return code;
_err:
return code;
}
int32_t tPutDataFileHdr(uint8_t *p, SDFileSet *pSet, EDataFileT ftype) { int32_t tPutDataFileHdr(uint8_t *p, SDFileSet *pSet, EDataFileT ftype) {
int32_t n = 0; int32_t n = 0;
......
...@@ -14,7 +14,6 @@ ...@@ -14,7 +14,6 @@
*/ */
#include "tsdb.h" #include "tsdb.h"
#define EXTRA_BYTES 2
#define ASCENDING_TRAVERSE(o) (o == TSDB_ORDER_ASC) #define ASCENDING_TRAVERSE(o) (o == TSDB_ORDER_ASC)
#define QH_GET_NUM_OF_COLS(handle) ((size_t)(taosArrayGetSize((handle)->pColumns))) #define QH_GET_NUM_OF_COLS(handle) ((size_t)(taosArrayGetSize((handle)->pColumns)))
...@@ -24,11 +23,6 @@ ...@@ -24,11 +23,6 @@
.rows = (_block)->numOfRows, \ .rows = (_block)->numOfRows, \
.uid = (_checkInfo)->tableId}) .uid = (_checkInfo)->tableId})
enum {
TSDB_QUERY_TYPE_ALL = 1,
TSDB_QUERY_TYPE_LAST = 2,
};
enum { enum {
TSDB_CACHED_TYPE_NONE = 0, TSDB_CACHED_TYPE_NONE = 0,
TSDB_CACHED_TYPE_LASTROW = 1, TSDB_CACHED_TYPE_LASTROW = 1,
...@@ -41,7 +35,7 @@ typedef struct SQueryFilePos { ...@@ -41,7 +35,7 @@ typedef struct SQueryFilePos {
int32_t pos; int32_t pos;
int64_t lastKey; int64_t lastKey;
int32_t rows; int32_t rows;
bool mixBlock; bool composedBlock;
bool blockCompleted; bool blockCompleted;
STimeWindow win; STimeWindow win;
} SQueryFilePos; } SQueryFilePos;
...@@ -53,94 +47,137 @@ typedef struct SDataBlockLoadInfo { ...@@ -53,94 +47,137 @@ typedef struct SDataBlockLoadInfo {
SArray* pLoadedCols; SArray* pLoadedCols;
} SDataBlockLoadInfo; } SDataBlockLoadInfo;
typedef struct SLoadCompBlockInfo {
int32_t tid; /* table tid */
int32_t fileId;
} SLoadCompBlockInfo;
enum { enum {
CHECKINFO_CHOSEN_MEM = 0, CHECKINFO_CHOSEN_MEM = 0,
CHECKINFO_CHOSEN_IMEM = 1, CHECKINFO_CHOSEN_IMEM = 1,
CHECKINFO_CHOSEN_BOTH = 2 // for update=2(merge case) CHECKINFO_CHOSEN_BOTH = 2 // for update=2(merge case)
}; };
typedef struct STableCheckInfo { typedef struct STableBlockScanInfo {
uint64_t suid; uint64_t uid;
uint64_t tableId; TSKEY lastKey;
TSKEY lastKey; SBlockIdx blockIdx;
SArray* pBlockList; // block data index list
// SBlockInfo* pCompInfo; // SBlockInfo* pCompInfo;
int32_t compSize; // int32_t compSize;
int32_t numOfBlocks : 29; // number of qualified data blocks not the original blocks // int32_t numOfBlocks : 29; // number of qualified data blocks not the original blocks
uint8_t chosen : 2; // indicate which iterator should move forward uint8_t chosen : 2; // indicate which iterator should move forward
bool initBuf : 1; // whether to initialize the in-memory skip list iterator or not bool iterInit; // whether to initialize the in-memory skip list iterator or not
STbDataIter* iter; // mem buffer skip list iterator STbDataIter iter; // mem buffer skip list iterator
STbDataIter* iiter; // imem buffer skip list iterator STbDataIter iiter; // imem buffer skip list iterator
} STableCheckInfo; bool memHasVal;
bool imemHasVal;
typedef struct STableBlockInfo { } STableBlockScanInfo;
SBlock* compBlock;
STableCheckInfo* pTableCheckInfo; typedef struct SBlockOrderWrapper {
} STableBlockInfo; int64_t uid;
SBlock* pBlock;
} SBlockOrderWrapper;
typedef struct SBlockOrderSupporter { typedef struct SBlockOrderSupporter {
int32_t numOfTables; int32_t numOfTables;
STableBlockInfo** pDataBlockInfo; SBlockOrderWrapper** pDataBlockInfo;
int32_t* blockIndexArray; int32_t* indexPerTable;
int32_t* numOfBlocksPerTable; int32_t* numOfBlocksPerTable;
} SBlockOrderSupporter; } SBlockOrderSupporter;
typedef struct SIOCostSummary { typedef struct SIOCostSummary {
int64_t blockLoadTime; int64_t blockLoadTime;
int64_t statisInfoLoadTime; int64_t statisInfoLoadTime;
int64_t checkForNextTime; int64_t checkForNextTime;
int64_t headFileLoad; int64_t headFileLoad;
int64_t headFileLoadTime; int64_t headFileLoadTime;
} SIOCostSummary; } SIOCostSummary;
typedef struct SBlockLoadSuppInfo { typedef struct SBlockLoadSuppInfo {
SColumnDataAgg* pstatis; SColumnDataAgg* pstatis;
SColumnDataAgg** plist; SColumnDataAgg** plist;
SArray* defaultLoadColumn; // default load column int16_t* colIdList; // default load column
int32_t* slotIds; // colId to slotId int32_t* slotIds; // colId to slotId
} SBlockLoadSuppInfo; } SBlockLoadSuppInfo;
typedef struct SFileSetIter {
int32_t numOfFiles; // number of total files
int32_t index; // current accessed index in the list
SArray* pFileList; // data file list
} SFileSetIter;
typedef struct SFileDataBlockInfo {
int32_t tbBlockIdx; // index position in STableBlockScanInfo in order to check whether neighbor block overlaps with it
int64_t uid;
} SFileDataBlockInfo;
typedef struct SDataBlockIter {
int32_t numOfBlocks;
int32_t index;
SArray* blockList; // SArray<SFileDataBlockInfo>
} SDataBlockIter;
typedef struct SFileBlockDumpInfo {
int32_t totalRows;
int32_t rowIndex;
int64_t lastKey;
} SFileBlockDumpInfo;
typedef struct SComposedDataBlock {
bool composed;
int32_t rows;
} SComposedDataBlock;
typedef struct SReaderStatus {
SQueryFilePos cur; // current position
int32_t tableListIndex;
bool loadFromFile; // check file stage
bool initStartPos;
SHashObj* pTableMap; // SHash<STableBlockScanInfo>
int32_t realNumOfRows;
SFileBlockDumpInfo fBlockDumpInfo;
SBlockData fileBlockData;
SFileSetIter fileIter;
SDataBlockIter blockIter;
} SReaderStatus;
struct STsdbReader { struct STsdbReader {
STsdb* pTsdb; STsdb* pTsdb;
uint64_t suid; uint64_t suid;
int16_t order; int16_t order;
SQueryFilePos cur; // current position STimeWindow window; // the primary query time window that applies to all queries
STimeWindow window; // the primary query time window that applies to all queries SSDataBlock* pResBlock;
// SColumnDataAgg* statis; // query level statistics, only one table block statistics info exists at any time int32_t capacity;
// SColumnDataAgg** pstatis;// the ptr array list to return to caller SReaderStatus status;
int32_t numOfBlocks; char* idStr; // query info handle, for debug purpose
SArray* pColumns; // SArray<SColumnInfoData> int32_t type; // query type: 1. retrieve all data blocks, 2. retrieve direct prev|next rows
bool locateStart;
int32_t outputCapacity;
int32_t realNumOfRows;
SArray* pTableCheckInfo; // SArray<STableCheckInfo>
int32_t activeIndex;
bool checkFiles; // check file stage
int8_t cachelastrow; // check if last row cached
bool loadExternalRow; // load time window external data rows
bool currentLoadExternalRows; // current load external rows
int32_t loadType; // block load type
char* idStr; // query info handle, for debug purpose
int32_t type; // query type: retrieve all data blocks, 2. retrieve only last row, 3. retrieve direct prev|next rows
SDFileSet* pFileGroup;
// SFSIter fileIter;
// SReadH rhelper;
STableBlockInfo* pDataBlockInfo;
SDataCols* pDataCols; // in order to hold current file data block
int32_t allocSize; // allocated data block size
SDataBlockLoadInfo dataBlockLoadInfo; /* record current block load information */
SLoadCompBlockInfo compBlockLoadInfo; /* record current compblock information in SQueryAttr */
SBlockLoadSuppInfo suppInfo; SBlockLoadSuppInfo suppInfo;
SArray* prev; // previous row which is before than time window SArray* prev; // previous row which is before than time window
SArray* next; // next row which is after the query time window SArray* next; // next row which is after the query time window
SIOCostSummary cost; SIOCostSummary cost;
STSchema* pSchema; STSchema* pSchema;
SDataFReader* pFileReader;
int64_t startVersion;
int64_t endVersion;
#if 0
SFileBlockInfo* pDataBlockInfo;
SDataCols* pDataCols; // in order to hold current file data block
int32_t allocSize; // allocated data block size
SDataBlockLoadInfo dataBlockLoadInfo; /* record current block load information */
SLoadCompBlockInfo compBlockLoadInfo; /* record current compblock information in SQueryAttr */
// SDFileSet* pFileGroup;
// SFSIter fileIter;
// SReadH rhelper;
// SColumnDataAgg* statis; // query level statistics, only one table block statistics info exists at any time
// SColumnDataAgg** pstatis;// the ptr array list to return to caller
#endif
}; };
static SFileDataBlockInfo* getCurrentBlockInfo(SDataBlockIter* pBlockIter);
static int tsdbReadRowsFromCache(STableBlockScanInfo* pScanInfo, TSDBKEY maxKey, int32_t capacity, STsdbReader* pReader);
static TSDBROW* getValidRow(STbDataIter* pIter, bool* hasVal, STsdbReader* pReader);
static int32_t doLoadRowsOfIdenticalTsInFileBlock(SBlockData* pData, SFileBlockDumpInfo* pDumpInfo, int64_t ts, SRowMerger *pMerger,
STsdbReader* pReader, STSRow** pRow);
// static void tsdbInitDataBlockLoadInfo(SDataBlockLoadInfo* pBlockLoadInfo) { // static void tsdbInitDataBlockLoadInfo(SDataBlockLoadInfo* pBlockLoadInfo) {
// pBlockLoadInfo->slot = -1; // pBlockLoadInfo->slot = -1;
// pBlockLoadInfo->uid = 0; // pBlockLoadInfo->uid = 0;
...@@ -152,70 +189,50 @@ struct STsdbReader { ...@@ -152,70 +189,50 @@ struct STsdbReader {
// pCompBlockLoadInfo->fileId = -1; // pCompBlockLoadInfo->fileId = -1;
// } // }
// static SArray* getColumnIdList(STsdbReader* pTsdbReadHandle) { static int32_t setColumnIdList(STsdbReader* pReader, SSDataBlock* pBlock) {
// size_t numOfCols = QH_GET_NUM_OF_COLS(pTsdbReadHandle); size_t numOfCols = taosArrayGetSize(pBlock->pDataBlock);
// assert(numOfCols <= TSDB_MAX_COLUMNS); pReader->suppInfo.colIdList = taosMemoryCalloc(numOfCols, sizeof(int16_t));
if (pReader->suppInfo.colIdList == NULL) {
// SArray* pIdList = taosArrayInit(numOfCols, sizeof(int16_t)); return TSDB_CODE_OUT_OF_MEMORY;
// for (int32_t i = 0; i < numOfCols; ++i) { }
// SColumnInfoData* pCol = taosArrayGet(pTsdbReadHandle->pColumns, i);
// taosArrayPush(pIdList, &pCol->info.colId);
// }
// return pIdList;
// }
// static SArray* getDefaultLoadColumns(STsdbReader* pTsdbReadHandle, bool loadTS) {
// SArray* pLocalIdList = getColumnIdList(pTsdbReadHandle);
// // check if the primary time stamp column needs to load
// int16_t colId = *(int16_t*)taosArrayGet(pLocalIdList, 0);
// // the primary timestamp column does not be included in the the specified load column list, add it
// if (loadTS && colId != PRIMARYKEY_TIMESTAMP_COL_ID) {
// int16_t columnId = PRIMARYKEY_TIMESTAMP_COL_ID;
// taosArrayInsert(pLocalIdList, 0, &columnId);
// }
// return pLocalIdList;
// }
static SArray* createCheckInfoFromTableGroup(STsdbReader* pTsdbReadHandle, STableListInfo* pTableList) {
// size_t tableSize = taosArrayGetSize(pTableList->pTableList);
// assert(tableSize >= 1);
// // allocate buffer in order to load data blocks from file
// SArray* pTableCheckInfo = taosArrayInit(tableSize, sizeof(STableCheckInfo));
// if (pTableCheckInfo == NULL) {
// return NULL;
// }
// // todo apply the lastkey of table check to avoid to load header file
// for (int32_t j = 0; j < tableSize; ++j) {
// STableKeyInfo* pKeyInfo = (STableKeyInfo*)taosArrayGet(pTableList->pTableList, j);
// STableCheckInfo info = {.lastKey = pKeyInfo->lastKey, .tableId = pKeyInfo->uid};
// info.suid = pTsdbReadHandle->suid;
// if (ASCENDING_TRAVERSE(pTsdbReadHandle->order)) {
// if (info.lastKey == INT64_MIN || info.lastKey < pTsdbReadHandle->window.skey) {
// info.lastKey = pTsdbReadHandle->window.skey;
// }
// assert(info.lastKey >= pTsdbReadHandle->window.skey && info.lastKey <= pTsdbReadHandle->window.ekey); for (int32_t i = 0; i < numOfCols; ++i) {
// } else { SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, i);
// info.lastKey = pTsdbReadHandle->window.skey; pReader->suppInfo.colIdList[i] = pCol->info.colId;
// } }
// taosArrayPush(pTableCheckInfo, &info); return TSDB_CODE_SUCCESS;
// tsdbDebug("%p check table uid:%" PRId64 " from lastKey:%" PRId64 " %s", pTsdbReadHandle, info.tableId, }
// info.lastKey,
// pTsdbReadHandle->idStr);
// }
// // TODO group table according to the tag value. static SHashObj* createDataBlockScanInfo(STsdbReader* pTsdbReader, const uint64_t* idList, int32_t numOfTables) {
// taosArraySort(pTableCheckInfo, tsdbCheckInfoCompar); ASSERT(numOfTables >= 1);
// return pTableCheckInfo;
return NULL; // allocate buffer in order to load data blocks from file
// todo use simple hash instead
SHashObj* pTableMap = taosHashInit(numOfTables, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_NO_LOCK);
if (pTableMap == NULL) {
return NULL;
}
// todo apply the lastkey of table check to avoid to load header file
for (int32_t j = 0; j < numOfTables; ++j) {
STableBlockScanInfo info = {.lastKey = 0, .uid = idList[j]};
if (ASCENDING_TRAVERSE(pTsdbReader->order)) {
if (info.lastKey == INT64_MIN || info.lastKey < pTsdbReader->window.skey) {
info.lastKey = pTsdbReader->window.skey;
}
ASSERT(info.lastKey >= pTsdbReader->window.skey && info.lastKey <= pTsdbReader->window.ekey);
} else {
info.lastKey = pTsdbReader->window.skey;
}
taosHashPut(pTableMap, &info.uid, sizeof(uint64_t), &info, sizeof(info));
tsdbDebug("%p check table uid:%" PRId64 " from lastKey:%" PRId64 " %s", pTsdbReader, info.uid, info.lastKey,
pTsdbReader->idStr);
}
return pTableMap;
} }
// static void resetCheckInfo(STsdbReader* pTsdbReadHandle) { // static void resetCheckInfo(STsdbReader* pTsdbReadHandle) {
...@@ -224,7 +241,7 @@ static SArray* createCheckInfoFromTableGroup(STsdbReader* pTsdbReadHandle, STabl ...@@ -224,7 +241,7 @@ static SArray* createCheckInfoFromTableGroup(STsdbReader* pTsdbReadHandle, STabl
// // todo apply the lastkey of table check to avoid to load header file // // todo apply the lastkey of table check to avoid to load header file
// for (int32_t i = 0; i < numOfTables; ++i) { // for (int32_t i = 0; i < numOfTables; ++i) {
// STableCheckInfo* pCheckInfo = (STableCheckInfo*)taosArrayGet(pTsdbReadHandle->pTableCheckInfo, i); // STableBlockScanInfo* pCheckInfo = (STableBlockScanInfo*)taosArrayGet(pTsdbReadHandle->pTableCheckInfo, i);
// pCheckInfo->lastKey = pTsdbReadHandle->window.skey; // pCheckInfo->lastKey = pTsdbReadHandle->window.skey;
// pCheckInfo->iter = tsdbTbDataIterDestroy(pCheckInfo->iter); // pCheckInfo->iter = tsdbTbDataIterDestroy(pCheckInfo->iter);
// pCheckInfo->iiter = tsdbTbDataIterDestroy(pCheckInfo->iiter); // pCheckInfo->iiter = tsdbTbDataIterDestroy(pCheckInfo->iiter);
...@@ -239,24 +256,24 @@ static SArray* createCheckInfoFromTableGroup(STsdbReader* pTsdbReadHandle, STabl ...@@ -239,24 +256,24 @@ static SArray* createCheckInfoFromTableGroup(STsdbReader* pTsdbReadHandle, STabl
// } // }
// // only one table, not need to sort again // // only one table, not need to sort again
// static SArray* createCheckInfoFromCheckInfo(STableCheckInfo* pCheckInfo, TSKEY skey, SArray** psTable) { // static SArray* createCheckInfoFromCheckInfo(STableBlockScanInfo* pCheckInfo, TSKEY skey, SArray** psTable) {
// SArray* pNew = taosArrayInit(1, sizeof(STableCheckInfo)); // SArray* pNew = taosArrayInit(1, sizeof(STableBlockScanInfo));
// STableCheckInfo info = {.lastKey = skey}; // STableBlockScanInfo info = {.lastKey = skey};
// info.tableId = pCheckInfo->tableId; // info.tableId = pCheckInfo->tableId;
// taosArrayPush(pNew, &info); // taosArrayPush(pNew, &info);
// return pNew; // return pNew;
// } // }
// static bool emptyQueryTimewindow(STsdbReader* pTsdbReadHandle) { static bool isEmptyQueryTimeWindow(STsdbReader* pTsdbReader) {
// assert(pTsdbReadHandle != NULL); ASSERT(pTsdbReader != NULL);
// STimeWindow* w = &pTsdbReadHandle->window; STimeWindow* w = &pTsdbReader->window;
// bool asc = ASCENDING_TRAVERSE(pTsdbReadHandle->order); bool asc = ASCENDING_TRAVERSE(pTsdbReader->order);
// return ((asc && w->skey > w->ekey) || (!asc && w->ekey > w->skey)); return ((asc && w->skey > w->ekey) || (!asc && w->ekey > w->skey));
// } }
// // Update the query time window according to the data time to live(TTL) information, in order to avoid to return // // Update the query time window according to the data time to live(TTL) information, in order to avoid to return
// // the expired data to client, even it is queried already. // // the expired data to client, even it is queried already.
...@@ -267,6 +284,7 @@ static SArray* createCheckInfoFromTableGroup(STsdbReader* pTsdbReadHandle, STabl ...@@ -267,6 +284,7 @@ static SArray* createCheckInfoFromTableGroup(STsdbReader* pTsdbReadHandle, STabl
// return now - (tsTickPerMin[pCfg->precision] * pCfg->keep2) + 1; // needs to add one tick // return now - (tsTickPerMin[pCfg->precision] * pCfg->keep2) + 1; // needs to add one tick
// } // }
// todo remove this
static void setQueryTimewindow(STsdbReader* pReader, SQueryTableDataCond* pCond, int32_t tWinIdx) { static void setQueryTimewindow(STsdbReader* pReader, SQueryTableDataCond* pCond, int32_t tWinIdx) {
// pReader->window = pCond->twindows[tWinIdx]; // pReader->window = pCond->twindows[tWinIdx];
...@@ -293,113 +311,140 @@ static void setQueryTimewindow(STsdbReader* pReader, SQueryTableDataCond* pCond, ...@@ -293,113 +311,140 @@ static void setQueryTimewindow(STsdbReader* pReader, SQueryTableDataCond* pCond,
// } // }
} }
static int32_t tsdbReaderCreate(SVnode* pVnode, SQueryTableDataCond* pCond, uint64_t qId, uint64_t taskId, static void checkResultSize(const SQueryTableDataCond* pCond, STsdbReader* pReader) {
STsdbReader** ppReader) { int32_t rowLen = 0;
int32_t code = 0; for (int32_t i = 0; i < pCond->numOfCols; ++i) {
STsdbReader* pReader = NULL; rowLen += pCond->colList[i].bytes;
}
// make sure the output SSDataBlock size be less than 2MB.
int32_t TWOMB = 2 * 1024 * 1024;
if (pReader->capacity * rowLen > TWOMB) {
pReader->capacity = TWOMB / rowLen;
}
}
// init file iterator
static int32_t initFileIterator(SFileSetIter* pIter, const STsdbFSState* pFState) {
pIter->index = -1;
pIter->numOfFiles = taosArrayGetSize(pFState->aDFileSet);
pIter->pFileList = taosArrayDup(pFState->aDFileSet);
return TSDB_CODE_SUCCESS;
}
static void resetDataBlockIterator(SDataBlockIter* pIter) {
pIter->numOfBlocks = -1;
}
static bool nextFilesetIterator(SFileSetIter* pIter, int32_t order, STsdbReader* pReader) {
if (pIter->index >= pIter->numOfFiles) {
return false;
}
pIter->index += 1;
// check file the time range of coverage
STimeWindow win = {0};
SDFileSet *pDFile = (SDFileSet *)taosArrayGet(pIter->pFileList, pIter->index);
// alloc int32_t code = tsdbDataFReaderOpen(&pReader->pFileReader, pReader->pTsdb, pDFile);
pReader = (STsdbReader*)taosMemoryCalloc(1, sizeof(*pReader)); if (code != TSDB_CODE_SUCCESS) {
goto _err;
}
// tsdbGetFidKeyRange(pCfg->days, pCfg->precision, pTsdbReadHandle->pFileGroup->fid, &win.skey, &win.ekey);
// current file are not overlapped with query time window, ignore remain files
if ((ASCENDING_TRAVERSE(order) && win.skey > pReader->window.ekey) ||
(!ASCENDING_TRAVERSE(order) && win.ekey < pReader->window.ekey)) {
tsdbDebug("%p remain files are not qualified for qrange:%" PRId64 "-%" PRId64 ", ignore, %s", pReader,
pReader->window.skey, pReader->window.ekey, pReader->idStr);
return false;
}
_err:
return false;
}
static void initReaderStatus(SReaderStatus* pStatus) {
pStatus->cur.fid = INT32_MIN;
pStatus->cur.win = TSWINDOW_INITIALIZER;
pStatus->initStartPos = false;
pStatus->tableListIndex = 0; // current active table index
pStatus->loadFromFile = true;
}
static int32_t tsdbReaderCreate(SVnode* pVnode, SQueryTableDataCond* pCond, STsdbReader** ppReader, const char* idstr) {
int32_t code = 0;
STsdbReader* pReader = (STsdbReader*)taosMemoryCalloc(1, sizeof(*pReader));
if (pReader == NULL) { if (pReader == NULL) {
code = TSDB_CODE_OUT_OF_MEMORY; code = TSDB_CODE_OUT_OF_MEMORY;
goto _err; goto _end;
} }
pReader->pTsdb = pVnode->pTsdb; // TODO: pass in pTsdb directly
pReader->suid = pCond->suid;
pReader->order = pCond->order;
pReader->loadType = pCond->type;
pReader->loadExternalRow = pCond->loadExternalRows;
pReader->currentLoadExternalRows = pCond->loadExternalRows;
pReader->type = TSDB_QUERY_TYPE_ALL;
pReader->cur.fid = INT32_MIN;
pReader->cur.win = TSWINDOW_INITIALIZER;
pReader->checkFiles = true;
pReader->activeIndex = 0; // current active table index
pReader->allocSize = 0;
pReader->locateStart = false;
pReader->outputCapacity = 4096; //((STsdb*)tsdb)->config.maxRowsPerFileBlock;
// char buf[128] = {0};
// snprintf(buf, tListLen(buf), "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, qId);
// pReadHandle->idStr = strdup(buf);
// // if (tsdbInitReadH(&pReadHandle->rhelper, pReadHandle->pTsdb) != 0) {
// // goto _end;
// // }
initReaderStatus(&pReader->status);
pReader->pTsdb = pVnode->pTsdb;
pReader->suid = pCond->suid;
pReader->order = pCond->order;
pReader->capacity = 4096;
pReader->idStr = strdup(idstr);
pReader->startVersion= pCond->startVersion;
pReader->endVersion = pCond->endVersion;
// todo remove this
setQueryTimewindow(pReader, pCond, 0); setQueryTimewindow(pReader, pCond, 0);
if (pCond->numOfCols > 0) { if (pCond->numOfCols > 0) {
// int32_t rowLen = 0; checkResultSize(pCond, pReader);
// for (int32_t i = 0; i < pCond->numOfCols; ++i) {
// rowLen += pCond->colList[i].bytes; // allocate buffer in order to load data blocks from file
// } pReader->suppInfo.pstatis = taosMemoryCalloc(pCond->numOfCols, sizeof(SColumnDataAgg));
if (pReader->suppInfo.pstatis == NULL) {
// // make sure the output SSDataBlock size be less than 2MB. code = TSDB_CODE_OUT_OF_MEMORY;
// int32_t TWOMB = 2 * 1024 * 1024; goto _end;
// if (pReadHandle->outputCapacity * rowLen > TWOMB) { }
// pReadHandle->outputCapacity = TWOMB / rowLen;
// } // todo use new api refactor this
pReader->pResBlock = taosMemoryCalloc(1, sizeof(SSDataBlock));
// // allocate buffer in order to load data blocks from file if (pReader->pResBlock == NULL) {
// pReadHandle->suppInfo.pstatis = taosMemoryCalloc(pCond->numOfCols, sizeof(SColumnDataAgg)); code = TSDB_CODE_OUT_OF_MEMORY;
// if (pReadHandle->suppInfo.pstatis == NULL) { goto _end;
// goto _end; }
// }
pReader->pResBlock->pDataBlock = taosArrayInit(pCond->numOfCols, sizeof(SColumnInfoData));
// // todo: use list instead of array? for (int32_t i = 0; i < pCond->numOfCols; ++i) {
// pReadHandle->pColumns = taosArrayInit(pCond->numOfCols, sizeof(SColumnInfoData)); SColumnInfoData colInfo = {{0}, 0};
// if (pReadHandle->pColumns == NULL) { colInfo.info = pCond->colList[i];
// goto _end; taosArrayPush(pReader->pResBlock->pDataBlock, &colInfo);
// } }
// for (int32_t i = 0; i < pCond->numOfCols; ++i) { setColumnIdList(pReader, pReader->pResBlock);
// SColumnInfoData colInfo = {{0}, 0}; pReader->suppInfo.slotIds = taosMemoryCalloc(pCond->numOfCols, sizeof(int32_t));
// colInfo.info = pCond->colList[i]; pReader->suppInfo.plist = taosMemoryCalloc(pCond->numOfCols, POINTER_BYTES);
// int32_t code = colInfoDataEnsureCapacity(&colInfo, 0, pReadHandle->outputCapacity);
// if (code != TSDB_CODE_SUCCESS) {
// goto _end;
// }
// taosArrayPush(pReadHandle->pColumns, &colInfo);
// }
// pReadHandle->suppInfo.defaultLoadColumn = getDefaultLoadColumns(pReadHandle, true);
// size_t size = taosArrayGetSize(pReadHandle->suppInfo.defaultLoadColumn);
// pReadHandle->suppInfo.slotIds = taosMemoryCalloc(size, sizeof(int32_t));
// pReadHandle->suppInfo.plist = taosMemoryCalloc(size, POINTER_BYTES);
} }
// pReadHandle->pDataCols = tdNewDataCols(1000, pVnode->config.tsdbCfg.maxRows); // todo refactor
// if (pReadHandle->pDataCols == NULL) { STsdbFSState* pFState = pReader->pTsdb->fs->cState;
// tsdbError("%p failed to malloc buf for pDataCols, %s", pReadHandle, pReadHandle->idStr); initFileIterator(&pReader->status.fileIter, pFState);
// terrno = TSDB_CODE_TDB_OUT_OF_MEMORY; resetDataBlockIterator(&pReader->status.blockIter);
// goto _end;
// }
// tsdbInitDataBlockLoadInfo(&pReadHandle->dataBlockLoadInfo);
// tsdbInitCompBlockLoadInfo(&pReadHandle->compBlockLoadInfo);
// return (STsdbReader*)pReadHandle;
// _end: // no data in files, let's try buffer in memory
// tsdbReaderClose(pReadHandle); if (pReader->status.fileIter.numOfFiles == 0) {
// terrno = TSDB_CODE_TDB_OUT_OF_MEMORY; pReader->status.loadFromFile = false;
// return NULL; }
*ppReader = pReader; *ppReader = pReader;
return code; return code;
_err: _end:
// tsdbError(""); tsdbReaderClose(pReader);
*ppReader = NULL; *ppReader = NULL;
return code; return code;
} }
// static int32_t setCurrentSchema(SVnode* pVnode, STsdbReader* pTsdbReadHandle) { // static int32_t setCurrentSchema(SVnode* pVnode, STsdbReader* pTsdbReadHandle) {
// STableCheckInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, 0); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, 0);
// int32_t sversion = 1; // int32_t sversion = 1;
...@@ -463,7 +508,7 @@ _err: ...@@ -463,7 +508,7 @@ _err:
// // pTsdbReadHandle->pTableCheckInfo = destroyTableCheckInfo(pTsdbReadHandle->pTableCheckInfo); // // pTsdbReadHandle->pTableCheckInfo = destroyTableCheckInfo(pTsdbReadHandle->pTableCheckInfo);
// pTsdbReadHandle->pTableCheckInfo = NULL; // createCheckInfoFromTableGroup(pTsdbReadHandle, groupList, pMeta, // pTsdbReadHandle->pTableCheckInfo = NULL; // createDataBlockScanInfo(pTsdbReadHandle, groupList, pMeta,
// // &pTable); // // &pTable);
// if (pTsdbReadHandle->pTableCheckInfo == NULL) { // if (pTsdbReadHandle->pTableCheckInfo == NULL) {
// // tsdbReaderClose(pTsdbReadHandle); // // tsdbReaderClose(pTsdbReadHandle);
...@@ -484,7 +529,7 @@ _err: ...@@ -484,7 +529,7 @@ _err:
// return res; // return res;
// } // }
// static bool initTableMemIterator(STsdbReader* pHandle, STableCheckInfo* pCheckInfo) { // static bool initTableMemIterator(STsdbReader* pHandle, STableBlockScanInfo* pCheckInfo) {
// if (pCheckInfo->initBuf) { // if (pCheckInfo->initBuf) {
// return true; // return true;
// } // }
...@@ -566,12 +611,12 @@ _err: ...@@ -566,12 +611,12 @@ _err:
// return true; // return true;
// } // }
// static void destroyTableMemIterator(STableCheckInfo* pCheckInfo) { // static void destroyTableMemIterator(STableBlockScanInfo* pCheckInfo) {
// tsdbTbDataIterDestroy(pCheckInfo->iter); // tsdbTbDataIterDestroy(pCheckInfo->iter);
// tsdbTbDataIterDestroy(pCheckInfo->iiter); // tsdbTbDataIterDestroy(pCheckInfo->iiter);
// } // }
// static TSKEY extractFirstTraverseKey(STableCheckInfo* pCheckInfo, int32_t order, int32_t update, TDRowVerT maxVer) { // static TSKEY extractFirstTraverseKey(STableBlockScanInfo* pCheckInfo, int32_t order, int32_t update, TDRowVerT maxVer) {
// TSDBROW row = {0}; // TSDBROW row = {0};
// STSRow *rmem = NULL, *rimem = NULL; // STSRow *rmem = NULL, *rimem = NULL;
...@@ -621,7 +666,7 @@ _err: ...@@ -621,7 +666,7 @@ _err:
// } // }
// } // }
// static STSRow* getSRowInTableMem(STableCheckInfo* pCheckInfo, int32_t order, int32_t update, STSRow** extraRow, // static STSRow* getSRowInTableMem(STableBlockScanInfo* pCheckInfo, int32_t order, int32_t update, STSRow** extraRow,
// TDRowVerT maxVer) { // TDRowVerT maxVer) {
// TSDBROW row; // TSDBROW row;
// STSRow *rmem = NULL, *rimem = NULL; // STSRow *rmem = NULL, *rimem = NULL;
...@@ -685,7 +730,7 @@ _err: ...@@ -685,7 +730,7 @@ _err:
// } // }
// } // }
// static bool moveToNextRowInMem(STableCheckInfo* pCheckInfo) { // static bool moveToNextRowInMem(STableBlockScanInfo* pCheckInfo) {
// bool hasNext = false; // bool hasNext = false;
// if (pCheckInfo->chosen == CHECKINFO_CHOSEN_MEM) { // if (pCheckInfo->chosen == CHECKINFO_CHOSEN_MEM) {
// if (pCheckInfo->iter != NULL) { // if (pCheckInfo->iter != NULL) {
...@@ -729,7 +774,7 @@ _err: ...@@ -729,7 +774,7 @@ _err:
// assert(pHandle->activeIndex < size && pHandle->activeIndex >= 0 && size >= 1); // assert(pHandle->activeIndex < size && pHandle->activeIndex >= 0 && size >= 1);
// pHandle->cur.fid = INT32_MIN; // pHandle->cur.fid = INT32_MIN;
// STableCheckInfo* pCheckInfo = taosArrayGet(pHandle->pTableCheckInfo, pHandle->activeIndex); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pHandle->pTableCheckInfo, pHandle->activeIndex);
// if (!pCheckInfo->initBuf) { // if (!pCheckInfo->initBuf) {
// initTableMemIterator(pHandle, pCheckInfo); // initTableMemIterator(pHandle, pCheckInfo);
// } // }
...@@ -814,188 +859,154 @@ _err: ...@@ -814,188 +859,154 @@ _err:
// return midSlot; // return midSlot;
// } // }
// static int32_t loadBlockInfo(STsdbReader* pTsdbReadHandle, int32_t index, int32_t* numOfBlocks) { static int32_t doLoadBlockIndex(STsdbReader* pReader, SDataFReader* pFileReader, SArray* pIndexList) {
// int32_t code = 0; int32_t code = 0;
// STableCheckInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, index);
// pCheckInfo->numOfBlocks = 0;
// STable table = {.uid = pCheckInfo->tableId, .suid = pCheckInfo->suid};
// table.pSchema = pTsdbReadHandle->pSchema;
// if (tsdbSetReadTable(&pTsdbReadHandle->rhelper, &table) != TSDB_CODE_SUCCESS) {
// code = terrno;
// return code;
// }
// SBlockIdx* compIndex = pTsdbReadHandle->rhelper.pBlkIdx;
// // no data block in this file, try next file
// if (compIndex == NULL || compIndex->uid != pCheckInfo->tableId) {
// return 0; // no data blocks in the file belongs to pCheckInfo->pTable
// }
// if (pCheckInfo->compSize < (int32_t)compIndex->len) {
// assert(compIndex->len > 0);
// char* t = taosMemoryRealloc(pCheckInfo->pCompInfo, compIndex->len);
// if (t == NULL) {
// terrno = TSDB_CODE_TDB_OUT_OF_MEMORY;
// code = TSDB_CODE_TDB_OUT_OF_MEMORY;
// return code;
// }
// pCheckInfo->pCompInfo = (SBlockInfo*)t;
// pCheckInfo->compSize = compIndex->len;
// }
// if (tsdbLoadBlockInfo(&(pTsdbReadHandle->rhelper), (void*)(pCheckInfo->pCompInfo)) < 0) {
// return terrno;
// }
// SBlockInfo* pCompInfo = pCheckInfo->pCompInfo;
// TSKEY s = TSKEY_INITIAL_VAL, e = TSKEY_INITIAL_VAL;
// if (ASCENDING_TRAVERSE(pTsdbReadHandle->order)) {
// assert(pCheckInfo->lastKey <= pTsdbReadHandle->window.ekey &&
// pTsdbReadHandle->window.skey <= pTsdbReadHandle->window.ekey);
// } else {
// assert(pCheckInfo->lastKey >= pTsdbReadHandle->window.ekey &&
// pTsdbReadHandle->window.skey >= pTsdbReadHandle->window.ekey);
// }
// s = TMIN(pCheckInfo->lastKey, pTsdbReadHandle->window.ekey);
// e = TMAX(pCheckInfo->lastKey, pTsdbReadHandle->window.ekey);
// // discard the unqualified data block based on the query time window
// int32_t start = binarySearchForBlock(pCompInfo->blocks, compIndex->numOfBlocks, s, TSDB_ORDER_ASC);
// int32_t end = start;
// if (s > pCompInfo->blocks[start].maxKey.ts) {
// return 0;
// }
// // todo speedup the procedure of located end block
// while (end < (int32_t)compIndex->numOfBlocks && (pCompInfo->blocks[end].minKey.ts <= e)) {
// end += 1;
// }
// pCheckInfo->numOfBlocks = (end - start);
// if (start > 0) {
// memmove(pCompInfo->blocks, &pCompInfo->blocks[start], pCheckInfo->numOfBlocks * sizeof(SBlock));
// }
// (*numOfBlocks) += pCheckInfo->numOfBlocks;
// return 0;
// }
// static int32_t getFileCompInfo(STsdbReader* pTsdbReadHandle, int32_t* numOfBlocks) {
// // load all the comp offset value for all tables in this file
// int32_t code = TSDB_CODE_SUCCESS;
// *numOfBlocks = 0;
// pTsdbReadHandle->cost.headFileLoad += 1;
// int64_t s = taosGetTimestampUs();
// size_t numOfTables = 0; SMapData blockIdxMap;
// if (pTsdbReadHandle->loadType == BLOCK_LOAD_TABLE_SEQ_ORDER) { tMapDataReset(&blockIdxMap);
// code = loadBlockInfo(pTsdbReadHandle, pTsdbReadHandle->activeIndex, numOfBlocks);
// } else if (pTsdbReadHandle->loadType == BLOCK_LOAD_OFFSET_SEQ_ORDER) {
// numOfTables = taosArrayGetSize(pTsdbReadHandle->pTableCheckInfo);
// for (int32_t i = 0; i < numOfTables; ++i) { code = tsdbReadBlockIdx(pFileReader, &blockIdxMap, NULL);
// code = loadBlockInfo(pTsdbReadHandle, i, numOfBlocks); if (code != TSDB_CODE_SUCCESS) {
// if (code != TSDB_CODE_SUCCESS) { goto _err;
// int64_t e = taosGetTimestampUs(); }
// pTsdbReadHandle->cost.headFileLoadTime += (e - s); if (blockIdxMap.nItem == 0) {
// return code; return TSDB_CODE_SUCCESS;
// } }
// }
// } else {
// assert(0);
// }
// int64_t e = taosGetTimestampUs(); SBlockIdx blockIndex = {0};
// pTsdbReadHandle->cost.headFileLoadTime += (e - s); for (int32_t i = 0; i < blockIdxMap.nItem; ++i) {
// return code; code = tMapDataGetItemByIdx(&blockIdxMap, i, &blockIndex, tGetBlockIdx);
// } if (code != TSDB_CODE_SUCCESS) {
goto _err;
}
if (blockIndex.suid != pReader->suid) {
continue;
}
// this block belongs to a table that is not queried.
void* p = taosHashGet(pReader->status.pTableMap, &blockIndex.uid, sizeof(uint64_t));
if (p == NULL) {
continue;
}
if ((ASCENDING_TRAVERSE(pReader->order) &&
(blockIndex.minKey > pReader->window.ekey || blockIndex.maxKey < pReader->window.skey)) ||
(!ASCENDING_TRAVERSE(pReader->order) &&
(blockIndex.minKey > pReader->window.skey || blockIndex.maxKey < pReader->window.ekey))) {
continue;
}
STableBlockScanInfo* pScanInfo = p;
if (pScanInfo->pBlockList == NULL) {
pScanInfo->pBlockList = taosArrayInit(16, sizeof(SBlock));
}
taosArrayPush(pIndexList, &blockIndex);
}
// static int32_t doLoadFileDataBlock(STsdbReader* pTsdbReadHandle, SBlock* pBlock, STableCheckInfo* pCheckInfo, tMapDataClear(&blockIdxMap);
// int32_t slotIndex) { return TSDB_CODE_SUCCESS;
// int64_t st = taosGetTimestampUs();
// int32_t code = tdInitDataCols(pTsdbReadHandle->pDataCols, pTsdbReadHandle->pSchema); _err:
// if (code != TSDB_CODE_SUCCESS) { tMapDataClear(&blockIdxMap);
// tsdbError("%p failed to malloc buf for pDataCols, %s", pTsdbReadHandle, pTsdbReadHandle->idStr); return code;
// terrno = TSDB_CODE_TDB_OUT_OF_MEMORY; }
// goto _error;
// }
// code = tdInitDataCols(pTsdbReadHandle->rhelper.pDCols[0], pTsdbReadHandle->pSchema); static int32_t doLoadFileBlock(STsdbReader* pReader, SArray* pIndexList, uint32_t* numOfValidTables) {
// if (code != TSDB_CODE_SUCCESS) { size_t numOfTables = taosArrayGetSize(pIndexList);
// tsdbError("%p failed to malloc buf for rhelper.pDataCols[0], %s", pTsdbReadHandle, pTsdbReadHandle->idStr);
// terrno = TSDB_CODE_TDB_OUT_OF_MEMORY;
// goto _error;
// }
// code = tdInitDataCols(pTsdbReadHandle->rhelper.pDCols[1], pTsdbReadHandle->pSchema); *numOfValidTables = 0;
// if (code != TSDB_CODE_SUCCESS) {
// tsdbError("%p failed to malloc buf for rhelper.pDataCols[1], %s", pTsdbReadHandle, pTsdbReadHandle->idStr);
// terrno = TSDB_CODE_TDB_OUT_OF_MEMORY;
// goto _error;
// }
// int16_t* colIds = pTsdbReadHandle->suppInfo.defaultLoadColumn->pData; for(int32_t i = 0; i < numOfTables; ++i) {
SBlockIdx* pBlockIdx = taosArrayGet(pIndexList, i);
// int32_t ret = tsdbLoadBlockDataCols(&(pTsdbReadHandle->rhelper), pBlock, pCheckInfo->pCompInfo, colIds, SMapData mapData;
// (int)(QH_GET_NUM_OF_COLS(pTsdbReadHandle)), true); tMapDataReset(&mapData);
// if (ret != TSDB_CODE_SUCCESS) { tsdbReadBlock(pReader->pFileReader, pBlockIdx, &mapData, NULL);
// int32_t c = terrno;
// assert(c != TSDB_CODE_SUCCESS);
// goto _error;
// }
// SDataBlockLoadInfo* pBlockLoadInfo = &pTsdbReadHandle->dataBlockLoadInfo; STableBlockScanInfo* pScanInfo = taosHashGet(pReader->status.pTableMap, &pBlockIdx->uid, sizeof(int64_t));
ASSERT(pScanInfo->pBlockList == NULL || taosArrayGetSize(pScanInfo->pBlockList) == 0);
for (int32_t j = 0; j < mapData.nItem; ++j) {
SBlock block = {0};
// pBlockLoadInfo->fileGroup = pTsdbReadHandle->pFileGroup; int32_t code = tMapDataGetItemByIdx(&mapData, j, &block, tGetBlock);
// pBlockLoadInfo->slot = pTsdbReadHandle->cur.slot; if (code != TSDB_CODE_SUCCESS) {
// pBlockLoadInfo->uid = pCheckInfo->tableId; return code;
}
// SDataCols* pCols = pTsdbReadHandle->rhelper.pDCols[0]; if ((ASCENDING_TRAVERSE(pReader->order) &&
// assert(pCols->numOfRows != 0 && pCols->numOfRows <= pBlock->numOfRows); (block.minKey.ts > pReader->window.ekey || block.maxKey.ts < pReader->window.skey)) ||
(!ASCENDING_TRAVERSE(pReader->order) &&
(block.minKey.ts > pReader->window.skey || block.maxKey.ts < pReader->window.ekey))) {
continue;
}
// pBlock->numOfRows = pCols->numOfRows; void* p = taosArrayPush(pScanInfo->pBlockList, &block);
if (p == NULL) {
return TSDB_CODE_OUT_OF_MEMORY;
}
}
// // Convert from TKEY to TSKEY for primary timestamp column if current block has timestamp before if (pScanInfo->pBlockList != NULL && taosArrayGetSize(pScanInfo->pBlockList) > 0) {
// 1970-01-01T00:00:00Z if (pBlock->minKey.ts < 0 && colIds[0] == PRIMARYKEY_TIMESTAMP_COL_ID) { (*numOfValidTables) += 1;
// int64_t* src = pCols->cols[0].pData; }
// for (int32_t i = 0; i < pBlock->numOfRows; ++i) { }
// src[i] = tdGetKey(src[i]);
// }
// }
// int64_t elapsedTime = (taosGetTimestampUs() - st); return TSDB_CODE_SUCCESS;
// pTsdbReadHandle->cost.blockLoadTime += elapsedTime; }
// tsdbDebug("%p load file block into buffer, index:%d, brange:%" PRId64 "-%" PRId64 ", rows:%d, elapsed time:%" static int32_t doLoadFileBlockData(STsdbReader* pReader, SDataBlockIter* pBlockIter, STableBlockScanInfo* pBlockScanInfo, SBlockData* pBlockData) {
// PRId64 int64_t st = taosGetTimestampUs();
// " us, %s", int32_t numOfCols = taosArrayGetSize(pReader->pResBlock->pDataBlock);
// pTsdbReadHandle, slotIndex, pBlock->minKey.ts, pBlock->maxKey.ts, pBlock->numOfRows, elapsedTime,
// pTsdbReadHandle->idStr);
// return TSDB_CODE_SUCCESS;
// _error: SFileDataBlockInfo* pFBlock = getCurrentBlockInfo(pBlockIter);
// pBlock->numOfRows = 0; SBlock* pBlock = taosArrayGet(pBlockScanInfo->pBlockList, pFBlock->tbBlockIdx);
uint8_t *pb = NULL, *pb1 = NULL;
int32_t code = tsdbReadBlockData(pReader->pFileReader, &pBlockScanInfo->blockIdx, pBlock, pBlockData, /*pReader->suppInfo.colIdList, numOfCols, */&pb, &pb1);
if (code != TSDB_CODE_SUCCESS) {
goto _error;
}
// tsdbError("%p error occurs in loading file block, index:%d, brange:%" PRId64 "-%" PRId64 ", rows:%d, %s", /*
// pTsdbReadHandle, slotIndex, pBlock->minKey.ts, pBlock->maxKey.ts, pBlock->numOfRows, int32_t ret = tsdbLoadBlockDataCols(&(pReader->rhelper), pBlock, pCheckInfo->pCompInfo, colIds,
// pTsdbReadHandle->idStr); (int)(QH_GET_NUM_OF_COLS(pReader)), true);
// return terrno; if (ret != TSDB_CODE_SUCCESS) {
// } int32_t c = terrno;
assert(c != TSDB_CODE_SUCCESS);
goto _error;
}
SDataBlockLoadInfo* pBlockLoadInfo = &pReader->dataBlockLoadInfo;
pBlockLoadInfo->fileGroup = pReader->pFileGroup;
pBlockLoadInfo->slot = pReader->cur.slot;
pBlockLoadInfo->uid = pCheckInfo->tableId;
SDataCols* pCols = pReader->rhelper.pDCols[0];
assert(pCols->numOfRows != 0 && pCols->numOfRows <= pBlock->numOfRows);
pBlock->numOfRows = pCols->numOfRows;
*/
int64_t elapsedTime = (taosGetTimestampUs() - st);
pReader->cost.blockLoadTime += elapsedTime;
tsdbDebug("%p load file block into buffer, global index:%d, table index:%d, brange:%" PRId64 "-%" PRId64
", rows:%d, minVer:%" PRId64 ", maxVer:%" PRId64 ", elapsed time:%" PRId64 " us, %s",
pReader, pBlockIter->index, pFBlock->tbBlockIdx, pBlock->minKey.ts, pBlock->maxKey.ts, pBlockData->nRow,
pBlock->minVersion, pBlock->maxVersion, elapsedTime, pReader->idStr);
return TSDB_CODE_SUCCESS;
_error:
tsdbError("%p error occurs in loading file block, global index:%d, table index:%d, brange:%" PRId64 "-%" PRId64 ", rows:%d, %s",
pReader, pBlockIter->index, pFBlock->tbBlockIdx, pBlock->minKey.ts, pBlock->maxKey.ts, pBlock->nRow, pReader->idStr);
return code;
}
// static int32_t handleDataMergeIfNeeded(STsdbReader* pTsdbReadHandle, SBlock* pBlock, STableCheckInfo* pCheckInfo) { // static int32_t handleDataMergeIfNeeded(STsdbReader* pTsdbReadHandle, SBlock* pBlock, STableBlockScanInfo* pCheckInfo) {
// SQueryFilePos* cur = &pTsdbReadHandle->cur; // SQueryFilePos* cur = &pTsdbReadHandle->cur;
// STsdbCfg* pCfg = REPO_CFG(pTsdbReadHandle->pTsdb); // STsdbCfg* pCfg = REPO_CFG(pTsdbReadHandle->pTsdb);
// SDataBlockInfo binfo = GET_FILE_DATA_BLOCK_INFO(pCheckInfo, pBlock); // SDataBlockInfo binfo = GET_FILE_DATA_BLOCK_INFO(pCheckInfo, pBlock);
...@@ -1041,7 +1052,7 @@ _err: ...@@ -1041,7 +1052,7 @@ _err:
// } // }
// // return error, add test cases // // return error, add test cases
// if ((code = doLoadFileDataBlock(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot)) != TSDB_CODE_SUCCESS) { // if ((code = doLoadFileBlockData(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot)) != TSDB_CODE_SUCCESS) {
// return code; // return code;
// } // }
...@@ -1074,7 +1085,7 @@ _err: ...@@ -1074,7 +1085,7 @@ _err:
// // make sure to only load once // // make sure to only load once
// bool firstTimeExtract = ((cur->pos == 0 && ascScan) || (cur->pos == binfo.rows - 1 && (!ascScan))); // bool firstTimeExtract = ((cur->pos == 0 && ascScan) || (cur->pos == binfo.rows - 1 && (!ascScan)));
// if (pTsdbReadHandle->outputCapacity < binfo.rows && firstTimeExtract) { // if (pTsdbReadHandle->outputCapacity < binfo.rows && firstTimeExtract) {
// code = doLoadFileDataBlock(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot); // code = doLoadFileBlockData(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot);
// if (code != TSDB_CODE_SUCCESS) { // if (code != TSDB_CODE_SUCCESS) {
// return code; // return code;
// } // }
...@@ -1102,7 +1113,7 @@ _err: ...@@ -1102,7 +1113,7 @@ _err:
// return code; // return code;
// } // }
// static int32_t loadFileDataBlock(STsdbReader* pTsdbReadHandle, SBlock* pBlock, STableCheckInfo* pCheckInfo, // static int32_t loadFileDataBlock(STsdbReader* pTsdbReadHandle, SBlock* pBlock, STableBlockScanInfo* pCheckInfo,
// bool* exists) { // bool* exists) {
// SQueryFilePos* cur = &pTsdbReadHandle->cur; // SQueryFilePos* cur = &pTsdbReadHandle->cur;
// int32_t code = TSDB_CODE_SUCCESS; // int32_t code = TSDB_CODE_SUCCESS;
...@@ -1111,7 +1122,7 @@ _err: ...@@ -1111,7 +1122,7 @@ _err:
// if (asc) { // if (asc) {
// // query ended in/started from current block // // query ended in/started from current block
// if (pTsdbReadHandle->window.ekey < pBlock->maxKey.ts || pCheckInfo->lastKey > pBlock->minKey.ts) { // if (pTsdbReadHandle->window.ekey < pBlock->maxKey.ts || pCheckInfo->lastKey > pBlock->minKey.ts) {
// if ((code = doLoadFileDataBlock(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot)) != TSDB_CODE_SUCCESS) { // if ((code = doLoadFileBlockData(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot)) != TSDB_CODE_SUCCESS) {
// *exists = false; // *exists = false;
// return code; // return code;
// } // }
...@@ -1135,7 +1146,7 @@ _err: ...@@ -1135,7 +1146,7 @@ _err:
// } // }
// } else { // desc order, query ended in current block // } else { // desc order, query ended in current block
// if (pTsdbReadHandle->window.ekey > pBlock->minKey.ts || pCheckInfo->lastKey < pBlock->maxKey.ts) { // if (pTsdbReadHandle->window.ekey > pBlock->minKey.ts || pCheckInfo->lastKey < pBlock->maxKey.ts) {
// if ((code = doLoadFileDataBlock(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot)) != TSDB_CODE_SUCCESS) { // if ((code = doLoadFileBlockData(pTsdbReadHandle, pBlock, pCheckInfo, cur->slot)) != TSDB_CODE_SUCCESS) {
// *exists = false; // *exists = false;
// return code; // return code;
// } // }
...@@ -1531,7 +1542,7 @@ _err: ...@@ -1531,7 +1542,7 @@ _err:
// } // }
// } // }
// static void updateInfoAfterMerge(STsdbReader* pTsdbReadHandle, STableCheckInfo* pCheckInfo, int32_t numOfRows, // static void updateInfoAfterMerge(STsdbReader* pTsdbReadHandle, STableBlockScanInfo* pCheckInfo, int32_t numOfRows,
// int32_t endPos) { // int32_t endPos) {
// SQueryFilePos* cur = &pTsdbReadHandle->cur; // SQueryFilePos* cur = &pTsdbReadHandle->cur;
...@@ -1562,7 +1573,7 @@ _err: ...@@ -1562,7 +1573,7 @@ _err:
// } // }
// } // }
// static void copyAllRemainRowsFromFileBlock(STsdbReader* pTsdbReadHandle, STableCheckInfo* pCheckInfo, // static void copyAllRemainRowsFromFileBlock(STsdbReader* pTsdbReadHandle, STableBlockScanInfo* pCheckInfo,
// SDataBlockInfo* pBlockInfo, int32_t endPos) { // SDataBlockInfo* pBlockInfo, int32_t endPos) {
// SQueryFilePos* cur = &pTsdbReadHandle->cur; // SQueryFilePos* cur = &pTsdbReadHandle->cur;
...@@ -1648,7 +1659,7 @@ _err: ...@@ -1648,7 +1659,7 @@ _err:
// // only return the qualified data to client in terms of query time window, data rows in the same block but do not // // only return the qualified data to client in terms of query time window, data rows in the same block but do not
// // be included in the query time window will be discarded // // be included in the query time window will be discarded
// static void doMergeTwoLevelData(STsdbReader* pTsdbReadHandle, STableCheckInfo* pCheckInfo, SBlock* pBlock) { // static void doMergeTwoLevelData(STsdbReader* pTsdbReadHandle, STableBlockScanInfo* pCheckInfo, SBlock* pBlock) {
// SQueryFilePos* cur = &pTsdbReadHandle->cur; // SQueryFilePos* cur = &pTsdbReadHandle->cur;
// SDataBlockInfo blockInfo = GET_FILE_DATA_BLOCK_INFO(pCheckInfo, pBlock); // SDataBlockInfo blockInfo = GET_FILE_DATA_BLOCK_INFO(pCheckInfo, pBlock);
// STsdbCfg* pCfg = REPO_CFG(pTsdbReadHandle->pTsdb); // STsdbCfg* pCfg = REPO_CFG(pTsdbReadHandle->pTsdb);
...@@ -1926,192 +1937,176 @@ _err: ...@@ -1926,192 +1937,176 @@ _err:
// return midPos; // return midPos;
// } // }
// static void cleanBlockOrderSupporter(SBlockOrderSupporter* pSupporter, int32_t numOfTables) { static void cleanupBlockOrderSupporter(SBlockOrderSupporter* pSup) {
// taosMemoryFreeClear(pSupporter->numOfBlocksPerTable); taosMemoryFreeClear(pSup->numOfBlocksPerTable);
// taosMemoryFreeClear(pSupporter->blockIndexArray); taosMemoryFreeClear(pSup->indexPerTable);
// for (int32_t i = 0; i < numOfTables; ++i) {
// STableBlockInfo* pBlockInfo = pSupporter->pDataBlockInfo[i];
// taosMemoryFreeClear(pBlockInfo);
// }
// taosMemoryFreeClear(pSupporter->pDataBlockInfo);
// }
// static int32_t dataBlockOrderCompar(const void* pLeft, const void* pRight, void* param) {
// int32_t leftTableIndex = *(int32_t*)pLeft;
// int32_t rightTableIndex = *(int32_t*)pRight;
// SBlockOrderSupporter* pSupporter = (SBlockOrderSupporter*)param;
// int32_t leftTableBlockIndex = pSupporter->blockIndexArray[leftTableIndex];
// int32_t rightTableBlockIndex = pSupporter->blockIndexArray[rightTableIndex];
// if (leftTableBlockIndex > pSupporter->numOfBlocksPerTable[leftTableIndex]) {
// /* left block is empty */
// return 1;
// } else if (rightTableBlockIndex > pSupporter->numOfBlocksPerTable[rightTableIndex]) {
// /* right block is empty */
// return -1;
// }
// STableBlockInfo* pLeftBlockInfoEx = &pSupporter->pDataBlockInfo[leftTableIndex][leftTableBlockIndex];
// STableBlockInfo* pRightBlockInfoEx = &pSupporter->pDataBlockInfo[rightTableIndex][rightTableBlockIndex];
// // assert(pLeftBlockInfoEx->compBlock->offset != pRightBlockInfoEx->compBlock->offset);
// #if 0 // TODO: temporarily comment off requested by Dr. Liao
// if (pLeftBlockInfoEx->compBlock->offset == pRightBlockInfoEx->compBlock->offset &&
// pLeftBlockInfoEx->compBlock->last == pRightBlockInfoEx->compBlock->last) {
// tsdbError("error in header file, two block with same offset:%" PRId64,
// (int64_t)pLeftBlockInfoEx->compBlock->offset);
// }
// #endif
// return pLeftBlockInfoEx->compBlock->offset > pRightBlockInfoEx->compBlock->offset ? 1 : -1;
// }
// static int32_t createDataBlocksInfo(STsdbReader* pTsdbReadHandle, int32_t numOfBlocks, int32_t* numOfAllocBlocks) {
// size_t size = sizeof(STableBlockInfo) * numOfBlocks;
// if (pTsdbReadHandle->allocSize < size) {
// pTsdbReadHandle->allocSize = (int32_t)size;
// char* tmp = taosMemoryRealloc(pTsdbReadHandle->pDataBlockInfo, pTsdbReadHandle->allocSize);
// if (tmp == NULL) {
// return TSDB_CODE_TDB_OUT_OF_MEMORY;
// }
// pTsdbReadHandle->pDataBlockInfo = (STableBlockInfo*)tmp;
// }
// memset(pTsdbReadHandle->pDataBlockInfo, 0, size);
// *numOfAllocBlocks = numOfBlocks;
// // access data blocks according to the offset of each block in asc/desc order.
// int32_t numOfTables = (int32_t)taosArrayGetSize(pTsdbReadHandle->pTableCheckInfo);
// SBlockOrderSupporter sup = {0};
// sup.numOfTables = numOfTables;
// sup.numOfBlocksPerTable = taosMemoryCalloc(1, sizeof(int32_t) * numOfTables);
// sup.blockIndexArray = taosMemoryCalloc(1, sizeof(int32_t) * numOfTables);
// sup.pDataBlockInfo = taosMemoryCalloc(1, POINTER_BYTES * numOfTables);
// if (sup.numOfBlocksPerTable == NULL || sup.blockIndexArray == NULL || sup.pDataBlockInfo == NULL) {
// cleanBlockOrderSupporter(&sup, 0);
// return TSDB_CODE_TDB_OUT_OF_MEMORY;
// }
// int32_t cnt = 0;
// int32_t numOfQualTables = 0;
// for (int32_t j = 0; j < numOfTables; ++j) {
// STableCheckInfo* pTableCheck = (STableCheckInfo*)taosArrayGet(pTsdbReadHandle->pTableCheckInfo, j);
// if (pTableCheck->numOfBlocks <= 0) {
// continue;
// }
// SBlock* pBlock = pTableCheck->pCompInfo->blocks;
// sup.numOfBlocksPerTable[numOfQualTables] = pTableCheck->numOfBlocks;
// char* buf = taosMemoryMalloc(sizeof(STableBlockInfo) * pTableCheck->numOfBlocks);
// if (buf == NULL) {
// cleanBlockOrderSupporter(&sup, numOfQualTables);
// return TSDB_CODE_TDB_OUT_OF_MEMORY;
// }
// sup.pDataBlockInfo[numOfQualTables] = (STableBlockInfo*)buf; for (int32_t i = 0; i < pSup->numOfTables; ++i) {
SBlockOrderWrapper* pBlockInfo = pSup->pDataBlockInfo[i];
// for (int32_t k = 0; k < pTableCheck->numOfBlocks; ++k) { taosMemoryFreeClear(pBlockInfo);
// STableBlockInfo* pBlockInfo = &sup.pDataBlockInfo[numOfQualTables][k]; }
// pBlockInfo->compBlock = &pBlock[k];
// pBlockInfo->pTableCheckInfo = pTableCheck;
// cnt++;
// }
// numOfQualTables++;
// }
// assert(numOfBlocks == cnt);
// // since there is only one table qualified, blocks are not sorted
// if (numOfQualTables == 1) {
// memcpy(pTsdbReadHandle->pDataBlockInfo, sup.pDataBlockInfo[0], sizeof(STableBlockInfo) * numOfBlocks);
// cleanBlockOrderSupporter(&sup, numOfQualTables);
// tsdbDebug("%p create data blocks info struct completed for 1 table, %d blocks not sorted %s", pTsdbReadHandle, taosMemoryFreeClear(pSup->pDataBlockInfo);
// cnt, }
// pTsdbReadHandle->idStr);
// return TSDB_CODE_SUCCESS;
// }
// tsdbDebug("%p create data blocks info struct completed, %d blocks in %d tables %s", pTsdbReadHandle, cnt, static int32_t initBlockOrderSupporter(SBlockOrderSupporter* pSup, int32_t numOfTables) {
// numOfQualTables, pTsdbReadHandle->idStr); ASSERT(numOfTables >= 1);
// assert(cnt <= numOfBlocks && numOfQualTables <= numOfTables); // the pTableQueryInfo[j]->numOfBlocks may be 0 pSup->numOfBlocksPerTable = taosMemoryCalloc(1, sizeof(int32_t) * numOfTables);
// sup.numOfTables = numOfQualTables; pSup->indexPerTable = taosMemoryCalloc(1, sizeof(int32_t) * numOfTables);
pSup->pDataBlockInfo = taosMemoryCalloc(1, POINTER_BYTES * numOfTables);
// SMultiwayMergeTreeInfo* pTree = NULL; if (pSup->numOfBlocksPerTable == NULL || pSup->indexPerTable == NULL || pSup->pDataBlockInfo == NULL) {
// uint8_t ret = tMergeTreeCreate(&pTree, sup.numOfTables, &sup, dataBlockOrderCompar); cleanupBlockOrderSupporter(pSup);
// if (ret != TSDB_CODE_SUCCESS) { return TSDB_CODE_OUT_OF_MEMORY;
// cleanBlockOrderSupporter(&sup, numOfTables); }
// return TSDB_CODE_TDB_OUT_OF_MEMORY;
// }
// int32_t numOfTotal = 0; return TSDB_CODE_SUCCESS;
}
// while (numOfTotal < cnt) { static int32_t fileDataBlockOrderCompar(const void* pLeft, const void* pRight, void* param) {
// int32_t pos = tMergeTreeGetChosenIndex(pTree); int32_t leftIndex = *(int32_t*)pLeft;
// int32_t index = sup.blockIndexArray[pos]++; int32_t rightIndex = *(int32_t*)pRight;
// STableBlockInfo* pBlocksInfo = sup.pDataBlockInfo[pos]; SBlockOrderSupporter* pSupporter = (SBlockOrderSupporter*)param;
// pTsdbReadHandle->pDataBlockInfo[numOfTotal++] = pBlocksInfo[index];
// // set data block index overflow, in order to disable the offset comparator int32_t leftTableBlockIndex = pSupporter->indexPerTable[leftIndex];
// if (sup.blockIndexArray[pos] >= sup.numOfBlocksPerTable[pos]) { int32_t rightTableBlockIndex = pSupporter->indexPerTable[rightIndex];
// sup.blockIndexArray[pos] = sup.numOfBlocksPerTable[pos] + 1;
// }
// tMergeTreeAdjust(pTree, tMergeTreeGetAdjustIndex(pTree)); if (leftTableBlockIndex > pSupporter->numOfBlocksPerTable[leftIndex]) {
// } /* left block is empty */
return 1;
} else if (rightTableBlockIndex > pSupporter->numOfBlocksPerTable[rightIndex]) {
/* right block is empty */
return -1;
}
// /* SBlockOrderWrapper* pLeftBlock = &pSupporter->pDataBlockInfo[leftIndex][leftTableBlockIndex];
// * available when no import exists SBlockOrderWrapper* pRightBlock = &pSupporter->pDataBlockInfo[rightIndex][rightTableBlockIndex];
// * for(int32_t i = 0; i < cnt - 1; ++i) {
// * assert((*pDataBlockInfo)[i].compBlock->offset < (*pDataBlockInfo)[i+1].compBlock->offset);
// * }
// */
// tsdbDebug("%p %d data blocks sort completed, %s", pTsdbReadHandle, cnt, pTsdbReadHandle->idStr); return pLeftBlock->pBlock->aSubBlock[0].offset > pRightBlock->pBlock->aSubBlock[0].offset ? 1 : -1;
// cleanBlockOrderSupporter(&sup, numOfTables); }
// taosMemoryFree(pTree);
// return TSDB_CODE_SUCCESS; static int32_t initBlockIterator(STsdbReader* pReader, SDataBlockIter* pBlockIter, int32_t numOfBlocks) {
// } pBlockIter->numOfBlocks = numOfBlocks;
// access data blocks according to the offset of each block in asc/desc order.
int32_t numOfTables = (int32_t)taosHashGetSize(pReader->status.pTableMap);
SBlockOrderSupporter sup = {0};
int32_t code = initBlockOrderSupporter(&sup, numOfTables);
if (code != TSDB_CODE_SUCCESS) {
return code;
}
int32_t cnt = 0;
void* ptr = NULL;
while(1) {
ptr = taosHashIterate(pReader->status.pTableMap, &ptr);
if (ptr == NULL) {
break;
}
STableBlockScanInfo* pTableScanInfo = (STableBlockScanInfo*)ptr;
if (pTableScanInfo->pBlockList == NULL || taosArrayGetSize(pTableScanInfo->pBlockList) == 0) {
continue;
}
size_t num = taosArrayGetSize(pTableScanInfo->pBlockList);
sup.numOfBlocksPerTable[sup.numOfTables] = num;
char* buf = taosMemoryMalloc(sizeof(SBlockOrderWrapper) * num);
if (buf == NULL) {
cleanupBlockOrderSupporter(&sup);
return TSDB_CODE_TDB_OUT_OF_MEMORY;
}
sup.pDataBlockInfo[sup.numOfTables] = (SBlockOrderWrapper*)buf;
for (int32_t k = 0; k < num; ++k) {
SBlockOrderWrapper wrapper = {0};
wrapper.pBlock = (SBlock*)taosArrayGet(pTableScanInfo->pBlockList, k);
wrapper.uid = pTableScanInfo->uid;
sup.pDataBlockInfo[sup.numOfTables][k] = wrapper;
cnt++;
}
sup.numOfTables += 1;
}
ASSERT(numOfBlocks == cnt);
// since there is only one table qualified, blocks are not sorted
if (sup.numOfTables == 1) {
for(int32_t i = 0; i < numOfBlocks; ++i) {
SFileDataBlockInfo blockInfo = {.uid = sup.pDataBlockInfo[0][i].uid, .tbBlockIdx = i};
taosArrayPush(pBlockIter->blockList, &blockInfo);
}
tsdbDebug("%p create blocks info struct completed for one table, %d blocks not sorted %s",
pReader, cnt, pReader->idStr);
return TSDB_CODE_SUCCESS;
}
tsdbDebug("%p create data blocks info struct completed, %d blocks in %d tables %s", pReader, cnt, sup.numOfTables, pReader->idStr);
assert(cnt <= numOfBlocks && sup.numOfTables <= numOfTables); // the pTableQueryInfo[j]->numOfBlocks may be 0
SMultiwayMergeTreeInfo* pTree = NULL;
uint8_t ret = tMergeTreeCreate(&pTree, sup.numOfTables, &sup, fileDataBlockOrderCompar);
if (ret != TSDB_CODE_SUCCESS) {
cleanupBlockOrderSupporter(&sup);
return TSDB_CODE_TDB_OUT_OF_MEMORY;
}
int32_t numOfTotal = 0;
while (numOfTotal < cnt) {
int32_t pos = tMergeTreeGetChosenIndex(pTree);
int32_t index = sup.indexPerTable[pos]++;
SFileDataBlockInfo blockInfo = {.uid = sup.pDataBlockInfo[pos][index].uid, .tbBlockIdx = index};
taosArrayPush(pBlockIter->blockList, &blockInfo);
// set data block index overflow, in order to disable the offset comparator
if (sup.indexPerTable[pos] >= sup.numOfBlocksPerTable[pos]) {
sup.indexPerTable[pos] = sup.numOfBlocksPerTable[pos] + 1;
}
numOfTotal += 1;
tMergeTreeAdjust(pTree, tMergeTreeGetAdjustIndex(pTree));
}
tsdbDebug("%p %d data blocks sort completed, %s", pReader, cnt, pReader->idStr);
cleanupBlockOrderSupporter(&sup);
taosMemoryFree(pTree);
pBlockIter->index = 0;
return TSDB_CODE_SUCCESS;
}
// static int32_t getFirstFileDataBlock(STsdbReader* pTsdbReadHandle, bool* exists); // static int32_t getFirstFileDataBlock(STsdbReader* pTsdbReadHandle, bool* exists);
// static int32_t getDataBlock(STsdbReader* pTsdbReadHandle, STableBlockInfo* pNext, bool* exists) { //static int32_t getDataBlock(STsdbReader* pTsdbReadHandle, SFileBlockInfo* pNext, bool* exists) {
// int32_t step = ASCENDING_TRAVERSE(pTsdbReadHandle->order) ? 1 : -1; // int32_t step = ASCENDING_TRAVERSE(pTsdbReadHandle->order) ? 1 : -1;
// SQueryFilePos* cur = &pTsdbReadHandle->cur; // SQueryFilePos* cur = &pTsdbReadHandle->cur;
//
// while (1) { // while (1) {
// int32_t code = loadFileDataBlock(pTsdbReadHandle, pNext->compBlock, pNext->pTableCheckInfo, exists); // int32_t code = loadFileDataBlock(pTsdbReadHandle, pNext->compBlock, pNext->pTableCheckInfo, exists);
// if (code != TSDB_CODE_SUCCESS || *exists) { // if (code != TSDB_CODE_SUCCESS || *exists) {
// return code; // return code;
// } // }
//
// if ((cur->slot == pTsdbReadHandle->numOfBlocks - 1 && ASCENDING_TRAVERSE(pTsdbReadHandle->order)) || // if ((cur->slot == pTsdbReadHandle->numOfBlocks - 1 && ASCENDING_TRAVERSE(pTsdbReadHandle->order)) ||
// (cur->slot == 0 && !ASCENDING_TRAVERSE(pTsdbReadHandle->order))) { // (cur->slot == 0 && !ASCENDING_TRAVERSE(pTsdbReadHandle->order))) {
// // all data blocks in current file has been checked already, try next file if exists // // all data blocks in current file has been checked already, try next file if exists
// return getFirstFileDataBlock(pTsdbReadHandle, exists); // return getFirstFileDataBlock(pTsdbReadHandle, exists);
// } else { // next block of the same file // } else { // next block of the same file
// cur->slot += step; // cur->slot += step;
// cur->mixBlock = false; // cur->mixBlock = false;
// cur->blockCompleted = false; // cur->blockCompleted = false;
// pNext = &pTsdbReadHandle->pDataBlockInfo[cur->slot]; // pNext = &pTsdbReadHandle->pDataBlockInfo[cur->slot];
// }
// } // }
// } // }
//}
// static int32_t getFirstFileDataBlock(STsdbReader* pTsdbReadHandle, bool* exists) { // static int32_t getFirstFileDataBlock(STsdbReader* pTsdbReadHandle, bool* exists) {
// pTsdbReadHandle->numOfBlocks = 0; // pTsdbReadHandle->numOfBlocks = 0;
...@@ -2198,7 +2193,7 @@ _err: ...@@ -2198,7 +2193,7 @@ _err:
// cur->slot = ASCENDING_TRAVERSE(pTsdbReadHandle->order) ? 0 : pTsdbReadHandle->numOfBlocks - 1; // cur->slot = ASCENDING_TRAVERSE(pTsdbReadHandle->order) ? 0 : pTsdbReadHandle->numOfBlocks - 1;
// cur->fid = pTsdbReadHandle->pFileGroup->fid; // cur->fid = pTsdbReadHandle->pFileGroup->fid;
// STableBlockInfo* pBlockInfo = &pTsdbReadHandle->pDataBlockInfo[cur->slot]; // SFileBlockInfo* pBlockInfo = &pTsdbReadHandle->pDataBlockInfo[cur->slot];
// return getDataBlock(pTsdbReadHandle, pBlockInfo, exists); // return getDataBlock(pTsdbReadHandle, pBlockInfo, exists);
// } // }
...@@ -2222,52 +2217,163 @@ _err: ...@@ -2222,52 +2217,163 @@ _err:
// return (numOfRows - startRow) / bucketRange; // return (numOfRows - startRow) / bucketRange;
// } // }
// static int32_t getDataBlocksInFiles(STsdbReader* pTsdbReadHandle, bool* exists) { // query ended in/started from current block
// STsdbFS* pFileHandle = REPO_FS(pTsdbReadHandle->pTsdb); static int32_t dataBlockPartialRequired(STimeWindow* pWindow, SBlock* pBlock) {
// SQueryFilePos* cur = &pTsdbReadHandle->cur; return ((pWindow->ekey < pBlock->maxKey.ts && pWindow->ekey >= pBlock->minKey.ts) ||
(pWindow->skey <= pBlock->maxKey.ts && pWindow->skey > pBlock->minKey.ts));
}
// // find the start data block in file static SFileDataBlockInfo* getCurrentBlockInfo(SDataBlockIter* pBlockIter) {
// if (!pTsdbReadHandle->locateStart) { SFileDataBlockInfo* pFBlockInfo = taosArrayGet(pBlockIter->blockList, pBlockIter->index);
// pTsdbReadHandle->locateStart = true; return pFBlockInfo;
// STsdbKeepCfg* pCfg = REPO_KEEP_CFG(pTsdbReadHandle->pTsdb); }
// int32_t fid = getFileIdFromKey(pTsdbReadHandle->window.skey, pCfg->days, pCfg->precision);
// tsdbRLockFS(pFileHandle); static bool overlapWithNeighborBlock(SBlock* pBlock, int32_t blockIndex) {
// tsdbFSIterInit(&pTsdbReadHandle->fileIter, pFileHandle, pTsdbReadHandle->order); return false;
// tsdbFSIterSeek(&pTsdbReadHandle->fileIter, fid); }
// tsdbUnLockFS(pFileHandle);
// return getFirstFileDataBlock(pTsdbReadHandle, exists); static bool bufferDataInFileBlockGap(int32_t order, int64_t key, SBlock* pBlock) {
// } else { bool ascScan = ASCENDING_TRAVERSE(order);
// // check if current file block is all consumed
// STableBlockInfo* pBlockInfo = &pTsdbReadHandle->pDataBlockInfo[cur->slot];
// STableCheckInfo* pCheckInfo = pBlockInfo->pTableCheckInfo;
// // current block is done, try next return (ascScan && (key != TSKEY_INITIAL_VAL && key <= pBlock->minKey.ts)) ||
// if ((!cur->mixBlock) || cur->blockCompleted) { (!ascScan && (key != TSKEY_INITIAL_VAL && key >= pBlock->maxKey.ts));
// // all data blocks in current file has been checked already, try next file if exists }
// } else {
// tsdbDebug("%p continue in current data block, index:%d, pos:%d, %s", pTsdbReadHandle, cur->slot, cur->pos,
// pTsdbReadHandle->idStr);
// int32_t code = handleDataMergeIfNeeded(pTsdbReadHandle, pBlockInfo->compBlock, pCheckInfo);
// *exists = (pTsdbReadHandle->realNumOfRows > 0);
// if (code != TSDB_CODE_SUCCESS || *exists) { static int32_t buildInmemDataBlock(STsdbReader* pReader, STableBlockScanInfo* pBlockScanInfo, SBlock* pBlock, TSDBKEY *key) {
// return code; int32_t code = TSDB_CODE_SUCCESS;
// }
// }
// // current block is empty, try next block in file bool ascScan = ASCENDING_TRAVERSE(pReader->order);
// // all data blocks in current file has been checked already, try next file if exists bool cacheDataInFileBlockHole = (ascScan && (key->ts != TSKEY_INITIAL_VAL && key->ts < pBlock->minKey.ts)) ||
// if (isEndFileDataBlock(cur, pTsdbReadHandle->numOfBlocks, ASCENDING_TRAVERSE(pTsdbReadHandle->order))) { (!ascScan && (key->ts != TSKEY_INITIAL_VAL && key->ts > pBlock->maxKey.ts));
// return getFirstFileDataBlock(pTsdbReadHandle, exists); ASSERT(cacheDataInFileBlockHole);
// } else {
// moveToNextDataBlockInCurrentFile(pTsdbReadHandle); // do not load file block into buffer
// STableBlockInfo* pNext = &pTsdbReadHandle->pDataBlockInfo[cur->slot]; int32_t step = ascScan ? 1 : -1;
// return getDataBlock(pTsdbReadHandle, pNext, exists);
// } TSDBKEY maxKey = {.version = pReader->endVersion};
// } maxKey.ts = ascScan ? (pBlock->minKey.ts - step) : (pBlock->maxKey.ts - step);
// }
pBlockScanInfo->memHasVal = tsdbTbDataIterNext(&pBlockScanInfo->iter);
pBlockScanInfo->imemHasVal = tsdbTbDataIterNext(&pBlockScanInfo->iiter);
code = tsdbReadRowsFromCache(pBlockScanInfo, maxKey, pReader->capacity, pReader);
return code;
}
static int32_t buildComposedDataBlock(STsdbReader* pReader, STableBlockScanInfo* pBlockScanInfo) {
SFileBlockDumpInfo *pDumpInfo = &pReader->status.fBlockDumpInfo;
SBlockData* pData = &pReader->status.fileBlockData;
STSchema* pSchema = NULL;
SRowMerger merge = {0};
int64_t key = pData->aTSKEY[0];
TSDBROW* pRow = getValidRow(&pBlockScanInfo->iter, &pBlockScanInfo->memHasVal, pReader);
TSDBROW* piRow = getValidRow(&pBlockScanInfo->iiter, &pBlockScanInfo->imemHasVal, pReader);
if (pBlockScanInfo->memHasVal && pBlockScanInfo->imemHasVal) {
TSDBKEY k = TSDBROW_KEY(pRow);
TSDBKEY ik = TSDBROW_KEY(piRow);
// todo check version in file
if (key < k.ts || key < ik.ts) {
tRowMergerInit(&merge, NULL, pSchema);
STSRow* pTsRow = NULL;
doLoadRowsOfIdenticalTsInFileBlock(pData, pDumpInfo, key, &merge, pReader, &pTsRow);
}
}
return TSDB_CODE_SUCCESS;
}
static int32_t loadDataInFiles(STsdbReader* pReader, bool* exists) {
SReaderStatus* pStatus = &pReader->status;
SFileSetIter* pFIter = &pStatus->fileIter;
if (pFIter->index < pFIter->numOfFiles) {
if (pReader->status.blockIter.index == -1) {
int32_t numOfBlocks = 0;
while (1) {
bool hasNext = nextFilesetIterator(&pStatus->fileIter, pReader->order, pReader);
if (!hasNext) {
// no data files on disk
break;
}
SArray* pIndexList = taosArrayInit(4, sizeof(SBlockIdx));
int32_t code = doLoadBlockIndex(pReader, pReader->pFileReader, pIndexList);
if (code != TSDB_CODE_SUCCESS) {
return code;
}
if (taosArrayGetSize(pIndexList) > 0) {
uint32_t numOfValidTable = 0;
code = doLoadFileBlock(pReader, pIndexList, &numOfValidTable);
if (code != TSDB_CODE_SUCCESS) {
return code;
}
if (numOfValidTable > 0) {
break;
}
}
// no blocks in current file, try next files
}
SDataBlockIter* pBlockIter = &pReader->status.blockIter;
int32_t code = initBlockIterator(pReader, pBlockIter, numOfBlocks);
if (code != TSDB_CODE_SUCCESS) {
return code;
}
int64_t key = 0; // todo get the first qualified key in buffer
SFileDataBlockInfo* pFBlock = getCurrentBlockInfo(pBlockIter);
STableBlockScanInfo* pScanInfo = taosHashGet(pReader->status.pTableMap, &pFBlock->uid, sizeof(pFBlock->uid));
SBlock* pBlock = taosArrayGet(pScanInfo->pBlockList, pFBlock->tbBlockIdx);
if (pScanInfo->iterInit == false) {
STbData* d = NULL;
tsdbGetTbDataFromMemTable(pReader->pTsdb->mem, pReader->suid, pScanInfo->uid, &d);
TSDBKEY startKey = {.ts = pReader->window.skey, .version = pReader->startVersion};
tsdbTbDataIterOpen(d, &startKey, 0, &pScanInfo->iter);
STbData* di = NULL;
tsdbGetTbDataFromMemTable(pReader->pTsdb->imem, pReader->suid, pScanInfo->uid, &di);
tsdbTbDataIterOpen(di, &startKey, 0, &pScanInfo->iiter);
pScanInfo->iterInit = true;
}
if (dataBlockPartialRequired(&pReader->window, pBlock) || overlapWithNeighborBlock(pBlock, pFBlock->tbBlockIdx)) {
SBlockData data = {0};
doLoadFileBlockData(pReader, pBlockIter, pScanInfo, &data);
// build composed data block
} else if (bufferDataInFileBlockGap(pReader->order, key, pBlock)) {
// data in memory that are earlier than current file block
TSDBKEY maxKey = {.ts = pReader->window.ekey, .version = pReader->endVersion};
buildInmemDataBlock(pReader, pScanInfo, pBlock, &maxKey);
// build data block from in-memory buffer data completed.
} else { // whole block is required, return it directly
SDataBlockInfo info = {0};
info.rows = pBlock->nRow;
info.uid = pScanInfo->uid;
info.window.skey = pBlock->minKey.ts;
info.window.ekey = pBlock->maxKey.ts;
}
} else {
}
}
return TSDB_CODE_SUCCESS;
}
// static bool doHasDataInBuffer(STsdbReader* pTsdbReadHandle) { // static bool doHasDataInBuffer(STsdbReader* pTsdbReadHandle) {
// size_t numOfTables = taosArrayGetSize(pTsdbReadHandle->pTableCheckInfo); // size_t numOfTables = taosArrayGetSize(pTsdbReadHandle->pTableCheckInfo);
...@@ -2293,7 +2399,7 @@ _err: ...@@ -2293,7 +2399,7 @@ _err:
// int32_t i = 0; // int32_t i = 0;
// while (i < numOfTables) { // while (i < numOfTables) {
// STableCheckInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, i); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, i);
// // the first qualified table for interpolation query // // the first qualified table for interpolation query
// // if ((pTsdbReadHandle->window.skey <= pCheckInfo->pTableObj->lastKey) && // // if ((pTsdbReadHandle->window.skey <= pCheckInfo->pTableObj->lastKey) &&
...@@ -2309,71 +2415,188 @@ _err: ...@@ -2309,71 +2415,188 @@ _err:
// return; // return;
// } // }
// STableCheckInfo info = *(STableCheckInfo*)taosArrayGet(pTsdbReadHandle->pTableCheckInfo, i); // STableBlockScanInfo info = *(STableBlockScanInfo*)taosArrayGet(pTsdbReadHandle->pTableCheckInfo, i);
// taosArrayClear(pTsdbReadHandle->pTableCheckInfo); // taosArrayClear(pTsdbReadHandle->pTableCheckInfo);
// info.lastKey = pTsdbReadHandle->window.skey; // info.lastKey = pTsdbReadHandle->window.skey;
// taosArrayPush(pTsdbReadHandle->pTableCheckInfo, &info); // taosArrayPush(pTsdbReadHandle->pTableCheckInfo, &info);
// } // }
// static int tsdbReadRowsFromCache(STableCheckInfo* pCheckInfo, TSKEY maxKey, int maxRowsToRead, STimeWindow* win, TSDBROW* getValidRow(STbDataIter* pIter, bool* hasVal, STsdbReader* pReader) {
// STsdbReader* pTsdbReadHandle) { if (!hasVal) {
// int numOfRows = 0; return NULL;
// int curRows = 0; }
// int32_t numOfCols = (int32_t)taosArrayGetSize(pTsdbReadHandle->pColumns);
// STsdbCfg* pCfg = REPO_CFG(pTsdbReadHandle->pTsdb);
// win->skey = TSKEY_INITIAL_VAL;
// int64_t st = taosGetTimestampUs();
// int16_t rv = -1;
// STSchema* pSchema = NULL;
// TSKEY lastRowKey = TSKEY_INITIAL_VAL;
// do {
// STSRow* row = getSRowInTableMem(pCheckInfo, pTsdbReadHandle->order, pCfg->update, NULL, TD_VER_MAX);
// if (row == NULL) {
// break;
// }
// TSKEY key = TD_ROW_KEY(row); TSDBROW* pRow = tsdbTbDataIterGet(pIter);
// if ((key > maxKey && ASCENDING_TRAVERSE(pTsdbReadHandle->order)) ||
// (key < maxKey && !ASCENDING_TRAVERSE(pTsdbReadHandle->order))) {
// tsdbDebug("%p key:%" PRIu64 " beyond qrange:%" PRId64 " - %" PRId64 ", no more data in buffer",
// pTsdbReadHandle,
// key, pTsdbReadHandle->window.skey, pTsdbReadHandle->window.ekey);
// break; TSDBKEY key = TSDBROW_KEY(pRow);
// } if (key.ts > pReader->window.ekey) {
*hasVal = false;
return NULL;
}
// if (win->skey == INT64_MIN) { if (key.version <= pReader->endVersion) {
// win->skey = key; return pRow;
// } }
// win->ekey = key; while(1) {
// if (rv != TD_ROW_SVER(row)) { *hasVal = tsdbTbDataIterNext(pIter);
// pSchema = metaGetTbTSchema(REPO_META(pTsdbReadHandle->pTsdb), pCheckInfo->tableId, TD_ROW_SVER(row)); if (!(*hasVal)) {
// rv = TD_ROW_SVER(row); return NULL;
// } }
// numOfRows += mergeTwoRowFromMem(pTsdbReadHandle, maxRowsToRead, &curRows, row, NULL, numOfCols,
// pCheckInfo->tableId,
// pSchema, NULL, pCfg->update, &lastRowKey);
// if (numOfRows >= maxRowsToRead) { pRow = tsdbTbDataIterGet(pIter);
// moveToNextRowInMem(pCheckInfo);
// break;
// }
// } while (moveToNextRowInMem(pCheckInfo)); key = TSDBROW_KEY(pRow);
if (key.ts > pReader->window.ekey) {
*hasVal = false;
return NULL;
}
// taosMemoryFreeClear(pSchema); // free the STSChema if (key.version <= pReader->endVersion) {
// assert(numOfRows <= maxRowsToRead); return pRow;
}
}
}
// int64_t elapsedTime = taosGetTimestampUs() - st; int32_t doLoadRowsOfIdenticalTs(STbDataIter *pIter, bool* hasVal, int64_t ts, SRowMerger* pMerger, STsdbReader* pReader) {
// tsdbDebug("%p build data block from cache completed, elapsed time:%" PRId64 " us, numOfRows:%d, numOfCols:%d, %s", while (1) {
// pTsdbReadHandle, elapsedTime, numOfRows, numOfCols, pTsdbReadHandle->idStr); *hasVal = tsdbTbDataIterNext(pIter);
if (!*hasVal) {
break;
}
// return numOfRows; TSDBROW* pRow = getValidRow(pIter, hasVal, pReader);
// } TSDBKEY k = TSDBROW_KEY(pRow);
if (k.ts > ts) {
break;
}
tRowMerge(pMerger, pRow);
}
return TSDB_CODE_SUCCESS;
}
int32_t doLoadRowsOfIdenticalTsInFileBlock(SBlockData* pData, SFileBlockDumpInfo* pDumpInfo, int64_t ts, SRowMerger *pMerger,
STsdbReader* pReader, STSRow** pRow) {
int64_t key = pData->aTSKEY[pDumpInfo->rowIndex];
if ((pDumpInfo->rowIndex < pData->nRow - 1)) {
if (pData->aTSKEY[pDumpInfo->rowIndex + 1] < key) {
SRowMerger merger = {0};
tRowMergerInit(&merger, NULL, NULL);
int32_t rowIndex = pDumpInfo->rowIndex + 1;
while (pData->aTSKEY[rowIndex] == key) {
tRowMerge(&merger, NULL);
}
tRowMergerGetRow(&merger, pRow);
tRowMergerClear(&merger);
}
} else {
}
return TSDB_CODE_SUCCESS;
}
int32_t tsdbGetNextRowInMem(STableBlockScanInfo* pBlockScanInfo, STsdbReader* pReader, STSRow** pTSRow) {
STSchema* pSchema = NULL; // todo set the correct schema
TSKEY mergeTs = TSKEY_INITIAL_VAL;
SRowMerger merge = {0};
TSDBROW* pRow = getValidRow(&pBlockScanInfo->iter, &pBlockScanInfo->memHasVal, pReader);
TSDBROW* piRow = getValidRow(&pBlockScanInfo->iiter, &pBlockScanInfo->imemHasVal, pReader);
TSDBKEY k = {.ts = TSKEY_INITIAL_VAL};
TSDBKEY ik = {.ts = TSKEY_INITIAL_VAL};
if (pBlockScanInfo->memHasVal && pBlockScanInfo->imemHasVal) {
k = TSDBROW_KEY(pRow);
ik = TSDBROW_KEY(piRow);
if (ik.ts <= k.ts) {
tRowMergerInit(&merge, piRow, pSchema);
doLoadRowsOfIdenticalTs(&pBlockScanInfo->iiter, &pBlockScanInfo->imemHasVal, ik.ts, &merge, pReader);
if (k.ts == mergeTs) {
doLoadRowsOfIdenticalTs(&pBlockScanInfo->iter, &pBlockScanInfo->memHasVal, k.ts, &merge, pReader);
}
tRowMergerGetRow(&merge, pTSRow);
return TSDB_CODE_SUCCESS;
} else { // k.ts < ik.ts
tRowMergerInit(&merge, pRow, pSchema);
doLoadRowsOfIdenticalTs(&pBlockScanInfo->iter, &pBlockScanInfo->memHasVal, k.ts, &merge, pReader);
tRowMergerGetRow(&merge, pTSRow);
return TSDB_CODE_SUCCESS;
}
}
if (pBlockScanInfo->memHasVal) {
tRowMergerInit(&merge, pRow, pSchema);
doLoadRowsOfIdenticalTs(&pBlockScanInfo->iter, &pBlockScanInfo->memHasVal, k.ts, &merge, pReader);
tRowMergerGetRow(&merge, pTSRow);
return TSDB_CODE_SUCCESS;
}
if (pBlockScanInfo->imemHasVal) {
tRowMergerInit(&merge, piRow, pSchema);
doLoadRowsOfIdenticalTs(&pBlockScanInfo->iiter, &pBlockScanInfo->imemHasVal, ik.ts, &merge, pReader);
tRowMergerGetRow(&merge, pTSRow);
return TSDB_CODE_SUCCESS;
}
return TSDB_CODE_SUCCESS;
}
int32_t tsdbReadRowsFromCache(STableBlockScanInfo* pBlockScanInfo, TSDBKEY maxKey, int32_t capacity, STsdbReader* pReader) {
int32_t numOfRows = 0;
int32_t numOfCols = (int32_t)taosArrayGetSize(pReader->pResBlock->pDataBlock);
SSDataBlock* pBlock = pReader->pResBlock;
int64_t st = taosGetTimestampUs();
STSchema* pSchema = NULL;
do {
STSRow* pTSRow = NULL;
tsdbGetNextRowInMem(pBlockScanInfo, pReader, &pTSRow);
// todo assign to ssdatablock
if (pBlockScanInfo->memHasVal) {
TSDBROW* pRow = tsdbTbDataIterGet(&pBlockScanInfo->iter);
TSDBKEY k = TSDBROW_KEY(pRow);
if (k.ts >= maxKey.ts) {
break;
}
}
if (pBlockScanInfo->imemHasVal) {
TSDBROW* pRow = tsdbTbDataIterGet(&pBlockScanInfo->iiter);
TSDBKEY k = TSDBROW_KEY(pRow);
if (k.ts >= maxKey.ts) {
break;
}
}
// no data in buffer, return immediately
if (!(pBlockScanInfo->memHasVal || pBlockScanInfo->imemHasVal)) {
break;
}
if (numOfRows >= capacity) {
break;
}
} while (1);
taosMemoryFreeClear(pSchema);
assert(numOfRows <= capacity);
int64_t elapsedTime = taosGetTimestampUs() - st;
tsdbDebug("%p build data block from cache completed, elapsed time:%" PRId64 " us, numOfRows:%d, numOfCols:%d, %s",
pReader, elapsedTime, pBlock->info.rows, numOfCols, pReader->idStr);
return TSDB_CODE_SUCCESS;
}
// static void destroyHelper(void* param) { // static void destroyHelper(void* param) {
// if (param == NULL) { // if (param == NULL) {
...@@ -2398,7 +2621,7 @@ _err: ...@@ -2398,7 +2621,7 @@ _err:
// // check if the query range overlaps with the file data block // // check if the query range overlaps with the file data block
// bool exists = true; // bool exists = true;
// int32_t code = getDataBlocksInFiles(pTsdbReadHandle, &exists); // int32_t code = loadDataInFiles(pTsdbReadHandle, &exists);
// if (code != TSDB_CODE_SUCCESS) { // if (code != TSDB_CODE_SUCCESS) {
// pTsdbReadHandle->checkFiles = false; // pTsdbReadHandle->checkFiles = false;
// return false; // return false;
...@@ -2459,7 +2682,7 @@ _err: ...@@ -2459,7 +2682,7 @@ _err:
// int32_t curRow = 0; // int32_t curRow = 0;
// if (++pTsdbReadHandle->activeIndex < numOfTables) { // if (++pTsdbReadHandle->activeIndex < numOfTables) {
// STableCheckInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, pTsdbReadHandle->activeIndex); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, pTsdbReadHandle->activeIndex);
// // int32_t ret = tsdbGetCachedLastRow(pCheckInfo->pTableObj, &pRow, &key); // // int32_t ret = tsdbGetCachedLastRow(pCheckInfo->pTableObj, &pRow, &key);
// // if (ret != TSDB_CODE_SUCCESS) { // // if (ret != TSDB_CODE_SUCCESS) {
// // return false; // // return false;
...@@ -2494,7 +2717,7 @@ _err: ...@@ -2494,7 +2717,7 @@ _err:
// return true; // return true;
// } // }
// STableCheckInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, pTsdbReadHandle->activeIndex); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pTsdbReadHandle->pTableCheckInfo, pTsdbReadHandle->activeIndex);
// pCheckInfo->numOfBlocks = 0; // pCheckInfo->numOfBlocks = 0;
// pTsdbReadHandle->activeIndex += 1; // pTsdbReadHandle->activeIndex += 1;
...@@ -2543,17 +2766,6 @@ _err: ...@@ -2543,17 +2766,6 @@ _err:
// return true; // return true;
// } // }
// static int tsdbCheckInfoCompar(const void* key1, const void* key2) {
// if (((STableCheckInfo*)key1)->tableId < ((STableCheckInfo*)key2)->tableId) {
// return -1;
// } else if (((STableCheckInfo*)key1)->tableId > ((STableCheckInfo*)key2)->tableId) {
// return 1;
// } else {
// ASSERT(false);
// return 0;
// }
// }
// static void* doFreeColumnInfoData(SArray* pColumnInfoData) { // static void* doFreeColumnInfoData(SArray* pColumnInfoData) {
// if (pColumnInfoData == NULL) { // if (pColumnInfoData == NULL) {
// return NULL; // return NULL;
...@@ -2572,7 +2784,7 @@ _err: ...@@ -2572,7 +2784,7 @@ _err:
// static void* destroyTableCheckInfo(SArray* pTableCheckInfo) { // static void* destroyTableCheckInfo(SArray* pTableCheckInfo) {
// size_t size = taosArrayGetSize(pTableCheckInfo); // size_t size = taosArrayGetSize(pTableCheckInfo);
// for (int32_t i = 0; i < size; ++i) { // for (int32_t i = 0; i < size; ++i) {
// STableCheckInfo* p = taosArrayGet(pTableCheckInfo, i); // STableBlockScanInfo* p = taosArrayGet(pTableCheckInfo, i);
// destroyTableMemIterator(p); // destroyTableMemIterator(p);
// taosMemoryFreeClear(p->pCompInfo); // taosMemoryFreeClear(p->pCompInfo);
...@@ -2583,25 +2795,31 @@ _err: ...@@ -2583,25 +2795,31 @@ _err:
// } // }
// ====================================== EXPOSED APIs ====================================== // ====================================== EXPOSED APIs ======================================
int32_t tsdbReaderOpen(SVnode* pVnode, SQueryTableDataCond* pCond, STableListInfo* tableList, uint64_t qId, int32_t tsdbReaderOpen(SVnode* pVnode, SQueryTableDataCond* pCond, STableListInfo* pTableList, uint64_t qId, uint64_t taskId, STsdbReader** ppReader) {
uint64_t taskId, STsdbReader** ppReader) { char buf[128] = {0};
int32_t code = 0; snprintf(buf, tListLen(buf), "TID:0x%" PRIx64 " QID:0x%" PRIx64, taskId, qId);
code = tsdbReaderCreate(pVnode, pCond, qId, taskId, ppReader); int32_t code = tsdbReaderCreate(pVnode, pCond, ppReader, buf);
if (code) goto _err; if (code) {
goto _err;
}
// if (emptyQueryTimewindow(pReader)) { STsdbReader* pReader = *ppReader;
// return (STsdbReader*)pReader; if (isEmptyQueryTimeWindow(pReader)) {
// } tsdbDebug("%p query window not overlaps with the data set, no result returned, %s", pReader, pReader->idStr);
return TSDB_CODE_SUCCESS;
}
// // todo apply the lastkey of table check to avoid to load header file pReader->status.pTableMap = createDataBlockScanInfo(pReader, pCond->uidList, pCond->numOfTables);
// pReader->pTableCheckInfo = createCheckInfoFromTableGroup(pReader, tableList); if (pReader->status.pTableMap == NULL) {
// if (pReader->pTableCheckInfo == NULL) { tsdbReaderClose(pReader);
// // tsdbReaderClose(pTsdbReadHandle); *ppReader = NULL;
// terrno = TSDB_CODE_TDB_OUT_OF_MEMORY;
// return NULL; code = TSDB_CODE_TDB_OUT_OF_MEMORY;
// } goto _err;
}
#if 0
// int32_t code = setCurrentSchema(pVnode, pReader); // int32_t code = setCurrentSchema(pVnode, pReader);
// if (code != TSDB_CODE_SUCCESS) { // if (code != TSDB_CODE_SUCCESS) {
// terrno = code; // terrno = code;
...@@ -2627,94 +2845,90 @@ int32_t tsdbReaderOpen(SVnode* pVnode, SQueryTableDataCond* pCond, STableListInf ...@@ -2627,94 +2845,90 @@ int32_t tsdbReaderOpen(SVnode* pVnode, SQueryTableDataCond* pCond, STableListInf
// return NULL; // return NULL;
// } // }
// } // }
#endif
// tsdbDebug("%p total numOfTable:%" PRIzu " in this query, table %" PRIzu " %s", pReader, tsdbDebug("%p total numOfTable:%d in this query %s", pReader, pCond->numOfTables, pReader->idStr);
// taosArrayGetSize(pReader->pTableCheckInfo), taosArrayGetSize(tableList->pTableList), pReader->idStr);
return code; return code;
_err: _err:
// tsdbError(""); tsdbError("failed to create tsdb reader, code: %s %s", tstrerror(code), pReader->idStr);
return code; return code;
} }
void tsdbReaderClose(STsdbReader* pReader) { void tsdbReaderClose(STsdbReader* pReader) {
// if (pReader == NULL) { if (pReader == NULL) {
// return; return;
// } }
// pReader->pColumns = doFreeColumnInfoData(pReader->pColumns);
// taosArrayDestroy(pReader->suppInfo.defaultLoadColumn);
// taosMemoryFreeClear(pReader->pDataBlockInfo);
// taosMemoryFreeClear(pReader->suppInfo.pstatis);
// taosMemoryFreeClear(pReader->suppInfo.plist);
// taosMemoryFree(pReader->suppInfo.slotIds);
// if (!emptyQueryTimewindow(pReader)) { blockDataDestroy(pReader->pResBlock);
// // tsdbMayUnTakeMemSnapshot(pTsdbReadHandle);
// } else {
// assert(pReader->pTableCheckInfo == NULL);
// }
// if (pReader->pTableCheckInfo != NULL) { taosMemoryFreeClear(pReader->suppInfo.pstatis);
// pReader->pTableCheckInfo = destroyTableCheckInfo(pReader->pTableCheckInfo); taosMemoryFreeClear(pReader->suppInfo.plist);
// } taosMemoryFree(pReader->suppInfo.slotIds);
// tsdbDestroyReadH(&pReader->rhelper); if (!isEmptyQueryTimeWindow(pReader)) {
// tsdbMayUnTakeMemSnapshot(pTsdbReadHandle);
} else {
ASSERT(pReader->status.pTableMap == NULL);
}
#if 0
// if (pReader->status.pTableScanInfo != NULL) {
// pReader->status.pTableScanInfo = destroyTableCheckInfo(pReader->status.pTableScanInfo);
// }
// tdFreeDataCols(pReader->pDataCols); // tsdbDestroyReadH(&pReader->rhelper);
// pReader->pDataCols = NULL;
// pReader->prev = doFreeColumnInfoData(pReader->prev); // tdFreeDataCols(pReader->pDataCols);
// pReader->next = doFreeColumnInfoData(pReader->next); // pReader->pDataCols = NULL;
//
// pReader->prev = doFreeColumnInfoData(pReader->prev);
// pReader->next = doFreeColumnInfoData(pReader->next);
#endif
// SIOCostSummary* pCost = &pReader->cost; SIOCostSummary* pCost = &pReader->cost;
// tsdbDebug("%p :io-cost summary: head-file read cnt:%" PRIu64 ", head-file time:%" PRIu64 " us, statis-info:%" tsdbDebug("%p :io-cost summary: head-file read cnt:%" PRIu64 ", head-file time:%" PRIu64 " us, statis-info:%" PRId64
// PRId64 " us, datablock:%" PRId64 " us, check data:%" PRId64 " us, %s",
// " us, datablock:%" PRId64 " us, check data:%" PRId64 " us, %s", pReader, pCost->headFileLoad, pCost->headFileLoadTime, pCost->statisInfoLoadTime, pCost->blockLoadTime,
// pReader, pCost->headFileLoad, pCost->headFileLoadTime, pCost->statisInfoLoadTime, pCost->blockLoadTime, pCost->checkForNextTime, pReader->idStr);
// pCost->checkForNextTime, pReader->idStr);
// taosMemoryFree(pReader->idStr); taosMemoryFree(pReader->idStr);
// taosMemoryFree(pReader->pSchema); taosMemoryFree(pReader->pSchema);
// taosMemoryFreeClear(pReader); taosMemoryFreeClear(pReader);
} }
bool tsdbNextDataBlock(STsdbReader* pReader) { bool tsdbNextDataBlock(STsdbReader* pReader) {
bool ret = false; bool ret = false;
// size_t numOfCols = taosArrayGetSize(pReader->pColumns); if (isEmptyQueryTimeWindow(pReader)) {
// for (int32_t i = 0; i < numOfCols; ++i) { return false;
// SColumnInfoData* pColInfo = taosArrayGet(pReader->pColumns, i); }
// colInfoDataCleanup(pColInfo, pReader->outputCapacity);
// }
// if (emptyQueryTimewindow(pReader)) { // cleanup the data that belongs to the previous data block
// tsdbDebug("%p query window not overlaps with the data set, no result returned, %s", pReader, pReader->idStr); blockDataCleanup(pReader->pResBlock);
// return false;
// }
// int64_t stime = taosGetTimestampUs(); int64_t stime = taosGetTimestampUs();
// int64_t elapsedTime = stime; int64_t elapsedTime = stime;
// // TODO refactor: remove "type" if (pReader->type == BLOCK_LOAD_OFFSET_ORDER) {
// if (pReader->type == TSDB_QUERY_TYPE_LAST) { if (pReader->status.loadFromFile) {
// if (pReader->cachelastrow == TSDB_CACHED_TYPE_LASTROW) { bool exists = true;
// // return loadCachedLastRow(pTsdbReadHandle); int32_t code = loadDataInFiles(pReader, &exists);
// } else if (pReader->cachelastrow == TSDB_CACHED_TYPE_LAST) {
// // return loadCachedLast(pTsdbReadHandle);
// }
// }
} else { // no data in files, let's try in-memory buffer
}
} else if (pReader->type == BLOCK_LOAD_TABLESEQ_ORDER) {
} else if (pReader->type == BLOCK_LOAD_EXTERN_ORDER) {
}
// if (pReader->loadType == BLOCK_LOAD_TABLE_SEQ_ORDER) { // if (pReader->loadType == BLOCK_LOAD_TABLE_SEQ_ORDER) {
// return loadDataBlockFromTableSeq(pReader); // return loadDataBlockFromTableSeq(pReader);
// } else { // loadType == RR and Offset Order // } else { // loadType == RR and Offset Order
// if (pReader->checkFiles) { // if (pReader->checkFiles) {
// // check if the query range overlaps with the file data block // // check if the query range overlaps with the file data block
// bool exists = true; // bool exists = true;
// int32_t code = loadDataInFiles(pReader, &exists);
// int32_t code = getDataBlocksInFiles(pReader, &exists);
// if (code != TSDB_CODE_SUCCESS) { // if (code != TSDB_CODE_SUCCESS) {
// pReader->activeIndex = 0; // pReader->activeIndex = 0;
// pReader->checkFiles = false; // pReader->checkFiles = false;
...@@ -2749,10 +2963,10 @@ void tsdbRetrieveDataBlockInfo(STsdbReader* pReader, SDataBlockInfo* pDataBlockI ...@@ -2749,10 +2963,10 @@ void tsdbRetrieveDataBlockInfo(STsdbReader* pReader, SDataBlockInfo* pDataBlockI
// // there are data in file // // there are data in file
// if (pReader->cur.fid != INT32_MIN) { // if (pReader->cur.fid != INT32_MIN) {
// STableBlockInfo* pBlockInfo = &pReader->pDataBlockInfo[cur->slot]; // SFileBlockInfo* pBlockInfo = &pReader->pDataBlockInfo[cur->slot];
// uid = pBlockInfo->pTableCheckInfo->tableId; // uid = pBlockInfo->pTableCheckInfo->tableId;
// } else { // } else {
// STableCheckInfo* pCheckInfo = taosArrayGet(pReader->pTableCheckInfo, pReader->activeIndex); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pReader->pTableCheckInfo, pReader->activeIndex);
// uid = pCheckInfo->tableId; // uid = pCheckInfo->tableId;
// } // }
...@@ -2781,7 +2995,7 @@ int32_t tsdbRetrieveDataBlockStatisInfo(STsdbReader* pReader, SColumnDataAgg*** ...@@ -2781,7 +2995,7 @@ int32_t tsdbRetrieveDataBlockStatisInfo(STsdbReader* pReader, SColumnDataAgg***
// return TSDB_CODE_SUCCESS; // return TSDB_CODE_SUCCESS;
// } // }
// STableBlockInfo* pBlockInfo = &pReader->pDataBlockInfo[c->slot]; // SFileBlockInfo* pBlockInfo = &pReader->pDataBlockInfo[c->slot];
// assert((c->slot >= 0 && c->slot < pReader->numOfBlocks) || ((c->slot == pReader->numOfBlocks) && (c->slot == 0))); // assert((c->slot >= 0 && c->slot < pReader->numOfBlocks) || ((c->slot == pReader->numOfBlocks) && (c->slot == 0)));
// // file block with sub-blocks has no statistics data // // file block with sub-blocks has no statistics data
...@@ -2854,8 +3068,8 @@ SArray* tsdbRetrieveDataBlock(STsdbReader* pReader, SArray* pIdList) { ...@@ -2854,8 +3068,8 @@ SArray* tsdbRetrieveDataBlock(STsdbReader* pReader, SArray* pIdList) {
// if (pReader->cur.fid == INT32_MIN) { // if (pReader->cur.fid == INT32_MIN) {
// return pReader->pColumns; // return pReader->pColumns;
// } else { // } else {
// STableBlockInfo* pBlockInfo = &pReader->pDataBlockInfo[pReader->cur.slot]; // SFileBlockInfo* pBlockInfo = &pReader->pDataBlockInfo[pReader->cur.slot];
// STableCheckInfo* pCheckInfo = pBlockInfo->pTableCheckInfo; // STableBlockScanInfo* pCheckInfo = pBlockInfo->pTableCheckInfo;
// if (pReader->cur.mixBlock) { // if (pReader->cur.mixBlock) {
// return pReader->pColumns; // return pReader->pColumns;
...@@ -2871,7 +3085,7 @@ SArray* tsdbRetrieveDataBlock(STsdbReader* pReader, SArray* pIdList) { ...@@ -2871,7 +3085,7 @@ SArray* tsdbRetrieveDataBlock(STsdbReader* pReader, SArray* pIdList) {
// return pReader->pColumns; // return pReader->pColumns;
// } else { // only load the file block // } else { // only load the file block
// SBlock* pBlock = pBlockInfo->compBlock; // SBlock* pBlock = pBlockInfo->compBlock;
// if (doLoadFileDataBlock(pReader, pBlock, pCheckInfo, pReader->cur.slot) != TSDB_CODE_SUCCESS) { // if (doLoadFileBlockData(pReader, pBlock, pCheckInfo, pReader->cur.slot) != TSDB_CODE_SUCCESS) {
// return NULL; // return NULL;
// } // }
...@@ -2884,7 +3098,7 @@ SArray* tsdbRetrieveDataBlock(STsdbReader* pReader, SArray* pIdList) { ...@@ -2884,7 +3098,7 @@ SArray* tsdbRetrieveDataBlock(STsdbReader* pReader, SArray* pIdList) {
} }
void tsdbResetReadHandle(STsdbReader* pReader, SQueryTableDataCond* pCond, int32_t tWinIdx) { void tsdbResetReadHandle(STsdbReader* pReader, SQueryTableDataCond* pCond, int32_t tWinIdx) {
// if (emptyQueryTimewindow(pReader)) { // if (isEmptyQueryTimeWindow(pReader)) {
// if (pCond->order != pReader->order) { // if (pCond->order != pReader->order) {
// pReader->order = pCond->order; // pReader->order = pCond->order;
// TSWAP(pReader->window.skey, pReader->window.ekey); // TSWAP(pReader->window.skey, pReader->window.ekey);
...@@ -2998,7 +3212,7 @@ int32_t tsdbGetFileBlocksDistInfo(STsdbReader* pReader, STableBlockDistInfo* pTa ...@@ -2998,7 +3212,7 @@ int32_t tsdbGetFileBlocksDistInfo(STsdbReader* pReader, STableBlockDistInfo* pTa
// pTableBlockInfo->numOfBlocks += numOfBlocks; // pTableBlockInfo->numOfBlocks += numOfBlocks;
// for (int32_t i = 0; i < numOfTables; ++i) { // for (int32_t i = 0; i < numOfTables; ++i) {
// STableCheckInfo* pCheckInfo = taosArrayGet(pReader->pTableCheckInfo, i); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pReader->pTableCheckInfo, i);
// SBlock* pBlock = pCheckInfo->pCompInfo->blocks; // SBlock* pBlock = pCheckInfo->pCompInfo->blocks;
...@@ -3040,7 +3254,7 @@ int64_t tsdbGetNumOfRowsInMemTable(STsdbReader* pReader) { ...@@ -3040,7 +3254,7 @@ int64_t tsdbGetNumOfRowsInMemTable(STsdbReader* pReader) {
// size_t size = taosArrayGetSize(pReader->pTableCheckInfo); // size_t size = taosArrayGetSize(pReader->pTableCheckInfo);
// for (int32_t i = 0; i < size; ++i) { // for (int32_t i = 0; i < size; ++i) {
// STableCheckInfo* pCheckInfo = taosArrayGet(pReader->pTableCheckInfo, i); // STableBlockScanInfo* pCheckInfo = taosArrayGet(pReader->pTableCheckInfo, i);
// // if (pMemT && pCheckInfo->tableId < pMemT->maxTables) { // // if (pMemT && pCheckInfo->tableId < pMemT->maxTables) {
// // pMem = pMemT->tData[pCheckInfo->tableId]; // // pMem = pMemT->tData[pCheckInfo->tableId];
......
...@@ -599,93 +599,234 @@ int32_t tsdbReadColData(SDataFReader *pReader, SBlockIdx *pBlockIdx, SBlock *pBl ...@@ -599,93 +599,234 @@ int32_t tsdbReadColData(SDataFReader *pReader, SBlockIdx *pBlockIdx, SBlock *pBl
return code; return code;
} }
int32_t tsdbReadBlockData(SDataFReader *pReader, SBlockIdx *pBlockIdx, SBlock *pBlock, SBlockData *pBlockData, static int32_t tsdbReadSubBlockData(SDataFReader *pReader, SBlockIdx *pBlockIdx, SBlock *pBlock, int32_t iSubBlock,
uint8_t **ppBuf1, uint8_t **ppBuf2) { SBlockData *pBlockData, uint8_t **ppBuf1, uint8_t **ppBuf2) {
int32_t code = 0; int32_t code = 0;
uint8_t *p;
int64_t size;
int64_t n;
TdFilePtr pFD = pBlock->last ? pReader->pLastFD : pReader->pDataFD; TdFilePtr pFD = pBlock->last ? pReader->pLastFD : pReader->pDataFD;
uint8_t *pBuf1 = NULL; SSubBlock *pSubBlock = &pBlock->aSubBlock[iSubBlock];
uint8_t *pBuf2 = NULL; SBlockCol *pBlockCol = &(SBlockCol){0};
SBlockCol *pBlockCol = &(SBlockCol){};
if (!ppBuf1) ppBuf1 = &pBuf1; tBlockDataReset(pBlockData);
if (!ppBuf2) ppBuf2 = &pBuf2;
for (int32_t iSubBlock = 0; iSubBlock < pBlock->nSubBlock; iSubBlock++) { // realloc
SSubBlock *pSubBlock = &pBlock->aSubBlock[iSubBlock]; code = tsdbRealloc(ppBuf1, pSubBlock->bsize);
uint8_t *p; if (code) goto _err;
int64_t n;
// realloc // seek
code = tsdbRealloc(ppBuf1, pSubBlock->bsize); n = taosLSeekFile(pFD, pSubBlock->offset, SEEK_SET);
if (code) goto _err; if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// seek // read
n = taosLSeekFile(pFD, pSubBlock->offset, SEEK_SET); n = taosReadFile(pFD, *ppBuf1, pSubBlock->bsize);
if (n < 0) { if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err;
} else if (n < pSubBlock->bsize) {
code = TSDB_CODE_FILE_CORRUPTED;
goto _err;
}
// check
p = *ppBuf1;
SBlockDataHdr *pHdr = (SBlockDataHdr *)p;
ASSERT(pHdr->delimiter == TSDB_FILE_DLMT);
ASSERT(pHdr->suid == pBlockIdx->suid);
ASSERT(pHdr->uid == pBlockIdx->uid);
p += sizeof(*pHdr);
if (!taosCheckChecksumWhole(p, pSubBlock->vsize + pSubBlock->ksize + sizeof(TSCKSUM))) {
code = TSDB_CODE_FILE_CORRUPTED;
goto _err;
}
p += (pSubBlock->vsize + pSubBlock->ksize + sizeof(TSCKSUM));
for (int32_t iBlockCol = 0; iBlockCol < pSubBlock->mBlockCol.nItem; iBlockCol++) {
tMapDataGetItemByIdx(&pSubBlock->mBlockCol, iBlockCol, pBlockCol, tGetBlockCol);
ASSERT(pBlockCol->flag && pBlockCol->flag != HAS_NONE);
if (pBlockCol->flag == HAS_NULL) continue;
if (!taosCheckChecksumWhole(p, pBlockCol->bsize + pBlockCol->csize + sizeof(TSCKSUM))) {
code = TSDB_CODE_FILE_CORRUPTED;
goto _err; goto _err;
} }
p = p + pBlockCol->bsize + pBlockCol->csize + sizeof(TSCKSUM);
}
// recover
pBlockData->nRow = pSubBlock->nRow;
p = *ppBuf1 + sizeof(*pHdr);
code = tsdbRealloc((uint8_t **)&pBlockData->aVersion, pBlockData->nRow * sizeof(int64_t));
if (code) goto _err;
code = tsdbRealloc((uint8_t **)&pBlockData->aTSKEY, pBlockData->nRow * sizeof(TSKEY));
if (code) goto _err;
if (pSubBlock->cmprAlg == NO_COMPRESSION) {
ASSERT(pSubBlock->vsize == sizeof(int64_t) * pSubBlock->nRow);
ASSERT(pSubBlock->ksize == sizeof(TSKEY) * pSubBlock->nRow);
// VERSION
memcpy(pBlockData->aVersion, p, pSubBlock->vsize);
// TSKEY
memcpy(pBlockData->aTSKEY, p + pSubBlock->vsize, pSubBlock->ksize);
} else {
size = sizeof(int64_t) * pSubBlock->nRow + COMP_OVERFLOW_BYTES;
if (pSubBlock->cmprAlg == TWO_STAGE_COMP) {
code = tsdbRealloc(ppBuf2, size);
if (code) goto _err;
}
// read // VERSION
n = taosReadFile(pFD, *ppBuf1, pSubBlock->bsize); n = tsDecompressBigint(p, pSubBlock->vsize, pSubBlock->nRow, (char *)pBlockData->aVersion,
sizeof(int64_t) * pSubBlock->nRow, pSubBlock->cmprAlg, *ppBuf2, size);
if (n < 0) { if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno); code = TSDB_CODE_COMPRESS_ERROR;
goto _err; goto _err;
} else if (n < pSubBlock->bsize) { }
code = TSDB_CODE_FILE_CORRUPTED;
// TSKEY
n = tsDecompressTimestamp(p + pSubBlock->vsize, pSubBlock->ksize, pSubBlock->nRow, (char *)pBlockData->aTSKEY,
sizeof(TSKEY) * pSubBlock->nRow, pSubBlock->cmprAlg, *ppBuf2, size);
if (n < 0) {
code = TSDB_CODE_COMPRESS_ERROR;
goto _err; goto _err;
} }
}
p = p + pSubBlock->vsize + pSubBlock->ksize + sizeof(TSCKSUM);
// check for (int32_t iBlockCol = 0; iBlockCol < pSubBlock->mBlockCol.nItem; iBlockCol++) {
p = *ppBuf1; SColData *pColData;
SBlockDataHdr *pHdr = (SBlockDataHdr *)p;
ASSERT(pHdr->delimiter == TSDB_FILE_DLMT);
ASSERT(pHdr->suid == pBlockIdx->suid);
ASSERT(pHdr->uid == pBlockIdx->uid);
p += sizeof(*pHdr);
if (!taosCheckChecksumWhole(p, pSubBlock->ksize)) { tMapDataGetItemByIdx(&pSubBlock->mBlockCol, iBlockCol, pBlockCol, tGetBlockCol);
code = TSDB_CODE_FILE_CORRUPTED; ASSERT(pBlockCol->flag && pBlockCol->flag != HAS_NONE);
goto _err;
code = tBlockDataAddColData(pBlockData, iBlockCol, &pColData);
if (code) goto _err;
tColDataReset(pColData, pBlockCol->cid, pBlockCol->type);
if (pBlockCol->flag == HAS_NULL) {
for (int32_t iRow = 0; iRow < pSubBlock->nRow; iRow++) {
code = tColDataAppendValue(pColData, &COL_VAL_NULL(pBlockCol->cid, pBlockCol->type));
if (code) goto _err;
}
continue;
} }
p += pSubBlock->ksize; pColData->nVal = pSubBlock->nRow;
pColData->flag = pBlockCol->flag;
for (int32_t iBlockCol = 0; iBlockCol < pSubBlock->mBlockCol.nItem; iBlockCol++) { // bitmap
tMapDataGetItemByIdx(&pSubBlock->mBlockCol, iBlockCol, pBlockCol, tGetBlockCol); if (pBlockCol->flag != HAS_VALUE) {
size = BIT2_SIZE(pSubBlock->nRow);
code = tsdbRealloc(&pColData->pBitMap, size);
if (code) goto _err;
ASSERT(pBlockCol->flag && pBlockCol->flag != HAS_NONE); ASSERT(pBlockCol->bsize == size);
memcpy(pColData->pBitMap, p, size);
} else {
ASSERT(pBlockCol->bsize == 0);
}
p = p + pBlockCol->bsize;
// value
if (IS_VAR_DATA_TYPE(pBlockCol->type)) {
pColData->nData = pBlockCol->osize;
} else {
pColData->nData = tDataTypes[pBlockCol->type].bytes * pSubBlock->nRow;
}
code = tsdbRealloc(&pColData->pData, pColData->nData);
if (code) goto _err;
if (pBlockCol->flag == HAS_NULL) continue; if (pSubBlock->cmprAlg == NO_COMPRESSION) {
memcpy(pColData->pData, p, pColData->nData);
} else {
size = pColData->nData + COMP_OVERFLOW_BYTES;
if (pSubBlock->cmprAlg == TWO_STAGE_COMP) {
code = tsdbRealloc(ppBuf2, size);
if (code) goto _err;
}
if (!taosCheckChecksumWhole(p, pBlockCol->size)) { n = tDataTypes[pBlockCol->type].decompFunc(p, pBlockCol->csize, pSubBlock->nRow, pColData->pData, pColData->nData,
code = TSDB_CODE_FILE_CORRUPTED; pSubBlock->cmprAlg, *ppBuf2, size);
if (n < 0) {
code = TSDB_CODE_COMPRESS_ERROR;
goto _err; goto _err;
} }
p += pBlockCol->size;
ASSERT(n == pColData->nData);
} }
p = p + pBlockCol->csize + sizeof(TSCKSUM);
}
// recover // TODO
pBlockData->nRow = pSubBlock->nRow; return code;
p = *ppBuf1 + sizeof(*pHdr);
code = tsdbRealloc((uint8_t **)&pBlockData->aVersion, pBlockData->nRow * sizeof(int64_t)); _err:
if (code) goto _err; tsdbError("vgId:%d tsdb read sub block data failed since %s", TD_VID(pReader->pTsdb->pVnode), tstrerror(code));
code = tsdbRealloc((uint8_t **)&pBlockData->aTSKEY, pBlockData->nRow * sizeof(TSKEY)); return code;
if (code) goto _err; }
p += pSubBlock->ksize;
for (int32_t iBlockCol = 0; iBlockCol < pSubBlock->mBlockCol.nItem; iBlockCol++) { int32_t tsdbReadBlockData(SDataFReader *pReader, SBlockIdx *pBlockIdx, SBlock *pBlock, SBlockData *pBlockData,
tMapDataGetItemByIdx(&pSubBlock->mBlockCol, iBlockCol, pBlockCol, tGetBlockCol); uint8_t **ppBuf1, uint8_t **ppBuf2) {
int32_t code = 0;
TdFilePtr pFD = pBlock->last ? pReader->pLastFD : pReader->pDataFD;
uint8_t *pBuf1 = NULL;
uint8_t *pBuf2 = NULL;
int32_t iSubBlock;
if (pBlockCol->flag == HAS_NONE) { if (!ppBuf1) ppBuf1 = &pBuf1;
// All NULL value if (!ppBuf2) ppBuf2 = &pBuf2;
} else {
// decompress // read the first sub-block
p += pBlockCol->size; iSubBlock = 0;
code = tsdbReadSubBlockData(pReader, pBlockIdx, pBlock, iSubBlock, pBlockData, ppBuf1, ppBuf2);
if (code) goto _err;
// read remain block data and do merg
if (pBlock->nSubBlock > 1) {
SBlockData *pBlockData1 = &(SBlockData){0};
SBlockData *pBlockData2 = &(SBlockData){0};
for (iSubBlock = 1; iSubBlock < pBlock->nSubBlock; iSubBlock++) {
code = tsdbReadSubBlockData(pReader, pBlockIdx, pBlock, iSubBlock, pBlockData, ppBuf1, ppBuf2);
if (code) {
tBlockDataClear(pBlockData1);
tBlockDataClear(pBlockData2);
goto _err;
}
code = tBlockDataCopy(pBlockData, pBlockData2);
if (code) {
tBlockDataClear(pBlockData1);
tBlockDataClear(pBlockData2);
goto _err;
}
// merge two block data
code = tBlockDataMerge(pBlockData1, pBlockData2, pBlockData);
if (code) {
tBlockDataClear(pBlockData1);
tBlockDataClear(pBlockData2);
goto _err;
} }
} }
tBlockDataClear(pBlockData1);
tBlockDataClear(pBlockData2);
} }
ASSERT(pBlock->nRow == pBlockData->nRow);
ASSERT(tsdbKeyCmprFn(&pBlock->minKey, &TSDBROW_KEY(&tBlockDataFirstRow(pBlockData))) == 0);
ASSERT(tsdbKeyCmprFn(&pBlock->maxKey, &TSDBROW_KEY(&tBlockDataLastRow(pBlockData))) == 0);
if (pBuf1) tsdbFree(pBuf1); if (pBuf1) tsdbFree(pBuf1);
if (pBuf2) tsdbFree(pBuf2); if (pBuf2) tsdbFree(pBuf2);
return code; return code;
...@@ -906,99 +1047,35 @@ _err: ...@@ -906,99 +1047,35 @@ _err:
return code; return code;
} }
int32_t tsdbUpdateDFileSetHeader(SDataFWriter *pWriter, uint8_t **ppBuf) { int32_t tsdbUpdateDFileSetHeader(SDataFWriter *pWriter) {
int32_t code = 0; int32_t code = 0;
int64_t size = TSDB_FHDR_SIZE; int64_t size = TSDB_FHDR_SIZE;
int64_t n; int64_t n;
uint8_t *pBuf = NULL; uint8_t hdr[TSDB_FHDR_SIZE];
SHeadFile *pHeadFile = &pWriter->wSet.fHead; SHeadFile *pHeadFile = &pWriter->wSet.fHead;
SDataFile *pDataFile = &pWriter->wSet.fData; SDataFile *pDataFile = &pWriter->wSet.fData;
SLastFile *pLastFile = &pWriter->wSet.fLast; SLastFile *pLastFile = &pWriter->wSet.fLast;
SSmaFile *pSmaFile = &pWriter->wSet.fSma; SSmaFile *pSmaFile = &pWriter->wSet.fSma;
// alloc
if (!ppBuf) ppBuf = &pBuf;
code = tsdbRealloc(ppBuf, size);
if (code) goto _err;
// head ============== // head ==============
// build code = tsdbUpdateDFileHdr(pWriter->pHeadFD, &pWriter->wSet, TSDB_HEAD_FILE);
memset(*ppBuf, 0, size); if (code) goto _err;
tPutDataFileHdr(*ppBuf, &pWriter->wSet, TSDB_HEAD_FILE);
taosCalcChecksumAppend(0, *ppBuf, size);
// seek
if (taosLSeekFile(pWriter->pHeadFD, 0, SEEK_SET) < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// write
n = taosWriteFile(pWriter->pHeadFD, *ppBuf, size);
if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// data ============== // data ==============
memset(*ppBuf, 0, size); code = tsdbUpdateDFileHdr(pWriter->pHeadFD, &pWriter->wSet, TSDB_DATA_FILE);
tPutDataFileHdr(*ppBuf, &pWriter->wSet, TSDB_DATA_FILE); if (code) goto _err;
taosCalcChecksumAppend(0, *ppBuf, size);
// seek
if (taosLSeekFile(pWriter->pDataFD, 0, SEEK_SET) < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// write
n = taosWriteFile(pWriter->pDataFD, *ppBuf, size);
if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// last ============== // last ==============
memset(*ppBuf, 0, size); code = tsdbUpdateDFileHdr(pWriter->pHeadFD, &pWriter->wSet, TSDB_LAST_FILE);
tPutDataFileHdr(*ppBuf, &pWriter->wSet, TSDB_LAST_FILE); if (code) goto _err;
taosCalcChecksumAppend(0, *ppBuf, size);
// seek
if (taosLSeekFile(pWriter->pLastFD, 0, SEEK_SET) < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// write
n = taosWriteFile(pWriter->pLastFD, *ppBuf, size);
if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// sma ============== // sma ==============
memset(*ppBuf, 0, size); code = tsdbUpdateDFileHdr(pWriter->pHeadFD, &pWriter->wSet, TSDB_SMA_FILE);
tPutDataFileHdr(*ppBuf, &pWriter->wSet, TSDB_SMA_FILE); if (code) goto _err;
taosCalcChecksumAppend(0, *ppBuf, size);
// seek
if (taosLSeekFile(pWriter->pSmaFD, 0, SEEK_SET) < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
// write
n = taosWriteFile(pWriter->pSmaFD, *ppBuf, size);
if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno);
goto _err;
}
tsdbFree(pBuf);
return code; return code;
_err: _err:
tsdbFree(pBuf);
tsdbError("vgId:%d update DFileSet header failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code)); tsdbError("vgId:%d update DFileSet header failed since %s", TD_VID(pWriter->pTsdb->pVnode), tstrerror(code));
return code; return code;
} }
...@@ -1134,27 +1211,26 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1134,27 +1211,26 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
pSubBlock->bsize += n; pSubBlock->bsize += n;
// TSDBKEY // TSDBKEY
pSubBlock->ksize = 0;
if (cmprAlg == NO_COMPRESSION) { if (cmprAlg == NO_COMPRESSION) {
// TSKEY cksm = 0;
size = sizeof(TSKEY) * pBlockData->nRow;
n = taosWriteFile(pFileFD, pBlockData->aTSKEY, size); // version
pSubBlock->vsize = sizeof(int64_t) * pBlockData->nRow;
n = taosWriteFile(pFileFD, pBlockData->aVersion, pSubBlock->vsize);
if (n < 0) { if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
pSubBlock->ksize += size; cksm = taosCalcChecksum(cksm, (uint8_t *)pBlockData->aVersion, pSubBlock->vsize);
cksm = taosCalcChecksum(0, (uint8_t *)pBlockData->aTSKEY, size);
// version // TSKEY
size = sizeof(int64_t) * pBlockData->nRow; pSubBlock->ksize = sizeof(TSKEY) * pBlockData->nRow;
n = taosWriteFile(pFileFD, pBlockData->aVersion, size); n = taosWriteFile(pFileFD, pBlockData->aTSKEY, pSubBlock->ksize);
if (n < 0) { if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
pSubBlock->ksize += size; cksm = taosCalcChecksum(cksm, (uint8_t *)pBlockData->aTSKEY, pSubBlock->ksize);
cksm = taosCalcChecksum(cksm, (uint8_t *)pBlockData->aVersion, size);
// cksm // cksm
size = sizeof(cksm); size = sizeof(cksm);
...@@ -1163,11 +1239,10 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1163,11 +1239,10 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
pSubBlock->ksize += size;
} else { } else {
ASSERT(cmprAlg == ONE_STAGE_COMP || cmprAlg == TWO_STAGE_COMP); ASSERT(cmprAlg == ONE_STAGE_COMP || cmprAlg == TWO_STAGE_COMP);
size = (sizeof(TSKEY) + sizeof(int64_t)) * pBlockData->nRow + COMP_OVERFLOW_BYTES * 2 + sizeof(TSCKSUM); size = (sizeof(int64_t) + sizeof(TSKEY)) * pBlockData->nRow + COMP_OVERFLOW_BYTES * 2 + sizeof(TSCKSUM);
code = tsdbRealloc(ppBuf1, size); code = tsdbRealloc(ppBuf1, size);
if (code) goto _err; if (code) goto _err;
...@@ -1177,37 +1252,37 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1177,37 +1252,37 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
if (code) goto _err; if (code) goto _err;
} }
// TSKEY // version
n = tsCompressTimestamp((char *)pBlockData->aTSKEY, sizeof(TSKEY) * pBlockData->nRow, pBlockData->nRow, *ppBuf1, n = tsCompressBigint((char *)pBlockData->aVersion, sizeof(int64_t) * pBlockData->nRow, pBlockData->nRow, *ppBuf1,
size, cmprAlg, *ppBuf2, size); size, cmprAlg, *ppBuf2, size);
if (n <= 0) { if (n <= 0) {
code = TSDB_CODE_COMPRESS_ERROR; code = TSDB_CODE_COMPRESS_ERROR;
goto _err; goto _err;
} }
pSubBlock->ksize += n; pSubBlock->vsize = n;
// version // TSKEY
n = tsCompressBigint((char *)pBlockData->aVersion, sizeof(int64_t) * pBlockData->nRow, pBlockData->nRow, n = tsCompressTimestamp((char *)pBlockData->aTSKEY, sizeof(TSKEY) * pBlockData->nRow, pBlockData->nRow,
*ppBuf1 + pSubBlock->ksize, size - pSubBlock->ksize, cmprAlg, *ppBuf2, size); *ppBuf1 + pSubBlock->vsize, size - pSubBlock->vsize, cmprAlg, *ppBuf2, size);
if (n <= 0) { if (n <= 0) {
code = TSDB_CODE_COMPRESS_ERROR; code = TSDB_CODE_COMPRESS_ERROR;
goto _err; goto _err;
} }
pSubBlock->ksize += n; pSubBlock->ksize = n;
// cksm // cksm
pSubBlock->ksize += sizeof(TSCKSUM); n = pSubBlock->vsize + pSubBlock->ksize + sizeof(TSCKSUM);
ASSERT(pSubBlock->ksize <= size); ASSERT(n <= size);
taosCalcChecksumAppend(0, *ppBuf1, pSubBlock->ksize); taosCalcChecksumAppend(0, *ppBuf1, n);
// write // write
n = taosWriteFile(pFileFD, *ppBuf1, pSubBlock->ksize); n = taosWriteFile(pFileFD, *ppBuf1, n);
if (n < 0) { if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
} }
pSubBlock->bsize += pSubBlock->ksize; pSubBlock->bsize += (pSubBlock->vsize + pSubBlock->ksize + sizeof(TSCKSUM));
// other columns // other columns
offset = 0; offset = 0;
...@@ -1226,19 +1301,18 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1226,19 +1301,18 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
if (pColData->flag != HAS_NULL) { if (pColData->flag != HAS_NULL) {
cksm = 0; cksm = 0;
pBlockCol->offset = offset; pBlockCol->offset = offset;
pBlockCol->size = 0;
// bitmap // bitmap
if (pColData->flag != HAS_VALUE) { if (pColData->flag == HAS_VALUE) {
// optimize bitmap storage (todo) pBlockCol->bsize = 0;
n = taosWriteFile(pFileFD, pColData->pBitMap, BIT2_SIZE(pBlockData->nRow)); } else {
pBlockCol->bsize = BIT2_SIZE(pBlockData->nRow);
n = taosWriteFile(pFileFD, pColData->pBitMap, pBlockCol->bsize);
if (n < 0) { if (n < 0) {
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
cksm = taosCalcChecksum(cksm, pColData->pBitMap, n); cksm = taosCalcChecksum(cksm, pColData->pBitMap, n);
pBlockCol->size += n;
} }
// data // data
...@@ -1249,7 +1323,8 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1249,7 +1323,8 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
pBlockCol->size += n; pBlockCol->csize = n;
pBlockCol->osize = n;
// checksum // checksum
cksm = taosCalcChecksum(cksm, pColData->pData, pColData->nData); cksm = taosCalcChecksum(cksm, pColData->pData, pColData->nData);
...@@ -1258,7 +1333,6 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1258,7 +1333,6 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
pBlockCol->size += n;
} else { } else {
size = pColData->nData + COMP_OVERFLOW_BYTES + sizeof(TSCKSUM); size = pColData->nData + COMP_OVERFLOW_BYTES + sizeof(TSCKSUM);
...@@ -1277,6 +1351,8 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1277,6 +1351,8 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
code = TSDB_CODE_COMPRESS_ERROR; code = TSDB_CODE_COMPRESS_ERROR;
goto _err; goto _err;
} }
pBlockCol->csize = n;
pBlockCol->osize = pColData->nData;
// cksm // cksm
n += sizeof(TSCKSUM); n += sizeof(TSCKSUM);
...@@ -1289,13 +1365,11 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_ ...@@ -1289,13 +1365,11 @@ int32_t tsdbWriteBlockData(SDataFWriter *pWriter, SBlockData *pBlockData, uint8_
code = TAOS_SYSTEM_ERROR(errno); code = TAOS_SYSTEM_ERROR(errno);
goto _err; goto _err;
} }
pBlockCol->size += n;
} }
// state // state
offset += pBlockCol->size; offset = offset + pBlockCol->bsize + pBlockCol->csize + sizeof(TSCKSUM);
pSubBlock->bsize += pBlockCol->size; pSubBlock->bsize = pSubBlock->bsize + pBlockCol->bsize + pBlockCol->csize + sizeof(TSCKSUM);
} }
code = tMapDataPutItem(&pSubBlock->mBlockCol, pBlockCol, tPutBlockCol); code = tMapDataPutItem(&pSubBlock->mBlockCol, pBlockCol, tPutBlockCol);
......
...@@ -355,6 +355,7 @@ void tBlockReset(SBlock *pBlock) { ...@@ -355,6 +355,7 @@ void tBlockReset(SBlock *pBlock) {
pBlock->aSubBlock[iSubBlock].nRow = 0; pBlock->aSubBlock[iSubBlock].nRow = 0;
pBlock->aSubBlock[iSubBlock].cmprAlg = -1; pBlock->aSubBlock[iSubBlock].cmprAlg = -1;
pBlock->aSubBlock[iSubBlock].offset = -1; pBlock->aSubBlock[iSubBlock].offset = -1;
pBlock->aSubBlock[iSubBlock].vsize = -1;
pBlock->aSubBlock[iSubBlock].ksize = -1; pBlock->aSubBlock[iSubBlock].ksize = -1;
pBlock->aSubBlock[iSubBlock].bsize = -1; pBlock->aSubBlock[iSubBlock].bsize = -1;
tMapDataReset(&pBlock->aSubBlock->mBlockCol); tMapDataReset(&pBlock->aSubBlock->mBlockCol);
...@@ -384,6 +385,7 @@ int32_t tPutBlock(uint8_t *p, void *ph) { ...@@ -384,6 +385,7 @@ int32_t tPutBlock(uint8_t *p, void *ph) {
n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].nRow); n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].nRow);
n += tPutI8(p ? p + n : p, pBlock->aSubBlock[iSubBlock].cmprAlg); n += tPutI8(p ? p + n : p, pBlock->aSubBlock[iSubBlock].cmprAlg);
n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].offset); n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].offset);
n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].vsize);
n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].ksize); n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].ksize);
n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].bsize); n += tPutI64v(p ? p + n : p, pBlock->aSubBlock[iSubBlock].bsize);
n += tPutMapData(p ? p + n : p, &pBlock->aSubBlock[iSubBlock].mBlockCol); n += tPutMapData(p ? p + n : p, &pBlock->aSubBlock[iSubBlock].mBlockCol);
...@@ -408,6 +410,7 @@ int32_t tGetBlock(uint8_t *p, void *ph) { ...@@ -408,6 +410,7 @@ int32_t tGetBlock(uint8_t *p, void *ph) {
n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].nRow); n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].nRow);
n += tGetI8(p + n, &pBlock->aSubBlock[iSubBlock].cmprAlg); n += tGetI8(p + n, &pBlock->aSubBlock[iSubBlock].cmprAlg);
n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].offset); n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].offset);
n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].vsize);
n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].ksize); n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].ksize);
n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].bsize); n += tGetI64v(p + n, &pBlock->aSubBlock[iSubBlock].bsize);
n += tGetMapData(p + n, &pBlock->aSubBlock[iSubBlock].mBlockCol); n += tGetMapData(p + n, &pBlock->aSubBlock[iSubBlock].mBlockCol);
...@@ -443,7 +446,13 @@ int32_t tPutBlockCol(uint8_t *p, void *ph) { ...@@ -443,7 +446,13 @@ int32_t tPutBlockCol(uint8_t *p, void *ph) {
if (pBlockCol->flag != HAS_NULL) { if (pBlockCol->flag != HAS_NULL) {
n += tPutI64v(p ? p + n : p, pBlockCol->offset); n += tPutI64v(p ? p + n : p, pBlockCol->offset);
n += tPutI64v(p ? p + n : p, pBlockCol->size); if (pBlockCol->flag != HAS_VALUE) {
n += tPutI64v(p ? p + n : p, pBlockCol->bsize);
}
n += tPutI64v(p ? p + n : p, pBlockCol->csize);
if (IS_VAR_DATA_TYPE(pBlockCol->type)) {
n += tPutI64v(p ? p + n : p, pBlockCol->osize);
}
} }
return n; return n;
...@@ -461,7 +470,17 @@ int32_t tGetBlockCol(uint8_t *p, void *ph) { ...@@ -461,7 +470,17 @@ int32_t tGetBlockCol(uint8_t *p, void *ph) {
if (pBlockCol->flag != HAS_NULL) { if (pBlockCol->flag != HAS_NULL) {
n += tGetI64v(p + n, &pBlockCol->offset); n += tGetI64v(p + n, &pBlockCol->offset);
n += tGetI64v(p + n, &pBlockCol->size); if (pBlockCol->flag != HAS_VALUE) {
n += tGetI64v(p + n, &pBlockCol->bsize);
} else {
pBlockCol->bsize = 0;
}
n += tGetI64v(p + n, &pBlockCol->csize);
if (IS_VAR_DATA_TYPE(pBlockCol->type)) {
n += tGetI64v(p + n, &pBlockCol->osize);
} else {
pBlockCol->osize = -1;
}
} }
return n; return n;
...@@ -921,6 +940,29 @@ _exit: ...@@ -921,6 +940,29 @@ _exit:
return code; return code;
} }
int32_t tColDataCopy(SColData *pColDataSrc, SColData *pColDataDest) {
int32_t code = 0;
pColDataDest->cid = pColDataDest->cid;
pColDataDest->type = pColDataDest->type;
pColDataDest->offsetValid = 0;
pColDataDest->nVal = pColDataSrc->nVal;
pColDataDest->flag = pColDataSrc->flag;
if (pColDataSrc->flag != HAS_NONE && pColDataSrc->flag != HAS_NULL && pColDataSrc->flag != HAS_VALUE) {
code = tsdbRealloc(&pColDataDest->pBitMap, BIT2_SIZE(pColDataDest->nVal));
if (code) goto _exit;
memcpy(pColDataDest->pBitMap, pColDataSrc->pBitMap, BIT2_SIZE(pColDataSrc->nVal));
}
pColDataDest->nData = pColDataSrc->nData;
code = tsdbRealloc(&pColDataDest->pData, pColDataSrc->nData);
if (code) goto _exit;
memcpy(pColDataDest->pData, pColDataSrc->pData, pColDataSrc->nData);
_exit:
return code;
}
static int32_t tColDataUpdateOffset(SColData *pColData) { static int32_t tColDataUpdateOffset(SColData *pColData) {
int32_t code = 0; int32_t code = 0;
SValue value; SValue value;
...@@ -1039,24 +1081,30 @@ void tBlockDataClear(SBlockData *pBlockData) { ...@@ -1039,24 +1081,30 @@ void tBlockDataClear(SBlockData *pBlockData) {
taosArrayDestroyEx(pBlockData->aColData, tColDataClear); taosArrayDestroyEx(pBlockData->aColData, tColDataClear);
} }
static SColData *tBlockDataAddBlockCol(SBlockData *pBlockData, int32_t iColData, int16_t cid, int8_t type) { int32_t tBlockDataAddColData(SBlockData *pBlockData, int32_t iColData, SColData **ppColData) {
int32_t code = 0;
SColData *pColData = NULL; SColData *pColData = NULL;
int32_t idx = taosArrayGetSize(pBlockData->aColDataP); int32_t idx = taosArrayGetSize(pBlockData->aColDataP);
if (idx >= taosArrayGetSize(pBlockData->aColData)) { if (idx >= taosArrayGetSize(pBlockData->aColData)) {
if (taosArrayPush(pBlockData->aColData, &((SColData){0})) == NULL) return NULL; if (taosArrayPush(pBlockData->aColData, &((SColData){0})) == NULL) {
code = TSDB_CODE_OUT_OF_MEMORY;
goto _err;
}
} }
pColData = (SColData *)taosArrayGet(pBlockData->aColData, idx); pColData = (SColData *)taosArrayGet(pBlockData->aColData, idx);
tColDataReset(pColData, cid, type);
if (taosArrayInsert(pBlockData->aColDataP, iColData, &pColData) == NULL) return NULL;
// append NONE if (taosArrayInsert(pBlockData->aColDataP, iColData, &pColData) == NULL) {
for (int32_t i = 0; i < pBlockData->nRow; i++) { code = TSDB_CODE_OUT_OF_MEMORY;
if (tColDataAppendValue(pColData, &COL_VAL_NONE(cid, type)) != 0) return NULL; goto _err;
} }
return pColData; *ppColData = pColData;
return code;
_err:
*ppColData = NULL;
return code;
} }
int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTSchema) { int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTSchema) {
...@@ -1092,10 +1140,14 @@ int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTS ...@@ -1092,10 +1140,14 @@ int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTS
code = tColDataAppendValue(pColData, &(COL_VAL_NONE(pColData->cid, pColData->type))); code = tColDataAppendValue(pColData, &(COL_VAL_NONE(pColData->cid, pColData->type)));
if (code) goto _err; if (code) goto _err;
} else { } else {
pColData = tBlockDataAddBlockCol(pBlockData, iColData, pColVal->cid, pColVal->type); code = tBlockDataAddColData(pBlockData, iColData, &pColData);
if (pColData == NULL) { if (code) goto _err;
code = TSDB_CODE_OUT_OF_MEMORY;
goto _err; // append a NONE
tColDataReset(pColData, pColVal->cid, pColVal->type);
for (int32_t iRow = 0; iRow < pBlockData->nRow; iRow++) {
code = tColDataAppendValue(pColData, &COL_VAL_NONE(pColVal->cid, pColVal->type));
if (code) goto _err;
} }
code = tColDataAppendValue(pColData, pColVal); code = tColDataAppendValue(pColData, pColVal);
...@@ -1119,10 +1171,13 @@ int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTS ...@@ -1119,10 +1171,13 @@ int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTS
} }
while (pColVal) { while (pColVal) {
pColData = tBlockDataAddBlockCol(pBlockData, iColData, pColVal->cid, pColVal->type); code = tBlockDataAddColData(pBlockData, iColData, &pColData);
if (pColData == NULL) { if (code) goto _err;
code = TSDB_CODE_OUT_OF_MEMORY;
goto _err; tColDataReset(pColData, pColVal->cid, pColVal->type);
for (int32_t iRow = 0; iRow < pBlockData->nRow; iRow++) {
code = tColDataAppendValue(pColData, &COL_VAL_NONE(pColVal->cid, pColVal->type));
if (code) goto _err;
} }
code = tColDataAppendValue(pColData, pColVal); code = tColDataAppendValue(pColData, pColVal);
...@@ -1138,3 +1193,85 @@ int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTS ...@@ -1138,3 +1193,85 @@ int32_t tBlockDataAppendRow(SBlockData *pBlockData, TSDBROW *pRow, STSchema *pTS
_err: _err:
return code; return code;
} }
int32_t tBlockDataMerge(SBlockData *pBlockData1, SBlockData *pBlockData2, SBlockData *pBlockData) {
int32_t code = 0;
tBlockDataReset(pBlockData);
// loop to merge
int32_t iRow1 = 0;
int32_t nRow1 = pBlockData1->nRow;
int32_t iRow2 = 0;
int32_t nRow2 = pBlockData2->nRow;
TSDBROW row1;
TSDBROW row2;
int32_t c;
while (iRow1 < nRow1 && iRow2 < nRow2) {
row1 = tsdbRowFromBlockData(pBlockData1, iRow1);
row2 = tsdbRowFromBlockData(pBlockData2, iRow2);
c = tsdbKeyCmprFn(&TSDBROW_KEY(&row1), &TSDBROW_KEY(&row2));
if (c < 0) {
code = tBlockDataAppendRow(pBlockData, &row1, NULL);
if (code) goto _exit;
iRow1++;
} else if (c > 0) {
code = tBlockDataAppendRow(pBlockData, &row2, NULL);
if (code) goto _exit;
iRow2++;
} else {
ASSERT(0);
}
}
while (iRow1 < nRow1) {
row1 = tsdbRowFromBlockData(pBlockData1, iRow1);
code = tBlockDataAppendRow(pBlockData, &row1, NULL);
if (code) goto _exit;
iRow1++;
}
while (iRow2 < nRow2) {
row2 = tsdbRowFromBlockData(pBlockData2, iRow2);
code = tBlockDataAppendRow(pBlockData, &row2, NULL);
if (code) goto _exit;
iRow2++;
}
_exit:
return code;
}
int32_t tBlockDataCopy(SBlockData *pBlockDataSrc, SBlockData *pBlockDataDest) {
int32_t code = 0;
SColData *pColDataSrc;
SColData *pColDataDest;
ASSERT(pBlockDataSrc->nRow > 0);
tBlockDataReset(pBlockDataDest);
pBlockDataDest->nRow = pBlockDataSrc->nRow;
// TSDBKEY
code = tsdbRealloc((uint8_t **)&pBlockDataDest->aVersion, sizeof(int64_t) * pBlockDataSrc->nRow);
if (code) goto _exit;
code = tsdbRealloc((uint8_t **)&pBlockDataDest->aTSKEY, sizeof(TSKEY) * pBlockDataSrc->nRow);
if (code) goto _exit;
memcpy(pBlockDataDest->aVersion, pBlockDataSrc->aVersion, sizeof(int64_t) * pBlockDataSrc->nRow);
memcpy(pBlockDataDest->aTSKEY, pBlockDataSrc->aTSKEY, sizeof(TSKEY) * pBlockDataSrc->nRow);
// other
for (size_t iColData = 0; iColData < taosArrayGetSize(pBlockDataSrc->aColDataP); iColData++) {
pColDataSrc = (SColData *)taosArrayGetP(pBlockDataSrc->aColDataP, iColData);
code = tBlockDataAddColData(pBlockDataDest, iColData, &pColDataDest);
if (code) goto _exit;
code = tColDataCopy(pColDataSrc, pColDataDest);
if (code) goto _exit;
}
_exit:
return code;
}
\ No newline at end of file
...@@ -620,8 +620,6 @@ SColumn extractColumnFromColumnNode(SColumnNode* pColNode) { ...@@ -620,8 +620,6 @@ SColumn extractColumnFromColumnNode(SColumnNode* pColNode) {
} }
int32_t initQueryTableDataCond(SQueryTableDataCond* pCond, const STableScanPhysiNode* pTableScanNode) { int32_t initQueryTableDataCond(SQueryTableDataCond* pCond, const STableScanPhysiNode* pTableScanNode) {
pCond->loadExternalRows = false;
pCond->order = pTableScanNode->scanSeq[0] > 0 ? TSDB_ORDER_ASC : TSDB_ORDER_DESC; pCond->order = pTableScanNode->scanSeq[0] > 0 ? TSDB_ORDER_ASC : TSDB_ORDER_DESC;
pCond->numOfCols = LIST_LENGTH(pTableScanNode->scan.pScanCols); pCond->numOfCols = LIST_LENGTH(pTableScanNode->scan.pScanCols);
pCond->colList = taosMemoryCalloc(pCond->numOfCols, sizeof(SColumnInfo)); pCond->colList = taosMemoryCalloc(pCond->numOfCols, sizeof(SColumnInfo));
...@@ -647,15 +645,7 @@ int32_t initQueryTableDataCond(SQueryTableDataCond* pCond, const STableScanPhysi ...@@ -647,15 +645,7 @@ int32_t initQueryTableDataCond(SQueryTableDataCond* pCond, const STableScanPhysi
} }
#endif #endif
for (int32_t i = 0; i < pCond->numOfTWindows; ++i) { pCond->type = BLOCK_LOAD_OFFSET_ORDER;
if ((pCond->order == TSDB_ORDER_ASC && pCond->twindows[i].skey > pCond->twindows[i].ekey) ||
(pCond->order == TSDB_ORDER_DESC && pCond->twindows[i].skey < pCond->twindows[i].ekey)) {
TSWAP(pCond->twindows[i].skey, pCond->twindows[i].ekey);
}
}
taosqsort(pCond->twindows, pCond->numOfTWindows, sizeof(STimeWindow), pCond, compareTimeWindow);
pCond->type = BLOCK_LOAD_OFFSET_SEQ_ORDER;
// pCond->type = pTableScanNode->scanFlag; // pCond->type = pTableScanNode->scanFlag;
int32_t j = 0; int32_t j = 0;
...@@ -677,6 +667,5 @@ int32_t initQueryTableDataCond(SQueryTableDataCond* pCond, const STableScanPhysi ...@@ -677,6 +667,5 @@ int32_t initQueryTableDataCond(SQueryTableDataCond* pCond, const STableScanPhysi
} }
void cleanupQueryTableDataCond(SQueryTableDataCond* pCond) { void cleanupQueryTableDataCond(SQueryTableDataCond* pCond) {
taosMemoryFree(pCond->twindows);
taosMemoryFree(pCond->colList); taosMemoryFree(pCond->colList);
} }
\ No newline at end of file
...@@ -4306,7 +4306,11 @@ STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle ...@@ -4306,7 +4306,11 @@ STsdbReader* doCreateDataReader(STableScanPhysiNode* pTableScanNode, SReadHandle
} }
STsdbReader* pReader; STsdbReader* pReader;
tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo, queryId, taskId, &pReader); code = tsdbReaderOpen(pHandle->vnode, &cond, pTableListInfo, queryId, taskId, &pReader);
if (code != TSDB_CODE_SUCCESS) {
goto _error;
}
cleanupQueryTableDataCond(&cond); cleanupQueryTableDataCond(&cond);
return pReader; return pReader;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册