dataDispatcher.c 9.7 KB
Newer Older
X
Xiaoyu Wang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "dataSinkInt.h"
#include "dataSinkMgt.h"
18
#include "executorimpl.h"
X
Xiaoyu Wang 已提交
19 20
#include "planner.h"
#include "tcompression.h"
L
Liu Jicong 已提交
21
#include "tdatablock.h"
X
Xiaoyu Wang 已提交
22 23 24
#include "tglobal.h"
#include "tqueue.h"

D
dapan1121 已提交
25 26
extern SDataSinkStat gDataSinkStat;

27 28 29
/* One queued output buffer: a heap allocation that starts with an SDataCacheEntry header. */
typedef struct SDataDispatchBuf {
  int32_t useSize;    // bytes in use: header plus encoded payload (written by toDataCacheEntry)
  int32_t allocSize;  // bytes allocated for pData (written by allocBuf)
  char*   pData;      // allocated in allocBuf; released in getDataBlock or destroyDataSinker
} SDataDispatchBuf;

/* Header placed at the start of SDataDispatchBuf::pData; the encoded block follows in data[]. */
typedef struct SDataCacheEntry {
  int32_t dataLen;     // length in bytes of the encoded payload stored in data[]
  int32_t numOfRows;   // row count copied from the input block
  int32_t numOfCols;   // number of schema slots flagged as output
  int8_t  compressed;  // result of needCompress() for the input block
  char    data[];      // encoded block written by blockEncode()
} SDataCacheEntry;
X
Xiaoyu Wang 已提交
40 41

typedef struct SDataDispatchHandle {
L
Liu Jicong 已提交
42 43
  SDataSinkHandle     sink;
  SDataSinkManager*   pManager;
X
Xiaoyu Wang 已提交
44
  SDataBlockDescNode* pSchema;
L
Liu Jicong 已提交
45 46 47 48 49
  STaosQueue*         pDataBlocks;
  SDataDispatchBuf    nextOutput;
  int32_t             status;
  bool                queryEnd;
  uint64_t            useconds;
D
dapan1121 已提交
50
  uint64_t            cachedSize;
L
Liu Jicong 已提交
51
  TdThreadMutex       mutex;
X
Xiaoyu Wang 已提交
52 53
} SDataDispatchHandle;

L
Liu Jicong 已提交
54
static bool needCompress(const SSDataBlock* pData, int32_t numOfCols) {
X
Xiaoyu Wang 已提交
55 56 57 58
  if (tsCompressColData < 0 || 0 == pData->info.rows) {
    return false;
  }

X
Xiaoyu Wang 已提交
59
  for (int32_t col = 0; col < numOfCols; ++col) {
X
Xiaoyu Wang 已提交
60
    SColumnInfoData* pColRes = taosArrayGet(pData->pDataBlock, col);
L
Liu Jicong 已提交
61
    int32_t          colSize = pColRes->info.bytes * pData->info.rows;
X
Xiaoyu Wang 已提交
62 63 64 65 66 67 68 69
    if (NEEDTO_COMPRESS_QUERY(colSize)) {
      return true;
    }
  }

  return false;
}

70
// clang-format off
H
Haojun Liao 已提交
71
// data format:
// +-----------------+-----------------+-----------------+------------------+-------------------------------------------------+--------------------------------------+-------------+-----------+-------------+-----------+
// | SDataCacheEntry | total length    | numOfRows       | group id         | col1_schema | col2_schema | col3_schema ...     | column#1 length, column#2 length ... | col1 bitmap | col1 data | col2 bitmap | col2 data | ....
// |                 | sizeof(int32_t) | sizeof(int32_t) | sizeof(uint64_t) | (sizeof(int16_t) + sizeof(int32_t)) * numOfCols | sizeof(int32_t) * numOfCols          | actual size |           |             |           |
// |                 | (4 bytes)       | (4 bytes)       | (8 bytes)        |                                                 |                                      |             |           |             |           |
// +-----------------+-----------------+-----------------+------------------+-------------------------------------------------+--------------------------------------+-------------+-----------+-------------+-----------+
// The length of each bitmap is determined by the number of rows in this data block, and the length of each
// column's data is recorded in the first segment, next to the struct header.
78
// clang-format on
D
dapan1121 已提交
79
/*
 * Serialize one input block into pBuf->pData.
 *
 * Writes the SDataCacheEntry header at the start of the buffer, encodes the
 * block behind it with blockEncode(), and records the total in pBuf->useSize.
 * The column count is the number of schema slots whose `output` flag is set.
 * The encoded length is added to both the per-handle and the global
 * cachedSize counters.
 *
 * pBuf->pData must already be allocated; putDataBlock calls allocBuf() first.
 */
static void toDataCacheEntry(SDataDispatchHandle* pHandle, const SInputData* pInput, SDataDispatchBuf* pBuf) {
  int32_t numOfCols = 0;
  SNode*  pNode;
  FOREACH(pNode, pHandle->pSchema->pSlots) {
    SSlotDescNode* pSlotDesc = (SSlotDescNode*)pNode;
    if (pSlotDesc->output) {
      ++numOfCols;
    }
  }

  SDataCacheEntry* pEntry = (SDataCacheEntry*)pBuf->pData;
  pEntry->compressed = (int8_t)needCompress(pInput->pData, numOfCols);
  pEntry->numOfRows = pInput->pData->info.rows;
  pEntry->numOfCols = numOfCols;
  pEntry->dataLen = 0;

  pBuf->useSize = sizeof(SDataCacheEntry);
  blockEncode(pInput->pData, pEntry->data, &pEntry->dataLen, numOfCols, pEntry->compressed);

  // blockEncode reports the payload size through dataLen.
  pBuf->useSize += pEntry->dataLen;

  atomic_add_fetch_64(&pHandle->cachedSize, pEntry->dataLen);
  atomic_add_fetch_64(&gDataSinkStat.cachedSize, pEntry->dataLen);
}

103
/*
 * Allocate the payload buffer for one incoming block.
 *
 * Returns false without touching pBuf when the queue already holds more than
 * cfg.maxDataBlockNumPerQuery items. Otherwise sets pBuf->allocSize to the
 * header size plus blockGetEncodeSize() of the block and allocates
 * pBuf->pData. Returns true only when the allocation succeeded.
 */
static bool allocBuf(SDataDispatchHandle* pDispatcher, const SInputData* pInput, SDataDispatchBuf* pBuf) {
  uint32_t capacity = pDispatcher->pManager->cfg.maxDataBlockNumPerQuery;
  if (taosQueueItemSize(pDispatcher->pDataBlocks) > capacity) {
    // capacity is unsigned, so it is printed with %u.
    qError("SinkNode queue is full, no capacity, max:%u, current:%d, no capacity", capacity,
           taosQueueItemSize(pDispatcher->pDataBlocks));
    return false;
  }

  pBuf->allocSize = sizeof(SDataCacheEntry) + blockGetEncodeSize(pInput->pData);

  pBuf->pData = taosMemoryMalloc(pBuf->allocSize);
  if (pBuf->pData == NULL) {
    qError("SinkNode failed to malloc memory, size:%d, code:%d", pBuf->allocSize, TAOS_SYSTEM_ERROR(errno));
  }

  return NULL != pBuf->pData;
}

/*
 * Recompute the buffer status from the current queue length, store it in
 * pDispatcher->status under the mutex, and return it.
 *
 * DS_BUF_EMPTY when the queue is empty, DS_BUF_LOW while it holds fewer than
 * cfg.maxDataBlockNumPerQuery items, DS_BUF_FULL otherwise.
 */
static int32_t updateStatus(SDataDispatchHandle* pDispatcher) {
  taosThreadMutexLock(&pDispatcher->mutex);
  int32_t blockNums = taosQueueItemSize(pDispatcher->pDataBlocks);
  int32_t status =
      (0 == blockNums ? DS_BUF_EMPTY
                      : (blockNums < pDispatcher->pManager->cfg.maxDataBlockNumPerQuery ? DS_BUF_LOW : DS_BUF_FULL));
  pDispatcher->status = status;
  taosThreadMutexUnlock(&pDispatcher->mutex);
  return status;
}

/* Return the status last stored by updateStatus(), read under the dispatcher mutex. */
static int32_t getStatus(SDataDispatchHandle* pDispatcher) {
  taosThreadMutexLock(&pDispatcher->mutex);
  int32_t status = pDispatcher->status;
  taosThreadMutexUnlock(&pDispatcher->mutex);
  return status;
}

X
Xiaoyu Wang 已提交
139
/*
 * Sink callback (fPut): encode one input block and append it to the queue.
 *
 * pHandle    the dispatcher, passed as its embedded SDataSinkHandle
 * pInput     block to encode
 * pContinue  set to true only when the status after the insert is DS_BUF_LOW
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_OUT_OF_MEMORY when the queue
 * item or its payload buffer cannot be obtained. allocBuf() also fails when
 * the queue is over capacity, and that case is reported with the same code.
 * *pContinue is not written on failure.
 */
static int32_t putDataBlock(SDataSinkHandle* pHandle, const SInputData* pInput, bool* pContinue) {
  SDataDispatchHandle* pDispatcher = (SDataDispatchHandle*)pHandle;
  SDataDispatchBuf*    pBuf = taosAllocateQitem(sizeof(SDataDispatchBuf), DEF_QITEM);
  if (NULL == pBuf) {
    return TSDB_CODE_QRY_OUT_OF_MEMORY;
  }

  if (!allocBuf(pDispatcher, pInput, pBuf)) {
    // The item was never queued, so it has to be released here or it leaks.
    taosFreeQitem(pBuf);
    return TSDB_CODE_QRY_OUT_OF_MEMORY;
  }

  toDataCacheEntry(pDispatcher, pInput, pBuf);
  taosWriteQitem(pDispatcher->pDataBlocks, pBuf);
  *pContinue = (DS_BUF_LOW == updateStatus(pDispatcher));
  return TSDB_CODE_SUCCESS;
}

D
dapan1121 已提交
151
static void endPut(struct SDataSinkHandle* pHandle, uint64_t useconds) {
152
  SDataDispatchHandle* pDispatcher = (SDataDispatchHandle*)pHandle;
wafwerar's avatar
wafwerar 已提交
153
  taosThreadMutexLock(&pDispatcher->mutex);
X
Xiaoyu Wang 已提交
154 155
  pDispatcher->queryEnd = true;
  pDispatcher->useconds = useconds;
wafwerar's avatar
wafwerar 已提交
156
  taosThreadMutexUnlock(&pDispatcher->mutex);
157
}
X
Xiaoyu Wang 已提交
158

D
dapan1121 已提交
159
/*
 * Sink callback (fGetLen): stage the next queued buffer and report its size.
 *
 * Pops one SDataDispatchBuf from the queue, copies it into
 * pDispatcher->nextOutput, and frees the queue item; the payload pointer now
 * lives in nextOutput. *pLen receives the encoded payload length and
 * *pQueryEnd the current queryEnd flag. When nothing can be read, *pLen is 0
 * and nextOutput is left untouched.
 *
 * NOTE(review): nextOutput is overwritten unconditionally. Presumably callers
 * always consume it through getDataBlock() before asking again; confirm.
 */
static void getDataLength(SDataSinkHandle* pHandle, int64_t* pLen, bool* pQueryEnd) {
  SDataDispatchHandle* pDispatcher = (SDataDispatchHandle*)pHandle;
  if (taosQueueEmpty(pDispatcher->pDataBlocks)) {
    *pQueryEnd = pDispatcher->queryEnd;
    *pLen = 0;
    return;
  }

  SDataDispatchBuf* pBuf = NULL;
  taosReadQitem(pDispatcher->pDataBlocks, (void**)&pBuf);
  if (NULL == pBuf) {
    // Nothing was dequeued even though the queue looked non-empty; report it as empty instead of dereferencing NULL.
    *pQueryEnd = pDispatcher->queryEnd;
    *pLen = 0;
    return;
  }

  memcpy(&pDispatcher->nextOutput, pBuf, sizeof(SDataDispatchBuf));
  taosFreeQitem(pBuf);
  *pLen = ((SDataCacheEntry*)(pDispatcher->nextOutput.pData))->dataLen;
  *pQueryEnd = pDispatcher->queryEnd;
  qDebug("got data len %" PRId64 ", row num %d in sink", *pLen, ((SDataCacheEntry*)(pDispatcher->nextOutput.pData))->numOfRows);
}

X
Xiaoyu Wang 已提交
176
/*
 * Sink callback (fGetData): hand the buffer staged by getDataLength() to the caller.
 *
 * With no staged buffer, the query must already have ended (asserted). Only
 * useconds, precision, bufStatus (DS_BUF_EMPTY) and queryEnd are filled in.
 *
 * Otherwise the encoded payload is copied into pOutput->pData. No size check
 * is done here, so the caller's buffer must hold at least the length reported
 * by getDataLength(). The row/column counts and the compressed flag are
 * copied, the cachedSize counters are reduced by the payload length, and the
 * staged buffer is freed.
 *
 * Always returns TSDB_CODE_SUCCESS.
 */
static int32_t getDataBlock(SDataSinkHandle* pHandle, SOutputData* pOutput) {
  SDataDispatchHandle* pDispatcher = (SDataDispatchHandle*)pHandle;
  if (NULL == pDispatcher->nextOutput.pData) {
    assert(pDispatcher->queryEnd);
    pOutput->useconds = pDispatcher->useconds;
    pOutput->precision = pDispatcher->pSchema->precision;
    pOutput->bufStatus = DS_BUF_EMPTY;
    pOutput->queryEnd = pDispatcher->queryEnd;
    return TSDB_CODE_SUCCESS;
  }

  SDataCacheEntry* pEntry = (SDataCacheEntry*)(pDispatcher->nextOutput.pData);
  memcpy(pOutput->pData, pEntry->data, pEntry->dataLen);
  pOutput->numOfRows = pEntry->numOfRows;
  pOutput->numOfCols = pEntry->numOfCols;
  pOutput->compressed = pEntry->compressed;

  // Adjust the counters before the free below: pEntry points into nextOutput.pData.
  atomic_sub_fetch_64(&pDispatcher->cachedSize, pEntry->dataLen);
  atomic_sub_fetch_64(&gDataSinkStat.cachedSize, pEntry->dataLen);

  taosMemoryFreeClear(pDispatcher->nextOutput.pData);  // todo persistent
  pOutput->bufStatus = updateStatus(pDispatcher);
  taosThreadMutexLock(&pDispatcher->mutex);
  pOutput->queryEnd = pDispatcher->queryEnd;
  pOutput->useconds = pDispatcher->useconds;
  pOutput->precision = pDispatcher->pSchema->precision;
  taosThreadMutexUnlock(&pDispatcher->mutex);

  return TSDB_CODE_SUCCESS;
}
X
Xiaoyu Wang 已提交
205

206 207
/*
 * Sink callback (fDestroy): release everything the dispatcher owns.
 *
 * Subtracts this handle's remaining cachedSize from the global counter, frees
 * the staged output buffer, drains the queue (freeing each payload and its
 * queue item), then closes the queue and destroys the mutex.
 * The handle itself is not freed here.
 *
 * Always returns TSDB_CODE_SUCCESS.
 */
static int32_t destroyDataSinker(SDataSinkHandle* pHandle) {
  SDataDispatchHandle* pDispatcher = (SDataDispatchHandle*)pHandle;
  atomic_sub_fetch_64(&gDataSinkStat.cachedSize, pDispatcher->cachedSize);
  taosMemoryFreeClear(pDispatcher->nextOutput.pData);
  while (!taosQueueEmpty(pDispatcher->pDataBlocks)) {
    SDataDispatchBuf* pBuf = NULL;
    taosReadQitem(pDispatcher->pDataBlocks, (void**)&pBuf);
    taosMemoryFreeClear(pBuf->pData);
    taosFreeQitem(pBuf);
  }
  taosCloseQueue(pDispatcher->pDataBlocks);
  taosThreadMutexDestroy(&pDispatcher->mutex);
  return TSDB_CODE_SUCCESS;
}

D
dapan1121 已提交
221
static int32_t getCacheSize(struct SDataSinkHandle* pHandle, uint64_t* size) {
D
dapan1121 已提交
222 223 224 225 226 227
  SDataDispatchHandle* pDispatcher = (SDataDispatchHandle*)pHandle;

  *size = atomic_load_64(&pDispatcher->cachedSize);
  return TSDB_CODE_SUCCESS;
}

X
Xiaoyu Wang 已提交
228
/*
 * Create a data dispatcher sink and return it through *pHandle.
 *
 * pManager   manager whose cfg bounds the queue length
 * pDataSink  plan node; its pInputDataBlockDesc becomes the dispatcher schema
 * pHandle    receives the new handle on success and is not written on failure
 *
 * Returns TSDB_CODE_SUCCESS, or TSDB_CODE_QRY_OUT_OF_MEMORY (also stored in
 * terrno) when the handle or its queue cannot be allocated.
 */
int32_t createDataDispatcher(SDataSinkManager* pManager, const SDataSinkNode* pDataSink, DataSinkHandle* pHandle) {
  SDataDispatchHandle* dispatcher = taosMemoryCalloc(1, sizeof(SDataDispatchHandle));
  if (NULL == dispatcher) {
    terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return TSDB_CODE_QRY_OUT_OF_MEMORY;
  }
  dispatcher->sink.fPut = putDataBlock;
  dispatcher->sink.fEndPut = endPut;
  dispatcher->sink.fGetLen = getDataLength;
  dispatcher->sink.fGetData = getDataBlock;
  dispatcher->sink.fDestroy = destroyDataSinker;
  dispatcher->sink.fGetCacheSize = getCacheSize;
  dispatcher->pManager = pManager;
  dispatcher->pSchema = pDataSink->pInputDataBlockDesc;
  dispatcher->status = DS_BUF_EMPTY;
  dispatcher->queryEnd = false;
  dispatcher->pDataBlocks = taosOpenQueue();
  if (NULL == dispatcher->pDataBlocks) {
    // Free the half-built handle; the mutex has not been initialised yet.
    taosMemoryFreeClear(dispatcher);
    terrno = TSDB_CODE_QRY_OUT_OF_MEMORY;
    return TSDB_CODE_QRY_OUT_OF_MEMORY;
  }
  // Initialise the mutex last so no failure path above has to destroy it.
  taosThreadMutexInit(&dispatcher->mutex, NULL);
  *pHandle = dispatcher;
  return TSDB_CODE_SUCCESS;
}