/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "vnd.h"

// SVSnapReader ========================================================
struct SVSnapReader {
H
Hongze Cheng 已提交
20 21 22
  SVnode *pVnode;
  int64_t sver;
  int64_t ever;
H
Hongze Cheng 已提交
23
  int64_t index;
H
Hongze Cheng 已提交
24 25
  // meta
  int8_t           metaDone;
H
Hongze Cheng 已提交
26
  SMetaSnapReader *pMetaReader;
H
Hongze Cheng 已提交
27 28
  // tsdb
  int8_t           tsdbDone;
H
Hongze Cheng 已提交
29
  STsdbSnapReader *pTsdbReader;
L
Liu Jicong 已提交
30 31 32 33 34 35 36 37 38 39
  // tq
  int8_t           tqHandleDone;
  STqSnapReader   *pTqSnapReader;
  int8_t           tqOffsetDone;
  STqOffsetReader *pTqOffsetReader;
  // stream
  int8_t              streamTaskDone;
  SStreamTaskReader  *pStreamTaskReader;
  int8_t              streamStateDone;
  SStreamStateReader *pStreamStateReader;
C
Cary Xu 已提交
40
  // rsma
C
Cary Xu 已提交
41
  int8_t           rsmaDone;
42
  SRSmaSnapReader *pRsmaReader;
H
Hongze Cheng 已提交
43 44
};

/**
 * Create a snapshot reader for a vnode.
 *
 * Only the top-level reader object is allocated here (zero-initialized); it
 * records the vnode and the two version bounds. No section reader is opened
 * by this function.
 *
 * @param pVnode    vnode to read from
 * @param sver      version bound stored in the reader
 * @param ever      version bound stored in the reader
 * @param ppReader  out: the new reader on success, NULL on failure
 * @return 0 on success, TSDB_CODE_OUT_OF_MEMORY if the allocation fails
 */
int32_t vnodeSnapReaderOpen(SVnode *pVnode, int64_t sver, int64_t ever, SVSnapReader **ppReader) {
  int32_t       code = 0;
  SVSnapReader *pReader = NULL;

  pReader = (SVSnapReader *)taosMemoryCalloc(1, sizeof(*pReader));
  if (pReader == NULL) {
    // Report the failure through the return value as well as terrno;
    // otherwise the caller would see success together with a NULL reader.
    code = TSDB_CODE_OUT_OF_MEMORY;
    terrno = code;
    goto _err;
  }
  pReader->pVnode = pVnode;
  pReader->sver = sver;
  pReader->ever = ever;

  vInfo("vgId:%d, vnode snapshot reader opened, sver:%" PRId64 " ever:%" PRId64, TD_VID(pVnode), sver, ever);
  *ppReader = pReader;
  return code;

_err:
  vError("vgId:%d, vnode snapshot reader open failed since %s", TD_VID(pVnode), tstrerror(code));
  *ppReader = NULL;
  return code;
}

/**
 * Destroy a snapshot reader.
 *
 * Any section reader that is still open (for example because the read was
 * abandoned before that section was fully drained) is closed first, then the
 * reader object itself is freed. Return values of the section close calls
 * are not inspected.
 *
 * @param pReader  reader to destroy; must not be used afterwards
 * @return always 0
 */
int32_t vnodeSnapReaderClose(SVSnapReader *pReader) {
  int32_t code = 0;

  if (pReader->pRsmaReader) {
    rsmaSnapReaderClose(&pReader->pRsmaReader);
  }

  // The TQ readers are opened lazily by vnodeSnapRead; release them too so
  // an early close does not leak them.
  if (pReader->pTqOffsetReader) {
    tqOffsetReaderClose(&pReader->pTqOffsetReader);
  }

  if (pReader->pTqSnapReader) {
    tqSnapReaderClose(&pReader->pTqSnapReader);
  }

  if (pReader->pTsdbReader) {
    tsdbSnapReaderClose(&pReader->pTsdbReader);
  }

  if (pReader->pMetaReader) {
    metaSnapReaderClose(&pReader->pMetaReader);
  }

  // NOTE(review): the stream task/state readers are never opened in this
  // file and no close routine for them is visible here, so they are left
  // untouched.

  vInfo("vgId:%d, vnode snapshot reader closed", TD_VID(pReader->pVnode));
  taosMemoryFree(pReader);
  return code;
}

/**
 * Return the next chunk of snapshot data for a vnode.
 *
 * Sections are drained in a fixed order: meta, tsdb, tq handles, tq offsets,
 * stream (placeholders, nothing is read yet) and finally rsma (only when
 * VND_IS_RSMA() holds for the vnode). A section's reader is opened on first
 * use; when its read call yields no data (*ppData == NULL) the section is
 * marked done, its reader is closed, and the next section is tried.
 *
 * @param pReader  reader created by vnodeSnapReaderOpen
 * @param ppData   out: the chunk, which starts with an SSnapDataHdr; NULL
 *                 once every section has been exhausted
 * @param nData    out: sizeof(SSnapDataHdr) + header size for a chunk,
 *                 0 when there is no more data
 * @return 0 on success (including end of data); otherwise the non-zero code
 *         returned by the failing open/read/close call. On failure *nData is
 *         not written by this function.
 */
int32_t vnodeSnapRead(SVSnapReader *pReader, uint8_t **ppData, uint32_t *nData) {
  int32_t code = 0;

  // META ==============
  if (!pReader->metaDone) {
    // open reader if not
    if (pReader->pMetaReader == NULL) {
      code = metaSnapReaderOpen(pReader->pVnode->pMeta, pReader->sver, pReader->ever, &pReader->pMetaReader);
      if (code) goto _err;
    }

    code = metaSnapRead(pReader->pMetaReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    // section exhausted
    pReader->metaDone = 1;
    code = metaSnapReaderClose(&pReader->pMetaReader);
    if (code) goto _err;
  }

  // TSDB ==============
  if (!pReader->tsdbDone) {
    // open if not
    if (pReader->pTsdbReader == NULL) {
      code = tsdbSnapReaderOpen(pReader->pVnode->pTsdb, pReader->sver, pReader->ever, SNAP_DATA_TSDB,
                                &pReader->pTsdbReader);
      if (code) goto _err;
    }

    code = tsdbSnapRead(pReader->pTsdbReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->tsdbDone = 1;
    code = tsdbSnapReaderClose(&pReader->pTsdbReader);
    if (code) goto _err;
  }

  // TQ ================
  if (!pReader->tqHandleDone) {
    if (pReader->pTqSnapReader == NULL) {
      code = tqSnapReaderOpen(pReader->pVnode->pTq, pReader->sver, pReader->ever, &pReader->pTqSnapReader);
      // Any non-zero code is a failure, as for every other section; never
      // continue to the read call with an unopened reader.
      if (code) goto _err;
    }

    code = tqSnapRead(pReader->pTqSnapReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->tqHandleDone = 1;
    code = tqSnapReaderClose(&pReader->pTqSnapReader);
    if (code) goto _err;
  }
  if (!pReader->tqOffsetDone) {
    if (pReader->pTqOffsetReader == NULL) {
      code = tqOffsetReaderOpen(pReader->pVnode->pTq, pReader->sver, pReader->ever, &pReader->pTqOffsetReader);
      if (code) goto _err;
    }

    code = tqOffsetSnapRead(pReader->pTqOffsetReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->tqOffsetDone = 1;
    code = tqOffsetReaderClose(&pReader->pTqOffsetReader);
    if (code) goto _err;
  }

  // STREAM ============
  // Placeholders: no stream data is read yet.
  if (!pReader->streamTaskDone) {
  }
  if (!pReader->streamStateDone) {
  }

  // RSMA ==============
  if (VND_IS_RSMA(pReader->pVnode) && !pReader->rsmaDone) {
    // open if not
    if (pReader->pRsmaReader == NULL) {
      code = rsmaSnapReaderOpen(pReader->pVnode->pSma, pReader->sver, pReader->ever, &pReader->pRsmaReader);
      if (code) goto _err;
    }

    code = rsmaSnapRead(pReader->pRsmaReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->rsmaDone = 1;
    code = rsmaSnapReaderClose(&pReader->pRsmaReader);
    if (code) goto _err;
  }

  // every section is exhausted
  *ppData = NULL;
  *nData = 0;

_exit:
  if (*ppData) {
    SSnapDataHdr *pHdr = (SSnapDataHdr *)(*ppData);

    // stamp the chunk with its 1-based sequence number
    pReader->index++;
    *nData = sizeof(SSnapDataHdr) + pHdr->size;
    pHdr->index = pReader->index;
    vInfo("vgId:%d, vnode snapshot read data,index:%" PRId64 " type:%d nData:%d ", TD_VID(pReader->pVnode),
          pReader->index, pHdr->type, *nData);
  } else {
    vInfo("vgId:%d, vnode snapshot read data end, index:%" PRId64, TD_VID(pReader->pVnode), pReader->index);
  }
  return code;

_err:
  vError("vgId:%d, vnode snapshot read failed since %s", TD_VID(pReader->pVnode), tstrerror(code));
  return code;
}

// SVSnapWriter ========================================================
struct SVSnapWriter {
  SVnode *pVnode;
  int64_t sver;
  int64_t ever;
H
Hongze Cheng 已提交
231
  int64_t commitID;
H
Hongze Cheng 已提交
232
  int64_t index;
H
Hongze Cheng 已提交
233 234 235 236
  // meta
  SMetaSnapWriter *pMetaSnapWriter;
  // tsdb
  STsdbSnapWriter *pTsdbSnapWriter;
L
Liu Jicong 已提交
237 238 239 240 241 242
  // tq
  STqSnapWriter   *pTqSnapWriter;
  STqOffsetWriter *pTqOffsetWriter;
  // stream
  SStreamTaskWriter  *pStreamTaskWriter;
  SStreamStateWriter *pStreamStateWriter;
C
Cary Xu 已提交
243
  // rsma
244
  SRSmaSnapWriter *pRsmaSnapWriter;
H
Hongze Cheng 已提交
245 246
};

/**
 * Create a snapshot writer for a vnode.
 *
 * Steps: allocate a zeroed writer, run vnodeSyncCommit() on the vnode, then
 * increment the vnode's commit ID and remember the new value in the writer.
 *
 * @param pVnode    vnode that will receive the snapshot
 * @param sver      version bound stored in the writer
 * @param ever      version bound stored in the writer
 * @param ppWriter  out: the new writer on success, NULL on failure
 * @return 0 on success; TSDB_CODE_OUT_OF_MEMORY if allocation fails, or the
 *         non-zero code returned by vnodeSyncCommit()
 */
int32_t vnodeSnapWriterOpen(SVnode *pVnode, int64_t sver, int64_t ever, SVSnapWriter **ppWriter) {
  int32_t       code = 0;
  SVSnapWriter *pNew = (SVSnapWriter *)taosMemoryCalloc(1, sizeof(*pNew));

  if (pNew == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }

  pNew->pVnode = pVnode;
  pNew->sver = sver;
  pNew->ever = ever;

  // commit pending state before the snapshot is applied
  code = vnodeSyncCommit(pVnode);
  if (code) {
    taosMemoryFree(pNew);
    goto _err;
  }

  // bump the vnode commit ID and record the new value
  pNew->commitID = ++pVnode->state.commitID;

  vInfo("vgId:%d, vnode snapshot writer opened, sver:%" PRId64 " ever:%" PRId64 " commit id:%" PRId64, TD_VID(pVnode),
        sver, ever, pNew->commitID);
  *ppWriter = pNew;
  return code;

_err:
  vError("vgId:%d, vnode snapshot writer open failed since %s", TD_VID(pVnode), tstrerror(code));
  *ppWriter = NULL;
  return code;
}

/**
 * Finish a snapshot write and destroy the writer.
 *
 * Open sub-writers are closed in the order meta, tsdb, rsma, each receiving
 * the rollback flag. When not rolling back, the vnode's committed/applied
 * versions are set to the writer's `ever`, both term fields are taken from
 * pSnapshot->lastApplyTerm, the vnode info is saved and committed under the
 * vnode directory, and vnodeBegin() is called. The rollback branch only
 * asserts.
 *
 * @param pWriter    writer created by vnodeSnapWriterOpen
 * @param rollback   non-zero to discard the snapshot instead of committing
 * @param pSnapshot  source of lastApplyTerm; dereferenced when !rollback
 * @return 0 on success, otherwise the non-zero code of the failing step
 *
 * NOTE(review): on failure the writer is not freed and later sub-writers are
 * not closed — confirm what the caller is expected to do in that case.
 */
int32_t vnodeSnapWriterClose(SVSnapWriter *pWriter, int8_t rollback, SSnapshot *pSnapshot) {
  int32_t code = 0;
  SVnode *pVnode = pWriter->pVnode;

  // close whichever sub-writers were opened
  if (pWriter->pMetaSnapWriter) {
    code = metaSnapWriterClose(&pWriter->pMetaSnapWriter, rollback);
    if (code) goto _err;
  }

  if (pWriter->pTsdbSnapWriter) {
    code = tsdbSnapWriterClose(&pWriter->pTsdbSnapWriter, rollback);
    if (code) goto _err;
  }

  if (pWriter->pRsmaSnapWriter) {
    code = rsmaSnapWriterClose(&pWriter->pRsmaSnapWriter, rollback);
    if (code) goto _err;
  }

  if (rollback) {
    tAssert(0);
  } else {
    SVnodeInfo info = {0};
    char       dir[TSDB_FILENAME_LEN];

    // advance the in-memory vnode state to the end of the snapshot
    pVnode->state.committed = pWriter->ever;
    pVnode->state.applied = pWriter->ever;
    pVnode->state.applyTerm = pSnapshot->lastApplyTerm;
    pVnode->state.commitTerm = pSnapshot->lastApplyTerm;

    // persist the matching vnode info
    info.config = pVnode->config;
    info.state.committed = pVnode->state.applied;
    info.state.commitTerm = pVnode->state.applyTerm;
    info.state.commitID = pVnode->state.commitID;
    snprintf(dir, TSDB_FILENAME_LEN, "%s%s%s", tfsGetPrimaryPath(pVnode->pTfs), TD_DIRSEP, pVnode->path);

    code = vnodeSaveInfo(dir, &info);
    if (code) goto _err;

    code = vnodeCommitInfo(dir, &info);
    if (code) goto _err;

    vnodeBegin(pVnode);
  }

  vInfo("vgId:%d, vnode snapshot writer closed, rollback:%d", TD_VID(pVnode), rollback);
  taosMemoryFree(pWriter);
  return code;

_err:
  vError("vgId:%d, vnode snapshot writer close failed since %s", TD_VID(pWriter->pVnode), tstrerror(code));
  return code;
}

/**
 * Apply one snapshot chunk to the vnode.
 *
 * The chunk begins with an SSnapDataHdr. Its size must match nData and its
 * index must be exactly one past the last accepted index (both asserted).
 * The header type selects the sub-writer, which is opened on first use:
 * meta, tsdb (also used for delete data) or rsma. TQ and stream chunk types
 * are accepted but currently ignored, as is any unknown type.
 *
 * @param pWriter  writer created by vnodeSnapWriterOpen
 * @param pData    chunk bytes, header first
 * @param nData    total chunk length in bytes
 * @return 0 on success, otherwise the non-zero code of the failing
 *         sub-writer open or write call
 */
int32_t vnodeSnapWrite(SVSnapWriter *pWriter, uint8_t *pData, uint32_t nData) {
  int32_t       code = 0;
  SVnode       *pVnode = pWriter->pVnode;
  SSnapDataHdr *pHdr = (SSnapDataHdr *)pData;

  // chunks must be well-formed and arrive strictly in sequence
  ASSERT(pHdr->size + sizeof(SSnapDataHdr) == nData);
  ASSERT(pHdr->index == pWriter->index + 1);
  pWriter->index = pHdr->index;

  vInfo("vgId:%d, vnode snapshot write data, index:%" PRId64 " type:%d nData:%d", TD_VID(pVnode), pHdr->index,
        pHdr->type, nData);

  switch (pHdr->type) {
    case SNAP_DATA_META:
      // meta
      if (pWriter->pMetaSnapWriter == NULL) {
        code = metaSnapWriterOpen(pVnode->pMeta, pWriter->sver, pWriter->ever, &pWriter->pMetaSnapWriter);
        if (code) goto _err;
      }

      code = metaSnapWrite(pWriter->pMetaSnapWriter, pData, nData);
      if (code) goto _err;
      break;

    case SNAP_DATA_TSDB:
    case SNAP_DATA_DEL:
      // tsdb
      if (pWriter->pTsdbSnapWriter == NULL) {
        code = tsdbSnapWriterOpen(pVnode->pTsdb, pWriter->sver, pWriter->ever, &pWriter->pTsdbSnapWriter);
        if (code) goto _err;
      }

      code = tsdbSnapWrite(pWriter->pTsdbSnapWriter, pData, nData);
      if (code) goto _err;
      break;

    case SNAP_DATA_TQ_HANDLE:
    case SNAP_DATA_TQ_OFFSET:
    case SNAP_DATA_STREAM_TASK:
    case SNAP_DATA_STREAM_STATE:
      // placeholders: these chunk types are not written anywhere yet
      break;

    case SNAP_DATA_RSMA1:
    case SNAP_DATA_RSMA2:
    case SNAP_DATA_QTASK:
      // rsma1/rsma2/qtask for rsma
      if (pWriter->pRsmaSnapWriter == NULL) {
        code = rsmaSnapWriterOpen(pVnode->pSma, pWriter->sver, pWriter->ever, &pWriter->pRsmaSnapWriter);
        if (code) goto _err;
      }

      code = rsmaSnapWrite(pWriter->pRsmaSnapWriter, pData, nData);
      if (code) goto _err;
      break;

    default:
      break;
  }

  return code;

_err:
  vError("vgId:%d, vnode snapshot write failed since %s, index:%" PRId64 " type:%d nData:%d", TD_VID(pVnode),
         tstrerror(code), pHdr->index, pHdr->type, nData);
  return code;
}