vnodeSnapshot.c 10.9 KB
Newer Older
H
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

H
Hongze Cheng 已提交
16
#include "vnd.h"
H
Hongze Cheng 已提交
17

H
Hongze Cheng 已提交
18
// SVSnapReader ========================================================
H
Hongze Cheng 已提交
19
struct SVSnapReader {
H
Hongze Cheng 已提交
20 21 22
  SVnode *pVnode;
  int64_t sver;
  int64_t ever;
H
Hongze Cheng 已提交
23
  int64_t index;
H
Hongze Cheng 已提交
24 25
  // meta
  int8_t           metaDone;
H
Hongze Cheng 已提交
26
  SMetaSnapReader *pMetaReader;
H
Hongze Cheng 已提交
27 28
  // tsdb
  int8_t           tsdbDone;
H
Hongze Cheng 已提交
29
  STsdbSnapReader *pTsdbReader;
L
Liu Jicong 已提交
30 31 32 33 34 35 36 37 38 39
  // tq
  int8_t           tqHandleDone;
  STqSnapReader   *pTqSnapReader;
  int8_t           tqOffsetDone;
  STqOffsetReader *pTqOffsetReader;
  // stream
  int8_t              streamTaskDone;
  SStreamTaskReader  *pStreamTaskReader;
  int8_t              streamStateDone;
  SStreamStateReader *pStreamStateReader;
C
Cary Xu 已提交
40
  // rsma
C
Cary Xu 已提交
41
  int8_t           rsmaDone;
42
  SRSmaSnapReader *pRsmaReader;
H
Hongze Cheng 已提交
43 44
};

H
Hongze Cheng 已提交
45
/**
 * Allocate a vnode snapshot reader and record the requested version range.
 *
 * No sub-reader is opened here; the returned object is zero-initialized apart
 * from pVnode/sver/ever.
 *
 * @param pVnode   vnode to read from
 * @param sver     start version, stored in the reader
 * @param ever     end version, stored in the reader
 * @param ppReader out: the new reader on success, NULL on failure
 * @return 0 on success, TSDB_CODE_OUT_OF_MEMORY if the allocation fails
 */
int32_t vnodeSnapReaderOpen(SVnode *pVnode, int64_t sver, int64_t ever, SVSnapReader **ppReader) {
  int32_t       code = 0;
  SVSnapReader *pReader = NULL;

  pReader = (SVSnapReader *)taosMemoryCalloc(1, sizeof(*pReader));
  if (pReader == NULL) {
    // Report the failure through the return value as well as terrno; returning
    // 0 here would hand the caller a NULL reader together with "success".
    code = TSDB_CODE_OUT_OF_MEMORY;
    terrno = code;
    goto _err;
  }
  pReader->pVnode = pVnode;
  pReader->sver = sver;
  pReader->ever = ever;

  vInfo("vgId:%d, vnode snapshot reader opened, sver:%" PRId64 " ever:%" PRId64, TD_VID(pVnode), sver, ever);
  *ppReader = pReader;
  return code;

_err:
  vError("vgId:%d, vnode snapshot reader open failed since %s", TD_VID(pVnode), tstrerror(code));
  *ppReader = NULL;
  return code;
}

H
Hongze Cheng 已提交
68
/**
 * Close a vnode snapshot reader and release it.
 *
 * Any sub-reader that is still open (for example because reading stopped
 * before that component reported end-of-data) is closed first, then the
 * reader object itself is freed.
 *
 * @param pReader reader returned by vnodeSnapReaderOpen(); invalid after return
 * @return always 0
 */
int32_t vnodeSnapReaderClose(SVSnapReader *pReader) {
  int32_t code = 0;

  if (pReader->pRsmaReader) {
    rsmaSnapReaderClose(&pReader->pRsmaReader);
  }

  // The tq readers are opened lazily by vnodeSnapRead(); close them here too so
  // an interrupted session does not leak them.
  if (pReader->pTqOffsetReader) {
    tqOffsetReaderClose(&pReader->pTqOffsetReader);
  }

  if (pReader->pTqSnapReader) {
    tqSnapReaderClose(&pReader->pTqSnapReader);
  }

  if (pReader->pTsdbReader) {
    tsdbSnapReaderClose(&pReader->pTsdbReader);
  }

  if (pReader->pMetaReader) {
    metaSnapReaderClose(&pReader->pMetaReader);
  }

  vInfo("vgId:%d, vnode snapshot reader closed", TD_VID(pReader->pVnode));
  taosMemoryFree(pReader);
  return code;
}

H
Hongze Cheng 已提交
88
/**
 * Fetch the next block of snapshot data.
 *
 * Components are visited in the order meta, tsdb, tq handle, tq offset,
 * (stream: nothing is read yet), rsma. A component's sub-reader is opened on
 * first use; when it yields no data it is closed and its "done" flag is set so
 * later calls skip it.
 *
 * @param pReader reader returned by vnodeSnapReaderOpen()
 * @param ppData  out: next data block (starts with an SSnapDataHdr), or NULL
 *                when every component is exhausted
 * @param nData   out: size of *ppData in bytes (header + payload), 0 at end
 * @return 0 on success (including end-of-data); otherwise the error code of
 *         the failing sub-reader call, in which case *ppData / *nData are not
 *         set by this function
 */
int32_t vnodeSnapRead(SVSnapReader *pReader, uint8_t **ppData, uint32_t *nData) {
  int32_t code = 0;

  // META ==============
  if (!pReader->metaDone) {
    // open reader if not
    if (pReader->pMetaReader == NULL) {
      code = metaSnapReaderOpen(pReader->pVnode->pMeta, pReader->sver, pReader->ever, &pReader->pMetaReader);
      if (code) goto _err;
    }

    code = metaSnapRead(pReader->pMetaReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->metaDone = 1;
    code = metaSnapReaderClose(&pReader->pMetaReader);
    if (code) goto _err;
  }

  // TSDB ==============
  if (!pReader->tsdbDone) {
    // open if not
    if (pReader->pTsdbReader == NULL) {
      code = tsdbSnapReaderOpen(pReader->pVnode->pTsdb, pReader->sver, pReader->ever, SNAP_DATA_TSDB,
                                &pReader->pTsdbReader);
      if (code) goto _err;
    }

    code = tsdbSnapRead(pReader->pTsdbReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->tsdbDone = 1;
    code = tsdbSnapReaderClose(&pReader->pTsdbReader);
    if (code) goto _err;
  }

  // TQ ================
  if (!pReader->tqHandleDone) {
    if (pReader->pTqSnapReader == NULL) {
      code = tqSnapReaderOpen(pReader->pVnode->pTq, pReader->sver, pReader->ever, &pReader->pTqSnapReader);
      if (code < 0) goto _err;
    }

    code = tqSnapRead(pReader->pTqSnapReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->tqHandleDone = 1;
    code = tqSnapReaderClose(&pReader->pTqSnapReader);
    if (code) goto _err;
  }
  if (!pReader->tqOffsetDone) {
    if (pReader->pTqOffsetReader == NULL) {
      code = tqOffsetReaderOpen(pReader->pVnode->pTq, pReader->sver, pReader->ever, &pReader->pTqOffsetReader);
      if (code < 0) goto _err;
    }

    code = tqOffsetSnapRead(pReader->pTqOffsetReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    // Mark the *offset* stage finished. Setting tqHandleDone here would leave
    // this stage permanently "not done", so it would be reopened and read
    // again on the next call.
    pReader->tqOffsetDone = 1;
    code = tqOffsetReaderClose(&pReader->pTqOffsetReader);
    if (code) goto _err;
  }

  // STREAM ============
  // Placeholders: no stream task/state data is read here.
  if (!pReader->streamTaskDone) {
  }
  if (!pReader->streamStateDone) {
  }

  // RSMA ==============
  if (VND_IS_RSMA(pReader->pVnode) && !pReader->rsmaDone) {
    // open if not
    if (pReader->pRsmaReader == NULL) {
      code = rsmaSnapReaderOpen(pReader->pVnode->pSma, pReader->sver, pReader->ever, &pReader->pRsmaReader);
      if (code) goto _err;
    }

    code = rsmaSnapRead(pReader->pRsmaReader, ppData);
    if (code) goto _err;
    if (*ppData) goto _exit;

    pReader->rsmaDone = 1;
    code = rsmaSnapReaderClose(&pReader->pRsmaReader);
    if (code) goto _err;
  }

  // every component is exhausted
  *ppData = NULL;
  *nData = 0;

_exit:
  if (*ppData) {
    SSnapDataHdr *pHdr = (SSnapDataHdr *)(*ppData);

    // stamp the block with its position in the overall stream
    pReader->index++;
    *nData = sizeof(SSnapDataHdr) + pHdr->size;
    pHdr->index = pReader->index;
    vInfo("vgId:%d, vnode snapshot read data,index:%" PRId64 " type:%d nData:%d ", TD_VID(pReader->pVnode),
          pReader->index, pHdr->type, *nData);
  } else {
    vInfo("vgId:%d, vnode snapshot read data end, index:%" PRId64, TD_VID(pReader->pVnode), pReader->index);
  }
  return code;

_err:
  vError("vgId:%d, vnode snapshot read failed since %s", TD_VID(pReader->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
226
// SVSnapWriter ========================================================
H
Hongze Cheng 已提交
227 228 229 230
struct SVSnapWriter {
  SVnode *pVnode;
  int64_t sver;
  int64_t ever;
H
Hongze Cheng 已提交
231
  int64_t commitID;
H
Hongze Cheng 已提交
232
  int64_t index;
H
Hongze Cheng 已提交
233 234 235 236
  // meta
  SMetaSnapWriter *pMetaSnapWriter;
  // tsdb
  STsdbSnapWriter *pTsdbSnapWriter;
L
Liu Jicong 已提交
237 238 239 240 241 242
  // tq
  STqSnapWriter   *pTqSnapWriter;
  STqOffsetWriter *pTqOffsetWriter;
  // stream
  SStreamTaskWriter  *pStreamTaskWriter;
  SStreamStateWriter *pStreamStateWriter;
C
Cary Xu 已提交
243
  // rsma
244
  SRSmaSnapWriter *pRsmaSnapWriter;
H
Hongze Cheng 已提交
245 246
};

H
Hongze Cheng 已提交
247
/**
 * Allocate a vnode snapshot writer.
 *
 * The vnode is committed first, then its commit ID is incremented and the new
 * value is remembered in the writer.
 *
 * @param pVnode   vnode that will receive the snapshot
 * @param sver     start version, stored in the writer
 * @param ever     end version, stored in the writer
 * @param ppWriter out: the new writer on success, NULL on failure
 * @return 0 on success; TSDB_CODE_OUT_OF_MEMORY if the allocation fails, or
 *         the error returned by vnodeCommit()
 */
int32_t vnodeSnapWriterOpen(SVnode *pVnode, int64_t sver, int64_t ever, SVSnapWriter **ppWriter) {
  int32_t       code = 0;
  SVSnapWriter *pWriter = NULL;

  // alloc
  pWriter = (SVSnapWriter *)taosMemoryCalloc(1, sizeof(*pWriter));
  if (pWriter == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _err;
  }
  pWriter->pVnode = pVnode;
  pWriter->sver = sver;
  pWriter->ever = ever;

  // commit it
  code = vnodeCommit(pVnode);
  if (code) goto _err;

  // inc commit ID
  pVnode->state.commitID++;
  pWriter->commitID = pVnode->state.commitID;

  vInfo("vgId:%d, vnode snapshot writer opened, sver:%" PRId64 " ever:%" PRId64 " commit id:%" PRId64, TD_VID(pVnode),
        sver, ever, pWriter->commitID);
  *ppWriter = pWriter;
  return code;

_err:
  vError("vgId:%d, vnode snapshot writer open failed since %s", TD_VID(pVnode), tstrerror(code));
  // The caller only ever sees NULL on failure, so the writer has to be released
  // here (it is still NULL when the allocation itself failed).
  if (pWriter) taosMemoryFree(pWriter);
  *ppWriter = NULL;
  return code;
}

280
/**
 * Finish a snapshot write session.
 *
 * Closes the meta, tsdb and rsma sub-writers that were opened (passing the
 * rollback flag through). When not rolling back, it then updates the vnode's
 * committed/applied state from the writer and the snapshot, persists the vnode
 * info, and calls vnodeBegin(). The rollback branch is just ASSERT(0).
 *
 * @param pWriter   writer returned by vnodeSnapWriterOpen(); freed on success
 * @param rollback  non-zero to discard the snapshot instead of applying it
 * @param pSnapshot supplies lastApplyTerm; dereferenced only when !rollback
 * @return 0 on success, otherwise the first error code encountered
 *
 * NOTE(review): on the error path pWriter is not freed — confirm that callers
 * expect to keep ownership after a failed close.
 */
int32_t vnodeSnapWriterClose(SVSnapWriter *pWriter, int8_t rollback, SSnapshot *pSnapshot) {
  SVnode *pVnode = pWriter->pVnode;
  int32_t code = 0;

  // close the sub-writers: meta, then tsdb, then rsma
  if (pWriter->pMetaSnapWriter != NULL) {
    code = metaSnapWriterClose(&pWriter->pMetaSnapWriter, rollback);
    if (code != 0) goto _err;
  }

  if (pWriter->pTsdbSnapWriter != NULL) {
    code = tsdbSnapWriterClose(&pWriter->pTsdbSnapWriter, rollback);
    if (code != 0) goto _err;
  }

  if (pWriter->pRsmaSnapWriter != NULL) {
    code = rsmaSnapWriterClose(&pWriter->pRsmaSnapWriter, rollback);
    if (code != 0) goto _err;
  }

  if (rollback) {
    ASSERT(0);
  } else {
    char       dir[TSDB_FILENAME_LEN];
    SVnodeInfo info = {0};

    // the vnode now sits at the snapshot's end version and term
    pVnode->state.committed = pWriter->ever;
    pVnode->state.applied = pWriter->ever;
    pVnode->state.applyTerm = pSnapshot->lastApplyTerm;
    pVnode->state.commitTerm = pSnapshot->lastApplyTerm;

    // build the info record to persist
    info.config = pVnode->config;
    info.state.committed = pVnode->state.applied;
    info.state.commitTerm = pVnode->state.applyTerm;
    info.state.commitID = pVnode->state.commitID;

    snprintf(dir, TSDB_FILENAME_LEN, "%s%s%s", tfsGetPrimaryPath(pVnode->pTfs), TD_DIRSEP, pVnode->path);

    code = vnodeSaveInfo(dir, &info);
    if (code != 0) goto _err;

    code = vnodeCommitInfo(dir, &info);
    if (code != 0) goto _err;

    vnodeBegin(pVnode);
  }

  vInfo("vgId:%d, vnode snapshot writer closed, rollback:%d", TD_VID(pVnode), rollback);
  taosMemoryFree(pWriter);
  return code;

_err:
  vError("vgId:%d, vnode snapshot writer close failed since %s", TD_VID(pWriter->pVnode), tstrerror(code));
  return code;
}

H
Hongze Cheng 已提交
334
/**
 * Apply one snapshot data block to the vnode.
 *
 * The block must start with an SSnapDataHdr whose size matches nData and whose
 * index is exactly one past the previously written block (both are ASSERTed).
 * The block is routed by header type to the meta, tsdb or rsma sub-writer,
 * which is opened on first use. TQ and stream block types are accepted but
 * ignored, as is any unrecognized type.
 *
 * @param pWriter writer returned by vnodeSnapWriterOpen()
 * @param pData   data block, beginning with SSnapDataHdr
 * @param nData   total size of pData in bytes
 * @return 0 on success, otherwise the error code of the failing sub-writer call
 */
int32_t vnodeSnapWrite(SVSnapWriter *pWriter, uint8_t *pData, uint32_t nData) {
  SVnode       *pVnode = pWriter->pVnode;
  SSnapDataHdr *pHdr = (SSnapDataHdr *)pData;
  int32_t       code = 0;

  ASSERT(pHdr->size + sizeof(SSnapDataHdr) == nData);
  ASSERT(pHdr->index == pWriter->index + 1);
  pWriter->index = pHdr->index;

  vInfo("vgId:%d, vnode snapshot write data, index:%" PRId64 " type:%d nData:%d", TD_VID(pVnode), pHdr->index,
        pHdr->type, nData);

  switch (pHdr->type) {
    case SNAP_DATA_META:
      // meta
      if (pWriter->pMetaSnapWriter == NULL) {
        code = metaSnapWriterOpen(pVnode->pMeta, pWriter->sver, pWriter->ever, &pWriter->pMetaSnapWriter);
        if (code != 0) break;
      }
      code = metaSnapWrite(pWriter->pMetaSnapWriter, pData, nData);
      break;

    case SNAP_DATA_TSDB:
    case SNAP_DATA_DEL:
      // tsdb
      if (pWriter->pTsdbSnapWriter == NULL) {
        code = tsdbSnapWriterOpen(pVnode->pTsdb, pWriter->sver, pWriter->ever, &pWriter->pTsdbSnapWriter);
        if (code != 0) break;
      }
      code = tsdbSnapWrite(pWriter->pTsdbSnapWriter, pData, nData);
      break;

    case SNAP_DATA_TQ_HANDLE:
    case SNAP_DATA_TQ_OFFSET:
    case SNAP_DATA_STREAM_TASK:
    case SNAP_DATA_STREAM_STATE:
      // nothing is written for these types
      break;

    case SNAP_DATA_RSMA1:
    case SNAP_DATA_RSMA2:
    case SNAP_DATA_QTASK:
      // rsma1/rsma2/qtask for rsma
      if (pWriter->pRsmaSnapWriter == NULL) {
        code = rsmaSnapWriterOpen(pVnode->pSma, pWriter->sver, pWriter->ever, &pWriter->pRsmaSnapWriter);
        if (code != 0) break;
      }
      code = rsmaSnapWrite(pWriter->pRsmaSnapWriter, pData, nData);
      break;

    default:
      break;
  }

  if (code != 0) {
    vError("vgId:%d, vnode snapshot write failed since %s, index:%" PRId64 " type:%d nData:%d", TD_VID(pVnode),
           tstrerror(code), pHdr->index, pHdr->type, nData);
  }
  return code;
}