walRead.c 19.2 KB
Newer Older
H
refact  
Hongze Cheng 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "taoserror.h"
L
Liu Jicong 已提交
17
#include "walInt.h"
S
Shengliang Guan 已提交
18

L
Liu Jicong 已提交
19 20 21 22
static int32_t walFetchHeadNew(SWalReader *pRead, int64_t fetchVer);
static int32_t walFetchBodyNew(SWalReader *pRead);
static int32_t walSkipFetchBodyNew(SWalReader *pRead);

L
Liu Jicong 已提交
23
/**
 * Allocate and initialise a reader attached to a WAL.
 *
 * @param pWal  WAL handle stored in the reader (the pointer is kept, not copied).
 * @param cond  optional filter condition; copied by value when non-NULL,
 *              otherwise the filter flags set below are cleared.
 * @return the new reader, or NULL with terrno = TSDB_CODE_OUT_OF_MEMORY when
 *         either allocation fails.
 */
SWalReader *walOpenReader(SWal *pWal, SWalFilterCond *cond) {
  SWalReader *pReader = taosMemoryCalloc(1, sizeof(SWalReader));
  if (pReader == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // Allocate the head buffer before the mutex is initialised, so the failure
  // path below never frees a reader that still owns an initialised mutex.
  pReader->pHead = taosMemoryMalloc(sizeof(SWalCkHead));
  if (pReader->pHead == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFree(pReader);
    return NULL;
  }

  pReader->pWal = pWal;
  pReader->readerId = tGenIdPI64();
  pReader->pIdxFile = NULL;
  pReader->pLogFile = NULL;
  // -1 marks "no version / no file selected yet".
  pReader->curVersion = -1;
  pReader->curFileFirstVer = -1;
  // capacity tracks the body bytes available behind pHead; none yet.
  pReader->capacity = 0;

  if (cond) {
    pReader->cond = *cond;
  } else {
    pReader->cond.scanNotApplied = 0;
    pReader->cond.scanMeta = 0;
    pReader->cond.enableRef = 0;
  }

  taosThreadMutexInit(&pReader->mutex, NULL);

  // NOTE: registration of the reader in pWal->pRefHash (for cond.enableRef)
  // is currently disabled.
  return pReader;
}

62 63 64 65 66
/**
 * Close a reader: closes its index and log files and frees the head buffer
 * and the reader itself. Passing NULL is a no-op.
 *
 * NOTE(review): the mutex initialised in walOpenReader() is not destroyed
 * here - confirm whether a destroy call is required on all platforms.
 */
void walCloseReader(SWalReader *pReader) {
  if (pReader == NULL) {
    return;
  }

  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);
  taosMemoryFreeClear(pReader->pHead);
  taosMemoryFree(pReader);
}

69 70 71 72
/**
 * Advance the reader to the next message that passes the reader's filter.
 *
 * Starting at the reader's current version, heads are fetched one by one up to
 * the applied version. Submit messages, delete messages (when cond.deleteMsg
 * is 1) and meta messages (when cond.scanMeta is set) have their body fetched
 * and end the scan; every other message body is skipped.
 *
 * @return 0 when a matching message (head + body) is loaded into pReader->pHead;
 *         -1 when the current version is beyond the applied version
 *         (terrno = TSDB_CODE_WAL_LOG_NOT_EXIST), when a fetch/skip helper
 *         fails, or when the applied version is passed without a match.
 */
int32_t walNextValidMsg(SWalReader *pReader) {
  SWal   *pWal = pReader->pWal;
  int64_t fetchVer = pReader->curVersion;
  int64_t lastVer = walGetLastVer(pWal);
  int64_t committedVer = walGetCommittedVer(pWal);
  int64_t appliedVer = walGetAppliedVer(pWal);

  wDebug("vgId:%d, wal start to fetch, index:%" PRId64 ", last index:%" PRId64 " commit index:%" PRId64
         ", applied index:%" PRId64,
         pWal->cfg.vgId, fetchVer, lastVer, committedVer, appliedVer);

  if (fetchVer > appliedVer) {
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  // The guard above guarantees at least one iteration.
  do {
    if (walFetchHeadNew(pReader, fetchVer) < 0) {
      return -1;
    }

    const int32_t type = pReader->pHead->head.msgType;
    const bool    wanted = (type == TDMT_VND_SUBMIT) ||
                        ((type == TDMT_VND_DELETE) && (pReader->cond.deleteMsg == 1)) ||
                        (IS_META_MSG(type) && pReader->cond.scanMeta);

    if (wanted) {
      if (walFetchBodyNew(pReader) < 0) {
        return -1;
      }
      return 0;
    }

    if (walSkipFetchBodyNew(pReader) < 0) {
      return -1;
    }

    // The skip helper advanced curVersion; continue from there.
    fetchVer = pReader->curVersion;
  } while (fetchVer <= appliedVer);

  return -1;
}
L
Liu Jicong 已提交
105

106
/** Return the reader's current version cursor (curVersion). */
int64_t walReaderGetCurrentVer(const SWalReader *pReader) {
  const int64_t current = pReader->curVersion;
  return current;
}
107
/** Return the first version of the underlying WAL, as reported by walGetFirstVer(). */
int64_t walReaderGetValidFirstVer(const SWalReader *pReader) {
  const int64_t firstVer = walGetFirstVer(pReader->pWal);
  return firstVer;
}
108 109 110 111 112 113 114 115
/** Atomically record the version the reader should skip to. */
void walReaderSetSkipToVersion(SWalReader *pReader, int64_t ver) {
  atomic_store_64(&pReader->skipToVersion, ver);
}

/**
 * Fetch the pending skip-to version and clear it (reset to 0).
 *
 * This function is NOT multi-thread safe, and does not need to be: the read
 * and the reset are two plain, non-atomic accesses.
 */
int64_t walReaderGetSkipToVersion(SWalReader *pReader) {
  const int64_t pending = pReader->skipToVersion;

  pReader->skipToVersion = 0;
  return pending;
}
116

117 118 119 120 121 122 123
/**
 * Report the version range this reader may consume.
 *
 * @param sver  out: first version of the WAL.
 * @param ever  out: last version when cond.scanUncommited is set, otherwise
 *              the committed version.
 */
void walReaderValidVersionRange(SWalReader *pReader, int64_t *sver, int64_t *ever) {
  *sver = walGetFirstVer(pReader->pWal);

  const int64_t lastVer = walGetLastVer(pReader->pWal);
  const int64_t committedVer = walGetCommittedVer(pReader->pWal);

  if (pReader->cond.scanUncommited) {
    *ever = lastVer;
  } else {
    *ever = committedVer;
  }
}

124 125 126 127 128 129
/**
 * Clamp an offset to the WAL's first version.
 *
 * If the offset's version is smaller than the first version of the WAL, it is
 * raised to that first version. The first version is read while holding the
 * WAL mutex.
 */
void walReaderVerifyOffset(SWalReader *pWalReader, STqOffsetVal *pOffset) {
  SWal *pWal = pWalReader->pWal;

  taosThreadMutexLock(&pWal->mutex);
  const int64_t oldestVer = walGetFirstVer(pWal);
  taosThreadMutexUnlock(&pWal->mutex);

  if (pOffset->version < oldestVer) {
    pOffset->version = oldestVer;
  }
}

135
/**
 * Position the reader's log file at the record for version `ver`.
 *
 * The index file holds one fixed-size SWalIdxEntry per version, starting at
 * `fileFirstVer`; the entry for `ver` is read and its `offset` is used to seek
 * the log file.
 *
 * @param pReader       reader whose pIdxFile / pLogFile are already open.
 * @param fileFirstVer  first version stored in the currently opened file pair.
 * @param ver           version to seek to.
 * @return the value returned by the log-file seek (>= 0) on success; -1 on
 *         failure with terrno set (system error, or
 *         TSDB_CODE_WAL_FILE_CORRUPTED on a short index read).
 */
static int64_t walReadSeekFilePos(SWalReader *pReader, int64_t fileFirstVer, int64_t ver) {
  int64_t ret = 0;

  TdFilePtr pIdxTFile = pReader->pIdxFile;
  TdFilePtr pLogTFile = pReader->pLogFile;

  // seek position: one index entry per version since fileFirstVer
  int64_t offset = (ver - fileFirstVer) * sizeof(SWalIdxEntry);
  ret = taosLSeekFile(pIdxTFile, offset, SEEK_SET);
  if (ret < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to seek idx file, index:%" PRId64 ", pos:%" PRId64 ", since %s", pReader->pWal->cfg.vgId,
           ver, offset, terrstr());
    return -1;
  }

  SWalIdxEntry entry = {0};
  if ((ret = taosReadFile(pIdxTFile, &entry, sizeof(SWalIdxEntry))) != sizeof(SWalIdxEntry)) {
    if (ret < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, failed to read idx file, since %s", pReader->pWal->cfg.vgId, terrstr());
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      // sizeof yields size_t; cast so the argument really matches %ld on every ABI.
      wError("vgId:%d, read idx file incompletely, read bytes %" PRId64 ", bytes should be %ld",
             pReader->pWal->cfg.vgId, ret, (long)sizeof(SWalIdxEntry));
    }
    return -1;
  }

  ret = taosLSeekFile(pLogTFile, entry.offset, SEEK_SET);
  if (ret < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to seek log file, index:%" PRId64 ", pos:%" PRId64 ", since %s", pReader->pWal->cfg.vgId,
           ver, entry.offset, terrstr());
    return -1;
  }
  return ret;
}

173
/**
 * Switch the reader to the log/index file pair whose first version is
 * `fileFirstVer`.
 *
 * The currently opened pair is closed first. On success both new handles are
 * stored in the reader and curFileFirstVer is updated. On failure the reader
 * is left with no open files and curFileFirstVer == -1, so a later seek
 * re-opens the files instead of using closed handles.
 *
 * @return 0 on success; -1 on failure with terrno set from errno.
 */
static int32_t walReadChangeFile(SWalReader *pReader, int64_t fileFirstVer) {
  char fnameStr[WAL_FILE_LEN] = {0};

  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);
  // Nothing is open any more; forget which file pair was current so a failed
  // switch cannot leave a stale marker behind.
  pReader->curFileFirstVer = -1;

  walBuildLogName(pReader->pWal, fileFirstVer, fnameStr);
  TdFilePtr pLogFile = taosOpenFile(fnameStr, TD_FILE_READ);
  if (pLogFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, cannot open file %s, since %s", pReader->pWal->cfg.vgId, fnameStr, terrstr());
    return -1;
  }

  walBuildIdxName(pReader->pWal, fileFirstVer, fnameStr);
  TdFilePtr pIdxFile = taosOpenFile(fnameStr, TD_FILE_READ);
  if (pIdxFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, cannot open file %s, since %s", pReader->pWal->cfg.vgId, fnameStr, terrstr());
    // Do not keep a log file without its index: release it (after terrno was captured).
    taosCloseFile(&pLogFile);
    return -1;
  }

  // Publish both handles only once the whole pair is available.
  pReader->pLogFile = pLogFile;
  pReader->pIdxFile = pIdxFile;
  pReader->curFileFirstVer = fileFirstVer;

  return 0;
}

204 205
/**
 * Seek the reader to `ver` without range validation.
 *
 * Looks up the file whose first version is the greatest one <= `ver` (TD_LE
 * search in pWal->fileInfoSet), switches to that file pair if it is not the
 * current one, positions the log file on the record, and sets curVersion.
 *
 * @return 0 on success; -1 on failure. terrno is TSDB_CODE_WAL_INVALID_VER
 *         when no file matches, otherwise it is set by the failing helper.
 */
int32_t walReadSeekVerImpl(SWalReader *pReader, int64_t ver) {
  SWal *pWal = pReader->pWal;

  // Binary search in the file set; only firstVer of the key is populated.
  SWalFileInfo key;
  key.firstVer = ver;
  SWalFileInfo *pFileInfo = taosArraySearch(pWal->fileInfoSet, &key, compareWalFileInfo, TD_LE);
  if (pFileInfo == NULL) {
    wError("failed to find WAL log file with ver:%" PRId64, ver);
    terrno = TSDB_CODE_WAL_INVALID_VER;
    return -1;
  }

  // Helpers below set terrno themselves on failure.
  const bool needSwitch = (pReader->curFileFirstVer != pFileInfo->firstVer);
  if (needSwitch && walReadChangeFile(pReader, pFileInfo->firstVer) < 0) {
    return -1;
  }

  if (walReadSeekFilePos(pReader, pFileInfo->firstVer, ver) < 0) {
    return -1;
  }

  wDebug("vgId:%d, wal version reset from %" PRId64 " to %" PRId64, pReader->pWal->cfg.vgId,
         pReader->curVersion, ver);

  pReader->curVersion = ver;
  return 0;
}

236
/**
 * Seek the reader to `ver`, validating it against the WAL's version range.
 *
 * @return 0 when the reader is already at `ver` or the seek succeeded;
 *         -1 when `ver` is outside [firstVer, lastVer]
 *         (terrno = TSDB_CODE_WAL_LOG_NOT_EXIST) or the seek itself failed.
 */
int32_t walReaderSeekVer(SWalReader *pReader, int64_t ver) {
  SWal *pWal = pReader->pWal;

  if (pReader->curVersion == ver) {
    wDebug("vgId:%d, wal index:%" PRId64 " match, no need to reset", pReader->pWal->cfg.vgId, ver);
    return 0;
  }

  const bool outOfRange = (ver > pWal->vers.lastVer) || (ver < pWal->vers.firstVer);
  if (outOfRange) {
    wInfo("vgId:%d, invalid index:%" PRId64 ", first index:%" PRId64 ", last index:%" PRId64, pReader->pWal->cfg.vgId,
          ver, pWal->vers.firstVer, pWal->vers.lastVer);
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  return (walReadSeekVerImpl(pReader, ver) < 0) ? -1 : 0;
}

L
Liu Jicong 已提交
257
/** Overwrite the reader's recorded body-buffer capacity. */
void walSetReaderCapacity(SWalReader *pRead, int32_t capacity) {
  pRead->capacity = capacity;
}
258

L
Liu Jicong 已提交
259 260
/**
 * Read the record head for `fetchVer` into pRead->pHead.
 *
 * If the reader is not positioned at `fetchVer` it is sought there first.
 * When the head read returns 0 bytes and no seek has been done yet in this
 * call, the position is re-established once with walReadSeekVerImpl() and the
 * read is retried.
 *
 * @return 0 on success; -1 on failure. terrno is a system error when the read
 *         returned a negative value, TSDB_CODE_WAL_FILE_CORRUPTED on a short
 *         read, or whatever the failing seek helper set.
 */
static int32_t walFetchHeadNew(SWalReader *pRead, int64_t fetchVer) {
  bool alreadySought = false;

  wDebug("vgId:%d, wal starts to fetch head, index:%" PRId64, pRead->pWal->cfg.vgId, fetchVer);

  if (pRead->curVersion != fetchVer) {
    if (walReaderSeekVer(pRead, fetchVer) < 0) {
      return -1;
    }
    alreadySought = true;
  }

  for (;;) {
    int64_t nRead = taosReadFile(pRead->pLogFile, pRead->pHead, sizeof(SWalCkHead));
    if (nRead == sizeof(SWalCkHead)) {
      return 0;
    }

    if (nRead != 0 || alreadySought) {
      // Either a real error / short read, or the retry has already been used.
      if (nRead < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
      } else {
        terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      }
      return -1;
    }

    // Zero bytes read and no seek done yet: reposition once and try again.
    if (walReadSeekVerImpl(pRead, fetchVer) < 0) {
      return -1;
    }
    alreadySought = true;
  }
}

L
Liu Jicong 已提交
295 296
/**
 * Read the body of the record whose head is already in pReader->pHead.
 *
 * The head buffer is grown (realloc) when the recorded capacity is smaller
 * than the body length, the body is read from the log file right after the
 * head, and the body checksum is verified. On success curVersion advances to
 * the record's version + 1.
 *
 * @return 0 on success; -1 on failure with terrno set to
 *         TSDB_CODE_OUT_OF_MEMORY, a system error (read returned < 0), or
 *         TSDB_CODE_WAL_FILE_CORRUPTED (short read / checksum mismatch).
 */
static int32_t walFetchBodyNew(SWalReader *pReader) {
  SWalCont *pReadHead = &pReader->pHead->head;
  int64_t   ver = pReadHead->version;

  wDebug("vgId:%d, wal starts to fetch body, ver:%" PRId64 " ,len:%d, total", pReader->pWal->cfg.vgId, ver,
         pReadHead->bodyLen);

  if (pReader->capacity < pReadHead->bodyLen) {
    // Keep the old pointer until realloc is known to have succeeded.
    SWalCkHead *ptr = (SWalCkHead *)taosMemoryRealloc(pReader->pHead, sizeof(SWalCkHead) + pReadHead->bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }

    pReader->pHead = ptr;
    pReadHead = &pReader->pHead->head;  // the buffer may have moved
    pReader->capacity = pReadHead->bodyLen;
  }

  // Classify the failure by the read result, not by bodyLen: a negative return
  // is an I/O error, any other mismatch means the file is truncated/corrupted.
  int64_t readLen = taosReadFile(pReader->pLogFile, pReadHead->body, pReadHead->bodyLen);
  if (readLen != pReadHead->bodyLen) {
    if (readLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since %s",
             pReader->pWal->cfg.vgId, pReader->pHead->head.version, ver, tstrerror(terrno));
    } else {
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since file corrupted",
             pReader->pWal->cfg.vgId, pReader->pHead->head.version, ver);
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    return -1;
  }

  if (walValidBodyCksum(pReader->pHead) != 0) {
    wError("vgId:%d, wal fetch body error:%" PRId64 ", since body checksum not passed", pReader->pWal->cfg.vgId, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  wDebug("vgId:%d, index:%" PRId64 " is fetched, type:%d, cursor advance", pReader->pWal->cfg.vgId, ver,
         pReader->pHead->head.msgType);
  pReader->curVersion = ver + 1;
  return 0;
}

/**
 * Skip the body of the record whose head is in pRead->pHead by seeking the
 * log file forward by head.bodyLen bytes, then advance curVersion by one.
 *
 * @return 0 on success; -1 with terrno set from errno when the seek fails.
 */
static int32_t walSkipFetchBodyNew(SWalReader *pRead) {
  const int64_t seekRes = taosLSeekFile(pRead->pLogFile, pRead->pHead->head.bodyLen, SEEK_CUR);

  if (seekRes < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  pRead->curVersion += 1;
  wDebug("vgId:%d, version advance to %" PRId64 ", skip fetch", pRead->pWal->cfg.vgId, pRead->curVersion);

  return 0;
}

L
Liu Jicong 已提交
354
/**
 * Read the record head for `ver` into the caller-supplied `pHead` and verify
 * its checksum.
 *
 * Versions beyond the WAL's commit version are rejected. If the reader is not
 * positioned at `ver` it is sought there; a 0-byte head read is retried once
 * after repositioning with walReadSeekVerImpl() when no seek was done yet.
 *
 * @return 0 on success; -1 on failure. terrno is set on read errors
 *         (system error or TSDB_CODE_WAL_FILE_CORRUPTED), on checksum failure
 *         (TSDB_CODE_WAL_FILE_CORRUPTED) and by the seek helpers; it is not
 *         touched when `ver` is beyond the commit version.
 */
int32_t walFetchHead(SWalReader *pRead, int64_t ver, SWalCkHead *pHead) {
  bool alreadySought = false;

  wDebug("vgId:%d, try to fetch ver %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pRead->pWal->cfg.vgId, ver, pRead->pWal->vers.firstVer, pRead->pWal->vers.commitVer, pRead->pWal->vers.lastVer,
         pRead->pWal->vers.appliedVer);

  // TODO: valid ver
  if (ver > pRead->pWal->vers.commitVer) {
    return -1;
  }

  if (pRead->curVersion != ver) {
    if (walReaderSeekVer(pRead, ver) < 0) {
      return -1;
    }
    alreadySought = true;
  }

  for (;;) {
    int64_t nRead = taosReadFile(pRead->pLogFile, pHead, sizeof(SWalCkHead));
    if (nRead == sizeof(SWalCkHead)) {
      break;
    }

    if (nRead != 0 || alreadySought) {
      if (nRead < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
      } else {
        terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      }
      return -1;
    }

    // Zero bytes read and no seek done yet: reposition once and retry.
    if (walReadSeekVerImpl(pRead, ver) < 0) {
      return -1;
    }
    alreadySought = true;
  }

  if (walValidHeadCksum(pHead) != 0) {
    wError("vgId:%d, unexpected wal log index:%" PRId64 ", since head checksum not passed", pRead->pWal->cfg.vgId, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
412
/**
 * Skip the body that follows `pHead` in the log file by seeking forward
 * pHead->head.bodyLen bytes, then advance the reader's curVersion by one.
 *
 * @return 0 on success; -1 with terrno set from errno when the seek fails.
 */
int32_t walSkipFetchBody(SWalReader *pRead, const SWalCkHead *pHead) {
  wDebug("vgId:%d, skip fetch body %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pRead->pWal->cfg.vgId, pHead->head.version, pRead->pWal->vers.firstVer, pRead->pWal->vers.commitVer,
         pRead->pWal->vers.lastVer, pRead->pWal->vers.appliedVer);

  const int64_t seekRes = taosLSeekFile(pRead->pLogFile, pHead->head.bodyLen, SEEK_CUR);
  if (seekRes < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  pRead->curVersion += 1;
  return 0;
}

L
Liu Jicong 已提交
432
/**
 * Read the body for the head stored in `*ppHead`.
 *
 * @param pRead   reader positioned right after the head in its log file.
 * @param ppHead  in/out: head buffer; it is reallocated (and `*ppHead`
 *                updated) when pRead->capacity is smaller than the body length.
 * @return 0 on success, with curVersion advanced to the record's version + 1;
 *         -1 on failure with terrno set to TSDB_CODE_OUT_OF_MEMORY, a system
 *         error (read returned < 0), or TSDB_CODE_WAL_FILE_CORRUPTED (short
 *         read, version mismatch, checksum mismatch).
 *
 * NOTE(review): pRead->capacity is also used for pRead->pHead by other
 * functions in this file - confirm callers keep the two buffers consistent.
 */
int32_t walFetchBody(SWalReader *pRead, SWalCkHead **ppHead) {
  SWalCont *pReadHead = &((*ppHead)->head);
  int64_t   ver = pReadHead->version;

  wDebug("vgId:%d, fetch body %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pRead->pWal->cfg.vgId, ver, pRead->pWal->vers.firstVer, pRead->pWal->vers.commitVer, pRead->pWal->vers.lastVer,
         pRead->pWal->vers.appliedVer);

  if (pRead->capacity < pReadHead->bodyLen) {
    // Keep the caller's pointer valid until realloc is known to have succeeded.
    SWalCkHead *ptr = (SWalCkHead *)taosMemoryRealloc(*ppHead, sizeof(SWalCkHead) + pReadHead->bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    *ppHead = ptr;
    pReadHead = &((*ppHead)->head);  // the buffer may have moved
    pRead->capacity = pReadHead->bodyLen;
  }

  // Classify the failure by the read result, not by bodyLen: a negative return
  // is an I/O error, any other mismatch means the file is truncated/corrupted.
  int64_t readLen = taosReadFile(pRead->pLogFile, pReadHead->body, pReadHead->bodyLen);
  if (readLen != pReadHead->bodyLen) {
    if (readLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since %s",
             pRead->pWal->cfg.vgId, pReadHead->version, ver, tstrerror(terrno));
    } else {
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since file corrupted",
             pRead->pWal->cfg.vgId, pReadHead->version, ver);
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    return -1;
  }

  if (pReadHead->version != ver) {
    wError("vgId:%d, wal fetch body error, index:%" PRId64 ", read request index:%" PRId64, pRead->pWal->cfg.vgId,
           pReadHead->version, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  if (walValidBodyCksum(*ppHead) != 0) {
    wError("vgId:%d, wal fetch body error, index:%" PRId64 ", since body checksum not passed", pRead->pWal->cfg.vgId,
           ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  pRead->curVersion = ver + 1;
  return 0;
}

486
/**
 * Read the complete record (head + body) for `ver` into pReader->pHead.
 *
 * The version is first checked against the WAL's [firstVer, lastVer] range
 * (before taking the lock). The rest runs under the reader's mutex: seek if
 * needed, read and checksum the head, grow the buffer if required, read the
 * body, then verify the stored version and the body checksum. On success
 * curVersion is incremented.
 *
 * @return 0 on success; -1 on failure with terrno set
 *         (TSDB_CODE_WAL_LOG_NOT_EXIST, TSDB_CODE_OUT_OF_MEMORY, a system
 *         error, TSDB_CODE_WAL_FILE_CORRUPTED, or the seek helper's code).
 */
int32_t walReadVer(SWalReader *pReader, int64_t ver) {
  int64_t contLen;
  int32_t result = -1;  // every early exit below is a failure
  bool    alreadySought = false;

  wDebug("vgId:%d, wal start to read index:%" PRId64, pReader->pWal->cfg.vgId, ver);

  if (walIsEmpty(pReader->pWal)) {
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  if (ver > pReader->pWal->vers.lastVer || ver < pReader->pWal->vers.firstVer) {
    wDebug("vgId:%d, invalid index:%" PRId64 ", first index:%" PRId64 ", last index:%" PRId64, pReader->pWal->cfg.vgId,
           ver, pReader->pWal->vers.firstVer, pReader->pWal->vers.lastVer);
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  taosThreadMutexLock(&pReader->mutex);

  if (pReader->curVersion != ver) {
    if (walReaderSeekVer(pReader, ver) < 0) {
      wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since %s", pReader->pWal->cfg.vgId, ver, terrstr());
      goto _unlock;
    }
    alreadySought = true;
  }

  // Read the head; a 0-byte read is retried once after repositioning.
  for (;;) {
    contLen = taosReadFile(pReader->pLogFile, pReader->pHead, sizeof(SWalCkHead));
    if (contLen == sizeof(SWalCkHead)) {
      break;
    }

    if (contLen == 0 && !alreadySought) {
      if (walReadSeekVerImpl(pReader, ver) < 0) {
        goto _unlock;
      }
      alreadySought = true;
      continue;
    }

    if (contLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    wError("vgId:%d, failed to read WAL record head, index:%" PRId64 ", from log file since %s",
           pReader->pWal->cfg.vgId, ver, terrstr());
    goto _unlock;
  }

  if (walValidHeadCksum(pReader->pHead) != 0) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since head checksum not passed", pReader->pWal->cfg.vgId,
           ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _unlock;
  }

  if (pReader->capacity < pReader->pHead->head.bodyLen) {
    SWalCkHead *pGrown =
        (SWalCkHead *)taosMemoryRealloc(pReader->pHead, sizeof(SWalCkHead) + pReader->pHead->head.bodyLen);
    if (pGrown == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _unlock;
    }
    pReader->pHead = pGrown;
    pReader->capacity = pReader->pHead->head.bodyLen;
  }

  contLen = taosReadFile(pReader->pLogFile, pReader->pHead->head.body, pReader->pHead->head.bodyLen);
  if (contLen != pReader->pHead->head.bodyLen) {
    if (contLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    wError("vgId:%d, failed to read WAL record body, index:%" PRId64 ", from log file since %s",
           pReader->pWal->cfg.vgId, ver, terrstr());
    goto _unlock;
  }

  if (pReader->pHead->head.version != ver) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", read request index:%" PRId64, pReader->pWal->cfg.vgId,
           pReader->pHead->head.version, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _unlock;
  }

  if (walValidBodyCksum(pReader->pHead) != 0) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since body checksum not passed", pReader->pWal->cfg.vgId,
           ver);
    // Log both checksums to help diagnose the mismatch.
    uint32_t readCkSum = walCalcBodyCksum(pReader->pHead->head.body, pReader->pHead->head.bodyLen);
    uint32_t logCkSum = pReader->pHead->cksumBody;
    wError("checksum written into log:%u, checksum calculated:%u", logCkSum, readCkSum);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _unlock;
  }

  pReader->curVersion++;
  result = 0;

_unlock:
  taosThreadMutexUnlock(&pReader->mutex);
  return result;
}
600 601 602 603 604 605

/**
 * Reset the reader to its "nothing opened" state: under the reader's mutex,
 * close the index and log files and set curFileFirstVer and curVersion to -1.
 */
void walReadReset(SWalReader *pReader) {
  taosThreadMutexLock(&pReader->mutex);

  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);

  pReader->curVersion = -1;
  pReader->curFileFirstVer = -1;

  taosThreadMutexUnlock(&pReader->mutex);
}