/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "taoserror.h"
L
Liu Jicong 已提交
17
#include "walInt.h"
S
Shengliang Guan 已提交
18

L
Liu Jicong 已提交
19 20 21 22
// Forward declarations of the file-local helpers used by walNextValidMsg(). They operate on the
// reader's own pHead buffer; their definitions appear later in this file.
static int32_t walFetchHeadNew(SWalReader *pRead, int64_t fetchVer);
static int32_t walFetchBodyNew(SWalReader *pRead);
static int32_t walSkipFetchBodyNew(SWalReader *pRead);

L
Liu Jicong 已提交
23
/**
 * Allocate and initialise a WAL reader bound to `pWal`.
 *
 * @param pWal  WAL instance the reader reads from (the pointer is stored, not copied).
 * @param cond  Optional filter condition; copied into the reader when non-NULL,
 *              otherwise the filter flags are cleared.
 * @return The new reader, or NULL with terrno = TSDB_CODE_OUT_OF_MEMORY when an
 *         allocation fails. Release the reader with walCloseReader().
 */
SWalReader *walOpenReader(SWal *pWal, SWalFilterCond *cond) {
  SWalReader *pReader = taosMemoryCalloc(1, sizeof(SWalReader));
  if (pReader == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // Allocate the record-head buffer before the mutex is initialised, so the
  // failure path never has to abandon an initialised mutex.
  pReader->pHead = taosMemoryMalloc(sizeof(SWalCkHead));
  if (pReader->pHead == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFree(pReader);
    return NULL;
  }

  pReader->pWal = pWal;
  pReader->readerId = tGenIdPI64();
  pReader->pIdxFile = NULL;
  pReader->pLogFile = NULL;
  pReader->curVersion = -1;       // -1: no version selected yet
  pReader->curFileFirstVer = -1;  // -1: no file pair opened yet
  pReader->capacity = 0;          // pHead has room for the head only, no body bytes

  if (cond) {
    pReader->cond = *cond;
  } else {
    pReader->cond.scanNotApplied = 0;
    pReader->cond.scanMeta = 0;
    pReader->cond.enableRef = 0;
  }

  taosThreadMutexInit(&pReader->mutex, NULL);

  return pReader;
}

62 63 64 65 66 67 68 69
/**
 * Release a reader created by walOpenReader(): closes its index and log files,
 * frees the head buffer and finally the reader itself.
 *
 * @param pReader  Reader to close; NULL is accepted and ignored.
 *
 * NOTE(review): the mutex initialised in walOpenReader() is not destroyed here —
 * confirm whether a destroy call is required on the supported platforms.
 */
void walCloseReader(SWalReader *pReader) {
  if (pReader == NULL) {
    return;
  }

  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);
  taosMemoryFreeClear(pReader->pHead);
  taosMemoryFree(pReader);
}

72 73 74 75 76
/**
 * Advance the reader to the next record it is interested in and load it into pReader->pHead.
 *
 * Starting at pReader->curVersion, records are examined up to min(applied, committed) version.
 * A TDMT_VND_SUBMIT record (or a meta record when cond.scanMeta is set) has its body fetched
 * and ends the scan; any other record is skipped.
 *
 * @return 0 when a record was fetched; -1 when a fetch/skip step failed or when no matching
 *         record exists in the scanned range.
 */
int32_t walNextValidMsg(SWalReader *pReader) {
  int64_t startVer = pReader->curVersion;
  int64_t lastVer = walGetLastVer(pReader->pWal);
  int64_t committedVer = walGetCommittedVer(pReader->pWal);
  int64_t appliedVer = walGetAppliedVer(pReader->pWal);

  // Consumers must not run ahead of the applied version, otherwise data may be lost [TD-24010].
  if (appliedVer < committedVer) {
    wDebug("vgId:%d, wal apply ver:%" PRId64 " smaller than commit ver:%" PRId64, pReader->pWal->cfg.vgId,
           appliedVer, committedVer);
  }
  int64_t endVer = TMIN(appliedVer, committedVer);

  wDebug("vgId:%d, wal start to fetch, index:%" PRId64 ", last index:%" PRId64 " commit index:%" PRId64
         ", applied index:%" PRId64 ", end index:%" PRId64,
         pReader->pWal->cfg.vgId, startVer, lastVer, committedVer, appliedVer, endVer);

  // After every skipped record the cursor is re-read from the reader itself.
  for (int64_t fetchVer = startVer; fetchVer <= endVer; fetchVer = pReader->curVersion) {
    if (walFetchHeadNew(pReader, fetchVer) < 0) {
      return -1;
    }

    bool wanted = pReader->pHead->head.msgType == TDMT_VND_SUBMIT ||
                  (IS_META_MSG(pReader->pHead->head.msgType) && pReader->cond.scanMeta);
    if (wanted) {
      return (walFetchBodyNew(pReader) < 0) ? -1 : 0;
    }

    if (walSkipFetchBodyNew(pReader) < 0) {
      return -1;
    }
  }

  return -1;
}
L
Liu Jicong 已提交
106

107
/** Return the reader's current version (its curVersion field). */
int64_t walReaderGetCurrentVer(const SWalReader *pReader) {
  return pReader->curVersion;
}
108
/** Return the first version reported by walGetFirstVer() for the WAL this reader is bound to. */
int64_t walReaderGetValidFirstVer(const SWalReader *pReader) {
  int64_t firstVer = walGetFirstVer(pReader->pWal);
  return firstVer;
}
109

110 111 112 113 114 115 116
/**
 * Report the version range this reader may read.
 *
 * @param pReader  Reader whose WAL and filter condition are consulted.
 * @param sver     Out: first version of the WAL.
 * @param ever     Out: last version of the WAL when cond.scanUncommited is set,
 *                 otherwise the committed version.
 */
void walReaderValidVersionRange(SWalReader *pReader, int64_t *sver, int64_t *ever) {
  *sver = walGetFirstVer(pReader->pWal);

  int64_t lastVer = walGetLastVer(pReader->pWal);
  int64_t committedVer = walGetCommittedVer(pReader->pWal);

  if (pReader->cond.scanUncommited) {
    *ever = lastVer;
  } else {
    *ever = committedVer;
  }
}

117
/**
 * Position the reader's log file at the record for `ver`.
 *
 * The index entry for `ver` is located at (ver - fileFirstVer) * sizeof(SWalIdxEntry) in the
 * index file; its `offset` field is then used to seek the log file.
 *
 * @param pReader       Reader whose pIdxFile / pLogFile are already open.
 * @param fileFirstVer  First version stored in the currently opened file pair.
 * @param ver           Version to seek to.
 * @return The result of the final log-file seek (non-negative) on success; -1 on failure with
 *         terrno set to the system error, or to TSDB_CODE_WAL_FILE_CORRUPTED when the index
 *         entry could only be read partially.
 */
static int64_t walReadSeekFilePos(SWalReader *pReader, int64_t fileFirstVer, int64_t ver) {
  int64_t ret = 0;

  TdFilePtr pIdxTFile = pReader->pIdxFile;
  TdFilePtr pLogTFile = pReader->pLogFile;

  // seek to the index entry of `ver`
  int64_t offset = (ver - fileFirstVer) * sizeof(SWalIdxEntry);
  ret = taosLSeekFile(pIdxTFile, offset, SEEK_SET);
  if (ret < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to seek idx file, index:%" PRId64 ", pos:%" PRId64 ", since %s", pReader->pWal->cfg.vgId,
           ver, offset, terrstr());
    return -1;
  }

  SWalIdxEntry entry = {0};
  if ((ret = taosReadFile(pIdxTFile, &entry, sizeof(SWalIdxEntry))) != sizeof(SWalIdxEntry)) {
    if (ret < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, failed to read idx file, since %s", pReader->pWal->cfg.vgId, terrstr());
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      // sizeof yields size_t; convert explicitly so the argument matches the format specifier
      wError("vgId:%d, read idx file incompletely, read bytes %" PRId64 ", bytes should be %" PRId64,
             pReader->pWal->cfg.vgId, ret, (int64_t)sizeof(SWalIdxEntry));
    }
    return -1;
  }

  // seek the log file to the offset recorded in the index entry
  ret = taosLSeekFile(pLogTFile, entry.offset, SEEK_SET);
  if (ret < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to seek log file, index:%" PRId64 ", pos:%" PRId64 ", since %s", pReader->pWal->cfg.vgId,
           ver, entry.offset, terrstr());
    return -1;
  }
  return ret;
}

155
/**
 * Switch the reader to the log/index file pair whose first version is `fileFirstVer`.
 *
 * The currently opened pair is closed first. The reader's file handles and curFileFirstVer are
 * only updated once BOTH new files were opened; on any failure curFileFirstVer is left at -1 so
 * that the next seek is forced to reopen the files instead of trusting stale state.
 *
 * @return 0 on success; -1 on failure with terrno set from errno.
 */
static int32_t walReadChangeFile(SWalReader *pReader, int64_t fileFirstVer) {
  char fnameStr[WAL_FILE_LEN] = {0};

  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);
  // Nothing is open from here on: forget which file the reader was positioned in.
  pReader->curFileFirstVer = -1;

  walBuildLogName(pReader->pWal, fileFirstVer, fnameStr);
  TdFilePtr pLogFile = taosOpenFile(fnameStr, TD_FILE_READ);
  if (pLogFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, cannot open file %s, since %s", pReader->pWal->cfg.vgId, fnameStr, terrstr());
    return -1;
  }

  walBuildIdxName(pReader->pWal, fileFirstVer, fnameStr);
  TdFilePtr pIdxFile = taosOpenFile(fnameStr, TD_FILE_READ);
  if (pIdxFile == NULL) {
    int32_t code = TAOS_SYSTEM_ERROR(errno);
    terrno = code;
    wError("vgId:%d, cannot open file %s, since %s", pReader->pWal->cfg.vgId, fnameStr, terrstr());
    // Do not keep a log file without its index; restore terrno in case closing touched it.
    taosCloseFile(&pLogFile);
    terrno = code;
    return -1;
  }

  pReader->pLogFile = pLogFile;
  pReader->pIdxFile = pIdxFile;
  pReader->curFileFirstVer = fileFirstVer;

  return 0;
}

186 187
/**
 * Unconditionally position the reader at `ver`.
 *
 * Looks up the file whose first version is the greatest one not exceeding `ver`, switches to
 * that file pair if it is not the one currently open, seeks to the record and finally records
 * `ver` as the reader's current version.
 *
 * @return 0 on success; -1 on failure. terrno is TSDB_CODE_WAL_INVALID_VER when no file covers
 *         `ver`, otherwise it is whatever the failing helper set.
 */
int32_t walReadSeekVerImpl(SWalReader *pReader, int64_t ver) {
  SWal *pWal = pReader->pWal;

  // Binary search in the file set; only firstVer of the key is filled in.
  SWalFileInfo key;
  key.firstVer = ver;
  SWalFileInfo *pInfo = taosArraySearch(pWal->fileInfoSet, &key, compareWalFileInfo, TD_LE);
  if (pInfo == NULL) {
    wError("failed to find WAL log file with ver:%" PRId64, ver);
    terrno = TSDB_CODE_WAL_INVALID_VER;
    return -1;
  }

  // Both helpers below set terrno themselves on failure.
  bool needSwitch = (pReader->curFileFirstVer != pInfo->firstVer);
  if (needSwitch && walReadChangeFile(pReader, pInfo->firstVer) < 0) {
    return -1;
  }

  if (walReadSeekFilePos(pReader, pInfo->firstVer, ver) < 0) {
    return -1;
  }

  wDebug("vgId:%d, wal version reset from %" PRId64 " to %" PRId64, pReader->pWal->cfg.vgId,
         pReader->curVersion, ver);
  pReader->curVersion = ver;

  return 0;
}

218
/**
 * Position the reader at `ver` unless it is already there.
 *
 * @return 0 when the reader is (now) positioned at `ver`; -1 on failure. terrno is
 *         TSDB_CODE_WAL_LOG_NOT_EXIST when `ver` lies outside [firstVer, lastVer] of the WAL,
 *         otherwise it is set by walReadSeekVerImpl().
 */
int32_t walReaderSeekVer(SWalReader *pReader, int64_t ver) {
  SWal *pWal = pReader->pWal;

  if (pReader->curVersion == ver) {
    wDebug("vgId:%d, wal index:%" PRId64 " match, no need to reset", pReader->pWal->cfg.vgId, ver);
    return 0;
  }

  bool inRange = (ver <= pWal->vers.lastVer) && (ver >= pWal->vers.firstVer);
  if (!inRange) {
    wInfo("vgId:%d, invalid index:%" PRId64 ", first index:%" PRId64 ", last index:%" PRId64, pReader->pWal->cfg.vgId,
          ver, pWal->vers.firstVer, pWal->vers.lastVer);
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  return (walReadSeekVerImpl(pReader, ver) < 0) ? -1 : 0;
}

L
Liu Jicong 已提交
239
/** Overwrite the reader's recorded body capacity; the head buffer itself is not resized here. */
void walSetReaderCapacity(SWalReader *pRead, int32_t capacity) {
  pRead->capacity = capacity;
}
240

L
Liu Jicong 已提交
241 242
/**
 * Read the record head of version `fetchVer` into pRead->pHead.
 *
 * If the reader is not already positioned at `fetchVer` it is seeked there first. When the head
 * read hits end-of-file (0 bytes) and no seek has happened yet in this call, the position is
 * re-resolved once via walReadSeekVerImpl() and the read is retried.
 *
 * @return 0 on success; -1 on failure with terrno set (system error for a failed read,
 *         TSDB_CODE_WAL_FILE_CORRUPTED for a short read, or the error of the failing seek).
 */
static int32_t walFetchHeadNew(SWalReader *pRead, int64_t fetchVer) {
  int64_t contLen;
  bool    seeked = false;

  wDebug("vgId:%d, wal starts to fetch head, index:%" PRId64, pRead->pWal->cfg.vgId, fetchVer);

  if (pRead->curVersion != fetchVer) {
    if (walReaderSeekVer(pRead, fetchVer) < 0) {
      return -1;
    }
    seeked = true;
  }

  while (1) {
    contLen = taosReadFile(pRead->pLogFile, pRead->pHead, sizeof(SWalCkHead));
    if (contLen == (int64_t)sizeof(SWalCkHead)) {
      break;
    } else if (contLen == 0 && !seeked) {
      // A failed re-seek must stop here: retrying the read would use an unpositioned (or
      // closed) file and would overwrite the terrno set by the seek.
      if (walReadSeekVerImpl(pRead, fetchVer) < 0) {
        return -1;
      }
      seeked = true;
      continue;
    } else {
      if (contLen < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
      } else {
        terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      }
      return -1;
    }
  }

  return 0;
}

L
Liu Jicong 已提交
275 276
/**
 * Read the body that belongs to the head currently stored in pReader->pHead.
 *
 * The head buffer is grown when the recorded capacity is smaller than the body length. After a
 * successful read the body checksum is verified and the reader's cursor advances to the version
 * following the fetched record.
 *
 * @return 0 on success; -1 on failure with terrno set to TSDB_CODE_OUT_OF_MEMORY, the system
 *         error of a failed read, or TSDB_CODE_WAL_FILE_CORRUPTED (short read / bad checksum).
 */
static int32_t walFetchBodyNew(SWalReader *pReader) {
  SWalCont *pReadHead = &pReader->pHead->head;
  int64_t   ver = pReadHead->version;

  wDebug("vgId:%d, wal starts to fetch body, ver:%" PRId64 " ,len:%d, total", pReader->pWal->cfg.vgId, ver,
         pReadHead->bodyLen);

  if (pReader->capacity < pReadHead->bodyLen) {
    SWalCkHead *ptr = (SWalCkHead *)taosMemoryRealloc(pReader->pHead, sizeof(SWalCkHead) + pReadHead->bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    // The buffer may have moved: refresh every pointer derived from it.
    pReader->pHead = ptr;
    pReadHead = &pReader->pHead->head;
    pReader->capacity = pReadHead->bodyLen;
  }

  // Classify the failure by what the read returned, not by the requested length.
  int64_t nread = taosReadFile(pReader->pLogFile, pReadHead->body, pReadHead->bodyLen);
  if (nread != pReadHead->bodyLen) {
    if (nread < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since %s",
             pReader->pWal->cfg.vgId, pReader->pHead->head.version, ver, tstrerror(terrno));
    } else {
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since file corrupted",
             pReader->pWal->cfg.vgId, pReader->pHead->head.version, ver);
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    return -1;
  }

  if (walValidBodyCksum(pReader->pHead) != 0) {
    wError("vgId:%d, wal fetch body error:%" PRId64 ", since body checksum not passed", pReader->pWal->cfg.vgId, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  wDebug("vgId:%d, index:%" PRId64 " is fetched, cursor advance", pReader->pWal->cfg.vgId, ver);
  pReader->curVersion = ver + 1;
  return 0;
}

/**
 * Skip the body of the record whose head is in pRead->pHead by seeking the log file forward by
 * head.bodyLen bytes, then advance the reader's version by one.
 *
 * @return 0 on success; -1 with terrno set from errno when the seek fails.
 */
static int32_t walSkipFetchBodyNew(SWalReader *pRead) {
  int64_t pos = taosLSeekFile(pRead->pLogFile, pRead->pHead->head.bodyLen, SEEK_CUR);
  if (pos < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  pRead->curVersion += 1;
  wDebug("vgId:%d, version advance to %" PRId64 ", skip fetch", pRead->pWal->cfg.vgId, pRead->curVersion);

  return 0;
}

L
Liu Jicong 已提交
336
/**
 * Read the record head of version `ver` into the caller-supplied `pHead` and verify its checksum.
 *
 * Versions beyond the WAL's applied version are rejected. If the reader is not positioned at
 * `ver` it is seeked there first; when the head read returns 0 bytes and no seek has happened
 * yet in this call, the position is re-resolved once and the read is retried.
 *
 * @param pRead  Reader to read through.
 * @param ver    Version to fetch.
 * @param pHead  Out: receives sizeof(SWalCkHead) bytes of record head.
 * @return 0 on success; -1 on failure. terrno is set for seek, read and checksum failures; it
 *         is NOT set by the applied-version check.
 */
int32_t walFetchHead(SWalReader *pRead, int64_t ver, SWalCkHead *pHead) {
  int64_t code;
  int64_t contLen;
  bool    seeked = false;

  wDebug("vgId:%d, try to fetch ver %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pRead->pWal->cfg.vgId, ver, pRead->pWal->vers.firstVer, pRead->pWal->vers.commitVer, pRead->pWal->vers.lastVer,
         pRead->pWal->vers.appliedVer);

  // TODO: valid ver
  if (ver > pRead->pWal->vers.appliedVer) {
    return -1;
  }

  if (pRead->curVersion != ver) {
    code = walReaderSeekVer(pRead, ver);
    if (code < 0) {
      return -1;
    }
    seeked = true;
  }

  while (1) {
    contLen = taosReadFile(pRead->pLogFile, pHead, sizeof(SWalCkHead));
    if (contLen == (int64_t)sizeof(SWalCkHead)) {
      break;
    } else if (contLen == 0 && !seeked) {
      // A failed re-seek must stop here: retrying the read would use an unpositioned (or
      // closed) file and would overwrite the terrno set by the seek.
      if (walReadSeekVerImpl(pRead, ver) < 0) {
        return -1;
      }
      seeked = true;
      continue;
    } else {
      if (contLen < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
      } else {
        terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      }
      return -1;
    }
  }

  code = walValidHeadCksum(pHead);
  if (code != 0) {
    wError("vgId:%d, unexpected wal log index:%" PRId64 ", since head checksum not passed", pRead->pWal->cfg.vgId, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
392
/**
 * Skip the body that follows the given record head: the log file is seeked forward by
 * pHead->head.bodyLen bytes and the reader's version is advanced by one.
 *
 * @return 0 on success; -1 with terrno set from errno when the seek fails.
 */
int32_t walSkipFetchBody(SWalReader *pRead, const SWalCkHead *pHead) {
  SWal *pWal = pRead->pWal;

  wDebug("vgId:%d, skip fetch body %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pWal->cfg.vgId, pHead->head.version, pWal->vers.firstVer, pWal->vers.commitVer, pWal->vers.lastVer,
         pWal->vers.appliedVer);

  int64_t pos = taosLSeekFile(pRead->pLogFile, pHead->head.bodyLen, SEEK_CUR);
  if (pos < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  pRead->curVersion += 1;
  return 0;
}

L
Liu Jicong 已提交
412
/**
 * Read the body belonging to the record head in `*ppHead`.
 *
 * When the reader's recorded capacity is smaller than the body length, `*ppHead` is reallocated
 * (and may therefore change). After a successful read the body checksum is verified and the
 * reader's cursor advances to the version following the fetched record.
 *
 * @param pRead   Reader to read through.
 * @param ppHead  In/out: head buffer holding an already fetched head; updated if reallocated.
 * @return 0 on success; -1 on failure with terrno set to TSDB_CODE_OUT_OF_MEMORY, the system
 *         error of a failed read, or TSDB_CODE_WAL_FILE_CORRUPTED (short read / bad checksum).
 */
int32_t walFetchBody(SWalReader *pRead, SWalCkHead **ppHead) {
  SWalCont *pReadHead = &((*ppHead)->head);
  int64_t   ver = pReadHead->version;

  wDebug("vgId:%d, fetch body %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pRead->pWal->cfg.vgId, ver, pRead->pWal->vers.firstVer, pRead->pWal->vers.commitVer, pRead->pWal->vers.lastVer,
         pRead->pWal->vers.appliedVer);

  if (pRead->capacity < pReadHead->bodyLen) {
    SWalCkHead *ptr = (SWalCkHead *)taosMemoryRealloc(*ppHead, sizeof(SWalCkHead) + pReadHead->bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    // The buffer may have moved: refresh every pointer derived from it.
    *ppHead = ptr;
    pReadHead = &((*ppHead)->head);
    pRead->capacity = pReadHead->bodyLen;
  }

  // Classify the failure by what the read returned, not by the requested length.
  int64_t nread = taosReadFile(pRead->pLogFile, pReadHead->body, pReadHead->bodyLen);
  if (nread != pReadHead->bodyLen) {
    if (nread < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since %s",
             pRead->pWal->cfg.vgId, pReadHead->version, ver, tstrerror(terrno));
    } else {
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since file corrupted",
             pRead->pWal->cfg.vgId, pReadHead->version, ver);
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    return -1;
  }

  // `ver` was sampled from this same head before the body read, so this only trips if the head
  // was modified in between.
  if (pReadHead->version != ver) {
    wError("vgId:%d, wal fetch body error, index:%" PRId64 ", read request index:%" PRId64, pRead->pWal->cfg.vgId,
           pReadHead->version, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  if (walValidBodyCksum(*ppHead) != 0) {
    wError("vgId:%d, wal fetch body error, index:%" PRId64 ", since body checksum not passed", pRead->pWal->cfg.vgId,
           ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  pRead->curVersion = ver + 1;
  return 0;
}

466
/**
 * Read the complete record (head and body) of version `ver` into pReader->pHead.
 *
 * The range check against the WAL's first/last version happens before the reader mutex is
 * taken; everything that touches the reader's files, buffer and cursor runs under the mutex.
 * The head buffer is grown when the body does not fit. Head checksum, record version and body
 * checksum are all verified before the cursor is advanced by one.
 *
 * @return 0 on success; -1 on failure with terrno set (TSDB_CODE_WAL_LOG_NOT_EXIST for an empty
 *         WAL or out-of-range version, TSDB_CODE_OUT_OF_MEMORY, a system error from a failed
 *         read, TSDB_CODE_WAL_FILE_CORRUPTED, or the error of a failing seek).
 */
int32_t walReadVer(SWalReader *pReader, int64_t ver) {
  wDebug("vgId:%d, wal start to read index:%" PRId64, pReader->pWal->cfg.vgId, ver);
  int64_t contLen;
  int32_t code;
  bool    seeked = false;

  if (walIsEmpty(pReader->pWal)) {
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  if (ver > pReader->pWal->vers.lastVer || ver < pReader->pWal->vers.firstVer) {
    wDebug("vgId:%d, invalid index:%" PRId64 ", first index:%" PRId64 ", last index:%" PRId64, pReader->pWal->cfg.vgId,
           ver, pReader->pWal->vers.firstVer, pReader->pWal->vers.lastVer);
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  taosThreadMutexLock(&pReader->mutex);

  if (pReader->curVersion != ver) {
    if (walReaderSeekVer(pReader, ver) < 0) {
      wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since %s", pReader->pWal->cfg.vgId, ver, terrstr());
      goto _err;
    }
    seeked = true;
  }

  while (1) {
    contLen = taosReadFile(pReader->pLogFile, pReader->pHead, sizeof(SWalCkHead));
    if (contLen == (int64_t)sizeof(SWalCkHead)) {
      break;
    } else if (contLen == 0 && !seeked) {
      // End of file without a prior seek: re-resolve the position once. A failed re-seek must
      // stop here, otherwise the retry reads from an unpositioned (or closed) file and the
      // terrno set by the seek is overwritten.
      if (walReadSeekVerImpl(pReader, ver) < 0) {
        wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since %s", pReader->pWal->cfg.vgId, ver, terrstr());
        goto _err;
      }
      seeked = true;
      continue;
    } else {
      if (contLen < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
      } else {
        terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      }
      wError("vgId:%d, failed to read WAL record head, index:%" PRId64 ", from log file since %s",
             pReader->pWal->cfg.vgId, ver, terrstr());
      goto _err;
    }
  }

  code = walValidHeadCksum(pReader->pHead);
  if (code != 0) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since head checksum not passed", pReader->pWal->cfg.vgId,
           ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _err;
  }

  if (pReader->capacity < pReader->pHead->head.bodyLen) {
    SWalCkHead *ptr =
        (SWalCkHead *)taosMemoryRealloc(pReader->pHead, sizeof(SWalCkHead) + pReader->pHead->head.bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
    pReader->pHead = ptr;
    pReader->capacity = pReader->pHead->head.bodyLen;
  }

  contLen = taosReadFile(pReader->pLogFile, pReader->pHead->head.body, pReader->pHead->head.bodyLen);
  if (contLen != pReader->pHead->head.bodyLen) {
    if (contLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    wError("vgId:%d, failed to read WAL record body, index:%" PRId64 ", from log file since %s",
           pReader->pWal->cfg.vgId, ver, terrstr());
    goto _err;
  }

  if (pReader->pHead->head.version != ver) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", read request index:%" PRId64, pReader->pWal->cfg.vgId,
           pReader->pHead->head.version, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _err;
  }

  code = walValidBodyCksum(pReader->pHead);
  if (code != 0) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since body checksum not passed", pReader->pWal->cfg.vgId,
           ver);
    uint32_t readCkSum = walCalcBodyCksum(pReader->pHead->head.body, pReader->pHead->head.bodyLen);
    uint32_t logCkSum = pReader->pHead->cksumBody;
    wError("checksum written into log:%u, checksum calculated:%u", logCkSum, readCkSum);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _err;
  }
  pReader->curVersion++;

  taosThreadMutexUnlock(&pReader->mutex);

  return 0;

_err:
  // Single failure exit: terrno has been set by whoever jumped here.
  taosThreadMutexUnlock(&pReader->mutex);
  return -1;
}
577 578 579 580 581 582

/**
 * Return the reader to its unpositioned state while holding the reader mutex: both files are
 * closed and the current version / current file markers are set back to -1.
 */
void walReadReset(SWalReader *pReader) {
  taosThreadMutexLock(&pReader->mutex);

  // Invalidate the cursor and the file marker, then drop the file handles.
  pReader->curVersion = -1;
  pReader->curFileFirstVer = -1;
  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);

  taosThreadMutexUnlock(&pReader->mutex);
}