/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "taoserror.h"
L
Liu Jicong 已提交
17
#include "walInt.h"
S
Shengliang Guan 已提交
18

L
Liu Jicong 已提交
19 20 21 22
// Forward declarations of the file-local helpers that walNextValidMsg() calls;
// their definitions appear further down in this file.
static int32_t walFetchHeadNew(SWalReader *pRead, int64_t fetchVer);
static int32_t walFetchBodyNew(SWalReader *pRead);
static int32_t walSkipFetchBodyNew(SWalReader *pRead);

L
Liu Jicong 已提交
23
/**
 * Allocate and initialise a WAL reader bound to pWal.
 *
 * @param pWal WAL instance the reader reads from; the pointer is stored as-is.
 * @param cond Optional filter condition. When non-NULL it is copied into the
 *             reader; when NULL every filter flag is cleared.
 * @return The new reader, or NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY
 *         when either allocation fails. Release it with walCloseReader().
 */
SWalReader *walOpenReader(SWal *pWal, SWalFilterCond *cond) {
  SWalReader *pReader = taosMemoryCalloc(1, sizeof(SWalReader));
  if (pReader == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // Allocate the head buffer before the mutex is initialised, so the failure
  // path only has plain memory to release and never abandons a live mutex.
  pReader->pHead = taosMemoryMalloc(sizeof(SWalCkHead));
  if (pReader->pHead == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFree(pReader);
    return NULL;
  }

  pReader->pWal = pWal;
  pReader->readerId = tGenIdPI64();
  pReader->pIdxFile = NULL;
  pReader->pLogFile = NULL;
  pReader->curVersion = -1;
  pReader->curFileFirstVer = -1;
  pReader->curInvalid = 1;  // no valid file position until the first seek
  pReader->capacity = 0;    // pHead currently has no room for a record body

  if (cond) {
    pReader->cond = *cond;
  } else {
    pReader->cond.scanUncommited = 0;
    pReader->cond.scanNotApplied = 0;
    pReader->cond.scanMeta = 0;
    pReader->cond.enableRef = 0;
  }

  taosThreadMutexInit(&pReader->mutex, NULL);

  /*if (pReader->cond.enableRef) {*/
  /* taosHashPut(pWal->pRefHash, &pReader->readerId, sizeof(int64_t), &pReader, sizeof(void *));*/
  /*}*/

  return pReader;
}

63 64 65 66 67 68 69 70
/**
 * Release a reader created by walOpenReader(): close both files, destroy the
 * mutex, and free the head buffer and the reader itself.
 *
 * @param pReader Reader to release; NULL is accepted and ignored.
 */
void walCloseReader(SWalReader *pReader) {
  if (pReader == NULL) {
    return;
  }

  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);
  /*if (pReader->cond.enableRef) {*/
  /*taosHashRemove(pReader->pWal->pRefHash, &pReader->readerId, sizeof(int64_t));*/
  /*}*/

  // Pairs with the taosThreadMutexInit() done in walOpenReader().
  taosThreadMutexDestroy(&pReader->mutex);

  taosMemoryFreeClear(pReader->pHead);
  taosMemoryFree(pReader);
}

73 74 75 76 77 78
/**
 * Advance the reader to the next record it is configured to deliver.
 *
 * Starting at the reader's current version, record heads are fetched one by
 * one. A TDMT_VND_SUBMIT record, or a meta record when cond.scanMeta is set,
 * has its body fetched and is returned; every other record is skipped. The
 * scan stops at min(applied version, last or committed version), where the
 * last version is used only when cond.scanUncommited is set.
 *
 * @return 0 when a record was fetched into pReader->pHead; -1 when a fetch or
 *         skip failed, or when the end version was reached (in that case
 *         pReader->curStopped is set to 1).
 */
int32_t walNextValidMsg(SWalReader *pReader) {
  SWal   *pWal = pReader->pWal;
  int64_t cursor = pReader->curVersion;
  int64_t lastVer = walGetLastVer(pWal);
  int64_t committedVer = walGetCommittedVer(pWal);
  int64_t appliedVer = walGetAppliedVer(pWal);

  int64_t limit = committedVer;
  if (pReader->cond.scanUncommited) {
    limit = lastVer;
  }
  limit = TMIN(appliedVer, limit);

  wDebug("vgId:%d, wal start to fetch, index:%" PRId64 ", last index:%" PRId64 " commit index:%" PRId64
         ", applied index:%" PRId64 ", end index:%" PRId64,
         pWal->cfg.vgId, cursor, lastVer, committedVer, appliedVer, limit);
  pReader->curStopped = 0;

  // After each skipped record the cursor is re-read from the reader, because
  // the skip helper is what advances curVersion.
  for (; cursor <= limit; cursor = pReader->curVersion) {
    if (walFetchHeadNew(pReader, cursor) < 0) {
      return -1;
    }

    bool wanted = (pReader->pHead->head.msgType == TDMT_VND_SUBMIT) ||
                  (IS_META_MSG(pReader->pHead->head.msgType) && pReader->cond.scanMeta);
    if (wanted) {
      return (walFetchBodyNew(pReader) < 0) ? -1 : 0;
    }

    if (walSkipFetchBodyNew(pReader) < 0) {
      return -1;
    }
  }

  pReader->curStopped = 1;
  return -1;
}
L
Liu Jicong 已提交
105

106
/**
 * Position the reader's open idx/log file pair at the record for `ver`.
 *
 * The idx file is sought to entry number (ver - fileFirstVer), that entry is
 * read, and the log file is then sought to the offset stored in the entry.
 *
 * @param pReader      Reader whose pIdxFile/pLogFile are already open.
 * @param fileFirstVer First version of the currently open file pair.
 * @param ver          Version to position at.
 * @return The result of the log-file seek on success; -1 with terrno set when
 *         a seek or the idx read fails, or when the idx entry is short.
 */
static int64_t walReadSeekFilePos(SWalReader *pReader, int64_t fileFirstVer, int64_t ver) {
  int64_t ret = 0;

  TdFilePtr pIdxTFile = pReader->pIdxFile;
  TdFilePtr pLogTFile = pReader->pLogFile;

  // seek position; keep the arithmetic signed instead of mixing with size_t
  const int64_t entrySize = (int64_t)sizeof(SWalIdxEntry);
  int64_t       offset = (ver - fileFirstVer) * entrySize;
  ret = taosLSeekFile(pIdxTFile, offset, SEEK_SET);
  if (ret < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to seek idx file, index:%" PRId64 ", pos:%" PRId64 ", since %s", pReader->pWal->cfg.vgId,
           ver, offset, terrstr());
    return -1;
  }

  SWalIdxEntry entry = {0};
  ret = taosReadFile(pIdxTFile, &entry, sizeof(SWalIdxEntry));
  if (ret != entrySize) {
    if (ret < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, failed to read idx file, since %s", pReader->pWal->cfg.vgId, terrstr());
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
      // The expected size is printed as int64_t: a size_t argument does not
      // match "%ld" on every platform.
      wError("vgId:%d, read idx file incompletely, read bytes %" PRId64 ", bytes should be %" PRId64,
             pReader->pWal->cfg.vgId, ret, entrySize);
    }
    return -1;
  }

  ASSERT(entry.ver == ver);

  ret = taosLSeekFile(pLogTFile, entry.offset, SEEK_SET);
  if (ret < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to seek log file, index:%" PRId64 ", pos:%" PRId64 ", since %s", pReader->pWal->cfg.vgId,
           ver, entry.offset, terrstr());
    return -1;
  }
  return ret;
}

145
/**
 * Switch the reader to the log/idx file pair whose first version is
 * fileFirstVer.
 *
 * The currently open pair is closed first. The new pair is attached to the
 * reader only when both files open successfully; on any failure the reader is
 * left with no open files and curFileFirstVer == -1, so the next seek has to
 * open a pair again instead of trusting a stale segment marker.
 *
 * @param pReader      Reader to update.
 * @param fileFirstVer First version of the file pair to open.
 * @return 0 on success; -1 with terrno set when either file cannot be opened.
 */
static int32_t walReadChangeFile(SWalReader *pReader, int64_t fileFirstVer) {
  char fnameStr[WAL_FILE_LEN] = {0};

  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);
  // Nothing is open from here on; forget which segment used to be current.
  pReader->curFileFirstVer = -1;

  walBuildLogName(pReader->pWal, fileFirstVer, fnameStr);
  TdFilePtr pLogFile = taosOpenFile(fnameStr, TD_FILE_READ);
  if (pLogFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, cannot open file %s, since %s", pReader->pWal->cfg.vgId, fnameStr, terrstr());
    return -1;
  }

  walBuildIdxName(pReader->pWal, fileFirstVer, fnameStr);
  TdFilePtr pIdxFile = taosOpenFile(fnameStr, TD_FILE_READ);
  if (pIdxFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, cannot open file %s, since %s", pReader->pWal->cfg.vgId, fnameStr, terrstr());
    // Do not leave a log file attached without its idx file.
    taosCloseFile(&pLogFile);
    return -1;
  }

  pReader->pLogFile = pLogFile;
  pReader->pIdxFile = pIdxFile;
  pReader->curFileFirstVer = fileFirstVer;

  return 0;
}

176 177
/**
 * Locate the WAL file that holds `ver`, open it if it is not the reader's
 * current file, and position the reader at that version.
 *
 * The file is looked up in pWal->fileInfoSet with taosArraySearch(..., TD_LE),
 * keyed on firstVer (presumably the file with the greatest firstVer <= ver;
 * confirm against compareWalFileInfo).
 *
 * @param pReader Reader to reposition.
 * @param ver     Version to seek to.
 * @return 0 on success with pReader->curVersion set to ver; -1 with terrno
 *         set when no file matches or a helper fails.
 */
int32_t walReadSeekVerImpl(SWalReader *pReader, int64_t ver) {
  SWal *pWal = pReader->pWal;

  // Only firstVer takes part in the lookup key.
  SWalFileInfo key;
  key.firstVer = ver;

  SWalFileInfo *pInfo = taosArraySearch(pWal->fileInfoSet, &key, compareWalFileInfo, TD_LE);
  if (pInfo == NULL) {
    wError("failed to find WAL log file with ver:%" PRId64, ver);
    terrno = TSDB_CODE_WAL_INVALID_VER;
    return -1;
  }

  // Both helpers set terrno themselves on failure.
  bool needSwitch = (pReader->curFileFirstVer != pInfo->firstVer);
  if (needSwitch && walReadChangeFile(pReader, pInfo->firstVer) < 0) {
    return -1;
  }
  if (walReadSeekFilePos(pReader, pInfo->firstVer, ver) < 0) {
    return -1;
  }

  wDebug("vgId:%d, wal version reset from %" PRId64 "(invalid:%d) to %" PRId64, pReader->pWal->cfg.vgId,
         pReader->curVersion, pReader->curInvalid, ver);

  pReader->curVersion = ver;
  return 0;
}

207 208 209
/**
 * Move the reader's cursor to `ver`, seeking only when necessary.
 *
 * If the cursor is valid and already at `ver`, nothing is done. Otherwise the
 * cursor is marked invalid, curVersion is set to `ver`, the version is checked
 * against the WAL's [firstVer, lastVer] range, and the file seek is performed.
 * This function never clears curInvalid.
 *
 * @param pReader Reader to reposition.
 * @param ver     Version to seek to.
 * @return 0 on success; -1 with terrno = TSDB_CODE_WAL_LOG_NOT_EXIST when
 *         `ver` is out of range, or -1 with terrno set by the seek helper.
 */
int32_t walReadSeekVer(SWalReader *pReader, int64_t ver) {
  SWal *pWal = pReader->pWal;
  if (!pReader->curInvalid && ver == pReader->curVersion) {
    wDebug("vgId:%d, wal index:%" PRId64 " match, no need to reset", pReader->pWal->cfg.vgId, ver);
    return 0;
  }

  pReader->curInvalid = 1;
  pReader->curVersion = ver;

  if (ver > pWal->vers.lastVer || ver < pWal->vers.firstVer) {
    wDebug("vgId:%d, invalid index:%" PRId64 ", first index:%" PRId64 ", last index:%" PRId64, pReader->pWal->cfg.vgId,
           ver, pWal->vers.firstVer, pWal->vers.lastVer);
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  if (walReadSeekVerImpl(pReader, ver) < 0) {
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
233
/**
 * Store `capacity` in the reader's capacity field. The fetch routines in this
 * file compare that field with a record's bodyLen to decide whether the head
 * buffer has to be reallocated before the body is read.
 */
void walSetReaderCapacity(SWalReader *pRead, int32_t capacity) {
  pRead->capacity = capacity;
}
234

L
Liu Jicong 已提交
235 236
/**
 * Read the record head for fetchVer into pRead->pHead.
 *
 * The reader is sought to fetchVer first when its cursor is invalid or at a
 * different version. If the head read returns 0 bytes and no seek has been
 * done in this call, the reader is re-sought once through
 * walReadSeekVerImpl() and the read is retried.
 *
 * @param pRead    Reader to fetch with.
 * @param fetchVer Version whose head is wanted.
 * @return 0 on success (curInvalid cleared); -1 with terrno set and
 *         curInvalid = 1 on seek failure, read error, or short read.
 */
static int32_t walFetchHeadNew(SWalReader *pRead, int64_t fetchVer) {
  int64_t contLen;
  bool    seeked = false;

  wDebug("vgId:%d, wal starts to fetch head, index:%" PRId64, pRead->pWal->cfg.vgId, fetchVer);

  if (pRead->curInvalid || pRead->curVersion != fetchVer) {
    if (walReadSeekVer(pRead, fetchVer) < 0) {
      pRead->curVersion = fetchVer;
      pRead->curInvalid = 1;
      return -1;
    }
    seeked = true;
  }

  while (1) {
    contLen = taosReadFile(pRead->pLogFile, pRead->pHead, sizeof(SWalCkHead));
    if (contLen == (int64_t)sizeof(SWalCkHead)) {
      break;
    }

    if (contLen == 0 && !seeked) {
      // A failed re-seek must end the fetch here: reading again would only
      // replace the real error with a misleading "file corrupted".
      if (walReadSeekVerImpl(pRead, fetchVer) < 0) {
        pRead->curInvalid = 1;
        return -1;
      }
      seeked = true;
      continue;
    }

    if (contLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    pRead->curInvalid = 1;
    return -1;
  }

  pRead->curInvalid = 0;
  return 0;
}

/**
 * Read the body of the record whose head is already in pRead->pHead.
 *
 * The head buffer is grown when pRead->capacity is smaller than the body
 * length, the body is read from the log file, and the body checksum is
 * validated. On success the cursor advances to the next version.
 *
 * @param pRead Reader holding a fetched head.
 * @return 0 on success; -1 with terrno set on allocation failure, read error,
 *         short read, or checksum mismatch. Every failure except allocation
 *         failure also sets curInvalid = 1.
 */
static int32_t walFetchBodyNew(SWalReader *pRead) {
  SWalCont *pReadHead = &pRead->pHead->head;
  int64_t   ver = pReadHead->version;

  wDebug("vgId:%d, wal starts to fetch body, index:%" PRId64, pRead->pWal->cfg.vgId, ver);

  if (pRead->capacity < pReadHead->bodyLen) {
    SWalCkHead *ptr = (SWalCkHead *)taosMemoryRealloc(pRead->pHead, sizeof(SWalCkHead) + pReadHead->bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    pRead->pHead = ptr;
    // The buffer may have moved; refresh the alias before using it again.
    pReadHead = &pRead->pHead->head;
    pRead->capacity = pReadHead->bodyLen;
  }

  // Keep the read result: its sign, not bodyLen's, tells a system error
  // apart from a short (corrupted) read.
  int64_t readLen = taosReadFile(pRead->pLogFile, pReadHead->body, pReadHead->bodyLen);
  if (readLen != pReadHead->bodyLen) {
    if (readLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since %s",
             pRead->pWal->cfg.vgId, pRead->pHead->head.version, ver, tstrerror(terrno));
    } else {
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since file corrupted",
             pRead->pWal->cfg.vgId, pRead->pHead->head.version, ver);
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    pRead->curInvalid = 1;
    return -1;
  }

  if (walValidBodyCksum(pRead->pHead) != 0) {
    wError("vgId:%d, wal fetch body error:%" PRId64 ", since body checksum not passed", pRead->pWal->cfg.vgId, ver);
    pRead->curInvalid = 1;
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  wDebug("vgId:%d, index:%" PRId64 " is fetched, cursor advance", pRead->pWal->cfg.vgId, ver);
  pRead->curVersion = ver + 1;
  return 0;
}

/**
 * Skip the body of the record whose head is in pRead->pHead by seeking the
 * log file forward by head.bodyLen bytes, then advance the cursor by one.
 *
 * Asserts that the cursor is valid and sits at the version of the held head.
 *
 * @param pRead Reader holding a fetched head.
 * @return 0 on success; -1 with terrno set and curInvalid = 1 when the seek
 *         fails.
 */
static int32_t walSkipFetchBodyNew(SWalReader *pRead) {
  ASSERT(pRead->curVersion == pRead->pHead->head.version);
  ASSERT(pRead->curInvalid == 0);

  if (taosLSeekFile(pRead->pLogFile, pRead->pHead->head.bodyLen, SEEK_CUR) < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    pRead->curInvalid = 1;
    return -1;
  }

  pRead->curVersion += 1;
  wDebug("vgId:%d, version advance to %" PRId64 ", skip fetch", pRead->pWal->cfg.vgId, pRead->curVersion);

  return 0;
}

L
Liu Jicong 已提交
333
/**
 * Read the record head for `ver` into the caller-provided buffer pHead and
 * validate its checksum.
 *
 * The reader is sought to `ver` first when its cursor is invalid or at a
 * different version. If the head read returns 0 bytes and no seek has been
 * done in this call, the reader is re-sought once and the read is retried.
 *
 * @param pRead Reader to fetch with.
 * @param ver   Version whose head is wanted.
 * @param pHead Destination for the head; must hold at least sizeof(SWalCkHead).
 * @return 0 on success (curInvalid cleared); -1 on failure. terrno is set on
 *         seek, read and checksum failures, but not when `ver` is beyond the
 *         applied version. Failures after the range check set curInvalid = 1.
 */
int32_t walFetchHead(SWalReader *pRead, int64_t ver, SWalCkHead *pHead) {
  int64_t contLen;
  bool    seeked = false;

  wDebug("vgId:%d, try to fetch ver %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pRead->pWal->cfg.vgId, ver, pRead->pWal->vers.firstVer, pRead->pWal->vers.commitVer, pRead->pWal->vers.lastVer,
         pRead->pWal->vers.appliedVer);

  // TODO: valid ver
  if (ver > pRead->pWal->vers.appliedVer) {
    return -1;
  }

  if (pRead->curInvalid || pRead->curVersion != ver) {
    if (walReadSeekVer(pRead, ver) < 0) {
      pRead->curVersion = ver;
      pRead->curInvalid = 1;
      return -1;
    }
    seeked = true;
  }

  while (1) {
    contLen = taosReadFile(pRead->pLogFile, pHead, sizeof(SWalCkHead));
    if (contLen == (int64_t)sizeof(SWalCkHead)) {
      break;
    }

    if (contLen == 0 && !seeked) {
      // A failed re-seek must end the fetch here: reading again would only
      // replace the real error with a misleading "file corrupted".
      if (walReadSeekVerImpl(pRead, ver) < 0) {
        pRead->curInvalid = 1;
        return -1;
      }
      seeked = true;
      continue;
    }

    if (contLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    pRead->curInvalid = 1;
    return -1;
  }

  if (walValidHeadCksum(pHead) != 0) {
    wError("vgId:%d, unexpected wal log index:%" PRId64 ", since head checksum not passed", pRead->pWal->cfg.vgId, ver);
    // The file position is already past this head, so the cursor no longer
    // matches it; force a seek on the next fetch.
    pRead->curInvalid = 1;
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  pRead->curInvalid = 0;
  return 0;
}

L
Liu Jicong 已提交
389
/**
 * Skip the body belonging to pHead by seeking the log file forward by
 * pHead->head.bodyLen bytes, then advance the cursor by one version.
 *
 * Asserts that the cursor is valid and sits at pHead's version.
 *
 * @param pRead Reader positioned right after the head of the record.
 * @param pHead Head of the record whose body is skipped.
 * @return 0 on success; -1 with terrno set and curInvalid = 1 when the seek
 *         fails.
 */
int32_t walSkipFetchBody(SWalReader *pRead, const SWalCkHead *pHead) {
  SWal *pWal = pRead->pWal;

  wDebug("vgId:%d, skip fetch body %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pWal->cfg.vgId, pHead->head.version, pWal->vers.firstVer, pWal->vers.commitVer, pWal->vers.lastVer,
         pWal->vers.appliedVer);

  ASSERT(pRead->curVersion == pHead->head.version);
  ASSERT(pRead->curInvalid == 0);

  if (taosLSeekFile(pRead->pLogFile, pHead->head.bodyLen, SEEK_CUR) < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    pRead->curInvalid = 1;
    return -1;
  }

  pRead->curVersion += 1;
  return 0;
}

L
Liu Jicong 已提交
412
/**
 * Read the body of the record whose head is in *ppHead.
 *
 * *ppHead is reallocated when pRead->capacity is smaller than the body
 * length, so the caller's pointer may change. The body is read from the log
 * file, then the version and the body checksum are verified. On success the
 * cursor advances to the next version.
 *
 * @param pRead  Reader positioned right after the head of the record.
 * @param ppHead In/out pointer to the head buffer; updated when it is grown.
 * @return 0 on success; -1 with terrno set on allocation failure, read error,
 *         short read, version mismatch, or checksum mismatch. Every failure
 *         except allocation failure also sets curInvalid = 1.
 */
int32_t walFetchBody(SWalReader *pRead, SWalCkHead **ppHead) {
  SWalCont *pReadHead = &((*ppHead)->head);
  int64_t   ver = pReadHead->version;

  wDebug("vgId:%d, fetch body %" PRId64 ", first ver:%" PRId64 ", commit ver:%" PRId64 ", last ver:%" PRId64
         ", applied ver:%" PRId64,
         pRead->pWal->cfg.vgId, ver, pRead->pWal->vers.firstVer, pRead->pWal->vers.commitVer, pRead->pWal->vers.lastVer,
         pRead->pWal->vers.appliedVer);

  if (pRead->capacity < pReadHead->bodyLen) {
    SWalCkHead *ptr = (SWalCkHead *)taosMemoryRealloc(*ppHead, sizeof(SWalCkHead) + pReadHead->bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      return -1;
    }
    *ppHead = ptr;
    // The buffer may have moved; refresh the alias before using it again.
    pReadHead = &((*ppHead)->head);
    pRead->capacity = pReadHead->bodyLen;
  }

  // Keep the read result: its sign, not bodyLen's, tells a system error
  // apart from a short (corrupted) read.
  int64_t readLen = taosReadFile(pRead->pLogFile, pReadHead->body, pReadHead->bodyLen);
  if (readLen != pReadHead->bodyLen) {
    if (readLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since %s",
             pRead->pWal->cfg.vgId, pReadHead->version, ver, tstrerror(terrno));
    } else {
      wError("vgId:%d, wal fetch body error:%" PRId64 ", read request index:%" PRId64 ", since file corrupted",
             pRead->pWal->cfg.vgId, pReadHead->version, ver);
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    pRead->curInvalid = 1;
    return -1;
  }

  if (pReadHead->version != ver) {
    wError("vgId:%d, wal fetch body error, index:%" PRId64 ", read request index:%" PRId64, pRead->pWal->cfg.vgId,
           pReadHead->version, ver);
    pRead->curInvalid = 1;
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  if (walValidBodyCksum(*ppHead) != 0) {
    wError("vgId:%d, wal fetch body error, index:%" PRId64 ", since body checksum not passed", pRead->pWal->cfg.vgId,
           ver);
    pRead->curInvalid = 1;
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    return -1;
  }

  pRead->curVersion = ver + 1;
  return 0;
}

466
/**
 * Read the complete record (head and body) for `ver` into pReader->pHead.
 *
 * The version is first checked against the WAL's [firstVer, lastVer] range.
 * The rest runs under pReader->mutex: seek if the cursor is invalid or at a
 * different version, read and checksum the head, grow the head buffer if the
 * body does not fit, read the body, then verify the version and the body
 * checksum. On success the cursor advances by one version.
 *
 * @param pReader Reader to read with.
 * @param ver     Version to read.
 * @return 0 on success; -1 with terrno set on failure. Any failure that
 *         happens while the mutex is held also sets curInvalid = 1, because
 *         the file position can no longer be trusted to match the cursor.
 */
int32_t walReadVer(SWalReader *pReader, int64_t ver) {
  wDebug("vgId:%d, wal start to read index:%" PRId64, pReader->pWal->cfg.vgId, ver);
  int64_t contLen;
  int32_t code = -1;
  bool    seeked = false;

  if (walIsEmpty(pReader->pWal)) {
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  if (ver > pReader->pWal->vers.lastVer || ver < pReader->pWal->vers.firstVer) {
    wDebug("vgId:%d, invalid index:%" PRId64 ", first index:%" PRId64 ", last index:%" PRId64, pReader->pWal->cfg.vgId,
           ver, pReader->pWal->vers.firstVer, pReader->pWal->vers.lastVer);
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
    return -1;
  }

  taosThreadMutexLock(&pReader->mutex);

  if (pReader->curInvalid || pReader->curVersion != ver) {
    if (walReadSeekVer(pReader, ver) < 0) {
      wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since %s", pReader->pWal->cfg.vgId, ver, terrstr());
      goto unlock;
    }
    seeked = true;
  }

  while (1) {
    contLen = taosReadFile(pReader->pLogFile, pReader->pHead, sizeof(SWalCkHead));
    if (contLen == (int64_t)sizeof(SWalCkHead)) {
      break;
    }

    if (contLen == 0 && !seeked) {
      // A failed re-seek must end the read here: reading again would only
      // replace the real error with a misleading "file corrupted".
      if (walReadSeekVerImpl(pReader, ver) < 0) {
        wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since %s", pReader->pWal->cfg.vgId, ver, terrstr());
        goto unlock;
      }
      seeked = true;
      continue;
    }

    if (contLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    wError("vgId:%d, failed to read WAL record head, index:%" PRId64 ", from log file since %s",
           pReader->pWal->cfg.vgId, ver, terrstr());
    goto unlock;
  }

  if (walValidHeadCksum(pReader->pHead) != 0) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since head checksum not passed", pReader->pWal->cfg.vgId,
           ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto unlock;
  }

  if (pReader->capacity < pReader->pHead->head.bodyLen) {
    SWalCkHead *ptr =
        (SWalCkHead *)taosMemoryRealloc(pReader->pHead, sizeof(SWalCkHead) + pReader->pHead->head.bodyLen);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto unlock;
    }
    pReader->pHead = ptr;
    pReader->capacity = pReader->pHead->head.bodyLen;
  }

  contLen = taosReadFile(pReader->pLogFile, pReader->pHead->head.body, pReader->pHead->head.bodyLen);
  if (contLen != pReader->pHead->head.bodyLen) {
    if (contLen < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
    } else {
      terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    }
    wError("vgId:%d, failed to read WAL record body, index:%" PRId64 ", from log file since %s",
           pReader->pWal->cfg.vgId, ver, terrstr());
    goto unlock;
  }

  if (pReader->pHead->head.version != ver) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", read request index:%" PRId64, pReader->pWal->cfg.vgId,
           pReader->pHead->head.version, ver);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto unlock;
  }

  if (walValidBodyCksum(pReader->pHead) != 0) {
    wError("vgId:%d, unexpected wal log, index:%" PRId64 ", since body checksum not passed", pReader->pWal->cfg.vgId,
           ver);
    uint32_t readCkSum = walCalcBodyCksum(pReader->pHead->head.body, pReader->pHead->head.bodyLen);
    uint32_t logCkSum = pReader->pHead->cksumBody;
    wError("checksum written into log:%u, checksum calculated:%u", logCkSum, readCkSum);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto unlock;
  }

  pReader->curVersion++;
  code = 0;

unlock:
  // Single exit for everything done under the mutex: a failure leaves the
  // file position unknown, so force a seek on the next read.
  if (code != 0) {
    pReader->curInvalid = 1;
  }
  taosThreadMutexUnlock(&pReader->mutex);
  return code;
}
577 578 579 580 581 582 583 584 585

/**
 * Drop the reader's file state under its mutex: mark the cursor invalid,
 * forget the current file's first version, and close the idx and log files.
 */
void walReadReset(SWalReader *pReader) {
  taosThreadMutexLock(&pReader->mutex);

  // Invalidate the bookkeeping first, then let go of the file handles.
  pReader->curFileFirstVer = -1;
  pReader->curInvalid = 1;
  taosCloseFile(&pReader->pIdxFile);
  taosCloseFile(&pReader->pLogFile);

  taosThreadMutexUnlock(&pReader->mutex);
}