walMeta.c 30.6 KB
Newer Older
L
Liu Jicong 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "cJSON.h"
L
Liu Jicong 已提交
17 18
#include "os.h"
#include "taoserror.h"
19
#include "tglobal.h"
L
Liu Jicong 已提交
20
#include "tutil.h"
L
Liu Jicong 已提交
21 22
#include "walInt.h"

A
Alex Duan 已提交
23

24 25 26 27
// Returns true when the WAL is not empty and ver lies within [firstVer, lastVer].
bool FORCE_INLINE walLogExist(SWal* pWal, int64_t ver) {
  if (walIsEmpty(pWal)) {
    return false;
  }
  if (walGetFirstVer(pWal) > ver) {
    return false;
  }
  return walGetLastVer(pWal) >= ver;
}

28
// Returns true when the WAL holds no entries: either firstVer is unset (-1)
// or lastVer lies before firstVer.
bool FORCE_INLINE walIsEmpty(SWal* pWal) {
  // valid entries occupy [firstVer, lastVer + 1)
  if (pWal->vers.firstVer == -1) {
    return true;
  }
  return pWal->vers.lastVer < pWal->vers.firstVer;
}
L
Liu Jicong 已提交
31

L
Liu Jicong 已提交
32
// Accessor: returns pWal->vers.firstVer.
int64_t FORCE_INLINE walGetFirstVer(SWal* pWal) {
  return pWal->vers.firstVer;
}
L
Liu Jicong 已提交
33

L
Liu Jicong 已提交
34
// Accessor: returns pWal->vers.snapshotVer.
int64_t FORCE_INLINE walGetSnapshotVer(SWal* pWal) {
  return pWal->vers.snapshotVer;
}
L
Liu Jicong 已提交
35

L
Liu Jicong 已提交
36
// Accessor: returns pWal->vers.lastVer.
int64_t FORCE_INLINE walGetLastVer(SWal* pWal) {
  return pWal->vers.lastVer;
}
L
Liu Jicong 已提交
37

L
Liu Jicong 已提交
38 39
// Accessor: returns pWal->vers.commitVer.
int64_t FORCE_INLINE walGetCommittedVer(SWal* pWal) {
  return pWal->vers.commitVer;
}

L
Liu Jicong 已提交
40 41
// Accessor: returns pWal->vers.appliedVer.
int64_t FORCE_INLINE walGetAppliedVer(SWal* pWal) {
  return pWal->vers.appliedVer;
}

42 43 44 45 46 47
// Formats "<pWal->path>/meta-ver<metaVer>" into buf and returns the sprintf result.
// NOTE(review): the size of buf is not passed in; the caller must supply a buffer
// that is large enough for the formatted path.
static FORCE_INLINE int walBuildMetaName(SWal* pWal, int metaVer, char* buf) {
  int written = sprintf(buf, "%s/meta-ver%d", pWal->path, metaVer);
  return written;
}

// Formats "<pWal->path>/meta-ver.tmp" into buf and returns the sprintf result.
// NOTE(review): the size of buf is not passed in; the caller must supply a buffer
// that is large enough for the formatted path.
static FORCE_INLINE int walBuildTmpMetaName(SWal* pWal, char* buf) {
  int written = sprintf(buf, "%s/meta-ver.tmp", pWal->path);
  return written;
}

50
// Scan one WAL log file for its last valid entry and cut off whatever follows it.
//
// The scan starts near the size recorded in the file info (clamped to the actual file size).
// While no valid entry has been found it steps backwards block by block and searches each
// block for the WAL magic. Once an entry validates (or the offset reaches 0) it walks forward
// entry by entry until a checksum fails or the end of the file is reached. The file is then
// truncated to the end of the last valid entry and pFileInfo->fileSize is updated.
//
// Returns the version of the last valid entry. Returns -1 with terrno set on failure; when the
// file holds no valid entry, terrno is TSDB_CODE_WAL_LOG_NOT_EXIST and the file is truncated
// to zero length.
static FORCE_INLINE int64_t walScanLogGetLastVer(SWal* pWal, int32_t fileIdx) {
  SWalFileInfo* pFileInfo = taosArrayGet(pWal->fileInfoSet, fileIdx);
  char          fnameStr[WAL_FILE_LEN];
  walBuildLogName(pWal, pFileInfo->firstVer, fnameStr);

  int64_t fileSize = 0;
  if (taosStatFile(fnameStr, &fileSize, NULL) < 0) {
    // without a trustworthy size the scan bounds below would be meaningless
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to stat file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), fnameStr);
    return -1;
  }

  TdFilePtr pFile = taosOpenFile(fnameStr, TD_FILE_READ | TD_FILE_WRITE);
  if (pFile == NULL) {
    wError("vgId:%d, failed to open file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), fnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  // ensure size as non-negative
  pFileInfo->fileSize = TMAX(0, pFileInfo->fileSize);

  int64_t  stepSize = WAL_SCAN_BUF_SIZE;
  uint64_t magic = WAL_MAGIC;
  int64_t  walCkHeadSz = sizeof(SWalCkHead);
  int64_t  end = fileSize;
  int64_t  capacity = 0;
  int64_t  readSize = 0;
  char*    buf = NULL;
  int64_t  offset = TMIN(pFileInfo->fileSize, fileSize);
  int64_t  retVer = -1;
  int64_t  lastEntryBeginOffset = 0;
  int64_t  lastEntryEndOffset = 0;
  int64_t  recordLen = 0;
  bool     forwardStage = false;

  // check recover size
  if (2 * tsWalFsyncDataSizeLimit + offset < end) {
    wWarn("vgId:%d, possibly corrupted WAL range exceeds size limit (i.e. %" PRId64 " bytes). offset:%" PRId64
          ", end:%" PRId64 ", file:%s",
          pWal->cfg.vgId, 2 * tsWalFsyncDataSizeLimit, offset, end, fnameStr);
  }

  // search for the valid last WAL entry, e.g. block by block
  while (1) {
    // until an entry has been found, step one block backwards; the overlap of
    // (walCkHeadSz - 1) bytes keeps a header that straddles two blocks discoverable
    offset = (lastEntryEndOffset > 0) ? offset : TMAX(0, offset - stepSize + walCkHeadSz - 1);
    end = TMIN(offset + stepSize, fileSize);

    readSize = end - offset;
    capacity = readSize + sizeof(magic);

    void* ptr = taosMemoryRealloc(buf, capacity);
    if (ptr == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      goto _err;
    }
    buf = ptr;

    int64_t ret = taosLSeekFile(pFile, offset, SEEK_SET);
    if (ret < 0) {
      wError("vgId:%d, failed to lseek file due to %s. offset:%" PRId64 "", pWal->cfg.vgId, strerror(errno), offset);
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    if (readSize != taosReadFile(pFile, buf, readSize)) {
      wError("vgId:%d, failed to read file due to %s. readSize:%" PRId64 ", file:%s", pWal->cfg.vgId, strerror(errno),
             readSize, fnameStr);
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    char*       candidate = NULL;
    char*       haystack = buf;
    int64_t     pos = 0;
    SWalCkHead* logContent = NULL;

    while (true) {
      // forward stage: entries are contiguous, so the next one starts right at haystack;
      // otherwise look for the magic anywhere in the remaining part of the block
      forwardStage = (lastEntryEndOffset > 0 || offset == 0);
      terrno = TSDB_CODE_SUCCESS;
      if (forwardStage) {
        candidate = (readSize - (haystack - buf)) > 0 ? haystack : NULL;
      } else {
        candidate = tmemmem(haystack, readSize - (haystack - buf), (char*)&magic, sizeof(magic));
      }

      if (candidate == NULL) break;
      pos = candidate - buf;

      // validate head
      int64_t len = readSize - pos;
      if (len < walCkHeadSz) {
        break;
      }

      logContent = (SWalCkHead*)(buf + pos);
      if (walValidHeadCksum(logContent) != 0) {
        terrno = TSDB_CODE_WAL_CHKSUM_MISMATCH;
        wWarn("vgId:%d, failed to validate checksum of wal entry header. offset:%" PRId64 ", file:%s", pWal->cfg.vgId,
              offset + pos, fnameStr);
        haystack = buf + pos + 1;
        if (forwardStage) {
          break;
        } else {
          continue;
        }
      }

      // validate body
      recordLen = walCkHeadSz + logContent->head.bodyLen;
      if (len < recordLen) {
        // the body runs past the block that was read: fetch the missing tail
        int64_t extraSize = recordLen - len;
        if (capacity < readSize + extraSize + sizeof(magic)) {
          capacity += extraSize;
          void* pGrown = taosMemoryRealloc(buf, capacity);
          if (pGrown == NULL) {
            terrno = TSDB_CODE_OUT_OF_MEMORY;
            goto _err;
          }
          buf = pGrown;
        }
        int64_t seekRet = taosLSeekFile(pFile, offset + readSize, SEEK_SET);
        if (seekRet < 0) {
          wError("vgId:%d, failed to lseek file due to %s. offset:%" PRId64 "", pWal->cfg.vgId, strerror(errno),
                 offset + readSize);
          terrno = TAOS_SYSTEM_ERROR(errno);
          break;
        }
        if (extraSize != taosReadFile(pFile, buf + readSize, extraSize)) {
          wError("vgId:%d, failed to read file due to %s. offset:%" PRId64 ", extraSize:%" PRId64 ", file:%s",
                 pWal->cfg.vgId, strerror(errno), offset + readSize, extraSize, fnameStr);
          terrno = TAOS_SYSTEM_ERROR(errno);
          break;
        }
      }

      // buf may have been reallocated above, so recompute the entry pointer
      logContent = (SWalCkHead*)(buf + pos);
      if (walValidBodyCksum(logContent) != 0) {
        terrno = TSDB_CODE_WAL_CHKSUM_MISMATCH;
        wWarn("vgId:%d, failed to validate checksum of wal entry body. offset:%" PRId64 ", file:%s", pWal->cfg.vgId,
              offset + pos, fnameStr);
        haystack = buf + pos + 1;
        if (forwardStage) {
          break;
        } else {
          continue;
        }
      }

      // found one
      retVer = logContent->head.version;
      lastEntryBeginOffset = offset + pos;
      lastEntryEndOffset = offset + pos + recordLen;

      // try next
      haystack = buf + pos + recordLen;
    }

    offset = (lastEntryEndOffset > 0) ? lastEntryEndOffset : offset;
    if (forwardStage && (terrno != TSDB_CODE_SUCCESS || end == fileSize)) break;
  }

  if (retVer < 0) {
    terrno = TSDB_CODE_WAL_LOG_NOT_EXIST;
  }

  // truncate file
  if (lastEntryEndOffset != fileSize) {
    wWarn("vgId:%d, repair meta truncate file %s to %" PRId64 ", orig size %" PRId64, pWal->cfg.vgId, fnameStr,
          lastEntryEndOffset, fileSize);

    if (taosFtruncateFile(pFile, lastEntryEndOffset) < 0) {
      wError("failed to truncate file due to %s. file:%s", strerror(errno), fnameStr);
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    if (taosFsyncFile(pFile) < 0) {
      wError("failed to fsync file due to %s. file:%s", strerror(errno), fnameStr);
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }
  }

  pFileInfo->fileSize = lastEntryEndOffset;

  taosCloseFile(&pFile);
  taosMemoryFree(buf);
  return retVer;

_err:
  taosCloseFile(&pFile);
  taosMemoryFree(buf);
  return -1;
}

243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273
// Replace the content of metaLogList with the entries of actualLogList. An actual entry
// whose firstVer matches a meta entry first takes over that meta entry's whole record.
// Both lists are expected to be sorted by firstVer in ascending order.
static void walRebuildFileInfoSet(SArray* metaLogList, SArray* actualLogList) {
  int numMeta = taosArrayGetSize(metaLogList);
  int numActual = taosArrayGetSize(actualLogList);
  int metaIdx = 0;

  // merge pass over the two ascending lists
  for (int logIdx = 0; logIdx < numActual; ++logIdx) {
    SWalFileInfo* pActual = taosArrayGet(actualLogList, logIdx);

    for (; metaIdx < numMeta; ++metaIdx) {
      SWalFileInfo* pMeta = taosArrayGet(metaLogList, metaIdx);
      if (pMeta->firstVer < pActual->firstVer) {
        // meta entry without a matching log file: skip it
        continue;
      }
      if (pMeta->firstVer == pActual->firstVer) {
        *pActual = *pMeta;
        ++metaIdx;
      }
      break;
    }
  }

  taosArrayClear(metaLogList);

  for (int logIdx = 0; logIdx < numActual; ++logIdx) {
    taosArrayPush(metaLogList, taosArrayGet(actualLogList, logIdx));
  }
}

// Bring firstVer/lastVer in line with snapshotVer and reset commitVer and appliedVer
// to snapshotVer.
void walAlignVersions(SWal* pWal) {
  // snapshotVer is not modified here, so it is read once
  const int64_t snapVer = pWal->vers.snapshotVer;

  if (pWal->vers.firstVer > snapVer + 1) {
    wWarn("vgId:%d, firstVer:%" PRId64 " is larger than snapshotVer:%" PRId64 " + 1. align with it.", pWal->cfg.vgId,
          pWal->vers.firstVer, snapVer);
    pWal->vers.firstVer = snapVer + 1;
  }

  if (pWal->vers.lastVer < snapVer) {
    wWarn("vgId:%d, lastVer:%" PRId64 " is less than snapshotVer:%" PRId64 ". align with it.", pWal->cfg.vgId,
          pWal->vers.lastVer, snapVer);
    const bool walWasEmpty = (pWal->vers.lastVer < pWal->vers.firstVer);
    if (walWasEmpty) {
      pWal->vers.firstVer = snapVer + 1;
    }
    pWal->vers.lastVer = snapVer;
  }

  // reset commitVer and appliedVer
  pWal->vers.commitVer = snapVer;
  pWal->vers.appliedVer = snapVer;
  wInfo("vgId:%d, reset commitVer to %" PRId64, pWal->cfg.vgId, pWal->vers.commitVer);
}

293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322
// Fill in missing timestamps of every log file except the last one.
//
// A file whose closeTs is -1 gets the mtime reported by taosStatFile as its closeTs; a
// createTs of -1 is replaced by the closeTs of the preceding file (0 when there is none).
// *updateMeta is set to true (when updateMeta is not NULL) as soon as one entry is repaired.
//
// Returns 0 on success, -1 with terrno set when a log file cannot be stat'ed.
int walRepairLogFileTs(SWal* pWal, bool* updateMeta) {
  int32_t sz = taosArrayGetSize(pWal->fileInfoSet);
  int32_t fileIdx = -1;
  // closeTs is written as a 64-bit value elsewhere in this file, so carry it without
  // narrowing to 32 bits
  int64_t lastCloseTs = 0;
  char    fnameStr[WAL_FILE_LEN] = {0};

  // the last file is the one currently written to, hence sz - 1
  while (++fileIdx < sz - 1) {
    SWalFileInfo* pFileInfo = taosArrayGet(pWal->fileInfoSet, fileIdx);
    if (pFileInfo->closeTs != -1) {
      lastCloseTs = pFileInfo->closeTs;
      continue;
    }

    walBuildLogName(pWal, pFileInfo->firstVer, fnameStr);
    int32_t mtime = 0;
    if (taosStatFile(fnameStr, NULL, &mtime) < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, failed to stat file due to %s, file:%s", pWal->cfg.vgId, strerror(errno), fnameStr);
      return -1;
    }

    if (updateMeta != NULL) *updateMeta = true;
    if (pFileInfo->createTs == -1) pFileInfo->createTs = lastCloseTs;
    pFileInfo->closeTs = mtime;
    lastCloseTs = pFileInfo->closeTs;
  }

  return 0;
}

323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349
// Check that the file infos chain from vers.firstVer up to vers.lastVer without a gap.
// An empty file set counts as complete. On failure terrno is set to
// TSDB_CODE_WAL_LOG_INCOMPLETE and false is returned.
bool walLogEntriesComplete(const SWal* pWal) {
  const int32_t numFiles = taosArrayGetSize(pWal->fileInfoSet);
  int64_t       expectedVer = pWal->vers.firstVer;

  for (int32_t i = 0; i < numFiles; ++i) {
    SWalFileInfo* pInfo = taosArrayGet(pWal->fileInfoSet, i);
    if (pInfo->firstVer != expectedVer) {
      break;
    }
    // every file but the last must be followed by lastVer + 1
    const bool hasNext = (i + 1 < numFiles);
    expectedVer = hasNext ? pInfo->lastVer + 1 : pInfo->lastVer;
  }

  // empty is regarded as complete
  if (numFiles == 0 || expectedVer == pWal->vers.lastVer) {
    return true;
  }

  wError("vgId:%d, WAL log entries incomplete in range [%" PRId64 ", %" PRId64 "], aligned with snaphotVer:%" PRId64,
         pWal->cfg.vgId, pWal->vers.firstVer, pWal->vers.lastVer, pWal->vers.snapshotVer);
  terrno = TSDB_CODE_WAL_LOG_INCOMPLETE;
  return false;
}

350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378
// Truncate the idx file of the given file info so that it holds no more entries than
// the range [firstVer, lastVer] recorded in the file info.
//
// Returns 0 when nothing has to be trimmed or the truncation succeeded, -1 with terrno
// set when the idx file cannot be opened or truncated.
int walTrimIdxFile(SWal* pWal, int32_t fileIdx) {
  SWalFileInfo* pFileInfo = taosArrayGet(pWal->fileInfoSet, fileIdx);
  ASSERT(pFileInfo != NULL);
  char fnameStr[WAL_FILE_LEN];
  walBuildIdxName(pWal, pFileInfo->firstVer, fnameStr);

  // a failed stat leaves fileSize at 0, which falls into the "nothing to trim" branch below
  int64_t fileSize = 0;
  (void)taosStatFile(fnameStr, &fileSize, NULL);
  int64_t records = TMAX(0, pFileInfo->lastVer - pFileInfo->firstVer + 1);
  int64_t lastEndOffset = records * (int64_t)sizeof(SWalIdxEntry);

  if (fileSize <= lastEndOffset) {
    return 0;
  }

  TdFilePtr pFile = taosOpenFile(fnameStr, TD_FILE_READ | TD_FILE_WRITE);
  if (pFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  wInfo("vgId:%d, trim idx file. file: %s, size: %" PRId64 ", offset: %" PRId64, pWal->cfg.vgId, fnameStr, fileSize,
        lastEndOffset);

  int code = 0;
  if (taosFtruncateFile(pFile, lastEndOffset) < 0) {
    // report the failure instead of pretending that the file has been trimmed
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to truncate idx file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), fnameStr);
    code = -1;
  }
  taosCloseFile(&pFile);
  return code;
}

L
Liu Jicong 已提交
379 380 381 382
// Reconcile the in-memory WAL meta with the log files that actually exist in pWal->path.
//
// Steps: list the "<ver>.log" files, rebuild the file info set from them, rescan every log
// file whose recorded size or version range does not match the file on disk, recompute
// writeCur/totSize/firstVer/lastVer, align the versions with the snapshot version, repair
// missing file timestamps, save the meta when anything changed, and finally verify that the
// log entries form a complete range.
//
// Returns 0 on success and -1 on failure.
int walCheckAndRepairMeta(SWal* pWal) {
  // load log files, get first/snapshot/last version info
  const char* logPattern = "^[0-9]+.log$";
  regex_t     logRegPattern;

  if (regcomp(&logRegPattern, logPattern, REG_EXTENDED) != 0) {
    // the pattern is a constant, so a failure here presumably means resource exhaustion
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    wError("vgId:%d, failed to compile regex for wal log files", pWal->cfg.vgId);
    return -1;
  }

  TdDirPtr pDir = taosOpenDir(pWal->path);
  if (pDir == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, path:%s, failed to open since %s", pWal->cfg.vgId, pWal->path, strerror(errno));
    regfree(&logRegPattern);
    return -1;
  }

  SArray* actualLog = taosArrayInit(8, sizeof(SWalFileInfo));
  if (actualLog == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosCloseDir(&pDir);
    regfree(&logRegPattern);
    return -1;
  }

  // scan log files and build new meta
  TdDirEntryPtr pDirEntry;
  while ((pDirEntry = taosReadDir(pDir)) != NULL) {
    char* name = taosDirEntryBaseName(taosGetDirEntryName(pDirEntry));
    int   code = regexec(&logRegPattern, name, 0, NULL, 0);
    if (code == 0) {
      // every field starts as -1 ("unknown"); only firstVer is known from the file name
      SWalFileInfo fileInfo;
      memset(&fileInfo, -1, sizeof(SWalFileInfo));
      sscanf(name, "%" PRId64 ".log", &fileInfo.firstVer);
      taosArrayPush(actualLog, &fileInfo);
    }
  }

  taosCloseDir(&pDir);
  regfree(&logRegPattern);

  taosArraySort(actualLog, compareWalFileInfo);

  int     metaFileNum = taosArrayGetSize(pWal->fileInfoSet);
  int     actualFileNum = taosArrayGetSize(actualLog);
  int64_t totSize = 0;
  bool    updateMeta = (metaFileNum != actualFileNum);

  // rebuild meta of file info
  walRebuildFileInfoSet(pWal->fileInfoSet, actualLog);
  taosArrayDestroy(actualLog);

  int32_t sz = taosArrayGetSize(pWal->fileInfoSet);

  // scan and determine the lastVer
  int32_t fileIdx = sz;

  while (--fileIdx >= 0) {
    char          fnameStr[WAL_FILE_LEN];
    int64_t       fileSize = 0;
    SWalFileInfo* pFileInfo = taosArrayGet(pWal->fileInfoSet, fileIdx);

    walBuildLogName(pWal, pFileInfo->firstVer, fnameStr);
    int32_t code = taosStatFile(fnameStr, &fileSize, NULL);
    if (code < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("failed to stat file since %s. file:%s", terrstr(), fnameStr);
      return -1;
    }

    // meta agrees with the file on disk: nothing to repair for this file
    if (pFileInfo->lastVer >= pFileInfo->firstVer && fileSize == pFileInfo->fileSize) {
      totSize += pFileInfo->fileSize;
      continue;
    }
    updateMeta = true;

    (void)walTrimIdxFile(pWal, fileIdx);

    int64_t lastVer = walScanLogGetLastVer(pWal, fileIdx);
    if (lastVer < 0) {
      if (terrno != TSDB_CODE_WAL_LOG_NOT_EXIST) {
        wError("failed to scan wal last ver since %s", terrstr());
        return -1;
      }
      // empty log file
      lastVer = pFileInfo->firstVer - 1;
    }

    // update lastVer
    pFileInfo->lastVer = lastVer;
    totSize += pFileInfo->fileSize;
  }

  // reset vers info and so on
  actualFileNum = taosArrayGetSize(pWal->fileInfoSet);
  pWal->writeCur = actualFileNum - 1;
  pWal->totSize = totSize;
  pWal->vers.lastVer = -1;
  if (actualFileNum > 0) {
    pWal->vers.firstVer = ((SWalFileInfo*)taosArrayGet(pWal->fileInfoSet, 0))->firstVer;
    pWal->vers.lastVer = ((SWalFileInfo*)taosArrayGetLast(pWal->fileInfoSet))->lastVer;
  }
  (void)walAlignVersions(pWal);

  // repair ts of files
  if (walRepairLogFileTs(pWal, &updateMeta) < 0) {
    return -1;
  }

  // update meta file
  if (updateMeta) {
    (void)walSaveMeta(pWal);
  }

  if (!walLogEntriesComplete(pWal)) {
    return -1;
  }

  return 0;
}

// Read one SWalCkHead from pLogFile at the given offset into pCkHead and verify its
// header checksum. Returns 0 on success; on failure returns -1 with terrno set to the
// system error (seek/read) or TSDB_CODE_WAL_CHKSUM_MISMATCH (checksum).
int walReadLogHead(TdFilePtr pLogFile, int64_t offset, SWalCkHead* pCkHead) {
  bool ioOk = (taosLSeekFile(pLogFile, offset, SEEK_SET) >= 0);
  if (ioOk) {
    ioOk = (taosReadFile(pLogFile, pCkHead, sizeof(SWalCkHead)) == sizeof(SWalCkHead));
  }
  if (!ioOk) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  if (walValidHeadCksum(pCkHead) == 0) {
    return 0;
  }

  terrno = TSDB_CODE_WAL_CHKSUM_MISMATCH;
  return -1;
}

517
// Verify the idx file that belongs to the log file at fileIdx and rebuild it if needed.
//
// When the idx file size already equals (lastVer - firstVer + 1) entries nothing is done.
// Otherwise the idx file is scanned backwards for the last entry that (a) sits at the
// position its version implies and (b) points to a log entry head with the same version.
// Everything after that entry is truncated and the missing entries up to lastVer are
// regenerated by walking the log file. When no idx entry validates, the idx file is
// rebuilt from the beginning of the log file.
//
// Returns 0 on success, -1 with terrno set on failure.
int walCheckAndRepairIdxFile(SWal* pWal, int32_t fileIdx) {
  SWalFileInfo* pFileInfo = taosArrayGet(pWal->fileInfoSet, fileIdx);
  char          fnameStr[WAL_FILE_LEN];
  walBuildIdxName(pWal, pFileInfo->firstVer, fnameStr);
  char fLogNameStr[WAL_FILE_LEN];
  walBuildLogName(pWal, pFileInfo->firstVer, fLogNameStr);
  int64_t fileSize = 0;

  // signed copies of the sizes keep the offset arithmetic below free of
  // signed/unsigned conversions
  const int64_t idxEntrySz = (int64_t)sizeof(SWalIdxEntry);
  const int64_t ckHeadSz = (int64_t)sizeof(SWalCkHead);

  // a missing idx file is fine: fileSize stays 0 and the file is rebuilt below
  if (taosStatFile(fnameStr, &fileSize, NULL) < 0 && errno != ENOENT) {
    wError("vgId:%d, failed to stat file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), fnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  if (fileSize == (pFileInfo->lastVer - pFileInfo->firstVer + 1) * idxEntrySz) {
    return 0;
  }

  // start to repair
  int64_t   offset = fileSize - fileSize % idxEntrySz;
  TdFilePtr pLogFile = NULL;
  TdFilePtr pIdxFile = NULL;
  // sentinel "entry before the first one": the rebuild loop advances it to
  // ver = firstVer, offset = 0 on its first iteration
  SWalIdxEntry idxEntry = {.ver = pFileInfo->firstVer - 1, .offset = -ckHeadSz};
  SWalCkHead   ckHead;
  memset(&ckHead, 0, sizeof(ckHead));
  ckHead.head.version = idxEntry.ver;

  pIdxFile = taosOpenFile(fnameStr, TD_FILE_READ | TD_FILE_WRITE | TD_FILE_CREATE);
  if (pIdxFile == NULL) {
    wError("vgId:%d, failed to open file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), fnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  pLogFile = taosOpenFile(fLogNameStr, TD_FILE_READ);
  if (pLogFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, cannot open file %s, since %s", pWal->cfg.vgId, fLogNameStr, terrstr());
    goto _err;
  }

  // determine the last valid entry end, i.e. offset
  while ((offset -= idxEntrySz) >= 0) {
    // read into scratch copies so that a rejected entry cannot clobber the sentinel
    // (or the last accepted state) that the rebuild loop starts from
    SWalIdxEntry scanEntry;
    SWalCkHead   scanHead;

    if (taosLSeekFile(pIdxFile, offset, SEEK_SET) < 0) {
      wError("vgId:%d, failed to seek file due to %s. offset:%" PRId64 ", file:%s", pWal->cfg.vgId, strerror(errno),
             offset, fnameStr);
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    if (taosReadFile(pIdxFile, &scanEntry, sizeof(SWalIdxEntry)) != sizeof(SWalIdxEntry)) {
      wError("vgId:%d, failed to read file due to %s. offset:%" PRId64 ", file:%s", pWal->cfg.vgId, strerror(errno),
             offset, fnameStr);
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto _err;
    }

    if (scanEntry.ver > pFileInfo->lastVer) {
      continue;
    }

    // the entry stored at this offset must describe version firstVer + offset / entry size;
    // comparing versions avoids multiplying a possibly corrupt version number
    if (scanEntry.ver != pFileInfo->firstVer + offset / idxEntrySz) {
      continue;
    }

    if (walReadLogHead(pLogFile, scanEntry.offset, &scanHead) < 0) {
      wWarn("vgId:%d, failed to read log file since %s. file:%s, offset:%" PRId64 ", idx entry ver:%" PRId64 "",
            pWal->cfg.vgId, terrstr(), fLogNameStr, scanEntry.offset, scanEntry.ver);
      continue;
    }

    if (scanEntry.ver == scanHead.head.version) {
      idxEntry = scanEntry;
      ckHead = scanHead;
      break;
    }
  }
  offset += idxEntrySz;

  // at this point offset == (idxEntry.ver - pFileInfo->firstVer + 1) * idxEntrySz

  // ftruncate idx file
  if (offset < fileSize) {
    if (taosFtruncateFile(pIdxFile, offset) < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, failed to ftruncate file since %s. offset:%" PRId64 ", file:%s", pWal->cfg.vgId, terrstr(),
             offset, fnameStr);
      goto _err;
    }
  }

  // rebuild idx file
  if (taosLSeekFile(pIdxFile, 0, SEEK_END) < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to seek file since %s. offset:%" PRId64 ", file:%s", pWal->cfg.vgId, terrstr(), offset,
           fnameStr);
    goto _err;
  }

  int64_t count = 0;
  while (idxEntry.ver < pFileInfo->lastVer) {
    // the next log entry starts right behind the head and body of the current one
    idxEntry.ver += 1;
    idxEntry.offset += ckHeadSz + ckHead.head.bodyLen;

    if (walReadLogHead(pLogFile, idxEntry.offset, &ckHead) < 0) {
      wError("vgId:%d, failed to read wal log head since %s. index:%" PRId64 ", offset:%" PRId64 ", file:%s",
             pWal->cfg.vgId, terrstr(), idxEntry.ver, idxEntry.offset, fLogNameStr);
      goto _err;
    }
    if (taosWriteFile(pIdxFile, &idxEntry, sizeof(SWalIdxEntry)) < 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      wError("vgId:%d, failed to append file since %s. file:%s", pWal->cfg.vgId, terrstr(), fnameStr);
      goto _err;
    }
    count++;
  }

  if (taosFsyncFile(pIdxFile) < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, faild to fsync file since %s. file:%s", pWal->cfg.vgId, terrstr(), fnameStr);
    goto _err;
  }

  if (count > 0) {
    wInfo("vgId:%d, rebuilt %" PRId64 " wal idx entries until lastVer: %" PRId64, pWal->cfg.vgId, count,
          pFileInfo->lastVer);
  }

  (void)taosCloseFile(&pLogFile);
  (void)taosCloseFile(&pIdxFile);
  return 0;

_err:
  (void)taosCloseFile(&pLogFile);
  (void)taosCloseFile(&pIdxFile);
  return -1;
}

// Run walCheckAndRepairIdxFile on every file info, from the last one down to the first.
// Stops at the first failure and returns -1; returns 0 when every idx file is fine.
int walCheckAndRepairIdx(SWal* pWal) {
  int32_t numFiles = taosArrayGetSize(pWal->fileInfoSet);

  for (int32_t idx = numFiles - 1; idx >= 0; --idx) {
    if (walCheckAndRepairIdxFile(pWal, idx) >= 0) {
      continue;
    }
    wError("vgId:%d, failed to repair idx file since %s. fileIdx:%d", pWal->cfg.vgId, terrstr(), idx);
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
668 669 670 671
// Close the current (last) file info and append a fresh one for the next log file.
//
// The last existing file info, if any, gets lastVer = vers.lastVer and closeTs = now. The new
// file info starts at vers.lastVer + 1 with lastVer = -1, closeTs = -1 and size 0.
//
// Returns 0 on success, -1 with terrno = TSDB_CODE_OUT_OF_MEMORY when the new entry cannot
// be appended.
int walRollFileInfo(SWal* pWal) {
  int64_t ts = taosGetTimestampSec();

  SArray* pArray = pWal->fileInfoSet;
  if (taosArrayGetSize(pArray) != 0) {
    SWalFileInfo* pInfo = taosArrayGetLast(pArray);
    pInfo->lastVer = pWal->vers.lastVer;
    pInfo->closeTs = ts;
  }

  // the array stores a copy of the element, so a zero-initialized stack object is enough
  SWalFileInfo newInfo = {0};
  newInfo.firstVer = pWal->vers.lastVer + 1;
  newInfo.lastVer = -1;
  newInfo.createTs = ts;
  newInfo.closeTs = -1;
  newInfo.fileSize = 0;
  newInfo.syncedOffset = 0;

  if (taosArrayPush(pArray, &newInfo) == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  return 0;
}

695
// Serialize the WAL meta into a JSON text of the form
//   { "meta": {firstVer, snapshotVer, commitVer, lastVer}, "files": [ {firstVer, lastVer,
//     createTs, closeTs, fileSize}, ... ] }
// All numbers are written as strings.
//
// Returns the text produced by cJSON_Print (owned by the caller), or NULL with
// terrno = TSDB_CODE_OUT_OF_MEMORY when a JSON node or the output text cannot be created.
char* walMetaSerialize(SWal* pWal) {
  char   buf[30];  // large enough for any int64_t in decimal plus the terminator
  int    sz = taosArrayGetSize(pWal->fileInfoSet);
  cJSON* pRoot = cJSON_CreateObject();
  cJSON* pMeta = cJSON_CreateObject();
  cJSON* pFiles = cJSON_CreateArray();
  cJSON* pField;
  if (pRoot == NULL || pMeta == NULL || pFiles == NULL) {
    // nothing is linked together yet, so each node is released on its own
    if (pRoot) {
      cJSON_Delete(pRoot);
    }
    if (pMeta) {
      cJSON_Delete(pMeta);
    }
    if (pFiles) {
      cJSON_Delete(pFiles);
    }
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  cJSON_AddItemToObject(pRoot, "meta", pMeta);
  snprintf(buf, sizeof(buf), "%" PRId64, pWal->vers.firstVer);
  cJSON_AddStringToObject(pMeta, "firstVer", buf);
  snprintf(buf, sizeof(buf), "%" PRId64, pWal->vers.snapshotVer);
  cJSON_AddStringToObject(pMeta, "snapshotVer", buf);
  snprintf(buf, sizeof(buf), "%" PRId64, pWal->vers.commitVer);
  cJSON_AddStringToObject(pMeta, "commitVer", buf);
  snprintf(buf, sizeof(buf), "%" PRId64, pWal->vers.lastVer);
  cJSON_AddStringToObject(pMeta, "lastVer", buf);

  cJSON_AddItemToObject(pRoot, "files", pFiles);
  SWalFileInfo* pData = pWal->fileInfoSet->pData;
  for (int i = 0; i < sz; i++) {
    SWalFileInfo* pInfo = &pData[i];
    pField = cJSON_CreateObject();
    if (pField == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      cJSON_Delete(pRoot);
      return NULL;
    }
    cJSON_AddItemToArray(pFiles, pField);
    // cjson only support int32_t or double
    // string are used to prohibit the loss of precision
    snprintf(buf, sizeof(buf), "%" PRId64, pInfo->firstVer);
    cJSON_AddStringToObject(pField, "firstVer", buf);
    snprintf(buf, sizeof(buf), "%" PRId64, pInfo->lastVer);
    cJSON_AddStringToObject(pField, "lastVer", buf);
    snprintf(buf, sizeof(buf), "%" PRId64, pInfo->createTs);
    cJSON_AddStringToObject(pField, "createTs", buf);
    snprintf(buf, sizeof(buf), "%" PRId64, pInfo->closeTs);
    cJSON_AddStringToObject(pField, "closeTs", buf);
    snprintf(buf, sizeof(buf), "%" PRId64, pInfo->fileSize);
    cJSON_AddStringToObject(pField, "fileSize", buf);
  }
  char* serialized = cJSON_Print(pRoot);
  if (serialized == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
  }
  cJSON_Delete(pRoot);
  return serialized;
}

752
int walMetaDeserialize(SWal* pWal, const char* bytes) {
L
Liu Jicong 已提交
753
  /*A(taosArrayGetSize(pWal->fileInfoSet) == 0);*/
754 755
  cJSON *pRoot, *pMeta, *pFiles, *pInfoJson, *pField;
  pRoot = cJSON_Parse(bytes);
756
  if (!pRoot) goto _err;
757
  pMeta = cJSON_GetObjectItem(pRoot, "meta");
758
  if (!pMeta) goto _err;
759
  pField = cJSON_GetObjectItem(pMeta, "firstVer");
760
  if (!pField) goto _err;
L
Liu Jicong 已提交
761
  pWal->vers.firstVer = atoll(cJSON_GetStringValue(pField));
762
  pField = cJSON_GetObjectItem(pMeta, "snapshotVer");
763
  if (!pField) goto _err;
L
Liu Jicong 已提交
764
  pWal->vers.snapshotVer = atoll(cJSON_GetStringValue(pField));
765
  pField = cJSON_GetObjectItem(pMeta, "commitVer");
766
  if (!pField) goto _err;
L
Liu Jicong 已提交
767
  pWal->vers.commitVer = atoll(cJSON_GetStringValue(pField));
768
  pField = cJSON_GetObjectItem(pMeta, "lastVer");
769
  if (!pField) goto _err;
L
Liu Jicong 已提交
770
  pWal->vers.lastVer = atoll(cJSON_GetStringValue(pField));
771 772 773

  pFiles = cJSON_GetObjectItem(pRoot, "files");
  int sz = cJSON_GetArraySize(pFiles);
L
Liu Jicong 已提交
774
  // deserialize
L
Liu Jicong 已提交
775 776
  SArray* pArray = pWal->fileInfoSet;
  taosArrayEnsureCap(pArray, sz);
777

L
Liu Jicong 已提交
778
  for (int i = 0; i < sz; i++) {
779
    pInfoJson = cJSON_GetArrayItem(pFiles, i);
780
    if (!pInfoJson) goto _err;
781 782 783

    SWalFileInfo info = {0};

L
Liu Jicong 已提交
784
    pField = cJSON_GetObjectItem(pInfoJson, "firstVer");
785
    if (!pField) goto _err;
786
    info.firstVer = atoll(cJSON_GetStringValue(pField));
L
Liu Jicong 已提交
787
    pField = cJSON_GetObjectItem(pInfoJson, "lastVer");
788
    if (!pField) goto _err;
789
    info.lastVer = atoll(cJSON_GetStringValue(pField));
L
Liu Jicong 已提交
790
    pField = cJSON_GetObjectItem(pInfoJson, "createTs");
791
    if (!pField) goto _err;
792
    info.createTs = atoll(cJSON_GetStringValue(pField));
L
Liu Jicong 已提交
793
    pField = cJSON_GetObjectItem(pInfoJson, "closeTs");
794
    if (!pField) goto _err;
795
    info.closeTs = atoll(cJSON_GetStringValue(pField));
L
Liu Jicong 已提交
796
    pField = cJSON_GetObjectItem(pInfoJson, "fileSize");
797
    if (!pField) goto _err;
798 799
    info.fileSize = atoll(cJSON_GetStringValue(pField));
    taosArrayPush(pArray, &info);
L
Liu Jicong 已提交
800
  }
801
  pWal->fileInfoSet = pArray;
L
Liu Jicong 已提交
802
  pWal->writeCur = sz - 1;
L
Liu Jicong 已提交
803
  cJSON_Delete(pRoot);
804
  return 0;
805 806 807 808

_err:
  cJSON_Delete(pRoot);
  return -1;
L
Liu Jicong 已提交
809 810 811
}

// Scan the WAL directory for an entry named "meta-ver<N>" and return <N>.
//
// The scan stops at the first matching entry that taosReadDir yields, so when
// more than one meta file is present the first one encountered wins.
//
// Returns the parsed version, or -1 when the pattern cannot be compiled, the
// directory cannot be opened, or no entry matches.
static int walFindCurMetaVer(SWal* pWal) {
  const char* pattern = "^meta-ver[0-9]+$";
  regex_t     walMetaRegexPattern;
  if (regcomp(&walMetaRegexPattern, pattern, REG_EXTENDED) != 0) {
    // nothing to regfree here: a failed regcomp leaves the pattern unusable
    wError("vgId:%d, failed to compile wal meta pattern:%s", pWal->cfg.vgId, pattern);
    return -1;
  }

  TdDirPtr pDir = taosOpenDir(pWal->path);
  if (pDir == NULL) {
    wError("vgId:%d, path:%s, failed to open since %s", pWal->cfg.vgId, pWal->path, strerror(errno));
    // release the compiled pattern on this early exit as well
    regfree(&walMetaRegexPattern);
    return -1;
  }

  TdDirEntryPtr pDirEntry;

  // find existing meta-ver[x].json
  int metaVer = -1;
  while ((pDirEntry = taosReadDir(pDir)) != NULL) {
    char* name = taosDirEntryBaseName(taosGetDirEntryName(pDirEntry));
    int   code = regexec(&walMetaRegexPattern, name, 0, NULL, 0);
    if (code == 0) {
      sscanf(name, "meta-ver%d", &metaVer);
      wDebug("vgId:%d, wal find current meta: %s is the meta file, ver %d", pWal->cfg.vgId, name, metaVer);
      break;
    }
    wDebug("vgId:%d, wal find current meta: %s is not meta file", pWal->cfg.vgId, name);
  }
  taosCloseDir(&pDir);
  regfree(&walMetaRegexPattern);
  return metaVer;
}

841 842 843 844 845 846
// Record the current file's size as its synced offset.
// Does nothing when walGetCurFileInfo returns NULL.
void walUpdateSyncedOffset(SWal* pWal) {
  SWalFileInfo* pCur = walGetCurFileInfo(pWal);
  if (pCur != NULL) {
    pCur->syncedOffset = pCur->fileSize;
  }
}

L
Liu Jicong 已提交
847
// Persist the WAL meta as a new "meta-ver<N+1>" file and remove the previous one.
//
// Steps: fsync the idx and log files, refresh the synced offset of the current
// file info, write the serialized meta into a temporary file, fsync and close
// it, rename it to the next meta version, and finally remove the old meta file.
//
// Returns 0 on success and -1 on failure. terrno is set for failures coming
// from file operations and for a failed serialization; the "name too long"
// exits return -1 without touching terrno.
int walSaveMeta(SWal* pWal) {
  int  metaVer = walFindCurMetaVer(pWal);
  char fnameStr[WAL_FILE_LEN];
  char tmpFnameStr[WAL_FILE_LEN];
  int  n;

  // fsync the idx and log file at first to ensure validity of meta
  if (taosFsyncFile(pWal->pIdxFile) < 0) {
    wError("vgId:%d, failed to sync idx file due to %s", pWal->cfg.vgId, strerror(errno));
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  if (taosFsyncFile(pWal->pLogFile) < 0) {
    wError("vgId:%d, failed to sync log file due to %s", pWal->cfg.vgId, strerror(errno));
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  // update synced offset
  (void)walUpdateSyncedOffset(pWal);

  // flush to a tmpfile
  n = walBuildTmpMetaName(pWal, tmpFnameStr);
  if (n >= sizeof(tmpFnameStr)) {
    return -1;
  }

  TdFilePtr pMetaFile = taosOpenFile(tmpFnameStr, TD_FILE_CREATE | TD_FILE_WRITE | TD_FILE_TRUNC);
  if (pMetaFile == NULL) {
    wError("vgId:%d, failed to open file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), tmpFnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }

  char* serialized = walMetaSerialize(pWal);
  if (serialized == NULL) {
    // strlen(NULL) is undefined behaviour, so stop before touching the buffer.
    // NOTE(review): assumes a NULL result means allocation failure - confirm
    // against walMetaSerialize.
    wError("vgId:%d, failed to serialize wal meta. file:%s", pWal->cfg.vgId, tmpFnameStr);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosCloseFile(&pMetaFile);
    return -1;
  }

  int len = strlen(serialized);
  if (len != taosWriteFile(pMetaFile, serialized, len)) {
    wError("vgId:%d, failed to write file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), tmpFnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  if (taosFsyncFile(pMetaFile) < 0) {
    wError("vgId:%d, failed to sync file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), tmpFnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  if (taosCloseFile(&pMetaFile) < 0) {
    wError("vgId:%d, failed to close file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), tmpFnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // rename it
  n = walBuildMetaName(pWal, metaVer + 1, fnameStr);
  if (n >= sizeof(fnameStr)) {
    goto _err;
  }

  if (taosRenameFile(tmpFnameStr, fnameStr) < 0) {
    wError("failed to rename file due to %s. dest:%s", strerror(errno), fnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _err;
  }

  // delete old file
  if (metaVer > -1) {
    walBuildMetaName(pWal, metaVer, fnameStr);
    taosRemoveFile(fnameStr);
  }
  taosMemoryFree(serialized);
  return 0;

_err:
  taosCloseFile(&pMetaFile);
  taosMemoryFree(serialized);
  return -1;
}

L
Liu Jicong 已提交
928
// Load the WAL meta from the meta file found by walFindCurMetaVer.
//
// The file is read fully into a zero-filled buffer and handed to
// walMetaDeserialize. A meta file whose size is reported as 0 is removed.
//
// Returns the result of walMetaDeserialize on the normal path, and -1 when no
// meta file is found, the file cannot be stat'ed, is empty, cannot be opened
// or read, or the buffer cannot be allocated.
int walLoadMeta(SWal* pWal) {
  // find existing meta file
  int metaVer = walFindCurMetaVer(pWal);
  if (metaVer == -1) {
    wDebug("vgId:%d, wal find meta ver %d", pWal->cfg.vgId, metaVer);
    return -1;
  }
  char fnameStr[WAL_FILE_LEN];
  walBuildMetaName(pWal, metaVer, fnameStr);

  // read metafile
  int64_t fileSize = 0;
  // A failed stat must not be mistaken for an empty file: fileSize would stay 0
  // and the meta file would be deleted below.
  // NOTE(review): assumes taosStatFile returns 0 on success - confirm.
  if (taosStatFile(fnameStr, &fileSize, NULL) != 0) {
    wError("vgId:%d, failed to stat file due to %s. file:%s", pWal->cfg.vgId, strerror(errno), fnameStr);
    terrno = TAOS_SYSTEM_ERROR(errno);
    return -1;
  }
  if (fileSize == 0) {
    (void)taosRemoveFile(fnameStr);
    wDebug("vgId:%d, wal find empty meta ver %d", pWal->cfg.vgId, metaVer);
    return -1;
  }

  int   size = (int)fileSize;
  char* buf = taosMemoryMalloc(size + 5);
  if (buf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  // zero-fill so the bytes read from the file are followed by NUL bytes
  memset(buf, 0, size + 5);

  TdFilePtr pFile = taosOpenFile(fnameStr, TD_FILE_READ);
  if (pFile == NULL) {
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    taosMemoryFree(buf);
    return -1;
  }
  if (taosReadFile(pFile, buf, size) != size) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    taosCloseFile(&pFile);
    taosMemoryFree(buf);
    return -1;
  }

  // load into fileInfoSet
  int code = walMetaDeserialize(pWal, buf);
  if (code < 0) {
    wError("failed to deserialize wal meta. file:%s", fnameStr);
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
  }
  taosCloseFile(&pFile);
  taosMemoryFree(buf);
  return code;
}
974 975 976 977 978 979

// Remove the meta file located by walFindCurMetaVer.
// Returns 0 when no meta file is found, otherwise the result of taosRemoveFile.
int walRemoveMeta(SWal* pWal) {
  int curVer = walFindCurMetaVer(pWal);

  if (curVer != -1) {
    char metaPath[WAL_FILE_LEN];
    walBuildMetaName(pWal, curVer, metaPath);
    return taosRemoveFile(metaPath);
  }
  return 0;
}