walWrite.c 20.2 KB
Newer Older
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "os.h"
S
Shengliang Guan 已提交
17
#include "taoserror.h"
18
#include "tchecksum.h"
19
#include "tglobal.h"
S
Shengliang Guan 已提交
20
#include "walInt.h"
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
21

22 23 24
/*
 * Drop every WAL segment and restart the log immediately after `ver`.
 *
 * The whole operation runs under pWal->mutex. It is refused (-1) when any
 * entry in pWal->pRefHash carries a refVer that is set (!= -1) and <= ver.
 * Otherwise the open log/idx handles are closed, every log and idx file listed
 * in fileInfoSet is removed, the meta is removed, and the in-memory version
 * counters are reset around `ver`.
 *
 * Returns 0 on success; -1 if a reference blocks the restore or a file cannot
 * be removed (terrno is set from errno in the latter case).
 */
int32_t walRestoreFromSnapshot(SWal *pWal, int64_t ver) {
  int32_t ret = -1;

  taosThreadMutexLock(&pWal->mutex);

  wInfo("vgId:%d, restore from snapshot, version %" PRId64, pWal->cfg.vgId, ver);

  // any live reference at or below `ver` blocks the restore
  for (void *it = taosHashIterate(pWal->pRefHash, NULL); it != NULL; it = taosHashIterate(pWal->pRefHash, it)) {
    SWalRef *ref = *(SWalRef **)it;
    if (ref->refVer != -1 && ref->refVer <= ver) {
      // leaving the iteration early, so it has to be cancelled explicitly
      taosHashCancelIterate(pWal->pRefHash, it);
      goto _out;
    }
  }

  taosCloseFile(&pWal->pLogFile);
  taosCloseFile(&pWal->pIdxFile);

  if (pWal->vers.firstVer != -1) {
    char    path[WAL_FILE_LEN];
    int32_t nFiles = taosArrayGetSize(pWal->fileInfoSet);

    for (int32_t idx = 0; idx < nFiles; ++idx) {
      SWalFileInfo *info = taosArrayGet(pWal->fileInfoSet, idx);

      // log file of this segment
      walBuildLogName(pWal, info->firstVer, path);
      if (taosRemoveFile(path) < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
        wError("vgId:%d, restore from snapshot, cannot remove file %s since %s", pWal->cfg.vgId, path, terrstr());
        goto _out;
      }
      wInfo("vgId:%d, restore from snapshot, remove file %s", pWal->cfg.vgId, path);

      // matching idx file
      walBuildIdxName(pWal, info->firstVer, path);
      if (taosRemoveFile(path) < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
        wError("vgId:%d, cannot remove file %s since %s", pWal->cfg.vgId, path, terrstr());
        goto _out;
      }
      wInfo("vgId:%d, restore from snapshot, remove file %s", pWal->cfg.vgId, path);
    }
  }

  // result intentionally ignored
  (void)walRemoveMeta(pWal);

  // reset in-memory state: the log is now empty and starts at ver + 1
  taosArrayClear(pWal->fileInfoSet);
  pWal->writeCur = -1;
  pWal->totSize = 0;
  pWal->lastRollSeq = -1;

  pWal->vers.firstVer = ver + 1;
  pWal->vers.lastVer = ver;
  pWal->vers.commitVer = ver;
  pWal->vers.snapshotVer = ver;
  pWal->vers.verInSnapshotting = -1;

  ret = 0;

_out:
  taosThreadMutexUnlock(&pWal->mutex);
  return ret;
}

L
Liu Jicong 已提交
83 84 85 86 87 88
/*
 * Record `ver` as the applied version of the WAL.
 *
 * No validation is performed and pWal->mutex is not taken here.
 * Always returns 0.
 */
int32_t walApplyVer(SWal *pWal, int64_t ver) {
  // TODO: error check
  pWal->vers.appliedVer = ver;

  return 0;
}

L
Liu Jicong 已提交
89
/*
 * Advance the commit version to `ver`.
 *
 * - ver below the current commitVer: nothing to do, returns 0.
 * - ver beyond lastVer, or commitVer currently behind snapshotVer:
 *   terrno = TSDB_CODE_WAL_INVALID_VER, returns -1.
 * - otherwise commitVer is set to ver and 0 is returned.
 *
 * pWal->mutex is not taken here.
 */
int32_t walCommit(SWal *pWal, int64_t ver) {
  if (ver >= pWal->vers.commitVer) {
    bool beyondLast = ver > pWal->vers.lastVer;
    bool behindSnapshot = pWal->vers.commitVer < pWal->vers.snapshotVer;

    if (beyondLast || behindSnapshot) {
      terrno = TSDB_CODE_WAL_INVALID_VER;
      return -1;
    }

    pWal->vers.commitVer = ver;
  }

  return 0;
}

/*
 * Roll the WAL back so that entry `ver` and everything after it is discarded;
 * on success lastVer becomes ver - 1.
 *
 * `ver` must satisfy commitVer < ver, snapshotVer < ver and ver <= lastVer,
 * otherwise terrno = TSDB_CODE_WAL_INVALID_VER and -1 is returned.
 *
 * Steps (all under pWal->mutex):
 *   1. If `ver` lies before the last file, switch the write position via
 *      walChangeWrite() and remove every file after the new write file.
 *   2. Read the idx entry for `ver` from the current idx file and check that
 *      the log record at that offset has a valid head checksum and the
 *      expected version.
 *   3. Truncate the log file at that record and the idx file at that entry,
 *      update the in-memory file info, and persist the meta.
 *
 * The temporary idx/log handles opened here are closed on every exit path.
 *
 * Returns 0 on success, -1 on failure.
 */
int32_t walRollback(SWal *pWal, int64_t ver) {
  int32_t      ret = -1;
  int64_t      code;
  int64_t      idxOff;
  int64_t      size;
  char         fnameStr[WAL_FILE_LEN];
  TdFilePtr    pIdxFile = NULL;
  TdFilePtr    pLogFile = NULL;
  SWalIdxEntry entry;
  SWalCkHead   head;

  taosThreadMutexLock(&pWal->mutex);
  wInfo("vgId:%d, wal rollback for version %" PRId64, pWal->cfg.vgId, ver);

  if (ver > pWal->vers.lastVer || ver <= pWal->vers.commitVer || ver <= pWal->vers.snapshotVer) {
    terrno = TSDB_CODE_WAL_INVALID_VER;
    goto _exit;
  }

  // find correct file
  if (ver < walGetLastFileFirstVer(pWal)) {
    // change current files
    code = walChangeWrite(pWal, ver);
    if (code < 0) {
      goto _exit;
    }

    // delete files in descending order
    int fileSetSize = taosArrayGetSize(pWal->fileInfoSet);
    for (int i = pWal->writeCur + 1; i < fileSetSize; i++) {
      SWalFileInfo *pInfo = taosArrayPop(pWal->fileInfoSet);

      walBuildLogName(pWal, pInfo->firstVer, fnameStr);
      wDebug("vgId:%d, wal remove file %s for rollback", pWal->cfg.vgId, fnameStr);
      taosRemoveFile(fnameStr);
      walBuildIdxName(pWal, pInfo->firstVer, fnameStr);
      wDebug("vgId:%d, wal remove file %s for rollback", pWal->cfg.vgId, fnameStr);
      taosRemoveFile(fnameStr);
    }
  }

  walBuildIdxName(pWal, walGetCurFileFirstVer(pWal), fnameStr);
  pIdxFile = taosOpenFile(fnameStr, TD_FILE_WRITE | TD_FILE_READ | TD_FILE_APPEND);
  if (pIdxFile == NULL) {
    // report the cause the same way the log-file open below does
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _exit;
  }

  idxOff = walGetVerIdxOffset(pWal, ver);
  code = taosLSeekFile(pIdxFile, idxOff, SEEK_SET);
  if (code < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _exit;
  }

  // read idx file and get log file pos
  if (taosReadFile(pIdxFile, &entry, sizeof(SWalIdxEntry)) != sizeof(SWalIdxEntry)) {
    // NOTE(review): terrno is left untouched here, as in the original code
    goto _exit;
  }

  walBuildLogName(pWal, walGetCurFileFirstVer(pWal), fnameStr);
  pLogFile = taosOpenFile(fnameStr, TD_FILE_WRITE | TD_FILE_READ | TD_FILE_APPEND);
  wDebug("vgId:%d, wal truncate file %s", pWal->cfg.vgId, fnameStr);
  if (pLogFile == NULL) {
    // TODO
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _exit;
  }

  code = taosLSeekFile(pLogFile, entry.offset, SEEK_SET);
  if (code < 0) {
    // TODO
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _exit;
  }

  // validate offset: the record found there must be intact and be version `ver`
  size = taosReadFile(pLogFile, &head, sizeof(SWalCkHead));
  if (size != sizeof(SWalCkHead)) {
    // NOTE(review): terrno is left untouched here, as in the original code
    goto _exit;
  }

  code = walValidHeadCksum(&head);
  if (code != 0) {
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _exit;
  }
  if (head.head.version != ver) {
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    goto _exit;
  }

  // truncate old files
  code = taosFtruncateFile(pLogFile, entry.offset);
  if (code < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _exit;
  }
  code = taosFtruncateFile(pIdxFile, idxOff);
  if (code < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto _exit;
  }

  pWal->vers.lastVer = ver - 1;
  ((SWalFileInfo *)taosArrayGetLast(pWal->fileInfoSet))->lastVer = ver - 1;
  ((SWalFileInfo *)taosArrayGetLast(pWal->fileInfoSet))->fileSize = entry.offset;

  // close before saving the meta (same order as before); clear the locals so
  // the cleanup below does not close them a second time
  taosCloseFile(&pIdxFile);
  pIdxFile = NULL;
  taosCloseFile(&pLogFile);
  pLogFile = NULL;

  code = walSaveMeta(pWal);
  if (code < 0) {
    wError("vgId:%d, failed to save meta since %s", pWal->cfg.vgId, terrstr());
    goto _exit;
  }

  ret = 0;

_exit:
  // release whatever is still open, then unlock
  if (pIdxFile != NULL) {
    taosCloseFile(&pIdxFile);
  }
  if (pLogFile != NULL) {
    taosCloseFile(&pLogFile);
  }
  taosThreadMutexUnlock(&pWal->mutex);
  return ret;
}
L
Liu Jicong 已提交
221

L
Liu Jicong 已提交
222 223 224 225 226
/*
 * Roll to a new WAL file when needed, then persist the meta if the cached
 * size of the last file exceeds tsWalFsyncDataSizeLimit.
 *
 * A roll happens when:
 *   - there is no file at all (the function returns right after that roll), or
 *   - rollPeriod is enabled (neither -1 nor 0) and more than rollPeriod has
 *     passed since lastRollSeq, or
 *   - otherwise, segSize is enabled (neither -1 nor 0) and the last file is
 *     larger than segSize.
 *
 * Returns 0 on success, -1 if rolling or saving the meta fails.
 */
static FORCE_INLINE int32_t walCheckAndRoll(SWal *pWal) {
  // very first write: just create the first file
  if (taosArrayGetSize(pWal->fileInfoSet) == 0) {
    return (walRollImpl(pWal) < 0) ? -1 : 0;
  }

  int64_t elapsed = walGetSeq() - pWal->lastRollSeq;

  bool periodExpired = pWal->cfg.rollPeriod != -1 && pWal->cfg.rollPeriod != 0 && elapsed > pWal->cfg.rollPeriod;
  // the size criterion is only evaluated when the period criterion did not fire
  bool sizeExceeded = !periodExpired && pWal->cfg.segSize != -1 && pWal->cfg.segSize != 0 &&
                      walGetLastFileSize(pWal) > pWal->cfg.segSize;

  if (periodExpired || sizeExceeded) {
    if (walRollImpl(pWal) < 0) {
      return -1;
    }
  }

  if (walGetLastFileCachedSize(pWal) > tsWalFsyncDataSizeLimit && walSaveMeta(pWal) < 0) {
    return -1;
  }

  return 0;
}

250
/*
 * Mark the start of a snapshot at version `ver`.
 *
 * Stores `ver` in vers.verInSnapshotting and `logRetention` (asserted to be
 * >= 0) in vers.logRetention, then rolls to a fresh file when the last file
 * is not empty. Runs under pWal->mutex.
 *
 * Returns 0 on success, -1 if rolling fails.
 */
int32_t walBeginSnapshot(SWal *pWal, int64_t ver, int64_t logRetention) {
  int32_t ret = 0;

  taosThreadMutexLock(&pWal->mutex);
  ASSERT(logRetention >= 0);

  pWal->vers.verInSnapshotting = ver;
  pWal->vers.logRetention = logRetention;

  wDebug("vgId:%d, wal begin snapshot for version %" PRId64 ", log retention %" PRId64 " first ver %" PRId64
         ", last ver %" PRId64,
         pWal->cfg.vgId, ver, pWal->vers.logRetention, pWal->vers.firstVer, pWal->vers.lastVer);

  // check file rolling: only a non-empty last file is rolled
  if (walGetLastFileSize(pWal) != 0 && walRollImpl(pWal) < 0) {
    wError("vgId:%d, failed to roll wal files since %s", pWal->cfg.vgId, terrstr());
    ret = -1;
  }

  taosThreadMutexUnlock(&pWal->mutex);
  return ret;
}

L
Liu Jicong 已提交
275
/*
 * Finish the snapshot started by walBeginSnapshot() and drop WAL files that
 * are no longer needed.
 *
 * Under pWal->mutex:
 *   1. Fails with -1 when no snapshot is in progress (verInSnapshotting == -1).
 *   2. Publishes snapshotVer, then computes the highest version that may be
 *      removed: the snapshot version minus logRetention, not below
 *      firstVer - 1, and - when retentionPeriod == 0 and at least one
 *      reference is set - not at or beyond the smallest referenced version.
 *   3. Walks the files in front of the one containing that version and queues
 *      those that satisfy the size/time retention rules into toDeleteFiles.
 *   4. Pops the queued count from the front of fileInfoSet, updates
 *      firstVer / writeCur / totSize, and saves the meta.
 *   5. Removes the queued log and idx files from disk (ENOENT is tolerated).
 *
 * Returns the result of walSaveMeta() (or -1 for step 1). A failure while
 * removing files in step 5 is logged and ends the function, but the value
 * returned is still the walSaveMeta() result; toDeleteFiles is not cleared in
 * that case.
 */
int32_t walEndSnapshot(SWal *pWal) {
  int32_t code = 0;
  taosThreadMutexLock(&pWal->mutex);
  int64_t ver = pWal->vers.verInSnapshotting;

  wDebug("vgId:%d, wal end snapshot for version %" PRId64 ", log retention %" PRId64 " first ver %" PRId64
         ", last ver %" PRId64,
         pWal->cfg.vgId, ver, pWal->vers.logRetention, pWal->vers.firstVer, pWal->vers.lastVer);

  if (ver == -1) {
    code = -1;
    goto END;
  }

  pWal->vers.snapshotVer = ver;
  int ts = taosGetTimestampSec();

  ver = TMAX(ver - pWal->vers.logRetention, pWal->vers.firstVer - 1);

  // find the smallest version still referenced (refVer == -1 means "not set")
  bool    hasTopic = false;
  int64_t refVer = ver;
  void   *pIter = NULL;
  while (1) {
    pIter = taosHashIterate(pWal->pRefHash, pIter);
    if (pIter == NULL) break;
    SWalRef *pRef = *(SWalRef **)pIter;
    if (pRef->refVer == -1) continue;
    refVer = TMIN(refVer, pRef->refVer - 1);
    wDebug("vgId:%d, wal found ref %" PRId64 ", refId %" PRId64, pWal->cfg.vgId, pRef->refVer, pRef->refId);
    hasTopic = true;
  }
  // compatible mode
  if (pWal->cfg.retentionPeriod == 0 && hasTopic) {
    ver = TMIN(ver, refVer);
  }

  int          deleteCnt = 0;
  int64_t      newTotSize = pWal->totSize;
  SWalFileInfo tmp = {.firstVer = ver};
  // find files safe to delete
  SWalFileInfo *pInfo = taosArraySearch(pWal->fileInfoSet, &tmp, compareWalFileInfo, TD_LE);
  if (pInfo) {
    SWalFileInfo *pLastFileInfo = taosArrayGetLast(pWal->fileInfoSet);
    wDebug("vgId:%d, wal search found file info: first:%" PRId64 " last:%" PRId64, pWal->cfg.vgId, pInfo->firstVer,
           pInfo->lastVer);
    if (ver >= pInfo->lastVer) {
      // the found file is fully covered, so it may be removed as well
      pInfo++;
      // pInfo may now point one past the last element; only read it when it is
      // still inside the array
      if (pInfo <= pLastFileInfo) {
        wDebug("vgId:%d, wal remove advance one file: first:%" PRId64 " last:%" PRId64, pWal->cfg.vgId,
               pInfo->firstVer, pInfo->lastVer);
      }
    }
    if (pInfo <= pLastFileInfo) {
      wDebug("vgId:%d, wal end remove for first:%" PRId64 " last:%" PRId64, pWal->cfg.vgId, pInfo->firstVer,
             pInfo->lastVer);
    } else {
      wDebug("vgId:%d, wal no remove", pWal->cfg.vgId);
    }

    // iterate files, until the searched result
    // NOTE(review): deleteCnt is later popped from the FRONT of fileInfoSet, which
    // presumes the files passing the check form a prefix - confirm that a file
    // with closeTs == -1 can never sit in front of one that passes.
    for (SWalFileInfo *iter = pWal->fileInfoSet->pData; iter < pInfo; iter++) {
      wDebug("vgId:%d, wal check remove file %" PRId64 "(file size %" PRId64 " close ts %" PRId64
             "), new tot size %" PRId64,
             pWal->cfg.vgId, iter->firstVer, iter->fileSize, iter->closeTs, newTotSize);
      if ((pWal->cfg.retentionSize != -1 && pWal->cfg.retentionSize != 0 && newTotSize > pWal->cfg.retentionSize) ||
          ((pWal->cfg.retentionPeriod == 0) || (pWal->cfg.retentionPeriod != -1 && iter->closeTs != -1 &&
                                                iter->closeTs + pWal->cfg.retentionPeriod < ts))) {
        // delete according to file size or close time
        wDebug("vgId:%d, check pass", pWal->cfg.vgId);
        deleteCnt++;
        newTotSize -= iter->fileSize;
        taosArrayPush(pWal->toDeleteFiles, iter);
      } else {
        wDebug("vgId:%d, check not pass", pWal->cfg.vgId);
      }
    }

    // make new array, remove files
    taosArrayPopFrontBatch(pWal->fileInfoSet, deleteCnt);
    if (taosArrayGetSize(pWal->fileInfoSet) == 0) {
      pWal->writeCur = -1;
      pWal->vers.firstVer = pWal->vers.lastVer + 1;
    } else {
      pWal->vers.firstVer = ((SWalFileInfo *)taosArrayGet(pWal->fileInfoSet, 0))->firstVer;
    }
  }
  pWal->writeCur = taosArrayGetSize(pWal->fileInfoSet) - 1;
  pWal->totSize = newTotSize;
  pWal->vers.verInSnapshotting = -1;

  // save snapshot ver, commit ver
  code = walSaveMeta(pWal);
  if (code < 0) {
    goto END;
  }

  // delete files
  deleteCnt = taosArrayGetSize(pWal->toDeleteFiles);
  wDebug("vgId:%d, wal should delete %d files", pWal->cfg.vgId, deleteCnt);
  char fnameStr[WAL_FILE_LEN];
  for (int i = 0; i < deleteCnt; i++) {
    pInfo = taosArrayGet(pWal->toDeleteFiles, i);
    walBuildLogName(pWal, pInfo->firstVer, fnameStr);
    wDebug("vgId:%d, wal remove file %s", pWal->cfg.vgId, fnameStr);
    if (taosRemoveFile(fnameStr) < 0 && errno != ENOENT) {
      wError("vgId:%d, failed to remove log file %s due to %s", pWal->cfg.vgId, fnameStr, strerror(errno));
      goto END;
    }
    walBuildIdxName(pWal, pInfo->firstVer, fnameStr);
    wDebug("vgId:%d, wal remove file %s", pWal->cfg.vgId, fnameStr);
    if (taosRemoveFile(fnameStr) < 0 && errno != ENOENT) {
      wError("vgId:%d, failed to remove idx file %s due to %s", pWal->cfg.vgId, fnameStr, strerror(errno));
      goto END;
    }
  }
  taosArrayClear(pWal->toDeleteFiles);

END:
  taosThreadMutexUnlock(&pWal->mutex);
  return code;
}

L
Liu Jicong 已提交
396
/*
 * Close the current idx/log files (after fsync) and start a new file pair
 * whose first version is lastVer + 1.
 *
 * On success the new handles are installed in pWal, writeCur points at the
 * last entry of fileInfoSet, lastRollSeq is refreshed and the meta is saved.
 *
 * If creating the log file or walRollFileInfo() fails, the handles that were
 * already opened for the new pair are closed again so they do not leak.
 * The caller is expected to hold whatever lock protects pWal; this function
 * takes none itself.
 *
 * Returns 0 on success, non-zero on failure.
 */
int32_t walRollImpl(SWal *pWal) {
  int32_t   code = 0;
  TdFilePtr pIdxFile = NULL;
  TdFilePtr pLogFile = NULL;
  int64_t   newFileFirstVer;
  char      fnameStr[WAL_FILE_LEN];

  if (pWal->pIdxFile != NULL) {
    code = taosFsyncFile(pWal->pIdxFile);
    if (code != 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto END;
    }
    code = taosCloseFile(&pWal->pIdxFile);
    if (code != 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto END;
    }
  }

  if (pWal->pLogFile != NULL) {
    code = taosFsyncFile(pWal->pLogFile);
    if (code != 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto END;
    }
    code = taosCloseFile(&pWal->pLogFile);
    if (code != 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto END;
    }
  }

  // create new file
  newFileFirstVer = pWal->vers.lastVer + 1;
  walBuildIdxName(pWal, newFileFirstVer, fnameStr);
  pIdxFile = taosOpenFile(fnameStr, TD_FILE_CREATE | TD_FILE_WRITE | TD_FILE_APPEND);
  if (pIdxFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    code = -1;
    goto END;
  }
  walBuildLogName(pWal, newFileFirstVer, fnameStr);
  pLogFile = taosOpenFile(fnameStr, TD_FILE_CREATE | TD_FILE_WRITE | TD_FILE_APPEND);
  wDebug("vgId:%d, wal create new file for write:%s", pWal->cfg.vgId, fnameStr);
  if (pLogFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    code = -1;
    goto END;
  }
  // error code was set inner
  code = walRollFileInfo(pWal);
  if (code != 0) {
    goto END;
  }

  // switch file: ownership of both handles moves to pWal, so the locals are
  // cleared to keep the cleanup below from closing them
  pWal->pIdxFile = pIdxFile;
  pWal->pLogFile = pLogFile;
  pIdxFile = NULL;
  pLogFile = NULL;
  pWal->writeCur = taosArrayGetSize(pWal->fileInfoSet) - 1;

  pWal->lastRollSeq = walGetSeq();

  code = walSaveMeta(pWal);
  if (code < 0) {
    wError("vgId:%d, failed to save meta since %s", pWal->cfg.vgId, terrstr());
    goto END;
  }

END:
  if (pIdxFile != NULL || pLogFile != NULL) {
    // failure before the switch: release the half-created pair and keep the
    // error that was recorded for the caller
    int32_t savedErr = terrno;
    if (pIdxFile != NULL) {
      taosCloseFile(&pIdxFile);
    }
    if (pLogFile != NULL) {
      taosCloseFile(&pLogFile);
    }
    terrno = savedErr;
  }
  return code;
}

L
Liu Jicong 已提交
467
/*
 * Append one idx entry {ver, offset} to the current idx file.
 *
 * The position the entry is expected to land at, relative to the current
 * file's first version, is computed for the debug log only. After a
 * successful write the file is seeked to its end; a failing seek is logged
 * as fatal but does not change the return value.
 *
 * Returns 0 when the whole entry was written, otherwise -1 with terrno set
 * from errno.
 */
static int32_t walWriteIndex(SWal *pWal, int64_t ver, int64_t offset) {
  SWalIdxEntry  idxEntry = {.ver = ver, .offset = offset};
  SWalFileInfo *curFile = walGetCurFileInfo(pWal);

  int64_t expectedPos = (idxEntry.ver - curFile->firstVer) * sizeof(SWalIdxEntry);
  wDebug("vgId:%d, write index, index:%" PRId64 ", offset:%" PRId64 ", at %" PRId64, pWal->cfg.vgId, ver, offset,
         expectedPos);

  int64_t written = taosWriteFile(pWal->pIdxFile, &idxEntry, sizeof(SWalIdxEntry));
  if (written == sizeof(SWalIdxEntry)) {
    // check alignment of idx entries
    if (taosLSeekFile(pWal->pIdxFile, 0, SEEK_END) < 0) {
      wFatal("vgId:%d, failed to seek end of idxfile due to %s. ver:%" PRId64 "", pWal->cfg.vgId, strerror(errno),
             ver);
    }
    return 0;
  }

  // short or failed write
  wError("vgId:%d, failed to write idx entry due to %s. ver:%" PRId64, pWal->cfg.vgId, strerror(errno), ver);
  terrno = TAOS_SYSTEM_ERROR(errno);
  return -1;
}

L
Liu Jicong 已提交
490 491 492
/*
 * Write one WAL record (idx entry, record head, body) at the current write
 * position and update the in-memory bookkeeping.
 *
 * pWal      WAL handle; pIdxFile / pLogFile must already be open.
 * index     version of the new record.
 * msgType   message type stored in the record head.
 * syncMeta  sync-module information copied into the record head.
 * body      payload, bodyLen bytes.
 *
 * The head and body checksums are computed into pWal->writeHead before
 * anything is written. If any of the three writes fails, the log file is
 * truncated back to the offset it had on entry and the idx file to the slot
 * for `index`, so that no partial record is left behind.
 *
 * Returns 0 on success, -1 on failure (terrno set by the failing step).
 */
static FORCE_INLINE int32_t walWriteImpl(SWal *pWal, int64_t index, tmsg_t msgType, SWalSyncInfo syncMeta,
                                         const void *body, int32_t bodyLen) {
  int64_t code = 0;

  // remember where this record starts, for rollback on failure
  int64_t       offset = walGetCurFileOffset(pWal);
  SWalFileInfo *pFileInfo = walGetCurFileInfo(pWal);

  pWal->writeHead.head.version = index;
  pWal->writeHead.head.bodyLen = bodyLen;
  pWal->writeHead.head.msgType = msgType;
  pWal->writeHead.head.ingestTs = 0;

  // sync info for sync module
  pWal->writeHead.head.syncMeta = syncMeta;

  pWal->writeHead.cksumHead = walCalcHeadCksum(&pWal->writeHead);
  pWal->writeHead.cksumBody = walCalcBodyCksum(body, bodyLen);
  wDebug("vgId:%d, wal write log %" PRId64 ", msgType: %s, cksum head %u cksum body %u", pWal->cfg.vgId, index,
         TMSG_INFO(msgType), pWal->writeHead.cksumHead, pWal->writeHead.cksumBody);

  code = walWriteIndex(pWal, index, offset);
  if (code < 0) {
    goto END;
  }

  if (taosWriteFile(pWal->pLogFile, &pWal->writeHead, sizeof(SWalCkHead)) != sizeof(SWalCkHead)) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, file:%" PRId64 ".log, failed to write since %s", pWal->cfg.vgId, walGetLastFileFirstVer(pWal),
           strerror(errno));
    code = -1;
    goto END;
  }

  if (taosWriteFile(pWal->pLogFile, (char *)body, bodyLen) != bodyLen) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, file:%" PRId64 ".log, failed to write since %s", pWal->cfg.vgId, walGetLastFileFirstVer(pWal),
           strerror(errno));
    code = -1;
    goto END;
  }

  // set status
  if (pWal->vers.firstVer == -1) {
    pWal->vers.firstVer = 0;
  }
  pWal->vers.lastVer = index;
  pWal->totSize += sizeof(SWalCkHead) + bodyLen;
  pFileInfo->lastVer = index;
  pFileInfo->fileSize += sizeof(SWalCkHead) + bodyLen;

  return 0;

END:
  // recover in a reverse order
  if (taosFtruncateFile(pWal->pLogFile, offset) < 0) {
    wFatal("vgId:%d, failed to ftruncate logfile to offset:%" PRId64 " during recovery due to %s", pWal->cfg.vgId,
           offset, strerror(errno));
    terrno = TAOS_SYSTEM_ERROR(errno);
  }

  int64_t idxOffset = (index - pFileInfo->firstVer) * sizeof(SWalIdxEntry);
  if (taosFtruncateFile(pWal->pIdxFile, idxOffset) < 0) {
    wFatal("vgId:%d, failed to ftruncate idxfile to offset:%" PRId64 " during recovery due to %s", pWal->cfg.vgId,
           idxOffset, strerror(errno));
    terrno = TAOS_SYSTEM_ERROR(errno);
  }
  return -1;
}

B
Benguang Zhao 已提交
559 560
/*
 * Append a record with version `index` to the WAL.
 *
 * `index` must be exactly lastVer + 1, otherwise terrno is set to
 * TSDB_CODE_WAL_INVALID_VER. The file is rolled if required, the write files
 * are (re)initialised when either handle is missing or writeCur is negative,
 * and the record is written. Everything runs under pWal->mutex.
 *
 * Returns `index` on success, -1 on failure.
 */
int64_t walAppendLog(SWal *pWal, int64_t index, tmsg_t msgType, SWalSyncInfo syncMeta, const void *body,
                     int32_t bodyLen) {
  int64_t result = -1;

  taosThreadMutexLock(&pWal->mutex);

  if (index != pWal->vers.lastVer + 1) {
    terrno = TSDB_CODE_WAL_INVALID_VER;
    goto _out;
  }

  if (walCheckAndRoll(pWal) < 0) {
    goto _out;
  }

  bool writable = (pWal->pLogFile != NULL) && (pWal->pIdxFile != NULL) && (pWal->writeCur >= 0);
  if (!writable && walInitWriteFile(pWal) < 0) {
    goto _out;
  }

  if (walWriteImpl(pWal, index, msgType, syncMeta, body, bodyLen) < 0) {
    goto _out;
  }

  result = index;

_out:
  taosThreadMutexUnlock(&pWal->mutex);
  return result;
}
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
589

L
Liu Jicong 已提交
590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609
/*
 * Write a record with version `index` and the given sync information.
 *
 * `index` must be exactly lastVer + 1 (records with assigned indexes have to
 * be written in order), otherwise terrno is set to TSDB_CODE_WAL_INVALID_VER.
 * The file is rolled if required, the write files are (re)initialised when
 * the log handle or the idx handle is missing or writeCur is negative, and
 * the record is written. Everything runs under pWal->mutex.
 *
 * Returns 0 on success, -1 on failure.
 */
int32_t walWriteWithSyncInfo(SWal *pWal, int64_t index, tmsg_t msgType, SWalSyncInfo syncMeta, const void *body,
                             int32_t bodyLen) {
  int32_t code = 0;

  taosThreadMutexLock(&pWal->mutex);

  // concurrency control:
  // if logs are write with assigned index,
  // smaller index must be write before larger one
  if (index != pWal->vers.lastVer + 1) {
    terrno = TSDB_CODE_WAL_INVALID_VER;
    taosThreadMutexUnlock(&pWal->mutex);
    return -1;
  }

  if (walCheckAndRoll(pWal) < 0) {
    taosThreadMutexUnlock(&pWal->mutex);
    return -1;
  }

  // both handles must be open; the original tested pIdxFile twice and never
  // looked at pLogFile
  if (pWal->pLogFile == NULL || pWal->pIdxFile == NULL || pWal->writeCur < 0) {
    if (walInitWriteFile(pWal) < 0) {
      taosThreadMutexUnlock(&pWal->mutex);
      return -1;
    }
  }

  if (walWriteImpl(pWal, index, msgType, syncMeta, body, bodyLen) < 0) {
    taosThreadMutexUnlock(&pWal->mutex);
    return -1;
  }

  taosThreadMutexUnlock(&pWal->mutex);
  return code;
}

L
Liu Jicong 已提交
626
/*
 * Write a record that carries no real sync information.
 *
 * Forwards to walWriteWithSyncInfo() with a placeholder SWalSyncInfo
 * (isWeek = -1, seqNum = term = UINT64_MAX) and returns its result.
 */
int32_t walWrite(SWal *pWal, int64_t index, tmsg_t msgType, const void *body, int32_t bodyLen) {
  SWalSyncInfo placeholder = {
      .isWeek = -1,
      .seqNum = UINT64_MAX,
      .term = UINT64_MAX,
  };

  int32_t rc = walWriteWithSyncInfo(pWal, index, msgType, placeholder, body, bodyLen);
  return rc;
}

L
Liu Jicong 已提交
635
/*
 * Fsync the current log file when asked to.
 *
 * The sync is performed when `forceFsync` is true, or when the WAL level is
 * TAOS_WAL_FSYNC and fsyncPeriod is 0. A failing fsync is only logged.
 * Runs under pWal->mutex.
 */
void walFsync(SWal *pWal, bool forceFsync) {
  taosThreadMutexLock(&pWal->mutex);

  bool syncNow = forceFsync || (pWal->cfg.level == TAOS_WAL_FSYNC && pWal->cfg.fsyncPeriod == 0);
  if (syncNow) {
    wTrace("vgId:%d, fileId:%" PRId64 ".log, do fsync", pWal->cfg.vgId, walGetCurFileFirstVer(pWal));

    int32_t rc = taosFsyncFile(pWal->pLogFile);
    if (rc < 0) {
      wError("vgId:%d, file:%" PRId64 ".log, fsync failed since %s", pWal->cfg.vgId, walGetCurFileFirstVer(pWal),
             strerror(errno));
    }
  }

  taosThreadMutexUnlock(&pWal->mutex);
}