walWrite.c 18.8 KB
Newer Older
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#include "os.h"
S
Shengliang Guan 已提交
17
#include "taoserror.h"
18
#include "tchecksum.h"
S
Shengliang Guan 已提交
19
#include "walInt.h"
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
20

21 22 23 24 25
// Reset the WAL so that it restarts from a snapshot taken at version `ver`.
//
// The call is rejected (returns -1, nothing is modified) if any entry in
// pWal->pRefHash has a refVer other than -1 that is <= ver. Otherwise the
// current write handles are closed, every log/idx file listed in fileInfoSet
// is removed, the meta file is removed, and the in-memory state is reset:
//   lastVer = ver, commitVer = snapshotVer = ver - 1, firstVer = -1.
//
// Returns 0 on success. If a file cannot be removed, terrno is set from errno
// and -1 is returned; files removed before the failure stay removed.
// The WAL mutex is held for the whole operation.
int32_t walRestoreFromSnapshot(SWal *pWal, int64_t ver) {
  int32_t code = -1;

  taosThreadMutexLock(&pWal->mutex);

  void *pIter = NULL;
  while (1) {
    pIter = taosHashIterate(pWal->pRefHash, pIter);
    if (pIter == NULL) break;
    // Decode the iterator the same way walEndSnapshot does for this hash:
    // the iterator points at a stored SWalRef pointer, not at the SWalRef itself.
    // NOTE(review): confirm against the taosHashPut call that fills pRefHash.
    SWalRef *pRef = *(SWalRef **)pIter;
    if (pRef->refVer != -1 && pRef->refVer <= ver) {
      taosHashCancelIterate(pWal->pRefHash, pIter);
      goto END;
    }
  }

  taosCloseFile(&pWal->pLogFile);
  taosCloseFile(&pWal->pIdxFile);

  if (pWal->vers.firstVer != -1) {
    int32_t fileSetSize = taosArrayGetSize(pWal->fileInfoSet);
    for (int32_t i = 0; i < fileSetSize; i++) {
      SWalFileInfo *pFileInfo = taosArrayGet(pWal->fileInfoSet, i);
      char          fnameStr[WAL_FILE_LEN];

      walBuildLogName(pWal, pFileInfo->firstVer, fnameStr);
      if (taosRemoveFile(fnameStr) < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
        wError("vgId:%d, restore from snapshot, cannot remove file %s since %s", pWal->cfg.vgId, fnameStr, terrstr());
        goto END;
      }
      wInfo("vgId:%d, restore from snapshot, remove file %s", pWal->cfg.vgId, fnameStr);

      walBuildIdxName(pWal, pFileInfo->firstVer, fnameStr);
      if (taosRemoveFile(fnameStr) < 0) {
        terrno = TAOS_SYSTEM_ERROR(errno);
        wError("vgId:%d, cannot remove file %s since %s", pWal->cfg.vgId, fnameStr, terrstr());
        goto END;
      }
      wInfo("vgId:%d, restore from snapshot, remove file %s", pWal->cfg.vgId, fnameStr);
    }
  }
  walRemoveMeta(pWal);

  // no files remain: clear the write cursor and size accounting
  pWal->writeCur = -1;
  pWal->totSize = 0;
  pWal->lastRollSeq = -1;

  taosArrayClear(pWal->fileInfoSet);
  pWal->vers.firstVer = -1;
  pWal->vers.lastVer = ver;
  pWal->vers.commitVer = ver - 1;
  pWal->vers.snapshotVer = ver - 1;
  pWal->vers.verInSnapshotting = -1;

  code = 0;

END:
  taosThreadMutexUnlock(&pWal->mutex);
  return code;
}

L
Liu Jicong 已提交
80 81 82 83 84 85
// Store `ver` as the WAL's applied version.
// No validation is performed and the WAL mutex is not taken; always returns 0.
int32_t walApplyVer(SWal *pWal, int64_t ver) {
  // TODO: error check
  pWal->vers.appliedVer = ver;

  return 0;
}

L
Liu Jicong 已提交
86
// Advance the commit version to `ver`.
//
// A `ver` below the current commit version is ignored (returns 0).
// A `ver` beyond lastVer is rejected: terrno = TSDB_CODE_WAL_INVALID_VER, returns -1.
// Otherwise commitVer is set to `ver` and 0 is returned.
int32_t walCommit(SWal *pWal, int64_t ver) {
  // invariant on entry: snapshotVer <= commitVer <= lastVer
  ASSERT(pWal->vers.commitVer >= pWal->vers.snapshotVer);
  ASSERT(pWal->vers.commitVer <= pWal->vers.lastVer);

  if (ver >= pWal->vers.commitVer) {
    if (ver > pWal->vers.lastVer) {
      terrno = TSDB_CODE_WAL_INVALID_VER;
      return -1;
    }
    pWal->vers.commitVer = ver;
  }

  return 0;
}

// Roll the WAL back so that `ver` and every later entry are discarded;
// afterwards lastVer == ver - 1.
//
// `ver` must satisfy commitVer <= ver <= lastVer, otherwise terrno is set to
// TSDB_CODE_WAL_INVALID_VER and -1 is returned.
//
// Steps (all under the WAL mutex):
//   1. If `ver` is older than the last file's first version, switch the write
//      position via walChangeWrite and remove the log/idx files after writeCur.
//   2. Look up `ver` in the current idx file to get its log offset, and check
//      that the log head at that offset has a valid checksum and the same version.
//   3. Truncate the log file and idx file at that entry.
//   4. Update version/file-size bookkeeping and persist the meta.
//
// Returns 0 on success and -1 on failure. Temporary file handles opened here
// are closed on every exit path.
int32_t walRollback(SWal *pWal, int64_t ver) {
  int32_t      ret = -1;
  int64_t      code = 0;
  int64_t      idxOff = 0;
  char         fnameStr[WAL_FILE_LEN];
  TdFilePtr    pIdxFile = NULL;
  TdFilePtr    pLogFile = NULL;
  SWalIdxEntry entry;
  SWalCkHead   head;

  taosThreadMutexLock(&pWal->mutex);

  if (ver > pWal->vers.lastVer || ver < pWal->vers.commitVer) {
    terrno = TSDB_CODE_WAL_INVALID_VER;
    goto END;
  }

  // find correct file
  if (ver < walGetLastFileFirstVer(pWal)) {
    // change current files
    code = walChangeWrite(pWal, ver);
    if (code < 0) {
      goto END;
    }

    // delete files that lie entirely after the new write position
    int fileSetSize = taosArrayGetSize(pWal->fileInfoSet);
    for (int i = pWal->writeCur + 1; i < fileSetSize; i++) {
      SWalFileInfo *pStale = (SWalFileInfo *)taosArrayGet(pWal->fileInfoSet, i);
      walBuildLogName(pWal, pStale->firstVer, fnameStr);
      taosRemoveFile(fnameStr);
      walBuildIdxName(pWal, pStale->firstVer, fnameStr);
      taosRemoveFile(fnameStr);
    }
    // pop from fileInfoSet
    taosArraySetSize(pWal->fileInfoSet, pWal->writeCur + 1);
  }

  walBuildIdxName(pWal, walGetCurFileFirstVer(pWal), fnameStr);
  pIdxFile = taosOpenFile(fnameStr, TD_FILE_WRITE | TD_FILE_READ | TD_FILE_APPEND);
  if (pIdxFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    ASSERT(0);
    goto END;
  }

  idxOff = walGetVerIdxOffset(pWal, ver);
  code = taosLSeekFile(pIdxFile, idxOff, SEEK_SET);
  if (code < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    ASSERT(0);
    goto END;
  }

  // read idx file and get log file pos
  if (taosReadFile(pIdxFile, &entry, sizeof(SWalIdxEntry)) != sizeof(SWalIdxEntry)) {
    ASSERT(0);
    goto END;
  }
  ASSERT(entry.ver == ver);

  walBuildLogName(pWal, walGetCurFileFirstVer(pWal), fnameStr);
  pLogFile = taosOpenFile(fnameStr, TD_FILE_WRITE | TD_FILE_READ | TD_FILE_APPEND);
  if (pLogFile == NULL) {
    // TODO
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto END;
  }

  code = taosLSeekFile(pLogFile, entry.offset, SEEK_SET);
  if (code < 0) {
    // TODO
    terrno = TAOS_SYSTEM_ERROR(errno);
    goto END;
  }

  // validate offset: the head stored there must be intact and belong to `ver`
  ASSERT(taosValidFile(pLogFile));
  int64_t size = taosReadFile(pLogFile, &head, sizeof(SWalCkHead));
  if (size != sizeof(SWalCkHead)) {
    ASSERT(0);
    goto END;
  }

  code = walValidHeadCksum(&head);
  if (code != 0) {
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    ASSERT(0);
    goto END;
  }
  if (head.head.version != ver) {
    terrno = TSDB_CODE_WAL_FILE_CORRUPTED;
    ASSERT(0);
    goto END;
  }

  // truncate old files
  code = taosFtruncateFile(pLogFile, entry.offset);
  if (code < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    ASSERT(0);
    goto END;
  }
  code = taosFtruncateFile(pIdxFile, idxOff);
  if (code < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    ASSERT(0);
    goto END;
  }

  pWal->vers.lastVer = ver - 1;
  if (pWal->vers.lastVer < pWal->vers.firstVer) {
    // everything was rolled back: the WAL no longer holds any version
    ASSERT(pWal->vers.lastVer == pWal->vers.firstVer - 1);
    pWal->vers.firstVer = -1;
  }

  SWalFileInfo *pLastInfo = (SWalFileInfo *)taosArrayGetLast(pWal->fileInfoSet);
  pLastInfo->lastVer = ver - 1;
  pLastInfo->fileSize = entry.offset;
  // NOTE(review): a former `if (lastVer < ver - 1)` branch that reset firstVer
  // was dropped here; it could never run because lastVer was just set to ver - 1.

  taosCloseFile(&pIdxFile);
  pIdxFile = NULL;
  taosCloseFile(&pLogFile);
  pLogFile = NULL;

  code = walSaveMeta(pWal);
  if (code < 0) {
    wError("vgId:%d, failed to save meta since %s", pWal->cfg.vgId, terrstr());
    goto END;
  }

  ret = 0;

END:
  // release any handle still open (error paths only)
  if (pIdxFile != NULL) {
    taosCloseFile(&pIdxFile);
  }
  if (pLogFile != NULL) {
    taosCloseFile(&pLogFile);
  }
  taosThreadMutexUnlock(&pWal->mutex);
  return ret;
}
L
Liu Jicong 已提交
235

L
Liu Jicong 已提交
236 237 238 239 240
// Roll to a new WAL file when one is needed before the next write.
//
// A roll happens when:
//   - fileInfoSet is empty (no file to write to yet), or
//   - cfg.rollPeriod is enabled (neither -1 nor 0) and more than rollPeriod
//     sequence ticks have passed since lastRollSeq, or
//   - cfg.segSize is enabled (neither -1 nor 0) and the last file is larger
//     than segSize.
// Returns 0 if no roll was needed or the roll succeeded, -1 if walRollImpl failed.
static FORCE_INLINE int32_t walCheckAndRoll(SWal *pWal) {
  if (taosArrayGetSize(pWal->fileInfoSet) == 0) {
    return (walRollImpl(pWal) < 0) ? -1 : 0;
  }

  int64_t elapsed = walGetSeq() - pWal->lastRollSeq;

  bool periodDue = pWal->cfg.rollPeriod != -1 && pWal->cfg.rollPeriod != 0 && elapsed > pWal->cfg.rollPeriod;
  // the size check is evaluated only when the period check did not already fire
  bool needRoll =
      periodDue || (pWal->cfg.segSize != -1 && pWal->cfg.segSize != 0 && walGetLastFileSize(pWal) > pWal->cfg.segSize);

  if (needRoll && walRollImpl(pWal) < 0) {
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
258
// Mark the start of a snapshot at version `ver`.
//
// Records `ver` in vers.verInSnapshotting (read later by walEndSnapshot).
// When cfg.retentionPeriod is 0 and the last file is non-empty, the WAL is
// rolled to a fresh file under the mutex. A failed roll is logged and
// otherwise ignored. Always returns 0.
int32_t walBeginSnapshot(SWal *pWal, int64_t ver) {
  pWal->vers.verInSnapshotting = ver;
  wDebug("vgId:%d, wal begin snapshot for version %" PRId64 ", first ver %" PRId64 ", last ver %" PRId64,
         pWal->cfg.vgId, ver, pWal->vers.firstVer, pWal->vers.lastVer);

  // check file rolling
  if (pWal->cfg.retentionPeriod == 0) {
    taosThreadMutexLock(&pWal->mutex);
    if (walGetLastFileSize(pWal) != 0) {
      if (walRollImpl(pWal) < 0) {
        // best effort: report the failure instead of dropping it silently
        wError("vgId:%d, failed to roll wal file at begin snapshot since %s", pWal->cfg.vgId, terrstr());
      }
    }
    taosThreadMutexUnlock(&pWal->mutex);
  }

  return 0;
}

L
Liu Jicong 已提交
274
// Finish the snapshot started by walBeginSnapshot and remove WAL files that
// are no longer needed.
//
// Reads vers.verInSnapshotting; if it is -1 (no snapshot in progress) returns -1.
// Otherwise:
//   1. snapshotVer is set to that version.
//   2. The deletion bound is lowered to (refVer - 1) for every entry in
//      pRefHash with refVer != -1.
//   3. Files before the bound that exceed cfg.retentionSize or match the
//      cfg.retentionPeriod test are counted, and that many files are removed
//      from the front of fileInfoSet.
//   4. firstVer, writeCur and totSize are updated and the meta is saved.
//
// totSize is reduced only by the size of files whose log AND idx file were
// actually removed, so a removal that stops early does not corrupt the accounting.
// Returns the result of walSaveMeta (or -1 as described above).
int32_t walEndSnapshot(SWal *pWal) {
  int32_t code = 0;
  taosThreadMutexLock(&pWal->mutex);
  int64_t ver = pWal->vers.verInSnapshotting;

  wDebug("vgId:%d, wal end snapshot for version %" PRId64 ", first ver %" PRId64 ", last ver %" PRId64, pWal->cfg.vgId,
         ver, pWal->vers.firstVer, pWal->vers.lastVer);

  if (ver == -1) {
    code = -1;
    goto END;
  }

  pWal->vers.snapshotVer = ver;
  int ts = taosGetTimestampSec();

  // never delete a version that is still referenced
  void *pIter = NULL;
  while (1) {
    pIter = taosHashIterate(pWal->pRefHash, pIter);
    if (pIter == NULL) break;
    SWalRef *pRef = *(SWalRef **)pIter;
    if (pRef->refVer == -1) continue;
    ver = TMIN(ver, pRef->refVer - 1);
    wDebug("vgId:%d, wal found ref %" PRId64 ", refId %" PRId64, pWal->cfg.vgId, pRef->refVer, pRef->refId);
  }

  int          deleteCnt = 0;
  int64_t      newTotSize = pWal->totSize;  // projected size, used only to plan deletions
  int64_t      removedSize = 0;             // bytes of files actually removed
  SWalFileInfo tmp;
  tmp.firstVer = ver;

  // find files safe to delete
  SWalFileInfo *pInfo = taosArraySearch(pWal->fileInfoSet, &tmp, compareWalFileInfo, TD_LE);
  if (pInfo) {
    // NOTE(review): stepping backwards when the snapshot covers the whole file
    // looks conservative (and steps before the array when pInfo is the first
    // element) — confirm the intended direction.
    if (ver >= pInfo->lastVer) {
      pInfo--;
    }
    if (POINTER_DISTANCE(pInfo, pWal->fileInfoSet->pData) > 0) {
      wDebug("vgId:%d, begin remove from %" PRId64, pWal->cfg.vgId, pInfo->firstVer);
    } else {
      wDebug("vgId:%d, no remove", pWal->cfg.vgId);
    }

    // iterate files, until the searched result
    for (SWalFileInfo *iter = pWal->fileInfoSet->pData; iter < pInfo; iter++) {
      // NOTE(review): `closeTs + retentionPeriod > ts` selects files whose
      // retention window has NOT yet elapsed — verify the comparison direction.
      if ((pWal->cfg.retentionSize != -1 && newTotSize > pWal->cfg.retentionSize) ||
          (pWal->cfg.retentionPeriod != -1 && iter->closeTs + pWal->cfg.retentionPeriod > ts)) {
        // delete according to file size or close time
        deleteCnt++;
        newTotSize -= iter->fileSize;
      }
    }

    int32_t actualDelete = 0;
    char    fnameStr[WAL_FILE_LEN];
    // remove file
    for (int i = 0; i < deleteCnt; i++) {
      pInfo = taosArrayGet(pWal->fileInfoSet, i);

      walBuildLogName(pWal, pInfo->firstVer, fnameStr);
      wDebug("vgId:%d, remove file %s", pWal->cfg.vgId, fnameStr);
      if (taosRemoveFile(fnameStr) < 0) {
        // stop here; files removed so far are still accounted for below
        wError("vgId:%d, failed to remove file %s since %s", pWal->cfg.vgId, fnameStr, strerror(errno));
        break;
      }

      walBuildIdxName(pWal, pInfo->firstVer, fnameStr);
      wDebug("vgId:%d, remove file %s", pWal->cfg.vgId, fnameStr);
      if (taosRemoveFile(fnameStr) < 0) {
        ASSERT(0);
      }

      actualDelete++;
      removedSize += pInfo->fileSize;
    }

    // make new array, remove files
    taosArrayPopFrontBatch(pWal->fileInfoSet, actualDelete);
    if (taosArrayGetSize(pWal->fileInfoSet) == 0) {
      pWal->writeCur = -1;
      pWal->vers.firstVer = -1;
    } else {
      pWal->vers.firstVer = ((SWalFileInfo *)taosArrayGet(pWal->fileInfoSet, 0))->firstVer;
    }
  }

  pWal->writeCur = taosArrayGetSize(pWal->fileInfoSet) - 1;
  pWal->totSize -= removedSize;
  pWal->vers.verInSnapshotting = -1;

  // save snapshot ver, commit ver
  code = walSaveMeta(pWal);

END:
  taosThreadMutexUnlock(&pWal->mutex);
  return code;
}

L
Liu Jicong 已提交
367
// Close the current idx/log files and start a new file pair whose first
// version is lastVer + 1.
//
// On success the new handles are stored in pWal->pIdxFile / pWal->pLogFile,
// writeCur points at the last fileInfoSet entry, lastRollSeq is refreshed and
// the meta is saved. Returns 0 on success, non-zero on failure (terrno is set
// here for close/open failures; walRollFileInfo sets its own error code).
// Handles opened here that were not handed over to pWal are closed before returning.
// The caller is expected to hold the WAL mutex (this function takes no lock).
int32_t walRollImpl(SWal *pWal) {
  int32_t   code = 0;
  TdFilePtr pIdxFile = NULL;
  TdFilePtr pLogFile = NULL;
  int64_t   newFileFirstVer = 0;
  char      fnameStr[WAL_FILE_LEN];

  if (pWal->pIdxFile != NULL) {
    code = taosCloseFile(&pWal->pIdxFile);
    if (code != 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto END;
    }
  }
  if (pWal->pLogFile != NULL) {
    code = taosCloseFile(&pWal->pLogFile);
    if (code != 0) {
      terrno = TAOS_SYSTEM_ERROR(errno);
      goto END;
    }
  }

  // create new file
  newFileFirstVer = pWal->vers.lastVer + 1;

  walBuildIdxName(pWal, newFileFirstVer, fnameStr);
  pIdxFile = taosOpenFile(fnameStr, TD_FILE_CREATE | TD_FILE_WRITE | TD_FILE_APPEND);
  if (pIdxFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    code = -1;
    goto END;
  }

  walBuildLogName(pWal, newFileFirstVer, fnameStr);
  pLogFile = taosOpenFile(fnameStr, TD_FILE_CREATE | TD_FILE_WRITE | TD_FILE_APPEND);
  if (pLogFile == NULL) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    code = -1;
    goto END;
  }

  // error code was set inner
  code = walRollFileInfo(pWal);
  if (code != 0) {
    goto END;
  }

  // switch file: from here on pWal owns both handles
  pWal->pIdxFile = pIdxFile;
  pWal->pLogFile = pLogFile;
  pIdxFile = NULL;
  pLogFile = NULL;

  pWal->writeCur = taosArrayGetSize(pWal->fileInfoSet) - 1;
  ASSERT(pWal->writeCur >= 0);

  pWal->lastRollSeq = walGetSeq();

  code = walSaveMeta(pWal);
  if (code < 0) {
    wError("vgId:%d, failed to save meta since %s", pWal->cfg.vgId, terrstr());
  }

END:
  // close handles that were opened but never handed over (failure paths)
  if (pIdxFile != NULL) {
    taosCloseFile(&pIdxFile);
  }
  if (pLogFile != NULL) {
    taosCloseFile(&pLogFile);
  }
  return code;
}

L
Liu Jicong 已提交
425
// Append one index entry {ver, offset} to the current idx file.
//
// The expected position of the entry is (ver - firstVer) * sizeof(SWalIdxEntry)
// within the current file; after the write the file end is checked against it.
// Returns 0 on success. On a short write or a failed seek, terrno is set from
// errno and -1 is returned.
static int32_t walWriteIndex(SWal *pWal, int64_t ver, int64_t offset) {
  SWalIdxEntry  entry = {.ver = ver, .offset = offset};
  SWalFileInfo *pFileInfo = walGetCurFileInfo(pWal);
  ASSERT(pFileInfo != NULL);
  ASSERT(pFileInfo->firstVer >= 0);
  int64_t idxOffset = (entry.ver - pFileInfo->firstVer) * sizeof(SWalIdxEntry);
  wDebug("vgId:%d, write index, index:%" PRId64 ", offset:%" PRId64 ", at %" PRId64, pWal->cfg.vgId, ver, offset,
         idxOffset);

  int64_t size = taosWriteFile(pWal->pIdxFile, &entry, sizeof(SWalIdxEntry));
  if (size != sizeof(SWalIdxEntry)) {
    // capture errno before the logger has a chance to overwrite it
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, failed to write idx entry due to %s. ver:%" PRId64, pWal->cfg.vgId, strerror(errno), ver);
    return -1;
  }

  // check alignment of idx entries
  int64_t endOffset = taosLSeekFile(pWal->pIdxFile, 0, SEEK_END);
  if (endOffset < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wFatal("vgId:%d, failed to seek end of idxfile due to %s. ver:%" PRId64 "", pWal->cfg.vgId, strerror(errno), ver);
    // report the failure instead of falling through with an unknown file position
    return -1;
  }
  ASSERT(endOffset == idxOffset + sizeof(SWalIdxEntry) && "Offset of idx entries misaligned");
  return 0;
}

L
Liu Jicong 已提交
450 451 452
// Write one WAL record (index entry, checksummed head, body) for version `index`.
//
// Fills pWal->writeHead with the record metadata and checksums, appends the
// index entry, then the head and the body to the current log file. On success
// the version and size bookkeeping of both the WAL and the current file info
// is advanced and 0 is returned.
//
// On any write failure both files are truncated back to their size before the
// call (log file to `offset`, idx file to this record's slot) and -1 is returned.
// The caller is expected to hold the WAL mutex (this function takes no lock).
static FORCE_INLINE int32_t walWriteImpl(SWal *pWal, int64_t index, tmsg_t msgType, SWalSyncInfo syncMeta,
                                         const void *body, int32_t bodyLen) {
  int64_t code = 0;

  int64_t       offset = walGetCurFileOffset(pWal);
  SWalFileInfo *pFileInfo = walGetCurFileInfo(pWal);
  ASSERT(pFileInfo != NULL);

  // first record of a fresh file defines the file's first version
  if (pFileInfo->firstVer == -1) {
    pFileInfo->firstVer = index;
  }
  pWal->writeHead.head.version = index;
  pWal->writeHead.head.bodyLen = bodyLen;
  pWal->writeHead.head.msgType = msgType;
  pWal->writeHead.head.ingestTs = 0;

  // sync info for sync module
  pWal->writeHead.head.syncMeta = syncMeta;

  pWal->writeHead.cksumHead = walCalcHeadCksum(&pWal->writeHead);
  pWal->writeHead.cksumBody = walCalcBodyCksum(body, bodyLen);
  wDebug("vgId:%d, wal write log %" PRId64 ", msgType: %s", pWal->cfg.vgId, index, TMSG_INFO(msgType));

  code = walWriteIndex(pWal, index, offset);
  if (code < 0) {
    goto END;
  }

  if (taosWriteFile(pWal->pLogFile, &pWal->writeHead, sizeof(SWalCkHead)) != sizeof(SWalCkHead)) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, file:%" PRId64 ".log, failed to write since %s", pWal->cfg.vgId, walGetLastFileFirstVer(pWal),
           strerror(errno));
    code = -1;
    goto END;
  }

  if (taosWriteFile(pWal->pLogFile, (char *)body, bodyLen) != bodyLen) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, file:%" PRId64 ".log, failed to write since %s", pWal->cfg.vgId, walGetLastFileFirstVer(pWal),
           strerror(errno));
    code = -1;
    goto END;
  }

  // set status
  if (pWal->vers.firstVer == -1) pWal->vers.firstVer = index;
  pWal->vers.lastVer = index;
  pWal->totSize += sizeof(SWalCkHead) + bodyLen;
  pFileInfo->lastVer = index;
  pFileInfo->fileSize += sizeof(SWalCkHead) + bodyLen;

  return 0;

END:
  // recover in a reverse order
  if (taosFtruncateFile(pWal->pLogFile, offset) < 0) {
    // capture errno before the logger has a chance to overwrite it
    terrno = TAOS_SYSTEM_ERROR(errno);
    wFatal("vgId:%d, failed to ftruncate logfile to offset:%" PRId64 " during recovery due to %s", pWal->cfg.vgId,
           offset, strerror(errno));
    ASSERT(0 && "failed to recover from error");
  }

  int64_t idxOffset = (index - pFileInfo->firstVer) * sizeof(SWalIdxEntry);
  if (taosFtruncateFile(pWal->pIdxFile, idxOffset) < 0) {
    terrno = TAOS_SYSTEM_ERROR(errno);
    wFatal("vgId:%d, failed to ftruncate idxfile to offset:%" PRId64 " during recovery due to %s", pWal->cfg.vgId,
           idxOffset, strerror(errno));
    ASSERT(0 && "failed to recover from error");
  }
  return -1;
}

// Append a record using the next free version (lastVer + 1).
//
// Rolls the file if needed, makes sure the write handles are open, then writes
// the record. Returns the version assigned to the record, or -1 on failure.
// The WAL mutex is held for the whole call.
int64_t walAppendLog(SWal *pWal, tmsg_t msgType, SWalSyncInfo syncMeta, const void *body, int32_t bodyLen) {
  int64_t result = -1;

  taosThreadMutexLock(&pWal->mutex);

  // the version is fixed before any file roll takes place
  int64_t index = pWal->vers.lastVer + 1;

  if (walCheckAndRoll(pWal) < 0) {
    goto UNLOCK;
  }

  bool writerMissing = (pWal->pLogFile == NULL || pWal->pIdxFile == NULL || pWal->writeCur < 0);
  if (writerMissing && walInitWriteFile(pWal) < 0) {
    goto UNLOCK;
  }

  ASSERT(pWal->pLogFile != NULL && pWal->pIdxFile != NULL && pWal->writeCur >= 0);

  if (walWriteImpl(pWal, index, msgType, syncMeta, body, bodyLen) < 0) {
    goto UNLOCK;
  }

  result = index;

UNLOCK:
  taosThreadMutexUnlock(&pWal->mutex);
  return result;
}
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
549

L
Liu Jicong 已提交
550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569
// Write a record at a caller-assigned version `index`, carrying `syncMeta`.
//
// `index` must be exactly lastVer + 1; otherwise terrno is set to
// TSDB_CODE_WAL_INVALID_VER and -1 is returned. Rolls the file if needed and
// (re)opens the write handles when either the log or the idx handle is missing.
// Returns 0 on success, -1 on failure. The WAL mutex is held for the whole call.
int32_t walWriteWithSyncInfo(SWal *pWal, int64_t index, tmsg_t msgType, SWalSyncInfo syncMeta, const void *body,
                             int32_t bodyLen) {
  int32_t code = -1;

  taosThreadMutexLock(&pWal->mutex);

  // concurrency control:
  // if logs are written with an assigned index,
  // a smaller index must be written before a larger one
  if (index != pWal->vers.lastVer + 1) {
    terrno = TSDB_CODE_WAL_INVALID_VER;
    goto END;
  }

  if (walCheckAndRoll(pWal) < 0) {
    goto END;
  }

  // both handles must be checked (the idx handle used to be tested twice)
  if (pWal->pIdxFile == NULL || pWal->pLogFile == NULL || pWal->writeCur < 0) {
    if (walInitWriteFile(pWal) < 0) {
      goto END;
    }
  }

  ASSERT(pWal->pIdxFile != NULL && pWal->pLogFile != NULL && pWal->writeCur >= 0);

  if (walWriteImpl(pWal, index, msgType, syncMeta, body, bodyLen) < 0) {
    goto END;
  }

  code = 0;

END:
  taosThreadMutexUnlock(&pWal->mutex);
  return code;
}

L
Liu Jicong 已提交
588
// Write a record at version `index` with placeholder sync info
// (isWeek = -1, seqNum = term = UINT64_MAX).
// Thin wrapper around walWriteWithSyncInfo; returns its result.
int32_t walWrite(SWal *pWal, int64_t index, tmsg_t msgType, const void *body, int32_t bodyLen) {
  SWalSyncInfo placeholderSync = {
      .isWeek = -1,
      .seqNum = UINT64_MAX,
      .term = UINT64_MAX,
  };

  return walWriteWithSyncInfo(pWal, index, msgType, placeholderSync, body, bodyLen);
}

L
Liu Jicong 已提交
597
// Flush the current idx and log files to disk.
//
// The fsync runs when `forceFsync` is true, or when the WAL is configured with
// level TAOS_WAL_FSYNC and fsyncPeriod 0. Failures are logged and not
// reported to the caller.
void walFsync(SWal *pWal, bool forceFsync) {
  // nothing to do unless forced or configured for fsync with period 0
  if (!forceFsync && (pWal->cfg.level != TAOS_WAL_FSYNC || pWal->cfg.fsyncPeriod != 0)) {
    return;
  }

  wTrace("vgId:%d, fileId:%" PRId64 ".idx, do fsync", pWal->cfg.vgId, walGetCurFileFirstVer(pWal));
  if (taosFsyncFile(pWal->pIdxFile) < 0) {
    wError("vgId:%d, file:%" PRId64 ".idx, fsync failed since %s", pWal->cfg.vgId, walGetCurFileFirstVer(pWal),
           strerror(errno));
  }

  wTrace("vgId:%d, fileId:%" PRId64 ".log, do fsync", pWal->cfg.vgId, walGetCurFileFirstVer(pWal));
  if (taosFsyncFile(pWal->pLogFile) < 0) {
    wError("vgId:%d, file:%" PRId64 ".log, fsync failed since %s", pWal->cfg.vgId, walGetCurFileFirstVer(pWal),
           strerror(errno));
  }
}