walWrite.c 10.1 KB
Newer Older
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

S
Shengliang Guan 已提交
16
#define _DEFAULT_SOURCE
L
Liu Jicong 已提交
17

陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
18
#include "os.h"
S
Shengliang Guan 已提交
19
#include "taoserror.h"
20
#include "tchecksum.h"
S
TD-1895  
Shengliang Guan 已提交
21
#include "tfile.h"
S
Shengliang Guan 已提交
22
#include "walInt.h"
陶建辉(Jeff)'s avatar
陶建辉(Jeff) 已提交
23

L
Liu Jicong 已提交
24
/*
 * Move the WAL commit version forward to `ver`.
 *
 * `ver` has to lie in [current commitVer, lastVer]. When it does not, terrno is
 * set to TSDB_CODE_WAL_INVALID_VER and -1 is returned; otherwise commitVer is
 * updated and 0 is returned.
 */
int32_t walCommit(SWal *pWal, int64_t ver) {
  // Expected ordering of the tracked versions: snapshotVer <= commitVer <= lastVer.
  ASSERT(pWal->vers.snapshotVer <= pWal->vers.commitVer);
  ASSERT(pWal->vers.lastVer >= pWal->vers.commitVer);

  if (pWal->vers.commitVer <= ver && ver <= pWal->vers.lastVer) {
    pWal->vers.commitVer = ver;
    return 0;
  }

  // Either behind the current commit point or past the last written version.
  terrno = TSDB_CODE_WAL_INVALID_VER;
  return -1;
}

/*
 * Roll the WAL back so that `ver` and every later entry are discarded.
 *
 * On success the log file is truncated at the offset recorded for `ver`, the
 * index file is truncated at the matching index offset, and lastVer becomes
 * `ver - 1`.
 *
 * Returns 0 on success (or when `ver == lastVer`, in which case nothing is
 * done), -1 on failure. terrno is set to TSDB_CODE_WAL_INVALID_VER when `ver`
 * is outside [commitVer, lastVer].
 *
 * All failure paths after the mutex is taken go through `_exit`, which closes
 * the locally opened index/log handles and releases the mutex.
 *
 * NOTE(review): `ver == lastVer` returns without removing the last entry even
 * though any other `ver` drops `ver` itself; confirm this is intended.
 */
int32_t walRollback(SWal *pWal, int64_t ver) {
  int32_t      ret = -1;
  int64_t      code;  // wide enough to hold a seek result, presumably 64-bit
  int64_t      idxTfd = -1;
  int64_t      logTfd = -1;
  int64_t      idxOff;
  SWalIdxEntry entry;
  SWalHead     head;
  char         fnameStr[WAL_FILE_LEN];

  if (ver == pWal->vers.lastVer) {
    return 0;
  }
  if (ver > pWal->vers.lastVer || ver < pWal->vers.commitVer) {
    terrno = TSDB_CODE_WAL_INVALID_VER;
    return -1;
  }
  pthread_mutex_lock(&pWal->mutex);

  // find correct file
  if (ver < walGetLastFileFirstVer(pWal)) {
    // close current files
    tfClose(pWal->writeIdxTfd);
    tfClose(pWal->writeLogTfd);

    // open old files
    code = walChangeFile(pWal, ver);
    if (code != 0) {
      goto _exit;
    }

    // Delete only the files AFTER the current one: the entry at writeCur is
    // kept by taosArraySetSize() below and its files are reopened right after,
    // so they must stay on disk.
    // NOTE(review): assumes walChangeFile() leaves writeCur at the file that
    // holds `ver` - confirm.
    int fileSetSize = taosArrayGetSize(pWal->fileInfoSet);
    for (int i = pWal->writeCur + 1; i < fileSetSize; i++) {
      SWalFileInfo *pFileInfo = taosArrayGet(pWal->fileInfoSet, i);
      walBuildLogName(pWal, pFileInfo->firstVer, fnameStr);
      remove(fnameStr);
      walBuildIdxName(pWal, pFileInfo->firstVer, fnameStr);
      remove(fnameStr);
    }
    // pop from fileInfoSet
    taosArraySetSize(pWal->fileInfoSet, pWal->writeCur + 1);
  }

  walBuildIdxName(pWal, walGetCurFileFirstVer(pWal), fnameStr);
  idxTfd = tfOpenReadWrite(fnameStr);
  if (idxTfd < 0) {
    goto _exit;
  }

  // TODO:change to deserialize function
  idxOff = walGetVerIdxOffset(pWal, ver);
  code = tfLseek(idxTfd, idxOff, SEEK_SET);
  if (code < 0) {
    goto _exit;
  }

  // read idx file and get log file pos
  // TODO:change to deserialize function
  if (tfRead(idxTfd, &entry, sizeof(SWalIdxEntry)) != sizeof(SWalIdxEntry)) {
    goto _exit;
  }
  ASSERT(entry.ver == ver);

  walBuildLogName(pWal, walGetCurFileFirstVer(pWal), fnameStr);
  logTfd = tfOpenReadWrite(fnameStr);
  if (logTfd < 0) {
    // TODO
    goto _exit;
  }
  code = tfLseek(logTfd, entry.offset, SEEK_SET);
  if (code < 0) {
    // TODO
    goto _exit;
  }

  // validate offset: the record found at entry.offset must be the one for `ver`
  ASSERT(tfValid(logTfd));
  if (tfRead(logTfd, &head, sizeof(SWalHead)) != sizeof(SWalHead)) {
    goto _exit;
  }
  code = walValidHeadCksum(&head);
  ASSERT(code == 0);
  if (code != 0) {
    goto _exit;
  }
  if (head.head.version != ver) {
    // TODO
    goto _exit;
  }

  // truncate old files
  code = tfFtruncate(logTfd, entry.offset);
  if (code < 0) {
    goto _exit;
  }
  code = tfFtruncate(idxTfd, idxOff);
  if (code < 0) {
    goto _exit;
  }

  pWal->vers.lastVer = ver - 1;
  ((SWalFileInfo *)taosArrayGetLast(pWal->fileInfoSet))->lastVer = ver - 1;
  ((SWalFileInfo *)taosArrayGetLast(pWal->fileInfoSet))->fileSize = entry.offset;
  ret = 0;

_exit:
  // These handles are local to this call and are not stored in pWal.
  if (logTfd >= 0) {
    tfClose(logTfd);
  }
  if (idxTfd >= 0) {
    tfClose(idxTfd);
  }
  pthread_mutex_unlock(&pWal->mutex);
  return ret;
}
L
Liu Jicong 已提交
140

L
Liu Jicong 已提交
141
/*
 * Record `ver` as the version of the snapshot that is now in progress.
 *
 * When cfg.retentionPeriod is 0 the current WAL file is rolled as well.
 * Always returns 0; the result of walRoll() is not inspected here.
 */
int32_t walBeginSnapshot(SWal *pWal, int64_t ver) {
  pWal->vers.verInSnapshotting = ver;

  // check file rolling
  if (pWal->cfg.retentionPeriod != 0) {
    return 0;
  }

  walRoll(pWal);
  return 0;
}

L
Liu Jicong 已提交
151
/*
 * Finish the snapshot started by walBeginSnapshot().
 *
 * Publishes verInSnapshotting as snapshotVer, removes WAL files that are
 * covered by the snapshot and selected by the retention check, updates
 * firstVer / writeCur / totSize accordingly, clears verInSnapshotting and
 * persists the metadata through walSaveMeta().
 *
 * Returns 0 on success or when no snapshot is in progress
 * (verInSnapshotting == -1), -1 when walSaveMeta() fails.
 */
int32_t walEndSnapshot(SWal *pWal) {
  int64_t ver = pWal->vers.verInSnapshotting;
  if (ver == -1) return 0;

  pWal->vers.snapshotVer = ver;
  int ts = taosGetTimestampSec();

  int          deleteCnt = 0;
  int64_t      newTotSize = pWal->totSize;
  SWalFileInfo tmp;
  tmp.firstVer = ver;

  // find files safe to delete
  SWalFileInfo *pInfo = taosArraySearch(pWal->fileInfoSet, &tmp, compareWalFileInfo, TD_LE);
  // The search yields NULL when no file starts at or before `ver` (e.g. an
  // empty file set); in that case there is nothing to delete.
  if (pInfo != NULL) {
    if (ver >= pInfo->lastVer) {
      // the matched file is fully covered by the snapshot as well
      pInfo++;
    }
    // iterate files, until the searched result
    // NOTE(review): the size test uses pWal->totSize rather than the running
    // newTotSize, and the time test selects files with
    // closeTs + retentionPeriod > ts; confirm both are intended.
    for (SWalFileInfo *iter = pWal->fileInfoSet->pData; iter < pInfo; iter++) {
      if (pWal->totSize > pWal->cfg.retentionSize || iter->closeTs + pWal->cfg.retentionPeriod > ts) {
        // delete according to file size or close time
        deleteCnt++;
        newTotSize -= iter->fileSize;
      }
    }
  }

  // remove the log/idx file pair of the first deleteCnt entries
  char fnameStr[WAL_FILE_LEN];
  for (int i = 0; i < deleteCnt; i++) {
    SWalFileInfo *pDel = taosArrayGet(pWal->fileInfoSet, i);
    walBuildLogName(pWal, pDel->firstVer, fnameStr);
    remove(fnameStr);
    walBuildIdxName(pWal, pDel->firstVer, fnameStr);
    remove(fnameStr);
  }

  // make new array, remove files
  taosArrayPopFrontBatch(pWal->fileInfoSet, deleteCnt);
  if (taosArrayGetSize(pWal->fileInfoSet) == 0) {
    pWal->vers.firstVer = -1;
  } else {
    pWal->vers.firstVer = ((SWalFileInfo *)taosArrayGet(pWal->fileInfoSet, 0))->firstVer;
  }
  // becomes -1 when the file set is empty
  pWal->writeCur = taosArrayGetSize(pWal->fileInfoSet) - 1;
  pWal->totSize = newTotSize;
  pWal->vers.verInSnapshotting = -1;

  // save snapshot ver, commit ver
  int code = walSaveMeta(pWal);
  if (code != 0) {
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
207
/*
 * Switch writing to a fresh index/log file pair.
 *
 * Closes the current write handles (when open), creates new files named after
 * `lastVer + 1`, registers them through walRollFileInfo(), and then makes them
 * the active write handles. lastRollSeq is refreshed on success.
 *
 * Returns 0 on success, -1 on failure. On failure no newly opened handle is
 * left open, and any write handle that was already closed is reset to -1 so
 * that pWal never keeps a stale handle.
 */
int walRoll(SWal *pWal) {
  int     code = 0;
  int64_t idxTfd = -1;
  int64_t logTfd = -1;
  char    fnameStr[WAL_FILE_LEN];

  if (pWal->writeIdxTfd != -1) {
    code = tfClose(pWal->writeIdxTfd);
    if (code != 0) {
      return -1;
    }
    pWal->writeIdxTfd = -1;  // closed: do not keep the old handle around
  }
  if (pWal->writeLogTfd != -1) {
    code = tfClose(pWal->writeLogTfd);
    if (code != 0) {
      return -1;
    }
    pWal->writeLogTfd = -1;  // closed: do not keep the old handle around
  }

  // create new file
  int64_t newFileFirstVersion = pWal->vers.lastVer + 1;
  walBuildIdxName(pWal, newFileFirstVersion, fnameStr);
  idxTfd = tfOpenCreateWriteAppend(fnameStr);
  if (idxTfd < 0) {
    ASSERT(0);
    return -1;
  }
  walBuildLogName(pWal, newFileFirstVersion, fnameStr);
  logTfd = tfOpenCreateWriteAppend(fnameStr);
  if (logTfd < 0) {
    ASSERT(0);
    tfClose(idxTfd);  // do not leak the index handle opened above
    return -1;
  }
  code = walRollFileInfo(pWal);
  if (code != 0) {
    ASSERT(0);
    tfClose(logTfd);
    tfClose(idxTfd);
    return -1;
  }

  // switch file
  pWal->writeIdxTfd = idxTfd;
  pWal->writeLogTfd = logTfd;
  pWal->writeCur = taosArrayGetSize(pWal->fileInfoSet) - 1;
  ASSERT(pWal->writeCur >= 0);

  pWal->lastRollSeq = walGetSeq();
  return 0;
}

L
Liu Jicong 已提交
253
/*
 * Append one (ver, offset) index entry to the current index file.
 *
 * Returns 0 when the whole entry was written; otherwise sets terrno from
 * errno and returns -1.
 */
static int walWriteIndex(SWal *pWal, int64_t ver, int64_t offset) {
  SWalIdxEntry idxEntry = {.ver = ver, .offset = offset};

  int written = tfWrite(pWal->writeIdxTfd, &idxEntry, sizeof(SWalIdxEntry));
  if (written == sizeof(SWalIdxEntry)) {
    return 0;
  }

  terrno = TAOS_SYSTEM_ERROR(errno);
  // TODO truncate
  return -1;
}

L
Liu Jicong 已提交
264
/*
 * Append one record (header + body) to the WAL and index it.
 *
 * pWal     WAL handle; NULL yields -1.
 * index    version of the record; must be exactly lastVer + 1.
 * msgType  message type stored in the record header.
 * body     record payload, `bodyLen` bytes.
 *
 * Returns 0 on success, or immediately when cfg.level is TAOS_WAL_NOLOG.
 * Returns -1 when `index` would skip or rewrite a version, when rolling to a
 * new file fails, or when writing the header, body or index entry fails
 * (terrno is set from errno for the write failures).
 *
 * The mutex is released on every path that acquired it, and a failed record
 * write is reported instead of being followed by an index entry.
 */
int64_t walWrite(SWal *pWal, int64_t index, uint8_t msgType, const void *body, int32_t bodyLen) {
  if (pWal == NULL) return -1;
  int code = 0;

  // no wal
  if (pWal->cfg.level == TAOS_WAL_NOLOG) return 0;

  if (index != pWal->vers.lastVer + 1) {
    // reject skip log or rewrite log
    // must truncate explicitly first
    return -1;
  }

  if (taosArrayGetSize(pWal->fileInfoSet) == 0) {
    // first record ever: create the first file pair
    pWal->vers.firstVer = index;
    code = walRoll(pWal);
    ASSERT(code == 0);
    if (code != 0) {
      return -1;
    }
  } else {
    int64_t passed = walGetSeq() - pWal->lastRollSeq;
    if (pWal->cfg.rollPeriod != -1 && pWal->cfg.rollPeriod != 0 && passed > pWal->cfg.rollPeriod) {
      if (walRoll(pWal) != 0) {
        return -1;
      }
    } else if (pWal->cfg.segSize != -1 && pWal->cfg.segSize != 0 && walGetLastFileSize(pWal) > pWal->cfg.segSize) {
      if (walRoll(pWal) != 0) {
        return -1;
      }
    }
  }
  /*if (!tfValid(pWal->writeLogTfd)) return -1;*/

  ASSERT(pWal->writeCur >= 0);

  pthread_mutex_lock(&pWal->mutex);
  if (pWal->writeIdxTfd == -1 || pWal->writeLogTfd == -1) {
    walChangeFileToLast(pWal);
  }

  pWal->writeHead.head.version = index;

  // offset of this record in the log file, captured before anything is written
  int64_t offset = walGetCurFileOffset(pWal);
  pWal->writeHead.head.len = bodyLen;
  pWal->writeHead.head.msgType = msgType;
  pWal->writeHead.cksumHead = walCalcHeadCksum(&pWal->writeHead);
  pWal->writeHead.cksumBody = walCalcBodyCksum(body, bodyLen);

  if (tfWrite(pWal->writeLogTfd, &pWal->writeHead, sizeof(SWalHead)) != sizeof(SWalHead)) {
    // TODO: ftruncate the partially written record
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, file:%" PRId64 ".log, failed to write since %s", pWal->cfg.vgId, walGetLastFileFirstVer(pWal),
           strerror(errno));
    goto _err;
  }

  if (tfWrite(pWal->writeLogTfd, (char *)body, bodyLen) != bodyLen) {
    // TODO: ftruncate the partially written record
    terrno = TAOS_SYSTEM_ERROR(errno);
    wError("vgId:%d, file:%" PRId64 ".log, failed to write since %s", pWal->cfg.vgId, walGetLastFileFirstVer(pWal),
           strerror(errno));
    goto _err;
  }

  // walWriteIndex() sets terrno itself on failure
  if (walWriteIndex(pWal, index, offset) != 0) {
    // TODO
    goto _err;
  }

  // set status
  pWal->vers.lastVer = index;
  pWal->totSize += sizeof(SWalHead) + bodyLen;
  walGetCurFileInfo(pWal)->lastVer = index;
  walGetCurFileInfo(pWal)->fileSize += sizeof(SWalHead) + bodyLen;

  pthread_mutex_unlock(&pWal->mutex);
  return 0;

_err:
  pthread_mutex_unlock(&pWal->mutex);
  return -1;
}

L
Liu Jicong 已提交
337
/*
 * Flush the current log file to stable storage.
 *
 * The fsync is performed when `forceFsync` is true, or when cfg.level is
 * TAOS_WAL_FSYNC and cfg.fsyncPeriod is 0. A failed fsync is only logged.
 */
void walFsync(SWal *pWal, bool forceFsync) {
  // Nothing to do unless forced or configured for sync-on-every-call.
  if (!forceFsync && (pWal->cfg.level != TAOS_WAL_FSYNC || pWal->cfg.fsyncPeriod != 0)) {
    return;
  }

  wTrace("vgId:%d, fileId:%" PRId64 ".log, do fsync", pWal->cfg.vgId, walGetCurFileFirstVer(pWal));

  if (tfFsync(pWal->writeLogTfd) >= 0) {
    return;
  }

  wError("vgId:%d, file:%" PRId64 ".log, fsync failed since %s", pWal->cfg.vgId, walGetCurFileFirstVer(pWal),
         strerror(errno));
}

L
Liu Jicong 已提交
347
/*static int walValidateOffset(SWal* pWal, int64_t ver) {*/
L
Liu Jicong 已提交
348 349 350 351 352 353 354
/*int code = 0;*/
/*SWalHead *pHead = NULL;*/
/*code = (int)walRead(pWal, &pHead, ver);*/
/*if(pHead->head.version != ver) {*/
/*return -1;*/
/*}*/
/*return 0;*/
L
Liu Jicong 已提交
355
/*}*/
L
Liu Jicong 已提交
356

L
Liu Jicong 已提交
357
/*static int64_t walGetOffset(SWal* pWal, int64_t ver) {*/
L
Liu Jicong 已提交
358 359 360 361
/*int code = walSeekVer(pWal, ver);*/
/*if(code != 0) {*/
/*return -1;*/
/*}*/
L
Liu Jicong 已提交
362

L
Liu Jicong 已提交
363 364 365 366
/*code = walValidateOffset(pWal, ver);*/
/*if(code != 0) {*/
/*return -1;*/
/*}*/
L
Liu Jicong 已提交
367

L
Liu Jicong 已提交
368
/*return 0;*/
L
Liu Jicong 已提交
369
/*}*/