mndTrans.c 53.6 KB
Newer Older
S
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17
#include "mndTrans.h"
S
Shengliang Guan 已提交
18
#include "mndAuth.h"
L
Liu Jicong 已提交
19
#include "mndConsumer.h"
S
Shengliang Guan 已提交
20
#include "mndDb.h"
S
Shengliang Guan 已提交
21
#include "mndShow.h"
S
Shengliang Guan 已提交
22
#include "mndSync.h"
S
Shengliang Guan 已提交
23
#include "mndUser.h"
S
Shengliang Guan 已提交
24

25 26
#define TRANS_VER_NUMBER   1
#define TRANS_ARRAY_SIZE   8
S
Shengliang Guan 已提交
27
#define TRANS_RESERVE_SIZE 64
S
Shengliang Guan 已提交
28

S
Shengliang Guan 已提交
29 30 31
static SSdbRaw *mndTransActionEncode(STrans *pTrans);
static SSdbRow *mndTransActionDecode(SSdbRaw *pRaw);
static int32_t  mndTransActionInsert(SSdb *pSdb, STrans *pTrans);
S
Shengliang Guan 已提交
32
static int32_t  mndTransActionUpdate(SSdb *pSdb, STrans *OldTrans, STrans *pOld);
33
static int32_t  mndTransActionDelete(SSdb *pSdb, STrans *pTrans, bool callFunc);
S
Shengliang Guan 已提交
34

S
Shengliang Guan 已提交
35
static int32_t mndTransAppendLog(SArray *pArray, SSdbRaw *pRaw);
S
Shengliang Guan 已提交
36
static int32_t mndTransAppendAction(SArray *pArray, STransAction *pAction);
S
Shengliang Guan 已提交
37 38
static void    mndTransDropLogs(SArray *pArray);
static void    mndTransDropActions(SArray *pArray);
39
static void    mndTransDropData(STrans *pTrans);
40
static int32_t mndTransExecuteActions(SMnode *pMnode, STrans *pTrans, SArray *pArray);
S
Shengliang Guan 已提交
41 42 43 44
static int32_t mndTransExecuteRedoLogs(SMnode *pMnode, STrans *pTrans);
static int32_t mndTransExecuteUndoLogs(SMnode *pMnode, STrans *pTrans);
static int32_t mndTransExecuteRedoActions(SMnode *pMnode, STrans *pTrans);
static int32_t mndTransExecuteUndoActions(SMnode *pMnode, STrans *pTrans);
45
static int32_t mndTransExecuteCommitActions(SMnode *pMnode, STrans *pTrans);
S
Shengliang Guan 已提交
46 47 48 49 50
static bool    mndTransPerformPrepareStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformRedoLogStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformRedoActionStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformUndoLogStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformUndoActionStage(SMnode *pMnode, STrans *pTrans);
51
static bool    mndTransPerformCommitActionStage(SMnode *pMnode, STrans *pTrans);
S
Shengliang Guan 已提交
52 53 54
static bool    mndTransPerformCommitStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformRollbackStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerfromFinishedStage(SMnode *pMnode, STrans *pTrans);
55
static bool    mndCannotExecuteTransAction(SMnode *pMnode) { return !pMnode->deploy && !mndIsMaster(pMnode); }
S
Shengliang Guan 已提交
56

57
static void    mndTransSendRpcRsp(SMnode *pMnode, STrans *pTrans);
S
Shengliang Guan 已提交
58 59
static int32_t mndProcessTransReq(SRpcMsg *pReq);
static int32_t mndProcessKillTransReq(SRpcMsg *pReq);
S
Shengliang Guan 已提交
60

S
Shengliang Guan 已提交
61
static int32_t mndRetrieveTrans(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
S
Shengliang Guan 已提交
62 63
static void    mndCancelGetNextTrans(SMnode *pMnode, void *pIter);

S
Shengliang Guan 已提交
64
/*
 * Hook the transaction module into the mnode: install the message handlers
 * and the show-table handlers, then register the SDB_TRANS table with its
 * encode/decode/insert/update/delete callbacks.
 *
 * Returns whatever sdbSetTable() returns.
 */
int32_t mndInitTrans(SMnode *pMnode) {
  SSdbTable transTable = {0};
  transTable.sdbType = SDB_TRANS;
  transTable.keyType = SDB_KEY_INT32;
  transTable.encodeFp = (SdbEncodeFp)mndTransActionEncode;
  transTable.decodeFp = (SdbDecodeFp)mndTransActionDecode;
  transTable.insertFp = (SdbInsertFp)mndTransActionInsert;
  transTable.updateFp = (SdbUpdateFp)mndTransActionUpdate;
  transTable.deleteFp = (SdbDeleteFp)mndTransActionDelete;

  // Request handlers.
  mndSetMsgHandle(pMnode, TDMT_MND_TRANS_TIMER, mndProcessTransReq);
  mndSetMsgHandle(pMnode, TDMT_MND_KILL_TRANS, mndProcessKillTransReq);

  // Handlers backing the transaction show table.
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_TRANS, mndRetrieveTrans);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_TRANS, mndCancelGetNextTrans);

  return sdbSetTable(pMnode->pSdb, transTable);
}

/* Counterpart of mndInitTrans(); currently there is nothing to release. */
void mndCleanupTrans(SMnode *pMnode) {
  (void)pMnode;
}

85 86 87
/*
 * Upper bound, in bytes, of the space needed to serialize every action stored
 * in pArray. The result is only used to size the raw buffer; the real length
 * is recorded separately by the encoder.
 *
 * Every action, whatever its type, is serialized with a fixed set of fields
 * (id, errCode, acceptableCode, actionType, stage, ...), so sizeof(STransAction)
 * is reserved for each of them -- this assumes the struct is at least as large
 * as the sum of its serialized fields. On top of that comes the
 * variable-length payload: the embedded raw for RAW actions, the message body
 * for MSG actions.
 */
static int32_t mndTransGetActionsSize(SArray *pArray) {
  int32_t actionNum = taosArrayGetSize(pArray);
  int32_t rawDataLen = 0;

  for (int32_t i = 0; i < actionNum; ++i) {
    STransAction *pAction = taosArrayGet(pArray, i);

    // Fixed-size part, reserved for every action type (including NULL actions).
    rawDataLen += (int32_t)sizeof(STransAction);

    // Variable-size payload.
    if (pAction->actionType == TRANS_ACTION_RAW) {
      rawDataLen += sdbGetRawTotalSize(pAction->pRaw);
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
      rawDataLen += pAction->contLen;
    } else {
      // no payload
    }

    rawDataLen += sizeof(int8_t);
  }

  return rawDataLen;
}
S
Shengliang Guan 已提交
103

104 105
static SSdbRaw *mndTransActionEncode(STrans *pTrans) {
  terrno = TSDB_CODE_OUT_OF_MEMORY;
S
Shengliang Guan 已提交
106

107 108 109 110
  int32_t rawDataLen = sizeof(STrans) + TRANS_RESERVE_SIZE;
  rawDataLen += mndTransGetActionsSize(pTrans->redoActions);
  rawDataLen += mndTransGetActionsSize(pTrans->undoActions);
  rawDataLen += mndTransGetActionsSize(pTrans->commitActions);
S
Shengliang Guan 已提交
111

S
Shengliang Guan 已提交
112
  SSdbRaw *pRaw = sdbAllocRaw(SDB_TRANS, TRANS_VER_NUMBER, rawDataLen);
S
Shengliang Guan 已提交
113
  if (pRaw == NULL) {
S
Shengliang Guan 已提交
114
    mError("trans:%d, failed to alloc raw since %s", pTrans->id, terrstr());
S
Shengliang Guan 已提交
115 116 117 118
    return NULL;
  }

  int32_t dataPos = 0;
119
  SDB_SET_INT32(pRaw, dataPos, pTrans->id, _OVER)
S
Shengliang Guan 已提交
120 121 122 123
  SDB_SET_INT8(pRaw, dataPos, pTrans->stage, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pTrans->policy, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pTrans->conflict, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pTrans->exec, _OVER)
124
  SDB_SET_INT64(pRaw, dataPos, pTrans->createdTime, _OVER)
125 126
  SDB_SET_BINARY(pRaw, dataPos, pTrans->dbname1, TSDB_DB_FNAME_LEN, _OVER)
  SDB_SET_BINARY(pRaw, dataPos, pTrans->dbname2, TSDB_DB_FNAME_LEN, _OVER)
127
  SDB_SET_INT32(pRaw, dataPos, pTrans->redoActionPos, _OVER)
128 129 130 131

  int32_t redoActionNum = taosArrayGetSize(pTrans->redoActions);
  int32_t undoActionNum = taosArrayGetSize(pTrans->undoActions);
  int32_t commitActionNum = taosArrayGetSize(pTrans->commitActions);
132 133
  SDB_SET_INT32(pRaw, dataPos, redoActionNum, _OVER)
  SDB_SET_INT32(pRaw, dataPos, undoActionNum, _OVER)
134
  SDB_SET_INT32(pRaw, dataPos, commitActionNum, _OVER)
S
Shengliang Guan 已提交
135

S
Shengliang Guan 已提交
136 137
  for (int32_t i = 0; i < redoActionNum; ++i) {
    STransAction *pAction = taosArrayGet(pTrans->redoActions, i);
138 139 140
    SDB_SET_INT32(pRaw, dataPos, pAction->id, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->errCode, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->acceptableCode, _OVER)
141
    SDB_SET_INT8(pRaw, dataPos, pAction->actionType, _OVER)
142
    SDB_SET_INT8(pRaw, dataPos, pAction->stage, _OVER)
143
    if (pAction->actionType == TRANS_ACTION_RAW) {
144
      int32_t len = sdbGetRawTotalSize(pAction->pRaw);
145
      SDB_SET_INT8(pRaw, dataPos, pAction->rawWritten, _OVER)
146 147
      SDB_SET_INT32(pRaw, dataPos, len, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, (void *)pAction->pRaw, len, _OVER)
148
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
149 150
      SDB_SET_BINARY(pRaw, dataPos, (void *)&pAction->epSet, sizeof(SEpSet), _OVER)
      SDB_SET_INT16(pRaw, dataPos, pAction->msgType, _OVER)
151 152
      SDB_SET_INT8(pRaw, dataPos, pAction->msgSent, _OVER)
      SDB_SET_INT8(pRaw, dataPos, pAction->msgReceived, _OVER)
153 154
      SDB_SET_INT32(pRaw, dataPos, pAction->contLen, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, pAction->pCont, pAction->contLen, _OVER)
155 156
    } else {
      // nothing
157
    }
S
Shengliang Guan 已提交
158 159 160 161
  }

  for (int32_t i = 0; i < undoActionNum; ++i) {
    STransAction *pAction = taosArrayGet(pTrans->undoActions, i);
162 163 164
    SDB_SET_INT32(pRaw, dataPos, pAction->id, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->errCode, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->acceptableCode, _OVER)
165
    SDB_SET_INT8(pRaw, dataPos, pAction->actionType, _OVER)
166
    SDB_SET_INT8(pRaw, dataPos, pAction->stage, _OVER)
167
    if (pAction->actionType == TRANS_ACTION_RAW) {
168
      int32_t len = sdbGetRawTotalSize(pAction->pRaw);
169
      SDB_SET_INT8(pRaw, dataPos, pAction->rawWritten, _OVER)
170 171
      SDB_SET_INT32(pRaw, dataPos, len, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, (void *)pAction->pRaw, len, _OVER)
172
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
173 174
      SDB_SET_BINARY(pRaw, dataPos, (void *)&pAction->epSet, sizeof(SEpSet), _OVER)
      SDB_SET_INT16(pRaw, dataPos, pAction->msgType, _OVER)
175 176
      SDB_SET_INT8(pRaw, dataPos, pAction->msgSent, _OVER)
      SDB_SET_INT8(pRaw, dataPos, pAction->msgReceived, _OVER)
177 178
      SDB_SET_INT32(pRaw, dataPos, pAction->contLen, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, pAction->pCont, pAction->contLen, _OVER)
179 180
    } else {
      // nothing
181 182 183 184 185
    }
  }

  for (int32_t i = 0; i < commitActionNum; ++i) {
    STransAction *pAction = taosArrayGet(pTrans->commitActions, i);
186 187 188
    SDB_SET_INT32(pRaw, dataPos, pAction->id, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->errCode, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->acceptableCode, _OVER)
189
    SDB_SET_INT8(pRaw, dataPos, pAction->actionType, _OVER)
190
    SDB_SET_INT8(pRaw, dataPos, pAction->stage, _OVER)
191
    if (pAction->actionType == TRANS_ACTION_RAW) {
192
      int32_t len = sdbGetRawTotalSize(pAction->pRaw);
193
      SDB_SET_INT8(pRaw, dataPos, pAction->rawWritten, _OVER)
194 195
      SDB_SET_INT32(pRaw, dataPos, len, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, (void *)pAction->pRaw, len, _OVER)
196
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
197 198
      SDB_SET_BINARY(pRaw, dataPos, (void *)&pAction->epSet, sizeof(SEpSet), _OVER)
      SDB_SET_INT16(pRaw, dataPos, pAction->msgType, _OVER)
199 200
      SDB_SET_INT8(pRaw, dataPos, pAction->msgSent, _OVER)
      SDB_SET_INT8(pRaw, dataPos, pAction->msgReceived, _OVER)
201 202
      SDB_SET_INT32(pRaw, dataPos, pAction->contLen, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, pAction->pCont, pAction->contLen, _OVER)
203 204
    } else {
      // nothing
205
    }
206 207
  }

208 209 210
  SDB_SET_INT32(pRaw, dataPos, pTrans->startFunc, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pTrans->stopFunc, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pTrans->paramLen, _OVER)
211
  if (pTrans->param != NULL) {
212
    SDB_SET_BINARY(pRaw, dataPos, pTrans->param, pTrans->paramLen, _OVER)
213 214
  }

215 216
  SDB_SET_RESERVE(pRaw, dataPos, TRANS_RESERVE_SIZE, _OVER)
  SDB_SET_DATALEN(pRaw, dataPos, _OVER)
217 218 219

  terrno = 0;

220
_OVER:
221 222 223 224
  if (terrno != 0) {
    mError("trans:%d, failed to encode to raw:%p len:%d since %s", pTrans->id, pRaw, dataPos, terrstr());
    sdbFreeRaw(pRaw);
    return NULL;
S
Shengliang Guan 已提交
225 226
  }

S
Shengliang Guan 已提交
227
  mTrace("trans:%d, encode to raw:%p, row:%p len:%d", pTrans->id, pRaw, pTrans, dataPos);
S
Shengliang Guan 已提交
228 229 230
  return pRaw;
}

S
Shengliang Guan 已提交
231
static SSdbRow *mndTransActionDecode(SSdbRaw *pRaw) {
232 233
  terrno = TSDB_CODE_OUT_OF_MEMORY;

234 235 236
  SSdbRow     *pRow = NULL;
  STrans      *pTrans = NULL;
  char        *pData = NULL;
237 238 239 240
  int32_t      dataLen = 0;
  int8_t       sver = 0;
  int32_t      redoActionNum = 0;
  int32_t      undoActionNum = 0;
241
  int32_t      commitActionNum = 0;
242 243 244
  int32_t      dataPos = 0;
  STransAction action = {0};

S
Shengliang Guan 已提交
245
  if (sdbGetRawSoftVer(pRaw, &sver) != 0) goto _OVER;
S
Shengliang Guan 已提交
246

S
Shengliang Guan 已提交
247
  if (sver != TRANS_VER_NUMBER) {
S
Shengliang Guan 已提交
248
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
S
Shengliang Guan 已提交
249
    goto _OVER;
S
Shengliang Guan 已提交
250 251
  }

252
  pRow = sdbAllocRow(sizeof(STrans));
S
Shengliang Guan 已提交
253
  if (pRow == NULL) goto _OVER;
254 255

  pTrans = sdbGetRowObj(pRow);
S
Shengliang Guan 已提交
256
  if (pTrans == NULL) goto _OVER;
S
Shengliang Guan 已提交
257

S
Shengliang Guan 已提交
258
  SDB_GET_INT32(pRaw, dataPos, &pTrans->id, _OVER)
S
Shengliang Guan 已提交
259

S
Shengliang Guan 已提交
260 261 262 263 264 265 266 267 268
  int8_t stage = 0;
  int8_t policy = 0;
  int8_t conflict = 0;
  int8_t exec = 0;
  int8_t actionType = 0;
  SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &policy, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &conflict, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &exec, _OVER)
S
Shengliang Guan 已提交
269
  pTrans->stage = stage;
270
  pTrans->policy = policy;
271 272
  pTrans->conflict = conflict;
  pTrans->exec = exec;
S
Shengliang Guan 已提交
273
  SDB_GET_INT64(pRaw, dataPos, &pTrans->createdTime, _OVER)
274 275
  SDB_GET_BINARY(pRaw, dataPos, pTrans->dbname1, TSDB_DB_FNAME_LEN, _OVER)
  SDB_GET_BINARY(pRaw, dataPos, pTrans->dbname2, TSDB_DB_FNAME_LEN, _OVER)
276
  SDB_GET_INT32(pRaw, dataPos, &pTrans->redoActionPos, _OVER)
S
Shengliang Guan 已提交
277 278
  SDB_GET_INT32(pRaw, dataPos, &redoActionNum, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &undoActionNum, _OVER)
279
  SDB_GET_INT32(pRaw, dataPos, &commitActionNum, _OVER)
S
Shengliang Guan 已提交
280

S
Shengliang Guan 已提交
281 282
  pTrans->redoActions = taosArrayInit(redoActionNum, sizeof(STransAction));
  pTrans->undoActions = taosArrayInit(undoActionNum, sizeof(STransAction));
283
  pTrans->commitActions = taosArrayInit(commitActionNum, sizeof(STransAction));
S
Shengliang Guan 已提交
284

S
Shengliang Guan 已提交
285 286
  if (pTrans->redoActions == NULL) goto _OVER;
  if (pTrans->undoActions == NULL) goto _OVER;
287
  if (pTrans->commitActions == NULL) goto _OVER;
S
Shengliang Guan 已提交
288 289

  for (int32_t i = 0; i < redoActionNum; ++i) {
290 291 292
    SDB_GET_INT32(pRaw, dataPos, &action.id, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.errCode, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.acceptableCode, _OVER)
293 294
    SDB_GET_INT8(pRaw, dataPos, &actionType, _OVER)
    action.actionType = actionType;
S
Shengliang Guan 已提交
295 296
    SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
    action.stage = stage;
297
    if (action.actionType == TRANS_ACTION_RAW) {
298
      SDB_GET_INT8(pRaw, dataPos, &action.rawWritten, _OVER)
299
      SDB_GET_INT32(pRaw, dataPos, &dataLen, _OVER)
300 301
      action.pRaw = taosMemoryMalloc(dataLen);
      if (action.pRaw == NULL) goto _OVER;
S
Shengliang Guan 已提交
302
      // mTrace("raw:%p, is created", pData);
303 304 305
      SDB_GET_BINARY(pRaw, dataPos, (void *)action.pRaw, dataLen, _OVER);
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
      action.pRaw = NULL;
306
    } else if (action.actionType == TRANS_ACTION_MSG) {
307 308
      SDB_GET_BINARY(pRaw, dataPos, (void *)&action.epSet, sizeof(SEpSet), _OVER);
      SDB_GET_INT16(pRaw, dataPos, &action.msgType, _OVER)
309 310
      SDB_GET_INT8(pRaw, dataPos, &action.msgSent, _OVER)
      SDB_GET_INT8(pRaw, dataPos, &action.msgReceived, _OVER)
311 312 313 314 315 316
      SDB_GET_INT32(pRaw, dataPos, &action.contLen, _OVER)
      action.pCont = taosMemoryMalloc(action.contLen);
      if (action.pCont == NULL) goto _OVER;
      SDB_GET_BINARY(pRaw, dataPos, action.pCont, action.contLen, _OVER);
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
      action.pCont = NULL;
317 318
    } else {
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
319
    }
S
Shengliang Guan 已提交
320 321 322
  }

  for (int32_t i = 0; i < undoActionNum; ++i) {
323 324 325
    SDB_GET_INT32(pRaw, dataPos, &action.id, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.errCode, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.acceptableCode, _OVER)
326 327
    SDB_GET_INT8(pRaw, dataPos, &actionType, _OVER)
    action.actionType = actionType;
S
Shengliang Guan 已提交
328 329
    SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
    action.stage = stage;
330
    if (action.actionType == TRANS_ACTION_RAW) {
331
      SDB_GET_INT8(pRaw, dataPos, &action.rawWritten, _OVER)
332
      SDB_GET_INT32(pRaw, dataPos, &dataLen, _OVER)
333 334
      action.pRaw = taosMemoryMalloc(dataLen);
      if (action.pRaw == NULL) goto _OVER;
S
Shengliang Guan 已提交
335
      // mTrace("raw:%p, is created", action.pRaw);
336 337 338
      SDB_GET_BINARY(pRaw, dataPos, (void *)action.pRaw, dataLen, _OVER);
      if (taosArrayPush(pTrans->undoActions, &action) == NULL) goto _OVER;
      action.pRaw = NULL;
339
    } else if (action.actionType == TRANS_ACTION_MSG) {
340 341
      SDB_GET_BINARY(pRaw, dataPos, (void *)&action.epSet, sizeof(SEpSet), _OVER);
      SDB_GET_INT16(pRaw, dataPos, &action.msgType, _OVER)
342 343
      SDB_GET_INT8(pRaw, dataPos, &action.msgSent, _OVER)
      SDB_GET_INT8(pRaw, dataPos, &action.msgReceived, _OVER)
344 345 346 347 348 349
      SDB_GET_INT32(pRaw, dataPos, &action.contLen, _OVER)
      action.pCont = taosMemoryMalloc(action.contLen);
      if (action.pCont == NULL) goto _OVER;
      SDB_GET_BINARY(pRaw, dataPos, action.pCont, action.contLen, _OVER);
      if (taosArrayPush(pTrans->undoActions, &action) == NULL) goto _OVER;
      action.pCont = NULL;
350 351
    } else {
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
352 353 354 355
    }
  }

  for (int32_t i = 0; i < commitActionNum; ++i) {
356 357 358
    SDB_GET_INT32(pRaw, dataPos, &action.id, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.errCode, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.acceptableCode, _OVER)
359 360
    SDB_GET_INT8(pRaw, dataPos, &actionType, _OVER)
    action.actionType = actionType;
S
Shengliang Guan 已提交
361 362
    SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
    action.stage = stage;
363
    if (action.actionType) {
364
      SDB_GET_INT8(pRaw, dataPos, &action.rawWritten, _OVER)
365
      SDB_GET_INT32(pRaw, dataPos, &dataLen, _OVER)
366 367
      action.pRaw = taosMemoryMalloc(dataLen);
      if (action.pRaw == NULL) goto _OVER;
S
Shengliang Guan 已提交
368
      // mTrace("raw:%p, is created", action.pRaw);
369 370 371
      SDB_GET_BINARY(pRaw, dataPos, (void *)action.pRaw, dataLen, _OVER);
      if (taosArrayPush(pTrans->commitActions, &action) == NULL) goto _OVER;
      action.pRaw = NULL;
372
    } else if (action.actionType == TRANS_ACTION_MSG) {
373 374
      SDB_GET_BINARY(pRaw, dataPos, (void *)&action.epSet, sizeof(SEpSet), _OVER);
      SDB_GET_INT16(pRaw, dataPos, &action.msgType, _OVER)
375 376
      SDB_GET_INT8(pRaw, dataPos, &action.msgSent, _OVER)
      SDB_GET_INT8(pRaw, dataPos, &action.msgReceived, _OVER)
377 378 379 380 381 382
      SDB_GET_INT32(pRaw, dataPos, &action.contLen, _OVER)
      action.pCont = taosMemoryMalloc(action.contLen);
      if (action.pCont == NULL) goto _OVER;
      SDB_GET_BINARY(pRaw, dataPos, action.pCont, action.contLen, _OVER);
      if (taosArrayPush(pTrans->commitActions, &action) == NULL) goto _OVER;
      action.pCont = NULL;
383 384
    } else {
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
385
    }
S
Shengliang Guan 已提交
386 387
  }

S
Shengliang Guan 已提交
388 389 390
  SDB_GET_INT32(pRaw, dataPos, &pTrans->startFunc, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pTrans->stopFunc, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pTrans->paramLen, _OVER)
391 392
  if (pTrans->paramLen != 0) {
    pTrans->param = taosMemoryMalloc(pTrans->paramLen);
S
Shengliang Guan 已提交
393
    SDB_GET_BINARY(pRaw, dataPos, pTrans->param, pTrans->paramLen, _OVER);
394 395
  }

S
Shengliang Guan 已提交
396
  SDB_GET_RESERVE(pRaw, dataPos, TRANS_RESERVE_SIZE, _OVER)
397 398

  terrno = 0;
S
Shengliang Guan 已提交
399

S
Shengliang Guan 已提交
400
_OVER:
401 402 403
  if (terrno != 0) {
    mError("trans:%d, failed to parse from raw:%p since %s", pTrans->id, pRaw, terrstr());
    mndTransDropData(pTrans);
wafwerar's avatar
wafwerar 已提交
404 405
    taosMemoryFreeClear(pRow);
    taosMemoryFreeClear(action.pCont);
S
Shengliang Guan 已提交
406 407 408
    return NULL;
  }

S
Shengliang Guan 已提交
409
  mTrace("trans:%d, decode from raw:%p, row:%p", pTrans->id, pRaw, pTrans);
S
Shengliang Guan 已提交
410 411 412
  return pRow;
}

S
Shengliang Guan 已提交
413 414 415 416 417 418 419 420
/* Human-readable name of a transaction stage, used in log messages. */
static const char *mndTransStr(ETrnStage stage) {
  const char *name = "invalid";

  switch (stage) {
    case TRN_STAGE_PREPARE:
      name = "prepare";
      break;
    case TRN_STAGE_REDO_ACTION:
      name = "redoAction";
      break;
    case TRN_STAGE_ROLLBACK:
      name = "rollback";
      break;
    case TRN_STAGE_UNDO_ACTION:
      name = "undoAction";
      break;
    case TRN_STAGE_COMMIT:
      name = "commit";
      break;
    case TRN_STAGE_COMMIT_ACTION:
      name = "commitAction";
      break;
    case TRN_STAGE_FINISHED:
      name = "finished";
      break;
    default:
      break;
  }

  return name;
}

434 435 436 437 438 439 440 441
/* Test start callback: logs the parameter (printed as a C string) and its length. */
static void mndTransTestStartFunc(SMnode *pMnode, void *param, int32_t paramLen) {
  char *text = (char *)param;
  mInfo("test trans start, param:%s, len:%d", text, paramLen);
}

/* Test stop callback: logs the parameter (printed as a C string) and its length. */
static void mndTransTestStopFunc(SMnode *pMnode, void *param, int32_t paramLen) {
  char *text = (char *)param;
  mInfo("test trans stop, param:%s, len:%d", text, paramLen);
}

S
Shengliang Guan 已提交
442
/* Map a callback identifier to its function; NULL when the id is not known. */
static TransCbFp mndTransGetCbFp(ETrnFunc ftype) {
  TransCbFp callback = NULL;

  switch (ftype) {
    case TRANS_START_FUNC_TEST:
      callback = mndTransTestStartFunc;
      break;
    case TRANS_STOP_FUNC_TEST:
      callback = mndTransTestStopFunc;
      break;
    case TRANS_START_FUNC_MQ_REB:
      callback = mndRebCntInc;
      break;
    case TRANS_STOP_FUNC_MQ_REB:
      callback = mndRebCntDec;
      break;
    default:
      break;
  }

  return callback;
}

S
Shengliang Guan 已提交
457
/*
 * SDB insert callback for a transaction row. If the transaction carries a
 * start-callback id that resolves to a function, that function is invoked
 * with the transaction's parameter blob. Always returns 0.
 */
static int32_t mndTransActionInsert(SSdb *pSdb, STrans *pTrans) {
  mTrace("trans:%d, perform insert action, row:%p stage:%s", pTrans->id, pTrans, mndTransStr(pTrans->stage));

  if (pTrans->startFunc <= 0) {
    return 0;
  }

  TransCbFp startCb = mndTransGetCbFp(pTrans->startFunc);
  if (startCb != NULL) {
    startCb(pSdb->pMnode, pTrans->param, pTrans->paramLen);
  }

  return 0;
}

470
/*
 * Release everything a transaction object owns: the three action arrays
 * (including the action payloads), the pending rpc response and the callback
 * parameter. The STrans itself is not freed.
 *
 * Every released pointer is reset so the object never keeps a dangling
 * reference to freed memory.
 */
static void mndTransDropData(STrans *pTrans) {
  mndTransDropActions(pTrans->redoActions);
  pTrans->redoActions = NULL;
  mndTransDropActions(pTrans->undoActions);
  pTrans->undoActions = NULL;
  mndTransDropActions(pTrans->commitActions);
  pTrans->commitActions = NULL;

  if (pTrans->rpcRsp != NULL) {
    taosMemoryFree(pTrans->rpcRsp);
    pTrans->rpcRsp = NULL;
    pTrans->rpcRspLen = 0;
  }
  if (pTrans->param != NULL) {
    taosMemoryFree(pTrans->param);
    pTrans->param = NULL;
    pTrans->paramLen = 0;
  }
}
S
Shengliang Guan 已提交
485

486
/*
 * SDB delete callback for a transaction row. When callFunc is set and the
 * transaction carries a stop-callback id that resolves to a function, that
 * function is invoked first; then all data owned by the transaction is
 * released. Always returns 0.
 */
static int32_t mndTransActionDelete(SSdb *pSdb, STrans *pTrans, bool callFunc) {
  mTrace("trans:%d, perform delete action, row:%p stage:%s callfunc:%d", pTrans->id, pTrans, mndTransStr(pTrans->stage),
         callFunc);

  TransCbFp stopCb = NULL;
  if (pTrans->stopFunc > 0 && callFunc) {
    stopCb = mndTransGetCbFp(pTrans->stopFunc);
  }
  if (stopCb != NULL) {
    stopCb(pSdb->pMnode, pTrans->param, pTrans->paramLen);
  }

  mndTransDropData(pTrans);
  return 0;
}

500 501 502 503 504 505 506 507
/*
 * Copy the progress fields (rawWritten, msgSent, msgReceived, errCode) of
 * every action in pNewArray onto the action at the same index in pOldArray.
 * The iteration count is taken from pOldArray.
 */
static void mndTransUpdateActions(SArray *pOldArray, SArray *pNewArray) {
  int32_t idx = 0;
  while (idx < taosArrayGetSize(pOldArray)) {
    STransAction *pDst = taosArrayGet(pOldArray, idx);
    STransAction *pSrc = taosArrayGet(pNewArray, idx);

    pDst->rawWritten = pSrc->rawWritten;
    pDst->msgSent = pSrc->msgSent;
    pDst->msgReceived = pSrc->msgReceived;
    pDst->errCode = pSrc->errCode;

    ++idx;
  }
}
510

511
/*
 * SDB update callback: merge the state of the incoming row (pNew) into the
 * row already held in the sdb (pOld).
 *
 * The per-action progress flags, the stage and the redo position are taken
 * from pNew. Two stages are advanced on update: commit becomes commitAction
 * and rollback becomes undoAction.
 *
 * Always returns 0.
 */
static int32_t mndTransActionUpdate(SSdb *pSdb, STrans *pOld, STrans *pNew) {
  mTrace("trans:%d, perform update action, old row:%p stage:%s, new row:%p stage:%s", pOld->id, pOld,
         mndTransStr(pOld->stage), pNew, mndTransStr(pNew->stage));
  mndTransUpdateActions(pOld->redoActions, pNew->redoActions);
  mndTransUpdateActions(pOld->undoActions, pNew->undoActions);
  mndTransUpdateActions(pOld->commitActions, pNew->commitActions);
  pOld->stage = pNew->stage;
  pOld->redoActionPos = pNew->redoActionPos;

  if (pOld->stage == TRN_STAGE_COMMIT) {
    pOld->stage = TRN_STAGE_COMMIT_ACTION;
    mTrace("trans:%d, stage from commit to commitAction since perform update action", pNew->id);
  }

  if (pOld->stage == TRN_STAGE_ROLLBACK) {
    // A rolled-back transaction must continue with its undo actions, as the
    // trace message below states.
    pOld->stage = TRN_STAGE_UNDO_ACTION;
    mTrace("trans:%d, stage from rollback to undoAction since perform update action", pNew->id);
  }

  return 0;
}

533
/*
 * Look up a transaction by id in the sdb. Returns the acquired object, or
 * NULL with terrno set to TSDB_CODE_MND_TRANS_NOT_EXIST when the lookup fails.
 * An acquired object is handed back with mndReleaseTrans().
 */
STrans *mndAcquireTrans(SMnode *pMnode, int32_t transId) {
  STrans *pFound = sdbAcquire(pMnode->pSdb, SDB_TRANS, &transId);
  if (pFound != NULL) {
    return pFound;
  }

  terrno = TSDB_CODE_MND_TRANS_NOT_EXIST;
  return NULL;
}

541
/* Hand a transaction obtained from mndAcquireTrans() back to the sdb. */
void mndReleaseTrans(SMnode *pMnode, STrans *pTrans) {
  sdbRelease(pMnode->pSdb, pTrans);
}

546
/*
 * Allocate and initialize a new local transaction object.
 *
 * The object starts in the prepare stage with the exec mode set to
 * TRN_EXEC_PRARLLEL, an id obtained from sdbGetMaxId() and empty
 * redo/undo/commit action arrays. When pReq is given, its rpc info is
 * remembered in the transaction.
 *
 * Returns the new object, or NULL with terrno set to
 * TSDB_CODE_OUT_OF_MEMORY. The object is released with mndTransDrop().
 */
STrans *mndTransCreate(SMnode *pMnode, ETrnPolicy policy, ETrnConflct conflict, const SRpcMsg *pReq) {
  STrans *pTrans = taosMemoryCalloc(1, sizeof(STrans));
  if (pTrans == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to create transaction since %s", terrstr());
    return NULL;
  }

  pTrans->id = sdbGetMaxId(pMnode->pSdb, SDB_TRANS);
  pTrans->stage = TRN_STAGE_PREPARE;
  pTrans->policy = policy;
  pTrans->conflict = conflict;
  pTrans->exec = TRN_EXEC_PRARLLEL;
  pTrans->createdTime = taosGetTimestampMs();
  pTrans->redoActions = taosArrayInit(TRANS_ARRAY_SIZE, sizeof(STransAction));
  pTrans->undoActions = taosArrayInit(TRANS_ARRAY_SIZE, sizeof(STransAction));
  pTrans->commitActions = taosArrayInit(TRANS_ARRAY_SIZE, sizeof(STransAction));

  if (pTrans->redoActions == NULL || pTrans->undoActions == NULL || pTrans->commitActions == NULL) {
    // Release the arrays that were created as well as the object itself;
    // returning without doing so would leak them.
    mndTransDropData(pTrans);
    taosMemoryFree(pTrans);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to create transaction since %s", terrstr());
    return NULL;
  }

  if (pReq != NULL) pTrans->rpcInfo = pReq->info;
  mTrace("trans:%d, local object is created, data:%p", pTrans->id, pTrans);
  return pTrans;
}

S
Shengliang Guan 已提交
575
/*
 * Free the payload of every action in pArray (pRaw for RAW actions, pCont for
 * MSG actions) and then destroy the array itself.
 */
static void mndTransDropActions(SArray *pArray) {
  const int32_t total = taosArrayGetSize(pArray);

  for (int32_t idx = 0; idx < total; ++idx) {
    STransAction *pItem = taosArrayGet(pArray, idx);

    if (pItem->actionType == TRANS_ACTION_RAW) {
      taosMemoryFreeClear(pItem->pRaw);
      continue;
    }
    if (pItem->actionType == TRANS_ACTION_MSG) {
      taosMemoryFreeClear(pItem->pCont);
    }
    // other action types own no payload
  }

  taosArrayDestroy(pArray);
}

S
Shengliang Guan 已提交
591
/* Free a local transaction object together with everything it owns; NULL is accepted. */
void mndTransDrop(STrans *pTrans) {
  if (pTrans == NULL) {
    return;
  }

  mndTransDropData(pTrans);
  mTrace("trans:%d, local object is freed, data:%p", pTrans->id, pTrans);
  taosMemoryFreeClear(pTrans);
}

599
/*
 * Append a copy of *pAction to pArray. The action id is set to its index in
 * the array before it is pushed.
 *
 * Returns 0 on success, -1 with terrno = TSDB_CODE_OUT_OF_MEMORY on failure.
 */
static int32_t mndTransAppendAction(SArray *pArray, STransAction *pAction) {
  pAction->id = taosArrayGetSize(pArray);

  if (taosArrayPush(pArray, pAction) != NULL) {
    return 0;
  }

  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return -1;
}

611
/* Queue pRaw as a RAW action in the redo list of the transaction. */
int32_t mndTransAppendRedolog(STrans *pTrans, SSdbRaw *pRaw) {
  STransAction redoLog = {0};
  redoLog.stage = TRN_STAGE_REDO_ACTION;
  redoLog.actionType = TRANS_ACTION_RAW;
  redoLog.pRaw = pRaw;

  return mndTransAppendAction(pTrans->redoActions, &redoLog);
}

/* Queue a payload-less NULL action in the redo list of the transaction. */
int32_t mndTransAppendNullLog(STrans *pTrans) {
  STransAction nullLog = {0};
  nullLog.stage = TRN_STAGE_REDO_ACTION;
  nullLog.actionType = TRANS_ACTION_NULL;

  return mndTransAppendAction(pTrans->redoActions, &nullLog);
}
S
Shengliang Guan 已提交
620

621
/* Queue pRaw as a RAW action in the undo list of the transaction. */
int32_t mndTransAppendUndolog(STrans *pTrans, SSdbRaw *pRaw) {
  STransAction undoLog = {0};
  undoLog.stage = TRN_STAGE_UNDO_ACTION;
  undoLog.actionType = TRANS_ACTION_RAW;
  undoLog.pRaw = pRaw;

  return mndTransAppendAction(pTrans->undoActions, &undoLog);
}
S
Shengliang Guan 已提交
625

626
/* Queue pRaw as a RAW action in the commit list of the transaction. */
int32_t mndTransAppendCommitlog(STrans *pTrans, SSdbRaw *pRaw) {
  STransAction commitLog = {0};
  commitLog.stage = TRN_STAGE_COMMIT_ACTION;
  commitLog.actionType = TRANS_ACTION_RAW;
  commitLog.pRaw = pRaw;

  return mndTransAppendAction(pTrans->commitActions, &commitLog);
}

S
Shengliang Guan 已提交
631
/*
 * Mark *pAction as a MSG action of the redo stage and append a copy of it to
 * the redo list. Note that the caller's struct is modified.
 */
int32_t mndTransAppendRedoAction(STrans *pTrans, STransAction *pAction) {
  pAction->actionType = TRANS_ACTION_MSG;
  pAction->stage = TRN_STAGE_REDO_ACTION;

  return mndTransAppendAction(pTrans->redoActions, pAction);
}

S
Shengliang Guan 已提交
637
/*
 * Mark *pAction as a MSG action of the undo stage and append a copy of it to
 * the undo list. Note that the caller's struct is modified.
 */
int32_t mndTransAppendUndoAction(STrans *pTrans, STransAction *pAction) {
  pAction->actionType = TRANS_ACTION_MSG;
  pAction->stage = TRN_STAGE_UNDO_ACTION;

  return mndTransAppendAction(pTrans->undoActions, pAction);
}

S
Shengliang Guan 已提交
643 644 645 646 647
/*
 * Attach a response buffer to the transaction. The pointer is stored as is
 * (no copy); mndTransDropData() later frees it.
 */
void mndTransSetRpcRsp(STrans *pTrans, void *pCont, int32_t contLen) {
  pTrans->rpcRspLen = contLen;
  pTrans->rpcRsp = pCont;
}

S
Shengliang Guan 已提交
648
/*
 * Set the start/stop callback ids of the transaction and the parameter blob
 * handed to them. The parameter pointer is stored as is (no copy);
 * mndTransDropData() later frees it.
 */
void mndTransSetCb(STrans *pTrans, ETrnFunc startFunc, ETrnFunc stopFunc, void *param, int32_t paramLen) {
  pTrans->param = param;
  pTrans->paramLen = paramLen;
  pTrans->startFunc = startFunc;
  pTrans->stopFunc = stopFunc;
}

655 656 657 658 659 660 661 662
void mndTransSetDbName(STrans *pTrans, const char *dbname1, const char *dbname2) {
  if (dbname1 != NULL) {
    memcpy(pTrans->dbname1, dbname1, TSDB_DB_FNAME_LEN);
  }
  if (dbname2 != NULL) {
    memcpy(pTrans->dbname2, dbname2, TSDB_DB_FNAME_LEN);
  }
}
S
Shengliang Guan 已提交
663

664
/* Switch the transaction's exec mode to TRN_EXEC_SERIAL. */
void mndTransSetSerial(STrans *pTrans) {
  pTrans->exec = TRN_EXEC_SERIAL;
}
665

S
Shengliang Guan 已提交
666
// Encode the transaction, mark the encoded record READY and propose it through mndSyncPropose.
// The encoded record is always released before returning.
// Returns 0 on success, -1 when encoding or the proposal fails.
static int32_t mndTransSync(SMnode *pMnode, STrans *pTrans) {
  SSdbRaw *pEncoded = mndTransActionEncode(pTrans);
  if (pEncoded == NULL) {
    mError("trans:%d, failed to encode while sync trans since %s", pTrans->id, terrstr());
    return -1;
  }

  sdbSetRawStatus(pEncoded, SDB_STATUS_READY);
  mDebug("trans:%d, sync to other mnodes, stage:%s", pTrans->id, mndTransStr(pTrans->stage));

  int32_t result = 0;
  if (mndSyncPropose(pMnode, pEncoded, pTrans->id) != 0) {
    // log before freeing so the error text reflects the proposal failure
    mError("trans:%d, failed to sync since %s", pTrans->id, terrstr());
    result = -1;
  }

  sdbFreeRaw(pEncoded);

  if (result == 0) {
    mDebug("trans:%d, sync finished", pTrans->id);
  }
  return result;
}

S
Shengliang Guan 已提交
687 688 689 690 691 692
// Return true when the non-empty name `db` equals either database name recorded on pTrans.
// An empty `db` never conflicts.
static bool mndCheckDbConflict(const char *db, STrans *pTrans) {
  if (db[0] == 0) {
    return false;
  }

  bool sameAsFirst = (strcmp(db, pTrans->dbname1) == 0);
  return sameAsFirst || (strcmp(db, pTrans->dbname2) == 0);
}

693
// Check whether the new transaction conflicts with any transaction currently stored in sdb.
//
// Rules, per stored transaction pTrans:
//   - pNew is TRN_CONFLICT_NOTHING: never conflicts (returns immediately).
//   - pNew is TRN_CONFLICT_GLOBAL: conflicts with every stored transaction.
//   - pNew is TRN_CONFLICT_DB: conflicts with a GLOBAL transaction, or with a DB / DB_INSIDE transaction
//     that names one of pNew's databases.
//   - pNew is TRN_CONFLICT_DB_INSIDE: conflicts with a GLOBAL transaction, or with a DB transaction that
//     names one of pNew's databases.
//
// Returns true if at least one stored transaction conflicts. The conflict error is logged only for the
// transactions that actually conflict; previously it was logged for every transaction visited, including
// unrelated ones.
static bool mndCheckTransConflict(SMnode *pMnode, STrans *pNew) {
  STrans *pTrans = NULL;
  void   *pIter = NULL;
  bool    conflict = false;

  if (pNew->conflict == TRN_CONFLICT_NOTHING) return conflict;

  while (1) {
    pIter = sdbFetch(pMnode->pSdb, SDB_TRANS, pIter, (void **)&pTrans);
    if (pIter == NULL) break;

    // whether this particular stored transaction conflicts with pNew
    bool hit = false;

    if (pNew->conflict == TRN_CONFLICT_GLOBAL) hit = true;
    if (pNew->conflict == TRN_CONFLICT_DB) {
      if (pTrans->conflict == TRN_CONFLICT_GLOBAL) hit = true;
      if (pTrans->conflict == TRN_CONFLICT_DB || pTrans->conflict == TRN_CONFLICT_DB_INSIDE) {
        if (mndCheckDbConflict(pNew->dbname1, pTrans)) hit = true;
        if (mndCheckDbConflict(pNew->dbname2, pTrans)) hit = true;
      }
    }
    if (pNew->conflict == TRN_CONFLICT_DB_INSIDE) {
      if (pTrans->conflict == TRN_CONFLICT_GLOBAL) hit = true;
      if (pTrans->conflict == TRN_CONFLICT_DB) {
        if (mndCheckDbConflict(pNew->dbname1, pTrans)) hit = true;
        if (mndCheckDbConflict(pNew->dbname2, pTrans)) hit = true;
      }
    }

    if (hit) {
      conflict = true;
      mError("trans:%d, can't execute since conflict with trans:%d, db1:%s db2:%s", pNew->id, pTrans->id,
             pTrans->dbname1, pTrans->dbname2);
    }
    sdbRelease(pMnode->pSdb, pTrans);
  }

  return conflict;
}

S
Shengliang Guan 已提交
728
// Validate a freshly built transaction, propose it via mndTransSync, then start executing it.
//
// Steps, in order:
//   1. A DB / DB_INSIDE conflict level requires at least one database name to be set.
//   2. The transaction must not conflict with a stored one (mndCheckTransConflict).
//   3. At least one commit action must be present.
//   4. The transaction is synced, re-acquired from sdb by id, handed the RPC info and response buffer of
//      the caller's object (whose response fields are then cleared), executed, and released.
// Returns 0 on success, -1 with terrno set (where this function sets it) on failure.
int32_t mndTransPrepare(SMnode *pMnode, STrans *pTrans) {
  bool dbScoped = (pTrans->conflict == TRN_CONFLICT_DB || pTrans->conflict == TRN_CONFLICT_DB_INSIDE);
  if (dbScoped && pTrans->dbname1[0] == 0 && pTrans->dbname2[0] == 0) {
    terrno = TSDB_CODE_MND_TRANS_CONFLICT;
    mError("trans:%d, failed to prepare conflict db not set", pTrans->id);
    return -1;
  }

  if (mndCheckTransConflict(pMnode, pTrans)) {
    terrno = TSDB_CODE_MND_TRANS_CONFLICT;
    mError("trans:%d, failed to prepare since %s", pTrans->id, terrstr());
    return -1;
  }

  if (taosArrayGetSize(pTrans->commitActions) <= 0) {
    terrno = TSDB_CODE_MND_TRANS_CLOG_IS_NULL;
    mError("trans:%d, failed to prepare since %s", pTrans->id, terrstr());
    return -1;
  }

  mDebug("trans:%d, prepare transaction", pTrans->id);
  int32_t syncCode = mndTransSync(pMnode, pTrans);
  if (syncCode != 0) {
    mError("trans:%d, failed to prepare since %s", pTrans->id, terrstr());
    return -1;
  }
  mDebug("trans:%d, prepare finished", pTrans->id);

  STrans *pStored = mndAcquireTrans(pMnode, pTrans->id);
  if (pStored == NULL) {
    mError("trans:%d, failed to read from sdb since %s", pTrans->id, terrstr());
    return -1;
  }

  // move the client connection info and the response buffer over to the stored object
  pStored->rpcInfo = pTrans->rpcInfo;
  pStored->rpcRsp = pTrans->rpcRsp;
  pStored->rpcRspLen = pTrans->rpcRspLen;
  pTrans->rpcRsp = NULL;
  pTrans->rpcRspLen = 0;

  mndTransExecute(pMnode, pStored);
  mndReleaseTrans(pMnode, pStored);
  return 0;
}

S
Shengliang Guan 已提交
773 774 775 776
// Sync the transaction in its current (commit) state via mndTransSync.
// Returns 0 on success, -1 if the sync fails.
static int32_t mndTransCommit(SMnode *pMnode, STrans *pTrans) {
  mDebug("trans:%d, commit transaction", pTrans->id);

  if (mndTransSync(pMnode, pTrans) == 0) {
    mDebug("trans:%d, commit finished", pTrans->id);
    return 0;
  }

  mError("trans:%d, failed to commit since %s", pTrans->id, terrstr());
  return -1;
}

S
Shengliang Guan 已提交
783
// Sync the transaction in its current (rollback) state via mndTransSync.
// Returns 0 on success, -1 if the sync fails.
static int32_t mndTransRollback(SMnode *pMnode, STrans *pTrans) {
  mDebug("trans:%d, rollback transaction", pTrans->id);

  if (mndTransSync(pMnode, pTrans) == 0) {
    mDebug("trans:%d, rollback finished", pTrans->id);
    return 0;
  }

  mError("trans:%d, failed to rollback since %s", pTrans->id, terrstr());
  return -1;
}
S
Shengliang Guan 已提交
792

793
// Send the RPC response for this transaction if it has reached a state that warrants one.
//
// A response is due when:
//   - the stage is TRN_STAGE_FINISHED; or
//   - the policy is ROLLBACK and the stage is UNDO_ACTION or ROLLBACK; or
//   - the policy is not ROLLBACK, the stage is REDO_ACTION and failedTimes > 2.
// In the latter two cases a zero code is replaced by TSDB_CODE_MND_TRANS_UNKNOW_ERROR.
// Nothing is sent when rpcInfo.handle is NULL. After sending, the handle and the stored response buffer
// are cleared on the transaction.
static void mndTransSendRpcRsp(SMnode *pMnode, STrans *pTrans) {
  int32_t code = pTrans->code;
  bool    sendRsp = (pTrans->stage == TRN_STAGE_FINISHED);

  bool failing = false;
  if (pTrans->policy == TRN_POLICY_ROLLBACK) {
    failing = (pTrans->stage == TRN_STAGE_UNDO_ACTION || pTrans->stage == TRN_STAGE_ROLLBACK);
  } else {
    failing = (pTrans->stage == TRN_STAGE_REDO_ACTION && pTrans->failedTimes > 2);
  }
  if (failing) {
    if (code == 0) code = TSDB_CODE_MND_TRANS_UNKNOW_ERROR;
    sendRsp = true;
  }

  if (!sendRsp || pTrans->rpcInfo.handle == NULL) {
    return;
  }

  mDebug("trans:%d, send rsp, code:0x%x stage:%s app:%p", pTrans->id, code, mndTransStr(pTrans->stage),
         pTrans->rpcInfo.ahandle);

  // the code is remapped after it has been logged
  if (code == TSDB_CODE_RPC_NETWORK_UNAVAIL) {
    code = TSDB_CODE_MND_TRANS_NETWORK_UNAVAILL;
  }

  SRpcMsg rspMsg = {.code = code, .info = pTrans->rpcInfo};

  if (pTrans->rpcRspLen != 0) {
    // copy the stored payload into an rpc-allocated buffer; the stored one is freed either way
    void *pPayload = rpcMallocCont(pTrans->rpcRspLen);
    if (pPayload != NULL) {
      memcpy(pPayload, pTrans->rpcRsp, pTrans->rpcRspLen);
      rspMsg.pCont = pPayload;
      rspMsg.contLen = pTrans->rpcRspLen;
    }
    taosMemoryFree(pTrans->rpcRsp);
  }

  tmsgSendRsp(&rspMsg);

  pTrans->rpcInfo.handle = NULL;
  pTrans->rpcRsp = NULL;
  pTrans->rpcRspLen = 0;
}

838
// Handle the response to an action message previously sent by mndTransSendSingleMsg.
//
// The request's ahandle carries a 64-bit signature: transaction id in the high 32 bits, action id in the
// low 32 bits. The matching action of the current stage (redo or undo) is marked as received with the
// response code, and the transaction is executed again. Always returns 0; problems are only logged.
//
// Fixes relative to the previous version:
//   - the action index is validated against the array actually selected for the current stage (it was
//     always validated against redoActions, so an undo-stage response could index out of range or be
//     rejected wrongly);
//   - the debug log that dereferences pAction is kept inside the NULL guard;
//   - the low 32 bits are extracted by conversion instead of left-shifting a signed 64-bit value.
int32_t mndTransProcessRsp(SRpcMsg *pRsp) {
  SMnode *pMnode = pRsp->info.node;
  int64_t signature = (int64_t)(pRsp->info.ahandle);
  int32_t transId = (int32_t)(signature >> 32);
  int32_t action = (int32_t)(uint32_t)signature;

  STrans *pTrans = mndAcquireTrans(pMnode, transId);
  if (pTrans == NULL) {
    mError("trans:%d, failed to get transId from vnode rsp since %s", transId, terrstr());
    goto _OVER;
  }

  SArray *pArray = NULL;
  if (pTrans->stage == TRN_STAGE_REDO_ACTION) {
    pArray = pTrans->redoActions;
  } else if (pTrans->stage == TRN_STAGE_UNDO_ACTION) {
    pArray = pTrans->undoActions;
  } else {
    mError("trans:%d, invalid trans stage:%d while recv action rsp", pTrans->id, pTrans->stage);
    goto _OVER;
  }

  if (pArray == NULL) {
    mError("trans:%d, invalid trans stage:%d", transId, pTrans->stage);
    goto _OVER;
  }

  int32_t actionNum = taosArrayGetSize(pArray);
  if (action < 0 || action >= actionNum) {
    mError("trans:%d, invalid action:%d", transId, action);
    goto _OVER;
  }

  STransAction *pAction = taosArrayGet(pArray, action);
  if (pAction != NULL) {
    pAction->msgReceived = 1;
    pAction->errCode = pRsp->code;
    mDebug("trans:%d, %s:%d response is received, code:0x%x, accept:0x%x", transId, mndTransStr(pAction->stage),
           action, pRsp->code, pAction->acceptableCode);
  }

  mndTransExecute(pMnode, pTrans);

_OVER:
  // pTrans may be NULL here when the acquire failed; other callers in this file do the same
  mndReleaseTrans(pMnode, pTrans);
  return 0;
}

S
Shengliang Guan 已提交
886 887 888 889 890
// Clear the execution state of every action in pArray that has not completed successfully, so that it
// will be executed again.
//
// An action is left alone when its error code is 0 or its acceptable code and it was either sent and
// answered, or written as a raw record. For the others, the sent/received/written flags and the error
// code are cleared; if the error was a redirect / not-leader style sync error, the endpoint in use is
// advanced to the next one in the set.
static void mndTransResetActions(SMnode *pMnode, STrans *pTrans, SArray *pArray) {
  int32_t total = taosArrayGetSize(pArray);

  for (int32_t idx = 0; idx < total; ++idx) {
    STransAction *pAction = taosArrayGet(pArray, idx);

    bool succeeded = (pAction->errCode == 0 || pAction->errCode == pAction->acceptableCode);
    bool answered = (pAction->msgSent && pAction->msgReceived);
    if (succeeded && (answered || pAction->rawWritten)) {
      continue;
    }

    pAction->rawWritten = 0;
    pAction->msgSent = 0;
    pAction->msgReceived = 0;

    bool tryNextEp = (pAction->errCode == TSDB_CODE_RPC_REDIRECT ||
                      pAction->errCode == TSDB_CODE_SYN_NOT_IN_NEW_CONFIG ||
                      pAction->errCode == TSDB_CODE_SYN_INTERNAL_ERROR ||
                      pAction->errCode == TSDB_CODE_SYN_NOT_LEADER);
    if (!tryNextEp) {
      mDebug("trans:%d, %s:%d execute status is reset", pTrans->id, mndTransStr(pAction->stage), idx);
    } else {
      pAction->epSet.inUse = (pAction->epSet.inUse + 1) % pAction->epSet.numOfEps;
      mDebug("trans:%d, %s:%d execute status is reset and set epset inuse:%d", pTrans->id, mndTransStr(pAction->stage),
             idx, pAction->epSet.inUse);
    }

    pAction->errCode = 0;
  }
}

911
// Write one RAW action's record into sdb, unless it has already been written.
//
// A write that fails with terrno == TSDB_CODE_SDB_OBJ_NOT_THERE is treated as success. On success the
// action is flagged rawWritten with errCode 0; on failure errCode is set to terrno (or to the return
// code when terrno is 0). In both cases the transaction's last-action bookkeeping is updated.
// Returns 0 on success, otherwise the code returned by sdbWriteWithoutFree.
static int32_t mndTransWriteSingleLog(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  if (pAction->rawWritten) {
    return 0;
  }

  int32_t code = sdbWriteWithoutFree(pMnode->pSdb, pAction->pRaw);
  bool    written = (code == 0 || terrno == TSDB_CODE_SDB_OBJ_NOT_THERE);

  if (written) {
    code = 0;
    pAction->rawWritten = true;
    pAction->errCode = 0;
    mDebug("trans:%d, %s:%d write to sdb, type:%s status:%s", pTrans->id, mndTransStr(pAction->stage), pAction->id,
           sdbTableName(pAction->pRaw->type), sdbStatusName(pAction->pRaw->status));
  } else {
    pAction->errCode = (terrno != 0) ? terrno : code;
    mError("trans:%d, %s:%d failed to write sdb since %s, type:%s status:%s", pTrans->id, mndTransStr(pAction->stage),
           pAction->id, terrstr(), sdbTableName(pAction->pRaw->type), sdbStatusName(pAction->pRaw->status));
  }

  // errCode is 0 on the success path, so it doubles as the last error number in both cases
  pTrans->lastAction = pAction->id;
  pTrans->lastMsgType = pAction->msgType;
  pTrans->lastEpset = pAction->epSet;
  pTrans->lastErrorNo = pAction->errCode;

  return code;
}

// Send one MSG action's request to its endpoint set, unless it has already been sent.
//
// The request's ahandle carries (transaction id << 32) + action id so the response can be matched back
// to the action. The payload is copied into an rpc-allocated buffer before sending.
// On success the action is flagged msgSent and the transaction's last error becomes
// TSDB_CODE_ACTION_IN_PROGRESS if it was 0; on failure the action's errCode is set to terrno (or to the
// return code when terrno is 0). Returns 0 on success, -1 when actions cannot be executed or the buffer
// cannot be allocated, otherwise the code returned by tmsgSendReq.
static int32_t mndTransSendSingleMsg(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  if (pAction->msgSent) return 0;
  if (mndCannotExecuteTransAction(pMnode)) return -1;

  int64_t signature = pTrans->id;
  signature <<= 32;
  signature += pAction->id;

  SRpcMsg rpcMsg = {.msgType = pAction->msgType, .contLen = pAction->contLen, .info.ahandle = (void *)signature};
  rpcMsg.pCont = rpcMallocCont(pAction->contLen);
  if (rpcMsg.pCont == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  memcpy(rpcMsg.pCont, pAction->pCont, pAction->contLen);

  // human-readable description of the target, used only for logging
  char    detail[1024] = {0};
  int32_t len = snprintf(detail, sizeof(detail), "msgType:%s numOfEps:%d inUse:%d", TMSG_INFO(pAction->msgType),
                         pAction->epSet.numOfEps, pAction->epSet.inUse);
  for (int32_t ep = 0; ep < pAction->epSet.numOfEps; ++ep) {
    len += snprintf(detail + len, sizeof(detail) - len, " ep:%d-%s:%u", ep, pAction->epSet.eps[ep].fqdn,
                    pAction->epSet.eps[ep].port);
  }

  int32_t code = tmsgSendReq(&pAction->epSet, &rpcMsg);
  bool    sent = (code == 0);

  pAction->msgSent = sent ? 1 : 0;
  pAction->msgReceived = 0;
  if (sent) {
    pAction->errCode = 0;
    mDebug("trans:%d, %s:%d is sent, %s", pTrans->id, mndTransStr(pAction->stage), pAction->id, detail);
  } else {
    pAction->errCode = (terrno != 0) ? terrno : code;
    mError("trans:%d, %s:%d not send since %s, %s", pTrans->id, mndTransStr(pAction->stage), pAction->id, terrstr(),
           detail);
  }

  pTrans->lastAction = pAction->id;
  pTrans->lastMsgType = pAction->msgType;
  pTrans->lastEpset = pAction->epSet;
  if (!sent) {
    pTrans->lastErrorNo = pAction->errCode;
  } else if (pTrans->lastErrorNo == 0) {
    pTrans->lastErrorNo = TSDB_CODE_ACTION_IN_PROGRESS;
  }

  return code;
}

992 993 994
// Execute an action that is neither RAW nor MSG: nothing is sent or written, the action is simply
// confirmed. Clears the action's rawWritten flag and error code, records it as the transaction's last
// action and resets the transaction's last error number. Always returns 0.
//
// Fix: the last error number is now actually assigned; the previous statement was a comparison
// (`== 0`) whose result was discarded, so a stale error number survived.
static int32_t mndTransExecNullMsg(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  pAction->rawWritten = 0;
  pAction->errCode = 0;
  mDebug("trans:%d, %s:%d confirm action executed", pTrans->id, mndTransStr(pAction->stage), pAction->id);

  pTrans->lastAction = pAction->id;
  pTrans->lastMsgType = pAction->msgType;
  pTrans->lastEpset = pAction->epSet;
  pTrans->lastErrorNo = 0;
  return 0;
}

1004
// Dispatch one action by its type: RAW actions are written to sdb, MSG actions are sent over rpc, and
// any other type goes through the null-message path. Returns the handler's result.
static int32_t mndTransExecSingleAction(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  switch (pAction->actionType) {
    case TRANS_ACTION_RAW:
      return mndTransWriteSingleLog(pMnode, pTrans, pAction);
    case TRANS_ACTION_MSG:
      return mndTransSendSingleMsg(pMnode, pTrans, pAction);
    default:
      return mndTransExecNullMsg(pMnode, pTrans, pAction);
  }
}

1014
// Execute the actions of pArray in order, stopping at the first one whose execution returns non-zero.
// Returns that non-zero code, or 0 when every action returned 0 (or the array is empty).
static int32_t mndTransExecSingleActions(SMnode *pMnode, STrans *pTrans, SArray *pArray) {
  int32_t total = taosArrayGetSize(pArray);

  for (int32_t idx = 0; idx < total; ++idx) {
    STransAction *pCurrent = taosArrayGet(pArray, idx);
    int32_t       result = mndTransExecSingleAction(pMnode, pTrans, pCurrent);
    if (result != 0) {
      return result;
    }
  }

  return 0;
}

// Start every action in pArray and report the collective outcome.
//
// Returns:
//   0                             - the array is empty, or all actions have completed without an
//                                   unacceptable error (last-action bookkeeping is cleared);
//   -1                            - starting one of the actions failed;
//   TSDB_CODE_ACTION_IN_PROGRESS  - some actions have not completed yet;
//   an action error code          - all actions completed but at least one failed; the failing actions
//                                   are reset for re-execution and terrno is set to that code.
// An action counts as completed when its response was received or its raw record was written. When
// several actions failed, the code of the last failing one in array order is reported.
static int32_t mndTransExecuteActions(SMnode *pMnode, STrans *pTrans, SArray *pArray) {
  int32_t numOfActions = taosArrayGetSize(pArray);
  if (numOfActions == 0) return 0;

  if (mndTransExecSingleActions(pMnode, pTrans, pArray) != 0) return -1;

  int32_t       completed = 0;
  int32_t       failCode = 0;
  STransAction *pFailed = NULL;

  for (int32_t idx = 0; idx < numOfActions; ++idx) {
    STransAction *pAction = taosArrayGet(pArray, idx);
    if (!pAction->msgReceived && !pAction->rawWritten) continue;

    completed++;
    if (pAction->errCode != 0 && pAction->errCode != pAction->acceptableCode) {
      failCode = pAction->errCode;
      pFailed = pAction;
    }
  }

  if (completed != numOfActions) {
    mDebug("trans:%d, %d of %d actions executed", pTrans->id, completed, numOfActions);
    return TSDB_CODE_ACTION_IN_PROGRESS;
  }

  if (failCode == 0) {
    pTrans->lastAction = 0;
    pTrans->lastMsgType = 0;
    memset(&pTrans->lastEpset, 0, sizeof(pTrans->lastEpset));
    pTrans->lastErrorNo = 0;
    mDebug("trans:%d, all %d actions execute successfully", pTrans->id, numOfActions);
    return 0;
  }

  mError("trans:%d, all %d actions executed, code:0x%x", pTrans->id, numOfActions, failCode & 0XFFFF);
  if (pFailed != NULL) {
    pTrans->lastAction = pFailed->id;
    pTrans->lastMsgType = pFailed->msgType;
    pTrans->lastEpset = pFailed->epSet;
    pTrans->lastErrorNo = pFailed->errCode;
  }
  mndTransResetActions(pMnode, pTrans, pArray);
  terrno = failCode;
  return failCode;
}

S
Shengliang Guan 已提交
1075
// Run the redo action list through mndTransExecuteActions and log any result other than success or
// in-progress. Returns the code unchanged.
static int32_t mndTransExecuteRedoActions(SMnode *pMnode, STrans *pTrans) {
  int32_t code = mndTransExecuteActions(pMnode, pTrans, pTrans->redoActions);

  bool failed = (code != 0) && (code != TSDB_CODE_ACTION_IN_PROGRESS);
  if (failed) {
    mError("failed to execute redoActions since:%s, code:0x%x", terrstr(), terrno);
  }

  return code;
}
S
Shengliang Guan 已提交
1082

S
Shengliang Guan 已提交
1083
// Run the undo action list through mndTransExecuteActions and log any result other than success or
// in-progress. Returns the code unchanged.
static int32_t mndTransExecuteUndoActions(SMnode *pMnode, STrans *pTrans) {
  int32_t code = mndTransExecuteActions(pMnode, pTrans, pTrans->undoActions);

  bool failed = (code != 0) && (code != TSDB_CODE_ACTION_IN_PROGRESS);
  if (failed) {
    mError("failed to execute undoActions since %s", terrstr());
  }

  return code;
}
S
Shengliang Guan 已提交
1090

1091
// Run the commit action list through mndTransExecuteActions and log any result other than success or
// in-progress. Returns the code unchanged.
static int32_t mndTransExecuteCommitActions(SMnode *pMnode, STrans *pTrans) {
  int32_t code = mndTransExecuteActions(pMnode, pTrans, pTrans->commitActions);

  bool failed = (code != 0) && (code != TSDB_CODE_ACTION_IN_PROGRESS);
  if (failed) {
    mError("failed to execute commitActions since %s", terrstr());
  }

  return code;
}

1099
// Execute the redo actions one at a time, starting at pTrans->redoActionPos.
//
// For each action: it is started (or found already started); if it has completed successfully the
// position is advanced and the transaction is synced before moving on to the next action.
// Returns:
//   0                             - nothing left to do, or every remaining action completed and synced;
//   TSDB_CODE_ACTION_IN_PROGRESS  - the current action was sent and its response is still pending;
//   other non-zero                - the current action failed (terrno and pTrans->code are set to it),
//                                   or the sync after an action failed (pTrans->code is set to terrno).
// The loop also stops, returning the current code, once mndCannotExecuteTransAction reports true.
//
// Fix: when the sync after a completed action fails, the position is rolled back and the loop stops.
// Previously the loop went on to execute the following actions although the progress had not been
// synced, and a sync failure in the middle of the list was silently lost if a later sync succeeded.
// With the position rolled back, the next run finds the action already completed and retries the sync.
static int32_t mndTransExecuteRedoActionsSerial(SMnode *pMnode, STrans *pTrans) {
  int32_t code = 0;
  int32_t numOfActions = taosArrayGetSize(pTrans->redoActions);
  if (numOfActions == 0) return code;
  if (pTrans->redoActionPos >= numOfActions) return code;

  for (int32_t action = pTrans->redoActionPos; action < numOfActions; ++action) {
    // `action` and redoActionPos advance together; the position is the persisted one
    STransAction *pAction = taosArrayGet(pTrans->redoActions, pTrans->redoActionPos);

    code = mndTransExecSingleAction(pMnode, pTrans, pAction);
    if (code == 0) {
      if (pAction->msgSent) {
        if (pAction->msgReceived) {
          if (pAction->errCode != 0 && pAction->errCode != pAction->acceptableCode) {
            code = pAction->errCode;
            // clear the flags so the message is sent again on the next run
            pAction->msgSent = 0;
            pAction->msgReceived = 0;
            mDebug("trans:%d, %s:%d execute status is reset", pTrans->id, mndTransStr(pAction->stage), action);
          }
        } else {
          code = TSDB_CODE_ACTION_IN_PROGRESS;
        }
      }
      if (pAction->rawWritten) {
        if (pAction->errCode != 0 && pAction->errCode != pAction->acceptableCode) {
          code = pAction->errCode;
        }
      }
    }

    if (code == 0) {
      pTrans->lastAction = action;
      pTrans->lastMsgType = 0;
      pTrans->lastErrorNo = 0;
      memset(&pTrans->lastEpset, 0, sizeof(pTrans->lastEpset));
    } else {
      pTrans->lastAction = action;
      pTrans->lastMsgType = pAction->msgType;
      pTrans->lastErrorNo = code;
      pTrans->lastEpset = pAction->epSet;
    }

    if (mndCannotExecuteTransAction(pMnode)) break;

    if (code == 0) {
      pTrans->code = 0;
      pTrans->redoActionPos++;
      mDebug("trans:%d, %s:%d is executed and need sync to other mnodes", pTrans->id, mndTransStr(pAction->stage),
             pAction->id);
      code = mndTransSync(pMnode, pTrans);
      if (code != 0) {
        // progress was not synced: undo the advance and stop instead of running further actions
        pTrans->redoActionPos--;
        pTrans->code = terrno;
        mError("trans:%d, %s:%d is executed and failed to sync to other mnodes since %s", pTrans->id,
               mndTransStr(pAction->stage), pAction->id, terrstr());
        break;
      }
    } else if (code == TSDB_CODE_ACTION_IN_PROGRESS) {
      mDebug("trans:%d, %s:%d is in progress and wait it finish", pTrans->id, mndTransStr(pAction->stage), pAction->id);
      break;
    } else {
      terrno = code;
      pTrans->code = code;
      break;
    }
  }

  return code;
}

// Prepare stage: move the transaction straight to the redo-action stage.
// Always returns true so the state machine keeps running.
static bool mndTransPerformPrepareStage(SMnode *pMnode, STrans *pTrans) {
  pTrans->stage = TRN_STAGE_REDO_ACTION;
  mDebug("trans:%d, stage from prepare to redoAction", pTrans->id);
  return true;
}

S
Shengliang Guan 已提交
1174 1175
// Redo-action stage: run the redo actions (serially or all at once, depending on pTrans->exec) and pick
// the next stage.
//
//   - success      -> COMMIT, keep running;
//   - in progress  -> stay, stop running;
//   - failure      -> pTrans->code = terrno; with ROLLBACK policy move to ROLLBACK and keep running,
//                     otherwise count the failure, stay and stop running.
// Returns false without changing the stage when mndCannotExecuteTransAction reports true after the
// actions have been run.
static bool mndTransPerformRedoActionStage(SMnode *pMnode, STrans *pTrans) {
  int32_t code = (pTrans->exec == TRN_EXEC_SERIAL) ? mndTransExecuteRedoActionsSerial(pMnode, pTrans)
                                                   : mndTransExecuteRedoActions(pMnode, pTrans);

  if (mndCannotExecuteTransAction(pMnode)) return false;

  if (code == 0) {
    pTrans->code = 0;
    pTrans->stage = TRN_STAGE_COMMIT;
    mDebug("trans:%d, stage from redoAction to commit", pTrans->id);
    return true;
  }

  if (code == TSDB_CODE_ACTION_IN_PROGRESS) {
    mDebug("trans:%d, stage keep on redoAction since %s", pTrans->id, tstrerror(code));
    return false;
  }

  pTrans->code = terrno;
  if (pTrans->policy == TRN_POLICY_ROLLBACK) {
    pTrans->stage = TRN_STAGE_ROLLBACK;
    mError("trans:%d, stage from redoAction to rollback since %s", pTrans->id, terrstr());
    return true;
  }

  pTrans->failedTimes++;
  mError("trans:%d, stage keep on redoAction since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
  return false;
}

S
Shengliang Guan 已提交
1210
// Commit stage: sync the transaction via mndTransCommit.
// On success the stage becomes COMMIT_ACTION and true is returned; on failure pTrans->code is set to
// terrno, the failure counter is incremented and false is returned. Returns false immediately when
// mndCannotExecuteTransAction reports true.
static bool mndTransPerformCommitStage(SMnode *pMnode, STrans *pTrans) {
  if (mndCannotExecuteTransAction(pMnode)) return false;

  if (mndTransCommit(pMnode, pTrans) != 0) {
    pTrans->code = terrno;
    pTrans->failedTimes++;
    mError("trans:%d, stage keep on commit since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
    return false;
  }

  pTrans->code = 0;
  pTrans->stage = TRN_STAGE_COMMIT_ACTION;
  mDebug("trans:%d, stage from commit to commitAction", pTrans->id);
  return true;
}

1231
// Commit-action stage: run the commit actions.
// On success the stage becomes FINISHED and true is returned; any other result sets pTrans->code to
// terrno, increments the failure counter and returns false.
static bool mndTransPerformCommitActionStage(SMnode *pMnode, STrans *pTrans) {
  if (mndTransExecuteCommitActions(pMnode, pTrans) != 0) {
    pTrans->code = terrno;
    pTrans->failedTimes++;
    mError("trans:%d, stage keep on commitAction since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
    return false;
  }

  pTrans->code = 0;
  pTrans->stage = TRN_STAGE_FINISHED;
  mDebug("trans:%d, stage from commitAction to finished", pTrans->id);
  return true;
}

// Undo-action stage: run the undo actions.
//   - success      -> FINISHED, keep running;
//   - in progress  -> stay, stop running;
//   - failure      -> count the failure, stay and stop running.
static bool mndTransPerformUndoActionStage(SMnode *pMnode, STrans *pTrans) {
  int32_t code = mndTransExecuteUndoActions(pMnode, pTrans);

  if (code == 0) {
    pTrans->stage = TRN_STAGE_FINISHED;
    mDebug("trans:%d, stage from undoAction to finished", pTrans->id);
    return true;
  }

  if (code == TSDB_CODE_ACTION_IN_PROGRESS) {
    mDebug("trans:%d, stage keep on undoAction since %s", pTrans->id, tstrerror(code));
    return false;
  }

  pTrans->failedTimes++;
  mError("trans:%d, stage keep on undoAction since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
  return false;
}

// Rollback stage: sync the transaction via mndTransRollback.
// On success the stage becomes UNDO_ACTION and true is returned; on failure the failure counter is
// incremented and false is returned. Returns false immediately when mndCannotExecuteTransAction
// reports true.
static bool mndTransPerformRollbackStage(SMnode *pMnode, STrans *pTrans) {
  if (mndCannotExecuteTransAction(pMnode)) return false;

  if (mndTransRollback(pMnode, pTrans) != 0) {
    pTrans->failedTimes++;
    mError("trans:%d, stage keep on rollback since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
    return false;
  }

  pTrans->stage = TRN_STAGE_UNDO_ACTION;
  mDebug("trans:%d, stage from rollback to undoAction", pTrans->id);
  return true;
}

// Finished stage: write the transaction to sdb with status DROPPED.
// Always returns false, which ends the state machine loop in mndTransExecute.
//
// Fix: when the transaction cannot be encoded the function now returns right after logging. Previously
// it fell through and passed the NULL record to sdbSetRawStatus and sdbWrite.
static bool mndTransPerfromFinishedStage(SMnode *pMnode, STrans *pTrans) {
  bool continueExec = false;

  SSdbRaw *pRaw = mndTransActionEncode(pTrans);
  if (pRaw == NULL) {
    mError("trans:%d, failed to encode while finish trans since %s", pTrans->id, terrstr());
    return continueExec;
  }
  sdbSetRawStatus(pRaw, SDB_STATUS_DROPPED);

  int32_t code = sdbWrite(pMnode->pSdb, pRaw);
  if (code != 0) {
    mError("trans:%d, failed to write sdb since %s", pTrans->id, terrstr());
  }

  mDebug("trans:%d, execute finished, code:0x%x, failedTimes:%d", pTrans->id, pTrans->code, pTrans->failedTimes);
  return continueExec;
}
S
Shengliang Guan 已提交
1306

1307
// Drive the transaction state machine: repeatedly run the handler of the current stage until a handler
// asks to stop (or the stage is unknown), then send the RPC response if one is due.
// lastExecTime is refreshed before every stage handler call.
void mndTransExecute(SMnode *pMnode, STrans *pTrans) {
  bool keepGoing = true;

  do {
    mDebug("trans:%d, continue to execute, stage:%s", pTrans->id, mndTransStr(pTrans->stage));
    pTrans->lastExecTime = taosGetTimestampMs();

    switch (pTrans->stage) {
      case TRN_STAGE_PREPARE:
        keepGoing = mndTransPerformPrepareStage(pMnode, pTrans);
        break;
      case TRN_STAGE_REDO_ACTION:
        keepGoing = mndTransPerformRedoActionStage(pMnode, pTrans);
        break;
      case TRN_STAGE_COMMIT:
        keepGoing = mndTransPerformCommitStage(pMnode, pTrans);
        break;
      case TRN_STAGE_COMMIT_ACTION:
        keepGoing = mndTransPerformCommitActionStage(pMnode, pTrans);
        break;
      case TRN_STAGE_ROLLBACK:
        keepGoing = mndTransPerformRollbackStage(pMnode, pTrans);
        break;
      case TRN_STAGE_UNDO_ACTION:
        keepGoing = mndTransPerformUndoActionStage(pMnode, pTrans);
        break;
      case TRN_STAGE_FINISHED:
        keepGoing = mndTransPerfromFinishedStage(pMnode, pTrans);
        break;
      default:
        keepGoing = false;
        break;
    }
  } while (keepGoing);

  mndTransSendRpcRsp(pMnode, pTrans);
}
S
Shengliang Guan 已提交
1343

S
Shengliang Guan 已提交
1344 1345
// Request handler that re-runs all stored transactions on the mnode carried in the request info.
// Always returns 0.
static int32_t mndProcessTransReq(SRpcMsg *pReq) {
  SMnode *pMnode = pReq->info.node;
  mndTransPullup(pMnode);
  return 0;
}

1349
// Force a transaction past its current action stage: every action of the current stage (redo or undo)
// is marked as sent, received and successful, then the transaction is executed again.
// Returns 0 on success, or -1 with terrno = TSDB_CODE_MND_TRANS_INVALID_STAGE when the transaction is
// in neither the redo-action nor the undo-action stage.
int32_t mndKillTrans(SMnode *pMnode, STrans *pTrans) {
  SArray *pActions = NULL;

  if (pTrans->stage == TRN_STAGE_REDO_ACTION) {
    pActions = pTrans->redoActions;
  } else if (pTrans->stage == TRN_STAGE_UNDO_ACTION) {
    pActions = pTrans->undoActions;
  }

  if (pTrans->stage != TRN_STAGE_REDO_ACTION && pTrans->stage != TRN_STAGE_UNDO_ACTION) {
    terrno = TSDB_CODE_MND_TRANS_INVALID_STAGE;
    return -1;
  }

  int32_t total = taosArrayGetSize(pActions);
  for (int32_t idx = 0; idx < total; ++idx) {
    STransAction *pAction = taosArrayGet(pActions, idx);
    mInfo("trans:%d, %s:%d set processed for kill msg received, errCode from %s to success", pTrans->id,
          mndTransStr(pAction->stage), idx, tstrerror(pAction->errCode));
    pAction->errCode = 0;
    pAction->msgSent = 1;
    pAction->msgReceived = 1;
  }

  mndTransExecute(pMnode, pTrans);
  return 0;
}

S
Shengliang Guan 已提交
1373 1374
// Request handler for killing a transaction.
// Deserializes the request, checks that the requesting user may perform MND_OPER_KILL_TRANS, looks the
// transaction up by id and hands it to mndKillTrans. Returns the result of mndKillTrans, or -1 when any
// earlier step fails (terrno is set to TSDB_CODE_INVALID_MSG here for a malformed request).
static int32_t mndProcessKillTransReq(SRpcMsg *pReq) {
  SMnode       *pMnode = pReq->info.node;
  SKillTransReq killReq = {0};
  STrans       *pTrans = NULL;
  int32_t       code = -1;

  if (tDeserializeSKillTransReq(pReq->pCont, pReq->contLen, &killReq) != 0) {
    terrno = TSDB_CODE_INVALID_MSG;
  } else {
    mInfo("trans:%d, start to kill", killReq.transId);

    if (mndCheckOperAuth(pMnode, pReq->info.conn.user, MND_OPER_KILL_TRANS) == 0) {
      pTrans = mndAcquireTrans(pMnode, killReq.transId);
      if (pTrans != NULL) {
        code = mndKillTrans(pMnode, pTrans);
      }
    }
  }

  if (code != 0) {
    mError("trans:%d, failed to kill since %s", killReq.transId, terrstr());
  }

  // pTrans is still NULL here when an earlier step failed
  mndReleaseTrans(pMnode, pTrans);
  return code;
}

1406 1407
// Three-way comparator for transaction ids, used as the sort callback in
// mndTransPullup().
//
// Returns a negative value when *pTransId1 < *pTransId2, zero when they are
// equal and a positive value when *pTransId1 > *pTransId2. The result is built
// from two comparisons rather than a subtraction so it cannot overflow.
static int32_t mndCompareTransId(int32_t *pTransId1, int32_t *pTransId2) {
  int32_t lhs = *pTransId1;
  int32_t rhs = *pTransId2;
  return (lhs > rhs) - (lhs < rhs);
}

S
Shengliang Guan 已提交
1408
// Re-runs every transaction currently stored in the sdb.
//
// The ids of all SDB_TRANS rows are first copied into a temporary array, so
// that no sdb iterator is held while transactions execute. The array is then
// ordered with mndCompareTransId and each id is re-acquired and passed to
// mndTransExecute(). Finally the sdb is written to file.
//
// Returns silently without doing anything if the id array cannot be allocated.
void mndTransPullup(SMnode *pMnode) {
  SSdb   *pSdb = pMnode->pSdb;
  SArray *pIds = taosArrayInit(sdbGetSize(pSdb, SDB_TRANS), sizeof(int32_t));
  if (pIds == NULL) {
    return;
  }

  // Pass 1: collect the id of every transaction row.
  void *pIter = NULL;
  for (;;) {
    STrans *pFetched = NULL;
    pIter = sdbFetch(pSdb, SDB_TRANS, pIter, (void **)&pFetched);
    if (pIter == NULL) {
      break;
    }
    taosArrayPush(pIds, &pFetched->id);
    sdbRelease(pSdb, pFetched);
  }

  taosArraySort(pIds, (__compar_fn_t)mndCompareTransId);

  // Pass 2: execute each transaction that can still be acquired.
  int32_t idx = 0;
  while (idx < taosArrayGetSize(pIds)) {
    int32_t *pId = taosArrayGet(pIds, idx);
    STrans  *pTrans = mndAcquireTrans(pMnode, *pId);
    if (pTrans != NULL) {
      mndTransExecute(pMnode, pTrans);
    }
    mndReleaseTrans(pMnode, pTrans);
    ++idx;
  }

  // todo, set to SDB_WRITE_DELTA
  sdbWriteFile(pSdb, 0);
  taosArrayDestroy(pIds);
}
S
Shengliang Guan 已提交
1437

S
Shengliang Guan 已提交
1438 1439
// Folds the return value of one snprintf() call into the running length of a
// buffer that holds `cap` bytes.
//
// `len` is the number of characters already in the buffer (0 <= len < cap) and
// `written` is what snprintf(buf + len, cap - len, ...) returned. snprintf
// reports the length the output WOULD have had, so on truncation the naive
// `len += written` runs past the buffer. The result is therefore clamped to
// cap - 1, which keeps `cap - len` at least 1 for the next call. A negative
// `written` (output error) leaves the length unchanged.
static int32_t mndTransDetailLen(int32_t len, int32_t written, int32_t cap) {
  if (written < 0) return len;
  if (written >= cap - len) return cap - 1;
  return len + written;
}

// Fills `pBlock` with up to `rows` transactions for a show/retrieve request.
//
// Iteration state is kept in pShow->pIter so that successive calls continue
// where the previous one stopped. For every transaction one row is appended
// with these columns, in order: id, createdTime, stage, dbname1, dbname2,
// failedTimes, lastExecTime and a "last info" string describing the last
// action, its error code and, when present, the last endpoint set.
//
// Returns the number of rows appended by this call; the same amount is added
// to pShow->numOfRows.
static int32_t mndRetrieveTrans(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode *pMnode = pReq->info.node;
  SSdb   *pSdb = pMnode->pSdb;
  int32_t numOfRows = 0;
  STrans *pTrans = NULL;
  int32_t cols = 0;

  while (numOfRows < rows) {
    pShow->pIter = sdbFetch(pSdb, SDB_TRANS, pShow->pIter, (void **)&pTrans);
    if (pShow->pIter == NULL) break;

    cols = 0;

    SColumnInfoData *pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->id, false);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->createdTime, false);

    char stage[TSDB_TRANS_STAGE_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(stage, mndTransStr(pTrans->stage), pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)stage, false);

    char dbname1[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(dbname1, mndGetDbStr(pTrans->dbname1), pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)dbname1, false);

    char dbname2[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(dbname2, mndGetDbStr(pTrans->dbname2), pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)dbname2, false);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->failedTimes, false);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->lastExecTime, false);

    // Build the human-readable "last info" text. Every snprintf() result goes
    // through mndTransDetailLen() so that a truncated write can never push
    // `len` past the end of `detail`.
    char    lastInfo[TSDB_TRANS_ERROR_LEN + VARSTR_HEADER_SIZE] = {0};
    char    detail[TSDB_TRANS_ERROR_LEN] = {0};
    int32_t cap = (int32_t)sizeof(detail);
    int32_t written = snprintf(detail, cap, "action:%d code:0x%x(%s) ", pTrans->lastAction,
                               pTrans->lastErrorNo & 0xFFFF, tstrerror(pTrans->lastErrorNo));
    int32_t len = mndTransDetailLen(0, written, cap);
    SEpSet  epset = pTrans->lastEpset;
    if (epset.numOfEps > 0) {
      written = snprintf(detail + len, cap - len, "msgType:%s numOfEps:%d inUse:%d ", TMSG_INFO(pTrans->lastMsgType),
                         epset.numOfEps, epset.inUse);
      len = mndTransDetailLen(len, written, cap);
      // Stop early once the buffer is full; further endpoints could not be stored anyway.
      for (int32_t i = 0; i < epset.numOfEps && len < cap - 1; ++i) {
        written = snprintf(detail + len, cap - len, "ep:%d-%s:%u ", i, epset.eps[i].fqdn, epset.eps[i].port);
        len = mndTransDetailLen(len, written, cap);
      }
    }
    // Keep the text terminated at the tracked length even if a write reported an error.
    detail[len] = '\0';
    STR_WITH_MAXSIZE_TO_VARSTR(lastInfo, detail, pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)lastInfo, false);

    numOfRows++;
    sdbRelease(pSdb, pTrans);
  }

  pShow->numOfRows += numOfRows;
  return numOfRows;
}

// Cancels an in-progress transaction fetch by passing `pIter` to
// sdbCancelFetch() on this mnode's sdb.
static void mndCancelGetNextTrans(SMnode *pMnode, void *pIter) {
  sdbCancelFetch(pMnode->pSdb, pIter);
}