mndTrans.c 55.4 KB
Newer Older
S
Shengliang Guan 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

#define _DEFAULT_SOURCE
S
Shengliang Guan 已提交
17
#include "mndTrans.h"
L
Liu Jicong 已提交
18
#include "mndConsumer.h"
S
Shengliang Guan 已提交
19
#include "mndDb.h"
20
#include "mndPrivilege.h"
S
Shengliang Guan 已提交
21
#include "mndShow.h"
S
Shengliang Guan 已提交
22
#include "mndSync.h"
S
Shengliang Guan 已提交
23
#include "mndUser.h"
S
Shengliang Guan 已提交
24

25 26
#define TRANS_VER_NUMBER   1
#define TRANS_ARRAY_SIZE   8
S
Shengliang Guan 已提交
27
#define TRANS_RESERVE_SIZE 64
S
Shengliang Guan 已提交
28

S
Shengliang Guan 已提交
29 30 31
static SSdbRaw *mndTransActionEncode(STrans *pTrans);
static SSdbRow *mndTransActionDecode(SSdbRaw *pRaw);
static int32_t  mndTransActionInsert(SSdb *pSdb, STrans *pTrans);
S
Shengliang Guan 已提交
32
static int32_t  mndTransActionUpdate(SSdb *pSdb, STrans *OldTrans, STrans *pOld);
33
static int32_t  mndTransActionDelete(SSdb *pSdb, STrans *pTrans, bool callFunc);
S
Shengliang Guan 已提交
34

S
Shengliang Guan 已提交
35
static int32_t mndTransAppendLog(SArray *pArray, SSdbRaw *pRaw);
S
Shengliang Guan 已提交
36
static int32_t mndTransAppendAction(SArray *pArray, STransAction *pAction);
S
Shengliang Guan 已提交
37 38
static void    mndTransDropLogs(SArray *pArray);
static void    mndTransDropActions(SArray *pArray);
39
static void    mndTransDropData(STrans *pTrans);
40
static int32_t mndTransExecuteActions(SMnode *pMnode, STrans *pTrans, SArray *pArray);
S
Shengliang Guan 已提交
41 42 43 44
static int32_t mndTransExecuteRedoLogs(SMnode *pMnode, STrans *pTrans);
static int32_t mndTransExecuteUndoLogs(SMnode *pMnode, STrans *pTrans);
static int32_t mndTransExecuteRedoActions(SMnode *pMnode, STrans *pTrans);
static int32_t mndTransExecuteUndoActions(SMnode *pMnode, STrans *pTrans);
45
static int32_t mndTransExecuteCommitActions(SMnode *pMnode, STrans *pTrans);
S
Shengliang Guan 已提交
46 47 48 49 50
static bool    mndTransPerformPrepareStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformRedoLogStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformRedoActionStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformUndoLogStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformUndoActionStage(SMnode *pMnode, STrans *pTrans);
51
static bool    mndTransPerformCommitActionStage(SMnode *pMnode, STrans *pTrans);
S
Shengliang Guan 已提交
52 53 54
static bool    mndTransPerformCommitStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerformRollbackStage(SMnode *pMnode, STrans *pTrans);
static bool    mndTransPerfromFinishedStage(SMnode *pMnode, STrans *pTrans);
55
// Returns true when pMnode->deploy is not set and mndIsMaster() reports false
// for this mnode; returns false otherwise.
static bool mndCannotExecuteTransAction(SMnode *pMnode) {
  return !(pMnode->deploy || mndIsMaster(pMnode));
}
S
Shengliang Guan 已提交
56

57
static void    mndTransSendRpcRsp(SMnode *pMnode, STrans *pTrans);
58
static int32_t mndProcessTransTimer(SRpcMsg *pReq);
wmmhello's avatar
wmmhello 已提交
59
static int32_t mndProcessTtl(SRpcMsg *pReq);
S
Shengliang Guan 已提交
60
static int32_t mndProcessKillTransReq(SRpcMsg *pReq);
S
Shengliang Guan 已提交
61

S
Shengliang Guan 已提交
62
static int32_t mndRetrieveTrans(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
S
Shengliang Guan 已提交
63 64
static void    mndCancelGetNextTrans(SMnode *pMnode, void *pIter);

S
Shengliang Guan 已提交
65
/*
 * Set up the transaction module for one mnode: register the two message
 * handlers and the two show callbacks implemented in this file, then install
 * the SDB_TRANS table description into the mnode's sdb.
 *
 * Returns whatever sdbSetTable() returns.
 */
int32_t mndInitTrans(SMnode *pMnode) {
  SSdbTable transTable = {0};
  transTable.sdbType = SDB_TRANS;
  transTable.keyType = SDB_KEY_INT32;
  transTable.encodeFp = (SdbEncodeFp)mndTransActionEncode;
  transTable.decodeFp = (SdbDecodeFp)mndTransActionDecode;
  transTable.insertFp = (SdbInsertFp)mndTransActionInsert;
  transTable.updateFp = (SdbUpdateFp)mndTransActionUpdate;
  transTable.deleteFp = (SdbDeleteFp)mndTransActionDelete;

  // message handlers
  mndSetMsgHandle(pMnode, TDMT_MND_TRANS_TIMER, mndProcessTransTimer);
  mndSetMsgHandle(pMnode, TDMT_MND_KILL_TRANS, mndProcessKillTransReq);

  // "show" support for the transaction table
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_TRANS, mndRetrieveTrans);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_TRANS, mndCancelGetNextTrans);

  return sdbSetTable(pMnode->pSdb, transTable);
}

// Counterpart of mndInitTrans(); intentionally performs no work.
void mndCleanupTrans(SMnode *pMnode) {
  (void)pMnode;
}

86 87 88
/*
 * Return an upper bound, in bytes, for serializing every action in pArray.
 *
 * The encoder writes a group of fixed fields for every action regardless of
 * its type (id, errCode, acceptableCode, retryCode and three int8 fields),
 * followed by type-specific fields and the payload. The previous estimate
 * reserved only payload + sizeof(int32_t) for raw actions and nothing for
 * payload-less actions, which is less than what the encoder writes. Every
 * action therefore now reserves sizeof(STransAction) for its fixed fields,
 * the same allowance message actions already had, plus its payload.
 */
static int32_t mndTransGetActionsSize(SArray *pArray) {
  int32_t actionNum = taosArrayGetSize(pArray);
  int32_t rawDataLen = 0;

  for (int32_t i = 0; i < actionNum; ++i) {
    STransAction *pAction = taosArrayGet(pArray, i);

    // fixed fields written for every action type
    rawDataLen += sizeof(STransAction);

    // variable-length payload
    if (pAction->actionType == TRANS_ACTION_RAW) {
      rawDataLen += sdbGetRawTotalSize(pAction->pRaw);
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
      rawDataLen += pAction->contLen;
    } else {
      // no payload
    }

    rawDataLen += sizeof(int8_t);
  }

  return rawDataLen;
}
S
Shengliang Guan 已提交
104

105 106
static SSdbRaw *mndTransActionEncode(STrans *pTrans) {
  terrno = TSDB_CODE_OUT_OF_MEMORY;
S
Shengliang Guan 已提交
107

108 109 110 111
  int32_t rawDataLen = sizeof(STrans) + TRANS_RESERVE_SIZE;
  rawDataLen += mndTransGetActionsSize(pTrans->redoActions);
  rawDataLen += mndTransGetActionsSize(pTrans->undoActions);
  rawDataLen += mndTransGetActionsSize(pTrans->commitActions);
S
Shengliang Guan 已提交
112

S
Shengliang Guan 已提交
113
  SSdbRaw *pRaw = sdbAllocRaw(SDB_TRANS, TRANS_VER_NUMBER, rawDataLen);
S
Shengliang Guan 已提交
114
  if (pRaw == NULL) {
S
Shengliang Guan 已提交
115
    mError("trans:%d, failed to alloc raw since %s", pTrans->id, terrstr());
S
Shengliang Guan 已提交
116 117 118 119
    return NULL;
  }

  int32_t dataPos = 0;
120
  SDB_SET_INT32(pRaw, dataPos, pTrans->id, _OVER)
S
Shengliang Guan 已提交
121 122 123 124
  SDB_SET_INT8(pRaw, dataPos, pTrans->stage, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pTrans->policy, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pTrans->conflict, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pTrans->exec, _OVER)
125
  SDB_SET_INT64(pRaw, dataPos, pTrans->createdTime, _OVER)
126 127
  SDB_SET_BINARY(pRaw, dataPos, pTrans->dbname1, TSDB_DB_FNAME_LEN, _OVER)
  SDB_SET_BINARY(pRaw, dataPos, pTrans->dbname2, TSDB_DB_FNAME_LEN, _OVER)
128
  SDB_SET_INT32(pRaw, dataPos, pTrans->redoActionPos, _OVER)
129 130 131 132

  int32_t redoActionNum = taosArrayGetSize(pTrans->redoActions);
  int32_t undoActionNum = taosArrayGetSize(pTrans->undoActions);
  int32_t commitActionNum = taosArrayGetSize(pTrans->commitActions);
133 134
  SDB_SET_INT32(pRaw, dataPos, redoActionNum, _OVER)
  SDB_SET_INT32(pRaw, dataPos, undoActionNum, _OVER)
135
  SDB_SET_INT32(pRaw, dataPos, commitActionNum, _OVER)
S
Shengliang Guan 已提交
136

S
Shengliang Guan 已提交
137 138
  for (int32_t i = 0; i < redoActionNum; ++i) {
    STransAction *pAction = taosArrayGet(pTrans->redoActions, i);
139 140 141
    SDB_SET_INT32(pRaw, dataPos, pAction->id, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->errCode, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->acceptableCode, _OVER)
142
    SDB_SET_INT32(pRaw, dataPos, pAction->retryCode, _OVER)
143
    SDB_SET_INT8(pRaw, dataPos, pAction->actionType, _OVER)
144
    SDB_SET_INT8(pRaw, dataPos, pAction->stage, _OVER)
145
    SDB_SET_INT8(pRaw, dataPos, pAction->reserved, _OVER)
146
    if (pAction->actionType == TRANS_ACTION_RAW) {
147
      int32_t len = sdbGetRawTotalSize(pAction->pRaw);
148
      SDB_SET_INT8(pRaw, dataPos, pAction->rawWritten, _OVER)
149 150
      SDB_SET_INT32(pRaw, dataPos, len, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, (void *)pAction->pRaw, len, _OVER)
151
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
152 153
      SDB_SET_BINARY(pRaw, dataPos, (void *)&pAction->epSet, sizeof(SEpSet), _OVER)
      SDB_SET_INT16(pRaw, dataPos, pAction->msgType, _OVER)
154 155
      SDB_SET_INT8(pRaw, dataPos, pAction->msgSent, _OVER)
      SDB_SET_INT8(pRaw, dataPos, pAction->msgReceived, _OVER)
156 157
      SDB_SET_INT32(pRaw, dataPos, pAction->contLen, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, pAction->pCont, pAction->contLen, _OVER)
158 159
    } else {
      // nothing
160
    }
S
Shengliang Guan 已提交
161 162 163 164
  }

  for (int32_t i = 0; i < undoActionNum; ++i) {
    STransAction *pAction = taosArrayGet(pTrans->undoActions, i);
165 166 167
    SDB_SET_INT32(pRaw, dataPos, pAction->id, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->errCode, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->acceptableCode, _OVER)
168
    SDB_SET_INT32(pRaw, dataPos, pAction->retryCode, _OVER)
169
    SDB_SET_INT8(pRaw, dataPos, pAction->actionType, _OVER)
170
    SDB_SET_INT8(pRaw, dataPos, pAction->stage, _OVER)
171
    SDB_SET_INT8(pRaw, dataPos, pAction->reserved, _OVER)
172
    if (pAction->actionType == TRANS_ACTION_RAW) {
173
      int32_t len = sdbGetRawTotalSize(pAction->pRaw);
174
      SDB_SET_INT8(pRaw, dataPos, pAction->rawWritten, _OVER)
175 176
      SDB_SET_INT32(pRaw, dataPos, len, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, (void *)pAction->pRaw, len, _OVER)
177
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
178 179
      SDB_SET_BINARY(pRaw, dataPos, (void *)&pAction->epSet, sizeof(SEpSet), _OVER)
      SDB_SET_INT16(pRaw, dataPos, pAction->msgType, _OVER)
180 181
      SDB_SET_INT8(pRaw, dataPos, pAction->msgSent, _OVER)
      SDB_SET_INT8(pRaw, dataPos, pAction->msgReceived, _OVER)
182 183
      SDB_SET_INT32(pRaw, dataPos, pAction->contLen, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, pAction->pCont, pAction->contLen, _OVER)
184 185
    } else {
      // nothing
186 187 188 189 190
    }
  }

  for (int32_t i = 0; i < commitActionNum; ++i) {
    STransAction *pAction = taosArrayGet(pTrans->commitActions, i);
191 192 193
    SDB_SET_INT32(pRaw, dataPos, pAction->id, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->errCode, _OVER)
    SDB_SET_INT32(pRaw, dataPos, pAction->acceptableCode, _OVER)
194
    SDB_SET_INT32(pRaw, dataPos, pAction->retryCode, _OVER)
195
    SDB_SET_INT8(pRaw, dataPos, pAction->actionType, _OVER)
196
    SDB_SET_INT8(pRaw, dataPos, pAction->stage, _OVER)
197
    SDB_SET_INT8(pRaw, dataPos, pAction->reserved, _OVER)
198
    if (pAction->actionType == TRANS_ACTION_RAW) {
199
      int32_t len = sdbGetRawTotalSize(pAction->pRaw);
200
      SDB_SET_INT8(pRaw, dataPos, pAction->rawWritten, _OVER)
201 202
      SDB_SET_INT32(pRaw, dataPos, len, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, (void *)pAction->pRaw, len, _OVER)
203
    } else if (pAction->actionType == TRANS_ACTION_MSG) {
204 205
      SDB_SET_BINARY(pRaw, dataPos, (void *)&pAction->epSet, sizeof(SEpSet), _OVER)
      SDB_SET_INT16(pRaw, dataPos, pAction->msgType, _OVER)
206 207
      SDB_SET_INT8(pRaw, dataPos, pAction->msgSent, _OVER)
      SDB_SET_INT8(pRaw, dataPos, pAction->msgReceived, _OVER)
208 209
      SDB_SET_INT32(pRaw, dataPos, pAction->contLen, _OVER)
      SDB_SET_BINARY(pRaw, dataPos, pAction->pCont, pAction->contLen, _OVER)
210 211
    } else {
      // nothing
212
    }
213 214
  }

215 216 217
  SDB_SET_INT32(pRaw, dataPos, pTrans->startFunc, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pTrans->stopFunc, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pTrans->paramLen, _OVER)
218
  if (pTrans->param != NULL) {
219
    SDB_SET_BINARY(pRaw, dataPos, pTrans->param, pTrans->paramLen, _OVER)
220 221
  }

222 223
  SDB_SET_RESERVE(pRaw, dataPos, TRANS_RESERVE_SIZE, _OVER)
  SDB_SET_DATALEN(pRaw, dataPos, _OVER)
224 225 226

  terrno = 0;

227
_OVER:
228 229 230 231
  if (terrno != 0) {
    mError("trans:%d, failed to encode to raw:%p len:%d since %s", pTrans->id, pRaw, dataPos, terrstr());
    sdbFreeRaw(pRaw);
    return NULL;
S
Shengliang Guan 已提交
232 233
  }

S
Shengliang Guan 已提交
234
  mTrace("trans:%d, encode to raw:%p, row:%p len:%d", pTrans->id, pRaw, pTrans, dataPos);
S
Shengliang Guan 已提交
235 236 237
  return pRaw;
}

S
Shengliang Guan 已提交
238
static SSdbRow *mndTransActionDecode(SSdbRaw *pRaw) {
239 240
  terrno = TSDB_CODE_OUT_OF_MEMORY;

241 242 243
  SSdbRow     *pRow = NULL;
  STrans      *pTrans = NULL;
  char        *pData = NULL;
244 245 246 247
  int32_t      dataLen = 0;
  int8_t       sver = 0;
  int32_t      redoActionNum = 0;
  int32_t      undoActionNum = 0;
248
  int32_t      commitActionNum = 0;
249 250 251
  int32_t      dataPos = 0;
  STransAction action = {0};

S
Shengliang Guan 已提交
252
  if (sdbGetRawSoftVer(pRaw, &sver) != 0) goto _OVER;
S
Shengliang Guan 已提交
253

S
Shengliang Guan 已提交
254
  if (sver != TRANS_VER_NUMBER) {
S
Shengliang Guan 已提交
255
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
S
Shengliang Guan 已提交
256
    goto _OVER;
S
Shengliang Guan 已提交
257 258
  }

259
  pRow = sdbAllocRow(sizeof(STrans));
S
Shengliang Guan 已提交
260
  if (pRow == NULL) goto _OVER;
261 262

  pTrans = sdbGetRowObj(pRow);
S
Shengliang Guan 已提交
263
  if (pTrans == NULL) goto _OVER;
S
Shengliang Guan 已提交
264

S
Shengliang Guan 已提交
265
  SDB_GET_INT32(pRaw, dataPos, &pTrans->id, _OVER)
S
Shengliang Guan 已提交
266

S
Shengliang Guan 已提交
267 268 269 270 271 272 273 274 275
  int8_t stage = 0;
  int8_t policy = 0;
  int8_t conflict = 0;
  int8_t exec = 0;
  int8_t actionType = 0;
  SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &policy, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &conflict, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &exec, _OVER)
S
Shengliang Guan 已提交
276
  pTrans->stage = stage;
277
  pTrans->policy = policy;
278 279
  pTrans->conflict = conflict;
  pTrans->exec = exec;
S
Shengliang Guan 已提交
280
  SDB_GET_INT64(pRaw, dataPos, &pTrans->createdTime, _OVER)
281 282
  SDB_GET_BINARY(pRaw, dataPos, pTrans->dbname1, TSDB_DB_FNAME_LEN, _OVER)
  SDB_GET_BINARY(pRaw, dataPos, pTrans->dbname2, TSDB_DB_FNAME_LEN, _OVER)
283
  SDB_GET_INT32(pRaw, dataPos, &pTrans->redoActionPos, _OVER)
S
Shengliang Guan 已提交
284 285
  SDB_GET_INT32(pRaw, dataPos, &redoActionNum, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &undoActionNum, _OVER)
286
  SDB_GET_INT32(pRaw, dataPos, &commitActionNum, _OVER)
S
Shengliang Guan 已提交
287

S
Shengliang Guan 已提交
288 289
  pTrans->redoActions = taosArrayInit(redoActionNum, sizeof(STransAction));
  pTrans->undoActions = taosArrayInit(undoActionNum, sizeof(STransAction));
290
  pTrans->commitActions = taosArrayInit(commitActionNum, sizeof(STransAction));
S
Shengliang Guan 已提交
291

S
Shengliang Guan 已提交
292 293
  if (pTrans->redoActions == NULL) goto _OVER;
  if (pTrans->undoActions == NULL) goto _OVER;
294
  if (pTrans->commitActions == NULL) goto _OVER;
S
Shengliang Guan 已提交
295 296

  for (int32_t i = 0; i < redoActionNum; ++i) {
297 298 299
    SDB_GET_INT32(pRaw, dataPos, &action.id, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.errCode, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.acceptableCode, _OVER)
300
    SDB_GET_INT32(pRaw, dataPos, &action.retryCode, _OVER)
301 302
    SDB_GET_INT8(pRaw, dataPos, &actionType, _OVER)
    action.actionType = actionType;
S
Shengliang Guan 已提交
303 304
    SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
    action.stage = stage;
305
    SDB_GET_INT8(pRaw, dataPos, &action.reserved, _OVER)
306
    if (action.actionType == TRANS_ACTION_RAW) {
307
      SDB_GET_INT8(pRaw, dataPos, &action.rawWritten, _OVER)
308
      SDB_GET_INT32(pRaw, dataPos, &dataLen, _OVER)
309 310
      action.pRaw = taosMemoryMalloc(dataLen);
      if (action.pRaw == NULL) goto _OVER;
S
Shengliang Guan 已提交
311
      // mTrace("raw:%p, is created", pData);
312 313 314
      SDB_GET_BINARY(pRaw, dataPos, (void *)action.pRaw, dataLen, _OVER);
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
      action.pRaw = NULL;
315
    } else if (action.actionType == TRANS_ACTION_MSG) {
316 317
      SDB_GET_BINARY(pRaw, dataPos, (void *)&action.epSet, sizeof(SEpSet), _OVER);
      SDB_GET_INT16(pRaw, dataPos, &action.msgType, _OVER)
318 319
      SDB_GET_INT8(pRaw, dataPos, &action.msgSent, _OVER)
      SDB_GET_INT8(pRaw, dataPos, &action.msgReceived, _OVER)
320 321 322 323 324 325
      SDB_GET_INT32(pRaw, dataPos, &action.contLen, _OVER)
      action.pCont = taosMemoryMalloc(action.contLen);
      if (action.pCont == NULL) goto _OVER;
      SDB_GET_BINARY(pRaw, dataPos, action.pCont, action.contLen, _OVER);
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
      action.pCont = NULL;
326 327
    } else {
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
328
    }
S
Shengliang Guan 已提交
329 330 331
  }

  for (int32_t i = 0; i < undoActionNum; ++i) {
332 333 334
    SDB_GET_INT32(pRaw, dataPos, &action.id, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.errCode, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.acceptableCode, _OVER)
335
    SDB_GET_INT32(pRaw, dataPos, &action.retryCode, _OVER)
336 337
    SDB_GET_INT8(pRaw, dataPos, &actionType, _OVER)
    action.actionType = actionType;
S
Shengliang Guan 已提交
338 339
    SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
    action.stage = stage;
340
    SDB_GET_INT8(pRaw, dataPos, &action.reserved, _OVER)
341
    if (action.actionType == TRANS_ACTION_RAW) {
342
      SDB_GET_INT8(pRaw, dataPos, &action.rawWritten, _OVER)
343
      SDB_GET_INT32(pRaw, dataPos, &dataLen, _OVER)
344 345
      action.pRaw = taosMemoryMalloc(dataLen);
      if (action.pRaw == NULL) goto _OVER;
S
Shengliang Guan 已提交
346
      // mTrace("raw:%p, is created", action.pRaw);
347 348 349
      SDB_GET_BINARY(pRaw, dataPos, (void *)action.pRaw, dataLen, _OVER);
      if (taosArrayPush(pTrans->undoActions, &action) == NULL) goto _OVER;
      action.pRaw = NULL;
350
    } else if (action.actionType == TRANS_ACTION_MSG) {
351 352
      SDB_GET_BINARY(pRaw, dataPos, (void *)&action.epSet, sizeof(SEpSet), _OVER);
      SDB_GET_INT16(pRaw, dataPos, &action.msgType, _OVER)
353 354
      SDB_GET_INT8(pRaw, dataPos, &action.msgSent, _OVER)
      SDB_GET_INT8(pRaw, dataPos, &action.msgReceived, _OVER)
355 356 357 358 359 360
      SDB_GET_INT32(pRaw, dataPos, &action.contLen, _OVER)
      action.pCont = taosMemoryMalloc(action.contLen);
      if (action.pCont == NULL) goto _OVER;
      SDB_GET_BINARY(pRaw, dataPos, action.pCont, action.contLen, _OVER);
      if (taosArrayPush(pTrans->undoActions, &action) == NULL) goto _OVER;
      action.pCont = NULL;
361 362
    } else {
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
363 364 365 366
    }
  }

  for (int32_t i = 0; i < commitActionNum; ++i) {
367 368 369
    SDB_GET_INT32(pRaw, dataPos, &action.id, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.errCode, _OVER)
    SDB_GET_INT32(pRaw, dataPos, &action.acceptableCode, _OVER)
370
    SDB_GET_INT32(pRaw, dataPos, &action.retryCode, _OVER)
371 372
    SDB_GET_INT8(pRaw, dataPos, &actionType, _OVER)
    action.actionType = actionType;
S
Shengliang Guan 已提交
373 374
    SDB_GET_INT8(pRaw, dataPos, &stage, _OVER)
    action.stage = stage;
375
    SDB_GET_INT8(pRaw, dataPos, &action.reserved, _OVER)
376
    if (action.actionType) {
377
      SDB_GET_INT8(pRaw, dataPos, &action.rawWritten, _OVER)
378
      SDB_GET_INT32(pRaw, dataPos, &dataLen, _OVER)
379 380
      action.pRaw = taosMemoryMalloc(dataLen);
      if (action.pRaw == NULL) goto _OVER;
S
Shengliang Guan 已提交
381
      // mTrace("raw:%p, is created", action.pRaw);
382 383 384
      SDB_GET_BINARY(pRaw, dataPos, (void *)action.pRaw, dataLen, _OVER);
      if (taosArrayPush(pTrans->commitActions, &action) == NULL) goto _OVER;
      action.pRaw = NULL;
385
    } else if (action.actionType == TRANS_ACTION_MSG) {
386 387
      SDB_GET_BINARY(pRaw, dataPos, (void *)&action.epSet, sizeof(SEpSet), _OVER);
      SDB_GET_INT16(pRaw, dataPos, &action.msgType, _OVER)
388 389
      SDB_GET_INT8(pRaw, dataPos, &action.msgSent, _OVER)
      SDB_GET_INT8(pRaw, dataPos, &action.msgReceived, _OVER)
390 391 392 393 394 395
      SDB_GET_INT32(pRaw, dataPos, &action.contLen, _OVER)
      action.pCont = taosMemoryMalloc(action.contLen);
      if (action.pCont == NULL) goto _OVER;
      SDB_GET_BINARY(pRaw, dataPos, action.pCont, action.contLen, _OVER);
      if (taosArrayPush(pTrans->commitActions, &action) == NULL) goto _OVER;
      action.pCont = NULL;
396 397
    } else {
      if (taosArrayPush(pTrans->redoActions, &action) == NULL) goto _OVER;
398
    }
S
Shengliang Guan 已提交
399 400
  }

S
Shengliang Guan 已提交
401 402 403
  SDB_GET_INT32(pRaw, dataPos, &pTrans->startFunc, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pTrans->stopFunc, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pTrans->paramLen, _OVER)
404 405
  if (pTrans->paramLen != 0) {
    pTrans->param = taosMemoryMalloc(pTrans->paramLen);
S
Shengliang Guan 已提交
406
    SDB_GET_BINARY(pRaw, dataPos, pTrans->param, pTrans->paramLen, _OVER);
407 408
  }

S
Shengliang Guan 已提交
409
  SDB_GET_RESERVE(pRaw, dataPos, TRANS_RESERVE_SIZE, _OVER)
410 411

  terrno = 0;
S
Shengliang Guan 已提交
412

S
Shengliang Guan 已提交
413
_OVER:
414 415 416
  if (terrno != 0) {
    mError("trans:%d, failed to parse from raw:%p since %s", pTrans->id, pRaw, terrstr());
    mndTransDropData(pTrans);
wafwerar's avatar
wafwerar 已提交
417 418
    taosMemoryFreeClear(pRow);
    taosMemoryFreeClear(action.pCont);
S
Shengliang Guan 已提交
419 420 421
    return NULL;
  }

S
Shengliang Guan 已提交
422
  mTrace("trans:%d, decode from raw:%p, row:%p", pTrans->id, pRaw, pTrans);
S
Shengliang Guan 已提交
423 424 425
  return pRow;
}

S
Shengliang Guan 已提交
426 427 428 429 430 431 432 433
// Map a transaction stage to the name used in log messages; stages without
// an entry here are reported as "invalid".
static const char *mndTransStr(ETrnStage stage) {
  const char *name = "invalid";

  switch (stage) {
    case TRN_STAGE_PREPARE:
      name = "prepare";
      break;
    case TRN_STAGE_REDO_ACTION:
      name = "redoAction";
      break;
    case TRN_STAGE_ROLLBACK:
      name = "rollback";
      break;
    case TRN_STAGE_UNDO_ACTION:
      name = "undoAction";
      break;
    case TRN_STAGE_COMMIT:
      name = "commit";
      break;
    case TRN_STAGE_COMMIT_ACTION:
      name = "commitAction";
      break;
    case TRN_STAGE_FINISHED:
      name = "finished";
      break;
    default:
      break;
  }

  return name;
}

447
// Start callback returned for TRANS_START_FUNC_TEST: logs the parameter,
// which is printed as a C string, together with its length.
static void mndTransTestStartFunc(SMnode *pMnode, void *param, int32_t paramLen) {
  char *text = (char *)param;
  mDebug("test trans start, param:%s, len:%d", text, paramLen);
}

// Stop callback returned for TRANS_STOP_FUNC_TEST: logs the parameter,
// which is printed as a C string, together with its length.
static void mndTransTestStopFunc(SMnode *pMnode, void *param, int32_t paramLen) {
  char *text = (char *)param;
  mDebug("test trans stop, param:%s, len:%d", text, paramLen);
}

S
Shengliang Guan 已提交
455
// Resolve a callback identifier to the function implementing it.
// Returns NULL for identifiers that have no callback registered here.
static TransCbFp mndTransGetCbFp(ETrnFunc ftype) {
  if (ftype == TRANS_START_FUNC_TEST) return mndTransTestStartFunc;
  if (ftype == TRANS_STOP_FUNC_TEST) return mndTransTestStopFunc;
  if (ftype == TRANS_START_FUNC_MQ_REB) return mndRebCntInc;
  if (ftype == TRANS_STOP_FUNC_MQ_REB) return mndRebCntDec;
  return NULL;
}

S
Shengliang Guan 已提交
470
/*
 * sdb insert callback for a transaction row.
 *
 * When the row carries a start callback id (> 0), the callback is looked up
 * and, if found, invoked with the transaction's param; the id is then
 * cleared so the callback is not run again for this row. Always returns 0.
 */
static int32_t mndTransActionInsert(SSdb *pSdb, STrans *pTrans) {
  mTrace("trans:%d, perform insert action, row:%p stage:%s", pTrans->id, pTrans, mndTransStr(pTrans->stage));

  if (pTrans->startFunc <= 0) {
    return 0;
  }

  TransCbFp startFp = mndTransGetCbFp(pTrans->startFunc);
  if (startFp != NULL) {
    startFp(pSdb->pMnode, pTrans->param, pTrans->paramLen);
  }
  pTrans->startFunc = 0;

  return 0;
}

484
/*
 * Release everything a transaction owns: the three action arrays, the rpc
 * response buffer and the callback parameter. Each pointer is reset to NULL
 * after it is released, and the lengths paired with the two buffers are
 * zeroed. The STrans object itself is not freed.
 */
static void mndTransDropData(STrans *pTrans) {
  SArray **ppLists[] = {&pTrans->redoActions, &pTrans->undoActions, &pTrans->commitActions};
  int32_t  listNum = (int32_t)(sizeof(ppLists) / sizeof(ppLists[0]));

  for (int32_t i = 0; i < listNum; ++i) {
    SArray **ppList = ppLists[i];
    if (*ppList == NULL) continue;
    mndTransDropActions(*ppList);
    *ppList = NULL;
  }

  if (pTrans->rpcRsp != NULL) {
    taosMemoryFree(pTrans->rpcRsp);
    pTrans->rpcRsp = NULL;
    pTrans->rpcRspLen = 0;
  }

  if (pTrans->param != NULL) {
    taosMemoryFree(pTrans->param);
    pTrans->param = NULL;
    pTrans->paramLen = 0;
  }
}
S
Shengliang Guan 已提交
508

509
/*
 * sdb delete callback for a transaction row.
 *
 * If callFunc is set and the row carries a stop callback id (> 0), the
 * callback is looked up and, if found, invoked with the transaction's param;
 * the id is then cleared. Afterwards all data owned by the row is released.
 * Always returns 0.
 */
static int32_t mndTransActionDelete(SSdb *pSdb, STrans *pTrans, bool callFunc) {
  mTrace("trans:%d, perform delete action, row:%p stage:%s callfunc:%d", pTrans->id, pTrans, mndTransStr(pTrans->stage),
         callFunc);

  bool runStopFunc = callFunc && (pTrans->stopFunc > 0);
  if (runStopFunc) {
    TransCbFp stopFp = mndTransGetCbFp(pTrans->stopFunc);
    if (stopFp != NULL) {
      stopFp(pSdb->pMnode, pTrans->param, pTrans->paramLen);
    }
    pTrans->stopFunc = 0;
  }

  mndTransDropData(pTrans);
  return 0;
}

524 525 526 527 528 529 530 531
// Copy the progress fields (rawWritten, msgSent, msgReceived, errCode) of
// every action in pNewArray onto the action at the same index in pOldArray.
// The loop is driven by the size of pOldArray.
static void mndTransUpdateActions(SArray *pOldArray, SArray *pNewArray) {
  int32_t actionNum = taosArrayGetSize(pOldArray);
  int32_t idx = 0;

  while (idx < actionNum) {
    STransAction *pDst = taosArrayGet(pOldArray, idx);
    STransAction *pSrc = taosArrayGet(pNewArray, idx);

    pDst->rawWritten = pSrc->rawWritten;
    pDst->msgSent = pSrc->msgSent;
    pDst->msgReceived = pSrc->msgReceived;
    pDst->errCode = pSrc->errCode;

    ++idx;
  }
}
534

535
/*
 * sdb update callback for a transaction row.
 *
 * Copies the per-action progress of pNew onto pOld, then takes over pNew's
 * stage and redoActionPos. Two stages are advanced as part of the update:
 *   commit   -> commitAction
 *   rollback -> undoAction
 *
 * The rollback branch previously assigned TRN_STAGE_REDO_ACTION, which
 * contradicted both its own log message and the parallel commit branch.
 *
 * Always returns 0.
 */
static int32_t mndTransActionUpdate(SSdb *pSdb, STrans *pOld, STrans *pNew) {
  mTrace("trans:%d, perform update action, old row:%p stage:%s, new row:%p stage:%s", pOld->id, pOld,
         mndTransStr(pOld->stage), pNew, mndTransStr(pNew->stage));
  mndTransUpdateActions(pOld->redoActions, pNew->redoActions);
  mndTransUpdateActions(pOld->undoActions, pNew->undoActions);
  mndTransUpdateActions(pOld->commitActions, pNew->commitActions);
  pOld->stage = pNew->stage;
  pOld->redoActionPos = pNew->redoActionPos;

  if (pOld->stage == TRN_STAGE_COMMIT) {
    pOld->stage = TRN_STAGE_COMMIT_ACTION;
    mTrace("trans:%d, stage from commit to commitAction since perform update action", pNew->id);
  }

  if (pOld->stage == TRN_STAGE_ROLLBACK) {
    pOld->stage = TRN_STAGE_UNDO_ACTION;
    mTrace("trans:%d, stage from rollback to undoAction since perform update action", pNew->id);
  }

  return 0;
}

557
// Look up a transaction by id through sdbAcquire(). Returns the object, or
// NULL with terrno set to TSDB_CODE_MND_TRANS_NOT_EXIST when the lookup
// yields nothing. Pair with mndReleaseTrans().
STrans *mndAcquireTrans(SMnode *pMnode, int32_t transId) {
  STrans *pFound = sdbAcquire(pMnode->pSdb, SDB_TRANS, &transId);
  if (pFound != NULL) {
    return pFound;
  }

  terrno = TSDB_CODE_MND_TRANS_NOT_EXIST;
  return NULL;
}

565
// Hand a transaction obtained from mndAcquireTrans() back via sdbRelease().
void mndReleaseTrans(SMnode *pMnode, STrans *pTrans) {
  sdbRelease(pMnode->pSdb, pTrans);
}

570
/*
 * Allocate and initialize a new local transaction object.
 *
 * The object starts in the prepare stage with parallel execution, takes its
 * id from sdbGetMaxId(), and owns three empty action arrays. When pReq is
 * given, its rpc info is copied into the transaction.
 *
 * If any of the action arrays cannot be created, the arrays that were
 * created and the object itself are released before returning; previously
 * they were leaked.
 *
 * Returns the new object, or NULL with terrno = TSDB_CODE_OUT_OF_MEMORY.
 * Release the result with mndTransDrop().
 */
STrans *mndTransCreate(SMnode *pMnode, ETrnPolicy policy, ETrnConflct conflict, const SRpcMsg *pReq) {
  STrans *pTrans = taosMemoryCalloc(1, sizeof(STrans));
  if (pTrans == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to create transaction since %s", terrstr());
    return NULL;
  }

  pTrans->id = sdbGetMaxId(pMnode->pSdb, SDB_TRANS);
  pTrans->stage = TRN_STAGE_PREPARE;
  pTrans->policy = policy;
  pTrans->conflict = conflict;
  pTrans->exec = TRN_EXEC_PRARLLEL;
  pTrans->createdTime = taosGetTimestampMs();
  pTrans->redoActions = taosArrayInit(TRANS_ARRAY_SIZE, sizeof(STransAction));
  pTrans->undoActions = taosArrayInit(TRANS_ARRAY_SIZE, sizeof(STransAction));
  pTrans->commitActions = taosArrayInit(TRANS_ARRAY_SIZE, sizeof(STransAction));

  if (pTrans->redoActions == NULL || pTrans->undoActions == NULL || pTrans->commitActions == NULL) {
    // mndTransDropData() skips the arrays that are still NULL
    mndTransDropData(pTrans);
    taosMemoryFree(pTrans);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    mError("failed to create transaction since %s", terrstr());
    return NULL;
  }

  if (pReq != NULL) pTrans->rpcInfo = pReq->info;
  mTrace("trans:%d, local object is created, data:%p", pTrans->id, pTrans);
  return pTrans;
}

S
Shengliang Guan 已提交
599
// Free the payload held by each action (the raw buffer for raw actions, the
// content buffer for message actions) and then destroy the array itself.
static void mndTransDropActions(SArray *pArray) {
  int32_t actionNum = taosArrayGetSize(pArray);

  for (int32_t idx = 0; idx < actionNum; ++idx) {
    STransAction *pItem = taosArrayGet(pArray, idx);
    switch (pItem->actionType) {
      case TRANS_ACTION_RAW:
        taosMemoryFreeClear(pItem->pRaw);
        break;
      case TRANS_ACTION_MSG:
        taosMemoryFreeClear(pItem->pCont);
        break;
      default:
        // no payload to release
        break;
    }
  }

  taosArrayDestroy(pArray);
}

S
Shengliang Guan 已提交
615
// Release a local transaction object together with everything it owns.
// Passing NULL is a no-op.
void mndTransDrop(STrans *pTrans) {
  if (pTrans == NULL) {
    return;
  }

  mndTransDropData(pTrans);
  mTrace("trans:%d, local object is freed, data:%p", pTrans->id, pTrans);
  taosMemoryFreeClear(pTrans);
}

623
// Append a copy of *pAction to pArray. The action id is set to the array
// size before the push. Returns 0 on success, or -1 with
// terrno = TSDB_CODE_OUT_OF_MEMORY when the push fails.
static int32_t mndTransAppendAction(SArray *pArray, STransAction *pAction) {
  pAction->id = taosArrayGetSize(pArray);

  if (taosArrayPush(pArray, pAction) != NULL) {
    return 0;
  }

  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return -1;
}

635
// Queue pRaw as a raw action in the transaction's redo list.
// Returns the result of mndTransAppendAction().
int32_t mndTransAppendRedolog(STrans *pTrans, SSdbRaw *pRaw) {
  STransAction redoLog = {0};
  redoLog.stage = TRN_STAGE_REDO_ACTION;
  redoLog.actionType = TRANS_ACTION_RAW;
  redoLog.pRaw = pRaw;
  return mndTransAppendAction(pTrans->redoActions, &redoLog);
}

// Queue a payload-less action (TRANS_ACTION_NULL) in the redo list.
// Returns the result of mndTransAppendAction().
int32_t mndTransAppendNullLog(STrans *pTrans) {
  STransAction nullLog = {0};
  nullLog.stage = TRN_STAGE_REDO_ACTION;
  nullLog.actionType = TRANS_ACTION_NULL;
  return mndTransAppendAction(pTrans->redoActions, &nullLog);
}
S
Shengliang Guan 已提交
644

645
// Queue pRaw as a raw action in the transaction's undo list.
// Returns the result of mndTransAppendAction().
int32_t mndTransAppendUndolog(STrans *pTrans, SSdbRaw *pRaw) {
  STransAction undoLog = {0};
  undoLog.stage = TRN_STAGE_UNDO_ACTION;
  undoLog.actionType = TRANS_ACTION_RAW;
  undoLog.pRaw = pRaw;
  return mndTransAppendAction(pTrans->undoActions, &undoLog);
}
S
Shengliang Guan 已提交
649

650
// Queue pRaw as a raw action in the transaction's commit list.
// Returns the result of mndTransAppendAction().
int32_t mndTransAppendCommitlog(STrans *pTrans, SSdbRaw *pRaw) {
  STransAction commitLog = {0};
  commitLog.stage = TRN_STAGE_COMMIT_ACTION;
  commitLog.actionType = TRANS_ACTION_RAW;
  commitLog.pRaw = pRaw;
  return mndTransAppendAction(pTrans->commitActions, &commitLog);
}

S
Shengliang Guan 已提交
655
// Tag *pAction as a message action of the redo stage and append it to the
// transaction's redo list. Note that *pAction itself is modified.
// Returns the result of mndTransAppendAction().
int32_t mndTransAppendRedoAction(STrans *pTrans, STransAction *pAction) {
  pAction->actionType = TRANS_ACTION_MSG;
  pAction->stage = TRN_STAGE_REDO_ACTION;
  return mndTransAppendAction(pTrans->redoActions, pAction);
}

S
Shengliang Guan 已提交
661
// Tag *pAction as a message action of the undo stage and append it to the
// transaction's undo list. Note that *pAction itself is modified.
// Returns the result of mndTransAppendAction().
int32_t mndTransAppendUndoAction(STrans *pTrans, STransAction *pAction) {
  pAction->actionType = TRANS_ACTION_MSG;
  pAction->stage = TRN_STAGE_UNDO_ACTION;
  return mndTransAppendAction(pTrans->undoActions, pAction);
}

S
Shengliang Guan 已提交
667 668 669 670 671
// Records the response payload (pointer and length) on the transaction.
// The pointer is stored as-is; no copy is made here.
void mndTransSetRpcRsp(STrans *pTrans, void *pCont, int32_t contLen) {
  pTrans->rpcRspLen = contLen;
  pTrans->rpcRsp = pCont;
}

S
Shengliang Guan 已提交
672
// Stores the start/stop callback identifiers and their parameter blob
// (pointer and length) on the transaction. The param pointer is stored
// as-is; no copy is made here.
void mndTransSetCb(STrans *pTrans, ETrnFunc startFunc, ETrnFunc stopFunc, void *param, int32_t paramLen) {
  // Callback selectors.
  pTrans->startFunc = startFunc;
  pTrans->stopFunc = stopFunc;

  // Opaque argument handed to the callbacks.
  pTrans->paramLen = paramLen;
  pTrans->param = param;
}

679 680 681 682 683 684 685 686
// Records up to two database names on the transaction. These are the names
// compared by mndCheckDbConflict and validated by mndTransPrepare.
//
// pTrans:  transaction to update.
// dbname1: NUL-terminated name copied into pTrans->dbname1, or NULL to leave
//          that field untouched.
// dbname2: NUL-terminated name copied into pTrans->dbname2, or NULL to leave
//          that field untouched.
//
// The copy is bounded by TSDB_DB_FNAME_LEN and always NUL-terminated. A plain
// memcpy of TSDB_DB_FNAME_LEN bytes would read past the end of any source
// string shorter than that, and would leave the destination unterminated for
// a source without a NUL in its first TSDB_DB_FNAME_LEN bytes.
void mndTransSetDbName(STrans *pTrans, const char *dbname1, const char *dbname2) {
  if (dbname1 != NULL) {
    snprintf(pTrans->dbname1, TSDB_DB_FNAME_LEN, "%s", dbname1);
  }
  if (dbname2 != NULL) {
    snprintf(pTrans->dbname2, TSDB_DB_FNAME_LEN, "%s", dbname2);
  }
}
S
Shengliang Guan 已提交
687

688
// Switches the transaction to serial execution (TRN_EXEC_SERIAL), which
// mndTransPerformRedoActionStage uses to pick the serial redo executor.
void mndTransSetSerial(STrans *pTrans) {
  pTrans->exec = TRN_EXEC_SERIAL;
}
689

S
Shengliang Guan 已提交
690
// Encodes the transaction, marks the encoded record SDB_STATUS_READY and
// submits it through mndSyncPropose. The encoded record is freed here on both
// the success and the failure path of the proposal.
// Returns 0 on success, -1 if encoding or the proposal fails.
static int32_t mndTransSync(SMnode *pMnode, STrans *pTrans) {
  SSdbRaw *pEncoded = mndTransActionEncode(pTrans);
  if (pEncoded == NULL) {
    mError("trans:%d, failed to encode while sync trans since %s", pTrans->id, terrstr());
    return -1;
  }

  sdbSetRawStatus(pEncoded, SDB_STATUS_READY);
  mDebug("trans:%d, sync to other mnodes, stage:%s", pTrans->id, mndTransStr(pTrans->stage));

  const bool proposed = (mndSyncPropose(pMnode, pEncoded, pTrans->id) == 0);
  if (!proposed) {
    // Log before freeing so terrstr() still reflects the proposal failure.
    mError("trans:%d, failed to sync since %s", pTrans->id, terrstr());
  }
  sdbFreeRaw(pEncoded);

  if (!proposed) {
    return -1;
  }

  mDebug("trans:%d, sync finished", pTrans->id);
  return 0;
}

S
Shengliang Guan 已提交
711 712 713 714 715 716
// Returns true when db is a non-empty name equal to either of the database
// names recorded on pTrans; an empty db never conflicts.
static bool mndCheckDbConflict(const char *db, STrans *pTrans) {
  const bool hasName = (db[0] != 0);
  return hasName && (strcmp(db, pTrans->dbname1) == 0 || strcmp(db, pTrans->dbname2) == 0);
}

717
// Decides whether pNew conflicts with any transaction currently stored in the
// SDB_TRANS table. The rules depend on the conflict level of both sides:
//   - pNew is TRN_CONFLICT_NOTHING:   never conflicts (returns immediately).
//   - pNew is TRN_CONFLICT_GLOBAL:    conflicts with every stored transaction.
//   - pNew is TRN_CONFLICT_DB:        conflicts with GLOBAL transactions, and
//                                     with DB / DB_INSIDE transactions that
//                                     share one of its database names.
//   - pNew is TRN_CONFLICT_DB_INSIDE: conflicts with GLOBAL transactions, and
//                                     with DB transactions that share one of
//                                     its database names.
//
// Every stored transaction is visited and released. The conflict error is
// logged only for transactions that actually conflict; logging it for every
// visited row would blame unrelated transactions.
//
// Returns true if at least one stored transaction conflicts with pNew.
static bool mndCheckTransConflict(SMnode *pMnode, STrans *pNew) {
  STrans *pTrans = NULL;
  void   *pIter = NULL;
  bool    conflict = false;

  if (pNew->conflict == TRN_CONFLICT_NOTHING) return conflict;

  while (1) {
    pIter = sdbFetch(pMnode->pSdb, SDB_TRANS, pIter, (void **)&pTrans);
    if (pIter == NULL) break;

    // True when pNew and this stored transaction name a common database.
    const bool sameDb = mndCheckDbConflict(pNew->dbname1, pTrans) || mndCheckDbConflict(pNew->dbname2, pTrans);

    // Conflict verdict for this stored transaction only.
    bool hit = false;
    if (pNew->conflict == TRN_CONFLICT_GLOBAL) {
      hit = true;
    } else if (pNew->conflict == TRN_CONFLICT_DB) {
      if (pTrans->conflict == TRN_CONFLICT_GLOBAL) hit = true;
      if ((pTrans->conflict == TRN_CONFLICT_DB || pTrans->conflict == TRN_CONFLICT_DB_INSIDE) && sameDb) hit = true;
    } else if (pNew->conflict == TRN_CONFLICT_DB_INSIDE) {
      if (pTrans->conflict == TRN_CONFLICT_GLOBAL) hit = true;
      if (pTrans->conflict == TRN_CONFLICT_DB && sameDb) hit = true;
    }

    if (hit) {
      conflict = true;
      mError("trans:%d, can't execute since conflict with trans:%d, db1:%s db2:%s", pNew->id, pTrans->id,
             pTrans->dbname1, pTrans->dbname2);
    }
    sdbRelease(pMnode->pSdb, pTrans);
  }

  return conflict;
}

S
Shengliang Guan 已提交
752
// Validates a freshly built transaction, syncs it via mndTransSync, then
// re-acquires it by id and starts executing it.
//
// Checks performed, in order (each failure returns -1):
//   1. a DB / DB_INSIDE conflict level requires at least one database name
//      (terrno = TSDB_CODE_MND_TRANS_CONFLICT);
//   2. no conflict with stored transactions
//      (terrno = TSDB_CODE_MND_TRANS_CONFLICT);
//   3. at least one commit action (terrno = TSDB_CODE_MND_TRANS_CLOG_IS_NULL);
//   4. mndTransSync succeeds;
//   5. the transaction can be acquired again by id.
//
// On success the rpc info and pending response buffer are handed from pTrans
// to the acquired object (pTrans's response fields are cleared), the acquired
// object is executed and released, and 0 is returned.
int32_t mndTransPrepare(SMnode *pMnode, STrans *pTrans) {
  const bool dbScoped = (pTrans->conflict == TRN_CONFLICT_DB || pTrans->conflict == TRN_CONFLICT_DB_INSIDE);
  if (dbScoped && strlen(pTrans->dbname1) == 0 && strlen(pTrans->dbname2) == 0) {
    terrno = TSDB_CODE_MND_TRANS_CONFLICT;
    mError("trans:%d, failed to prepare conflict db not set", pTrans->id);
    return -1;
  }

  if (mndCheckTransConflict(pMnode, pTrans)) {
    terrno = TSDB_CODE_MND_TRANS_CONFLICT;
    mError("trans:%d, failed to prepare since %s", pTrans->id, terrstr());
    return -1;
  }

  if (taosArrayGetSize(pTrans->commitActions) <= 0) {
    terrno = TSDB_CODE_MND_TRANS_CLOG_IS_NULL;
    mError("trans:%d, failed to prepare since %s", pTrans->id, terrstr());
    return -1;
  }

  mDebug("trans:%d, prepare transaction", pTrans->id);
  if (mndTransSync(pMnode, pTrans) != 0) {
    mError("trans:%d, failed to prepare since %s", pTrans->id, terrstr());
    return -1;
  }
  mDebug("trans:%d, prepare finished", pTrans->id);

  STrans *pStored = mndAcquireTrans(pMnode, pTrans->id);
  if (pStored == NULL) {
    mError("trans:%d, failed to read from sdb since %s", pTrans->id, terrstr());
    return -1;
  }

  // Hand the client connection and response buffer over to the stored object,
  // then drop them from the caller's copy.
  pStored->rpcInfo = pTrans->rpcInfo;
  pStored->rpcRsp = pTrans->rpcRsp;
  pStored->rpcRspLen = pTrans->rpcRspLen;
  pTrans->rpcRsp = NULL;
  pTrans->rpcRspLen = 0;

  mndTransExecute(pMnode, pStored);
  mndReleaseTrans(pMnode, pStored);
  return 0;
}

S
Shengliang Guan 已提交
797 798 799 800
// Syncs the transaction via mndTransSync as part of the commit stage.
// Returns 0 on success, -1 if the sync fails.
static int32_t mndTransCommit(SMnode *pMnode, STrans *pTrans) {
  mDebug("trans:%d, commit transaction", pTrans->id);

  if (mndTransSync(pMnode, pTrans) == 0) {
    mDebug("trans:%d, commit finished", pTrans->id);
    return 0;
  }

  mError("trans:%d, failed to commit since %s", pTrans->id, terrstr());
  return -1;
}

S
Shengliang Guan 已提交
807
// Syncs the transaction via mndTransSync as part of the rollback stage.
// Returns 0 on success, -1 if the sync fails.
static int32_t mndTransRollback(SMnode *pMnode, STrans *pTrans) {
  mDebug("trans:%d, rollback transaction", pTrans->id);

  if (mndTransSync(pMnode, pTrans) == 0) {
    mDebug("trans:%d, rollback finished", pTrans->id);
    return 0;
  }

  mError("trans:%d, failed to rollback since %s", pTrans->id, terrstr());
  return -1;
}
S
Shengliang Guan 已提交
816

817
// Sends the pending response for a transaction, if one is due and a handle
// (pTrans->rpcInfo.handle) is still attached.
//
// A response is due when:
//   - the stage is TRN_STAGE_FINISHED, or
//   - policy is TRN_POLICY_ROLLBACK and the stage is UNDO_ACTION or ROLLBACK, or
//   - policy is anything else, the stage is REDO_ACTION and failedTimes > 6.
// In the last two cases a zero pTrans->code is reported as
// TSDB_CODE_MND_TRANS_UNKNOW_ERROR.
//
// If rpcRspLen is non-zero the payload is copied into a buffer from
// rpcMallocCont (the response goes out without a payload if that allocation
// fails) and pTrans->rpcRsp is freed. After sending, the handle and response
// fields on pTrans are cleared.
static void mndTransSendRpcRsp(SMnode *pMnode, STrans *pTrans) {
  int32_t    code = pTrans->code;
  const bool finished = (pTrans->stage == TRN_STAGE_FINISHED);

  bool failed = false;
  if (pTrans->policy == TRN_POLICY_ROLLBACK) {
    failed = (pTrans->stage == TRN_STAGE_UNDO_ACTION || pTrans->stage == TRN_STAGE_ROLLBACK);
  } else {
    failed = (pTrans->stage == TRN_STAGE_REDO_ACTION && pTrans->failedTimes > 6);
  }
  if (failed && code == 0) {
    code = TSDB_CODE_MND_TRANS_UNKNOW_ERROR;
  }

  if (!finished && !failed) return;
  if (pTrans->rpcInfo.handle == NULL) return;

  mDebug("trans:%d, send rsp, code:0x%x stage:%s app:%p", pTrans->id, code, mndTransStr(pTrans->stage),
         pTrans->rpcInfo.ahandle);
  if (code == TSDB_CODE_RPC_NETWORK_UNAVAIL) {
    code = TSDB_CODE_MND_TRANS_NETWORK_UNAVAILL;
  }

  SRpcMsg rspMsg = {.code = code, .info = pTrans->rpcInfo};

  if (pTrans->rpcRspLen != 0) {
    void *pPayload = rpcMallocCont(pTrans->rpcRspLen);
    if (pPayload != NULL) {
      memcpy(pPayload, pTrans->rpcRsp, pTrans->rpcRspLen);
      rspMsg.pCont = pPayload;
      rspMsg.contLen = pTrans->rpcRspLen;
    }
    taosMemoryFree(pTrans->rpcRsp);
  }

  tmsgSendRsp(&rspMsg);

  // Clear the connection and payload fields after the response has gone out.
  pTrans->rpcInfo.handle = NULL;
  pTrans->rpcRsp = NULL;
  pTrans->rpcRspLen = 0;
}

862
// Handles the response to an action message sent by mndTransSendSingleMsg.
//
// pRsp->info.ahandle carries the signature built when the message was sent:
// the transaction id in the upper 32 bits and the action id in the lower 32.
// The matching action (in the redo or undo list, chosen by the transaction's
// current stage) is marked as received, its errCode is set to pRsp->code, and
// the transaction is executed again.
//
// Fixes relative to the previous implementation:
//   - the action index is bounds-checked against the array that is actually
//     indexed (previously always redoActions, even in the undo stage);
//   - the action pointer is validated before it is used in the log line;
//   - the low 32 bits are extracted with unsigned arithmetic instead of a
//     signed left shift, which is undefined behaviour when it overflows.
//
// Always returns 0; failures are only logged.
int32_t mndTransProcessRsp(SRpcMsg *pRsp) {
  SMnode       *pMnode = pRsp->info.node;
  int64_t       signature = (int64_t)(pRsp->info.ahandle);
  int32_t       transId = (int32_t)(signature >> 32);
  int32_t       action = (int32_t)(uint32_t)((uint64_t)signature & 0xFFFFFFFFULL);
  SArray       *pArray = NULL;
  STransAction *pAction = NULL;

  STrans *pTrans = mndAcquireTrans(pMnode, transId);
  if (pTrans == NULL) {
    mError("trans:%d, failed to get transId from vnode rsp since %s", transId, terrstr());
    goto _OVER;
  }

  if (pTrans->stage == TRN_STAGE_REDO_ACTION) {
    pArray = pTrans->redoActions;
  } else if (pTrans->stage == TRN_STAGE_UNDO_ACTION) {
    pArray = pTrans->undoActions;
  } else {
    mError("trans:%d, invalid trans stage:%d while recv action rsp", pTrans->id, pTrans->stage);
    goto _OVER;
  }

  if (pArray == NULL) {
    mError("trans:%d, invalid trans stage:%d", transId, pTrans->stage);
    goto _OVER;
  }

  // Validate the index against the array selected above.
  int32_t actionNum = taosArrayGetSize(pArray);
  if (action < 0 || action >= actionNum) {
    mError("trans:%d, invalid action:%d", transId, action);
    goto _OVER;
  }

  pAction = taosArrayGet(pArray, action);
  if (pAction == NULL) {
    mError("trans:%d, invalid action:%d", transId, action);
    goto _OVER;
  }

  pAction->msgReceived = 1;
  pAction->errCode = pRsp->code;

  mDebug("trans:%d, %s:%d response is received, code:0x%x, accept:0x%x retry:0x%x", transId,
         mndTransStr(pAction->stage), action, pRsp->code, pAction->acceptableCode, pAction->retryCode);
  mndTransExecute(pMnode, pTrans);

_OVER:
  mndReleaseTrans(pMnode, pTrans);
  return 0;
}

910 911 912 913 914 915 916 917 918 919 920 921 922 923 924
// Clears an action's execution state (rawWritten, msgSent, msgReceived,
// errCode) so that it will be executed again.
//
// If the last error was one of TSDB_CODE_RPC_REDIRECT,
// TSDB_CODE_SYN_NEW_CONFIG_ERROR, TSDB_CODE_SYN_INTERNAL_ERROR or
// TSDB_CODE_SYN_NOT_LEADER, the endpoint set is advanced to its next entry
// (wrapping around) so the retry targets a different endpoint.
//
// The rotation is skipped when the endpoint set is empty: taking the index
// modulo numOfEps == 0 would be a division by zero.
//
// pMnode is unused here; it is kept for signature compatibility.
static void mndTransResetAction(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  pAction->rawWritten = 0;
  pAction->msgSent = 0;
  pAction->msgReceived = 0;

  const bool needOtherEp =
      (pAction->errCode == TSDB_CODE_RPC_REDIRECT || pAction->errCode == TSDB_CODE_SYN_NEW_CONFIG_ERROR ||
       pAction->errCode == TSDB_CODE_SYN_INTERNAL_ERROR || pAction->errCode == TSDB_CODE_SYN_NOT_LEADER);

  if (needOtherEp && pAction->epSet.numOfEps > 0) {
    pAction->epSet.inUse = (pAction->epSet.inUse + 1) % pAction->epSet.numOfEps;
    mDebug("trans:%d, %s:%d execute status is reset and set epset inuse:%d", pTrans->id, mndTransStr(pAction->stage),
           pAction->id, pAction->epSet.inUse);
  } else {
    mDebug("trans:%d, %s:%d execute status is reset", pTrans->id, mndTransStr(pAction->stage), pAction->id);
  }
  pAction->errCode = 0;
}

S
Shengliang Guan 已提交
925 926 927 928 929
// Resets every action in pArray that has not completed successfully.
// An action is left alone when its errCode is 0 or equals its acceptableCode
// AND it has either been both sent and answered, or been written as raw.
static void mndTransResetActions(SMnode *pMnode, STrans *pTrans, SArray *pArray) {
  const int32_t total = taosArrayGetSize(pArray);

  for (int32_t idx = 0; idx < total; ++idx) {
    STransAction *pCur = taosArrayGet(pArray, idx);

    const bool codeOk = (pCur->errCode == 0 || pCur->errCode == pCur->acceptableCode);
    const bool msgDone = (pCur->msgSent && pCur->msgReceived);
    if (codeOk && (msgDone || pCur->rawWritten)) {
      continue;
    }

    mndTransResetAction(pMnode, pTrans, pCur);
  }
}

939
// Writes a raw action's record to sdb via sdbWriteWithoutFree, unless the
// action is already flagged rawWritten (then returns 0 immediately).
//
// A write that returns 0, or one that leaves terrno at
// TSDB_CODE_SDB_OBJ_NOT_THERE, counts as success: the action is flagged
// rawWritten, its errCode is cleared and 0 is returned. Otherwise the action's
// errCode is set to terrno (or the return code if terrno is 0) and the write's
// return code is passed back.
//
// In both cases the transaction's last* fields are updated from this action.
static int32_t mndTransWriteSingleLog(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  if (pAction->rawWritten) return 0;

  int32_t    code = sdbWriteWithoutFree(pMnode->pSdb, pAction->pRaw);
  const bool accepted = (code == 0 || terrno == TSDB_CODE_SDB_OBJ_NOT_THERE);

  if (accepted) {
    code = 0;
    pAction->errCode = 0;
    pAction->rawWritten = true;
    mDebug("trans:%d, %s:%d write to sdb, type:%s status:%s", pTrans->id, mndTransStr(pAction->stage), pAction->id,
           sdbTableName(pAction->pRaw->type), sdbStatusName(pAction->pRaw->status));
  } else {
    pAction->errCode = (terrno != 0) ? terrno : code;
    mError("trans:%d, %s:%d failed to write sdb since %s, type:%s status:%s", pTrans->id, mndTransStr(pAction->stage),
           pAction->id, terrstr(), sdbTableName(pAction->pRaw->type), sdbStatusName(pAction->pRaw->status));
  }

  // Bookkeeping shared by both outcomes; errCode is 0 on the success path.
  pTrans->lastAction = pAction->id;
  pTrans->lastMsgType = pAction->msgType;
  pTrans->lastEpset = pAction->epSet;
  pTrans->lastErrorNo = pAction->errCode;

  return code;
}

// Sends a message-type action to its endpoint set via tmsgSendReq, unless the
// action is already flagged msgSent (then returns 0 immediately).
//
// The request's ahandle carries a 64-bit signature: transaction id in the
// upper 32 bits, action id in the lower 32 bits. mndTransProcessRsp decodes it
// when the response arrives. The payload is a copy of pAction->pCont in a
// buffer obtained from rpcMallocCont.
//
// Returns 0 when the request was handed to tmsgSendReq successfully; -1 when
// mndCannotExecuteTransAction() says so or the payload buffer cannot be
// allocated (terrno = TSDB_CODE_OUT_OF_MEMORY); otherwise the non-zero return
// value of tmsgSendReq. The transaction's last* fields are updated from this
// action once tmsgSendReq has been called.
//
// The endpoint description built for logging is bounded: once the buffer is
// full (or snprintf reports an error) no further endpoints are appended.
// Without that, the accumulated length could exceed the buffer size and make
// the remaining-space computation wrap around.
static int32_t mndTransSendSingleMsg(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  if (pAction->msgSent) return 0;
  if (mndCannotExecuteTransAction(pMnode)) return -1;

  int64_t signature = pTrans->id;
  signature = (signature << 32);
  signature += pAction->id;

  SRpcMsg rpcMsg = {.msgType = pAction->msgType, .contLen = pAction->contLen, .info.ahandle = (void *)signature};
  rpcMsg.pCont = rpcMallocCont(pAction->contLen);
  if (rpcMsg.pCont == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
  memcpy(rpcMsg.pCont, pAction->pCont, pAction->contLen);

  char    detail[1024] = {0};
  int32_t len = snprintf(detail, sizeof(detail), "msgType:%s numOfEps:%d inUse:%d", TMSG_INFO(pAction->msgType),
                         pAction->epSet.numOfEps, pAction->epSet.inUse);
  for (int32_t i = 0; i < pAction->epSet.numOfEps; ++i) {
    // Stop appending once the buffer is exhausted or a format error occurred.
    if (len < 0 || len >= (int32_t)sizeof(detail)) break;

    int32_t written = snprintf(detail + len, sizeof(detail) - (size_t)len, " ep:%d-%s:%u", i,
                               pAction->epSet.eps[i].fqdn, pAction->epSet.eps[i].port);
    if (written < 0) break;
    len += written;
  }

  int32_t code = tmsgSendReq(&pAction->epSet, &rpcMsg);
  if (code == 0) {
    pAction->msgSent = 1;
    pAction->msgReceived = 0;
    pAction->errCode = 0;
    mDebug("trans:%d, %s:%d is sent, %s", pTrans->id, mndTransStr(pAction->stage), pAction->id, detail);

    pTrans->lastAction = pAction->id;
    pTrans->lastMsgType = pAction->msgType;
    pTrans->lastEpset = pAction->epSet;
    // Keep an earlier recorded error; otherwise mark the action as pending.
    if (pTrans->lastErrorNo == 0) {
      pTrans->lastErrorNo = TSDB_CODE_ACTION_IN_PROGRESS;
    }
  } else {
    pAction->msgSent = 0;
    pAction->msgReceived = 0;
    pAction->errCode = (terrno != 0) ? terrno : code;
    mError("trans:%d, %s:%d not send since %s, %s", pTrans->id, mndTransStr(pAction->stage), pAction->id, terrstr(),
           detail);

    pTrans->lastAction = pAction->id;
    pTrans->lastMsgType = pAction->msgType;
    pTrans->lastEpset = pAction->epSet;
    pTrans->lastErrorNo = pAction->errCode;
  }

  return code;
}

1020 1021 1022
// Executes a TRANS_ACTION_NULL action: nothing is written or sent. The
// action's rawWritten flag and errCode are cleared and the transaction's
// last* fields are updated from this action.
//
// lastErrorNo is now actually reset to 0; the previous code used `==`, a
// comparison whose result was discarded, so a stale error number survived.
//
// pMnode is unused. Always returns 0.
static int32_t mndTransExecNullMsg(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  pAction->rawWritten = 0;
  pAction->errCode = 0;
  mDebug("trans:%d, %s:%d confirm action executed", pTrans->id, mndTransStr(pAction->stage), pAction->id);

  pTrans->lastAction = pAction->id;
  pTrans->lastMsgType = pAction->msgType;
  pTrans->lastEpset = pAction->epSet;
  pTrans->lastErrorNo = 0;
  return 0;
}

1032
// Dispatches one action by its type: raw actions are written to sdb, message
// actions are sent, and every other type goes through the null handler.
// Returns the selected handler's result.
static int32_t mndTransExecSingleAction(SMnode *pMnode, STrans *pTrans, STransAction *pAction) {
  switch (pAction->actionType) {
    case TRANS_ACTION_RAW:
      return mndTransWriteSingleLog(pMnode, pTrans, pAction);
    case TRANS_ACTION_MSG:
      return mndTransSendSingleMsg(pMnode, pTrans, pAction);
    default:
      return mndTransExecNullMsg(pMnode, pTrans, pAction);
  }
}

1042
// Executes every action in pArray in index order, stopping at the first one
// whose execution returns non-zero.
// Returns that non-zero code, or 0 if all actions returned 0 (including when
// the array is empty).
static int32_t mndTransExecSingleActions(SMnode *pMnode, STrans *pTrans, SArray *pArray) {
  const int32_t total = taosArrayGetSize(pArray);

  for (int32_t idx = 0; idx < total; ++idx) {
    STransAction *pCur = taosArrayGet(pArray, idx);
    const int32_t rc = mndTransExecSingleAction(pMnode, pTrans, pCur);
    if (rc != 0) {
      return rc;
    }
  }

  return 0;
}

// Executes all actions in pArray and reports the overall state.
//
// Returns:
//   0                             the array is empty, or every action has been
//                                 executed without an unacceptable error;
//   -1                            executing an action returned non-zero;
//   TSDB_CODE_ACTION_IN_PROGRESS  some actions are neither answered
//                                 (msgReceived) nor written (rawWritten);
//   <errCode>                     all actions executed but at least one has an
//                                 errCode that is neither 0 nor its
//                                 acceptableCode. The error of the LAST such
//                                 action is returned and stored in terrno, and
//                                 the unsuccessful actions are reset for retry.
static int32_t mndTransExecuteActions(SMnode *pMnode, STrans *pTrans, SArray *pArray) {
  const int32_t total = taosArrayGetSize(pArray);
  if (total == 0) return 0;

  if (mndTransExecSingleActions(pMnode, pTrans, pArray) != 0) {
    return -1;
  }

  // Count completed actions and remember the last one that failed.
  int32_t       done = 0;
  STransAction *pFailed = NULL;
  for (int32_t idx = 0; idx < total; ++idx) {
    STransAction *pCur = taosArrayGet(pArray, idx);
    if (!pCur->msgReceived && !pCur->rawWritten) continue;

    ++done;
    if (pCur->errCode != 0 && pCur->errCode != pCur->acceptableCode) {
      pFailed = pCur;
    }
  }

  if (done != total) {
    mDebug("trans:%d, %d of %d actions executed", pTrans->id, done, total);
    return TSDB_CODE_ACTION_IN_PROGRESS;
  }

  if (pFailed == NULL) {
    pTrans->lastAction = 0;
    pTrans->lastMsgType = 0;
    memset(&pTrans->lastEpset, 0, sizeof(pTrans->lastEpset));
    pTrans->lastErrorNo = 0;
    mDebug("trans:%d, all %d actions execute successfully", pTrans->id, total);
    return 0;
  }

  // Capture the error before the reset below clears it on the action itself.
  const int32_t errCode = pFailed->errCode;
  mError("trans:%d, all %d actions executed, code:0x%x", pTrans->id, total, errCode & 0XFFFF);

  pTrans->lastAction = pFailed->id;
  pTrans->lastMsgType = pFailed->msgType;
  pTrans->lastEpset = pFailed->epSet;
  pTrans->lastErrorNo = pFailed->errCode;

  mndTransResetActions(pMnode, pTrans, pArray);
  terrno = errCode;
  return errCode;
}

S
Shengliang Guan 已提交
1103
// Runs the transaction's redo actions through mndTransExecuteActions and logs
// an error for any result other than 0 or TSDB_CODE_ACTION_IN_PROGRESS.
// Returns the result unchanged.
static int32_t mndTransExecuteRedoActions(SMnode *pMnode, STrans *pTrans) {
  const int32_t code = mndTransExecuteActions(pMnode, pTrans, pTrans->redoActions);
  const bool    failed = (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS);

  if (failed) {
    mError("failed to execute redoActions since:%s, code:0x%x", terrstr(), terrno);
  }
  return code;
}
S
Shengliang Guan 已提交
1110

S
Shengliang Guan 已提交
1111
// Runs the transaction's undo actions through mndTransExecuteActions and logs
// an error for any result other than 0 or TSDB_CODE_ACTION_IN_PROGRESS.
// Returns the result unchanged.
static int32_t mndTransExecuteUndoActions(SMnode *pMnode, STrans *pTrans) {
  const int32_t code = mndTransExecuteActions(pMnode, pTrans, pTrans->undoActions);
  const bool    failed = (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS);

  if (failed) {
    mError("failed to execute undoActions since %s", terrstr());
  }
  return code;
}
S
Shengliang Guan 已提交
1118

1119
// Runs the transaction's commit actions through mndTransExecuteActions and
// logs an error for any result other than 0 or TSDB_CODE_ACTION_IN_PROGRESS.
// Returns the result unchanged.
static int32_t mndTransExecuteCommitActions(SMnode *pMnode, STrans *pTrans) {
  const int32_t code = mndTransExecuteActions(pMnode, pTrans, pTrans->commitActions);
  const bool    failed = (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS);

  if (failed) {
    mError("failed to execute commitActions since %s", terrstr());
  }
  return code;
}

1127
// Executes the transaction's redo actions one at a time, starting at
// pTrans->redoActionPos, syncing the transaction after each completed action.
//
// For each action:
//   - it is executed through mndTransExecSingleAction;
//   - a sent message that has no response yet yields
//     TSDB_CODE_ACTION_IN_PROGRESS and stops the loop;
//   - an errCode that is neither 0 nor the action's acceptableCode becomes the
//     loop's code (a message action is also reset so it can be re-sent);
//   - on success redoActionPos is advanced and the transaction is synced via
//     mndTransSync;
//   - a code equal to the action's retryCode sleeps 300 ms and retries the
//     same action;
//   - any other code is stored in terrno / pTrans->code and stops the loop.
// The loop also stops when mndCannotExecuteTransAction() reports true.
//
// If the sync after a completed action fails, redoActionPos is rolled back and
// the loop stops. Previously the loop carried on executing later actions
// although the advanced position had never been synced.
//
// Returns 0 when there is nothing (left) to execute or all remaining actions
// completed and were synced; otherwise the code that stopped the loop.
static int32_t mndTransExecuteRedoActionsSerial(SMnode *pMnode, STrans *pTrans) {
  int32_t code = 0;
  int32_t numOfActions = taosArrayGetSize(pTrans->redoActions);
  if (numOfActions == 0) return code;
  if (pTrans->redoActionPos >= numOfActions) return code;

  for (int32_t action = pTrans->redoActionPos; action < numOfActions; ++action) {
    // `action` and redoActionPos advance together, so this is the current step.
    STransAction *pAction = taosArrayGet(pTrans->redoActions, pTrans->redoActionPos);

    code = mndTransExecSingleAction(pMnode, pTrans, pAction);
    if (code == 0) {
      if (pAction->msgSent) {
        if (pAction->msgReceived) {
          if (pAction->errCode != 0 && pAction->errCode != pAction->acceptableCode) {
            code = pAction->errCode;
            mndTransResetAction(pMnode, pTrans, pAction);
          } else {
            mDebug("trans:%d, %s:%d execute successfully", pTrans->id, mndTransStr(pAction->stage), action);
          }
        } else {
          code = TSDB_CODE_ACTION_IN_PROGRESS;
        }
      } else if (pAction->rawWritten) {
        if (pAction->errCode != 0 && pAction->errCode != pAction->acceptableCode) {
          code = pAction->errCode;
        } else {
          mDebug("trans:%d, %s:%d write successfully", pTrans->id, mndTransStr(pAction->stage), action);
        }
      }
    }

    if (code == 0) {
      pTrans->failedTimes = 0;
      pTrans->lastAction = action;
      pTrans->lastMsgType = 0;
      pTrans->lastErrorNo = 0;
      memset(&pTrans->lastEpset, 0, sizeof(pTrans->lastEpset));
    } else {
      pTrans->lastAction = action;
      pTrans->lastMsgType = pAction->msgType;
      pTrans->lastErrorNo = code;
      pTrans->lastEpset = pAction->epSet;
    }

    if (mndCannotExecuteTransAction(pMnode)) break;

    if (code == 0) {
      pTrans->code = 0;
      pTrans->redoActionPos++;
      mDebug("trans:%d, %s:%d is executed and need sync to other mnodes", pTrans->id, mndTransStr(pAction->stage),
             pAction->id);
      code = mndTransSync(pMnode, pTrans);
      if (code != 0) {
        // The advanced position was not synced: undo the advance and stop so
        // this step is retried instead of running further actions on top.
        pTrans->redoActionPos--;
        pTrans->code = terrno;
        mError("trans:%d, %s:%d is executed and failed to sync to other mnodes since %s", pTrans->id,
               mndTransStr(pAction->stage), pAction->id, terrstr());
        break;
      }
    } else if (code == TSDB_CODE_ACTION_IN_PROGRESS) {
      mDebug("trans:%d, %s:%d is in progress and wait it finish", pTrans->id, mndTransStr(pAction->stage), pAction->id);
      break;
    } else if (code == pAction->retryCode) {
      mDebug("trans:%d, %s:%d receive code:0x%x and retry", pTrans->id, mndTransStr(pAction->stage), pAction->id, code);
      taosMsleep(300);
      // Cancel the loop increment so the same action is executed again.
      action--;
      continue;
    } else {
      terrno = code;
      pTrans->code = code;
      mDebug("trans:%d, %s:%d receive code:0x%x and wait another schedule, failedTimes:%d", pTrans->id,
             mndTransStr(pAction->stage), pAction->id, code, pTrans->failedTimes);
      break;
    }
  }

  return code;
}

// Prepare stage: unconditionally moves the transaction to
// TRN_STAGE_REDO_ACTION. pMnode is unused.
// Always returns true (keep executing).
static bool mndTransPerformPrepareStage(SMnode *pMnode, STrans *pTrans) {
  pTrans->stage = TRN_STAGE_REDO_ACTION;
  mDebug("trans:%d, stage from prepare to redoAction", pTrans->id);
  return true;
}

S
Shengliang Guan 已提交
1212 1213
// Redo-action stage: runs the redo actions (serially when exec is
// TRN_EXEC_SERIAL, otherwise as a batch) and picks the next stage.
//
// Returns true when the caller should keep executing (the stage moved to
// COMMIT, or to ROLLBACK under TRN_POLICY_ROLLBACK). Returns false when
// mndCannotExecuteTransAction() reports true, when actions are still in
// progress, or when the redo failed under any other policy (failedTimes is
// incremented in that case).
static bool mndTransPerformRedoActionStage(SMnode *pMnode, STrans *pTrans) {
  const int32_t code = (pTrans->exec == TRN_EXEC_SERIAL) ? mndTransExecuteRedoActionsSerial(pMnode, pTrans)
                                                         : mndTransExecuteRedoActions(pMnode, pTrans);

  if (mndCannotExecuteTransAction(pMnode)) return false;

  if (code == 0) {
    pTrans->code = 0;
    pTrans->stage = TRN_STAGE_COMMIT;
    mDebug("trans:%d, stage from redoAction to commit", pTrans->id);
    return true;
  }

  if (code == TSDB_CODE_ACTION_IN_PROGRESS) {
    mDebug("trans:%d, stage keep on redoAction since %s", pTrans->id, tstrerror(code));
    return false;
  }

  // Redo failed: record the error, then roll back or wait for a retry.
  pTrans->code = terrno;
  if (pTrans->policy == TRN_POLICY_ROLLBACK) {
    pTrans->stage = TRN_STAGE_ROLLBACK;
    mError("trans:%d, stage from redoAction to rollback since %s", pTrans->id, terrstr());
    return true;
  }

  pTrans->failedTimes++;
  mError("trans:%d, stage keep on redoAction since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
  return false;
}

S
Shengliang Guan 已提交
1248
// Commit stage: syncs the transaction via mndTransCommit.
// On success the stage becomes TRN_STAGE_COMMIT_ACTION and true is returned.
// Returns false when mndCannotExecuteTransAction() reports true (nothing is
// attempted), or when the commit fails (pTrans->code is set from terrno and
// failedTimes is incremented).
static bool mndTransPerformCommitStage(SMnode *pMnode, STrans *pTrans) {
  if (mndCannotExecuteTransAction(pMnode)) return false;

  if (mndTransCommit(pMnode, pTrans) != 0) {
    pTrans->code = terrno;
    pTrans->failedTimes++;
    mError("trans:%d, stage keep on commit since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
    return false;
  }

  pTrans->code = 0;
  pTrans->stage = TRN_STAGE_COMMIT_ACTION;
  mDebug("trans:%d, stage from commit to commitAction", pTrans->id);
  return true;
}

1269
// Commit-action stage: executes the commit actions.
// On success the stage becomes TRN_STAGE_FINISHED and true is returned.
// Any non-zero result (including TSDB_CODE_ACTION_IN_PROGRESS) sets
// pTrans->code from terrno, increments failedTimes and returns false.
static bool mndTransPerformCommitActionStage(SMnode *pMnode, STrans *pTrans) {
  if (mndTransExecuteCommitActions(pMnode, pTrans) != 0) {
    pTrans->code = terrno;
    pTrans->failedTimes++;
    mError("trans:%d, stage keep on commitAction since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
    return false;
  }

  pTrans->code = 0;
  pTrans->stage = TRN_STAGE_FINISHED;
  mDebug("trans:%d, stage from commitAction to finished", pTrans->id);
  return true;
}

// Undo-action stage: executes the undo actions.
// On success the stage becomes TRN_STAGE_FINISHED and true is returned.
// Returns false while actions are still in progress, or on failure (in which
// case failedTimes is incremented).
static bool mndTransPerformUndoActionStage(SMnode *pMnode, STrans *pTrans) {
  const int32_t code = mndTransExecuteUndoActions(pMnode, pTrans);

  if (code == 0) {
    pTrans->stage = TRN_STAGE_FINISHED;
    mDebug("trans:%d, stage from undoAction to finished", pTrans->id);
    return true;
  }

  if (code == TSDB_CODE_ACTION_IN_PROGRESS) {
    mDebug("trans:%d, stage keep on undoAction since %s", pTrans->id, tstrerror(code));
    return false;
  }

  pTrans->failedTimes++;
  mError("trans:%d, stage keep on undoAction since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
  return false;
}

// Rollback stage: syncs the transaction via mndTransRollback.
// On success the stage becomes TRN_STAGE_UNDO_ACTION and true is returned.
// Returns false when mndCannotExecuteTransAction() reports true (nothing is
// attempted), or when the rollback sync fails (failedTimes is incremented).
static bool mndTransPerformRollbackStage(SMnode *pMnode, STrans *pTrans) {
  if (mndCannotExecuteTransAction(pMnode)) return false;

  if (mndTransRollback(pMnode, pTrans) != 0) {
    pTrans->failedTimes++;
    mError("trans:%d, stage keep on rollback since %s, failedTimes:%d", pTrans->id, terrstr(), pTrans->failedTimes);
    return false;
  }

  pTrans->stage = TRN_STAGE_UNDO_ACTION;
  mDebug("trans:%d, stage from rollback to undoAction", pTrans->id);
  return true;
}

// Finished stage: encodes the transaction, marks the encoded record
// SDB_STATUS_DROPPED and writes it to sdb. A failed write is only logged.
//
// If encoding fails the function now returns right after logging; previously
// the NULL record was still passed on to sdbSetRawStatus and sdbWrite.
//
// Always returns false, so mndTransExecute's stage loop ends here.
static bool mndTransPerfromFinishedStage(SMnode *pMnode, STrans *pTrans) {
  bool continueExec = false;

  SSdbRaw *pRaw = mndTransActionEncode(pTrans);
  if (pRaw == NULL) {
    mError("trans:%d, failed to encode while finish trans since %s", pTrans->id, terrstr());
    return continueExec;
  }
  sdbSetRawStatus(pRaw, SDB_STATUS_DROPPED);

  int32_t code = sdbWrite(pMnode->pSdb, pRaw);
  if (code != 0) {
    mError("trans:%d, failed to write sdb since %s", pTrans->id, terrstr());
  }

  mDebug("trans:%d, execute finished, code:0x%x, failedTimes:%d", pTrans->id, pTrans->code, pTrans->failedTimes);
  return continueExec;
}
S
Shengliang Guan 已提交
1344

1345
// Drives the transaction through its stages: repeatedly dispatches to the
// handler for the current stage until a handler returns false (or the stage is
// not one of the known values), refreshing lastExecTime on every iteration.
// Afterwards mndTransSendRpcRsp is called to send any response that is due.
void mndTransExecute(SMnode *pMnode, STrans *pTrans) {
  bool proceed = false;

  // The loop body always runs at least once.
  do {
    mDebug("trans:%d, continue to execute, stage:%s", pTrans->id, mndTransStr(pTrans->stage));
    pTrans->lastExecTime = taosGetTimestampMs();

    switch (pTrans->stage) {
      case TRN_STAGE_PREPARE:
        proceed = mndTransPerformPrepareStage(pMnode, pTrans);
        break;
      case TRN_STAGE_REDO_ACTION:
        proceed = mndTransPerformRedoActionStage(pMnode, pTrans);
        break;
      case TRN_STAGE_COMMIT:
        proceed = mndTransPerformCommitStage(pMnode, pTrans);
        break;
      case TRN_STAGE_COMMIT_ACTION:
        proceed = mndTransPerformCommitActionStage(pMnode, pTrans);
        break;
      case TRN_STAGE_ROLLBACK:
        proceed = mndTransPerformRollbackStage(pMnode, pTrans);
        break;
      case TRN_STAGE_UNDO_ACTION:
        proceed = mndTransPerformUndoActionStage(pMnode, pTrans);
        break;
      case TRN_STAGE_FINISHED:
        proceed = mndTransPerfromFinishedStage(pMnode, pTrans);
        break;
      default:
        proceed = false;
        break;
    }
  } while (proceed);

  mndTransSendRpcRsp(pMnode, pTrans);
}
S
Shengliang Guan 已提交
1381

1382
/*
 * Timer message handler: pulls up the transactions of the mnode attached to
 * the request. Always returns 0.
 */
static int32_t mndProcessTransTimer(SRpcMsg *pReq) {
  SMnode *pMnode = pReq->info.node;
  mndTransPullup(pMnode);
  return 0;
}

1387
/*
 * Kills a transaction that is in the redo-action or undo-action stage.
 *
 * Every action of the current stage is flagged as sent and received with a
 * zero error code, and the transaction is then executed again.
 *
 * Returns 0 on success. For any other stage, sets terrno to
 * TSDB_CODE_MND_TRANS_INVALID_STAGE and returns -1.
 */
int32_t mndKillTrans(SMnode *pMnode, STrans *pTrans) {
  SArray *pActions = NULL;

  switch (pTrans->stage) {
    case TRN_STAGE_REDO_ACTION:
      pActions = pTrans->redoActions;
      break;
    case TRN_STAGE_UNDO_ACTION:
      pActions = pTrans->undoActions;
      break;
    default:
      terrno = TSDB_CODE_MND_TRANS_INVALID_STAGE;
      return -1;
  }

  int32_t idx = 0;
  while (idx < taosArrayGetSize(pActions)) {
    STransAction *pAction = taosArrayGet(pActions, idx);
    // Log the previous error code before it is overwritten below.
    mInfo("trans:%d, %s:%d set processed for kill msg received, errCode from %s to success", pTrans->id,
          mndTransStr(pAction->stage), idx, tstrerror(pAction->errCode));
    pAction->msgSent = 1;
    pAction->msgReceived = 1;
    pAction->errCode = 0;
    ++idx;
  }

  mndTransExecute(pMnode, pTrans);
  return 0;
}

S
Shengliang Guan 已提交
1411 1412
/*
 * Handles a kill-transaction request.
 *
 * Steps: deserialize the request, check the MND_OPER_KILL_TRANS privilege of
 * the connection user, acquire the transaction by id and kill it.
 * Any failing step leaves the result at -1 and is logged as an error.
 * The transaction handle (possibly NULL) is released before returning.
 */
static int32_t mndProcessKillTransReq(SRpcMsg *pReq) {
  SMnode       *pMnode = pReq->info.node;
  SKillTransReq killReq = {0};
  STrans       *pTrans = NULL;
  int32_t       code = -1;

  if (tDeserializeSKillTransReq(pReq->pCont, pReq->contLen, &killReq) != 0) {
    terrno = TSDB_CODE_INVALID_MSG;
  } else {
    mInfo("trans:%d, start to kill", killReq.transId);
    if (mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_KILL_TRANS) == 0) {
      pTrans = mndAcquireTrans(pMnode, killReq.transId);
      if (pTrans != NULL) {
        code = mndKillTrans(pMnode, pTrans);
      }
    }
  }

  if (code != 0) {
    mError("trans:%d, failed to kill since %s", killReq.transId, terrstr());
  }

  mndReleaseTrans(pMnode, pTrans);
  return code;
}

1443 1444
/*
 * Ordering callback used to sort transaction ids in ascending order.
 *
 * Returns -1, 0 or 1 when the first id is less than, equal to or greater than
 * the second one. A sort comparator must be a consistent three-way
 * comparison; reporting only "1 or 0" makes the resulting order depend on the
 * sort implementation.
 */
static int32_t mndCompareTransId(int32_t *pTransId1, int32_t *pTransId2) {
  if (*pTransId1 < *pTransId2) return -1;
  if (*pTransId1 > *pTransId2) return 1;
  return 0;
}

S
Shengliang Guan 已提交
1445
/*
 * Re-executes every transaction currently stored in the sdb.
 *
 * The transaction ids are first collected into a temporary array, the array
 * is sorted with mndCompareTransId, and each id is then acquired, executed
 * and released in that order. Finally the sdb file is written with
 * SDB_WRITE_DELTA. Does nothing if the temporary array cannot be created.
 */
void mndTransPullup(SMnode *pMnode) {
  SSdb   *pSdb = pMnode->pSdb;
  SArray *pTransIds = taosArrayInit(sdbGetSize(pSdb, SDB_TRANS), sizeof(int32_t));
  if (pTransIds == NULL) {
    return;
  }

  // Pass 1: snapshot the ids, releasing each row right after reading it.
  void *pIter = NULL;
  for (;;) {
    STrans *pFetched = NULL;
    pIter = sdbFetch(pSdb, SDB_TRANS, pIter, (void **)&pFetched);
    if (pIter == NULL) {
      break;
    }
    taosArrayPush(pTransIds, &pFetched->id);
    sdbRelease(pSdb, pFetched);
  }

  taosArraySort(pTransIds, (__compar_fn_t)mndCompareTransId);

  // Pass 2: execute the transactions that can still be acquired.
  int32_t idx = 0;
  while (idx < taosArrayGetSize(pTransIds)) {
    int32_t *pId = taosArrayGet(pTransIds, idx);
    STrans  *pCurrent = mndAcquireTrans(pMnode, *pId);
    if (pCurrent != NULL) {
      mndTransExecute(pMnode, pCurrent);
    }
    mndReleaseTrans(pMnode, pCurrent);
    ++idx;
  }

  sdbWriteFile(pSdb, SDB_WRITE_DELTA);
  taosArrayDestroy(pTransIds);
}
S
Shengliang Guan 已提交
1473

S
Shengliang Guan 已提交
1474 1475
/*
 * Folds one snprintf() result into the running write offset of a buffer of
 * `cap` bytes, keeping the offset inside [0, cap - 1].
 *
 * snprintf() returns the length the output would have had without truncation,
 * so adding it blindly can move the offset past the end of the buffer.
 * Expects 0 <= len < cap on entry.
 */
static int32_t mndTransAdvanceDetailLen(int32_t len, int32_t written, int32_t cap) {
  if (written < 0) return len;               // output error: keep the offset where it was
  if (written >= cap - len) return cap - 1;  // truncated: the buffer is full
  return len + written;
}

/*
 * Retrieve callback for showing transactions.
 *
 * Fetches transactions through the iterator kept in pShow->pIter and appends
 * one row per transaction to pBlock until `rows` rows were produced or the
 * iterator is exhausted. Columns are filled in this order: id, created time,
 * stage, dbname1, dbname2, failed times, last execution time, last info.
 *
 * Returns the number of rows appended by this call; the same amount is added
 * to pShow->numOfRows.
 */
static int32_t mndRetrieveTrans(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode *pMnode = pReq->info.node;
  SSdb   *pSdb = pMnode->pSdb;
  int32_t numOfRows = 0;
  STrans *pTrans = NULL;
  int32_t cols = 0;

  while (numOfRows < rows) {
    pShow->pIter = sdbFetch(pSdb, SDB_TRANS, pShow->pIter, (void **)&pTrans);
    if (pShow->pIter == NULL) break;

    cols = 0;

    SColumnInfoData *pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->id, false);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->createdTime, false);

    char stage[TSDB_TRANS_STAGE_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(stage, mndTransStr(pTrans->stage), pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)stage, false);

    char dbname1[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(dbname1, mndGetDbStr(pTrans->dbname1), pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)dbname1, false);

    char dbname2[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(dbname2, mndGetDbStr(pTrans->dbname2), pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)dbname2, false);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->failedTimes, false);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)&pTrans->lastExecTime, false);

    // Build the "last info" text. Every append goes through
    // mndTransAdvanceDetailLen so that a truncated snprintf() can never move
    // the write offset outside of `detail`.
    char          lastInfo[TSDB_TRANS_ERROR_LEN + VARSTR_HEADER_SIZE] = {0};
    char          detail[TSDB_TRANS_ERROR_LEN] = {0};
    const int32_t cap = (int32_t)sizeof(detail);
    int32_t       len = 0;
    int32_t       written = snprintf(detail, cap, "action:%d code:0x%x(%s) ", pTrans->lastAction,
                                     pTrans->lastErrorNo & 0xFFFF, tstrerror(pTrans->lastErrorNo));
    len = mndTransAdvanceDetailLen(len, written, cap);

    SEpSet epset = pTrans->lastEpset;
    if (epset.numOfEps > 0) {
      written = snprintf(detail + len, cap - len, "msgType:%s numOfEps:%d inUse:%d ", TMSG_INFO(pTrans->lastMsgType),
                         epset.numOfEps, epset.inUse);
      len = mndTransAdvanceDetailLen(len, written, cap);

      // Stop early once the buffer is full; further appends would be no-ops.
      for (int32_t i = 0; i < epset.numOfEps && len < cap - 1; ++i) {
        written = snprintf(detail + len, cap - len, "ep:%d-%s:%u ", i, epset.eps[i].fqdn, epset.eps[i].port);
        len = mndTransAdvanceDetailLen(len, written, cap);
      }
    }
    STR_WITH_MAXSIZE_TO_VARSTR(lastInfo, detail, pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    colDataAppend(pColInfo, numOfRows, (const char *)lastInfo, false);

    numOfRows++;
    sdbRelease(pSdb, pTrans);
  }

  pShow->numOfRows += numOfRows;
  return numOfRows;
}

/* Cancels an in-progress transaction fetch on the mnode's sdb. */
static void mndCancelGetNextTrans(SMnode *pMnode, void *pIter) {
  sdbCancelFetch(pMnode->pSdb, pIter);
}