clientTmq.c 72.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "cJSON.h"
#include "clientInt.h"
#include "clientLog.h"
#include "parser.h"
#include "tdatablock.h"
#include "tdef.h"
#include "tglobal.h"
#include "tqueue.h"
#include "tref.h"
#include "ttimer.h"

// NOTE(review): not referenced in the visible part of this file; presumably the idle time after an
// empty block is received before the vgroup is polled again (see SMqClientVg.emptyBlockReceiveTs) -
// confirm the unit at the use site.
#define EMPTY_BLOCK_POLL_IDLE_DURATION  10
// default value of "auto.commit.interval.ms", in milliseconds
#define DEFAULT_AUTO_COMMIT_INTERVAL    5000
29

X
Xiaoyu Wang 已提交
30
struct SMqMgmt {
31 32 33
  int8_t  inited;
  tmr_h   timer;
  int32_t rsetId;
34
};
L
Liu Jicong 已提交
35

X
Xiaoyu Wang 已提交
36 37
static TdThreadOnce   tmqInit = PTHREAD_ONCE_INIT;  // initialize only once
volatile int32_t      tmqInitRes = 0;               // initialize rsp code
38
static struct SMqMgmt tmqMgmt = {0};
39

L
Liu Jicong 已提交
40 41 42 43 44 45
// Common leading fields of every response wrapper in this file. tmqFreeRspWrapper() inspects
// tmqRspType and casts the pointer to the matching concrete wrapper type.
typedef struct {
  int8_t  tmqRspType;  // one of the TMQ_MSG_TYPE__* values
  int32_t epoch;
} SMqRspWrapper;

typedef struct {
L
Liu Jicong 已提交
46 47 48
  int8_t      tmqRspType;
  int32_t     epoch;
  SMqAskEpRsp msg;
L
Liu Jicong 已提交
49 50
} SMqAskEpRspWrapper;

L
Liu Jicong 已提交
51
struct tmq_list_t {
L
Liu Jicong 已提交
52
  SArray container;
L
Liu Jicong 已提交
53
};
L
Liu Jicong 已提交
54

L
Liu Jicong 已提交
55
struct tmq_conf_t {
56 57 58 59 60 61 62 63
  char           clientId[256];
  char           groupId[TSDB_CGROUP_LEN];
  int8_t         autoCommit;
  int8_t         resetOffset;
  int8_t         withTbName;
  int8_t         snapEnable;
  int32_t        snapBatchSize;
  bool           hbBgEnable;
64 65 66 67 68
  uint16_t       port;
  int32_t        autoCommitInterval;
  char*          ip;
  char*          user;
  char*          pass;
69
  tmq_commit_cb* commitCb;
L
Liu Jicong 已提交
70
  void*          commitCbUserParam;
L
Liu Jicong 已提交
71 72 73
};

struct tmq_t {
74 75 76 77 78 79 80 81 82 83
  int64_t        refId;
  char           groupId[TSDB_CGROUP_LEN];
  char           clientId[256];
  int8_t         withTbName;
  int8_t         useSnapshot;
  int8_t         autoCommit;
  int32_t        autoCommitInterval;
  int32_t        resetOffsetCfg;
  uint64_t       consumerId;
  bool           hbBgEnable;
L
Liu Jicong 已提交
84 85
  tmq_commit_cb* commitCb;
  void*          commitCbUserParam;
L
Liu Jicong 已提交
86 87 88 89

  // status
  int8_t  status;
  int32_t epoch;
L
Liu Jicong 已提交
90 91
#if 0
  int8_t  epStatus;
L
Liu Jicong 已提交
92
  int32_t epSkipCnt;
L
Liu Jicong 已提交
93
#endif
94 95 96
  // poll info
  int64_t       pollCnt;
  int64_t       totalRows;
L
Liu Jicong 已提交
97

L
Liu Jicong 已提交
98
  // timer
99 100 101 102
  tmr_h         hbLiveTimer;
  tmr_h         epTimer;
  tmr_h         reportTimer;
  tmr_h         commitTimer;
H
Haojun Liao 已提交
103 104 105 106 107 108 109
  STscObj*      pTscObj;       // connection
  SArray*       clientTopics;  // SArray<SMqClientTopic>
  STaosQueue*   mqueue;        // queue of rsp
  STaosQall*    qall;
  STaosQueue*   delayedTask;   // delayed task queue for heartbeat and auto commit
  TdThreadMutex lock;          // used to protect the operation on each topic, when updating the epsets.
  tsem_t        rspSem;
L
Liu Jicong 已提交
110 111
};

X
Xiaoyu Wang 已提交
112 113 114 115 116 117 118 119
// Values for SMqClientVg.vgStatus.
enum {
  TMQ_VG_STATUS__IDLE = 0,
  TMQ_VG_STATUS__WAIT,
};

// Consumer life-cycle states (presumably stored in tmq_t.status - confirm at the use sites).
enum {
  TMQ_CONSUMER_STATUS__INIT = 0,
  TMQ_CONSUMER_STATUS__READY,
  TMQ_CONSUMER_STATUS__NO_TOPIC,
  TMQ_CONSUMER_STATUS__RECOVER,
};

L
Liu Jicong 已提交
124
// Task types written into tmq_t.delayedTask by the timer callbacks and dispatched by
// tmqHandleAllDelayedTask().
enum {
  TMQ_DELAYED_TASK__ASK_EP = 1,
  TMQ_DELAYED_TASK__REPORT,
  TMQ_DELAYED_TASK__COMMIT,
};

L
Liu Jicong 已提交
130
typedef struct {
H
Haojun Liao 已提交
131
  int64_t      pollCnt;
132
  int64_t      numOfRows;
L
Liu Jicong 已提交
133 134
  STqOffsetVal committedOffset;
  STqOffsetVal currentOffset;
H
Haojun Liao 已提交
135 136 137
  int32_t      vgId;
  int32_t      vgStatus;
  int32_t      vgSkipCnt;
H
Haojun Liao 已提交
138
  int64_t      emptyBlockReceiveTs; // once empty block is received, idle for ignoreCnt then start to poll data
H
Haojun Liao 已提交
139
  SEpSet       epSet;
140 141
} SMqClientVg;

L
Liu Jicong 已提交
142
typedef struct {
143 144 145
  char           topicName[TSDB_TOPIC_FNAME_LEN];
  char           db[TSDB_DB_FNAME_LEN];
  SArray*        vgs;  // SArray<SMqClientVg>
L
Liu Jicong 已提交
146
  SSchemaWrapper schema;
147 148
} SMqClientTopic;

L
Liu Jicong 已提交
149 150
typedef struct {
  int8_t          tmqRspType;
151 152
  int32_t         epoch;         // epoch can be used to guard the vgHandle
  int32_t         vgId;
L
Liu Jicong 已提交
153 154
  SMqClientVg*    vgHandle;
  SMqClientTopic* topicHandle;
H
Haojun Liao 已提交
155
  uint64_t        reqId;
156
  SEpSet*         pEpset;
L
Liu Jicong 已提交
157
  union {
L
Liu Jicong 已提交
158 159
    SMqDataRsp dataRsp;
    SMqMetaRsp metaRsp;
L
Liu Jicong 已提交
160
    STaosxRsp  taosxRsp;
L
Liu Jicong 已提交
161
  };
L
Liu Jicong 已提交
162 163
} SMqPollRspWrapper;

L
Liu Jicong 已提交
164
typedef struct {
165 166
  int64_t refId;
  int32_t epoch;
L
Liu Jicong 已提交
167 168
  tsem_t  rspSem;
  int32_t rspErr;
L
Liu Jicong 已提交
169
} SMqSubscribeCbParam;
L
Liu Jicong 已提交
170

L
Liu Jicong 已提交
171
typedef struct {
172 173
  int64_t refId;
  int32_t epoch;
L
Liu Jicong 已提交
174
  int32_t code;
L
Liu Jicong 已提交
175
  int32_t async;
X
Xiaoyu Wang 已提交
176
  tsem_t  rspSem;
177 178
} SMqAskEpCbParam;

L
Liu Jicong 已提交
179
typedef struct {
180 181
  int64_t         refId;
  int32_t         epoch;
L
Liu Jicong 已提交
182
  SMqClientVg*    pVg;
L
Liu Jicong 已提交
183
  SMqClientTopic* pTopic;
L
Liu Jicong 已提交
184
  int32_t         vgId;
L
Liu Jicong 已提交
185
  tsem_t          rspSem;
H
Haojun Liao 已提交
186
  uint64_t        requestId; // request id for debug purpose
X
Xiaoyu Wang 已提交
187
} SMqPollCbParam;
188

189
typedef struct {
190 191
  int64_t        refId;
  int32_t        epoch;
L
Liu Jicong 已提交
192 193
  int8_t         automatic;
  int8_t         async;
L
Liu Jicong 已提交
194 195
  int32_t        waitingRspNum;
  int32_t        totalRspNum;
L
Liu Jicong 已提交
196
  int32_t        rspErr;
197
  tmq_commit_cb* userCb;
L
Liu Jicong 已提交
198 199 200 201
  /*SArray*        successfulOffsets;*/
  /*SArray*        failedOffsets;*/
  void*  userParam;
  tsem_t rspSem;
202 203 204 205 206
} SMqCommitCbParamSet;

typedef struct {
  SMqCommitCbParamSet* params;
  STqOffset*           pOffset;
H
Haojun Liao 已提交
207 208 209
  char                 topicName[TSDB_TOPIC_FNAME_LEN];
  int32_t              vgId;
  tmq_t*               pTmq;
210
} SMqCommitCbParam;
211

212
static int32_t tmqAskEp(tmq_t* tmq, bool async);
213 214
static int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg);
static int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet);
215 216
static int32_t doSendCommitMsg(tmq_t* tmq, SMqClientVg* pVg, const char* pTopicName, SMqCommitCbParamSet* pParamSet,
                               int32_t index, int32_t totalVgroups);
217
static void tmqCommitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId);
218

219
tmq_conf_t* tmq_conf_new() {
wafwerar's avatar
wafwerar 已提交
220
  tmq_conf_t* conf = taosMemoryCalloc(1, sizeof(tmq_conf_t));
221 222 223 224 225
  if (conf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return conf;
  }

226
  conf->withTbName = false;
L
Liu Jicong 已提交
227
  conf->autoCommit = true;
228
  conf->autoCommitInterval = DEFAULT_AUTO_COMMIT_INTERVAL;
229
  conf->resetOffset = TMQ_OFFSET__RESET_EARLIEAST;
230
  conf->hbBgEnable = true;
231

232 233 234
  return conf;
}

L
Liu Jicong 已提交
235
// Release a configuration created by tmq_conf_new(), including the heap copies of
// ip/user/pass made by tmq_conf_set(). A NULL conf is ignored.
void tmq_conf_destroy(tmq_conf_t* conf) {
  if (conf == NULL) {
    return;
  }

  if (conf->ip) {
    taosMemoryFree(conf->ip);
  }
  if (conf->user) {
    taosMemoryFree(conf->user);
  }
  if (conf->pass) {
    taosMemoryFree(conf->pass);
  }
  taosMemoryFree(conf);
}

// Parse a case-insensitive "true"/"false" literal into *pOut; returns false for any other text.
static bool tmqConfParseBool(const char* value, bool* pOut) {
  if (strcasecmp(value, "true") == 0) {
    *pOut = true;
    return true;
  }
  if (strcasecmp(value, "false") == 0) {
    *pOut = false;
    return true;
  }
  return false;
}

// Set one configuration entry. Keys are matched case-insensitively.
// Returns TMQ_CONF_OK when the value was stored, TMQ_CONF_INVALID when an argument is NULL or the
// value is not acceptable for the key, and TMQ_CONF_UNKNOWN for an unrecognised key.
tmq_conf_res_t tmq_conf_set(tmq_conf_t* conf, const char* key, const char* value) {
  if (conf == NULL || key == NULL || value == NULL) {
    return TMQ_CONF_INVALID;
  }

  bool flag = false;

  if (strcasecmp(key, "group.id") == 0) {
    tstrncpy(conf->groupId, value, TSDB_CGROUP_LEN);
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "client.id") == 0) {
    tstrncpy(conf->clientId, value, sizeof(conf->clientId));
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "enable.auto.commit") == 0) {
    if (!tmqConfParseBool(value, &flag)) return TMQ_CONF_INVALID;
    conf->autoCommit = flag;
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "auto.commit.interval.ms") == 0) {
    conf->autoCommitInterval = taosStr2int64(value);
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "auto.offset.reset") == 0) {
    if (strcasecmp(value, "none") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_NONE;
    } else if (strcasecmp(value, "earliest") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_EARLIEAST;
    } else if (strcasecmp(value, "latest") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_LATEST;
    } else {
      return TMQ_CONF_INVALID;
    }
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "msg.with.table.name") == 0) {
    if (!tmqConfParseBool(value, &flag)) return TMQ_CONF_INVALID;
    conf->withTbName = flag;
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "experimental.snapshot.enable") == 0) {
    if (!tmqConfParseBool(value, &flag)) return TMQ_CONF_INVALID;
    conf->snapEnable = flag;
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "experimental.snapshot.batch.size") == 0) {
    conf->snapBatchSize = taosStr2int64(value);
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "enable.heartbeat.background") == 0) {
    if (!tmqConfParseBool(value, &flag)) return TMQ_CONF_INVALID;
    conf->hbBgEnable = flag;
    return TMQ_CONF_OK;
  }

  // The connection strings are heap copies; drop a previously stored copy first so that setting
  // the same key twice does not leak it.
  if (strcasecmp(key, "td.connect.ip") == 0) {
    taosMemoryFreeClear(conf->ip);
    conf->ip = taosStrdup(value);
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "td.connect.user") == 0) {
    taosMemoryFreeClear(conf->user);
    conf->user = taosStrdup(value);
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "td.connect.pass") == 0) {
    taosMemoryFreeClear(conf->pass);
    conf->pass = taosStrdup(value);
    return TMQ_CONF_OK;
  }

  if (strcasecmp(key, "td.connect.port") == 0) {
    conf->port = taosStr2int64(value);
    return TMQ_CONF_OK;
  }

  // accepted for compatibility, but the value is not stored
  if (strcasecmp(key, "td.connect.db") == 0) {
    return TMQ_CONF_OK;
  }

  return TMQ_CONF_UNKNOWN;
}

tmq_list_t* tmq_list_new() {
L
Liu Jicong 已提交
362
  return (tmq_list_t*)taosArrayInit(0, sizeof(void*));
363 364
}

L
Liu Jicong 已提交
365 366
// Append a copy of the topic name `src` to the list.
// Names that do not start with a backquote are stored lower-cased.
// Returns 0 on success, -1 when list is NULL, src is NULL or empty, or memory cannot be obtained.
int32_t tmq_list_append(tmq_list_t* list, const char* src) {
  if (list == NULL) return -1;
  if (src == NULL || src[0] == 0) return -1;

  SArray* container = &list->container;

  char* topic = taosStrdup(src);
  if (topic == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (topic[0] != '`') {
    strtolower(topic, src);
  }

  if (taosArrayPush(container, &topic) == NULL) {
    // the list did not take ownership of the copy
    taosMemoryFree(topic);
    return -1;
  }
  return 0;
}

L
Liu Jicong 已提交
376
// Destroy the list; each stored topic string is released with taosMemoryFree.
void tmq_list_destroy(tmq_list_t* list) {
  SArray* container = &list->container;
  taosArrayDestroyP(container, taosMemoryFree);
}

L
Liu Jicong 已提交
381 382 383 384 385 386 387 388 389 390
// Number of topic names currently stored in the list.
int32_t tmq_list_get_size(const tmq_list_t* list) {
  return taosArrayGetSize(&list->container);
}

// Expose the list's backing storage as an array of C strings. The pointer is the array's own
// pData buffer, not a copy.
char** tmq_list_to_c_array(const tmq_list_t* list) {
  return list->container.pData;
}

391 392 393 394 395
// Look up the vgroup `vgId` of the topic named `pName` in pTopicList (SArray<SMqClientTopic>).
// On a hit, returns the vgroup and stores its position within the topic's vgroup array in *index.
// On a miss, returns NULL and leaves *index at -1.
// *numOfVgroups receives the vgroup count of the last topic whose name matched (0 if none matched).
static SMqClientVg* foundClientVg(SArray* pTopicList, const char* pName, int32_t vgId, int32_t* index, int32_t* numOfVgroups) {
  int32_t numOfTopics = taosArrayGetSize(pTopicList);
  *index = -1;
  *numOfVgroups = 0;

  for (int32_t i = 0; i < numOfTopics; ++i) {
    SMqClientTopic* pTopic = taosArrayGet(pTopicList, i);
    if (strcmp(pTopic->topicName, pName) != 0) {
      continue;
    }

    *numOfVgroups = taosArrayGetSize(pTopic->vgs);
    for (int32_t j = 0; j < (*numOfVgroups); ++j) {
      SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, j);
      if (pClientVg->vgId == vgId) {
        *index = j;
        return pClientVg;
      }
    }
  }

  return NULL;
}
414

415 416 417
// Two problems arise in this callback:
// 1. Update of the epset: nothing to do here, the response of the poll request handles it automatically.
// 2. Commit failure: this one still needs to be resolved.
H
Haojun Liao 已提交
418
// Response callback of a commit-offset message sent by doSendCommitMsg().
// param is the SMqCommitCbParam built for that message; the struct itself is not freed here
// (doSendCommitMsg() registers taosMemoryFree as paramFreeFp for it).
// Frees the offset and the response buffers, then counts the response down on the shared set.
// Always returns 0.
static int32_t tmqCommitCb(void* param, SDataBuf* pBuf, int32_t code) {
  SMqCommitCbParam*    pParam = (SMqCommitCbParam*)param;
  SMqCommitCbParamSet* pParamSet = (SMqCommitCbParamSet*)pParam->params;

  // TODO: `code` is ignored, so a failed commit is not retried. A retry would have to look the
  // vgroup up again under pTmq->lock (foundClientVg) and resend through doSendCommitMsg().
  // todo replace the pTmq with refId

  taosMemoryFree(pParam->pOffset);
  if (pBuf != NULL) {  // same guard as tmqHbCb()
    taosMemoryFree(pBuf->pData);
    taosMemoryFree(pBuf->pEpSet);
  }

  tmqCommitRspCountDown(pParamSet, pParam->pTmq->consumerId, pParam->topicName, pParam->vgId);
  return 0;
}

460 461
// Build and asynchronously send one commit-offset message for pVg->currentOffset.
// tmq/pVg/pTopicName identify the consumer, vgroup and topic; pParamSet is the set shared by all
// messages of the commit, and its waitingRspNum/totalRspNum are incremented just before sending.
// index/totalVgroups are used for logging only.
// Returns 0 once the message was handed to the transport, -1 if it could not be built; on -1
// nothing was sent, the counters are untouched and every temporary buffer has been released.
static int32_t doSendCommitMsg(tmq_t* tmq, SMqClientVg* pVg, const char* pTopicName, SMqCommitCbParamSet* pParamSet,
                               int32_t index, int32_t totalVgroups) {
  STqOffset* pOffset = taosMemoryCalloc(1, sizeof(STqOffset));
  if (pOffset == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  pOffset->val = pVg->currentOffset;

  // subKey = <groupId> TMQ_SEPARATOR <topicName>
  int32_t groupLen = strlen(tmq->groupId);
  memcpy(pOffset->subKey, tmq->groupId, groupLen);
  pOffset->subKey[groupLen] = TMQ_SEPARATOR;
  strcpy(pOffset->subKey + groupLen + 1, pTopicName);

  int32_t len = 0;
  int32_t code = 0;
  tEncodeSize(tEncodeSTqOffset, pOffset, len, code);
  if (code < 0) {
    taosMemoryFree(pOffset);  // was leaked on this path
    return -1;
  }

  void* buf = taosMemoryCalloc(1, sizeof(SMsgHead) + len);
  if (buf == NULL) {
    taosMemoryFree(pOffset);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  ((SMsgHead*)buf)->vgId = htonl(pVg->vgId);

  // the encoded offset follows the message head
  void* abuf = POINTER_SHIFT(buf, sizeof(SMsgHead));

  SEncoder encoder;
  tEncoderInit(&encoder, abuf, len);
  tEncodeSTqOffset(&encoder, pOffset);
  tEncoderClear(&encoder);

  // build param
  SMqCommitCbParam* pParam = taosMemoryCalloc(1, sizeof(SMqCommitCbParam));
  if (pParam == NULL) {
    taosMemoryFree(pOffset);
    taosMemoryFree(buf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  pParam->params = pParamSet;
  pParam->pOffset = pOffset;  // released by tmqCommitCb()
  pParam->vgId = pVg->vgId;
  pParam->pTmq = tmq;

  tstrncpy(pParam->topicName, pTopicName, tListLen(pParam->topicName));

  // build send info
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (pMsgSendInfo == NULL) {
    taosMemoryFree(pOffset);
    taosMemoryFree(buf);
    taosMemoryFree(pParam);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  pMsgSendInfo->msgInfo = (SDataBuf){
      .pData = buf,
      .len = sizeof(SMsgHead) + len,
      .handle = NULL,
  };

  pMsgSendInfo->requestId = generateRequestId();
  pMsgSendInfo->requestObjRefId = 0;
  pMsgSendInfo->param = pParam;
  pMsgSendInfo->paramFreeFp = taosMemoryFree;
  pMsgSendInfo->fp = tmqCommitCb;
  pMsgSendInfo->msgType = TDMT_VND_TMQ_COMMIT_OFFSET;

  // account for the response before the message can possibly be answered
  atomic_add_fetch_32(&pParamSet->waitingRspNum, 1);
  atomic_add_fetch_32(&pParamSet->totalRspNum, 1);

  SEp* pEp = GET_ACTIVE_EP(&pVg->epSet);
  char offsetBuf[80] = {0};
  tFormatOffset(offsetBuf, tListLen(offsetBuf), &pOffset->val);

  char commitBuf[80] = {0};
  tFormatOffset(commitBuf, tListLen(commitBuf), &pVg->committedOffset);
  tscDebug("consumer:0x%" PRIx64 " topic:%s on vgId:%d send offset:%s prev:%s, ep:%s:%d, ordinal:%d/%d, req:0x%" PRIx64,
           tmq->consumerId, pOffset->subKey, pVg->vgId, offsetBuf, commitBuf, pEp->fqdn, pEp->port, index + 1,
           totalVgroups, pMsgSendInfo->requestId);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, pMsgSendInfo);
  return 0;
}

H
Haojun Liao 已提交
552
// Commit the current offset of the single topic/vgroup that `msg` was polled from.
// msg must be a TMQ data, meta or metadata result. async selects between blocking until the
// response arrives (0) and returning immediately (non-zero). userCb/userParam are invoked from
// here only when sending fails in async mode.
// Returns:
//   TSDB_CODE_TMQ_INVALID_MSG  msg is not a TMQ result
//   -1                         out of memory, or (sync mode) the commit message could not be sent
//   0                          nothing needed committing, or the async request was issued / failed
//                              (a failure is reported through userCb)
//   pParamSet->rspErr          sync mode, after the response arrived
static int32_t tmqCommitMsgImpl(tmq_t* tmq, const TAOS_RES* msg, int8_t async, tmq_commit_cb* userCb, void* userParam) {
  char*   topic;
  int32_t vgId;
  if (TD_RES_TMQ(msg)) {
    SMqRspObj* pRspObj = (SMqRspObj*)msg;
    topic = pRspObj->topic;
    vgId = pRspObj->vgId;
  } else if (TD_RES_TMQ_META(msg)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)msg;
    topic = pMetaRspObj->topic;
    vgId = pMetaRspObj->vgId;
  } else if (TD_RES_TMQ_METADATA(msg)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)msg;
    topic = pRspObj->topic;
    vgId = pRspObj->vgId;
  } else {
    return TSDB_CODE_TMQ_INVALID_MSG;
  }

  SMqCommitCbParamSet* pParamSet = taosMemoryCalloc(1, sizeof(SMqCommitCbParamSet));
  if (pParamSet == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  pParamSet->refId = tmq->refId;
  pParamSet->epoch = tmq->epoch;
  pParamSet->automatic = 0;
  pParamSet->async = async;
  pParamSet->userCb = userCb;
  pParamSet->userParam = userParam;
  tsem_init(&pParamSet->rspSem, 0, 0);

  int32_t code = -1;
  bool    attempted = false;  // a commit message was attempted for the matching vgroup
  bool    sent = false;       // ... and it was handed to the transport

  taosThreadMutexLock(&tmq->lock);
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);

  tscDebug("consumer:0x%" PRIx64 " user invoked commit offset for %d", tmq->consumerId, numOfTopics);
  for (int32_t i = 0; i < numOfTopics && !attempted; i++) {
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
    if (strcmp(pTopic->topicName, topic) != 0) {
      continue;
    }

    int32_t numOfVgroups = taosArrayGetSize(pTopic->vgs);
    for (int32_t j = 0; j < numOfVgroups; j++) {
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);
      if (pVg->vgId != vgId) {
        continue;
      }

      // only commit when there is an offset that differs from the last committed one
      if (pVg->currentOffset.type > 0 && !tOffsetEqual(&pVg->currentOffset, &pVg->committedOffset)) {
        attempted = true;
        sent = (doSendCommitMsg(tmq, pVg, pTopic->topicName, pParamSet, j, numOfVgroups) >= 0);
        break;
      }
    }
  }
  taosThreadMutexUnlock(&tmq->lock);

  if (!sent) {
    // No response will ever arrive for this set, so it is released here.
    tsem_destroy(&pParamSet->rspSem);
    taosMemoryFree(pParamSet);

    if (!attempted) {
      return 0;  // nothing to commit
    }
    if (async) {
      if (userCb != NULL) {
        userCb(tmq, code, userParam);
      }
      return 0;
    }
    return code;  // sync mode: report the failure instead of 0
  }

  if (async) {
    // NOTE(review): pParamSet is deliberately not touched any more on this path; it is presumably
    // released by the response handling (tmqCommitDone) - confirm.
    return 0;
  }

  tsem_wait(&pParamSet->rspSem);
  code = pParamSet->rspErr;
  tsem_destroy(&pParamSet->rspSem);
  taosMemoryFree(pParamSet);
  return code;
}

643
// Commit the current offset of every vgroup of every subscribed topic whose offset differs from
// the last committed one.
// automatic: non-zero when triggered by the auto-commit timer (tmq->commitCb is used for error
//            reporting instead of userCb).
// async:     zero blocks until all responses have arrived.
// Returns -1 when the parameter set cannot be allocated, 0 when no message had to be sent,
// pParamSet->rspErr in sync mode, and otherwise the status of the last send attempt.
static int32_t doAutoCommit(tmq_t* tmq, int8_t automatic, int8_t async, tmq_commit_cb* userCb, void* userParam) {
  int32_t code = -1;

  SMqCommitCbParamSet* pParamSet = taosMemoryCalloc(1, sizeof(SMqCommitCbParamSet));
  if (pParamSet == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    if (async) {
      // either callback may be unset; do not call through a NULL pointer
      if (automatic) {
        if (tmq->commitCb != NULL) {
          tmq->commitCb(tmq, code, tmq->commitCbUserParam);
        }
      } else if (userCb != NULL) {
        userCb(tmq, code, userParam);
      }
    }
    return -1;
  }

  pParamSet->refId = tmq->refId;
  pParamSet->epoch = tmq->epoch;

  pParamSet->automatic = automatic;
  pParamSet->async = async;
  pParamSet->userCb = userCb;
  pParamSet->userParam = userParam;
  tsem_init(&pParamSet->rspSem, 0, 0);

  // init as 1 to prevent concurrency issue
  pParamSet->waitingRspNum = 1;

  taosThreadMutexLock(&tmq->lock);
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
  tscDebug("consumer:0x%" PRIx64 " start to commit offset for %d topics", tmq->consumerId, numOfTopics);

  for (int32_t i = 0; i < numOfTopics; i++) {
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
    int32_t         numOfVgroups = taosArrayGetSize(pTopic->vgs);

    tscDebug("consumer:0x%" PRIx64 " commit offset for topics:%s, numOfVgs:%d", tmq->consumerId, pTopic->topicName,
             numOfVgroups);
    for (int32_t j = 0; j < numOfVgroups; j++) {
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);

      if (pVg->currentOffset.type > 0 && !tOffsetEqual(&pVg->currentOffset, &pVg->committedOffset)) {
        code = doSendCommitMsg(tmq, pVg, pTopic->topicName, pParamSet, j, numOfVgroups);
        if (code != TSDB_CODE_SUCCESS) {
          tscError("consumer:0x%" PRIx64 " topic:%s vgId:%d offset:%" PRId64 " failed, code:%s ordinal:%d/%d",
                   tmq->consumerId, pTopic->topicName, pVg->vgId, pVg->committedOffset.version, tstrerror(terrno),
                   j + 1, numOfVgroups);
          continue;
        }

        // update the offset value.
        pVg->committedOffset = pVg->currentOffset;
      } else {
        tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d, no commit, current:%" PRId64 ", ordinal:%d/%d",
                 tmq->consumerId, pTopic->topicName, pVg->vgId, pVg->currentOffset.version, j + 1, numOfVgroups);
      }
    }
  }

  tscDebug("consumer:0x%" PRIx64 " total commit:%d for %d topics", tmq->consumerId, pParamSet->waitingRspNum - 1,
           numOfTopics);
  taosThreadMutexUnlock(&tmq->lock);

  // no request is sent
  if (pParamSet->totalRspNum == 0) {
    tsem_destroy(&pParamSet->rspSem);
    taosMemoryFree(pParamSet);
    return 0;
  }

  // count down since waiting rsp num init as 1
  tmqCommitRspCountDown(pParamSet, tmq->consumerId, "", 0);

  if (!async) {
    tsem_wait(&pParamSet->rspSem);
    code = pParamSet->rspErr;
    tsem_destroy(&pParamSet->rspSem);
    taosMemoryFree(pParamSet);
  }

  return code;
}

730 731
// Entry point for all commits: with a message, commit that message's topic/vgroup
// (tmqCommitMsgImpl, `automatic` is not used); without one, commit every vgroup of every topic
// (doAutoCommit). Returns the result of the selected implementation.
static int32_t tmqCommitInner(tmq_t* tmq, const TAOS_RES* msg, int8_t automatic, int8_t async, tmq_commit_cb* userCb,
                              void* userParam) {
  if (msg) {  // user invoked commit
    return tmqCommitMsgImpl(tmq, msg, async, userCb, userParam);
  }

  // this for auto commit
  return doAutoCommit(tmq, automatic, async, userCb, userParam);
}

739 740
static void generateTimedTask(int64_t refId, int32_t type) {
  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
741
  if (tmq != NULL) {
S
Shengliang Guan 已提交
742
    int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
743
    *pTaskType = type;
744 745 746
    taosWriteQitem(tmq->delayedTask, pTaskType);
    tsem_post(&tmq->rspSem);
  }
747
  taosReleaseRef(tmqMgmt.rsetId, refId);
748 749 750 751 752
}

// Timer callback: queue an ask-ep task for the consumer whose refId is stored in param.
// param is a heap-allocated int64_t owned by this callback and freed here. tmrId is unused.
void tmqAssignAskEpTask(void* param, void* tmrId) {
  int64_t refId = *(int64_t*)param;
  generateTimedTask(refId, TMQ_DELAYED_TASK__ASK_EP);
  taosMemoryFree(param);
}

void tmqAssignDelayedCommitTask(void* param, void* tmrId) {
757
  int64_t refId = *(int64_t*)param;
758
  generateTimedTask(refId, TMQ_DELAYED_TASK__COMMIT);
759
  taosMemoryFree(param);
L
Liu Jicong 已提交
760 761 762
}

void tmqAssignDelayedReportTask(void* param, void* tmrId) {
763 764 765
  int64_t refId = *(int64_t*)param;
  tmq_t*  tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq != NULL) {
S
Shengliang Guan 已提交
766
    int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
767 768 769 770
    *pTaskType = TMQ_DELAYED_TASK__REPORT;
    taosWriteQitem(tmq->delayedTask, pTaskType);
    tsem_post(&tmq->rspSem);
  }
771 772

  taosReleaseRef(tmqMgmt.rsetId, refId);
773
  taosMemoryFree(param);
L
Liu Jicong 已提交
774 775
}

776
// Response callback of the heartbeat request: the response content is not inspected, its buffers
// are just released. param and code are unused. Always returns 0.
int32_t tmqHbCb(void* param, SDataBuf* pMsg, int32_t code) {
  if (pMsg) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
  }
  return 0;
}

void tmqSendHbReq(void* param, void* tmrId) {
785
  int64_t refId = *(int64_t*)param;
786

787 788
  tmq_t*  tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) {
L
Liu Jicong 已提交
789
    taosMemoryFree(param);
790 791
    return;
  }
D
dapan1121 已提交
792 793 794 795 796

  SMqHbReq req = {0};
  req.consumerId = tmq->consumerId;
  req.epoch = tmq->epoch;

L
Liu Jicong 已提交
797
  int32_t tlen = tSerializeSMqHbReq(NULL, 0, &req);
D
dapan1121 已提交
798 799
  if (tlen < 0) {
    tscError("tSerializeSMqHbReq failed");
800
    goto OVER;
D
dapan1121 已提交
801
  }
802

L
Liu Jicong 已提交
803
  void* pReq = taosMemoryCalloc(1, tlen);
D
dapan1121 已提交
804 805
  if (tlen < 0) {
    tscError("failed to malloc MqHbReq msg, size:%d", tlen);
806
    goto OVER;
D
dapan1121 已提交
807
  }
808

D
dapan1121 已提交
809 810 811
  if (tSerializeSMqHbReq(pReq, tlen, &req) < 0) {
    tscError("tSerializeSMqHbReq %d failed", tlen);
    taosMemoryFree(pReq);
812
    goto OVER;
D
dapan1121 已提交
813
  }
814 815 816 817

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pReq);
L
Liu Jicong 已提交
818
    goto OVER;
819
  }
820

821 822
  sendInfo->msgInfo = (SDataBuf){
      .pData = pReq,
D
dapan1121 已提交
823
      .len = tlen,
824 825 826 827 828 829 830
      .handle = NULL,
  };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = NULL;
  sendInfo->fp = tmqHbCb;
L
Liu Jicong 已提交
831
  sendInfo->msgType = TDMT_MND_TMQ_HB;
832 833 834 835 836 837 838

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

OVER:
839
  taosTmrReset(tmqSendHbReq, 1000, param, tmqMgmt.timer, &tmq->hbLiveTimer);
840
  taosReleaseRef(tmqMgmt.rsetId, refId);
841 842
}

843
// Drain the consumer's delayed-task queue and run every task:
//   ASK_EP  -> tmqAskEp(async), then re-arm the ep timer for 1 s
//   COMMIT  -> automatic async commit, then re-arm the commit timer for autoCommitInterval ms
//   REPORT  -> no action
// Each re-armed timer receives a freshly allocated int64_t holding the consumer's refId, which
// the timer callback frees. If that allocation fails, the task still runs but its timer is not
// re-armed.
// Returns TSDB_CODE_OUT_OF_MEMORY when the batch container cannot be allocated, otherwise
// TSDB_CODE_SUCCESS / 0.
int32_t tmqHandleAllDelayedTask(tmq_t* pTmq) {
  STaosQall* qall = taosAllocateQall();
  if (qall == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  taosReadAllQitems(pTmq->delayedTask, qall);

  if (qall->numOfItems == 0) {
    taosFreeQall(qall);
    return TSDB_CODE_SUCCESS;
  }

  tscDebug("consumer:0x%" PRIx64 " handle delayed %d tasks before poll data", pTmq->consumerId, qall->numOfItems);
  int8_t* pTaskType = NULL;
  taosGetQitem(qall, (void**)&pTaskType);

  while (pTaskType != NULL) {
    if (*pTaskType == TMQ_DELAYED_TASK__ASK_EP) {
      tmqAskEp(pTmq, true);

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
      if (pRefId == NULL) {
        tscError("consumer:0x%" PRIx64 " failed to re-arm ask-ep timer, out of memory", pTmq->consumerId);
      } else {
        *pRefId = pTmq->refId;

        tscDebug("consumer:0x%" PRIx64 " retrieve ep from mnode in 1s", pTmq->consumerId);
        taosTmrReset(tmqAssignAskEpTask, 1000, pRefId, tmqMgmt.timer, &pTmq->epTimer);
      }
    } else if (*pTaskType == TMQ_DELAYED_TASK__COMMIT) {
      tmqCommitInner(pTmq, NULL, 1, 1, pTmq->commitCb, pTmq->commitCbUserParam);

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
      if (pRefId == NULL) {
        tscError("consumer:0x%" PRIx64 " failed to re-arm commit timer, out of memory", pTmq->consumerId);
      } else {
        *pRefId = pTmq->refId;

        tscDebug("consumer:0x%" PRIx64 " commit to vnode(s) in %.2fs", pTmq->consumerId,
                 pTmq->autoCommitInterval / 1000.0);
        taosTmrReset(tmqAssignDelayedCommitTask, pTmq->autoCommitInterval, pRefId, tmqMgmt.timer, &pTmq->commitTimer);
      }
    } else if (*pTaskType == TMQ_DELAYED_TASK__REPORT) {
      // nothing to do for report tasks
    }

    taosFreeQitem(pTaskType);
    taosGetQitem(qall, (void**)&pTaskType);
  }

  taosFreeQall(qall);
  return 0;
}

885
// Releases the payload owned by a response wrapper according to its tmqRspType.
// The wrapper itself is NOT freed here (callers release it with taosFreeQitem). Always returns NULL.
static void* tmqFreeRspWrapper(SMqRspWrapper* rspWrapper) {
  const int8_t type = rspWrapper->tmqRspType;

  if (type == TMQ_MSG_TYPE__END_RSP) {
    // an end marker carries no payload
    return NULL;
  }

  if (type == TMQ_MSG_TYPE__EP_RSP) {
    tDeleteSMqAskEpRsp(&((SMqAskEpRspWrapper*)rspWrapper)->msg);
    return NULL;
  }

  if (type != TMQ_MSG_TYPE__POLL_RSP && type != TMQ_MSG_TYPE__POLL_META_RSP && type != TMQ_MSG_TYPE__TAOSX_RSP) {
    // unknown type: nothing is released
    return NULL;
  }

  // all poll-style responses share the wrapper layout and own the epset
  SMqPollRspWrapper* pPoll = (SMqPollRspWrapper*)rspWrapper;
  taosMemoryFreeClear(pPoll->pEpset);

  if (type == TMQ_MSG_TYPE__POLL_RSP) {
    taosArrayDestroyP(pPoll->dataRsp.blockData, taosMemoryFree);
    taosArrayDestroy(pPoll->dataRsp.blockDataLen);
    taosArrayDestroyP(pPoll->dataRsp.blockTbName, taosMemoryFree);
    taosArrayDestroyP(pPoll->dataRsp.blockSchema, (FDelete)tDeleteSSchemaWrapper);
  } else if (type == TMQ_MSG_TYPE__POLL_META_RSP) {
    taosMemoryFree(pPoll->metaRsp.metaRsp);
  } else {
    // TMQ_MSG_TYPE__TAOSX_RSP: data blocks plus the create-table requests
    taosArrayDestroyP(pPoll->taosxRsp.blockData, taosMemoryFree);
    taosArrayDestroy(pPoll->taosxRsp.blockDataLen);
    taosArrayDestroyP(pPoll->taosxRsp.blockTbName, taosMemoryFree);
    taosArrayDestroyP(pPoll->taosxRsp.blockSchema, (FDelete)tDeleteSSchemaWrapper);
    taosArrayDestroy(pPoll->taosxRsp.createTableLen);
    taosArrayDestroyP(pPoll->taosxRsp.createTableReq, taosMemoryFree);
  }

  return NULL;
}

L
Liu Jicong 已提交
920
// Discards every response that has not been handed to the user yet: first whatever is left in the
// consumer's qall batch, then everything still sitting in mqueue (moved into qall and drained).
void tmqClearUnhandleMsg(tmq_t* tmq) {
  SMqRspWrapper* pItem = NULL;

  // 1. items already fetched into the batch container
  for (taosGetQitem(tmq->qall, (void**)&pItem); pItem; taosGetQitem(tmq->qall, (void**)&pItem)) {
    tmqFreeRspWrapper(pItem);
    taosFreeQitem(pItem);
  }

  // 2. items still pending in the message queue
  pItem = NULL;
  taosReadAllQitems(tmq->mqueue, tmq->qall);
  for (taosGetQitem(tmq->qall, (void**)&pItem); pItem; taosGetQitem(tmq->qall, (void**)&pItem)) {
    tmqFreeRspWrapper(pItem);
    taosFreeQitem(pItem);
  }
}

D
dapan1121 已提交
945
// Response callback of the subscribe request sent by tmq_subscribe().
//
// param : the SMqSubscribeCbParam of the waiting tmq_subscribe() call
// pMsg  : response buffers; both pData and pEpSet are released here, matching the other response
//         callbacks in this file (tmqPollCb, tmqAskEpCb)
// code  : result of the request, stored into param->rspErr
//
// Posts param->rspSem so that the waiting caller can continue. Always returns 0.
int32_t tmqSubscribeCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqSubscribeCbParam* pParam = (SMqSubscribeCbParam*)param;
  pParam->rspErr = code;

  if (pMsg != NULL) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
  }

  // pParam must not be touched after the post: the waiter owns it
  tsem_post(&pParam->rspSem);
  return 0;
}
953

L
Liu Jicong 已提交
954
// Appends the names of the topics the consumer currently holds to *topics.
//
// tmq    : consumer handle
// topics : in/out list; when *topics is NULL a new list is created with tmq_list_new()
//
// The part of each stored topic name after the first '.' is appended; a stored name without
// a '.' is appended unchanged.
// Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY if the list cannot be created.
int32_t tmq_subscription(tmq_t* tmq, tmq_list_t** topics) {
  if (*topics == NULL) {
    *topics = tmq_list_new();
    if (*topics == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
  for (int32_t i = 0; i < numOfTopics; i++) {
    SMqClientTopic* topic = taosArrayGet(tmq->clientTopics, i);

    // strchr() yields NULL when there is no '.', so never blindly add 1 to its result
    char* dot = strchr(topic->topicName, '.');
    char* shortName = (dot != NULL) ? dot + 1 : topic->topicName;
    tmq_list_append(*topics, shortName);
  }

  return 0;
}

L
Liu Jicong 已提交
965
// Unsubscribes from all topics by subscribing to an empty topic list.
// While the result is TSDB_CODE_MND_CONSUMER_NOT_READY the request is repeated after a 500ms pause,
// for at most 7 attempts in total. Returns the result of the last tmq_subscribe() call.
int32_t tmq_unsubscribe(tmq_t* tmq) {
  tmq_list_t* emptyTopics = tmq_list_new();
  int32_t     code = tmq_subscribe(tmq, emptyTopics);

  for (int32_t attempt = 0; code == TSDB_CODE_MND_CONSUMER_NOT_READY && attempt <= 5; ++attempt) {
    taosMsleep(500);
    code = tmq_subscribe(tmq, emptyTopics);
  }

  tmq_list_destroy(emptyTopics);
  return code;
}

983 984 985 986 987 988
static void freeClientVgImpl(void* param) {
  SMqClientTopic* pTopic = param;
  taosMemoryFreeClear(pTopic->schema.pSchema);
  taosArrayDestroy(pTopic->vgs);
}

989
void tmqFreeImpl(void* handle) {
990 991
  tmq_t*  tmq = (tmq_t*)handle;
  int64_t id = tmq->consumerId;
L
Liu Jicong 已提交
992

993
  // TODO stop timer
L
Liu Jicong 已提交
994 995 996 997
  if (tmq->mqueue) {
    tmqClearUnhandleMsg(tmq);
    taosCloseQueue(tmq->mqueue);
  }
L
Liu Jicong 已提交
998

H
Haojun Liao 已提交
999 1000 1001 1002 1003
  if (tmq->delayedTask) {
    taosCloseQueue(tmq->delayedTask);
  }

  taosFreeQall(tmq->qall);
1004
  tsem_destroy(&tmq->rspSem);
H
Haojun Liao 已提交
1005
  taosThreadMutexDestroy(&tmq->lock);
L
Liu Jicong 已提交
1006

1007
  taosArrayDestroyEx(tmq->clientTopics, freeClientVgImpl);
1008 1009
  taos_close_internal(tmq->pTscObj);
  taosMemoryFree(tmq);
1010 1011

  tscDebug("consumer:0x%" PRIx64 " closed", id);
L
Liu Jicong 已提交
1012 1013
}

1014 1015 1016 1017 1018 1019 1020 1021 1022
static void tmqMgmtInit(void) {
  tmqInitRes = 0;
  tmqMgmt.timer = taosTmrInit(1000, 100, 360000, "TMQ");

  if (tmqMgmt.timer == NULL) {
    tmqInitRes = TSDB_CODE_OUT_OF_MEMORY;
  }

  tmqMgmt.rsetId = taosOpenRef(10000, tmqFreeImpl);
1023
  if (tmqMgmt.rsetId < 0) {
1024 1025 1026 1027
    tmqInitRes = terrno;
  }
}

L
Liu Jicong 已提交
1028
// Creates a consumer from the given configuration.
//
// conf      : consumer configuration; conf->groupId must not be empty
// errstr    : not written by this function at present
// errstrLen : not used by this function at present
//
// Steps: one-time module init, allocation of the queues/containers, copy of the configuration,
// semaphore init, connection to the server, registration in the tmq reference set and, when
// conf->hbBgEnable is set, start of the background heartbeat timer.
//
// Returns the new consumer, or NULL on failure (terrno is set on the paths that assign it below).
tmq_t* tmq_consumer_new(tmq_conf_t* conf, char* errstr, int32_t errstrLen) {
  taosThreadOnce(&tmqInit, tmqMgmtInit);
  if (tmqInitRes != 0) {
    terrno = tmqInitRes;
    return NULL;
  }

  tmq_t* pTmq = taosMemoryCalloc(1, sizeof(tmq_t));
  if (pTmq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    tscError("failed to create consumer, groupId:%s, code:%s", conf->groupId, terrstr());
    return NULL;
  }

  const char* user = conf->user == NULL ? TSDB_DEFAULT_USER : conf->user;
  const char* pass = conf->pass == NULL ? TSDB_DEFAULT_PASS : conf->pass;

  pTmq->clientTopics = taosArrayInit(0, sizeof(SMqClientTopic));
  pTmq->mqueue = taosOpenQueue();
  pTmq->delayedTask = taosOpenQueue();
  pTmq->qall = taosAllocateQall();

  taosThreadMutexInit(&pTmq->lock, NULL);
  if (pTmq->clientTopics == NULL || pTmq->mqueue == NULL || pTmq->qall == NULL || pTmq->delayedTask == NULL ||
      conf->groupId[0] == 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    // pTmq->groupId has not been filled in yet, report the configured one
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(),
             conf->groupId);
    goto _failed;
  }

  // init status
  pTmq->status = TMQ_CONSUMER_STATUS__INIT;
  pTmq->pollCnt = 0;
  pTmq->epoch = 0;
  /*pTmq->epStatus = 0;*/
  /*pTmq->epSkipCnt = 0;*/

  // set conf (bounded copies, always NUL-terminated)
  tstrncpy(pTmq->clientId, conf->clientId, sizeof(pTmq->clientId));
  tstrncpy(pTmq->groupId, conf->groupId, sizeof(pTmq->groupId));
  pTmq->withTbName = conf->withTbName;
  pTmq->useSnapshot = conf->snapEnable;
  pTmq->autoCommit = conf->autoCommit;
  pTmq->autoCommitInterval = conf->autoCommitInterval;
  pTmq->commitCb = conf->commitCb;
  pTmq->commitCbUserParam = conf->commitCbUserParam;
  pTmq->resetOffsetCfg = conf->resetOffset;

  pTmq->hbBgEnable = conf->hbBgEnable;

  // assign consumerId
  pTmq->consumerId = tGenIdPI64();

  // init semaphore
  if (tsem_init(&pTmq->rspSem, 0, 0) != 0) {
    tscError("consumer:0x%" PRIx64 " setup failed since %s, consumer group %s", pTmq->consumerId, terrstr(),
             pTmq->groupId);
    goto _failed;
  }

  // init connection
  pTmq->pTscObj = taos_connect_internal(conf->ip, user, pass, NULL, NULL, conf->port, CONN_TYPE__TMQ);
  if (pTmq->pTscObj == NULL) {
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(), pTmq->groupId);
    // the semaphore is destroyed by tmqFreeImpl() below; destroying it here as well would destroy it twice
    goto _failed;
  }

  // Allocate the heartbeat timer argument before the object is published in the reference set,
  // so that an allocation failure can still be cleaned up through the plain _failed path.
  int64_t* pHbRefId = NULL;
  if (pTmq->hbBgEnable) {
    pHbRefId = taosMemoryMalloc(sizeof(int64_t));
    if (pHbRefId == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(),
               pTmq->groupId);
      goto _failed;
    }
  }

  pTmq->refId = taosAddRef(tmqMgmt.rsetId, pTmq);
  if (pTmq->refId < 0) {
    taosMemoryFree(pHbRefId);
    goto _failed;
  }

  if (pHbRefId != NULL) {
    *pHbRefId = pTmq->refId;
    pTmq->hbLiveTimer = taosTmrStart(tmqSendHbReq, 1000, pHbRefId, tmqMgmt.timer);
  }

  char         buf[80] = {0};
  STqOffsetVal offset = {.type = pTmq->resetOffsetCfg};
  tFormatOffset(buf, tListLen(buf), &offset);
  tscInfo("consumer:0x%" PRIx64 " is setup, refId:%"PRId64", groupId:%s, snapshot:%d, autoCommit:%d, commitInterval:%dms, offset:%s, backgroudHB:%d",
          pTmq->consumerId, pTmq->refId, pTmq->groupId, pTmq->useSnapshot, pTmq->autoCommit, pTmq->autoCommitInterval, buf,
          pTmq->hbBgEnable);

  return pTmq;

_failed:
  tmqFreeImpl(pTmq);
  return NULL;
}

L
Liu Jicong 已提交
1122
// Subscribes the consumer to the topics in topic_list (an empty list unsubscribes from everything).
//
// The subscribe request is sent to the mnode and this call blocks until tmqSubscribeCb() reports the
// result. Afterwards the endpoints are requested with tmqAskEp(tmq, false), retrying every 500ms
// while the mnode answers TSDB_CODE_MND_CONSUMER_NOT_READY, and finally the ep timer and (when
// auto commit is enabled) the commit timer are started if they are not running yet.
//
// Returns 0 on success. On failure returns the error reported by the server, TSDB_CODE_OUT_OF_MEMORY
// for allocation failures, or -1 when the semaphore cannot be created or the mnode is still not
// ready after MAX_RETRY_COUNT retries.
int32_t tmq_subscribe(tmq_t* tmq, const tmq_list_t* topic_list) {
  const int32_t   MAX_RETRY_COUNT = 120 * 2;  // let's wait for 2 mins at most
  const SArray*   container = &topic_list->container;
  int32_t         sz = taosArrayGetSize(container);
  void*           buf = NULL;
  SMsgSendInfo*   sendInfo = NULL;
  SCMSubscribeReq req = {0};
  int32_t         code = 0;

  tscDebug("consumer:0x%" PRIx64 " cgroup:%s, subscribe %d topics", tmq->consumerId, tmq->groupId, sz);

  req.consumerId = tmq->consumerId;
  tstrncpy(req.clientId, tmq->clientId, 256);
  tstrncpy(req.cgroup, tmq->groupId, TSDB_CGROUP_LEN);
  req.topicNames = taosArrayInit(sz, sizeof(void*));

  if (req.topicNames == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  // convert every topic into its full name; the names are owned by req.topicNames
  for (int32_t i = 0; i < sz; i++) {
    char* topic = taosArrayGetP(container, i);

    SName name = {0};
    tNameSetDbName(&name, tmq->pTscObj->acctId, topic, strlen(topic));
    char* topicFName = taosMemoryCalloc(1, TSDB_TOPIC_FNAME_LEN);
    if (topicFName == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }

    tNameExtractFullName(&name, topicFName);
    tscDebug("consumer:0x%" PRIx64 " subscribe topic:%s", tmq->consumerId, topicFName);

    taosArrayPush(req.topicNames, &topicFName);
  }

  int32_t tlen = tSerializeSCMSubscribeReq(NULL, &req);

  buf = taosMemoryMalloc(tlen);
  if (buf == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  void* abuf = buf;
  tSerializeSCMSubscribeReq(&abuf, &req);

  sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  SMqSubscribeCbParam param = {
      .rspErr = 0,
      .refId = tmq->refId,
      .epoch = tmq->epoch,
  };

  if (tsem_init(&param.rspSem, 0, 0) != 0) {
    code = -1;  // must not be reported as success
    goto FAIL;
  }

  sendInfo->msgInfo = (SDataBuf){
      .pData = buf,
      .len = tlen,
      .handle = NULL,
  };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = &param;
  sendInfo->fp = tmqSubscribeCb;
  sendInfo->msgType = TDMT_MND_TMQ_SUBSCRIBE;

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

  // avoid double free if msg is sent
  buf = NULL;
  sendInfo = NULL;

  // param lives on this stack frame, so the response has to arrive before we leave
  tsem_wait(&param.rspSem);
  tsem_destroy(&param.rspSem);

  if (param.rspErr != 0) {
    code = param.rspErr;
    goto FAIL;
  }

  int32_t retryCnt = 0;
  while (TSDB_CODE_MND_CONSUMER_NOT_READY == tmqAskEp(tmq, false)) {
    if (retryCnt++ > MAX_RETRY_COUNT) {
      code = -1;  // giving up is a failure, not a success
      goto FAIL;
    }

    tscDebug("consumer:0x%" PRIx64 ", mnd not ready for subscribe, retry:%d in 500ms", tmq->consumerId, retryCnt);
    taosMsleep(500);
  }

  // init ep timer
  if (tmq->epTimer == NULL) {
    int64_t* pRefId1 = taosMemoryMalloc(sizeof(int64_t));
    if (pRefId1 == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }
    *pRefId1 = tmq->refId;
    tmq->epTimer = taosTmrStart(tmqAssignAskEpTask, 1000, pRefId1, tmqMgmt.timer);
  }

  // init auto commit timer
  if (tmq->autoCommit && tmq->commitTimer == NULL) {
    int64_t* pRefId2 = taosMemoryMalloc(sizeof(int64_t));
    if (pRefId2 == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }
    *pRefId2 = tmq->refId;
    tmq->commitTimer = taosTmrStart(tmqAssignDelayedCommitTask, tmq->autoCommitInterval, pRefId2, tmqMgmt.timer);
  }

FAIL:
  // shared exit for success and failure: buf/sendInfo are NULL once the message has been handed over
  taosArrayDestroyP(req.topicNames, taosMemoryFree);
  taosMemoryFree(buf);
  taosMemoryFree(sendInfo);

  return code;
}

L
Liu Jicong 已提交
1247
// Stores the commit callback and its user argument in the configuration.
// tmq_consumer_new() copies both into the consumer it creates from this configuration.
void tmq_conf_set_auto_commit_cb(tmq_conf_t* conf, tmq_commit_cb* cb, void* param) {
  conf->commitCbUserParam = param;
  conf->commitCb = cb;
}
1251

D
dapan1121 已提交
1252
// Response callback of a poll request.
//
// param : SMqPollCbParam of the request; always released here
// pMsg  : response buffers; pData is always released here, pEpSet is either released or handed over
//         to the queued response wrapper
// code  : result of the request
//
// On success the response is decoded into an SMqPollRspWrapper, pushed into tmq->mqueue and
// tmq->rspSem is posted; returns 0. A response from an earlier epoch is dropped (returns 0).
// On failure the vgroup is set back to TMQ_VG_STATUS__IDLE if the epoch is unchanged, tmq->rspSem is
// posted and -1 is returned. If the consumer no longer exists, terrno is set to
// TSDB_CODE_TMQ_CONSUMER_CLOSED and -1 is returned.
int32_t tmqPollCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqPollCbParam* pParam = (SMqPollCbParam*)param;

  int64_t         refId = pParam->refId;
  SMqClientVg*    pVg = pParam->pVg;
  SMqClientTopic* pTopic = pParam->pTopic;

  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) {
    tsem_destroy(&pParam->rspSem);
    taosMemoryFree(pParam);
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

  // copy what is needed out of the request parameter before it is released
  int32_t  epoch = pParam->epoch;
  int32_t  vgId = pParam->vgId;
  uint64_t requestId = pParam->requestId;

  taosMemoryFree(pParam);

  if (code != 0) {
    tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d, since %s, reqId:0x%" PRIx64, tmq->consumerId,
            vgId, epoch, tstrerror(code), requestId);

    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);

    // in case of consumer mismatch, wait for 500ms and retry
    if (code == TSDB_CODE_TMQ_CONSUMER_MISMATCH) {
      taosMsleep(500);
      atomic_store_8(&tmq->status, TMQ_CONSUMER_STATUS__RECOVER);
      tscDebug("consumer:0x%" PRIx64" wait for the re-balance, wait for 500ms and set status to be RECOVER", tmq->consumerId);
    } else if (code == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
      // queue an end marker for this case
      SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
      if (pRspWrapper == NULL) {
        tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d since out of memory, reqId:0x%" PRIx64,
                tmq->consumerId, vgId, epoch, requestId);
        goto CREATE_MSG_FAIL;
      }

      pRspWrapper->tmqRspType = TMQ_MSG_TYPE__END_RSP;
      taosWriteQitem(tmq->mqueue, pRspWrapper);
    }

    goto CREATE_MSG_FAIL;
  }

  // the header is read below, so a missing or truncated payload must be rejected first
  if (pMsg->pData == NULL || (size_t)pMsg->len < sizeof(SMqRspHead)) {
    tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d since rsp is too short, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, epoch, requestId);
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    goto CREATE_MSG_FAIL;
  }

  int32_t msgEpoch = ((SMqRspHead*)pMsg->pData)->epoch;
  int32_t tmqEpoch = atomic_load_32(&tmq->epoch);
  if (msgEpoch < tmqEpoch) {
    // do not write into queue since updating epoch reset
    tscWarn("consumer:0x%" PRIx64 " msg discard from vgId:%d since from earlier epoch, rsp epoch %d, current epoch %d, reqId:0x%"PRIx64,
            tmq->consumerId, vgId, msgEpoch, tmqEpoch, requestId);

    tsem_post(&tmq->rspSem);
    taosReleaseRef(tmqMgmt.rsetId, refId);

    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    return 0;
  }

  if (msgEpoch != tmqEpoch) {
    tscWarn("consumer:0x%" PRIx64 " mismatch rsp from vgId:%d, epoch %d, current epoch %d, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, msgEpoch, tmqEpoch, requestId);
  }

  // handle meta rsp
  int8_t rspType = ((SMqRspHead*)pMsg->pData)->mqMsgType;

  SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
  if (pRspWrapper == NULL) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    tscWarn("consumer:0x%"PRIx64" msg discard from vgId:%d, epoch %d since out of memory", tmq->consumerId, vgId, epoch);
    goto CREATE_MSG_FAIL;
  }

  pRspWrapper->tmqRspType = rspType;
  pRspWrapper->vgHandle = pVg;
  pRspWrapper->topicHandle = pTopic;
  pRspWrapper->reqId = requestId;
  pRspWrapper->pEpset = pMsg->pEpSet;  // ownership of the epset moves to the wrapper
  pRspWrapper->vgId = pVg->vgId;

  pMsg->pEpSet = NULL;
  if (rspType == TMQ_MSG_TYPE__POLL_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSMqDataRsp(&decoder, &pRspWrapper->dataRsp);
    tDecoderClear(&decoder);
    // the raw header bytes are copied over the start of the decoded response
    memcpy(&pRspWrapper->dataRsp, pMsg->pData, sizeof(SMqRspHead));

    char buf[80];
    tFormatOffset(buf, 80, &pRspWrapper->dataRsp.rspOffset);
    tscDebug("consumer:0x%" PRIx64 " recv poll rsp, vgId:%d, req:%" PRId64 ", rsp:%s type %d, reqId:0x%" PRIx64,
             tmq->consumerId, vgId, pRspWrapper->dataRsp.reqOffset.version, buf, rspType, requestId);
  } else if (rspType == TMQ_MSG_TYPE__POLL_META_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSMqMetaRsp(&decoder, &pRspWrapper->metaRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->metaRsp, pMsg->pData, sizeof(SMqRspHead));
  } else if (rspType == TMQ_MSG_TYPE__TAOSX_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSTaosxRsp(&decoder, &pRspWrapper->taosxRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->taosxRsp, pMsg->pData, sizeof(SMqRspHead));
  } else { // invalid rspType
    tscError("consumer:0x%"PRIx64" invalid rsp msg received, type:%d ignored", tmq->consumerId, rspType);
  }

  taosMemoryFree(pMsg->pData);
  taosWriteQitem(tmq->mqueue, pRspWrapper);

  tscDebug("consumer:0x%" PRIx64 " put poll res into mqueue, type:%d, vgId:%d, total in queue:%d, reqId:0x%" PRIx64,
           tmq->consumerId, rspType, vgId, tmq->mqueue->numOfItems, requestId);

  tsem_post(&tmq->rspSem);
  taosReleaseRef(tmqMgmt.rsetId, refId);

  return 0;

CREATE_MSG_FAIL:
  // epoch is read atomically, like every other read of tmq->epoch in the response callbacks
  if (epoch == atomic_load_32(&tmq->epoch)) {
    atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
  }

  tsem_post(&tmq->rspSem);
  taosReleaseRef(tmqMgmt.rsetId, refId);

  return -1;
}

H
Haojun Liao 已提交
1390 1391 1392 1393 1394
// Progress of one vgroup, saved by tmqUpdateEp() in a hash map keyed by the topic/vgroup key and
// read back by initClientTopicFromRsp() when the client topic list is rebuilt.
typedef struct SVgroupSaveInfo {
  STqOffsetVal offset;  // copy of SMqClientVg.currentOffset
  int64_t      numOfRows;  // copy of SMqClientVg.numOfRows
} SVgroupSaveInfo;

H
Haojun Liao 已提交
1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411
// Fills pTopic from one topic entry of an ask-ep response.
//
// The schema is moved out of pTopicEp (its schema fields are reset afterwards). One SMqClientVg is
// created per vgroup of the entry; offset and row count are taken from pVgOffsetHashMap when the
// topic/vgroup key is present there, otherwise the offset type is tmq->resetOffsetCfg and the row
// count is 0.
static void initClientTopicFromRsp(SMqClientTopic* pTopic, SMqSubTopicEp* pTopicEp, SHashObj* pVgOffsetHashMap,
                                   tmq_t* tmq) {
  // take over the schema so that it is not released together with the response
  pTopic->schema = pTopicEp->schema;
  pTopicEp->schema.nCols = 0;
  pTopicEp->schema.pSchema = NULL;

  tstrncpy(pTopic->topicName, pTopicEp->topic, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pTopic->db, pTopicEp->db, TSDB_DB_FNAME_LEN);

  const int32_t numOfVgs = taosArrayGetSize(pTopicEp->vgs);
  tscDebug("consumer:0x%" PRIx64 ", update topic:%s, numOfVgs:%d", tmq->consumerId, pTopic->topicName, numOfVgs);
  pTopic->vgs = taosArrayInit(numOfVgs, sizeof(SMqClientVg));

  char key[TSDB_TOPIC_FNAME_LEN + 22];
  for (int32_t idx = 0; idx < numOfVgs; ++idx) {
    SMqSubVgEp* pEp = taosArrayGet(pTopicEp->vgs, idx);

    makeTopicVgroupKey(key, pTopic->topicName, pEp->vgId);
    SVgroupSaveInfo* pSaved = taosHashGet(pVgOffsetHashMap, key, strlen(key));

    // every field that is not set below stays zero
    SMqClientVg vg = {0};
    vg.vgId = pEp->vgId;
    vg.epSet = pEp->epSet;
    vg.vgStatus = TMQ_VG_STATUS__IDLE;

    if (pSaved == NULL) {
      vg.currentOffset.type = tmq->resetOffsetCfg;
    } else {
      vg.currentOffset = pSaved->offset;
      vg.numOfRows = pSaved->numOfRows;
    }

    taosArrayPush(pTopic->vgs, &vg);
  }
}

static void freeClientVgInfo(void* param) {
  SMqClientTopic* pTopic = param;
  if (pTopic->schema.nCols) {
    taosMemoryFreeClear(pTopic->schema.pSchema);
  }

  taosArrayDestroy(pTopic->vgs);
}

// Replaces the consumer's topic list with the one from an ask-ep response.
//
// The offset and row count of every vgroup currently known are remembered under its topic/vgroup
// key, the new topic list is built from pRsp (reusing the remembered progress), and the list is
// swapped in while holding tmq->lock. Finally the status becomes NO_TOPIC or READY, depending on
// whether the response contains topics, and the epoch is stored.
//
// Always returns false (also when a container cannot be allocated).
static bool tmqUpdateEp(tmq_t* tmq, int32_t epoch, const SMqAskEpRsp* pRsp) {
  const int32_t numOfOldTopics = taosArrayGetSize(tmq->clientTopics);
  const int32_t numOfNewTopics = taosArrayGetSize(pRsp->topics);

  tscDebug("consumer:0x%" PRIx64 " update ep epoch from %d to epoch %d, incoming topics:%d, existed topics:%d",
           tmq->consumerId, tmq->epoch, epoch, numOfNewTopics, numOfOldTopics);

  SArray* pNewTopics = taosArrayInit(numOfNewTopics, sizeof(SMqClientTopic));
  if (pNewTopics == NULL) {
    return false;
  }

  SHashObj* pSavedProgress = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
  if (pSavedProgress == NULL) {
    taosArrayDestroy(pNewTopics);
    return false;
  }

  // todo extract method
  // step 1: remember the progress of all vgroups of the current topics
  char key[TSDB_TOPIC_FNAME_LEN + 22];
  for (int32_t t = 0; t < numOfOldTopics; ++t) {
    SMqClientTopic* pOldTopic = taosArrayGet(tmq->clientTopics, t);
    if (pOldTopic->vgs == NULL) {
      continue;
    }

    int32_t numOfVgs = taosArrayGetSize(pOldTopic->vgs);
    tscDebug("consumer:0x%" PRIx64 ", new vg num: %d", tmq->consumerId, numOfVgs);

    for (int32_t v = 0; v < numOfVgs; ++v) {
      SMqClientVg* pOldVg = taosArrayGet(pOldTopic->vgs, v);
      makeTopicVgroupKey(key, pOldTopic->topicName, pOldVg->vgId);

      char offsetStr[80];
      tFormatOffset(offsetStr, 80, &pOldVg->currentOffset);
      tscDebug("consumer:0x%" PRIx64 ", epoch:%d vgId:%d vgKey:%s, offset:%s", tmq->consumerId, epoch,
               pOldVg->vgId, key, offsetStr);

      SVgroupSaveInfo saved = {.offset = pOldVg->currentOffset, .numOfRows = pOldVg->numOfRows};
      taosHashPut(pSavedProgress, key, strlen(key), &saved, sizeof(SVgroupSaveInfo));
    }
  }

  // step 2: build the new topic list from the response
  for (int32_t t = 0; t < numOfNewTopics; ++t) {
    SMqClientTopic newTopic = {0};
    initClientTopicFromRsp(&newTopic, taosArrayGet(pRsp->topics, t), pSavedProgress, tmq);
    taosArrayPush(pNewTopics, &newTopic);
  }

  taosHashCleanup(pSavedProgress);

  // step 3: swap the lists under the consumer lock, destroying the current buffered topics info
  taosThreadMutexLock(&tmq->lock);
  if (tmq->clientTopics) {
    taosArrayDestroyEx(tmq->clientTopics, freeClientVgInfo);
  }
  tmq->clientTopics = pNewTopics;
  taosThreadMutexUnlock(&tmq->lock);

  // step 4: publish status and epoch
  int8_t status = TMQ_CONSUMER_STATUS__READY;
  if (numOfNewTopics == 0) {
    status = TMQ_CONSUMER_STATUS__NO_TOPIC;
  }
  atomic_store_8(&tmq->status, status);
  atomic_store_32(&tmq->epoch, epoch);

  tscDebug("consumer:0x%" PRIx64 " update topic info completed", tmq->consumerId);
  return false;
}

H
Haojun Liao 已提交
1516
// Response callback of an ask-ep request.
//
// param : SMqAskEpCbParam of the request. When param->async is set it is released here; otherwise
//         param->rspSem is posted at the end and the parameter is left to the caller.
// pMsg  : response buffers, pData and pEpSet are released here
// code  : result of the request, stored into param->code
//
// A response whose epoch is not newer than the local one is ignored, except that a consumer in
// RECOVER status is switched to NO_TOPIC/READY according to the topics in the response. A newer
// epoch is applied directly with tmqUpdateEp() for synchronous requests; for asynchronous requests
// it is decoded into an SMqAskEpRspWrapper that is queued in tmq->mqueue.
//
// Returns code (-1 if the wrapper cannot be allocated), or -1 with terrno set to
// TSDB_CODE_TMQ_CONSUMER_CLOSED if the consumer no longer exists.
static int32_t tmqAskEpCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqAskEpCbParam* pCbParam = (SMqAskEpCbParam*)param;
  const int8_t     isAsync = pCbParam->async;

  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, pCbParam->refId);
  if (tmq == NULL) {
    if (isAsync) {
      taosMemoryFree(pCbParam);
    } else {
      tsem_destroy(&pCbParam->rspSem);
    }
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

  pCbParam->code = code;
  if (code != TSDB_CODE_SUCCESS) {
    tscError("consumer:0x%" PRIx64 ", get topic endpoint error, async:%d, code:%s", tmq->consumerId, pCbParam->async,
             tstrerror(code));
    goto END;
  }

  // tmq's epoch is monotonically increase,
  // so it's safe to discard any old epoch msg.
  // Epoch will only increase when received newer epoch ep msg
  SMqRspHead* pHead = pMsg->pData;
  void*       pBody = POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead));
  int32_t     localEpoch = atomic_load_32(&tmq->epoch);

  if (pHead->epoch <= localEpoch) {
    tscDebug("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, no need to update local ep",
             tmq->consumerId, pHead->epoch, localEpoch);

    if (tmq->status == TMQ_CONSUMER_STATUS__RECOVER) {
      // leave the RECOVER status even though the endpoints themselves are unchanged
      SMqAskEpRsp rsp;
      tDecodeSMqAskEpRsp(pBody, &rsp);
      int8_t status = (taosArrayGetSize(rsp.topics) == 0) ? TMQ_CONSUMER_STATUS__NO_TOPIC : TMQ_CONSUMER_STATUS__READY;
      atomic_store_8(&tmq->status, status);
      tDeleteSMqAskEpRsp(&rsp);
    }

    goto END;
  }

  tscDebug("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, update local ep", tmq->consumerId,
           pHead->epoch, localEpoch);

  if (isAsync) {
    // queue the decoded response in mqueue
    SMqAskEpRspWrapper* pEpWrapper = taosAllocateQitem(sizeof(SMqAskEpRspWrapper), DEF_QITEM, 0);
    if (pEpWrapper == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      code = -1;
      goto END;
    }

    pEpWrapper->tmqRspType = TMQ_MSG_TYPE__EP_RSP;
    pEpWrapper->epoch = pHead->epoch;
    memcpy(&pEpWrapper->msg, pMsg->pData, sizeof(SMqRspHead));
    tDecodeSMqAskEpRsp(pBody, &pEpWrapper->msg);

    taosWriteQitem(tmq->mqueue, pEpWrapper);
    tsem_post(&tmq->rspSem);
  } else {
    // synchronous request: apply the new endpoints right away
    SMqAskEpRsp rsp;
    tDecodeSMqAskEpRsp(pBody, &rsp);
    tmqUpdateEp(tmq, pHead->epoch, &rsp);
    tDeleteSMqAskEpRsp(&rsp);
  }

END:
  taosReleaseRef(tmqMgmt.rsetId, pCbParam->refId);

  if (isAsync) {
    taosMemoryFree(pCbParam);
  } else {
    tsem_post(&pCbParam->rspSem);
  }

  taosMemoryFree(pMsg->pEpSet);
  taosMemoryFree(pMsg->pData);
  return code;
}

L
Liu Jicong 已提交
1598
// Fill a poll request for one vgroup of one topic.
//
// pReq    - request to populate (caller-owned)
// tmq     - consumer whose group id, epoch and options are copied into the request
// timeout - poll timeout forwarded to the server unchanged
// pTopic  - topic being polled; its name becomes the second half of the subscribe key
// pVg     - target vgroup; provides the vgId and the offset to resume from
void tmqBuildConsumeReqImpl(SMqPollReq* pReq, tmq_t* tmq, int64_t timeout, SMqClientTopic* pTopic, SMqClientVg* pVg) {
  // subscribe key layout: <groupId><TMQ_SEPARATOR><topicName>
  // NOTE(review): the copy is not bounded by the size of pReq->subKey; it assumes the
  // group id plus separator plus topic name always fits -- confirm against the struct.
  int32_t groupLen = (int32_t)strlen(tmq->groupId);
  memcpy(pReq->subKey, tmq->groupId, groupLen);
  pReq->subKey[groupLen] = TMQ_SEPARATOR;
  strcpy(pReq->subKey + groupLen + 1, pTopic->topicName);

  // consumer level settings
  pReq->withTbName = tmq->withTbName;
  pReq->consumerId = tmq->consumerId;
  pReq->timeout = timeout;
  pReq->epoch = tmq->epoch;
  pReq->useSnapshot = tmq->useSnapshot;

  // vgroup level settings: resume from the offset recorded for this vgroup
  pReq->reqOffset = pVg->currentOffset;
  pReq->head.vgId = pVg->vgId;

  pReq->reqId = generateRequestId();
}

L
Liu Jicong 已提交
1615 1616
// Build the user-visible meta result object from a queued poll response.
//
// The topic name, db name and vgId are taken from the handles stored in the wrapper and
// the meta response is copied by value (shallow memcpy) into the new object.
//
// Returns the new object, or NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY when the
// allocation fails.
SMqMetaRspObj* tmqBuildMetaRspFromWrapper(SMqPollRspWrapper* pWrapper) {
  SMqMetaRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqMetaRspObj));
  if (pRspObj == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ_META;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;

  // shallow copy: any pointer inside metaRsp is now shared with the new object
  memcpy(&pRspObj->metaRsp, &pWrapper->metaRsp, sizeof(SMqMetaRsp));
  return pRspObj;
}

1626
// Build the user-visible data result object from a queued poll response.
//
// pWrapper  - queued poll response; its dataRsp is copied by value (shallow memcpy)
// pVg       - vgroup the response belongs to; its numOfRows counter is increased by the
//             number of rows found in this response
// numOfRows - [out] number of rows contained in this response; always written
//
// Returns the new object, or NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY when the
// allocation fails (in that case *numOfRows is 0 and pVg is left untouched).
SMqRspObj* tmqBuildRspFromWrapper(SMqPollRspWrapper* pWrapper, SMqClientVg* pVg, int64_t* numOfRows) {
  (*numOfRows) = 0;

  SMqRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqRspObj));
  if (pRspObj == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);

  pRspObj->vgId = pWrapper->vgHandle->vgId;
  pRspObj->resIter = -1;  // no block has been fetched from this result yet
  memcpy(&pRspObj->rsp, &pWrapper->dataRsp, sizeof(SMqDataRsp));

  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;

  // when the response does not carry its own schema, use the one stored with the topic
  if (!pWrapper->dataRsp.withSchema) {
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }

  // extract the rows in this data packet
  for (int32_t i = 0; i < pRspObj->rsp.blockNum; ++i) {
    SRetrieveTableRsp* pRetrieve = (SRetrieveTableRsp*)taosArrayGetP(pRspObj->rsp.blockData, i);
    int64_t            rows = htobe64(pRetrieve->numOfRows);
    pVg->numOfRows += rows;
    (*numOfRows) += rows;
  }

  return pRspObj;
}

L
Liu Jicong 已提交
1656 1657
// Build the user-visible "meta + data" result object from a queued taosx poll response.
//
// The taosx response is copied by value (shallow memcpy) into the new object.
//
// Returns the new object, or NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY when the
// allocation fails.
SMqTaosxRspObj* tmqBuildTaosxRspFromWrapper(SMqPollRspWrapper* pWrapper) {
  SMqTaosxRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqTaosxRspObj));
  if (pRspObj == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ_METADATA;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;
  pRspObj->resIter = -1;  // no block has been fetched from this result yet
  memcpy(&pRspObj->rsp, &pWrapper->taosxRsp, sizeof(STaosxRsp));

  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;

  // when the response does not carry its own schema, use the one stored with the topic
  if (!pWrapper->taosxRsp.withSchema) {
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }

  return pRspObj;
}

1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706
// Common failure path used before a poll request has been handed to the transport.
// Always returns -1.
static int32_t handleErrorBeforePoll(SMqClientVg* pVg, tmq_t* pTmq) {
  const int32_t failed = -1;

  // the vgroup was marked as waiting by the caller; put it back so it can be polled again
  atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);

  // wake up the thread blocked on the consumer's response semaphore
  tsem_post(&pTmq->rspSem);

  return failed;
}

// Serialize and send one poll request to a single vgroup.
//
// pTmq    - consumer issuing the poll
// pTopic  - topic being polled
// pVg     - target vgroup
// timeout - poll timeout forwarded to the server
//
// Returns TSDB_CODE_SUCCESS once the request has been handed to the transport. On any
// failure before that point every local allocation is released and the result of
// handleErrorBeforePoll() (-1) is returned.
static int32_t doTmqPollImpl(tmq_t* pTmq, SMqClientTopic* pTopic, SMqClientVg* pVg, int64_t timeout) {
  SMqPollReq req = {0};
  tmqBuildConsumeReqImpl(&req, pTmq, timeout, pTopic, pVg);

  // first pass only computes the encoded size
  int32_t msgSize = tSerializeSMqPollReq(NULL, 0, &req);
  if (msgSize < 0) {
    return handleErrorBeforePoll(pVg, pTmq);
  }

  char* msg = taosMemoryCalloc(1, msgSize);
  if (NULL == msg) {
    return handleErrorBeforePoll(pVg, pTmq);
  }

  if (tSerializeSMqPollReq(msg, msgSize, &req) < 0) {
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  // zero-initialized so that any field not assigned below has a defined value
  SMqPollCbParam* pParam = taosMemoryCalloc(1, sizeof(SMqPollCbParam));
  if (pParam == NULL) {
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  pParam->refId = pTmq->refId;
  pParam->epoch = pTmq->epoch;
  pParam->pVg = pVg;  // TODO: pVg may be released before the callback runs, fix it
  pParam->pTopic = pTopic;
  pParam->vgId = pVg->vgId;
  pParam->requestId = req.reqId;

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pParam);
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  sendInfo->msgInfo = (SDataBuf){
      .pData = msg,
      .len = msgSize,
      .handle = NULL,
  };

  sendInfo->requestId = req.reqId;
  sendInfo->requestObjRefId = 0;
  sendInfo->param = pParam;
  sendInfo->fp = tmqPollCb;
  sendInfo->msgType = TDMT_VND_TMQ_CONSUME;

  int64_t transporterId = 0;
  char    offsetFormatBuf[80];
  tFormatOffset(offsetFormatBuf, tListLen(offsetFormatBuf), &pVg->currentOffset);

  tscDebug("consumer:0x%" PRIx64 " send poll to %s vgId:%d, epoch %d, req:%s, reqId:0x%" PRIx64,
           pTmq->consumerId, pTopic->topicName, pVg->vgId, pTmq->epoch, offsetFormatBuf, req.reqId);

  // NOTE(review): the return value of the send is ignored here; presumably failures are
  // reported through the callback -- confirm.
  asyncSendMsgToServer(pTmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, sendInfo);

  pVg->pollCnt++;
  pTmq->pollCnt++;

  return TSDB_CODE_SUCCESS;
}

1745
// broadcast the poll request to all related vnodes
H
Haojun Liao 已提交
1746
static int32_t tmqPollImpl(tmq_t* tmq, int64_t timeout) {
1747
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
X
Xiaoyu Wang 已提交
1748
  tscDebug("consumer:0x%" PRIx64 " start to poll data, numOfTopics:%d", tmq->consumerId, numOfTopics);
1749 1750

  for (int i = 0; i < numOfTopics; i++) {
X
Xiaoyu Wang 已提交
1751
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
X
Xiaoyu Wang 已提交
1752
    int32_t         numOfVg = taosArrayGetSize(pTopic->vgs);
1753 1754

    for (int j = 0; j < numOfVg; j++) {
X
Xiaoyu Wang 已提交
1755
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);
1756
      if (taosGetTimestampMs() - pVg->emptyBlockReceiveTs < EMPTY_BLOCK_POLL_IDLE_DURATION) { // less than 100ms
1757
        tscTrace("consumer:0x%" PRIx64 " epoch %d, vgId:%d idle for 10ms before start next poll", tmq->consumerId, tmq->epoch,
H
Haojun Liao 已提交
1758
                 pVg->vgId);
H
Haojun Liao 已提交
1759 1760 1761
        continue;
      }

1762
      int32_t vgStatus = atomic_val_compare_exchange_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE, TMQ_VG_STATUS__WAIT);
1763
      if (vgStatus == TMQ_VG_STATUS__WAIT) {
L
Liu Jicong 已提交
1764
        int32_t vgSkipCnt = atomic_add_fetch_32(&pVg->vgSkipCnt, 1);
H
Haojun Liao 已提交
1765
        tscTrace("consumer:0x%" PRIx64 " epoch %d wait poll-rsp, skip vgId:%d skip cnt %d", tmq->consumerId, tmq->epoch,
X
Xiaoyu Wang 已提交
1766
                 pVg->vgId, vgSkipCnt);
X
Xiaoyu Wang 已提交
1767
        continue;
L
temp  
Liu Jicong 已提交
1768 1769 1770 1771
#if 0
        if (skipCnt < 30000) {
          continue;
        } else {
1772
        tscDebug("consumer:0x%" PRIx64 ",skip vgId:%d skip too much reset", tmq->consumerId, pVg->vgId);
L
temp  
Liu Jicong 已提交
1773 1774
        }
#endif
X
Xiaoyu Wang 已提交
1775
      }
1776

L
Liu Jicong 已提交
1777
      atomic_store_32(&pVg->vgSkipCnt, 0);
1778 1779 1780
      int32_t code = doTmqPollImpl(tmq, pTopic, pVg, timeout);
      if (code != TSDB_CODE_SUCCESS) {
        return code;
D
dapan1121 已提交
1781
      }
X
Xiaoyu Wang 已提交
1782 1783
    }
  }
1784

1785
  tscDebug("consumer:0x%" PRIx64 " end to poll data", tmq->consumerId);
X
Xiaoyu Wang 已提交
1786 1787 1788
  return 0;
}

H
Haojun Liao 已提交
1789
// Handle a queued response that is not a poll response. Only endpoint (EP) responses
// are supported.
//
// tmq        - consumer owning the queue
// rspWrapper - queued item; its content is released here, the queue item itself is
//              released by the caller
// pReset     - [out] true when the consumer's endpoint information was updated from a
//              newer epoch, false otherwise
//
// Returns 0 for an EP response, -1 for any other message type.
static int32_t tmqHandleNoPollRsp(tmq_t* tmq, SMqRspWrapper* rspWrapper, bool* pReset) {
  // make sure the out-parameter is defined on every path
  *pReset = false;

  if (rspWrapper->tmqRspType != TMQ_MSG_TYPE__EP_RSP) {
    return -1;
  }

  if (rspWrapper->epoch > atomic_load_32(&tmq->epoch)) {
    // the response is newer than what the consumer knows: apply it
    SMqAskEpRspWrapper* pEpRspWrapper = (SMqAskEpRspWrapper*)rspWrapper;
    SMqAskEpRsp*        rspMsg = &pEpRspWrapper->msg;
    tmqUpdateEp(tmq, rspWrapper->epoch, rspMsg);
    tDeleteSMqAskEpRsp(rspMsg);
    *pReset = true;
  } else {
    // stale response: just release its content
    tmqFreeRspWrapper(rspWrapper);
  }

  return 0;
}

H
Haojun Liao 已提交
1809
// Drain the consumer's response queue until a result can be handed to the user.
//
// tmq         - consumer whose queue is processed
// timeout     - forwarded to tmqPollImpl() when a re-poll is triggered
// pollIfReset - when true, a new poll round is started after an endpoint update
//
// Returns a newly built result object (data, meta or taosx), or NULL when the queue is
// empty. NULL is also returned, with terrno set to TSDB_CODE_TQ_NO_COMMITTED_OFFSET,
// when an END response is found.
//
// Responses whose epoch differs from the consumer's current epoch are discarded.
static void* tmqHandleAllRsp(tmq_t* tmq, int64_t timeout, bool pollIfReset) {
  tscDebug("consumer:0x%" PRIx64 " start to handle the rsp, total:%d", tmq->consumerId, tmq->qall->numOfItems);

  while (1) {
    SMqRspWrapper* pRspWrapper = NULL;
    taosGetQitem(tmq->qall, (void**)&pRspWrapper);

    if (pRspWrapper == NULL) {
      // local batch exhausted: move everything pending in the shared queue and retry once
      taosReadAllQitems(tmq->mqueue, tmq->qall);
      taosGetQitem(tmq->qall, (void**)&pRspWrapper);
      if (pRspWrapper == NULL) {
        return NULL;
      }
    }

    tscDebug("consumer:0x%" PRIx64 " handle rsp, type:%d", tmq->consumerId, pRspWrapper->tmqRspType);

    if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__END_RSP) {
      taosFreeQitem(pRspWrapper);
      terrno = TSDB_CODE_TQ_NO_COMMITTED_OFFSET;
      tscError("consumer:0x%" PRIx64 " unexpected rsp from poll, code:%s", tmq->consumerId, tstrerror(terrno));
      return NULL;
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;

      int32_t     consumerEpoch = atomic_load_32(&tmq->epoch);
      SMqDataRsp* pDataRsp = &pollRspWrapper->dataRsp;

      if (pDataRsp->head.epoch == consumerEpoch) {
        SMqClientVg* pVg = pollRspWrapper->vgHandle;

        // update the epset
        // NOTE(review): pEpset is only copied here; on the "build rsp" path below it is
        // not visibly released -- confirm who owns it.
        if (pollRspWrapper->pEpset != NULL) {
          SEp* pEp = GET_ACTIVE_EP(pollRspWrapper->pEpset);
          SEp* pOld = GET_ACTIVE_EP(&(pVg->epSet));
          tscDebug("consumer:0x%" PRIx64 " update epset vgId:%d, ep:%s:%d, old ep:%s:%d", tmq->consumerId,
                   pVg->vgId, pEp->fqdn, pEp->port, pOld->fqdn, pOld->port);
          pVg->epSet = *pollRspWrapper->pEpset;
        }

        // update the local offset value only for the returned values.
        pVg->currentOffset = pDataRsp->rspOffset;
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);

        char buf[80];
        tFormatOffset(buf, 80, &pDataRsp->rspOffset);
        if (pDataRsp->blockNum == 0) {
          tscDebug("consumer:0x%" PRIx64 " empty block received, vgId:%d, offset:%s, vg total:%" PRId64
                   " total:%" PRId64 " reqId:0x%" PRIx64,
                   tmq->consumerId, pVg->vgId, buf, pVg->numOfRows, tmq->totalRows, pollRspWrapper->reqId);
          // nothing to return: release the content, then the queue item, and keep draining
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
          taosFreeQitem(pollRspWrapper);
        } else {  // build rsp
          int64_t    numOfRows = 0;
          SMqRspObj* pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
          tmq->totalRows += numOfRows;

          tscDebug("consumer:0x%" PRIx64 " process poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
                   " vg total:%" PRId64 " total:%" PRId64 ", reqId:0x%" PRIx64,
                   tmq->consumerId, pVg->vgId, buf, pDataRsp->blockNum, numOfRows, pVg->numOfRows, tmq->totalRows,
                   pollRspWrapper->reqId);
          // the response content now belongs to pRsp; only the queue item is released
          taosFreeQitem(pollRspWrapper);
          return pRsp;
        }
      } else {
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgId, pDataRsp->head.epoch, consumerEpoch);
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
        taosFreeQitem(pollRspWrapper);
      }
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_META_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
      int32_t            consumerEpoch = atomic_load_32(&tmq->epoch);

      tscDebug("consumer:0x%" PRIx64 " process meta rsp", tmq->consumerId);

      if (pollRspWrapper->metaRsp.head.epoch == consumerEpoch) {
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
        pVg->currentOffset = pollRspWrapper->metaRsp.rspOffset;
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);

        // build rsp
        SMqMetaRspObj* pRsp = tmqBuildMetaRspFromWrapper(pollRspWrapper);
        taosFreeQitem(pollRspWrapper);
        return pRsp;
      } else {
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgId, pollRspWrapper->metaRsp.head.epoch, consumerEpoch);
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
        taosFreeQitem(pollRspWrapper);
      }
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__TAOSX_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
      int32_t            consumerEpoch = atomic_load_32(&tmq->epoch);

      if (pollRspWrapper->taosxRsp.head.epoch == consumerEpoch) {
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
        pVg->currentOffset = pollRspWrapper->taosxRsp.rspOffset;
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);

        if (pollRspWrapper->taosxRsp.blockNum == 0) {
          tscDebug("consumer:0x%" PRIx64 " taosx empty block received, vgId:%d, vg total:%" PRId64 " reqId:0x%" PRIx64,
                   tmq->consumerId, pVg->vgId, pVg->numOfRows, pollRspWrapper->reqId);
          // remember when the empty block arrived so the next poll to this vgroup is delayed
          pVg->emptyBlockReceiveTs = taosGetTimestampMs();
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
          taosFreeQitem(pollRspWrapper);
          continue;
        } else {
          pVg->emptyBlockReceiveTs = 0;  // reset the ts
        }

        // build rsp: plain data object when no table was created, taosx object otherwise
        void*   pRsp = NULL;
        int64_t numOfRows = 0;
        if (pollRspWrapper->taosxRsp.createTableNum == 0) {
          pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
        } else {
          pRsp = tmqBuildTaosxRspFromWrapper(pollRspWrapper);
        }

        tmq->totalRows += numOfRows;

        char buf[80];
        tFormatOffset(buf, 80, &pVg->currentOffset);
        tscDebug("consumer:0x%" PRIx64 " process taosx poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
                 ", vg total:%" PRId64 " total:%" PRId64 " reqId:0x%" PRIx64,
                 tmq->consumerId, pVg->vgId, buf, pollRspWrapper->taosxRsp.blockNum, numOfRows, pVg->numOfRows,
                 tmq->totalRows, pollRspWrapper->reqId);

        taosFreeQitem(pollRspWrapper);
        return pRsp;
      } else {
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgId, pollRspWrapper->taosxRsp.head.epoch, consumerEpoch);
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
        taosFreeQitem(pollRspWrapper);
      }
    } else {
      tscDebug("consumer:0x%" PRIx64 " not data msg received", tmq->consumerId);

      bool reset = false;
      tmqHandleNoPollRsp(tmq, pRspWrapper, &reset);
      taosFreeQitem(pRspWrapper);
      if (pollIfReset && reset) {
        tscDebug("consumer:0x%" PRIx64 ", reset and repoll", tmq->consumerId);
        tmqPollImpl(tmq, timeout);
      }
    }
  }
}

1959
// Poll the subscribed topics for the next result.
//
// tmq     - consumer handle
// timeout - maximum time to wait in milliseconds; a negative value waits until a result
//           arrives (the wait is re-armed every 1000 ms)
//
// Returns a result object, or NULL when
//   - the consumer is still in the INIT state (after sleeping 500 ms),
//   - the consumer is recovering and the mnode keeps answering "not ready" for more than
//     40 retries,
//   - terrno is TSDB_CODE_TQ_NO_COMMITTED_OFFSET after the response queue was drained, or
//   - the timeout elapsed without a result.
TAOS_RES* tmq_consumer_poll(tmq_t* tmq, int64_t timeout) {
  void*   rspObj = NULL;
  int64_t startTime = taosGetTimestampMs();

  tscDebug("consumer:0x%" PRIx64 " start to poll at %" PRId64 ", timeout:%" PRId64, tmq->consumerId, startTime,
           timeout);

  // in no topic status, delayed task also need to be processed
  if (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__INIT) {
    tscDebug("consumer:0x%" PRIx64 " poll return since consumer is init", tmq->consumerId);
    taosMsleep(500);  // sleep for a while
    return NULL;
  }

  // while recovering, keep asking the mnode for the endpoints until it is ready
  while (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__RECOVER) {
    int32_t retryCnt = 0;
    while (TSDB_CODE_MND_CONSUMER_NOT_READY == tmqAskEp(tmq, false)) {
      if (retryCnt++ > 40) {
        return NULL;
      }

      tscDebug("consumer:0x%" PRIx64 " not ready, retry:%d/40 in 500ms", tmq->consumerId, retryCnt);
      taosMsleep(500);
    }
  }

  while (1) {
    tmqHandleAllDelayedTask(tmq);

    // a failed poll round is only logged; responses already queued are still processed
    if (tmqPollImpl(tmq, timeout) < 0) {
      tscDebug("consumer:0x%" PRIx64 " return due to poll error", tmq->consumerId);
    }

    rspObj = tmqHandleAllRsp(tmq, timeout, false);
    if (rspObj) {
      tscDebug("consumer:0x%" PRIx64 " return rsp %p", tmq->consumerId, rspObj);
      return (TAOS_RES*)rspObj;
    } else if (terrno == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
      // NOTE(review): terrno is not cleared before the call above, so a value left over
      // from an earlier call also ends the poll here -- confirm this is intended.
      tscDebug("consumer:0x%" PRIx64 " return null since no committed offset", tmq->consumerId);
      return NULL;
    }

    if (timeout >= 0) {
      int64_t currentTime = taosGetTimestampMs();
      int64_t elapsedTime = currentTime - startTime;
      if (elapsedTime > timeout) {
        tscDebug("consumer:0x%" PRIx64 " (epoch %d) timeout, no rsp, start time %" PRId64 ", current time %" PRId64,
                 tmq->consumerId, tmq->epoch, startTime, currentTime);
        return NULL;
      }
      // wait for a response, but never longer than what is left of the timeout
      tsem_timewait(&tmq->rspSem, (timeout - elapsedTime));
    } else {
      // use tsem_timewait instead of tsem_wait to avoid unexpected stuck
      tsem_timewait(&tmq->rspSem, 1000);
    }
  }
}

2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035 2036 2037 2038
// Write the consumer's poll statistics to the debug log: overall counters first, then
// the number of rows received from every vgroup of every topic.
static void displayConsumeStatistics(const tmq_t* pTmq) {
  int32_t numOfTopics = taosArrayGetSize(pTmq->clientTopics);
  tscDebug("consumer:0x%" PRIx64 " closing poll:%" PRId64 " rows:%" PRId64 " topics:%d, final epoch:%d",
           pTmq->consumerId, pTmq->pollCnt, pTmq->totalRows, numOfTopics, pTmq->epoch);

  tscDebug("consumer:0x%" PRIx64 " rows dist begin: ", pTmq->consumerId);
  for (int32_t i = 0; i < numOfTopics; ++i) {
    SMqClientTopic* pTopics = taosArrayGet(pTmq->clientTopics, i);

    tscDebug("consumer:0x%" PRIx64 " topic:%d", pTmq->consumerId, i);
    int32_t numOfVgs = taosArrayGetSize(pTopics->vgs);
    for (int32_t j = 0; j < numOfVgs; ++j) {
      SMqClientVg* pVg = taosArrayGet(pTopics->vgs, j);
      tscDebug("topic:%s, %d. vgId:%d rows:%" PRId64, pTopics->topicName, j, pVg->vgId, pVg->numOfRows);
    }
  }

  tscDebug("consumer:0x%" PRIx64 " rows dist end", pTmq->consumerId);
}
2044

2045 2046 2047
// Close a consumer.
//
// When the consumer is in the READY state, pending offsets are committed first (only if
// auto commit is enabled) and the consumer then unsubscribes by subscribing to an empty
// topic list, retrying while the mnode answers "consumer not ready". In any other state
// the consumer is closed directly.
//
// Returns 0 on success. If the final commit fails its error code is returned and the
// consumer is NOT released.
int32_t tmq_consumer_close(tmq_t* tmq) {
  // status is written with atomic stores elsewhere, so read it atomically as well
  int8_t status = atomic_load_8(&tmq->status);

  tscDebug("consumer:0x%" PRIx64 " start to close consumer, status:%d", tmq->consumerId, status);
  displayConsumeStatistics(tmq);

  if (status == TMQ_CONSUMER_STATUS__READY) {
    // if auto commit is set, commit before close consumer. Otherwise, do nothing.
    if (tmq->autoCommit) {
      int32_t rsp = tmq_commit_sync(tmq, NULL);
      if (rsp != 0) {
        return rsp;
      }
    }

    // unsubscribe: subscribe to an empty list
    int32_t     retryCnt = 0;
    tmq_list_t* lst = tmq_list_new();
    while (1) {
      int32_t rsp = tmq_subscribe(tmq, lst);
      if (rsp != TSDB_CODE_MND_CONSUMER_NOT_READY || retryCnt > 5) {
        break;
      } else {
        retryCnt++;
        taosMsleep(500);
      }
    }

    tmq_list_destroy(lst);
  } else {
    tscWarn("consumer:0x%" PRIx64 " not in ready state, close it directly", tmq->consumerId);
  }

  taosRemoveRef(tmqMgmt.rsetId, tmq->refId);
  return 0;
}
L
Liu Jicong 已提交
2078

L
Liu Jicong 已提交
2079 2080
// Translate a TMQ return code into a readable message.
//
// 0 maps to "success" and -1 to "fail"; every other value is translated by tstrerror().
const char* tmq_err2str(int32_t err) {
  if (err == 0) {
    return "success";
  }

  if (err == -1) {
    return "fail";
  }

  return tstrerror(err);
}
L
Liu Jicong 已提交
2088

L
Liu Jicong 已提交
2089 2090 2091 2092 2093
// Classify a result returned by tmq_consumer_poll().
//
// Returns TMQ_RES_DATA, TMQ_RES_TABLE_META or TMQ_RES_METADATA according to the kind of
// result object, and TMQ_RES_INVALID for NULL or for any other object.
tmq_res_t tmq_get_res_type(TAOS_RES* res) {
  // the TD_RES_* checks presumably inspect the object itself, so reject NULL up front
  if (res == NULL) {
    return TMQ_RES_INVALID;
  }

  if (TD_RES_TMQ(res)) {
    return TMQ_RES_DATA;
  } else if (TD_RES_TMQ_META(res)) {
    return TMQ_RES_TABLE_META;
  } else if (TD_RES_TMQ_METADATA(res)) {
    return TMQ_RES_METADATA;
  } else {
    return TMQ_RES_INVALID;
  }
}

L
Liu Jicong 已提交
2101
// Return the topic name of a TMQ result with everything up to and including the first
// '.' removed. If the stored name contains no '.', the stored name is returned as is.
//
// Returns NULL when res is NULL or is not a TMQ result. The returned pointer refers to
// storage inside res and is valid only as long as res is.
const char* tmq_get_topic_name(TAOS_RES* res) {
  if (res == NULL) {
    return NULL;
  }

  const char* fullName = NULL;
  if (TD_RES_TMQ(res)) {
    fullName = ((SMqRspObj*)res)->topic;
  } else if (TD_RES_TMQ_META(res)) {
    fullName = ((SMqMetaRspObj*)res)->topic;
  } else if (TD_RES_TMQ_METADATA(res)) {
    fullName = ((SMqTaosxRspObj*)res)->topic;
  } else {
    return NULL;
  }

  // strchr() returns NULL when there is no '.'; never do arithmetic on that result
  const char* dot = strchr(fullName, '.');
  return (dot != NULL) ? dot + 1 : fullName;
}

L
Liu Jicong 已提交
2116 2117 2118 2119
// Return the database name of a TMQ result with everything up to and including the
// first '.' removed. If the stored name contains no '.', the stored name is returned as
// is.
//
// Returns NULL when res is NULL or is not a TMQ result. The returned pointer refers to
// storage inside res and is valid only as long as res is.
const char* tmq_get_db_name(TAOS_RES* res) {
  if (res == NULL) {
    return NULL;
  }

  const char* fullName = NULL;
  if (TD_RES_TMQ(res)) {
    fullName = ((SMqRspObj*)res)->db;
  } else if (TD_RES_TMQ_META(res)) {
    fullName = ((SMqMetaRspObj*)res)->db;
  } else if (TD_RES_TMQ_METADATA(res)) {
    fullName = ((SMqTaosxRspObj*)res)->db;
  } else {
    return NULL;
  }

  // strchr() returns NULL when there is no '.'; never do arithmetic on that result
  const char* dot = strchr(fullName, '.');
  return (dot != NULL) ? dot + 1 : fullName;
}

L
Liu Jicong 已提交
2131 2132 2133 2134
// Return the id of the vgroup a TMQ result came from, or -1 when res is NULL or is not
// a TMQ result.
int32_t tmq_get_vgroup_id(TAOS_RES* res) {
  if (res == NULL) {
    return -1;
  }

  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
    return pRspObj->vgId;
  } else if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)res;
    return pMetaRspObj->vgId;
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    return pRspObj->vgId;
  } else {
    return -1;
  }
}
L
Liu Jicong 已提交
2145 2146 2147 2148 2149 2150 2151 2152

// Return the table name of the block the result iterator currently points at.
//
// Returns NULL when res is NULL, when the result is neither a data nor a taosx result,
// when the response carries no table names, or when the iterator is outside
// [0, blockNum).
const char* tmq_get_table_name(TAOS_RES* res) {
  if (res == NULL) {
    return NULL;
  }

  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
    if (!pRspObj->rsp.withTbName || pRspObj->rsp.blockTbName == NULL || pRspObj->resIter < 0 ||
        pRspObj->resIter >= pRspObj->rsp.blockNum) {
      return NULL;
    }
    return (const char*)taosArrayGetP(pRspObj->rsp.blockTbName, pRspObj->resIter);
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    if (!pRspObj->rsp.withTbName || pRspObj->rsp.blockTbName == NULL || pRspObj->resIter < 0 ||
        pRspObj->resIter >= pRspObj->rsp.blockNum) {
      return NULL;
    }
    return (const char*)taosArrayGetP(pRspObj->rsp.blockTbName, pRspObj->resIter);
  }

  return NULL;
}
2164

L
Liu Jicong 已提交
2165
// Commit offsets asynchronously; cb is invoked with param once the commit has finished.
// Forwards to tmqCommitInner() with the automatic flag cleared and the async flag set.
void tmq_commit_async(tmq_t* tmq, const TAOS_RES* msg, tmq_commit_cb* cb, void* param) {
  tmqCommitInner(tmq, msg, 0, 1, cb, param);
}

2169
// Commit offsets synchronously and return the result of the commit.
// Forwards to tmqCommitInner() with both the automatic and the async flag cleared and
// without a callback.
int32_t tmq_commit_sync(tmq_t* tmq, const TAOS_RES* msg) {
  return tmqCommitInner(tmq, msg, 0, 0, NULL, NULL);
}
2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257 2258 2259 2260 2261

// Ask the mnode for the current endpoint (topic/vgroup) assignment of this consumer.
//
// tmq   - consumer handle
// async - false: block until the response callback has run and return its code;
//         true:  return right after the request has been sent; the callback parameter is
//                then owned (and released) by the callback
//
// Returns TSDB_CODE_SUCCESS (async) or the code stored by the callback (sync); -1 when
// the request could not be built.
int32_t tmqAskEp(tmq_t* tmq, bool async) {
  int32_t code = TSDB_CODE_SUCCESS;

  SMqAskEpReq req = {0};
  req.consumerId = tmq->consumerId;
  req.epoch = tmq->epoch;
  // NOTE(review): unbounded copy; assumes req.cgroup is at least as large as
  // tmq->groupId -- confirm against the struct definitions.
  strcpy(req.cgroup, tmq->groupId);

  // first pass only computes the encoded size
  int32_t tlen = tSerializeSMqAskEpReq(NULL, 0, &req);
  if (tlen < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq failed", tmq->consumerId);
    return -1;
  }

  void* pReq = taosMemoryCalloc(1, tlen);
  if (pReq == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc askEpReq msg, size:%d", tmq->consumerId, tlen);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (tSerializeSMqAskEpReq(pReq, tlen, &req) < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq %d failed", tmq->consumerId, tlen);
    taosMemoryFree(pReq);
    return -1;
  }

  SMqAskEpCbParam* pParam = taosMemoryCalloc(1, sizeof(SMqAskEpCbParam));
  if (pParam == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc subscribe param", tmq->consumerId);
    taosMemoryFree(pReq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  pParam->refId = tmq->refId;
  pParam->epoch = tmq->epoch;
  pParam->async = async;
  tsem_init(&pParam->rspSem, 0, 0);

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    tsem_destroy(&pParam->rspSem);
    taosMemoryFree(pParam);
    taosMemoryFree(pReq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  sendInfo->msgInfo = (SDataBuf){
      .pData = pReq,
      .len = tlen,
      .handle = NULL,
  };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = pParam;
  sendInfo->fp = tmqAskEpCb;
  sendInfo->msgType = TDMT_MND_TMQ_ASK_EP;

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);
  tscDebug("consumer:0x%" PRIx64 " ask ep from mnode, async:%d, reqId:0x%" PRIx64, tmq->consumerId, async,
           sendInfo->requestId);

  // NOTE(review): the return value of the send is ignored; in sync mode the wait below
  // relies on the callback always being invoked -- confirm.
  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

  if (!async) {
    // sync mode: the callback posts rspSem and leaves pParam to us
    tsem_wait(&pParam->rspSem);
    code = pParam->code;
    tsem_destroy(&pParam->rspSem);
    taosMemoryFree(pParam);
  }

  return code;
}

// Format "<topicName>:<vg>" into dst and return the number of characters written
// (not counting the terminating NUL). dst must be large enough; no bound is checked.
int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg) {
  const int32_t written = sprintf(dst, "%s:%d", topicName, vg);
  return written;
}

// Finish a commit after the last commit response has been received.
//
// Async commits: the registered callback is invoked (the consumer-level callback for
// automatic commits, the per-call user callback otherwise) and pParamSet is released.
// Sync commits: the waiter is woken through rspSem; pParamSet stays alive here.
//
// Returns 0 on success. If the consumer has already been closed, pParamSet is released,
// terrno is set to TSDB_CODE_TMQ_CONSUMER_CLOSED and -1 is returned.
int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet) {
  // keep a copy: pParamSet may be freed before the reference is released below
  int64_t refId = pParamSet->refId;

  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) {
    if (!pParamSet->async) {
      tsem_destroy(&pParamSet->rspSem);
    }
    taosMemoryFree(pParamSet);
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

  if (pParamSet->async) {
    // call async cb func
    if (pParamSet->automatic && tmq->commitCb) {
      tmq->commitCb(tmq, pParamSet->rspErr, tmq->commitCbUserParam);
    } else if (!pParamSet->automatic && pParamSet->userCb) {
      pParamSet->userCb(tmq, pParamSet->rspErr, pParamSet->userParam);
    }

    taosMemoryFree(pParamSet);
  } else {
    // sem post: wake up the thread waiting for the commit to finish
    tsem_post(&pParamSet->rspSem);
  }

  taosReleaseRef(tmqMgmt.rsetId, refId);
  return 0;
}

// Account for one received commit response. When the counter of outstanding responses
// reaches zero the commit is completed through tmqCommitDone().
//
// consumerId, pTopic and vgId are used for logging only.
void tmqCommitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId) {
  int32_t waitingRspNum = atomic_sub_fetch_32(&pParamSet->waitingRspNum, 1);
  if (waitingRspNum == 0) {
    tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d all commit-rsp received, commit completed", consumerId, pTopic,
             vgId);
    tmqCommitDone(pParamSet);
  } else {
    tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d commit-rsp received, remain:%d", consumerId, pTopic, vgId,
             waitingRspNum);
  }
}