clientTmq.c 72.6 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "cJSON.h"
17 18 19
#include "clientInt.h"
#include "clientLog.h"
#include "parser.h"
H
Haojun Liao 已提交
20
#include "tdatablock.h"
21 22
#include "tdef.h"
#include "tglobal.h"
X
Xiaoyu Wang 已提交
23
#include "tqueue.h"
24
#include "tref.h"
L
Liu Jicong 已提交
25 26
#include "ttimer.h"

27
#define EMPTY_BLOCK_POLL_IDLE_DURATION  10
28
#define DEFAULT_AUTO_COMMIT_INTERVAL    5000
29

30 31
typedef void (*__tmq_askep_fn_t)(tmq_t* pTmq, int32_t code, SDataBuf* pBuf, void* pParam);

X
Xiaoyu Wang 已提交
32
struct SMqMgmt {
33 34 35
  int8_t  inited;
  tmr_h   timer;
  int32_t rsetId;
36
};
L
Liu Jicong 已提交
37

X
Xiaoyu Wang 已提交
38 39
static TdThreadOnce   tmqInit = PTHREAD_ONCE_INIT;  // initialize only once
volatile int32_t      tmqInitRes = 0;               // initialize rsp code
40
static struct SMqMgmt tmqMgmt = {0};
41

L
Liu Jicong 已提交
42 43 44 45 46 47
typedef struct {
  int8_t  tmqRspType;
  int32_t epoch;
} SMqRspWrapper;

typedef struct {
L
Liu Jicong 已提交
48 49 50
  int8_t      tmqRspType;
  int32_t     epoch;
  SMqAskEpRsp msg;
L
Liu Jicong 已提交
51 52
} SMqAskEpRspWrapper;

L
Liu Jicong 已提交
53
struct tmq_list_t {
L
Liu Jicong 已提交
54
  SArray container;
L
Liu Jicong 已提交
55
};
L
Liu Jicong 已提交
56

L
Liu Jicong 已提交
57
struct tmq_conf_t {
58 59 60 61 62 63 64 65
  char           clientId[256];
  char           groupId[TSDB_CGROUP_LEN];
  int8_t         autoCommit;
  int8_t         resetOffset;
  int8_t         withTbName;
  int8_t         snapEnable;
  int32_t        snapBatchSize;
  bool           hbBgEnable;
66 67 68 69 70
  uint16_t       port;
  int32_t        autoCommitInterval;
  char*          ip;
  char*          user;
  char*          pass;
71
  tmq_commit_cb* commitCb;
L
Liu Jicong 已提交
72
  void*          commitCbUserParam;
L
Liu Jicong 已提交
73 74 75
};

struct tmq_t {
76 77 78 79 80 81 82 83 84 85
  int64_t        refId;
  char           groupId[TSDB_CGROUP_LEN];
  char           clientId[256];
  int8_t         withTbName;
  int8_t         useSnapshot;
  int8_t         autoCommit;
  int32_t        autoCommitInterval;
  int32_t        resetOffsetCfg;
  uint64_t       consumerId;
  bool           hbBgEnable;
L
Liu Jicong 已提交
86 87
  tmq_commit_cb* commitCb;
  void*          commitCbUserParam;
L
Liu Jicong 已提交
88 89 90 91

  // status
  int8_t  status;
  int32_t epoch;
L
Liu Jicong 已提交
92 93
#if 0
  int8_t  epStatus;
L
Liu Jicong 已提交
94
  int32_t epSkipCnt;
L
Liu Jicong 已提交
95
#endif
96 97 98
  // poll info
  int64_t       pollCnt;
  int64_t       totalRows;
L
Liu Jicong 已提交
99

L
Liu Jicong 已提交
100
  // timer
101 102 103 104
  tmr_h         hbLiveTimer;
  tmr_h         epTimer;
  tmr_h         reportTimer;
  tmr_h         commitTimer;
H
Haojun Liao 已提交
105 106 107 108 109 110
  STscObj*      pTscObj;       // connection
  SArray*       clientTopics;  // SArray<SMqClientTopic>
  STaosQueue*   mqueue;        // queue of rsp
  STaosQall*    qall;
  STaosQueue*   delayedTask;   // delayed task queue for heartbeat and auto commit
  tsem_t        rspSem;
L
Liu Jicong 已提交
111 112
};

113 114
typedef struct SAskEpInfo {
  int32_t code;
H
Haojun Liao 已提交
115
  tsem_t  sem;
116 117
} SAskEpInfo;

X
Xiaoyu Wang 已提交
118 119 120 121 122 123 124 125
enum {
  TMQ_VG_STATUS__IDLE = 0,
  TMQ_VG_STATUS__WAIT,
};

enum {
  TMQ_CONSUMER_STATUS__INIT = 0,
  TMQ_CONSUMER_STATUS__READY,
126
  TMQ_CONSUMER_STATUS__NO_TOPIC,
L
Liu Jicong 已提交
127
  TMQ_CONSUMER_STATUS__RECOVER,
L
Liu Jicong 已提交
128 129
};

L
Liu Jicong 已提交
130
enum {
131
  TMQ_DELAYED_TASK__ASK_EP = 1,
L
Liu Jicong 已提交
132 133 134 135
  TMQ_DELAYED_TASK__REPORT,
  TMQ_DELAYED_TASK__COMMIT,
};

L
Liu Jicong 已提交
136
typedef struct {
H
Haojun Liao 已提交
137
  int64_t      pollCnt;
138
  int64_t      numOfRows;
L
Liu Jicong 已提交
139 140
  STqOffsetVal committedOffset;
  STqOffsetVal currentOffset;
H
Haojun Liao 已提交
141 142 143
  int32_t      vgId;
  int32_t      vgStatus;
  int32_t      vgSkipCnt;
H
Haojun Liao 已提交
144
  int64_t      emptyBlockReceiveTs; // once empty block is received, idle for ignoreCnt then start to poll data
H
Haojun Liao 已提交
145
  SEpSet       epSet;
146 147
} SMqClientVg;

L
Liu Jicong 已提交
148
typedef struct {
149 150 151
  char           topicName[TSDB_TOPIC_FNAME_LEN];
  char           db[TSDB_DB_FNAME_LEN];
  SArray*        vgs;  // SArray<SMqClientVg>
L
Liu Jicong 已提交
152
  SSchemaWrapper schema;
153 154
} SMqClientTopic;

L
Liu Jicong 已提交
155 156
typedef struct {
  int8_t          tmqRspType;
157 158
  int32_t         epoch;         // epoch can be used to guard the vgHandle
  int32_t         vgId;
L
Liu Jicong 已提交
159 160
  SMqClientVg*    vgHandle;
  SMqClientTopic* topicHandle;
H
Haojun Liao 已提交
161
  uint64_t        reqId;
162
  SEpSet*         pEpset;
L
Liu Jicong 已提交
163
  union {
L
Liu Jicong 已提交
164 165
    SMqDataRsp dataRsp;
    SMqMetaRsp metaRsp;
L
Liu Jicong 已提交
166
    STaosxRsp  taosxRsp;
L
Liu Jicong 已提交
167
  };
L
Liu Jicong 已提交
168 169
} SMqPollRspWrapper;

L
Liu Jicong 已提交
170
typedef struct {
171 172
  int64_t refId;
  int32_t epoch;
L
Liu Jicong 已提交
173 174
  tsem_t  rspSem;
  int32_t rspErr;
L
Liu Jicong 已提交
175
} SMqSubscribeCbParam;
L
Liu Jicong 已提交
176

L
Liu Jicong 已提交
177
typedef struct {
178 179 180 181
  int64_t          refId;
  int32_t          epoch;
  void*            pParam;
  __tmq_askep_fn_t pUserFn;
182 183
} SMqAskEpCbParam;

L
Liu Jicong 已提交
184
typedef struct {
185 186
  int64_t         refId;
  int32_t         epoch;
L
Liu Jicong 已提交
187
  SMqClientVg*    pVg;
L
Liu Jicong 已提交
188
  SMqClientTopic* pTopic;
L
Liu Jicong 已提交
189
  int32_t         vgId;
H
Haojun Liao 已提交
190
  uint64_t        requestId; // request id for debug purpose
X
Xiaoyu Wang 已提交
191
} SMqPollCbParam;
192

193
typedef struct {
194 195
  int64_t        refId;
  int32_t        epoch;
L
Liu Jicong 已提交
196 197
  int32_t        waitingRspNum;
  int32_t        totalRspNum;
198
  int32_t        code;
199
  tmq_commit_cb* callbackFn;
L
Liu Jicong 已提交
200 201
  /*SArray*        successfulOffsets;*/
  /*SArray*        failedOffsets;*/
202
  void*          userParam;
203 204 205 206 207
} SMqCommitCbParamSet;

typedef struct {
  SMqCommitCbParamSet* params;
  STqOffset*           pOffset;
H
Haojun Liao 已提交
208 209 210
  char                 topicName[TSDB_TOPIC_FNAME_LEN];
  int32_t              vgId;
  tmq_t*               pTmq;
211
} SMqCommitCbParam;
212

213
static int32_t doAskEp(tmq_t* tmq);
214 215
static int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg);
static int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet);
216 217
static int32_t doSendCommitMsg(tmq_t* tmq, SMqClientVg* pVg, const char* pTopicName, SMqCommitCbParamSet* pParamSet,
                               int32_t index, int32_t totalVgroups);
218 219 220
static void commitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId);
static void asyncAskEp(tmq_t* pTmq, __tmq_askep_fn_t askEpFn, void* param);
static void addToQueueCallbackFn(tmq_t* pTmq, int32_t code, SDataBuf* pDataBuf, void* param);
221

222
tmq_conf_t* tmq_conf_new() {
wafwerar's avatar
wafwerar 已提交
223
  tmq_conf_t* conf = taosMemoryCalloc(1, sizeof(tmq_conf_t));
224 225 226 227 228
  if (conf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return conf;
  }

229
  conf->withTbName = false;
L
Liu Jicong 已提交
230
  conf->autoCommit = true;
231
  conf->autoCommitInterval = DEFAULT_AUTO_COMMIT_INTERVAL;
232
  conf->resetOffset = TMQ_OFFSET__RESET_EARLIEAST;
233
  conf->hbBgEnable = true;
234

235 236 237
  return conf;
}

L
Liu Jicong 已提交
238
/*
 * Release a configuration object together with the ip/user/pass strings it holds.
 * A NULL conf is ignored.
 */
void tmq_conf_destroy(tmq_conf_t* conf) {
  if (conf == NULL) {
    return;
  }

  char* ownedStrings[] = {conf->ip, conf->user, conf->pass};
  for (size_t k = 0; k < sizeof(ownedStrings) / sizeof(ownedStrings[0]); ++k) {
    if (ownedStrings[k] != NULL) {
      taosMemoryFree(ownedStrings[k]);
    }
  }

  taosMemoryFree(conf);
}

tmq_conf_res_t tmq_conf_set(tmq_conf_t* conf, const char* key, const char* value) {
254
  if (strcasecmp(key, "group.id") == 0) {
L
Liu Jicong 已提交
255
    tstrncpy(conf->groupId, value, TSDB_CGROUP_LEN);
L
Liu Jicong 已提交
256
    return TMQ_CONF_OK;
257
  }
L
Liu Jicong 已提交
258

259
  if (strcasecmp(key, "client.id") == 0) {
L
Liu Jicong 已提交
260
    tstrncpy(conf->clientId, value, 256);
L
Liu Jicong 已提交
261 262
    return TMQ_CONF_OK;
  }
L
Liu Jicong 已提交
263

264 265
  if (strcasecmp(key, "enable.auto.commit") == 0) {
    if (strcasecmp(value, "true") == 0) {
L
Liu Jicong 已提交
266
      conf->autoCommit = true;
L
Liu Jicong 已提交
267
      return TMQ_CONF_OK;
268
    } else if (strcasecmp(value, "false") == 0) {
L
Liu Jicong 已提交
269
      conf->autoCommit = false;
L
Liu Jicong 已提交
270 271 272 273
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
274
  }
L
Liu Jicong 已提交
275

276
  if (strcasecmp(key, "auto.commit.interval.ms") == 0) {
277
    conf->autoCommitInterval = taosStr2int64(value);
L
Liu Jicong 已提交
278 279 280
    return TMQ_CONF_OK;
  }

281 282 283
  if (strcasecmp(key, "auto.offset.reset") == 0) {
    if (strcasecmp(value, "none") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_NONE;
L
Liu Jicong 已提交
284
      return TMQ_CONF_OK;
285 286
    } else if (strcasecmp(value, "earliest") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_EARLIEAST;
L
Liu Jicong 已提交
287
      return TMQ_CONF_OK;
288 289
    } else if (strcasecmp(value, "latest") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_LATEST;
L
Liu Jicong 已提交
290 291 292 293 294
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
  }
L
Liu Jicong 已提交
295

296 297
  if (strcasecmp(key, "msg.with.table.name") == 0) {
    if (strcasecmp(value, "true") == 0) {
298
      conf->withTbName = true;
L
Liu Jicong 已提交
299
      return TMQ_CONF_OK;
300
    } else if (strcasecmp(value, "false") == 0) {
301
      conf->withTbName = false;
L
Liu Jicong 已提交
302
      return TMQ_CONF_OK;
303 304 305 306 307
    } else {
      return TMQ_CONF_INVALID;
    }
  }

308 309
  if (strcasecmp(key, "experimental.snapshot.enable") == 0) {
    if (strcasecmp(value, "true") == 0) {
L
Liu Jicong 已提交
310
      conf->snapEnable = true;
311
      return TMQ_CONF_OK;
312
    } else if (strcasecmp(value, "false") == 0) {
L
Liu Jicong 已提交
313
      conf->snapEnable = false;
314 315 316 317 318 319
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
  }

320
  if (strcasecmp(key, "experimental.snapshot.batch.size") == 0) {
321
    conf->snapBatchSize = taosStr2int64(value);
L
Liu Jicong 已提交
322 323 324
    return TMQ_CONF_OK;
  }

325
  if (strcasecmp(key, "enable.heartbeat.background") == 0) {
326 327 328 329 330 331 332 333
//    if (strcasecmp(value, "true") == 0) {
//      conf->hbBgEnable = true;
//      return TMQ_CONF_OK;
//    } else if (strcasecmp(value, "false") == 0) {
//      conf->hbBgEnable = false;
//      return TMQ_CONF_OK;
//    } else {
      tscError("the default value of enable.heartbeat.background is true, can not be seted");
L
Liu Jicong 已提交
334
      return TMQ_CONF_INVALID;
335
//    }
L
Liu Jicong 已提交
336 337
  }

338
  if (strcasecmp(key, "td.connect.ip") == 0) {
339
    conf->ip = taosStrdup(value);
L
Liu Jicong 已提交
340 341
    return TMQ_CONF_OK;
  }
342

343
  if (strcasecmp(key, "td.connect.user") == 0) {
344
    conf->user = taosStrdup(value);
L
Liu Jicong 已提交
345 346
    return TMQ_CONF_OK;
  }
347

348
  if (strcasecmp(key, "td.connect.pass") == 0) {
349
    conf->pass = taosStrdup(value);
L
Liu Jicong 已提交
350 351
    return TMQ_CONF_OK;
  }
352

353
  if (strcasecmp(key, "td.connect.port") == 0) {
354
    conf->port = taosStr2int64(value);
L
Liu Jicong 已提交
355 356
    return TMQ_CONF_OK;
  }
357

358
  if (strcasecmp(key, "td.connect.db") == 0) {
L
Liu Jicong 已提交
359 360 361
    return TMQ_CONF_OK;
  }

L
Liu Jicong 已提交
362
  return TMQ_CONF_UNKNOWN;
363 364 365
}

tmq_list_t* tmq_list_new() {
L
Liu Jicong 已提交
366
  return (tmq_list_t*)taosArrayInit(0, sizeof(void*));
367 368
}

L
Liu Jicong 已提交
369 370
/*
 * Append a copy of the topic name src to list.
 *
 * Names that do not start with a backquote are stored lower-cased; backquoted
 * names are stored verbatim. The list owns the copy.
 *
 * Returns 0 on success and -1 when list is NULL, src is NULL or empty, or memory
 * cannot be allocated. Nothing is leaked on failure.
 */
int32_t tmq_list_append(tmq_list_t* list, const char* src) {
  if (list == NULL || src == NULL || src[0] == 0) return -1;

  char* topic = taosStrdup(src);
  if (topic == NULL) return -1;

  if (topic[0] != '`') {
    strtolower(topic, src);
  }

  if (taosArrayPush(&list->container, &topic) == NULL) {
    // the array did not take ownership, so release the copy here
    taosMemoryFree(topic);
    return -1;
  }

  return 0;
}

L
Liu Jicong 已提交
380
/* Destroy the topic list, releasing every stored topic string with taosMemoryFree. */
void tmq_list_destroy(tmq_list_t* list) {
  taosArrayDestroyP(&list->container, taosMemoryFree);
}

L
Liu Jicong 已提交
385 386 387 388 389 390 391 392 393 394
/* Return the number of topic names currently stored in list. */
int32_t tmq_list_get_size(const tmq_list_t* list) {
  return taosArrayGetSize(&list->container);
}

/*
 * Expose the list's backing storage as an array of C strings. The returned pointer
 * aliases the list's internal buffer; it is not a copy.
 */
char** tmq_list_to_c_array(const tmq_list_t* list) {
  return list->container.pData;
}

395 396 397 398 399
/*
 * Look up the vgroup vgId of topic pName in pTopicList (SArray<SMqClientTopic>).
 *
 * On a hit, returns the matching SMqClientVg, stores its position within the topic's
 * vgroup array in *index, and stores that topic's vgroup count in *numOfVgroups.
 * On a miss, returns NULL with *index == -1; *numOfVgroups then holds the vgroup
 * count of the last topic whose name matched, or 0 if no topic matched.
 */
static SMqClientVg* foundClientVg(SArray* pTopicList, const char* pName, int32_t vgId, int32_t* index, int32_t* numOfVgroups) {
  *index = -1;
  *numOfVgroups = 0;

  int32_t topicCnt = taosArrayGetSize(pTopicList);
  for (int32_t t = 0; t < topicCnt; ++t) {
    SMqClientTopic* pCur = taosArrayGet(pTopicList, t);
    if (strcmp(pCur->topicName, pName) == 0) {
      *numOfVgroups = taosArrayGetSize(pCur->vgs);

      int32_t v = 0;
      while (v < (*numOfVgroups)) {
        SMqClientVg* pCandidate = taosArrayGet(pCur->vgs, v);
        if (pCandidate->vgId == vgId) {
          *index = v;
          return pCandidate;
        }
        ++v;
      }
    }
  }

  return NULL;
}
418

419 420 421
// Notes on this callback:
// 1. Epset updates are not handled here; the response to a poll request takes care of them.
// 2. Commit failures are not retried here yet. This still needs to be resolved.
H
Haojun Liao 已提交
422
/*
 * Response callback for one commit-offset request sent by doSendCommitMsg().
 *
 * Releases the offset that was attached to the request and the response buffers,
 * then counts the response down on the shared parameter set.
 *
 * param  SMqCommitCbParam built by doSendCommitMsg(); not freed here.
 * pBuf   response buffer; may be NULL, in which case only the offset is released.
 * code   result of the request; currently ignored, a failed commit is not retried.
 *
 * Always returns 0.
 *
 * TODO: replace the raw pTmq pointer carried in the param with the consumer refId.
 */
static int32_t tmqCommitCb(void* param, SDataBuf* pBuf, int32_t code) {
  SMqCommitCbParam*    pParam = (SMqCommitCbParam*)param;
  SMqCommitCbParamSet* pParamSet = (SMqCommitCbParamSet*)pParam->params;

  taosMemoryFree(pParam->pOffset);
  if (pBuf != NULL) {
    taosMemoryFree(pBuf->pData);
    taosMemoryFree(pBuf->pEpSet);
  }

  commitRspCountDown(pParamSet, pParam->pTmq->consumerId, pParam->topicName, pParam->vgId);
  return 0;
}

464 465
/*
 * Build and asynchronously send one TDMT_VND_TMQ_COMMIT_OFFSET request that commits
 * pVg->currentOffset for the subscription "<groupId><TMQ_SEPARATOR><pTopicName>".
 *
 * tmq           consumer issuing the commit
 * pVg           vgroup whose current offset is committed
 * pTopicName    topic the vgroup belongs to
 * pParamSet     shared bookkeeping; waitingRspNum and totalRspNum are each incremented
 *               once just before the request is handed to the transport
 * index         position of pVg inside the topic (used for logging only)
 * totalVgroups  number of vgroups of the topic (used for logging only)
 *
 * Returns TSDB_CODE_SUCCESS once the request has been handed to the transport,
 * TSDB_CODE_OUT_OF_MEMORY or TSDB_CODE_INVALID_PARA otherwise. On every failure
 * path all memory allocated here is released and pParamSet is left untouched.
 *
 * On success the offset copy is released by tmqCommitCb() and the callback param
 * through paramFreeFp.
 */
static int32_t doSendCommitMsg(tmq_t* tmq, SMqClientVg* pVg, const char* pTopicName, SMqCommitCbParamSet* pParamSet,
                               int32_t index, int32_t totalVgroups) {
  STqOffset* pOffset = taosMemoryCalloc(1, sizeof(STqOffset));
  if (pOffset == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  pOffset->val = pVg->currentOffset;

  // subKey = groupId + separator + topic name
  int32_t groupLen = strlen(tmq->groupId);
  memcpy(pOffset->subKey, tmq->groupId, groupLen);
  pOffset->subKey[groupLen] = TMQ_SEPARATOR;
  strcpy(pOffset->subKey + groupLen + 1, pTopicName);

  int32_t len = 0;
  int32_t code = 0;
  tEncodeSize(tEncodeSTqOffset, pOffset, len, code);
  if (code < 0) {
    taosMemoryFree(pOffset);  // previously leaked on this path
    return TSDB_CODE_INVALID_PARA;
  }

  void* buf = taosMemoryCalloc(1, sizeof(SMsgHead) + len);
  if (buf == NULL) {
    taosMemoryFree(pOffset);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  ((SMsgHead*)buf)->vgId = htonl(pVg->vgId);

  // the encoded offset follows the message head
  void* abuf = POINTER_SHIFT(buf, sizeof(SMsgHead));

  SEncoder encoder;
  tEncoderInit(&encoder, abuf, len);
  tEncodeSTqOffset(&encoder, pOffset);
  tEncoderClear(&encoder);

  // build param
  SMqCommitCbParam* pParam = taosMemoryCalloc(1, sizeof(SMqCommitCbParam));
  if (pParam == NULL) {
    taosMemoryFree(pOffset);
    taosMemoryFree(buf);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  pParam->params = pParamSet;
  pParam->pOffset = pOffset;
  pParam->vgId = pVg->vgId;
  pParam->pTmq = tmq;

  tstrncpy(pParam->topicName, pTopicName, tListLen(pParam->topicName));

  // build send info
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (pMsgSendInfo == NULL) {
    taosMemoryFree(pOffset);
    taosMemoryFree(buf);
    taosMemoryFree(pParam);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  pMsgSendInfo->msgInfo = (SDataBuf){
      .pData = buf,
      .len = sizeof(SMsgHead) + len,
      .handle = NULL,
  };

  pMsgSendInfo->requestId = generateRequestId();
  pMsgSendInfo->requestObjRefId = 0;
  pMsgSendInfo->param = pParam;
  pMsgSendInfo->paramFreeFp = taosMemoryFree;
  pMsgSendInfo->fp = tmqCommitCb;
  pMsgSendInfo->msgType = TDMT_VND_TMQ_COMMIT_OFFSET;

  // account for the outstanding response before the request can possibly complete
  atomic_add_fetch_32(&pParamSet->waitingRspNum, 1);
  atomic_add_fetch_32(&pParamSet->totalRspNum, 1);

  SEp* pEp = GET_ACTIVE_EP(&pVg->epSet);
  char offsetBuf[80] = {0};
  tFormatOffset(offsetBuf, tListLen(offsetBuf), &pOffset->val);

  char commitBuf[80] = {0};
  tFormatOffset(commitBuf, tListLen(commitBuf), &pVg->committedOffset);
  tscDebug("consumer:0x%" PRIx64 " topic:%s on vgId:%d send offset:%s prev:%s, ep:%s:%d, ordinal:%d/%d, req:0x%" PRIx64,
           tmq->consumerId, pOffset->subKey, pVg->vgId, offsetBuf, commitBuf, pEp->fqdn, pEp->port, index + 1,
           totalVgroups, pMsgSendInfo->requestId);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, pMsgSendInfo);

  return TSDB_CODE_SUCCESS;
}

556 557 558 559 560 561 562 563 564 565 566 567 568
/*
 * Commit the offset of the single topic/vgroup that the result pRes was read from.
 *
 * pCommitFp is invoked directly, with no request sent, in these cases:
 *   - tmq or pRes is NULL                    -> TSDB_CODE_INVALID_PARA
 *   - pRes is not a TMQ result               -> TSDB_CODE_TMQ_INVALID_MSG
 *   - the parameter set cannot be allocated  -> TSDB_CODE_OUT_OF_MEMORY
 *   - the topic or vgroup is not subscribed  -> TSDB_CODE_SUCCESS
 *   - the current offset is not positive-typed or equals the committed one -> 0
 *   - doSendCommitMsg() fails                -> its error code
 * Otherwise a commit request is sent and the parameter set is handed over to the
 * response path.
 */
static void asyncCommitOffset(tmq_t* tmq, const TAOS_RES* pRes, tmq_commit_cb* pCommitFp, void* userParam) {
  if (tmq == NULL || pRes == NULL) {
    pCommitFp(tmq, TSDB_CODE_INVALID_PARA, userParam);
    return;
  }

  // pull topic name and vgroup id out of whichever result flavour we were given
  char*   pTopicName = NULL;
  int32_t vgId = 0;
  if (TD_RES_TMQ(pRes)) {
    SMqRspObj* pDataObj = (SMqRspObj*)pRes;
    pTopicName = pDataObj->topic;
    vgId = pDataObj->vgId;
  } else if (TD_RES_TMQ_META(pRes)) {
    SMqMetaRspObj* pMetaObj = (SMqMetaRspObj*)pRes;
    pTopicName = pMetaObj->topic;
    vgId = pMetaObj->vgId;
  } else if (TD_RES_TMQ_METADATA(pRes)) {
    SMqTaosxRspObj* pTaosxObj = (SMqTaosxRspObj*)pRes;
    pTopicName = pTaosxObj->topic;
    vgId = pTaosxObj->vgId;
  } else {
    pCommitFp(tmq, TSDB_CODE_TMQ_INVALID_MSG, userParam);
    return;
  }

  SMqCommitCbParamSet* pParamSet = taosMemoryCalloc(1, sizeof(SMqCommitCbParamSet));
  if (pParamSet == NULL) {
    pCommitFp(tmq, TSDB_CODE_OUT_OF_MEMORY, userParam);
    return;
  }

  pParamSet->refId = tmq->refId;
  pParamSet->epoch = tmq->epoch;
  pParamSet->callbackFn = pCommitFp;
  pParamSet->userParam = userParam;

  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);

  tscDebug("consumer:0x%" PRIx64 " do manual commit offset for %s, vgId:%d", tmq->consumerId, pTopicName, vgId);

  // locate the topic
  SMqClientTopic* pTopic = NULL;
  for (int32_t t = 0; t < numOfTopics; t++) {
    SMqClientTopic* pCandidate = taosArrayGet(tmq->clientTopics, t);
    if (strcmp(pCandidate->topicName, pTopicName) == 0) {
      pTopic = pCandidate;
      break;
    }
  }

  if (pTopic == NULL) {
    tscWarn("consumer:0x%" PRIx64 " failed to find the specified topic:%s, total topics:%d", tmq->consumerId, pTopicName,
            numOfTopics);
    taosMemoryFree(pParamSet);
    pCommitFp(tmq, TSDB_CODE_SUCCESS, userParam);
    return;
  }

  // locate the vgroup inside the topic
  int32_t      numOfVgroups = taosArrayGetSize(pTopic->vgs);
  int32_t      vgIndex = 0;
  SMqClientVg* pVg = NULL;
  for (; vgIndex < numOfVgroups; vgIndex++) {
    SMqClientVg* pCandidate = taosArrayGet(pTopic->vgs, vgIndex);
    if (pCandidate->vgId == vgId) {
      pVg = pCandidate;
      break;
    }
  }

  if (pVg == NULL) {
    tscWarn("consumer:0x%" PRIx64 " failed to find the specified vgId:%d, total Vgs:%d, topic:%s", tmq->consumerId, vgId,
            numOfVgroups, pTopicName);
    taosMemoryFree(pParamSet);
    pCommitFp(tmq, TSDB_CODE_SUCCESS, userParam);
    return;
  }

  int32_t code = 0;
  bool    needCommit = pVg->currentOffset.type > 0 && !tOffsetEqual(&pVg->currentOffset, &pVg->committedOffset);
  if (needCommit) {
    code = doSendCommitMsg(tmq, pVg, pTopic->topicName, pParamSet, vgIndex, numOfVgroups);
  }

  // nothing was sent (either not needed or the send failed): report to the user directly
  if (!needCommit || code != TSDB_CODE_SUCCESS) {
    taosMemoryFree(pParamSet);
    pCommitFp(tmq, code, userParam);
  }
}

648
/*
 * Commit the current offset of every vgroup of every subscribed topic whose offset
 * is positive-typed and differs from the last committed one.
 *
 * pCommitFp is called directly with TSDB_CODE_OUT_OF_MEMORY when the parameter set
 * cannot be allocated, and with TSDB_CODE_SUCCESS when no request was sent.
 * Otherwise the parameter set is counted down once here and the remaining handling
 * is left to commitRspCountDown().
 *
 * A vgroup whose request cannot be built is logged and skipped; its committedOffset
 * is left unchanged.
 */
static void asyncCommitAllOffsets(tmq_t* tmq, tmq_commit_cb* pCommitFp, void* userParam) {
  SMqCommitCbParamSet* pParamSet = taosMemoryCalloc(1, sizeof(SMqCommitCbParamSet));
  if (pParamSet == NULL) {
    pCommitFp(tmq, TSDB_CODE_OUT_OF_MEMORY, userParam);
    return;
  }

  pParamSet->refId = tmq->refId;
  pParamSet->epoch = tmq->epoch;
  pParamSet->callbackFn = pCommitFp;
  pParamSet->userParam = userParam;

  // init as 1 to prevent concurrency issue
  pParamSet->waitingRspNum = 1;

  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
  tscDebug("consumer:0x%" PRIx64 " start to commit offset for %d topics", tmq->consumerId, numOfTopics);

  for (int32_t i = 0; i < numOfTopics; i++) {
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
    int32_t         numOfVgroups = taosArrayGetSize(pTopic->vgs);

    tscDebug("consumer:0x%" PRIx64 " commit offset for topics:%s, numOfVgs:%d", tmq->consumerId, pTopic->topicName,
             numOfVgroups);
    for (int32_t j = 0; j < numOfVgroups; j++) {
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);

      if (pVg->currentOffset.type > 0 && !tOffsetEqual(&pVg->currentOffset, &pVg->committedOffset)) {
        int32_t code = doSendCommitMsg(tmq, pVg, pTopic->topicName, pParamSet, j, numOfVgroups);
        if (code != TSDB_CODE_SUCCESS) {
          // doSendCommitMsg() reports failures through its return value and does not
          // set terrno, so the returned code is what must be logged
          tscError("consumer:0x%" PRIx64 " topic:%s vgId:%d offset:%" PRId64 " failed, code:%s ordinal:%d/%d",
                   tmq->consumerId, pTopic->topicName, pVg->vgId, pVg->committedOffset.version, tstrerror(code),
                   j + 1, numOfVgroups);
          continue;
        }

        // update the offset value.
        pVg->committedOffset = pVg->currentOffset;
      } else {
        tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d, not commit, current:%" PRId64 ", ordinal:%d/%d",
                 tmq->consumerId, pTopic->topicName, pVg->vgId, pVg->currentOffset.version, j + 1, numOfVgroups);
      }
    }
  }

  tscDebug("consumer:0x%" PRIx64 " total commit:%d for %d topics", tmq->consumerId, pParamSet->waitingRspNum - 1,
           numOfTopics);

  // no request is sent
  if (pParamSet->totalRspNum == 0) {
    taosMemoryFree(pParamSet);
    pCommitFp(tmq, TSDB_CODE_SUCCESS, userParam);
    return;
  }

  // count down since waiting rsp num init as 1
  commitRspCountDown(pParamSet, tmq->consumerId, "", 0);
}

707 708
static void generateTimedTask(int64_t refId, int32_t type) {
  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
709
  if (tmq != NULL) {
S
Shengliang Guan 已提交
710
    int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
711
    *pTaskType = type;
712 713 714
    taosWriteQitem(tmq->delayedTask, pTaskType);
    tsem_post(&tmq->rspSem);
  }
715
  taosReleaseRef(tmqMgmt.rsetId, refId);
716 717 718 719 720
}

/*
 * Timer callback: queue an ASK_EP delayed task for the consumer whose refId is stored
 * in the heap-allocated int64_t that param points to, then free that allocation.
 * tmrId is unused.
 */
void tmqAssignAskEpTask(void* param, void* tmrId) {
  int64_t* pRefId = (int64_t*)param;
  generateTimedTask(*pRefId, TMQ_DELAYED_TASK__ASK_EP);
  taosMemoryFree(pRefId);
}

void tmqAssignDelayedCommitTask(void* param, void* tmrId) {
725
  int64_t refId = *(int64_t*)param;
726
  generateTimedTask(refId, TMQ_DELAYED_TASK__COMMIT);
727
  taosMemoryFree(param);
L
Liu Jicong 已提交
728 729 730
}

void tmqAssignDelayedReportTask(void* param, void* tmrId) {
731 732 733
  int64_t refId = *(int64_t*)param;
  tmq_t*  tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq != NULL) {
S
Shengliang Guan 已提交
734
    int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
735 736 737 738
    *pTaskType = TMQ_DELAYED_TASK__REPORT;
    taosWriteQitem(tmq->delayedTask, pTaskType);
    tsem_post(&tmq->rspSem);
  }
739 740

  taosReleaseRef(tmqMgmt.rsetId, refId);
741
  taosMemoryFree(param);
L
Liu Jicong 已提交
742 743
}

744
/*
 * Response callback for the heartbeat request: the reply carries nothing that is
 * used, so its buffers are simply released. param and code are ignored.
 * Always returns 0.
 */
int32_t tmqHbCb(void* param, SDataBuf* pMsg, int32_t code) {
  if (pMsg == NULL) {
    return 0;
  }

  taosMemoryFree(pMsg->pData);
  taosMemoryFree(pMsg->pEpSet);
  return 0;
}

void tmqSendHbReq(void* param, void* tmrId) {
753
  int64_t refId = *(int64_t*)param;
754

755 756
  tmq_t*  tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) {
L
Liu Jicong 已提交
757
    taosMemoryFree(param);
758 759
    return;
  }
D
dapan1121 已提交
760 761 762 763 764

  SMqHbReq req = {0};
  req.consumerId = tmq->consumerId;
  req.epoch = tmq->epoch;

L
Liu Jicong 已提交
765
  int32_t tlen = tSerializeSMqHbReq(NULL, 0, &req);
D
dapan1121 已提交
766 767
  if (tlen < 0) {
    tscError("tSerializeSMqHbReq failed");
768
    goto OVER;
D
dapan1121 已提交
769
  }
770

L
Liu Jicong 已提交
771
  void* pReq = taosMemoryCalloc(1, tlen);
D
dapan1121 已提交
772 773
  if (tlen < 0) {
    tscError("failed to malloc MqHbReq msg, size:%d", tlen);
774
    goto OVER;
D
dapan1121 已提交
775
  }
776

D
dapan1121 已提交
777 778 779
  if (tSerializeSMqHbReq(pReq, tlen, &req) < 0) {
    tscError("tSerializeSMqHbReq %d failed", tlen);
    taosMemoryFree(pReq);
780
    goto OVER;
D
dapan1121 已提交
781
  }
782 783 784 785

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pReq);
L
Liu Jicong 已提交
786
    goto OVER;
787
  }
788

789 790
  sendInfo->msgInfo = (SDataBuf){
      .pData = pReq,
D
dapan1121 已提交
791
      .len = tlen,
792 793 794 795 796 797 798
      .handle = NULL,
  };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = NULL;
  sendInfo->fp = tmqHbCb;
L
Liu Jicong 已提交
799
  sendInfo->msgType = TDMT_MND_TMQ_HB;
800 801 802 803 804 805 806

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

OVER:
807
  taosTmrReset(tmqSendHbReq, 1000, param, tmqMgmt.timer, &tmq->hbLiveTimer);
808
  taosReleaseRef(tmqMgmt.rsetId, refId);
809 810
}

811 812 813 814 815 816
/*
 * Commit callback used when the consumer has no commitCb of its own: it only logs a
 * failed commit at debug level. param is unused.
 */
static void defaultCommitCbFn(tmq_t* pTmq, int32_t code, void* param) {
  if (code == 0) {
    return;
  }

  tscDebug("consumer:0x%"PRIx64", failed to commit offset, code:%s", pTmq->consumerId, tstrerror(code));
}

817
/*
 * Drain the consumer's delayed-task queue and run every task found in it:
 *   ASK_EP  - request the endpoint set asynchronously and re-arm epTimer for 1s
 *   COMMIT  - commit all offsets (using the consumer's commitCb, or defaultCommitCbFn
 *             when none is set) and re-arm commitTimer for autoCommitInterval
 *   REPORT  - nothing to do
 *
 * Each re-armed timer receives a heap copy of the consumer refId that the timer
 * callback frees. If that copy cannot be allocated the timer is not re-armed and
 * an error is logged.
 *
 * Returns TSDB_CODE_OUT_OF_MEMORY if the temporary queue cannot be allocated,
 * otherwise 0.
 */
int32_t tmqHandleAllDelayedTask(tmq_t* pTmq) {
  STaosQall* qall = taosAllocateQall();
  if (qall == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  taosReadAllQitems(pTmq->delayedTask, qall);

  if (qall->numOfItems == 0) {
    taosFreeQall(qall);
    return TSDB_CODE_SUCCESS;
  }

  tscDebug("consumer:0x%" PRIx64 " handle delayed %d tasks before poll data", pTmq->consumerId, qall->numOfItems);
  int8_t* pTaskType = NULL;
  taosGetQitem(qall, (void**)&pTaskType);

  while (pTaskType != NULL) {
    if (*pTaskType == TMQ_DELAYED_TASK__ASK_EP) {
      asyncAskEp(pTmq, addToQueueCallbackFn, NULL);

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
      if (pRefId != NULL) {
        *pRefId = pTmq->refId;

        tscDebug("consumer:0x%" PRIx64 " retrieve ep from mnode in 1s", pTmq->consumerId);
        taosTmrReset(tmqAssignAskEpTask, 1000, pRefId, tmqMgmt.timer, &pTmq->epTimer);
      } else {
        tscError("consumer:0x%" PRIx64 " out of memory, ask-ep timer is not rescheduled", pTmq->consumerId);
      }
    } else if (*pTaskType == TMQ_DELAYED_TASK__COMMIT) {
      tmq_commit_cb* pCallbackFn = pTmq->commitCb ? pTmq->commitCb : defaultCommitCbFn;

      asyncCommitAllOffsets(pTmq, pCallbackFn, pTmq->commitCbUserParam);

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
      if (pRefId != NULL) {
        *pRefId = pTmq->refId;

        tscDebug("consumer:0x%" PRIx64 " next commit to vnode(s) in %.2fs", pTmq->consumerId,
                 pTmq->autoCommitInterval / 1000.0);
        taosTmrReset(tmqAssignDelayedCommitTask, pTmq->autoCommitInterval, pRefId, tmqMgmt.timer, &pTmq->commitTimer);
      } else {
        tscError("consumer:0x%" PRIx64 " out of memory, auto-commit timer is not rescheduled", pTmq->consumerId);
      }
    } else if (*pTaskType == TMQ_DELAYED_TASK__REPORT) {
      // intentionally empty: report tasks carry no work at the moment
    }

    taosFreeQitem(pTaskType);
    taosGetQitem(qall, (void**)&pTaskType);
  }

  taosFreeQall(qall);
  return 0;
}

860
// Releases the payload owned by a response wrapper, selected by its tmqRspType.
// The wrapper object itself is not freed here. Unknown types and TMQ_MSG_TYPE__END_RSP
// own nothing and are left untouched. Always returns NULL.
static void* tmqFreeRspWrapper(SMqRspWrapper* rspWrapper) {
  switch (rspWrapper->tmqRspType) {
    case TMQ_MSG_TYPE__EP_RSP: {
      SMqAskEpRspWrapper* pAskEp = (SMqAskEpRspWrapper*)rspWrapper;
      tDeleteSMqAskEpRsp(&pAskEp->msg);
      break;
    }

    case TMQ_MSG_TYPE__POLL_RSP: {
      SMqPollRspWrapper* pPoll = (SMqPollRspWrapper*)rspWrapper;
      taosMemoryFreeClear(pPoll->pEpset);

      taosArrayDestroyP(pPoll->dataRsp.blockData, taosMemoryFree);
      taosArrayDestroy(pPoll->dataRsp.blockDataLen);
      taosArrayDestroyP(pPoll->dataRsp.blockTbName, taosMemoryFree);
      taosArrayDestroyP(pPoll->dataRsp.blockSchema, (FDelete)tDeleteSSchemaWrapper);
      break;
    }

    case TMQ_MSG_TYPE__POLL_META_RSP: {
      SMqPollRspWrapper* pPoll = (SMqPollRspWrapper*)rspWrapper;
      taosMemoryFreeClear(pPoll->pEpset);

      taosMemoryFree(pPoll->metaRsp.metaRsp);
      break;
    }

    case TMQ_MSG_TYPE__TAOSX_RSP: {
      SMqPollRspWrapper* pPoll = (SMqPollRspWrapper*)rspWrapper;
      taosMemoryFreeClear(pPoll->pEpset);

      taosArrayDestroyP(pPoll->taosxRsp.blockData, taosMemoryFree);
      taosArrayDestroy(pPoll->taosxRsp.blockDataLen);
      taosArrayDestroyP(pPoll->taosxRsp.blockTbName, taosMemoryFree);
      taosArrayDestroyP(pPoll->taosxRsp.blockSchema, (FDelete)tDeleteSSchemaWrapper);
      // taosx-only members
      taosArrayDestroy(pPoll->taosxRsp.createTableLen);
      taosArrayDestroyP(pPoll->taosxRsp.createTableReq, taosMemoryFree);
      break;
    }

    case TMQ_MSG_TYPE__END_RSP:
    default:
      // nothing owned
      break;
  }

  return NULL;
}

L
Liu Jicong 已提交
895
// Discards every response that has not been handed to the user yet.
// Pass 0 drains what is already staged in tmq->qall; pass 1 moves the content of
// tmq->mqueue into tmq->qall and drains it again. Each item has its payload released
// with tmqFreeRspWrapper() before the queue item itself is freed.
void tmqClearUnhandleMsg(tmq_t* tmq) {
  for (int32_t pass = 0; pass < 2; ++pass) {
    if (pass == 1) {
      taosReadAllQitems(tmq->mqueue, tmq->qall);
    }

    SMqRspWrapper* pItem = NULL;
    for (;;) {
      taosGetQitem(tmq->qall, (void**)&pItem);
      if (pItem == NULL) {
        break;
      }

      tmqFreeRspWrapper(pItem);
      taosFreeQitem(pItem);
    }
  }
}

D
dapan1121 已提交
920
// Response callback for the subscribe request sent by tmq_subscribe().
// Stores the response code in the waiting caller's SMqSubscribeCbParam and wakes it up.
// Like the other response callbacks in this file, it releases the response buffers
// (pData and pEpSet) handed to it. Always returns 0.
int32_t tmqSubscribeCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqSubscribeCbParam* pParam = (SMqSubscribeCbParam*)param;
  pParam->rspErr = code;

  if (pMsg != NULL) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
  }

  // post last: the waiter owns pParam (it lives on its stack) and may return right after this
  tsem_post(&pParam->rspSem);
  return 0;
}
928

L
Liu Jicong 已提交
929
// Appends the names of the topics this consumer currently holds to *topics, creating the
// list first when *topics is NULL. Each stored topic name is appended without the part up
// to and including its first '.'; a name that contains no '.' is appended unchanged.
// Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY if the list cannot be created.
int32_t tmq_subscription(tmq_t* tmq, tmq_list_t** topics) {
  if (*topics == NULL) {
    *topics = tmq_list_new();
    if (*topics == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  for (int i = 0; i < taosArrayGetSize(tmq->clientTopics); i++) {
    SMqClientTopic* topic = taosArrayGet(tmq->clientTopics, i);

    // strchr() returns NULL when there is no '.', so never do arithmetic on its result blindly
    char* pSep = strchr(topic->topicName, '.');
    tmq_list_append(*topics, (pSep != NULL) ? pSep + 1 : topic->topicName);
  }

  return 0;
}

L
Liu Jicong 已提交
940
// Unsubscribes from everything by subscribing to an empty topic list.
// While the result is TSDB_CODE_MND_CONSUMER_NOT_READY the request is repeated after a
// 500ms sleep, for at most 6 repeats (7 attempts in total). Returns the last result.
int32_t tmq_unsubscribe(tmq_t* tmq) {
  tmq_list_t* pEmptyList = tmq_list_new();

  int32_t code = tmq_subscribe(tmq, pEmptyList);
  for (int32_t nRetry = 0; code == TSDB_CODE_MND_CONSUMER_NOT_READY && nRetry <= 5; ++nRetry) {
    taosMsleep(500);
    code = tmq_subscribe(tmq, pEmptyList);
  }

  tmq_list_destroy(pEmptyList);
  return code;
}

958 959 960 961 962 963
static void freeClientVgImpl(void* param) {
  SMqClientTopic* pTopic = param;
  taosMemoryFreeClear(pTopic->schema.pSchema);
  taosArrayDestroy(pTopic->vgs);
}

964
void tmqFreeImpl(void* handle) {
965 966
  tmq_t*  tmq = (tmq_t*)handle;
  int64_t id = tmq->consumerId;
L
Liu Jicong 已提交
967

968
  // TODO stop timer
L
Liu Jicong 已提交
969 970 971 972
  if (tmq->mqueue) {
    tmqClearUnhandleMsg(tmq);
    taosCloseQueue(tmq->mqueue);
  }
L
Liu Jicong 已提交
973

H
Haojun Liao 已提交
974 975 976 977 978
  if (tmq->delayedTask) {
    taosCloseQueue(tmq->delayedTask);
  }

  taosFreeQall(tmq->qall);
979
  tsem_destroy(&tmq->rspSem);
L
Liu Jicong 已提交
980

981
  taosArrayDestroyEx(tmq->clientTopics, freeClientVgImpl);
982 983
  taos_close_internal(tmq->pTscObj);
  taosMemoryFree(tmq);
984 985

  tscDebug("consumer:0x%" PRIx64 " closed", id);
L
Liu Jicong 已提交
986 987
}

988 989 990 991 992 993 994 995 996
static void tmqMgmtInit(void) {
  tmqInitRes = 0;
  tmqMgmt.timer = taosTmrInit(1000, 100, 360000, "TMQ");

  if (tmqMgmt.timer == NULL) {
    tmqInitRes = TSDB_CODE_OUT_OF_MEMORY;
  }

  tmqMgmt.rsetId = taosOpenRef(10000, tmqFreeImpl);
997
  if (tmqMgmt.rsetId < 0) {
998 999 1000 1001
    tmqInitRes = terrno;
  }
}

L
Liu Jicong 已提交
1002
// Creates a consumer from `conf`: allocates the object and its queues, copies the
// configuration, opens the internal connection, registers the consumer in the tmq reference
// set and, when conf->hbBgEnable is set, starts the background heartbeat timer.
// Returns the new consumer, or NULL on failure (terrno is set on the paths that assign it).
// `errstr` / `errstrLen` are accepted for API compatibility and are not written here.
tmq_t* tmq_consumer_new(tmq_conf_t* conf, char* errstr, int32_t errstrLen) {
  taosThreadOnce(&tmqInit, tmqMgmtInit);
  if (tmqInitRes != 0) {
    terrno = tmqInitRes;
    return NULL;
  }

  tmq_t* pTmq = taosMemoryCalloc(1, sizeof(tmq_t));
  if (pTmq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    tscError("failed to create consumer, groupId:%s, code:%s", conf->groupId, terrstr());
    return NULL;
  }

  // parameter for the heartbeat timer; allocated before the consumer is published in the ref set
  int64_t* pHbRefId = NULL;

  // Init the semaphore before any path that can reach _failed: tmqFreeImpl() destroys it
  // unconditionally, so it must be initialized exactly once and never destroyed here.
  if (tsem_init(&pTmq->rspSem, 0, 0) != 0) {
    tscError("consumer:0x%" PRIx64 " setup failed since %s, consumer group %s", pTmq->consumerId, terrstr(),
             conf->groupId);
    taosMemoryFree(pTmq);
    return NULL;
  }

  const char* user = conf->user == NULL ? TSDB_DEFAULT_USER : conf->user;
  const char* pass = conf->pass == NULL ? TSDB_DEFAULT_PASS : conf->pass;

  pTmq->clientTopics = taosArrayInit(0, sizeof(SMqClientTopic));
  pTmq->mqueue = taosOpenQueue();
  pTmq->delayedTask = taosOpenQueue();
  pTmq->qall = taosAllocateQall();

  if (pTmq->clientTopics == NULL || pTmq->mqueue == NULL || pTmq->qall == NULL || pTmq->delayedTask == NULL ||
      conf->groupId[0] == 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    // pTmq->groupId has not been filled in yet, report the configured one
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(),
             conf->groupId);
    goto _failed;
  }

  // init status
  pTmq->status = TMQ_CONSUMER_STATUS__INIT;
  pTmq->pollCnt = 0;
  pTmq->epoch = 0;

  // set conf
  strcpy(pTmq->clientId, conf->clientId);
  strcpy(pTmq->groupId, conf->groupId);
  pTmq->withTbName = conf->withTbName;
  pTmq->useSnapshot = conf->snapEnable;
  pTmq->autoCommit = conf->autoCommit;
  pTmq->autoCommitInterval = conf->autoCommitInterval;
  pTmq->commitCb = conf->commitCb;
  pTmq->commitCbUserParam = conf->commitCbUserParam;
  pTmq->resetOffsetCfg = conf->resetOffset;

  pTmq->hbBgEnable = conf->hbBgEnable;

  // assign consumerId
  pTmq->consumerId = tGenIdPI64();

  // init connection
  pTmq->pTscObj = taos_connect_internal(conf->ip, user, pass, NULL, NULL, conf->port, CONN_TYPE__TMQ);
  if (pTmq->pTscObj == NULL) {
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(), pTmq->groupId);
    goto _failed;
  }

  if (pTmq->hbBgEnable) {
    pHbRefId = taosMemoryMalloc(sizeof(int64_t));
    if (pHbRefId == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(),
               pTmq->groupId);
      goto _failed;
    }
  }

  pTmq->refId = taosAddRef(tmqMgmt.rsetId, pTmq);
  if (pTmq->refId < 0) {
    taosMemoryFree(pHbRefId);
    goto _failed;
  }

  if (pTmq->hbBgEnable) {
    *pHbRefId = pTmq->refId;
    pTmq->hbLiveTimer = taosTmrStart(tmqSendHbReq, 1000, pHbRefId, tmqMgmt.timer);
  }

  char         buf[80] = {0};
  STqOffsetVal offset = {.type = pTmq->resetOffsetCfg};
  tFormatOffset(buf, tListLen(buf), &offset);
  tscInfo("consumer:0x%" PRIx64 " is setup, refId:%" PRId64
          ", groupId:%s, snapshot:%d, autoCommit:%d, commitInterval:%dms, offset:%s, backgroudHB:%d",
          pTmq->consumerId, pTmq->refId, pTmq->groupId, pTmq->useSnapshot, pTmq->autoCommit, pTmq->autoCommitInterval,
          buf, pTmq->hbBgEnable);

  return pTmq;

_failed:
  tmqFreeImpl(pTmq);
  return NULL;
}

L
Liu Jicong 已提交
1093
// Subscribes the consumer to the topics in `topic_list` (an empty list unsubscribes).
// Sends a TDMT_MND_TMQ_SUBSCRIBE request to the mnode and blocks until tmqSubscribeCb posts
// the response, then polls doAskEp() every 500ms while the mnode answers
// TSDB_CODE_MND_CONSUMER_NOT_READY, and finally starts the ask-ep timer and, when auto commit
// is enabled, the commit timer (each only if it is not running yet).
// Returns 0 on success; on failure a TSDB error code, or -1 when the response semaphore
// cannot be created.
int32_t tmq_subscribe(tmq_t* tmq, const tmq_list_t* topic_list) {
  const int32_t   MAX_RETRY_COUNT = 120 * 2;  // let's wait for 2 mins at most
  const SArray*   container = &topic_list->container;
  int32_t         sz = taosArrayGetSize(container);
  void*           buf = NULL;
  SMsgSendInfo*   sendInfo = NULL;
  SCMSubscribeReq req = {0};
  int32_t         code = 0;

  tscDebug("consumer:0x%" PRIx64 " cgroup:%s, subscribe %d topics", tmq->consumerId, tmq->groupId, sz);

  req.consumerId = tmq->consumerId;
  tstrncpy(req.clientId, tmq->clientId, 256);
  tstrncpy(req.cgroup, tmq->groupId, TSDB_CGROUP_LEN);
  req.topicNames = taosArrayInit(sz, sizeof(void*));

  if (req.topicNames == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  for (int32_t i = 0; i < sz; i++) {
    char* topic = taosArrayGetP(container, i);

    SName name = {0};
    tNameSetDbName(&name, tmq->pTscObj->acctId, topic, strlen(topic));
    char* topicFName = taosMemoryCalloc(1, TSDB_TOPIC_FNAME_LEN);
    if (topicFName == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }

    tNameExtractFullName(&name, topicFName);
    tscDebug("consumer:0x%" PRIx64 " subscribe topic:%s", tmq->consumerId, topicFName);

    // req.topicNames owns the name only once the push succeeded
    if (taosArrayPush(req.topicNames, &topicFName) == NULL) {
      taosMemoryFree(topicFName);
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }
  }

  int32_t tlen = tSerializeSCMSubscribeReq(NULL, &req);

  buf = taosMemoryMalloc(tlen);
  if (buf == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  void* abuf = buf;
  tSerializeSCMSubscribeReq(&abuf, &req);

  sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  SMqSubscribeCbParam param = {
      .rspErr = 0,
      .refId = tmq->refId,
      .epoch = tmq->epoch,
  };

  if (tsem_init(&param.rspSem, 0, 0) != 0) {
    code = -1;  // must not report success when the request was never sent
    goto FAIL;
  }

  sendInfo->msgInfo = (SDataBuf){
      .pData = buf,
      .len = tlen,
      .handle = NULL,
  };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = &param;
  sendInfo->fp = tmqSubscribeCb;
  sendInfo->msgType = TDMT_MND_TMQ_SUBSCRIBE;

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

  // avoid double free if msg is sent
  buf = NULL;
  sendInfo = NULL;

  tsem_wait(&param.rspSem);
  tsem_destroy(&param.rspSem);

  if (param.rspErr != 0) {
    code = param.rspErr;
    goto FAIL;
  }

  int32_t retryCnt = 0;
  while (TSDB_CODE_MND_CONSUMER_NOT_READY == doAskEp(tmq)) {
    if (retryCnt++ > MAX_RETRY_COUNT) {
      // the mnode never became ready: this is a failure, not a success
      code = TSDB_CODE_MND_CONSUMER_NOT_READY;
      goto FAIL;
    }

    tscDebug("consumer:0x%" PRIx64 ", mnd not ready for subscribe, retry:%d in 500ms", tmq->consumerId, retryCnt);
    taosMsleep(500);
  }

  // init ep timer
  if (tmq->epTimer == NULL) {
    int64_t* pRefId1 = taosMemoryMalloc(sizeof(int64_t));
    if (pRefId1 == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }

    *pRefId1 = tmq->refId;
    tmq->epTimer = taosTmrStart(tmqAssignAskEpTask, 1000, pRefId1, tmqMgmt.timer);
  }

  // init auto commit timer
  if (tmq->autoCommit && tmq->commitTimer == NULL) {
    int64_t* pRefId2 = taosMemoryMalloc(sizeof(int64_t));
    if (pRefId2 == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }

    *pRefId2 = tmq->refId;
    tmq->commitTimer = taosTmrStart(tmqAssignDelayedCommitTask, tmq->autoCommitInterval, pRefId2, tmqMgmt.timer);
  }

FAIL:
  // shared exit path, also taken on success (buf/sendInfo are NULL once the message was sent)
  taosArrayDestroyP(req.topicNames, taosMemoryFree);
  taosMemoryFree(buf);
  taosMemoryFree(sendInfo);

  return code;
}

L
Liu Jicong 已提交
1218
// Stores the auto-commit callback and its user parameter in the configuration;
// tmq_consumer_new() copies both into the consumer it creates.
void tmq_conf_set_auto_commit_cb(tmq_conf_t* conf, tmq_commit_cb* cb, void* param) {
  conf->commitCbUserParam = param;
  conf->commitCb = cb;
}
1222

D
dapan1121 已提交
1223
// Response callback of a poll request (see doTmqPollImpl). Takes ownership of `param`
// (an SMqPollCbParam) and of the response buffers in `pMsg`.
//  - consumer already closed: frees everything, sets terrno, returns -1.
//  - code != 0: discards the response; CONSUMER_MISMATCH switches the consumer to RECOVER after
//    500ms, NO_COMMITTED_OFFSET enqueues an END_RSP marker, WAL_LOG_NOT_EXIST only waits 500ms.
//    The vgroup is then set back to IDLE (if the epoch is unchanged) and -1 is returned.
//  - response from an older epoch: dropped, returns 0.
//  - otherwise: decodes the body by message type into a wrapper, puts it into tmq->mqueue,
//    wakes the poller and returns 0.
int32_t tmqPollCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqPollCbParam* pParam = (SMqPollCbParam*)param;

  int64_t         refId = pParam->refId;
  SMqClientVg*    pVg = pParam->pVg;
  SMqClientTopic* pTopic = pParam->pTopic;

  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) {
    taosMemoryFree(pParam);
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

  int32_t  epoch = pParam->epoch;
  int32_t  vgId = pParam->vgId;
  uint64_t requestId = pParam->requestId;

  taosMemoryFree(pParam);

  if (code != 0) {
    tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d, since %s, reqId:0x%" PRIx64, tmq->consumerId,
            vgId, epoch, tstrerror(code), requestId);

    if (pMsg->pData) taosMemoryFree(pMsg->pData);
    if (pMsg->pEpSet) taosMemoryFree(pMsg->pEpSet);

    // in case of consumer mismatch, wait for 500ms and retry
    if (code == TSDB_CODE_TMQ_CONSUMER_MISMATCH) {
      taosMsleep(500);
      atomic_store_8(&tmq->status, TMQ_CONSUMER_STATUS__RECOVER);
      tscDebug("consumer:0x%" PRIx64 " wait for the re-balance, wait for 500ms and set status to be RECOVER",
               tmq->consumerId);
    } else if (code == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
      SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
      if (pRspWrapper == NULL) {
        tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d since out of memory, reqId:0x%" PRIx64,
                tmq->consumerId, vgId, epoch, requestId);
        goto CREATE_MSG_FAIL;
      }

      pRspWrapper->tmqRspType = TMQ_MSG_TYPE__END_RSP;
      taosWriteQitem(tmq->mqueue, pRspWrapper);
    } else if (code == TSDB_CODE_WAL_LOG_NOT_EXIST) {  // poll data while insert
      taosMsleep(500);
    }

    goto CREATE_MSG_FAIL;
  }

  // a successful response must at least carry the SMqRspHead that is read below
  if (pMsg->pData == NULL || (int64_t)pMsg->len < (int64_t)sizeof(SMqRspHead)) {
    tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d since invalid rsp length, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, epoch, requestId);
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    goto CREATE_MSG_FAIL;
  }

  int32_t msgEpoch = ((SMqRspHead*)pMsg->pData)->epoch;
  int32_t tmqEpoch = atomic_load_32(&tmq->epoch);
  if (msgEpoch < tmqEpoch) {
    // do not write into queue since updating epoch reset
    tscWarn("consumer:0x%" PRIx64
            " msg discard from vgId:%d since from earlier epoch, rsp epoch %d, current epoch %d, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, msgEpoch, tmqEpoch, requestId);

    tsem_post(&tmq->rspSem);
    taosReleaseRef(tmqMgmt.rsetId, refId);

    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    return 0;
  }

  if (msgEpoch != tmqEpoch) {
    tscWarn("consumer:0x%" PRIx64 " mismatch rsp from vgId:%d, epoch %d, current epoch %d, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, msgEpoch, tmqEpoch, requestId);
  }

  // handle meta rsp
  int8_t rspType = ((SMqRspHead*)pMsg->pData)->mqMsgType;

  SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
  if (pRspWrapper == NULL) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    tscWarn("consumer:0x%" PRIx64 " msg discard from vgId:%d, epoch %d since out of memory", tmq->consumerId, vgId,
            epoch);
    goto CREATE_MSG_FAIL;
  }

  pRspWrapper->tmqRspType = rspType;
  pRspWrapper->vgHandle = pVg;
  pRspWrapper->topicHandle = pTopic;
  pRspWrapper->reqId = requestId;
  pRspWrapper->pEpset = pMsg->pEpSet;
  // use the id captured when the request was built instead of dereferencing pVg here
  pRspWrapper->vgId = vgId;

  pMsg->pEpSet = NULL;  // ownership moved into the wrapper
  if (rspType == TMQ_MSG_TYPE__POLL_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSMqDataRsp(&decoder, &pRspWrapper->dataRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->dataRsp, pMsg->pData, sizeof(SMqRspHead));

    char buf[80];
    tFormatOffset(buf, 80, &pRspWrapper->dataRsp.rspOffset);
    tscDebug("consumer:0x%" PRIx64 " recv poll rsp, vgId:%d, req ver:%" PRId64 ", rsp:%s type %d, reqId:0x%" PRIx64,
             tmq->consumerId, vgId, pRspWrapper->dataRsp.reqOffset.version, buf, rspType, requestId);
  } else if (rspType == TMQ_MSG_TYPE__POLL_META_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSMqMetaRsp(&decoder, &pRspWrapper->metaRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->metaRsp, pMsg->pData, sizeof(SMqRspHead));
  } else if (rspType == TMQ_MSG_TYPE__TAOSX_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSTaosxRsp(&decoder, &pRspWrapper->taosxRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->taosxRsp, pMsg->pData, sizeof(SMqRspHead));
  } else {  // invalid rspType
    tscError("consumer:0x%" PRIx64 " invalid rsp msg received, type:%d ignored", tmq->consumerId, rspType);
  }

  taosMemoryFree(pMsg->pData);
  taosWriteQitem(tmq->mqueue, pRspWrapper);

  int32_t total = taosQueueItemSize(tmq->mqueue);
  tscDebug("consumer:0x%" PRIx64 " put poll res into mqueue, type:%d, vgId:%d, total in queue:%d, reqId:0x%" PRIx64,
           tmq->consumerId, rspType, vgId, total, requestId);

  tsem_post(&tmq->rspSem);
  taosReleaseRef(tmqMgmt.rsetId, refId);

  return 0;

CREATE_MSG_FAIL:
  // pVg is only touched when the consumer is still on the epoch the request was sent in
  if (epoch == tmq->epoch) {
    atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
  }

  tsem_post(&tmq->rspSem);
  taosReleaseRef(tmqMgmt.rsetId, refId);

  return -1;
}

H
Haojun Liao 已提交
1363 1364 1365 1366 1367
// Per-vgroup state saved in a hash map (value type of pVgOffsetHashMap) and read back when
// SMqClientVg entries are rebuilt from an ask-ep response.
typedef struct SVgroupSaveInfo {
  STqOffsetVal offset;     // restored into SMqClientVg.currentOffset
  int64_t      numOfRows;  // restored into SMqClientVg.numOfRows
} SVgroupSaveInfo;

H
Haojun Liao 已提交
1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384
// Fills `pTopic` from one topic entry of an ask-ep response.
// The schema is moved (not copied) out of `pTopicEp`, whose schema is reset afterwards.
// One SMqClientVg is created per vgroup in the response; if `pVgOffsetHashMap` holds an entry
// for the topic/vgroup key, its offset and row count are carried over, otherwise the vgroup
// starts from tmq->resetOffsetCfg with zero rows.
// On allocation failure of the vgroup array an error is logged and pTopic->vgs is left NULL.
static void initClientTopicFromRsp(SMqClientTopic* pTopic, SMqSubTopicEp* pTopicEp, SHashObj* pVgOffsetHashMap,
                                   tmq_t* tmq) {
  pTopic->schema = pTopicEp->schema;
  pTopicEp->schema.nCols = 0;
  pTopicEp->schema.pSchema = NULL;

  char    vgKey[TSDB_TOPIC_FNAME_LEN + 22];
  int32_t vgNumGet = taosArrayGetSize(pTopicEp->vgs);

  tstrncpy(pTopic->topicName, pTopicEp->topic, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pTopic->db, pTopicEp->db, TSDB_DB_FNAME_LEN);

  tscDebug("consumer:0x%" PRIx64 ", update topic:%s, numOfVgs:%d", tmq->consumerId, pTopic->topicName, vgNumGet);
  pTopic->vgs = taosArrayInit(vgNumGet, sizeof(SMqClientVg));
  if (pTopic->vgs == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to update topic:%s since out of memory", tmq->consumerId,
             pTopic->topicName);
    return;
  }

  for (int32_t j = 0; j < vgNumGet; j++) {
    SMqSubVgEp* pVgEp = taosArrayGet(pTopicEp->vgs, j);

    makeTopicVgroupKey(vgKey, pTopic->topicName, pVgEp->vgId);
    SVgroupSaveInfo* pInfo = taosHashGet(pVgOffsetHashMap, vgKey, strlen(vgKey));

    int64_t      numOfRows = 0;
    STqOffsetVal offsetNew = {.type = tmq->resetOffsetCfg};
    if (pInfo != NULL) {
      // this vgroup was already being consumed: continue where it stopped
      offsetNew = pInfo->offset;
      numOfRows = pInfo->numOfRows;
    }

    SMqClientVg clientVg = {
        .pollCnt = 0,
        .currentOffset = offsetNew,
        .vgId = pVgEp->vgId,
        .epSet = pVgEp->epSet,
        .vgStatus = TMQ_VG_STATUS__IDLE,
        .vgSkipCnt = 0,
        .emptyBlockReceiveTs = 0,
        .numOfRows = numOfRows,
    };

    taosArrayPush(pTopic->vgs, &clientVg);
  }
}

static void freeClientVgInfo(void* param) {
  SMqClientTopic* pTopic = param;
  if (pTopic->schema.nCols) {
    taosMemoryFreeClear(pTopic->schema.pSchema);
  }

  taosArrayDestroy(pTopic->vgs);
}

1420
// Replaces the consumer's topic/vgroup layout with the one from an ask-ep response.
// Offsets and row counts of the vgroups currently held are remembered in a temporary hash map
// keyed by topic+vgId and carried over to the matching vgroups of the new layout. Afterwards
// the status becomes NO_TOPIC (empty response) or READY, and the epoch is updated.
// Always returns false.
static bool doUpdateLocalEp(tmq_t* tmq, int32_t epoch, const SMqAskEpRsp* pRsp) {
  const int32_t numOfOldTopics = taosArrayGetSize(tmq->clientTopics);
  const int32_t numOfNewTopics = taosArrayGetSize(pRsp->topics);

  char vgKey[TSDB_TOPIC_FNAME_LEN + 22];
  tscDebug("consumer:0x%" PRIx64 " update ep epoch from %d to epoch %d, incoming topics:%d, existed topics:%d",
           tmq->consumerId, tmq->epoch, epoch, numOfNewTopics, numOfOldTopics);

  SArray* pNewTopics = taosArrayInit(numOfNewTopics, sizeof(SMqClientTopic));
  if (pNewTopics == NULL) {
    return false;
  }

  SHashObj* pSavedVgInfo = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
  if (pSavedVgInfo == NULL) {
    taosArrayDestroy(pNewTopics);
    return false;
  }

  // step 1: remember offset and row count of every vgroup that is currently consumed
  for (int32_t t = 0; t < numOfOldTopics; t++) {
    SMqClientTopic* pOldTopic = taosArrayGet(tmq->clientTopics, t);
    if (pOldTopic->vgs == NULL) {
      continue;
    }

    int32_t numOfVgs = taosArrayGetSize(pOldTopic->vgs);
    tscDebug("consumer:0x%" PRIx64 ", new vg num: %d", tmq->consumerId, numOfVgs);

    for (int32_t v = 0; v < numOfVgs; v++) {
      SMqClientVg* pOldVg = taosArrayGet(pOldTopic->vgs, v);
      makeTopicVgroupKey(vgKey, pOldTopic->topicName, pOldVg->vgId);

      char offsetStr[80];
      tFormatOffset(offsetStr, 80, &pOldVg->currentOffset);
      tscDebug("consumer:0x%" PRIx64 ", epoch:%d vgId:%d vgKey:%s, offset:%s", tmq->consumerId, epoch,
               pOldVg->vgId, vgKey, offsetStr);

      SVgroupSaveInfo saved = {.offset = pOldVg->currentOffset, .numOfRows = pOldVg->numOfRows};
      taosHashPut(pSavedVgInfo, vgKey, strlen(vgKey), &saved, sizeof(SVgroupSaveInfo));
    }
  }

  // step 2: build the new layout, restoring the remembered state where the key matches
  for (int32_t t = 0; t < numOfNewTopics; t++) {
    SMqClientTopic newTopic = {0};
    SMqSubTopicEp* pEp = taosArrayGet(pRsp->topics, t);

    initClientTopicFromRsp(&newTopic, pEp, pSavedVgInfo, tmq);
    taosArrayPush(pNewTopics, &newTopic);
  }

  taosHashCleanup(pSavedVgInfo);

  // step 3: drop the old layout and publish the new one
  if (tmq->clientTopics != NULL) {
    taosArrayDestroyEx(tmq->clientTopics, freeClientVgInfo);
  }
  tmq->clientTopics = pNewTopics;

  int8_t newStatus;
  if (numOfNewTopics == 0) {
    newStatus = TMQ_CONSUMER_STATUS__NO_TOPIC;
  } else {
    newStatus = TMQ_CONSUMER_STATUS__READY;
  }
  atomic_store_8(&tmq->status, newStatus);
  atomic_store_32(&tmq->epoch, epoch);

  tscDebug("consumer:0x%" PRIx64 " update topic info completed", tmq->consumerId);
  return false;
}

1486
// Response callback of an ask-ep request. `param` is an SMqAskEpCbParam that is freed here,
// together with the response buffers in `pMsg`.
//  - consumer already closed: the user function is invoked with a NULL consumer and
//    TSDB_CODE_TMQ_CONSUMER_CLOSED, which is also returned.
//  - request failed: the user function is invoked with `code` and no message.
//  - response epoch not newer than the local one: nothing to update; only a consumer in
//    RECOVER status is switched to NO_TOPIC / READY depending on the topics in the response.
//  - newer epoch: the user function receives the message to update the local endpoints.
// Returns `code` in the last three cases.
int32_t askEpCallbackFn(void* param, SDataBuf* pMsg, int32_t code) {
  SMqAskEpCbParam* pCbParam = (SMqAskEpCbParam*)param;

  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, pCbParam->refId);
  if (tmq == NULL) {
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    pCbParam->pUserFn(tmq, terrno, NULL, pCbParam->pParam);

    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    taosMemoryFree(pCbParam);
    return terrno;
  }

  if (code != TSDB_CODE_SUCCESS) {
    tscError("consumer:0x%" PRIx64 ", get topic endpoint error, code:%s", tmq->consumerId, tstrerror(code));
    pCbParam->pUserFn(tmq, code, NULL, pCbParam->pParam);
  } else {
    // tmq's epoch increases monotonically, so a message from an older (or the same) epoch can
    // safely be discarded; the epoch only advances when a newer ep message is received
    SMqRspHead* pHead = pMsg->pData;
    int32_t     localEpoch = atomic_load_32(&tmq->epoch);

    if (pHead->epoch > localEpoch) {
      tscDebug("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, update local ep", tmq->consumerId,
               pHead->epoch, localEpoch);
      pCbParam->pUserFn(tmq, code, pMsg, pCbParam->pParam);
    } else {
      tscDebug("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, no need to update local ep",
               tmq->consumerId, pHead->epoch, localEpoch);

      if (tmq->status == TMQ_CONSUMER_STATUS__RECOVER) {
        SMqAskEpRsp epRsp;
        tDecodeSMqAskEpRsp(POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), &epRsp);

        int8_t newStatus = TMQ_CONSUMER_STATUS__READY;
        if (taosArrayGetSize(epRsp.topics) == 0) {
          newStatus = TMQ_CONSUMER_STATUS__NO_TOPIC;
        }
        atomic_store_8(&tmq->status, newStatus);

        tDeleteSMqAskEpRsp(&epRsp);
      }
    }
  }

  // common tail of the failure and success paths
  taosReleaseRef(tmqMgmt.rsetId, pCbParam->refId);

  taosMemoryFree(pMsg->pData);
  taosMemoryFree(pMsg->pEpSet);
  taosMemoryFree(pCbParam);
  return code;
}

L
Liu Jicong 已提交
1543
// Fills a poll request for one vgroup of one topic.
// subKey is "<groupId><TMQ_SEPARATOR><topicName>"; the remaining fields are copied from the
// consumer, the vgroup and `timeout`, and a fresh request id is generated.
void tmqBuildConsumeReqImpl(SMqPollReq* pReq, tmq_t* tmq, int64_t timeout, SMqClientTopic* pTopic, SMqClientVg* pVg) {
  // subscription key: group id, separator, topic name
  char*   pKey = pReq->subKey;
  int32_t cgroupLen = strlen(tmq->groupId);

  memcpy(pKey, tmq->groupId, cgroupLen);
  pKey[cgroupLen] = TMQ_SEPARATOR;
  strcpy(&pKey[cgroupLen + 1], pTopic->topicName);

  // consumer level settings
  pReq->consumerId = tmq->consumerId;
  pReq->epoch = tmq->epoch;
  pReq->withTbName = tmq->withTbName;
  pReq->useSnapshot = tmq->useSnapshot;
  pReq->timeout = timeout;

  // vgroup level settings
  pReq->head.vgId = pVg->vgId;
  pReq->reqOffset = pVg->currentOffset;

  pReq->reqId = generateRequestId();
}

L
Liu Jicong 已提交
1560 1561
// Builds the user-visible meta result object from a poll response wrapper.
// Topic name, db name and vgId are copied; metaRsp is copied by value (memcpy), so any pointer
// inside it is shared with the wrapper rather than duplicated.
// Returns NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY if the object cannot be allocated.
SMqMetaRspObj* tmqBuildMetaRspFromWrapper(SMqPollRspWrapper* pWrapper) {
  SMqMetaRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqMetaRspObj));
  if (pRspObj == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ_META;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;

  memcpy(&pRspObj->metaRsp, &pWrapper->metaRsp, sizeof(SMqMetaRsp));
  return pRspObj;
}

1571
// Builds the user-visible data result object from a poll response wrapper.
// Topic name, db name and vgId are copied; dataRsp is copied by value (memcpy), so the block
// arrays inside it are shared with the wrapper rather than duplicated. When the response
// carries no schema, the topic's schema is installed in the result info.
// The rows of all blocks in the response are summed into *numOfRows and added to
// pVg->numOfRows.
// Returns NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY (and *numOfRows == 0) if the object
// cannot be allocated.
SMqRspObj* tmqBuildRspFromWrapper(SMqPollRspWrapper* pWrapper, SMqClientVg* pVg, int64_t* numOfRows) {
  (*numOfRows) = 0;

  SMqRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqRspObj));
  if (pRspObj == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ;

  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);

  pRspObj->vgId = pWrapper->vgHandle->vgId;
  pRspObj->resIter = -1;
  memcpy(&pRspObj->rsp, &pWrapper->dataRsp, sizeof(SMqDataRsp));

  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;

  if (!pWrapper->dataRsp.withSchema) {
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }

  // extract the rows in this data packet
  for (int32_t i = 0; i < pRspObj->rsp.blockNum; ++i) {
    SRetrieveTableRsp* pRetrieve = (SRetrieveTableRsp*)taosArrayGetP(pRspObj->rsp.blockData, i);
    int64_t            rows = htobe64(pRetrieve->numOfRows);
    pVg->numOfRows += rows;
    (*numOfRows) += rows;
  }

  return pRspObj;
}

L
Liu Jicong 已提交
1601 1602
// Builds the user-visible metadata+data result object from a poll response wrapper.
// Topic name, db name and vgId are copied; taosxRsp is copied by value (memcpy), so the arrays
// inside it are shared with the wrapper rather than duplicated. When the response carries no
// schema, the topic's schema is installed in the result info.
// Returns NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY if the object cannot be allocated.
SMqTaosxRspObj* tmqBuildTaosxRspFromWrapper(SMqPollRspWrapper* pWrapper) {
  SMqTaosxRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqTaosxRspObj));
  if (pRspObj == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ_METADATA;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;
  pRspObj->resIter = -1;
  memcpy(&pRspObj->rsp, &pWrapper->taosxRsp, sizeof(STaosxRsp));

  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;
  if (!pWrapper->taosxRsp.withSchema) {
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }

  return pRspObj;
}

1619 1620 1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651
// Common failure path used before a poll request has been sent: puts the
// vgroup back into the idle state, posts the consumer's response semaphore and
// reports failure (-1) to the caller.
static int32_t handleErrorBeforePoll(SMqClientVg* pVg, tmq_t* pTmq) {
  const int32_t failure = -1;

  atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
  tsem_post(&pTmq->rspSem);

  return failure;
}

// Serializes one poll request for the given topic/vgroup and sends it
// asynchronously to the vgroup's endpoint set; tmqPollCb is registered as the
// response callback.
//
// Returns TSDB_CODE_SUCCESS once the request has been handed to
// asyncSendMsgToServer. On any serialization or allocation failure the
// partially built buffers are released and the result of
// handleErrorBeforePoll() (-1) is returned.
static int32_t doTmqPollImpl(tmq_t* pTmq, SMqClientTopic* pTopic, SMqClientVg* pVg, int64_t timeout) {
  char*           pMsgBuf = NULL;
  SMqPollCbParam* pCbParam = NULL;
  SMsgSendInfo*   pSendInfo = NULL;
  int64_t         transporterId = 0;
  char            offsetFormatBuf[80];

  SMqPollReq pollReq = {0};
  tmqBuildConsumeReqImpl(&pollReq, pTmq, timeout, pTopic, pVg);

  // a call with a NULL buffer yields the size that is then allocated below
  int32_t bufLen = tSerializeSMqPollReq(NULL, 0, &pollReq);
  if (bufLen < 0) {
    goto _failed;
  }

  pMsgBuf = taosMemoryCalloc(1, bufLen);
  if (pMsgBuf == NULL) {
    goto _failed;
  }

  if (tSerializeSMqPollReq(pMsgBuf, bufLen, &pollReq) < 0) {
    goto _failed;
  }

  pCbParam = taosMemoryMalloc(sizeof(SMqPollCbParam));
  if (pCbParam == NULL) {
    goto _failed;
  }

  pCbParam->refId = pTmq->refId;
  pCbParam->epoch = pTmq->epoch;
  pCbParam->pVg = pVg;  // pVg may be released,fix it
  pCbParam->pTopic = pTopic;
  pCbParam->vgId = pVg->vgId;
  pCbParam->requestId = pollReq.reqId;

  pSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (pSendInfo == NULL) {
    goto _failed;
  }

  pSendInfo->msgInfo = (SDataBuf){
      .pData = pMsgBuf,
      .len = bufLen,
      .handle = NULL,
  };
  pSendInfo->requestId = pollReq.reqId;
  pSendInfo->requestObjRefId = 0;
  pSendInfo->param = pCbParam;
  pSendInfo->fp = tmqPollCb;
  pSendInfo->msgType = TDMT_VND_TMQ_CONSUME;

  tFormatOffset(offsetFormatBuf, tListLen(offsetFormatBuf), &pVg->currentOffset);
  tscDebug("consumer:0x%" PRIx64 " send poll to %s vgId:%d, epoch %d, req:%s, reqId:0x%" PRIx64,
           pTmq->consumerId, pTopic->topicName, pVg->vgId, pTmq->epoch, offsetFormatBuf, pollReq.reqId);
  asyncSendMsgToServer(pTmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, pSendInfo);

  pVg->pollCnt++;
  pTmq->pollCnt++;
  return TSDB_CODE_SUCCESS;

_failed:
  // release whatever was built so far, in the same order as before
  if (pCbParam != NULL) {
    taosMemoryFree(pCbParam);
  }
  if (pMsgBuf != NULL) {
    taosMemoryFree(pMsgBuf);
  }
  return handleErrorBeforePoll(pVg, pTmq);
}

1690
// broadcast the poll request to all related vnodes
H
Haojun Liao 已提交
1691
static int32_t tmqPollImpl(tmq_t* tmq, int64_t timeout) {
1692
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
X
Xiaoyu Wang 已提交
1693
  tscDebug("consumer:0x%" PRIx64 " start to poll data, numOfTopics:%d", tmq->consumerId, numOfTopics);
1694 1695

  for (int i = 0; i < numOfTopics; i++) {
X
Xiaoyu Wang 已提交
1696
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
X
Xiaoyu Wang 已提交
1697
    int32_t         numOfVg = taosArrayGetSize(pTopic->vgs);
1698 1699

    for (int j = 0; j < numOfVg; j++) {
X
Xiaoyu Wang 已提交
1700
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);
1701
      if (taosGetTimestampMs() - pVg->emptyBlockReceiveTs < EMPTY_BLOCK_POLL_IDLE_DURATION) { // less than 100ms
1702
        tscTrace("consumer:0x%" PRIx64 " epoch %d, vgId:%d idle for 10ms before start next poll", tmq->consumerId, tmq->epoch,
H
Haojun Liao 已提交
1703
                 pVg->vgId);
H
Haojun Liao 已提交
1704 1705 1706
        continue;
      }

1707
      int32_t vgStatus = atomic_val_compare_exchange_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE, TMQ_VG_STATUS__WAIT);
1708
      if (vgStatus == TMQ_VG_STATUS__WAIT) {
L
Liu Jicong 已提交
1709
        int32_t vgSkipCnt = atomic_add_fetch_32(&pVg->vgSkipCnt, 1);
H
Haojun Liao 已提交
1710
        tscTrace("consumer:0x%" PRIx64 " epoch %d wait poll-rsp, skip vgId:%d skip cnt %d", tmq->consumerId, tmq->epoch,
X
Xiaoyu Wang 已提交
1711
                 pVg->vgId, vgSkipCnt);
X
Xiaoyu Wang 已提交
1712
        continue;
L
temp  
Liu Jicong 已提交
1713 1714 1715 1716
#if 0
        if (skipCnt < 30000) {
          continue;
        } else {
1717
        tscDebug("consumer:0x%" PRIx64 ",skip vgId:%d skip too much reset", tmq->consumerId, pVg->vgId);
L
temp  
Liu Jicong 已提交
1718 1719
        }
#endif
X
Xiaoyu Wang 已提交
1720
      }
1721

L
Liu Jicong 已提交
1722
      atomic_store_32(&pVg->vgSkipCnt, 0);
1723 1724 1725
      int32_t code = doTmqPollImpl(tmq, pTopic, pVg, timeout);
      if (code != TSDB_CODE_SUCCESS) {
        return code;
D
dapan1121 已提交
1726
      }
X
Xiaoyu Wang 已提交
1727 1728
    }
  }
1729

1730
  tscDebug("consumer:0x%" PRIx64 " end to poll data", tmq->consumerId);
X
Xiaoyu Wang 已提交
1731 1732 1733
  return 0;
}

H
Haojun Liao 已提交
1734
// Handles a queued response that is not a poll response.
//
// Only TMQ_MSG_TYPE__EP_RSP is understood; any other type yields -1 and leaves
// *pReset untouched. For an endpoint response:
//   - if its epoch is newer than the consumer's, the local endpoint info is
//     updated from it, the decoded message is deleted and *pReset becomes true;
//   - otherwise the wrapper's payload is freed and *pReset becomes false.
// Returns 0 in both endpoint cases.
static int32_t tmqHandleNoPollRsp(tmq_t* tmq, SMqRspWrapper* rspWrapper, bool* pReset) {
  if (rspWrapper->tmqRspType != TMQ_MSG_TYPE__EP_RSP) {
    return -1;
  }

  if (rspWrapper->epoch <= atomic_load_32(&tmq->epoch)) {
    // stale or duplicate endpoint info
    tmqFreeRspWrapper(rspWrapper);
    *pReset = false;
    return 0;
  }

  SMqAskEpRsp* pEpMsg = &((SMqAskEpRspWrapper*)rspWrapper)->msg;
  doUpdateLocalEp(tmq, rspWrapper->epoch, pEpMsg);
  tDeleteSMqAskEpRsp(pEpMsg);
  *pReset = true;
  return 0;
}

H
Haojun Liao 已提交
1754
// Consumes queued responses until one can be returned to the user.
//
// Items are taken from tmq->qall; when that is empty it is refilled once from
// tmq->mqueue. Each item is dispatched on its tmqRspType:
//   - END_RSP:       terrno is set to TSDB_CODE_TQ_NO_COMMITTED_OFFSET and NULL
//                    is returned.
//   - POLL_RSP:      if the epoch matches, the vgroup's epset/offset are
//                    updated and the vgroup becomes idle; a non-empty response
//                    is converted with tmqBuildRspFromWrapper and returned.
//   - POLL_META_RSP: if the epoch matches, a meta result object is returned.
//   - TAOSX_RSP:     like POLL_RSP, and additionally records/clears the
//                    vgroup's emptyBlockReceiveTs; the result is built as a
//                    plain data object when createTableNum == 0, otherwise as
//                    a taosx object.
//   - anything else: forwarded to tmqHandleNoPollRsp; when it reports a reset
//                    and pollIfReset is true, a new poll round is started with
//                    `timeout`.
// Responses whose epoch differs from the consumer's current epoch are dropped.
//
// Returns the result object (to be handed out as TAOS_RES*), or NULL when no
// more items are queued or an END_RSP was seen.
static void* tmqHandleAllRsp(tmq_t* tmq, int64_t timeout, bool pollIfReset) {
  tscDebug("consumer:0x%" PRIx64 " start to handle the rsp, total:%d", tmq->consumerId, tmq->qall->numOfItems);

  while (1) {
    SMqRspWrapper* pRspWrapper = NULL;
    taosGetQitem(tmq->qall, (void**)&pRspWrapper);

    if (pRspWrapper == NULL) {
      // qall is empty: refill it from mqueue and try once more
      taosReadAllQitems(tmq->mqueue, tmq->qall);
      taosGetQitem(tmq->qall, (void**)&pRspWrapper);
      if (pRspWrapper == NULL) {
        return NULL;
      }
    }

    tscDebug("consumer:0x%"PRIx64" handle rsp, type:%d", tmq->consumerId, pRspWrapper->tmqRspType);

    if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__END_RSP) {
      taosFreeQitem(pRspWrapper);
      terrno = TSDB_CODE_TQ_NO_COMMITTED_OFFSET;
      tscError("consumer:0x%" PRIx64 " unexpected rsp from poll, code:%s", tmq->consumerId, tstrerror(terrno));
      return NULL;
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;

      int32_t     consumerEpoch = atomic_load_32(&tmq->epoch);
      SMqDataRsp* pDataRsp = &pollRspWrapper->dataRsp;

      if (pDataRsp->head.epoch == consumerEpoch) {
        SMqClientVg* pVg = pollRspWrapper->vgHandle;

        // update the epset
        if (pollRspWrapper->pEpset != NULL) {
          SEp* pEp = GET_ACTIVE_EP(pollRspWrapper->pEpset);
          SEp* pOld = GET_ACTIVE_EP(&(pVg->epSet));
          tscDebug("consumer:0x%" PRIx64 " update epset vgId:%d, ep:%s:%d, old ep:%s:%d", tmq->consumerId,
                   pVg->vgId, pEp->fqdn, pEp->port, pOld->fqdn, pOld->port);
          pVg->epSet = *pollRspWrapper->pEpset;
        }

        // update the local offset value only for the returned values.
        pVg->currentOffset = pDataRsp->rspOffset;
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);

        char buf[80];
        tFormatOffset(buf, tListLen(buf), &pDataRsp->rspOffset);
        if (pDataRsp->blockNum == 0) {
          tscDebug("consumer:0x%" PRIx64 " empty block received, vgId:%d, offset:%s, vg total:%"PRId64" total:%"PRId64" reqId:0x%" PRIx64, tmq->consumerId,
                   pVg->vgId, buf, pVg->numOfRows, tmq->totalRows, pollRspWrapper->reqId);
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
          taosFreeQitem(pollRspWrapper);
        } else {  // build rsp
          int64_t    numOfRows = 0;
          SMqRspObj* pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
          tmq->totalRows += numOfRows;

          tscDebug("consumer:0x%" PRIx64 " process poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
                   " vg total:%" PRId64 " total:%" PRId64 ", reqId:0x%" PRIx64,
                   tmq->consumerId, pVg->vgId, buf, pDataRsp->blockNum, numOfRows, pVg->numOfRows, tmq->totalRows,
                   pollRspWrapper->reqId);
          taosFreeQitem(pollRspWrapper);
          return pRsp;
        }
      } else {
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgId, pDataRsp->head.epoch, consumerEpoch);
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
        taosFreeQitem(pollRspWrapper);
      }
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_META_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
      int32_t            consumerEpoch = atomic_load_32(&tmq->epoch);

      tscDebug("consumer:0x%" PRIx64 " process meta rsp", tmq->consumerId);

      if (pollRspWrapper->metaRsp.head.epoch == consumerEpoch) {
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
        pVg->currentOffset = pollRspWrapper->metaRsp.rspOffset;
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
        // build rsp
        SMqMetaRspObj* pRsp = tmqBuildMetaRspFromWrapper(pollRspWrapper);
        taosFreeQitem(pollRspWrapper);
        return pRsp;
      } else {
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgId, pollRspWrapper->metaRsp.head.epoch, consumerEpoch);
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
        taosFreeQitem(pollRspWrapper);
      }
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__TAOSX_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
      int32_t            consumerEpoch = atomic_load_32(&tmq->epoch);

      if (pollRspWrapper->taosxRsp.head.epoch == consumerEpoch) {
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
        pVg->currentOffset = pollRspWrapper->taosxRsp.rspOffset;
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);

        if (pollRspWrapper->taosxRsp.blockNum == 0) {
          tscDebug("consumer:0x%" PRIx64 " taosx empty block received, vgId:%d, vg total:%" PRId64 " reqId:0x%" PRIx64,
                   tmq->consumerId, pVg->vgId, pVg->numOfRows, pollRspWrapper->reqId);
          // remembered so that tmqPollImpl can idle this vgroup for a moment
          pVg->emptyBlockReceiveTs = taosGetTimestampMs();
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
          taosFreeQitem(pollRspWrapper);
          continue;
        } else {
          pVg->emptyBlockReceiveTs = 0;  // reset the ts
        }

        // build rsp
        void*   pRsp = NULL;
        int64_t numOfRows = 0;
        if (pollRspWrapper->taosxRsp.createTableNum == 0) {
          pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
        } else {
          pRsp = tmqBuildTaosxRspFromWrapper(pollRspWrapper);
        }

        tmq->totalRows += numOfRows;

        char buf[80];
        tFormatOffset(buf, tListLen(buf), &pVg->currentOffset);
        // report the block count of the taosx payload this branch is handling
        tscDebug("consumer:0x%" PRIx64 " process taosx poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
                 ", vg total:%" PRId64 " total:%"PRId64" reqId:0x%" PRIx64,
                 tmq->consumerId, pVg->vgId, buf, pollRspWrapper->taosxRsp.blockNum, numOfRows, pVg->numOfRows,
                 tmq->totalRows, pollRspWrapper->reqId);

        taosFreeQitem(pollRspWrapper);
        return pRsp;
      } else {
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgId, pollRspWrapper->taosxRsp.head.epoch, consumerEpoch);
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
        taosFreeQitem(pollRspWrapper);
      }
    } else {
      tscDebug("consumer:0x%" PRIx64 " not data msg received", tmq->consumerId);

      bool reset = false;
      tmqHandleNoPollRsp(tmq, pRspWrapper, &reset);
      taosFreeQitem(pRspWrapper);
      if (pollIfReset && reset) {
        tscDebug("consumer:0x%" PRIx64 ", reset and repoll", tmq->consumerId);
        tmqPollImpl(tmq, timeout);
      }
    }
  }
}

1904
// Polls the subscribed topics for the next result.
//
// - In the INIT state the call sleeps 500ms and returns NULL.
// - While the consumer is in the RECOVER state, endpoint info is requested via
//   doAskEp(); as long as the answer is "consumer not ready" the request is
//   repeated every 500ms, and NULL is returned once the retry budget (40) is
//   exceeded.
// - Afterwards each round runs the delayed tasks, sends poll requests and
//   handles queued responses. The first result object is returned. NULL is
//   returned when terrno is TSDB_CODE_TQ_NO_COMMITTED_OFFSET, or when a
//   non-negative `timeout` (ms) has elapsed. Between rounds the call waits on
//   the response semaphore: for the remaining time, or for 1000ms per round
//   when `timeout` is negative.
TAOS_RES* tmq_consumer_poll(tmq_t* tmq, int64_t timeout) {
  int64_t startTime = taosGetTimestampMs();

  tscDebug("consumer:0x%" PRIx64 " start to poll at %"PRId64", timeout:%" PRId64, tmq->consumerId, startTime, timeout);

  // in no topic status, delayed task also need to be processed
  if (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__INIT) {
    tscDebug("consumer:0x%" PRIx64 " poll return since consumer is init", tmq->consumerId);
    taosMsleep(500);  //     sleep for a while
    return NULL;
  }

  while (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__RECOVER) {
    for (int32_t retryCnt = 0; TSDB_CODE_MND_CONSUMER_NOT_READY == doAskEp(tmq);) {
      if (retryCnt > 40) {
        return NULL;
      }
      ++retryCnt;

      tscDebug("consumer:0x%" PRIx64 " not ready, retry:%d/40 in 500ms", tmq->consumerId, retryCnt);
      taosMsleep(500);
    }
  }

  for (;;) {
    tmqHandleAllDelayedTask(tmq);

    // a failed poll round is only logged; queued responses are still handled
    if (tmqPollImpl(tmq, timeout) < 0) {
      tscDebug("consumer:0x%" PRIx64 " return due to poll error", tmq->consumerId);
    }

    void* rspObj = tmqHandleAllRsp(tmq, timeout, false);
    if (rspObj != NULL) {
      tscDebug("consumer:0x%" PRIx64 " return rsp %p", tmq->consumerId, rspObj);
      return (TAOS_RES*)rspObj;
    }

    if (terrno == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
      tscDebug("consumer:0x%" PRIx64 " return null since no committed offset", tmq->consumerId);
      return NULL;
    }

    if (timeout < 0) {
      // use tsem_timewait instead of tsem_wait to avoid unexpected stuck
      tsem_timewait(&tmq->rspSem, 1000);
      continue;
    }

    int64_t currentTime = taosGetTimestampMs();
    int64_t elapsedTime = currentTime - startTime;
    if (elapsedTime > timeout) {
      tscDebug("consumer:0x%" PRIx64 " (epoch %d) timeout, no rsp, start time %" PRId64 ", current time %" PRId64,
               tmq->consumerId, tmq->epoch, startTime, currentTime);
      return NULL;
    }

    tsem_timewait(&tmq->rspSem, (timeout - elapsedTime));
  }
}

1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983
// Writes the consumer's statistics to the debug log: the overall poll count,
// row count, topic count and epoch, followed by the row count of every vgroup
// of every topic.
static void displayConsumeStatistics(const tmq_t* pTmq) {
  int32_t topicCnt = taosArrayGetSize(pTmq->clientTopics);
  tscDebug("consumer:0x%" PRIx64 " closing poll:%" PRId64 " rows:%" PRId64 " topics:%d, final epoch:%d",
           pTmq->consumerId, pTmq->pollCnt, pTmq->totalRows, topicCnt, pTmq->epoch);

  tscDebug("consumer:0x%" PRIx64 " rows dist begin: ", pTmq->consumerId);

  for (int32_t topicIdx = 0; topicIdx < topicCnt; ++topicIdx) {
    SMqClientTopic* pTopic = taosArrayGet(pTmq->clientTopics, topicIdx);
    tscDebug("consumer:0x%" PRIx64 " topic:%d", pTmq->consumerId, topicIdx);

    int32_t vgCnt = taosArrayGetSize(pTopic->vgs);
    for (int32_t vgIdx = 0; vgIdx < vgCnt; ++vgIdx) {
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, vgIdx);
      tscDebug("topic:%s, %d. vgId:%d rows:%" PRId64, pTopic->topicName, vgIdx, pVg->vgId, pVg->numOfRows);
    }
  }

  tscDebug("consumer:0x%" PRIx64 " rows dist end", pTmq->consumerId);
}
1989

1990 1991 1992
// Closes the consumer.
//
// Statistics are logged first. If the consumer is in the READY state:
//   - with auto commit enabled, all offsets are committed synchronously; a
//     commit failure is returned immediately and the consumer is NOT released;
//   - an empty topic list is then subscribed; while the answer is "consumer
//     not ready" the call is repeated every 500ms for a limited number of
//     attempts.
// In any other state only a warning is logged. Finally the consumer's
// reference is removed from the tmq reference set and 0 is returned.
int32_t tmq_consumer_close(tmq_t* tmq) {
  tscDebug("consumer:0x%" PRIx64" start to close consumer, status:%d", tmq->consumerId, tmq->status);
  displayConsumeStatistics(tmq);

  if (tmq->status != TMQ_CONSUMER_STATUS__READY) {
    tscWarn("consumer:0x%" PRIx64" not in ready state, close it directly", tmq->consumerId);
  } else {
    // if auto commit is set, commit before close consumer. Otherwise, do nothing.
    if (tmq->autoCommit) {
      int32_t commitCode = tmq_commit_sync(tmq, NULL);
      if (commitCode != 0) {
        return commitCode;
      }
    }

    // subscribing an empty list drops all current subscriptions
    tmq_list_t* emptyList = tmq_list_new();
    for (int32_t retryCnt = 0;; ++retryCnt) {
      int32_t subCode = tmq_subscribe(tmq, emptyList);
      if (subCode != TSDB_CODE_MND_CONSUMER_NOT_READY || retryCnt > 5) {
        break;
      }
      taosMsleep(500);
    }
    tmq_list_destroy(emptyList);
  }

  taosRemoveRef(tmqMgmt.rsetId, tmq->refId);
  return 0;
}
L
Liu Jicong 已提交
2023

L
Liu Jicong 已提交
2024 2025
// Maps a tmq error code to a message: 0 is "success", -1 is "fail", and every
// other value is translated by tstrerror().
const char* tmq_err2str(int32_t err) {
  switch (err) {
    case 0:
      return "success";
    case -1:
      return "fail";
    default:
      return tstrerror(err);
  }
}
L
Liu Jicong 已提交
2033

L
Liu Jicong 已提交
2034 2035 2036 2037 2038
// Classifies a result handle as data, table meta or metadata; anything else
// is reported as TMQ_RES_INVALID.
tmq_res_t tmq_get_res_type(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    return TMQ_RES_DATA;
  }

  if (TD_RES_TMQ_META(res)) {
    return TMQ_RES_TABLE_META;
  }

  if (TD_RES_TMQ_METADATA(res)) {
    return TMQ_RES_METADATA;
  }

  return TMQ_RES_INVALID;
}

L
Liu Jicong 已提交
2046
// Returns the part of `fullName` that follows its first '.', or `fullName`
// itself when it contains no '.'. The previous code evaluated
// `strchr(...) + 1` unconditionally, which is undefined when strchr returns
// NULL.
static const char* tmqStripNamePrefix(const char* fullName) {
  const char* dot = strchr(fullName, '.');
  return (dot != NULL) ? dot + 1 : fullName;
}

// Returns the topic name of a tmq result with everything up to and including
// the first '.' removed, or NULL when `res` is not a tmq result. The returned
// pointer refers into the result object.
const char* tmq_get_topic_name(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
    return tmqStripNamePrefix(pRspObj->topic);
  } else if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)res;
    return tmqStripNamePrefix(pMetaRspObj->topic);
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    return tmqStripNamePrefix(pRspObj->topic);
  } else {
    return NULL;
  }
}

// Returns the database name of a tmq result with everything up to and
// including the first '.' removed, or NULL when `res` is not a tmq result. The
// returned pointer refers into the result object.
const char* tmq_get_db_name(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
    return tmqStripNamePrefix(pRspObj->db);
  } else if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)res;
    return tmqStripNamePrefix(pMetaRspObj->db);
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    return tmqStripNamePrefix(pRspObj->db);
  } else {
    return NULL;
  }
}

L
Liu Jicong 已提交
2076 2077 2078 2079
// Returns the vgroup id stored in a tmq result (data, meta or metadata), or -1
// when `res` is none of these.
int32_t tmq_get_vgroup_id(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    return ((SMqRspObj*)res)->vgId;
  }

  if (TD_RES_TMQ_META(res)) {
    return ((SMqMetaRspObj*)res)->vgId;
  }

  if (TD_RES_TMQ_METADATA(res)) {
    return ((SMqTaosxRspObj*)res)->vgId;
  }

  return -1;
}
L
Liu Jicong 已提交
2090 2091 2092 2093 2094 2095 2096 2097

// Returns the table name of the block currently selected by resIter in a data
// or metadata result.
//
// NULL is returned when `res` is neither of those result kinds, when the
// response carries no table names, or when resIter is outside
// [0, blockNum).
const char* tmq_get_table_name(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pData = (SMqRspObj*)res;
    bool       hasName = pData->rsp.withTbName && pData->rsp.blockTbName != NULL && pData->resIter >= 0 &&
                   pData->resIter < pData->rsp.blockNum;
    if (hasName) {
      return (const char*)taosArrayGetP(pData->rsp.blockTbName, pData->resIter);
    }
    return NULL;
  }

  if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pTaosx = (SMqTaosxRspObj*)res;
    bool            hasName = pTaosx->rsp.withTbName && pTaosx->rsp.blockTbName != NULL && pTaosx->resIter >= 0 &&
                   pTaosx->resIter < pTaosx->rsp.blockNum;
    if (hasName) {
      return (const char*)taosArrayGetP(pTaosx->rsp.blockTbName, pTaosx->resIter);
    }
    return NULL;
  }

  return NULL;
}
2109

2110 2111 2112 2113 2114 2115
// Starts an asynchronous offset commit. With pRes == NULL all offsets of the
// consumer are committed; otherwise only the offset belonging to `pRes`.
// `cb` and `param` are passed through to the commit routines.
void tmq_commit_async(tmq_t* tmq, const TAOS_RES* pRes, tmq_commit_cb* cb, void* param) {
  if (pRes != NULL) {
    // only commit one offset
    asyncCommitOffset(tmq, pRes, cb, param);
    return;
  }

  // here needs to commit all offsets.
  asyncCommitAllOffsets(tmq, cb, param);
}

2118 2119 2120 2121 2122 2123 2124 2125 2126
// State shared between tmq_commit_sync() and its completion callback.
typedef struct SSyncCommitInfo {
  tsem_t  sem;   // posted by commitCallBackFn once the commit has finished
  int32_t code;  // commit result code stored by commitCallBackFn
} SSyncCommitInfo;

// Commit completion callback used by tmq_commit_sync(): stores the result code
// in the SSyncCommitInfo passed as `param` and posts its semaphore.
static void commitCallBackFn(tmq_t *pTmq, int32_t code, void* param) {
  SSyncCommitInfo* pSync = param;

  pSync->code = code;
  tsem_post(&pSync->sem);
}
2128

2129 2130 2131 2132 2133 2134 2135 2136 2137
// Commits offsets and blocks until the commit has completed.
//
// With pRes == NULL all offsets of the consumer are committed; otherwise only
// the offset belonging to `pRes`. The work is delegated to the asynchronous
// commit routines with commitCallBackFn as callback, and the call waits on a
// semaphore until that callback has run.
//
// Returns the code reported by the callback, or TSDB_CODE_OUT_OF_MEMORY when
// the wait context cannot be allocated (no commit is attempted then).
int32_t tmq_commit_sync(tmq_t* tmq, const TAOS_RES* pRes) {
  SSyncCommitInfo* pInfo = taosMemoryMalloc(sizeof(SSyncCommitInfo));
  if (pInfo == NULL) {
    // previously the NULL pointer was passed straight to tsem_init
    tscError("consumer:0x%" PRIx64 " failed to allocate sync commit info", tmq->consumerId);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  tsem_init(&pInfo->sem, 0, 0);
  pInfo->code = 0;

  if (pRes == NULL) {
    asyncCommitAllOffsets(tmq, commitCallBackFn, pInfo);
  } else {
    asyncCommitOffset(tmq, pRes, commitCallBackFn, pInfo);
  }

  // commitCallBackFn stores the result and posts the semaphore
  tsem_wait(&pInfo->sem);
  int32_t code = pInfo->code;

  tsem_destroy(&pInfo->sem);
  taosMemoryFree(pInfo);

  tscDebug("consumer:0x%"PRIx64" sync commit done, code:%s", tmq->consumerId, tstrerror(code));
  return code;
}

// Ask-ep callback used by doAskEp(): records `code` in the SAskEpInfo passed as
// `param`; on success the response body (located right after the SMqRspHead in
// pDataBuf->pData) is decoded and applied to the consumer's local endpoint
// info. The semaphore in SAskEpInfo is posted in every case.
void updateEpCallbackFn(tmq_t* pTmq, int32_t code, SDataBuf* pDataBuf, void* param) {
  SAskEpInfo* pAskInfo = param;
  pAskInfo->code = code;

  if (code != TSDB_CODE_SUCCESS) {
    tsem_post(&pAskInfo->sem);
    return;
  }

  SMqRspHead* pHead = pDataBuf->pData;

  SMqAskEpRsp epRsp;
  tDecodeSMqAskEpRsp(POINTER_SHIFT(pDataBuf->pData, sizeof(SMqRspHead)), &epRsp);
  doUpdateLocalEp(pTmq, pHead->epoch, &epRsp);
  tDeleteSMqAskEpRsp(&epRsp);

  tsem_post(&pAskInfo->sem);
}

// Ask-ep callback that hands the response over to the consumer's message
// queue instead of applying it directly.
//
// On a non-success `code`, terrno is set to it and nothing is queued. Otherwise
// a queue item of type TMQ_MSG_TYPE__EP_RSP is allocated (terrno becomes
// TSDB_CODE_OUT_OF_MEMORY if that fails), filled from the response head and the
// decoded body, and written to pTmq->mqueue. `param` is not used.
void addToQueueCallbackFn(tmq_t* pTmq, int32_t code, SDataBuf* pDataBuf, void* param) {
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    return;
  }

  SMqAskEpRspWrapper* pEpItem = taosAllocateQitem(sizeof(SMqAskEpRspWrapper), DEF_QITEM, 0);
  if (pEpItem == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return;
  }

  SMqRspHead* pHead = pDataBuf->pData;
  pEpItem->epoch = pHead->epoch;
  pEpItem->tmqRspType = TMQ_MSG_TYPE__EP_RSP;

  // copy the head first, then decode the body that follows it
  memcpy(&pEpItem->msg, pDataBuf->pData, sizeof(SMqRspHead));
  tDecodeSMqAskEpRsp(POINTER_SHIFT(pDataBuf->pData, sizeof(SMqRspHead)), &pEpItem->msg);

  taosWriteQitem(pTmq->mqueue, pEpItem);
}

// Synchronously asks for the consumer's endpoint info.
//
// The request is issued through asyncAskEp() with updateEpCallbackFn as
// callback, and the call blocks on a semaphore until that callback has run.
//
// Returns the code stored by the callback, or TSDB_CODE_OUT_OF_MEMORY when the
// wait context cannot be allocated (no request is sent then).
int32_t doAskEp(tmq_t* pTmq) {
  SAskEpInfo* pInfo = taosMemoryMalloc(sizeof(SAskEpInfo));
  if (pInfo == NULL) {
    // previously the NULL pointer was passed straight to tsem_init
    tscError("consumer:0x%" PRIx64 ", failed to malloc ask ep info", pTmq->consumerId);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  tsem_init(&pInfo->sem, 0, 0);

  asyncAskEp(pTmq, updateEpCallbackFn, pInfo);
  tsem_wait(&pInfo->sem);  // posted by updateEpCallbackFn

  int32_t code = pInfo->code;
  tsem_destroy(&pInfo->sem);
  taosMemoryFree(pInfo);
  return code;
}

// Sends an "ask endpoint" request for this consumer to the mnode without
// waiting for the answer.
//
// pTmq    - consumer whose id, epoch and group id go into the request
// askEpFn - user callback; stored in the callback parameter for the response
//           handler (askEpCallbackFn), and invoked directly from here with a
//           NULL data buffer when the request cannot be built
// param   - opaque pointer passed through to askEpFn
//
// Failure codes reported through askEpFn from this function are
// TSDB_CODE_INVALID_PARA (serialization failed) and TSDB_CODE_OUT_OF_MEMORY.
void asyncAskEp(tmq_t* pTmq, __tmq_askep_fn_t askEpFn, void* param) {
  SMqAskEpReq req = {0};
  req.consumerId = pTmq->consumerId;
  req.epoch = pTmq->epoch;
  // bounded copy: never write past the fixed-size cgroup buffer
  tstrncpy(req.cgroup, pTmq->groupId, sizeof(req.cgroup));

  int32_t tlen = tSerializeSMqAskEpReq(NULL, 0, &req);
  if (tlen < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq failed", pTmq->consumerId);
    askEpFn(pTmq, TSDB_CODE_INVALID_PARA, NULL, param);
    return;
  }

  void* pReq = taosMemoryCalloc(1, tlen);
  if (pReq == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc askEpReq msg, size:%d", pTmq->consumerId, tlen);
    askEpFn(pTmq, TSDB_CODE_OUT_OF_MEMORY, NULL, param);
    return;
  }

  if (tSerializeSMqAskEpReq(pReq, tlen, &req) < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq %d failed", pTmq->consumerId, tlen);
    taosMemoryFree(pReq);

    askEpFn(pTmq, TSDB_CODE_INVALID_PARA, NULL, param);
    return;
  }

  SMqAskEpCbParam* pParam = taosMemoryCalloc(1, sizeof(SMqAskEpCbParam));
  if (pParam == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc subscribe param", pTmq->consumerId);
    taosMemoryFree(pReq);

    askEpFn(pTmq, TSDB_CODE_OUT_OF_MEMORY, NULL, param);
    return;
  }

  pParam->refId = pTmq->refId;
  pParam->epoch = pTmq->epoch;
  pParam->pUserFn = askEpFn;
  pParam->pParam = param;

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pParam);
    taosMemoryFree(pReq);
    askEpFn(pTmq, TSDB_CODE_OUT_OF_MEMORY, NULL, param);
    return;
  }

  sendInfo->msgInfo = (SDataBuf){ .pData = pReq, .len = tlen, .handle = NULL };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = pParam;
  sendInfo->fp = askEpCallbackFn;
  sendInfo->msgType = TDMT_MND_TMQ_ASK_EP;

  SEpSet epSet = getEpSet_s(&pTmq->pTscObj->pAppInfo->mgmtEp);
  tscDebug("consumer:0x%" PRIx64 " ask ep from mnode, reqId:0x%" PRIx64, pTmq->consumerId, sendInfo->requestId);

  int64_t transporterId = 0;
  asyncSendMsgToServer(pTmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);
}

// Writes the key "<topicName>:<vg>" into `dst` and returns the number of
// characters written (excluding the terminating NUL). `dst` must be large
// enough for the result; no bound is checked here.
int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg) {
  const int32_t keyLen = sprintf(dst, "%s:%d", topicName, vg);
  return keyLen;
}

// Finishes a commit: invokes the user callback stored in `pParamSet` with the
// commit code and frees `pParamSet`.
//
// The consumer is looked up by the refId stored in the parameter set. If it
// can no longer be acquired, `pParamSet` is freed without calling the callback,
// terrno is set to TSDB_CODE_TMQ_CONSUMER_CLOSED and -1 is returned. Otherwise
// the reference is released again after the callback and 0 is returned.
int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet) {
  const int64_t consumerRef = pParamSet->refId;

  tmq_t* pConsumer = taosAcquireRef(tmqMgmt.rsetId, consumerRef);
  if (pConsumer != NULL) {
    pParamSet->callbackFn(pConsumer, pParamSet->code, pParamSet->userParam);
    taosMemoryFree(pParamSet);

    taosReleaseRef(tmqMgmt.rsetId, consumerRef);
    return 0;
  }

  taosMemoryFree(pParamSet);
  terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
  return -1;
}

2290
// Accounts for one received commit response: atomically decrements the number
// of outstanding responses in `pParamSet` and, when it reaches zero, completes
// the commit via tmqCommitDone(). `consumerId`, `pTopic` and `vgId` are only
// used for logging.
void commitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId) {
  int32_t remaining = atomic_sub_fetch_32(&pParamSet->waitingRspNum, 1);
  if (remaining != 0) {
    tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d commit-rsp received, remain:%d", consumerId, pTopic, vgId,
             remaining);
    return;
  }

  tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d all commit-rsp received, commit completed", consumerId, pTopic,
           vgId);
  tmqCommitDone(pParamSet);
}