clientTmq.c 71.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "cJSON.h"
17 18 19
#include "clientInt.h"
#include "clientLog.h"
#include "parser.h"
H
Haojun Liao 已提交
20
#include "tdatablock.h"
21 22
#include "tdef.h"
#include "tglobal.h"
X
Xiaoyu Wang 已提交
23
#include "tqueue.h"
24
#include "tref.h"
L
Liu Jicong 已提交
25 26
#include "ttimer.h"

27
#define EMPTY_BLOCK_POLL_IDLE_DURATION  100
28
#define DEFAULT_AUTO_COMMIT_INTERVAL    5000
29

X
Xiaoyu Wang 已提交
30
struct SMqMgmt {
31 32 33
  int8_t  inited;
  tmr_h   timer;
  int32_t rsetId;
34
};
L
Liu Jicong 已提交
35

X
Xiaoyu Wang 已提交
36 37
static TdThreadOnce   tmqInit = PTHREAD_ONCE_INIT;  // initialize only once
volatile int32_t      tmqInitRes = 0;               // initialize rsp code
38
static struct SMqMgmt tmqMgmt = {0};
39

L
Liu Jicong 已提交
40 41 42 43 44 45
typedef struct {
  int8_t  tmqRspType;
  int32_t epoch;
} SMqRspWrapper;

typedef struct {
L
Liu Jicong 已提交
46 47 48
  int8_t      tmqRspType;
  int32_t     epoch;
  SMqAskEpRsp msg;
L
Liu Jicong 已提交
49 50
} SMqAskEpRspWrapper;

L
Liu Jicong 已提交
51
struct tmq_list_t {
L
Liu Jicong 已提交
52
  SArray container;
L
Liu Jicong 已提交
53
};
L
Liu Jicong 已提交
54

L
Liu Jicong 已提交
55
struct tmq_conf_t {
56 57 58 59 60 61 62 63
  char           clientId[256];
  char           groupId[TSDB_CGROUP_LEN];
  int8_t         autoCommit;
  int8_t         resetOffset;
  int8_t         withTbName;
  int8_t         snapEnable;
  int32_t        snapBatchSize;
  bool           hbBgEnable;
64 65 66 67 68
  uint16_t       port;
  int32_t        autoCommitInterval;
  char*          ip;
  char*          user;
  char*          pass;
69
  tmq_commit_cb* commitCb;
L
Liu Jicong 已提交
70
  void*          commitCbUserParam;
L
Liu Jicong 已提交
71 72 73
};

struct tmq_t {
74 75 76 77 78 79 80 81 82 83
  int64_t        refId;
  char           groupId[TSDB_CGROUP_LEN];
  char           clientId[256];
  int8_t         withTbName;
  int8_t         useSnapshot;
  int8_t         autoCommit;
  int32_t        autoCommitInterval;
  int32_t        resetOffsetCfg;
  uint64_t       consumerId;
  bool           hbBgEnable;
L
Liu Jicong 已提交
84 85
  tmq_commit_cb* commitCb;
  void*          commitCbUserParam;
L
Liu Jicong 已提交
86 87 88 89

  // status
  int8_t  status;
  int32_t epoch;
L
Liu Jicong 已提交
90 91
#if 0
  int8_t  epStatus;
L
Liu Jicong 已提交
92
  int32_t epSkipCnt;
L
Liu Jicong 已提交
93
#endif
94 95 96
  // poll info
  int64_t       pollCnt;
  int64_t       totalRows;
L
Liu Jicong 已提交
97

L
Liu Jicong 已提交
98
  // timer
99 100 101 102
  tmr_h         hbLiveTimer;
  tmr_h         epTimer;
  tmr_h         reportTimer;
  tmr_h         commitTimer;
H
Haojun Liao 已提交
103 104 105 106 107 108 109
  STscObj*      pTscObj;       // connection
  SArray*       clientTopics;  // SArray<SMqClientTopic>
  STaosQueue*   mqueue;        // queue of rsp
  STaosQall*    qall;
  STaosQueue*   delayedTask;   // delayed task queue for heartbeat and auto commit
  TdThreadMutex lock;          // used to protect the operation on each topic, when updating the epsets.
  tsem_t        rspSem;
L
Liu Jicong 已提交
110 111
};

X
Xiaoyu Wang 已提交
112 113 114 115 116 117 118 119
enum {
  TMQ_VG_STATUS__IDLE = 0,
  TMQ_VG_STATUS__WAIT,
};

enum {
  TMQ_CONSUMER_STATUS__INIT = 0,
  TMQ_CONSUMER_STATUS__READY,
120
  TMQ_CONSUMER_STATUS__NO_TOPIC,
L
Liu Jicong 已提交
121
  TMQ_CONSUMER_STATUS__RECOVER,
L
Liu Jicong 已提交
122 123
};

L
Liu Jicong 已提交
124
enum {
125
  TMQ_DELAYED_TASK__ASK_EP = 1,
L
Liu Jicong 已提交
126 127 128 129
  TMQ_DELAYED_TASK__REPORT,
  TMQ_DELAYED_TASK__COMMIT,
};

L
Liu Jicong 已提交
130
typedef struct {
H
Haojun Liao 已提交
131
  int64_t      pollCnt;
132
  int64_t      numOfRows;
L
Liu Jicong 已提交
133 134
  STqOffsetVal committedOffset;
  STqOffsetVal currentOffset;
H
Haojun Liao 已提交
135 136 137
  int32_t      vgId;
  int32_t      vgStatus;
  int32_t      vgSkipCnt;
H
Haojun Liao 已提交
138
  int64_t      emptyBlockReceiveTs; // once empty block is received, idle for ignoreCnt then start to poll data
H
Haojun Liao 已提交
139
  SEpSet       epSet;
140 141
} SMqClientVg;

L
Liu Jicong 已提交
142
typedef struct {
143 144 145
  char           topicName[TSDB_TOPIC_FNAME_LEN];
  char           db[TSDB_DB_FNAME_LEN];
  SArray*        vgs;  // SArray<SMqClientVg>
L
Liu Jicong 已提交
146
  SSchemaWrapper schema;
147 148
} SMqClientTopic;

L
Liu Jicong 已提交
149 150 151 152 153
typedef struct {
  int8_t          tmqRspType;
  int32_t         epoch;
  SMqClientVg*    vgHandle;
  SMqClientTopic* topicHandle;
H
Haojun Liao 已提交
154
  uint64_t        reqId;
155
  SEpSet*         pEpset;
L
Liu Jicong 已提交
156
  union {
L
Liu Jicong 已提交
157 158
    SMqDataRsp dataRsp;
    SMqMetaRsp metaRsp;
L
Liu Jicong 已提交
159
    STaosxRsp  taosxRsp;
L
Liu Jicong 已提交
160
  };
L
Liu Jicong 已提交
161 162
} SMqPollRspWrapper;

L
Liu Jicong 已提交
163
typedef struct {
164 165
  int64_t refId;
  int32_t epoch;
L
Liu Jicong 已提交
166 167
  tsem_t  rspSem;
  int32_t rspErr;
L
Liu Jicong 已提交
168
} SMqSubscribeCbParam;
L
Liu Jicong 已提交
169

L
Liu Jicong 已提交
170
typedef struct {
171 172
  int64_t refId;
  int32_t epoch;
L
Liu Jicong 已提交
173
  int32_t code;
L
Liu Jicong 已提交
174
  int32_t async;
X
Xiaoyu Wang 已提交
175
  tsem_t  rspSem;
176 177
} SMqAskEpCbParam;

L
Liu Jicong 已提交
178
typedef struct {
179 180
  int64_t         refId;
  int32_t         epoch;
L
Liu Jicong 已提交
181
  SMqClientVg*    pVg;
L
Liu Jicong 已提交
182
  SMqClientTopic* pTopic;
L
Liu Jicong 已提交
183
  int32_t         vgId;
L
Liu Jicong 已提交
184
  tsem_t          rspSem;
H
Haojun Liao 已提交
185
  uint64_t        requestId; // request id for debug purpose
X
Xiaoyu Wang 已提交
186
} SMqPollCbParam;
187

188
typedef struct {
189 190
  int64_t        refId;
  int32_t        epoch;
L
Liu Jicong 已提交
191 192
  int8_t         automatic;
  int8_t         async;
L
Liu Jicong 已提交
193 194
  int32_t        waitingRspNum;
  int32_t        totalRspNum;
L
Liu Jicong 已提交
195
  int32_t        rspErr;
196
  tmq_commit_cb* userCb;
L
Liu Jicong 已提交
197 198 199 200
  /*SArray*        successfulOffsets;*/
  /*SArray*        failedOffsets;*/
  void*  userParam;
  tsem_t rspSem;
201 202 203 204 205
} SMqCommitCbParamSet;

typedef struct {
  SMqCommitCbParamSet* params;
  STqOffset*           pOffset;
H
Haojun Liao 已提交
206 207 208
  char                 topicName[TSDB_TOPIC_FNAME_LEN];
  int32_t              vgId;
  tmq_t*               pTmq;
209
} SMqCommitCbParam;
210

211
static int32_t tmqAskEp(tmq_t* tmq, bool async);
212 213
static int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg);
static int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet);
214 215
static int32_t doSendCommitMsg(tmq_t* tmq, SMqClientVg* pVg, const char* pTopicName, SMqCommitCbParamSet* pParamSet,
                               int32_t index, int32_t totalVgroups);
216
static void tmqCommitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId);
217

218
tmq_conf_t* tmq_conf_new() {
wafwerar's avatar
wafwerar 已提交
219
  tmq_conf_t* conf = taosMemoryCalloc(1, sizeof(tmq_conf_t));
220 221 222 223 224
  if (conf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return conf;
  }

225
  conf->withTbName = false;
L
Liu Jicong 已提交
226
  conf->autoCommit = true;
227
  conf->autoCommitInterval = DEFAULT_AUTO_COMMIT_INTERVAL;
228
  conf->resetOffset = TMQ_OFFSET__RESET_EARLIEAST;
229
  conf->hbBgEnable = true;
230

231 232 233
  return conf;
}

L
Liu Jicong 已提交
234
void tmq_conf_destroy(tmq_conf_t* conf) {
L
Liu Jicong 已提交
235
  if (conf) {
236 237 238 239 240 241 242 243 244
    if (conf->ip) {
      taosMemoryFree(conf->ip);
    }
    if (conf->user) {
      taosMemoryFree(conf->user);
    }
    if (conf->pass) {
      taosMemoryFree(conf->pass);
    }
L
Liu Jicong 已提交
245 246
    taosMemoryFree(conf);
  }
L
Liu Jicong 已提交
247 248 249
}

tmq_conf_res_t tmq_conf_set(tmq_conf_t* conf, const char* key, const char* value) {
250
  if (strcasecmp(key, "group.id") == 0) {
L
Liu Jicong 已提交
251
    tstrncpy(conf->groupId, value, TSDB_CGROUP_LEN);
L
Liu Jicong 已提交
252
    return TMQ_CONF_OK;
253
  }
L
Liu Jicong 已提交
254

255
  if (strcasecmp(key, "client.id") == 0) {
L
Liu Jicong 已提交
256
    tstrncpy(conf->clientId, value, 256);
L
Liu Jicong 已提交
257 258
    return TMQ_CONF_OK;
  }
L
Liu Jicong 已提交
259

260 261
  if (strcasecmp(key, "enable.auto.commit") == 0) {
    if (strcasecmp(value, "true") == 0) {
L
Liu Jicong 已提交
262
      conf->autoCommit = true;
L
Liu Jicong 已提交
263
      return TMQ_CONF_OK;
264
    } else if (strcasecmp(value, "false") == 0) {
L
Liu Jicong 已提交
265
      conf->autoCommit = false;
L
Liu Jicong 已提交
266 267 268 269
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
270
  }
L
Liu Jicong 已提交
271

272
  if (strcasecmp(key, "auto.commit.interval.ms") == 0) {
273
    conf->autoCommitInterval = taosStr2int64(value);
L
Liu Jicong 已提交
274 275 276
    return TMQ_CONF_OK;
  }

277 278 279
  if (strcasecmp(key, "auto.offset.reset") == 0) {
    if (strcasecmp(value, "none") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_NONE;
L
Liu Jicong 已提交
280
      return TMQ_CONF_OK;
281 282
    } else if (strcasecmp(value, "earliest") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_EARLIEAST;
L
Liu Jicong 已提交
283
      return TMQ_CONF_OK;
284 285
    } else if (strcasecmp(value, "latest") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_LATEST;
L
Liu Jicong 已提交
286 287 288 289 290
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
  }
L
Liu Jicong 已提交
291

292 293
  if (strcasecmp(key, "msg.with.table.name") == 0) {
    if (strcasecmp(value, "true") == 0) {
294
      conf->withTbName = true;
L
Liu Jicong 已提交
295
      return TMQ_CONF_OK;
296
    } else if (strcasecmp(value, "false") == 0) {
297
      conf->withTbName = false;
L
Liu Jicong 已提交
298
      return TMQ_CONF_OK;
299 300 301 302 303
    } else {
      return TMQ_CONF_INVALID;
    }
  }

304 305
  if (strcasecmp(key, "experimental.snapshot.enable") == 0) {
    if (strcasecmp(value, "true") == 0) {
L
Liu Jicong 已提交
306
      conf->snapEnable = true;
307
      return TMQ_CONF_OK;
308
    } else if (strcasecmp(value, "false") == 0) {
L
Liu Jicong 已提交
309
      conf->snapEnable = false;
310 311 312 313 314 315
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
  }

316
  if (strcasecmp(key, "experimental.snapshot.batch.size") == 0) {
317
    conf->snapBatchSize = taosStr2int64(value);
L
Liu Jicong 已提交
318 319 320
    return TMQ_CONF_OK;
  }

321 322
  if (strcasecmp(key, "enable.heartbeat.background") == 0) {
    if (strcasecmp(value, "true") == 0) {
323
      conf->hbBgEnable = true;
L
Liu Jicong 已提交
324
      return TMQ_CONF_OK;
325
    } else if (strcasecmp(value, "false") == 0) {
326
      conf->hbBgEnable = false;
L
Liu Jicong 已提交
327 328 329 330 331 332
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
  }

333
  if (strcasecmp(key, "td.connect.ip") == 0) {
334
    conf->ip = taosStrdup(value);
L
Liu Jicong 已提交
335 336
    return TMQ_CONF_OK;
  }
337

338
  if (strcasecmp(key, "td.connect.user") == 0) {
339
    conf->user = taosStrdup(value);
L
Liu Jicong 已提交
340 341
    return TMQ_CONF_OK;
  }
342

343
  if (strcasecmp(key, "td.connect.pass") == 0) {
344
    conf->pass = taosStrdup(value);
L
Liu Jicong 已提交
345 346
    return TMQ_CONF_OK;
  }
347

348
  if (strcasecmp(key, "td.connect.port") == 0) {
349
    conf->port = taosStr2int64(value);
L
Liu Jicong 已提交
350 351
    return TMQ_CONF_OK;
  }
352

353
  if (strcasecmp(key, "td.connect.db") == 0) {
L
Liu Jicong 已提交
354 355 356
    return TMQ_CONF_OK;
  }

L
Liu Jicong 已提交
357
  return TMQ_CONF_UNKNOWN;
358 359 360
}

tmq_list_t* tmq_list_new() {
L
Liu Jicong 已提交
361
  return (tmq_list_t*)taosArrayInit(0, sizeof(void*));
362 363
}

L
Liu Jicong 已提交
364 365
int32_t tmq_list_append(tmq_list_t* list, const char* src) {
  SArray* container = &list->container;
366
  if (src == NULL || src[0] == 0) return -1;
367
  char* topic = taosStrdup(src);
368 369 370
  if (topic[0] != '`') {
    strtolower(topic, src);
  }
L
fix  
Liu Jicong 已提交
371
  if (taosArrayPush(container, &topic) == NULL) return -1;
372 373 374
  return 0;
}

L
Liu Jicong 已提交
375
void tmq_list_destroy(tmq_list_t* list) {
L
Liu Jicong 已提交
376
  SArray* container = &list->container;
L
Liu Jicong 已提交
377
  taosArrayDestroyP(container, taosMemoryFree);
L
Liu Jicong 已提交
378 379
}

L
Liu Jicong 已提交
380 381 382 383 384 385 386 387 388 389
int32_t tmq_list_get_size(const tmq_list_t* list) {
  const SArray* container = &list->container;
  return taosArrayGetSize(container);
}

char** tmq_list_to_c_array(const tmq_list_t* list) {
  const SArray* container = &list->container;
  return container->pData;
}

390 391 392 393 394
static SMqClientVg* foundClientVg(SArray* pTopicList, const char* pName, int32_t vgId, int32_t* index, int32_t* numOfVgroups) {
  int32_t numOfTopics = taosArrayGetSize(pTopicList);
  *index = -1;
  *numOfVgroups = 0;

395
  for(int32_t i = 0; i < numOfTopics; ++i) {
396 397
    SMqClientTopic* pTopic = taosArrayGet(pTopicList, i);
    if (strcmp(pTopic->topicName, pName) != 0) {
398 399 400
      continue;
    }

401 402
    *numOfVgroups = taosArrayGetSize(pTopic->vgs);
    for (int32_t j = 0; j < (*numOfVgroups); ++j) {
403
      SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, j);
404 405 406
      if (pClientVg->vgId == vgId) {
        *index = j;
        return pClientVg;
407 408
      }
    }
L
Liu Jicong 已提交
409
  }
410 411

  return NULL;
L
Liu Jicong 已提交
412
}
413

414 415 416
// Two problems do not need to be addressed here
// 1. update to of epset. the response of poll request will automatically handle this problem
// 2. commit failure. This one needs to be resolved.
H
Haojun Liao 已提交
417
static int32_t tmqCommitCb(void* param, SDataBuf* pBuf, int32_t code) {
418
  SMqCommitCbParam*    pParam = (SMqCommitCbParam*)param;
419
  SMqCommitCbParamSet* pParamSet = (SMqCommitCbParamSet*)pParam->params;
H
Haojun Liao 已提交
420

421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449
//  if (code != TSDB_CODE_SUCCESS) { // if commit offset failed, let's try again
//    taosThreadMutexLock(&pParam->pTmq->lock);
//    int32_t numOfVgroups, index;
//    SMqClientVg* pVg = foundClientVg(pParam->pTmq->clientTopics, pParam->topicName, pParam->vgId, &index, &numOfVgroups);
//    if (pVg == NULL) {
//      tscDebug("consumer:0x%" PRIx64
//               " subKey:%s vgId:%d commit failed, code:%s has been transferred to other consumer, no need retry ordinal:%d/%d",
//               pParam->pTmq->consumerId, pParam->pOffset->subKey, pParam->vgId, tstrerror(code), index + 1, numOfVgroups);
//    } else { // let's retry the commit
//      int32_t code1 = doSendCommitMsg(pParam->pTmq, pVg, pParam->topicName, pParamSet, index, numOfVgroups);
//      if (code1 != TSDB_CODE_SUCCESS) {  // retry failed.
//        tscError("consumer:0x%" PRIx64 " topic:%s vgId:%d offset:%" PRId64
//                 " retry failed, ignore this commit. code:%s ordinal:%d/%d",
//                 pParam->pTmq->consumerId, pParam->topicName, pVg->vgId, pVg->committedOffset.version,
//                 tstrerror(terrno), index + 1, numOfVgroups);
//      }
//    }
//
//    taosThreadMutexUnlock(&pParam->pTmq->lock);
//
//    taosMemoryFree(pParam->pOffset);
//    taosMemoryFree(pBuf->pData);
//    taosMemoryFree(pBuf->pEpSet);
//
//    tmqCommitRspCountDown(pParamSet, pParam->pTmq->consumerId, pParam->topicName, pParam->vgId);
//    return 0;
//  }
//
//  // todo replace the pTmq with refId
450

L
Liu Jicong 已提交
451
  taosMemoryFree(pParam->pOffset);
L
Liu Jicong 已提交
452
  taosMemoryFree(pBuf->pData);
dengyihao's avatar
dengyihao 已提交
453
  taosMemoryFree(pBuf->pEpSet);
L
Liu Jicong 已提交
454

455
  tmqCommitRspCountDown(pParamSet, pParam->pTmq->consumerId, pParam->topicName, pParam->vgId);
456 457 458
  return 0;
}

459 460
static int32_t doSendCommitMsg(tmq_t* tmq, SMqClientVg* pVg, const char* pTopicName, SMqCommitCbParamSet* pParamSet,
                               int32_t index, int32_t totalVgroups) {
L
Liu Jicong 已提交
461 462 463 464 465
  STqOffset* pOffset = taosMemoryCalloc(1, sizeof(STqOffset));
  if (pOffset == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
466

L
Liu Jicong 已提交
467
  pOffset->val = pVg->currentOffset;
468

L
Liu Jicong 已提交
469 470 471
  int32_t groupLen = strlen(tmq->groupId);
  memcpy(pOffset->subKey, tmq->groupId, groupLen);
  pOffset->subKey[groupLen] = TMQ_SEPARATOR;
H
Haojun Liao 已提交
472
  strcpy(pOffset->subKey + groupLen + 1, pTopicName);
L
Liu Jicong 已提交
473

474 475
  int32_t len = 0;
  int32_t code = 0;
L
Liu Jicong 已提交
476 477 478 479
  tEncodeSize(tEncodeSTqOffset, pOffset, len, code);
  if (code < 0) {
    return -1;
  }
480

L
Liu Jicong 已提交
481
  void* buf = taosMemoryCalloc(1, sizeof(SMsgHead) + len);
L
Liu Jicong 已提交
482 483 484 485
  if (buf == NULL) {
    taosMemoryFree(pOffset);
    return -1;
  }
486

L
Liu Jicong 已提交
487
  ((SMsgHead*)buf)->vgId = htonl(pVg->vgId);
L
Liu Jicong 已提交
488

L
Liu Jicong 已提交
489 490 491 492 493
  void* abuf = POINTER_SHIFT(buf, sizeof(SMsgHead));

  SEncoder encoder;
  tEncoderInit(&encoder, abuf, len);
  tEncodeSTqOffset(&encoder, pOffset);
L
Liu Jicong 已提交
494
  tEncoderClear(&encoder);
L
Liu Jicong 已提交
495 496

  // build param
497
  SMqCommitCbParam* pParam = taosMemoryCalloc(1, sizeof(SMqCommitCbParam));
L
Liu Jicong 已提交
498
  if (pParam == NULL) {
L
Liu Jicong 已提交
499
    taosMemoryFree(pOffset);
L
Liu Jicong 已提交
500 501 502
    taosMemoryFree(buf);
    return -1;
  }
503

L
Liu Jicong 已提交
504 505
  pParam->params = pParamSet;
  pParam->pOffset = pOffset;
H
Haojun Liao 已提交
506 507 508
  pParam->vgId = pVg->vgId;
  pParam->pTmq = tmq;

H
Haojun Liao 已提交
509
  tstrncpy(pParam->topicName, pTopicName, tListLen(pParam->topicName));
L
Liu Jicong 已提交
510 511 512 513

  // build send info
  SMsgSendInfo* pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (pMsgSendInfo == NULL) {
L
Liu Jicong 已提交
514
    taosMemoryFree(pOffset);
L
Liu Jicong 已提交
515 516
    taosMemoryFree(buf);
    taosMemoryFree(pParam);
L
Liu Jicong 已提交
517 518
    return -1;
  }
519

L
Liu Jicong 已提交
520 521 522 523 524 525 526 527 528
  pMsgSendInfo->msgInfo = (SDataBuf){
      .pData = buf,
      .len = sizeof(SMsgHead) + len,
      .handle = NULL,
  };

  pMsgSendInfo->requestId = generateRequestId();
  pMsgSendInfo->requestObjRefId = 0;
  pMsgSendInfo->param = pParam;
L
Liu Jicong 已提交
529
  pMsgSendInfo->paramFreeFp = taosMemoryFree;
530
  pMsgSendInfo->fp = tmqCommitCb;
L
Liu Jicong 已提交
531
  pMsgSendInfo->msgType = TDMT_VND_TMQ_COMMIT_OFFSET;
L
Liu Jicong 已提交
532

L
Liu Jicong 已提交
533 534 535
  atomic_add_fetch_32(&pParamSet->waitingRspNum, 1);
  atomic_add_fetch_32(&pParamSet->totalRspNum, 1);

H
Haojun Liao 已提交
536 537 538 539 540 541
  SEp* pEp = GET_ACTIVE_EP(&pVg->epSet);
  tscDebug("consumer:0x%" PRIx64 " topic:%s on vgId:%d send offset:%" PRId64 " prev:%" PRId64
           ", ep:%s:%d, ordinal:%d/%d, req:0x%" PRIx64,
           tmq->consumerId, pOffset->subKey, pVg->vgId, pOffset->val.version, pVg->committedOffset.version, pEp->fqdn,
           pEp->port, index + 1, totalVgroups, pMsgSendInfo->requestId);

L
Liu Jicong 已提交
542 543 544 545 546
  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, pMsgSendInfo);
  return 0;
}

H
Haojun Liao 已提交
547
static int32_t tmqCommitMsgImpl(tmq_t* tmq, const TAOS_RES* msg, int8_t async, tmq_commit_cb* userCb, void* userParam) {
L
Liu Jicong 已提交
548 549 550 551 552 553 554 555 556 557
  char*   topic;
  int32_t vgId;
  if (TD_RES_TMQ(msg)) {
    SMqRspObj* pRspObj = (SMqRspObj*)msg;
    topic = pRspObj->topic;
    vgId = pRspObj->vgId;
  } else if (TD_RES_TMQ_META(msg)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)msg;
    topic = pMetaRspObj->topic;
    vgId = pMetaRspObj->vgId;
L
Liu Jicong 已提交
558
  } else if (TD_RES_TMQ_METADATA(msg)) {
559 560 561
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)msg;
    topic = pRspObj->topic;
    vgId = pRspObj->vgId;
L
Liu Jicong 已提交
562 563 564 565 566 567 568 569 570
  } else {
    return TSDB_CODE_TMQ_INVALID_MSG;
  }

  SMqCommitCbParamSet* pParamSet = taosMemoryCalloc(1, sizeof(SMqCommitCbParamSet));
  if (pParamSet == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }
H
Haojun Liao 已提交
571

572 573
  pParamSet->refId = tmq->refId;
  pParamSet->epoch = tmq->epoch;
L
Liu Jicong 已提交
574 575 576 577 578 579
  pParamSet->automatic = 0;
  pParamSet->async = async;
  pParamSet->userCb = userCb;
  pParamSet->userParam = userParam;
  tsem_init(&pParamSet->rspSem, 0, 0);

L
Liu Jicong 已提交
580 581
  int32_t code = -1;

H
Haojun Liao 已提交
582
  taosThreadMutexLock(&tmq->lock);
H
Haojun Liao 已提交
583 584 585 586
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);

  tscDebug("consumer:0x%" PRIx64 " user invoked commit offset for %d", tmq->consumerId, numOfTopics);
  for (int32_t i = 0; i < numOfTopics; i++) {
L
Liu Jicong 已提交
587
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
588 589 590 591 592 593
    if (strcmp(pTopic->topicName, topic) != 0) {
      continue;
    }

    int32_t numOfVgroups = taosArrayGetSize(pTopic->vgs);
    for (int32_t j = 0; j < numOfVgroups; j++) {
L
Liu Jicong 已提交
594
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);
H
Haojun Liao 已提交
595 596 597
      if (pVg->vgId != vgId) {
        continue;
      }
L
Liu Jicong 已提交
598

L
Liu Jicong 已提交
599
      if (pVg->currentOffset.type > 0 && !tOffsetEqual(&pVg->currentOffset, &pVg->committedOffset)) {
600
        if (doSendCommitMsg(tmq, pVg, pTopic->topicName, pParamSet, j, numOfVgroups) < 0) {
L
Liu Jicong 已提交
601 602
          tsem_destroy(&pParamSet->rspSem);
          taosMemoryFree(pParamSet);
L
Liu Jicong 已提交
603
          goto FAIL;
L
Liu Jicong 已提交
604
        }
L
Liu Jicong 已提交
605
        goto HANDLE_RSP;
L
Liu Jicong 已提交
606 607
      }
    }
L
Liu Jicong 已提交
608
  }
L
Liu Jicong 已提交
609

L
Liu Jicong 已提交
610 611 612 613
HANDLE_RSP:
  if (pParamSet->totalRspNum == 0) {
    tsem_destroy(&pParamSet->rspSem);
    taosMemoryFree(pParamSet);
H
Haojun Liao 已提交
614
    taosThreadMutexUnlock(&tmq->lock);
L
Liu Jicong 已提交
615 616 617
    return 0;
  }

L
Liu Jicong 已提交
618
  if (!async) {
H
Haojun Liao 已提交
619
    taosThreadMutexUnlock(&tmq->lock);
L
Liu Jicong 已提交
620 621 622
    tsem_wait(&pParamSet->rspSem);
    code = pParamSet->rspErr;
    tsem_destroy(&pParamSet->rspSem);
L
Liu Jicong 已提交
623
    taosMemoryFree(pParamSet);
L
Liu Jicong 已提交
624 625 626 627 628 629
    return code;
  } else {
    code = 0;
  }

FAIL:
H
Haojun Liao 已提交
630
  taosThreadMutexUnlock(&tmq->lock);
L
Liu Jicong 已提交
631 632 633
  if (code != 0 && async) {
    userCb(tmq, code, userParam);
  }
H
Haojun Liao 已提交
634

L
Liu Jicong 已提交
635 636 637
  return 0;
}

638
static int32_t doAutoCommit(tmq_t* tmq, int8_t automatic, int8_t async, tmq_commit_cb* userCb, void* userParam) {
L
Liu Jicong 已提交
639 640
  int32_t code = -1;

641 642
  SMqCommitCbParamSet* pParamSet = taosMemoryCalloc(1, sizeof(SMqCommitCbParamSet));
  if (pParamSet == NULL) {
L
Liu Jicong 已提交
643 644 645 646 647 648 649 650
    code = TSDB_CODE_OUT_OF_MEMORY;
    if (async) {
      if (automatic) {
        tmq->commitCb(tmq, code, tmq->commitCbUserParam);
      } else {
        userCb(tmq, code, userParam);
      }
    }
651 652
    return -1;
  }
653 654 655 656

  pParamSet->refId = tmq->refId;
  pParamSet->epoch = tmq->epoch;

657 658 659 660 661 662
  pParamSet->automatic = automatic;
  pParamSet->async = async;
  pParamSet->userCb = userCb;
  pParamSet->userParam = userParam;
  tsem_init(&pParamSet->rspSem, 0, 0);

663 664 665
  // init as 1 to prevent concurrency issue
  pParamSet->waitingRspNum = 1;

H
Haojun Liao 已提交
666
  taosThreadMutexLock(&tmq->lock);
667
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
X
Xiaoyu Wang 已提交
668
  tscDebug("consumer:0x%" PRIx64 " start to commit offset for %d topics", tmq->consumerId, numOfTopics);
669 670

  for (int32_t i = 0; i < numOfTopics; i++) {
671
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
672
    int32_t         numOfVgroups = taosArrayGetSize(pTopic->vgs);
L
Liu Jicong 已提交
673

674 675
    tscDebug("consumer:0x%" PRIx64 " commit offset for topics:%s, numOfVgs:%d", tmq->consumerId, pTopic->topicName,
             numOfVgroups);
676
    for (int32_t j = 0; j < numOfVgroups; j++) {
677 678 679 680 681 682 683 684
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);

      if (pVg->currentOffset.type > 0 && !tOffsetEqual(&pVg->currentOffset, &pVg->committedOffset)) {
        code = doSendCommitMsg(tmq, pVg, pTopic->topicName, pParamSet, j, numOfVgroups);
        if (code != TSDB_CODE_SUCCESS) {
          tscError("consumer:0x%" PRIx64 " topic:%s vgId:%d offset:%" PRId64 " failed, code:%s ordinal:%d/%d",
                   tmq->consumerId, pTopic->topicName, pVg->vgId, pVg->committedOffset.version, tstrerror(terrno),
                   j + 1, numOfVgroups);
L
Liu Jicong 已提交
685 686
          continue;
        }
H
Haojun Liao 已提交
687 688 689

        // update the offset value.
        pVg->committedOffset = pVg->currentOffset;
690
      } else {
691 692
        tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d, no commit, current:%" PRId64 ", ordinal:%d/%d",
                 tmq->consumerId, pTopic->topicName, pVg->vgId, pVg->currentOffset.version, j + 1, numOfVgroups);
693 694 695 696
      }
    }
  }

H
Haojun Liao 已提交
697
  tscDebug("consumer:0x%" PRIx64 " total commit:%d for %d topics", tmq->consumerId, pParamSet->waitingRspNum - 1,
698
           numOfTopics);
H
Haojun Liao 已提交
699 700
  taosThreadMutexUnlock(&tmq->lock);

L
Liu Jicong 已提交
701
  // no request is sent
L
Liu Jicong 已提交
702 703 704 705 706 707
  if (pParamSet->totalRspNum == 0) {
    tsem_destroy(&pParamSet->rspSem);
    taosMemoryFree(pParamSet);
    return 0;
  }

L
Liu Jicong 已提交
708
  // count down since waiting rsp num init as 1
709
  tmqCommitRspCountDown(pParamSet, tmq->consumerId, "", 0);
710

711 712 713 714
  if (!async) {
    tsem_wait(&pParamSet->rspSem);
    code = pParamSet->rspErr;
    tsem_destroy(&pParamSet->rspSem);
715
    taosMemoryFree(pParamSet);
L
Liu Jicong 已提交
716
#if 0
717 718
    taosArrayDestroyP(pParamSet->successfulOffsets, taosMemoryFree);
    taosArrayDestroyP(pParamSet->failedOffsets, taosMemoryFree);
L
Liu Jicong 已提交
719
#endif
L
Liu Jicong 已提交
720
  }
721

L
Liu Jicong 已提交
722 723 724
  return code;
}

725 726
static int32_t tmqCommitInner(tmq_t* tmq, const TAOS_RES* msg, int8_t automatic, int8_t async, tmq_commit_cb* userCb,
                              void* userParam) {
H
Haojun Liao 已提交
727
  if (msg) { // user invoked commit
L
Liu Jicong 已提交
728
    return tmqCommitMsgImpl(tmq, msg, async, userCb, userParam);
729
  } else {  // this for auto commit
730
    return doAutoCommit(tmq, automatic, async, userCb, userParam);
L
Liu Jicong 已提交
731
  }
732 733
}

734 735
static void generateTimedTask(int64_t refId, int32_t type) {
  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
736
  if (tmq != NULL) {
S
Shengliang Guan 已提交
737
    int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
738
    *pTaskType = type;
739 740 741
    taosWriteQitem(tmq->delayedTask, pTaskType);
    tsem_post(&tmq->rspSem);
  }
742
  taosReleaseRef(tmqMgmt.rsetId, refId);
743 744 745 746 747
}

void tmqAssignAskEpTask(void* param, void* tmrId) {
  int64_t refId = *(int64_t*)param;
  generateTimedTask(refId, TMQ_DELAYED_TASK__ASK_EP);
748
  taosMemoryFree(param);
L
Liu Jicong 已提交
749 750 751
}

void tmqAssignDelayedCommitTask(void* param, void* tmrId) {
752
  int64_t refId = *(int64_t*)param;
753
  generateTimedTask(refId, TMQ_DELAYED_TASK__COMMIT);
754
  taosMemoryFree(param);
L
Liu Jicong 已提交
755 756 757
}

void tmqAssignDelayedReportTask(void* param, void* tmrId) {
758 759 760
  int64_t refId = *(int64_t*)param;
  tmq_t*  tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq != NULL) {
S
Shengliang Guan 已提交
761
    int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
762 763 764 765
    *pTaskType = TMQ_DELAYED_TASK__REPORT;
    taosWriteQitem(tmq->delayedTask, pTaskType);
    tsem_post(&tmq->rspSem);
  }
766 767

  taosReleaseRef(tmqMgmt.rsetId, refId);
768
  taosMemoryFree(param);
L
Liu Jicong 已提交
769 770
}

771
int32_t tmqHbCb(void* param, SDataBuf* pMsg, int32_t code) {
dengyihao's avatar
dengyihao 已提交
772 773 774 775
  if (pMsg) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
  }
776 777 778 779
  return 0;
}

void tmqSendHbReq(void* param, void* tmrId) {
780
  int64_t refId = *(int64_t*)param;
781

782 783
  tmq_t*  tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) {
L
Liu Jicong 已提交
784
    taosMemoryFree(param);
785 786
    return;
  }
D
dapan1121 已提交
787 788 789 790 791

  SMqHbReq req = {0};
  req.consumerId = tmq->consumerId;
  req.epoch = tmq->epoch;

L
Liu Jicong 已提交
792
  int32_t tlen = tSerializeSMqHbReq(NULL, 0, &req);
D
dapan1121 已提交
793 794
  if (tlen < 0) {
    tscError("tSerializeSMqHbReq failed");
795
    goto OVER;
D
dapan1121 已提交
796
  }
797

L
Liu Jicong 已提交
798
  void* pReq = taosMemoryCalloc(1, tlen);
D
dapan1121 已提交
799 800
  if (tlen < 0) {
    tscError("failed to malloc MqHbReq msg, size:%d", tlen);
801
    goto OVER;
D
dapan1121 已提交
802
  }
803

D
dapan1121 已提交
804 805 806
  if (tSerializeSMqHbReq(pReq, tlen, &req) < 0) {
    tscError("tSerializeSMqHbReq %d failed", tlen);
    taosMemoryFree(pReq);
807
    goto OVER;
D
dapan1121 已提交
808
  }
809 810 811 812

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pReq);
L
Liu Jicong 已提交
813
    goto OVER;
814
  }
815

816 817
  sendInfo->msgInfo = (SDataBuf){
      .pData = pReq,
D
dapan1121 已提交
818
      .len = tlen,
819 820 821 822 823 824 825
      .handle = NULL,
  };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = NULL;
  sendInfo->fp = tmqHbCb;
L
Liu Jicong 已提交
826
  sendInfo->msgType = TDMT_MND_TMQ_HB;
827 828 829 830 831 832 833

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

OVER:
834
  taosTmrReset(tmqSendHbReq, 1000, param, tmqMgmt.timer, &tmq->hbLiveTimer);
835
  taosReleaseRef(tmqMgmt.rsetId, refId);
836 837
}

838
int32_t tmqHandleAllDelayedTask(tmq_t* pTmq) {
L
Liu Jicong 已提交
839
  STaosQall* qall = taosAllocateQall();
840
  taosReadAllQitems(pTmq->delayedTask, qall);
L
Liu Jicong 已提交
841

842 843 844 845
  if (qall->numOfItems == 0) {
    taosFreeQall(qall);
    return TSDB_CODE_SUCCESS;
  }
846

X
Xiaoyu Wang 已提交
847
  tscDebug("consumer:0x%" PRIx64 " handle delayed %d tasks before poll data", pTmq->consumerId, qall->numOfItems);
848 849
  int8_t* pTaskType = NULL;
  taosGetQitem(qall, (void**)&pTaskType);
L
Liu Jicong 已提交
850

851
  while (pTaskType != NULL) {
852
    if (*pTaskType == TMQ_DELAYED_TASK__ASK_EP) {
853
      tmqAskEp(pTmq, true);
854 855

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
856
      *pRefId = pTmq->refId;
857

X
Xiaoyu Wang 已提交
858
      tscDebug("consumer:0x%" PRIx64 " retrieve ep from mnode in 1s", pTmq->consumerId);
859
      taosTmrReset(tmqAssignAskEpTask, 1000, pRefId, tmqMgmt.timer, &pTmq->epTimer);
L
Liu Jicong 已提交
860
    } else if (*pTaskType == TMQ_DELAYED_TASK__COMMIT) {
861
      tmqCommitInner(pTmq, NULL, 1, 1, pTmq->commitCb, pTmq->commitCbUserParam);
862 863

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
864
      *pRefId = pTmq->refId;
865

X
Xiaoyu Wang 已提交
866
      tscDebug("consumer:0x%" PRIx64 " commit to vnode(s) in %.2fs", pTmq->consumerId,
X
Xiaoyu Wang 已提交
867
               pTmq->autoCommitInterval / 1000.0);
868
      taosTmrReset(tmqAssignDelayedCommitTask, pTmq->autoCommitInterval, pRefId, tmqMgmt.timer, &pTmq->commitTimer);
L
Liu Jicong 已提交
869 870
    } else if (*pTaskType == TMQ_DELAYED_TASK__REPORT) {
    }
871

L
Liu Jicong 已提交
872
    taosFreeQitem(pTaskType);
873
    taosGetQitem(qall, (void**)&pTaskType);
L
Liu Jicong 已提交
874
  }
875

L
Liu Jicong 已提交
876 877 878 879
  taosFreeQall(qall);
  return 0;
}

880
static void* tmqFreeRspWrapper(SMqRspWrapper* rspWrapper) {
L
Liu Jicong 已提交
881 882 883 884 885 886 887
  if (rspWrapper->tmqRspType == TMQ_MSG_TYPE__END_RSP) {
    // do nothing
  } else if (rspWrapper->tmqRspType == TMQ_MSG_TYPE__EP_RSP) {
    SMqAskEpRspWrapper* pEpRspWrapper = (SMqAskEpRspWrapper*)rspWrapper;
    tDeleteSMqAskEpRsp(&pEpRspWrapper->msg);
  } else if (rspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_RSP) {
    SMqPollRspWrapper* pRsp = (SMqPollRspWrapper*)rspWrapper;
888 889
    taosMemoryFreeClear(pRsp->pEpset);

L
Liu Jicong 已提交
890 891 892 893 894 895
    taosArrayDestroyP(pRsp->dataRsp.blockData, taosMemoryFree);
    taosArrayDestroy(pRsp->dataRsp.blockDataLen);
    taosArrayDestroyP(pRsp->dataRsp.blockTbName, taosMemoryFree);
    taosArrayDestroyP(pRsp->dataRsp.blockSchema, (FDelete)tDeleteSSchemaWrapper);
  } else if (rspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_META_RSP) {
    SMqPollRspWrapper* pRsp = (SMqPollRspWrapper*)rspWrapper;
896 897
    taosMemoryFreeClear(pRsp->pEpset);

L
Liu Jicong 已提交
898 899 900
    taosMemoryFree(pRsp->metaRsp.metaRsp);
  } else if (rspWrapper->tmqRspType == TMQ_MSG_TYPE__TAOSX_RSP) {
    SMqPollRspWrapper* pRsp = (SMqPollRspWrapper*)rspWrapper;
901 902
    taosMemoryFreeClear(pRsp->pEpset);

L
Liu Jicong 已提交
903 904 905 906 907 908 909 910
    taosArrayDestroyP(pRsp->taosxRsp.blockData, taosMemoryFree);
    taosArrayDestroy(pRsp->taosxRsp.blockDataLen);
    taosArrayDestroyP(pRsp->taosxRsp.blockTbName, taosMemoryFree);
    taosArrayDestroyP(pRsp->taosxRsp.blockSchema, (FDelete)tDeleteSSchemaWrapper);
    // taosx
    taosArrayDestroy(pRsp->taosxRsp.createTableLen);
    taosArrayDestroyP(pRsp->taosxRsp.createTableReq, taosMemoryFree);
  }
911 912

  return NULL;
L
Liu Jicong 已提交
913 914
}

L
Liu Jicong 已提交
915
void tmqClearUnhandleMsg(tmq_t* tmq) {
L
Liu Jicong 已提交
916
  SMqRspWrapper* rspWrapper = NULL;
L
Liu Jicong 已提交
917
  while (1) {
L
Liu Jicong 已提交
918 919 920 921 922
    taosGetQitem(tmq->qall, (void**)&rspWrapper);
    if (rspWrapper) {
      tmqFreeRspWrapper(rspWrapper);
      taosFreeQitem(rspWrapper);
    } else {
L
Liu Jicong 已提交
923
      break;
L
Liu Jicong 已提交
924
    }
L
Liu Jicong 已提交
925 926
  }

L
Liu Jicong 已提交
927
  rspWrapper = NULL;
L
Liu Jicong 已提交
928 929
  taosReadAllQitems(tmq->mqueue, tmq->qall);
  while (1) {
L
Liu Jicong 已提交
930 931 932 933 934
    taosGetQitem(tmq->qall, (void**)&rspWrapper);
    if (rspWrapper) {
      tmqFreeRspWrapper(rspWrapper);
      taosFreeQitem(rspWrapper);
    } else {
L
Liu Jicong 已提交
935
      break;
L
Liu Jicong 已提交
936
    }
L
Liu Jicong 已提交
937 938 939
  }
}

D
dapan1121 已提交
940
int32_t tmqSubscribeCb(void* param, SDataBuf* pMsg, int32_t code) {
L
Liu Jicong 已提交
941 942
  SMqSubscribeCbParam* pParam = (SMqSubscribeCbParam*)param;
  pParam->rspErr = code;
dengyihao's avatar
dengyihao 已提交
943 944

  taosMemoryFree(pMsg->pEpSet);
L
Liu Jicong 已提交
945 946 947
  tsem_post(&pParam->rspSem);
  return 0;
}
948

L
Liu Jicong 已提交
949
int32_t tmq_subscription(tmq_t* tmq, tmq_list_t** topics) {
X
Xiaoyu Wang 已提交
950 951 952 953
  if (*topics == NULL) {
    *topics = tmq_list_new();
  }
  for (int i = 0; i < taosArrayGetSize(tmq->clientTopics); i++) {
L
Liu Jicong 已提交
954
    SMqClientTopic* topic = taosArrayGet(tmq->clientTopics, i);
L
Liu Jicong 已提交
955
    tmq_list_append(*topics, strchr(topic->topicName, '.') + 1);
X
Xiaoyu Wang 已提交
956
  }
L
Liu Jicong 已提交
957
  return 0;
X
Xiaoyu Wang 已提交
958 959
}

L
Liu Jicong 已提交
960
int32_t tmq_unsubscribe(tmq_t* tmq) {
L
Liu Jicong 已提交
961 962
  int32_t     rsp;
  int32_t     retryCnt = 0;
L
Liu Jicong 已提交
963
  tmq_list_t* lst = tmq_list_new();
L
Liu Jicong 已提交
964 965 966 967 968 969 970 971 972 973
  while (1) {
    rsp = tmq_subscribe(tmq, lst);
    if (rsp != TSDB_CODE_MND_CONSUMER_NOT_READY || retryCnt > 5) {
      break;
    } else {
      retryCnt++;
      taosMsleep(500);
    }
  }

L
Liu Jicong 已提交
974 975
  tmq_list_destroy(lst);
  return rsp;
X
Xiaoyu Wang 已提交
976 977
}

978 979 980 981 982 983
static void freeClientVgImpl(void* param) {
  SMqClientTopic* pTopic = param;
  taosMemoryFreeClear(pTopic->schema.pSchema);
  taosArrayDestroy(pTopic->vgs);
}

984
void tmqFreeImpl(void* handle) {
985 986
  tmq_t*  tmq = (tmq_t*)handle;
  int64_t id = tmq->consumerId;
L
Liu Jicong 已提交
987

988
  // TODO stop timer
L
Liu Jicong 已提交
989 990 991 992
  if (tmq->mqueue) {
    tmqClearUnhandleMsg(tmq);
    taosCloseQueue(tmq->mqueue);
  }
L
Liu Jicong 已提交
993

H
Haojun Liao 已提交
994 995 996 997 998
  if (tmq->delayedTask) {
    taosCloseQueue(tmq->delayedTask);
  }

  taosFreeQall(tmq->qall);
999
  tsem_destroy(&tmq->rspSem);
H
Haojun Liao 已提交
1000
  taosThreadMutexDestroy(&tmq->lock);
L
Liu Jicong 已提交
1001

1002
  taosArrayDestroyEx(tmq->clientTopics, freeClientVgImpl);
1003 1004
  taos_close_internal(tmq->pTscObj);
  taosMemoryFree(tmq);
1005 1006

  tscDebug("consumer:0x%" PRIx64 " closed", id);
L
Liu Jicong 已提交
1007 1008
}

1009 1010 1011 1012 1013 1014 1015 1016 1017
static void tmqMgmtInit(void) {
  tmqInitRes = 0;
  tmqMgmt.timer = taosTmrInit(1000, 100, 360000, "TMQ");

  if (tmqMgmt.timer == NULL) {
    tmqInitRes = TSDB_CODE_OUT_OF_MEMORY;
  }

  tmqMgmt.rsetId = taosOpenRef(10000, tmqFreeImpl);
1018
  if (tmqMgmt.rsetId < 0) {
1019 1020 1021 1022
    tmqInitRes = terrno;
  }
}

L
Liu Jicong 已提交
1023
tmq_t* tmq_consumer_new(tmq_conf_t* conf, char* errstr, int32_t errstrLen) {
1024 1025 1026 1027
  taosThreadOnce(&tmqInit, tmqMgmtInit);
  if (tmqInitRes != 0) {
    terrno = tmqInitRes;
    return NULL;
L
Liu Jicong 已提交
1028 1029
  }

L
Liu Jicong 已提交
1030 1031
  tmq_t* pTmq = taosMemoryCalloc(1, sizeof(tmq_t));
  if (pTmq == NULL) {
L
Liu Jicong 已提交
1032
    terrno = TSDB_CODE_OUT_OF_MEMORY;
1033
    tscError("failed to create consumer, groupId:%s, code:%s", conf->groupId, terrstr());
L
Liu Jicong 已提交
1034 1035
    return NULL;
  }
L
Liu Jicong 已提交
1036

L
Liu Jicong 已提交
1037 1038 1039
  const char* user = conf->user == NULL ? TSDB_DEFAULT_USER : conf->user;
  const char* pass = conf->pass == NULL ? TSDB_DEFAULT_PASS : conf->pass;

L
Liu Jicong 已提交
1040 1041 1042
  pTmq->clientTopics = taosArrayInit(0, sizeof(SMqClientTopic));
  pTmq->mqueue = taosOpenQueue();
  pTmq->delayedTask = taosOpenQueue();
H
Haojun Liao 已提交
1043
  pTmq->qall = taosAllocateQall();
L
Liu Jicong 已提交
1044

H
Haojun Liao 已提交
1045
  taosThreadMutexInit(&pTmq->lock, NULL);
X
Xiaoyu Wang 已提交
1046 1047
  if (pTmq->clientTopics == NULL || pTmq->mqueue == NULL || pTmq->qall == NULL || pTmq->delayedTask == NULL ||
      conf->groupId[0] == 0) {
L
Liu Jicong 已提交
1048
    terrno = TSDB_CODE_OUT_OF_MEMORY;
1049
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(),
S
Shengliang Guan 已提交
1050
             pTmq->groupId);
1051
    goto _failed;
L
Liu Jicong 已提交
1052
  }
L
Liu Jicong 已提交
1053

L
Liu Jicong 已提交
1054 1055
  // init status
  pTmq->status = TMQ_CONSUMER_STATUS__INIT;
L
Liu Jicong 已提交
1056 1057
  pTmq->pollCnt = 0;
  pTmq->epoch = 0;
L
Liu Jicong 已提交
1058 1059
  /*pTmq->epStatus = 0;*/
  /*pTmq->epSkipCnt = 0;*/
L
Liu Jicong 已提交
1060

L
Liu Jicong 已提交
1061 1062 1063
  // set conf
  strcpy(pTmq->clientId, conf->clientId);
  strcpy(pTmq->groupId, conf->groupId);
1064
  pTmq->withTbName = conf->withTbName;
L
Liu Jicong 已提交
1065
  pTmq->useSnapshot = conf->snapEnable;
L
Liu Jicong 已提交
1066
  pTmq->autoCommit = conf->autoCommit;
L
Liu Jicong 已提交
1067
  pTmq->autoCommitInterval = conf->autoCommitInterval;
L
Liu Jicong 已提交
1068 1069
  pTmq->commitCb = conf->commitCb;
  pTmq->commitCbUserParam = conf->commitCbUserParam;
L
Liu Jicong 已提交
1070 1071
  pTmq->resetOffsetCfg = conf->resetOffset;

1072 1073
  pTmq->hbBgEnable = conf->hbBgEnable;

L
Liu Jicong 已提交
1074
  // assign consumerId
L
Liu Jicong 已提交
1075
  pTmq->consumerId = tGenIdPI64();
X
Xiaoyu Wang 已提交
1076

L
Liu Jicong 已提交
1077 1078
  // init semaphore
  if (tsem_init(&pTmq->rspSem, 0, 0) != 0) {
1079
    tscError("consumer:0x %" PRIx64 " setup failed since %s, consumer group %s", pTmq->consumerId, terrstr(),
S
Shengliang Guan 已提交
1080
             pTmq->groupId);
1081
    goto _failed;
L
Liu Jicong 已提交
1082
  }
L
Liu Jicong 已提交
1083

L
Liu Jicong 已提交
1084 1085 1086
  // init connection
  pTmq->pTscObj = taos_connect_internal(conf->ip, user, pass, NULL, NULL, conf->port, CONN_TYPE__TMQ);
  if (pTmq->pTscObj == NULL) {
1087
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(), pTmq->groupId);
L
Liu Jicong 已提交
1088
    tsem_destroy(&pTmq->rspSem);
1089
    goto _failed;
L
Liu Jicong 已提交
1090
  }
L
Liu Jicong 已提交
1091

1092 1093
  pTmq->refId = taosAddRef(tmqMgmt.rsetId, pTmq);
  if (pTmq->refId < 0) {
1094
    goto _failed;
1095 1096
  }

1097
  if (pTmq->hbBgEnable) {
L
Liu Jicong 已提交
1098 1099
    int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
    *pRefId = pTmq->refId;
1100
    pTmq->hbLiveTimer = taosTmrStart(tmqSendHbReq, 1000, pRefId, tmqMgmt.timer);
1101 1102
  }

1103 1104 1105
  char         buf[80] = {0};
  STqOffsetVal offset = {.type = pTmq->resetOffsetCfg};
  tFormatOffset(buf, tListLen(buf), &offset);
1106 1107
  tscInfo("consumer:0x%" PRIx64 " is setup, refId:%"PRId64", groupId:%s, snapshot:%d, autoCommit:%d, commitInterval:%dms, offset:%s, backgroudHB:%d",
          pTmq->consumerId, pTmq->refId, pTmq->groupId, pTmq->useSnapshot, pTmq->autoCommit, pTmq->autoCommitInterval, buf,
1108
          pTmq->hbBgEnable);
L
Liu Jicong 已提交
1109

1110
  return pTmq;
1111

1112 1113
_failed:
  tmqFreeImpl(pTmq);
L
Liu Jicong 已提交
1114
  return NULL;
1115 1116
}

L
Liu Jicong 已提交
1117
int32_t tmq_subscribe(tmq_t* tmq, const tmq_list_t* topic_list) {
L
Liu Jicong 已提交
1118 1119 1120
  const SArray*   container = &topic_list->container;
  int32_t         sz = taosArrayGetSize(container);
  void*           buf = NULL;
L
Liu Jicong 已提交
1121
  SMsgSendInfo*   sendInfo = NULL;
L
Liu Jicong 已提交
1122
  SCMSubscribeReq req = {0};
1123
  int32_t         code = 0;
1124

1125
  tscDebug("consumer:0x%" PRIx64 " cgroup:%s, subscribe %d topics", tmq->consumerId, tmq->groupId, sz);
L
Liu Jicong 已提交
1126

1127
  req.consumerId = tmq->consumerId;
L
Liu Jicong 已提交
1128
  tstrncpy(req.clientId, tmq->clientId, 256);
L
Liu Jicong 已提交
1129
  tstrncpy(req.cgroup, tmq->groupId, TSDB_CGROUP_LEN);
1130 1131
  req.topicNames = taosArrayInit(sz, sizeof(void*));

1132 1133 1134 1135
  if (req.topicNames == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }
1136

L
Liu Jicong 已提交
1137 1138
  for (int32_t i = 0; i < sz; i++) {
    char* topic = taosArrayGetP(container, i);
1139 1140

    SName name = {0};
L
Liu Jicong 已提交
1141 1142 1143 1144
    tNameSetDbName(&name, tmq->pTscObj->acctId, topic, strlen(topic));
    char* topicFName = taosMemoryCalloc(1, TSDB_TOPIC_FNAME_LEN);
    if (topicFName == NULL) {
      goto FAIL;
1145 1146
    }

1147
    tNameExtractFullName(&name, topicFName);
X
Xiaoyu Wang 已提交
1148
    tscDebug("consumer:0x%" PRIx64 " subscribe topic:%s", tmq->consumerId, topicFName);
L
Liu Jicong 已提交
1149 1150

    taosArrayPush(req.topicNames, &topicFName);
1151 1152
  }

L
Liu Jicong 已提交
1153
  int32_t tlen = tSerializeSCMSubscribeReq(NULL, &req);
1154

L
Liu Jicong 已提交
1155
  buf = taosMemoryMalloc(tlen);
1156 1157 1158 1159
  if (buf == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }
L
Liu Jicong 已提交
1160

1161 1162 1163
  void* abuf = buf;
  tSerializeSCMSubscribeReq(&abuf, &req);

L
Liu Jicong 已提交
1164
  sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
1165 1166 1167 1168
  if (sendInfo == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }
1169

X
Xiaoyu Wang 已提交
1170
  SMqSubscribeCbParam param = {
L
Liu Jicong 已提交
1171
      .rspErr = 0,
1172 1173
      .refId = tmq->refId,
      .epoch = tmq->epoch,
X
Xiaoyu Wang 已提交
1174
  };
L
Liu Jicong 已提交
1175

1176 1177 1178
  if (tsem_init(&param.rspSem, 0, 0) != 0) {
    goto FAIL;
  }
L
Liu Jicong 已提交
1179 1180

  sendInfo->msgInfo = (SDataBuf){
X
Xiaoyu Wang 已提交
1181 1182 1183 1184
      .pData = buf,
      .len = tlen,
      .handle = NULL,
  };
1185

L
Liu Jicong 已提交
1186 1187
  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
L
Liu Jicong 已提交
1188 1189
  sendInfo->param = &param;
  sendInfo->fp = tmqSubscribeCb;
L
Liu Jicong 已提交
1190
  sendInfo->msgType = TDMT_MND_TMQ_SUBSCRIBE;
L
Liu Jicong 已提交
1191

1192 1193 1194 1195 1196
  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

L
Liu Jicong 已提交
1197 1198
  // avoid double free if msg is sent
  buf = NULL;
L
Liu Jicong 已提交
1199
  sendInfo = NULL;
L
Liu Jicong 已提交
1200

L
Liu Jicong 已提交
1201 1202
  tsem_wait(&param.rspSem);
  tsem_destroy(&param.rspSem);
1203

1204 1205 1206 1207
  if (param.rspErr != 0) {
    code = param.rspErr;
    goto FAIL;
  }
L
Liu Jicong 已提交
1208

L
Liu Jicong 已提交
1209
  int32_t retryCnt = 0;
L
Liu Jicong 已提交
1210
  while (TSDB_CODE_MND_CONSUMER_NOT_READY == tmqAskEp(tmq, false)) {
wmmhello's avatar
wmmhello 已提交
1211
    if (retryCnt++ > 40) {
L
Liu Jicong 已提交
1212 1213
      goto FAIL;
    }
1214

X
Xiaoyu Wang 已提交
1215
    tscDebug("consumer:0x%" PRIx64 ", mnd not ready for subscribe, retry:%d in 500ms", tmq->consumerId, retryCnt);
L
Liu Jicong 已提交
1216 1217
    taosMsleep(500);
  }
1218

1219 1220
  // init ep timer
  if (tmq->epTimer == NULL) {
1221 1222 1223
    int64_t* pRefId1 = taosMemoryMalloc(sizeof(int64_t));
    *pRefId1 = tmq->refId;
    tmq->epTimer = taosTmrStart(tmqAssignAskEpTask, 1000, pRefId1, tmqMgmt.timer);
1224
  }
L
Liu Jicong 已提交
1225 1226

  // init auto commit timer
1227
  if (tmq->autoCommit && tmq->commitTimer == NULL) {
1228 1229 1230
    int64_t* pRefId2 = taosMemoryMalloc(sizeof(int64_t));
    *pRefId2 = tmq->refId;
    tmq->commitTimer = taosTmrStart(tmqAssignDelayedCommitTask, tmq->autoCommitInterval, pRefId2, tmqMgmt.timer);
L
Liu Jicong 已提交
1231 1232
  }

L
Liu Jicong 已提交
1233
FAIL:
L
Liu Jicong 已提交
1234
  taosArrayDestroyP(req.topicNames, taosMemoryFree);
L
Liu Jicong 已提交
1235
  taosMemoryFree(buf);
L
Liu Jicong 已提交
1236
  taosMemoryFree(sendInfo);
L
Liu Jicong 已提交
1237

L
Liu Jicong 已提交
1238
  return code;
1239 1240
}

L
Liu Jicong 已提交
1241
void tmq_conf_set_auto_commit_cb(tmq_conf_t* conf, tmq_commit_cb* cb, void* param) {
1242
  conf->commitCb = cb;
L
Liu Jicong 已提交
1243
  conf->commitCbUserParam = param;
L
Liu Jicong 已提交
1244
}
1245

D
dapan1121 已提交
1246
int32_t tmqPollCb(void* param, SDataBuf* pMsg, int32_t code) {
X
Xiaoyu Wang 已提交
1247
  SMqPollCbParam* pParam = (SMqPollCbParam*)param;
1248 1249

  int64_t         refId = pParam->refId;
X
Xiaoyu Wang 已提交
1250
  SMqClientVg*    pVg = pParam->pVg;
L
Liu Jicong 已提交
1251
  SMqClientTopic* pTopic = pParam->pTopic;
1252

1253
  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
1254 1255 1256 1257
  if (tmq == NULL) {
    tsem_destroy(&pParam->rspSem);
    taosMemoryFree(pParam);
    taosMemoryFree(pMsg->pData);
dengyihao's avatar
dengyihao 已提交
1258
    taosMemoryFree(pMsg->pEpSet);
1259 1260 1261 1262
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

H
Haojun Liao 已提交
1263 1264 1265 1266
  int32_t  epoch = pParam->epoch;
  int32_t  vgId = pParam->vgId;
  uint64_t requestId = pParam->requestId;

L
Liu Jicong 已提交
1267
  taosMemoryFree(pParam);
H
Haojun Liao 已提交
1268

L
Liu Jicong 已提交
1269
  if (code != 0) {
H
Haojun Liao 已提交
1270 1271
    tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d, since %s, reqId:0x%" PRIx64, tmq->consumerId,
            vgId, epoch, tstrerror(code), requestId);
H
Haojun Liao 已提交
1272

L
Liu Jicong 已提交
1273
    if (pMsg->pData) taosMemoryFree(pMsg->pData);
dengyihao's avatar
dengyihao 已提交
1274 1275
    if (pMsg->pEpSet) taosMemoryFree(pMsg->pEpSet);

H
Haojun Liao 已提交
1276
    // in case of consumer mismatch, wait for 500ms and retry
L
Liu Jicong 已提交
1277
    if (code == TSDB_CODE_TMQ_CONSUMER_MISMATCH) {
1278
      taosMsleep(500);
L
Liu Jicong 已提交
1279
      atomic_store_8(&tmq->status, TMQ_CONSUMER_STATUS__RECOVER);
1280
      tscDebug("consumer:0x%" PRIx64" wait for the re-balance, wait for 500ms and set status to be RECOVER", tmq->consumerId);
H
Haojun Liao 已提交
1281
    } else if (code == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
S
Shengliang Guan 已提交
1282
      SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
L
Liu Jicong 已提交
1283
      if (pRspWrapper == NULL) {
H
Haojun Liao 已提交
1284 1285
        tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d since out of memory, reqId:0x%" PRIx64,
                tmq->consumerId, vgId, epoch, requestId);
L
Liu Jicong 已提交
1286 1287
        goto CREATE_MSG_FAIL;
      }
H
Haojun Liao 已提交
1288

L
Liu Jicong 已提交
1289 1290 1291
      pRspWrapper->tmqRspType = TMQ_MSG_TYPE__END_RSP;
      taosWriteQitem(tmq->mqueue, pRspWrapper);
    }
H
Haojun Liao 已提交
1292

L
fix txn  
Liu Jicong 已提交
1293
    goto CREATE_MSG_FAIL;
L
Liu Jicong 已提交
1294 1295
  }

X
Xiaoyu Wang 已提交
1296 1297 1298
  int32_t msgEpoch = ((SMqRspHead*)pMsg->pData)->epoch;
  int32_t tmqEpoch = atomic_load_32(&tmq->epoch);
  if (msgEpoch < tmqEpoch) {
L
Liu Jicong 已提交
1299
    // do not write into queue since updating epoch reset
H
Haojun Liao 已提交
1300 1301 1302
    tscWarn("consumer:0x%" PRIx64 " msg discard from vgId:%d since from earlier epoch, rsp epoch %d, current epoch %d, reqId:0x%"PRIx64,
            tmq->consumerId, vgId, msgEpoch, tmqEpoch, requestId);

1303
    tsem_post(&tmq->rspSem);
1304 1305
    taosReleaseRef(tmqMgmt.rsetId, refId);

L
Liu Jicong 已提交
1306
    taosMemoryFree(pMsg->pData);
dengyihao's avatar
dengyihao 已提交
1307
    taosMemoryFree(pMsg->pEpSet);
X
Xiaoyu Wang 已提交
1308 1309 1310 1311
    return 0;
  }

  if (msgEpoch != tmqEpoch) {
H
Haojun Liao 已提交
1312 1313
    tscWarn("consumer:0x%" PRIx64 " mismatch rsp from vgId:%d, epoch %d, current epoch %d, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, msgEpoch, tmqEpoch, requestId);
X
Xiaoyu Wang 已提交
1314 1315
  }

L
Liu Jicong 已提交
1316 1317 1318
  // handle meta rsp
  int8_t rspType = ((SMqRspHead*)pMsg->pData)->mqMsgType;

S
Shengliang Guan 已提交
1319
  SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
L
Liu Jicong 已提交
1320
  if (pRspWrapper == NULL) {
L
Liu Jicong 已提交
1321
    taosMemoryFree(pMsg->pData);
dengyihao's avatar
dengyihao 已提交
1322
    taosMemoryFree(pMsg->pEpSet);
H
Haojun Liao 已提交
1323
    tscWarn("consumer:0x%"PRIx64" msg discard from vgId:%d, epoch %d since out of memory", tmq->consumerId, vgId, epoch);
L
fix txn  
Liu Jicong 已提交
1324
    goto CREATE_MSG_FAIL;
L
Liu Jicong 已提交
1325
  }
L
Liu Jicong 已提交
1326

L
Liu Jicong 已提交
1327
  pRspWrapper->tmqRspType = rspType;
L
Liu Jicong 已提交
1328 1329
  pRspWrapper->vgHandle = pVg;
  pRspWrapper->topicHandle = pTopic;
H
Haojun Liao 已提交
1330
  pRspWrapper->reqId = requestId;
1331
  pRspWrapper->pEpset = pMsg->pEpSet;
L
Liu Jicong 已提交
1332

1333
  pMsg->pEpSet = NULL;
L
Liu Jicong 已提交
1334
  if (rspType == TMQ_MSG_TYPE__POLL_RSP) {
L
Liu Jicong 已提交
1335 1336 1337
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSMqDataRsp(&decoder, &pRspWrapper->dataRsp);
wmmhello's avatar
wmmhello 已提交
1338
    tDecoderClear(&decoder);
L
Liu Jicong 已提交
1339
    memcpy(&pRspWrapper->dataRsp, pMsg->pData, sizeof(SMqRspHead));
L
Liu Jicong 已提交
1340

H
Haojun Liao 已提交
1341 1342 1343 1344
    char buf[80];
    tFormatOffset(buf, 80, &pRspWrapper->dataRsp.rspOffset);
    tscDebug("consumer:0x%" PRIx64 " recv poll rsp, vgId:%d, req:%" PRId64 ", rsp:%s type %d, reqId:0x%" PRIx64,
             tmq->consumerId, vgId, pRspWrapper->dataRsp.reqOffset.version, buf, rspType, requestId);
L
Liu Jicong 已提交
1345
  } else if (rspType == TMQ_MSG_TYPE__POLL_META_RSP) {
1346 1347 1348 1349
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSMqMetaRsp(&decoder, &pRspWrapper->metaRsp);
    tDecoderClear(&decoder);
L
Liu Jicong 已提交
1350
    memcpy(&pRspWrapper->metaRsp, pMsg->pData, sizeof(SMqRspHead));
L
Liu Jicong 已提交
1351 1352 1353 1354 1355 1356
  } else if (rspType == TMQ_MSG_TYPE__TAOSX_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSTaosxRsp(&decoder, &pRspWrapper->taosxRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->taosxRsp, pMsg->pData, sizeof(SMqRspHead));
H
Haojun Liao 已提交
1357 1358
  } else { // invalid rspType
    tscError("consumer:0x%"PRIx64" invalid rsp msg received, type:%d ignored", tmq->consumerId, rspType);
L
Liu Jicong 已提交
1359
  }
L
Liu Jicong 已提交
1360

L
Liu Jicong 已提交
1361
  taosMemoryFree(pMsg->pData);
H
Haojun Liao 已提交
1362
  taosWriteQitem(tmq->mqueue, pRspWrapper);
L
Liu Jicong 已提交
1363

H
Haojun Liao 已提交
1364 1365 1366
  tscDebug("consumer:0x%" PRIx64 " put poll res into mqueue, type:%d, vgId:%d, total in queue:%d, reqId:0x%" PRIx64,
           tmq->consumerId, rspType, vgId, tmq->mqueue->numOfItems, requestId);

1367
  tsem_post(&tmq->rspSem);
1368 1369
  taosReleaseRef(tmqMgmt.rsetId, refId);

L
Liu Jicong 已提交
1370
  return 0;
H
Haojun Liao 已提交
1371

L
fix txn  
Liu Jicong 已提交
1372
CREATE_MSG_FAIL:
L
Liu Jicong 已提交
1373
  if (epoch == tmq->epoch) {
L
Liu Jicong 已提交
1374 1375
    atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
  }
H
Haojun Liao 已提交
1376

1377
  tsem_post(&tmq->rspSem);
1378 1379
  taosReleaseRef(tmqMgmt.rsetId, refId);

L
Liu Jicong 已提交
1380
  return -1;
1381 1382
}

H
Haojun Liao 已提交
1383 1384 1385 1386 1387
typedef struct SVgroupSaveInfo {
  STqOffsetVal offset;
  int64_t      numOfRows;
} SVgroupSaveInfo;

H
Haojun Liao 已提交
1388 1389 1390 1391 1392 1393 1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404
static void initClientTopicFromRsp(SMqClientTopic* pTopic, SMqSubTopicEp* pTopicEp, SHashObj* pVgOffsetHashMap,
                                   tmq_t* tmq) {
  pTopic->schema = pTopicEp->schema;
  pTopicEp->schema.nCols = 0;
  pTopicEp->schema.pSchema = NULL;

  char vgKey[TSDB_TOPIC_FNAME_LEN + 22];
  int32_t vgNumGet = taosArrayGetSize(pTopicEp->vgs);

  tstrncpy(pTopic->topicName, pTopicEp->topic, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pTopic->db, pTopicEp->db, TSDB_DB_FNAME_LEN);

  tscDebug("consumer:0x%" PRIx64 ", update topic:%s, numOfVgs:%d", tmq->consumerId, pTopic->topicName, vgNumGet);
  pTopic->vgs = taosArrayInit(vgNumGet, sizeof(SMqClientVg));

  for (int32_t j = 0; j < vgNumGet; j++) {
    SMqSubVgEp* pVgEp = taosArrayGet(pTopicEp->vgs, j);
H
Haojun Liao 已提交
1405 1406

    makeTopicVgroupKey(vgKey, pTopic->topicName, pVgEp->vgId);
H
Haojun Liao 已提交
1407
    SVgroupSaveInfo* pInfo = taosHashGet(pVgOffsetHashMap, vgKey, strlen(vgKey));
H
Haojun Liao 已提交
1408

H
Haojun Liao 已提交
1409
    int64_t numOfRows = 0;
H
Haojun Liao 已提交
1410
    STqOffsetVal  offsetNew = {.type = tmq->resetOffsetCfg};
H
Haojun Liao 已提交
1411 1412 1413
    if (pInfo != NULL) {
      offsetNew = pInfo->offset;
      numOfRows = pInfo->numOfRows;
H
Haojun Liao 已提交
1414 1415 1416 1417 1418 1419 1420 1421 1422
    }

    SMqClientVg clientVg = {
        .pollCnt = 0,
        .currentOffset = offsetNew,
        .vgId = pVgEp->vgId,
        .epSet = pVgEp->epSet,
        .vgStatus = TMQ_VG_STATUS__IDLE,
        .vgSkipCnt = 0,
H
Haojun Liao 已提交
1423
        .emptyBlockReceiveTs = 0,
H
Haojun Liao 已提交
1424
        .numOfRows = numOfRows,
H
Haojun Liao 已提交
1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440
    };

    taosArrayPush(pTopic->vgs, &clientVg);
  }
}

static void freeClientVgInfo(void* param) {
  SMqClientTopic* pTopic = param;
  if (pTopic->schema.nCols) {
    taosMemoryFreeClear(pTopic->schema.pSchema);
  }

  taosArrayDestroy(pTopic->vgs);
}

static bool tmqUpdateEp(tmq_t* tmq, int32_t epoch, const SMqAskEpRsp* pRsp) {
1441 1442
  bool set = false;

1443
  int32_t topicNumCur = taosArrayGetSize(tmq->clientTopics);
1444
  int32_t topicNumGet = taosArrayGetSize(pRsp->topics);
1445

X
Xiaoyu Wang 已提交
1446 1447
  char vgKey[TSDB_TOPIC_FNAME_LEN + 22];
  tscDebug("consumer:0x%" PRIx64 " update ep epoch from %d to epoch %d, incoming topics:%d, existed topics:%d",
1448
           tmq->consumerId, tmq->epoch, epoch, topicNumGet, topicNumCur);
1449 1450 1451 1452 1453 1454

  SArray* newTopics = taosArrayInit(topicNumGet, sizeof(SMqClientTopic));
  if (newTopics == NULL) {
    return false;
  }

H
Haojun Liao 已提交
1455 1456
  SHashObj* pVgOffsetHashMap = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
  if (pVgOffsetHashMap == NULL) {
1457 1458 1459
    taosArrayDestroy(newTopics);
    return false;
  }
1460

H
Haojun Liao 已提交
1461
  // todo extract method
1462 1463 1464 1465 1466
  for (int32_t i = 0; i < topicNumCur; i++) {
    // find old topic
    SMqClientTopic* pTopicCur = taosArrayGet(tmq->clientTopics, i);
    if (pTopicCur->vgs) {
      int32_t vgNumCur = taosArrayGetSize(pTopicCur->vgs);
1467
      tscDebug("consumer:0x%" PRIx64 ", new vg num: %d", tmq->consumerId, vgNumCur);
1468 1469
      for (int32_t j = 0; j < vgNumCur; j++) {
        SMqClientVg* pVgCur = taosArrayGet(pTopicCur->vgs, j);
H
Haojun Liao 已提交
1470 1471
        makeTopicVgroupKey(vgKey, pTopicCur->topicName, pVgCur->vgId);

L
Liu Jicong 已提交
1472
        char buf[80];
L
Liu Jicong 已提交
1473
        tFormatOffset(buf, 80, &pVgCur->currentOffset);
H
Haojun Liao 已提交
1474
        tscDebug("consumer:0x%" PRIx64 ", epoch:%d vgId:%d vgKey:%s, offset:%s", tmq->consumerId, epoch,
L
Liu Jicong 已提交
1475
                 pVgCur->vgId, vgKey, buf);
H
Haojun Liao 已提交
1476 1477 1478

        SVgroupSaveInfo info = {.offset = pVgCur->currentOffset, .numOfRows = pVgCur->numOfRows};
        taosHashPut(pVgOffsetHashMap, vgKey, strlen(vgKey), &info, sizeof(SVgroupSaveInfo));
1479 1480 1481 1482 1483 1484 1485
      }
    }
  }

  for (int32_t i = 0; i < topicNumGet; i++) {
    SMqClientTopic topic = {0};
    SMqSubTopicEp* pTopicEp = taosArrayGet(pRsp->topics, i);
H
Haojun Liao 已提交
1486
    initClientTopicFromRsp(&topic, pTopicEp, pVgOffsetHashMap, tmq);
1487 1488
    taosArrayPush(newTopics, &topic);
  }
1489

H
Haojun Liao 已提交
1490 1491 1492
  taosHashCleanup(pVgOffsetHashMap);

  taosThreadMutexLock(&tmq->lock);
1493
  // destroy current buffered existed topics info
1494
  if (tmq->clientTopics) {
H
Haojun Liao 已提交
1495
    taosArrayDestroyEx(tmq->clientTopics, freeClientVgInfo);
X
Xiaoyu Wang 已提交
1496
  }
1497

H
Haojun Liao 已提交
1498 1499
  tmq->clientTopics = newTopics;
  taosThreadMutexUnlock(&tmq->lock);
1500

H
Haojun Liao 已提交
1501 1502
  int8_t flag = (topicNumGet == 0)? TMQ_CONSUMER_STATUS__NO_TOPIC:TMQ_CONSUMER_STATUS__READY;
  atomic_store_8(&tmq->status, flag);
X
Xiaoyu Wang 已提交
1503
  atomic_store_32(&tmq->epoch, epoch);
H
Haojun Liao 已提交
1504

1505
  tscDebug("consumer:0x%" PRIx64 " update topic info completed", tmq->consumerId);
X
Xiaoyu Wang 已提交
1506 1507 1508
  return set;
}

H
Haojun Liao 已提交
1509
static int32_t tmqAskEpCb(void* param, SDataBuf* pMsg, int32_t code) {
1510
  SMqAskEpCbParam* pParam = (SMqAskEpCbParam*)param;
L
Liu Jicong 已提交
1511
  int8_t           async = pParam->async;
1512 1513 1514 1515 1516 1517 1518 1519 1520
  tmq_t*           tmq = taosAcquireRef(tmqMgmt.rsetId, pParam->refId);

  if (tmq == NULL) {
    if (!async) {
      tsem_destroy(&pParam->rspSem);
    } else {
      taosMemoryFree(pParam);
    }
    taosMemoryFree(pMsg->pData);
dengyihao's avatar
dengyihao 已提交
1521
    taosMemoryFree(pMsg->pEpSet);
1522 1523 1524 1525
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

L
Liu Jicong 已提交
1526
  pParam->code = code;
H
Haojun Liao 已提交
1527
  if (code != TSDB_CODE_SUCCESS) {
X
Xiaoyu Wang 已提交
1528 1529
    tscError("consumer:0x%" PRIx64 ", get topic endpoint error, async:%d, code:%s", tmq->consumerId, pParam->async,
             tstrerror(code));
L
Liu Jicong 已提交
1530
    goto END;
1531
  }
L
Liu Jicong 已提交
1532

L
Liu Jicong 已提交
1533
  // tmq's epoch is monotonically increase,
L
Liu Jicong 已提交
1534
  // so it's safe to discard any old epoch msg.
L
Liu Jicong 已提交
1535
  // Epoch will only increase when received newer epoch ep msg
L
Liu Jicong 已提交
1536 1537 1538
  SMqRspHead* head = pMsg->pData;
  int32_t     epoch = atomic_load_32(&tmq->epoch);
  if (head->epoch <= epoch) {
1539 1540
    tscDebug("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, no need to update local ep",
             tmq->consumerId, head->epoch, epoch);
1541 1542 1543 1544 1545 1546 1547 1548
    if (tmq->status == TMQ_CONSUMER_STATUS__RECOVER) {
      SMqAskEpRsp rsp;
      tDecodeSMqAskEpRsp(POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), &rsp);
      int8_t flag = (taosArrayGetSize(rsp.topics) == 0) ? TMQ_CONSUMER_STATUS__NO_TOPIC : TMQ_CONSUMER_STATUS__READY;
      atomic_store_8(&tmq->status, flag);
      tDeleteSMqAskEpRsp(&rsp);
    }

L
Liu Jicong 已提交
1549
    goto END;
1550
  }
L
Liu Jicong 已提交
1551

1552 1553 1554
  tscDebug("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, update local ep", tmq->consumerId,
           head->epoch, epoch);

L
Liu Jicong 已提交
1555
  if (!async) {
L
Liu Jicong 已提交
1556 1557
    SMqAskEpRsp rsp;
    tDecodeSMqAskEpRsp(POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), &rsp);
L
Liu Jicong 已提交
1558
    tmqUpdateEp(tmq, head->epoch, &rsp);
L
Liu Jicong 已提交
1559
    tDeleteSMqAskEpRsp(&rsp);
X
Xiaoyu Wang 已提交
1560
  } else {
S
Shengliang Guan 已提交
1561
    SMqAskEpRspWrapper* pWrapper = taosAllocateQitem(sizeof(SMqAskEpRspWrapper), DEF_QITEM, 0);
L
Liu Jicong 已提交
1562
    if (pWrapper == NULL) {
X
Xiaoyu Wang 已提交
1563
      terrno = TSDB_CODE_OUT_OF_MEMORY;
L
Liu Jicong 已提交
1564 1565
      code = -1;
      goto END;
X
Xiaoyu Wang 已提交
1566
    }
1567

L
Liu Jicong 已提交
1568 1569 1570
    pWrapper->tmqRspType = TMQ_MSG_TYPE__EP_RSP;
    pWrapper->epoch = head->epoch;
    memcpy(&pWrapper->msg, pMsg->pData, sizeof(SMqRspHead));
L
Liu Jicong 已提交
1571
    tDecodeSMqAskEpRsp(POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), &pWrapper->msg);
L
Liu Jicong 已提交
1572

L
Liu Jicong 已提交
1573
    taosWriteQitem(tmq->mqueue, pWrapper);
1574
    tsem_post(&tmq->rspSem);
1575
  }
L
Liu Jicong 已提交
1576 1577

END:
1578 1579
  taosReleaseRef(tmqMgmt.rsetId, pParam->refId);

L
Liu Jicong 已提交
1580
  if (!async) {
L
Liu Jicong 已提交
1581
    tsem_post(&pParam->rspSem);
L
Liu Jicong 已提交
1582 1583
  } else {
    taosMemoryFree(pParam);
L
Liu Jicong 已提交
1584
  }
dengyihao's avatar
dengyihao 已提交
1585 1586

  taosMemoryFree(pMsg->pEpSet);
L
Liu Jicong 已提交
1587
  taosMemoryFree(pMsg->pData);
L
Liu Jicong 已提交
1588
  return code;
1589 1590
}

L
Liu Jicong 已提交
1591
void tmqBuildConsumeReqImpl(SMqPollReq* pReq, tmq_t* tmq, int64_t timeout, SMqClientTopic* pTopic, SMqClientVg* pVg) {
L
Liu Jicong 已提交
1592 1593 1594 1595
  int32_t groupLen = strlen(tmq->groupId);
  memcpy(pReq->subKey, tmq->groupId, groupLen);
  pReq->subKey[groupLen] = TMQ_SEPARATOR;
  strcpy(pReq->subKey + groupLen + 1, pTopic->topicName);
1596

1597
  pReq->withTbName = tmq->withTbName;
L
Liu Jicong 已提交
1598
  pReq->consumerId = tmq->consumerId;
1599
  pReq->timeout = timeout;
X
Xiaoyu Wang 已提交
1600
  pReq->epoch = tmq->epoch;
L
Liu Jicong 已提交
1601
  /*pReq->currentOffset = reqOffset;*/
L
Liu Jicong 已提交
1602
  pReq->reqOffset = pVg->currentOffset;
D
dapan1121 已提交
1603
  pReq->head.vgId = pVg->vgId;
1604 1605
  pReq->useSnapshot = tmq->useSnapshot;
  pReq->reqId = generateRequestId();
1606 1607
}

L
Liu Jicong 已提交
1608 1609
SMqMetaRspObj* tmqBuildMetaRspFromWrapper(SMqPollRspWrapper* pWrapper) {
  SMqMetaRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqMetaRspObj));
L
Liu Jicong 已提交
1610
  pRspObj->resType = RES_TYPE__TMQ_META;
L
Liu Jicong 已提交
1611 1612 1613 1614 1615 1616 1617 1618
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;

  memcpy(&pRspObj->metaRsp, &pWrapper->metaRsp, sizeof(SMqMetaRsp));
  return pRspObj;
}

1619
SMqRspObj* tmqBuildRspFromWrapper(SMqPollRspWrapper* pWrapper, SMqClientVg* pVg, int64_t* numOfRows) {
L
Liu Jicong 已提交
1620 1621
  SMqRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqRspObj));
  pRspObj->resType = RES_TYPE__TMQ;
1622

1623
  (*numOfRows) = 0;
L
Liu Jicong 已提交
1624 1625
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
1626

L
Liu Jicong 已提交
1627
  pRspObj->vgId = pWrapper->vgHandle->vgId;
L
Liu Jicong 已提交
1628
  pRspObj->resIter = -1;
L
Liu Jicong 已提交
1629
  memcpy(&pRspObj->rsp, &pWrapper->dataRsp, sizeof(SMqDataRsp));
L
Liu Jicong 已提交
1630

L
Liu Jicong 已提交
1631 1632
  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;
1633

L
Liu Jicong 已提交
1634
  if (!pWrapper->dataRsp.withSchema) {
L
Liu Jicong 已提交
1635 1636
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }
L
Liu Jicong 已提交
1637

1638 1639 1640 1641 1642
  // extract the rows in this data packet
  for(int32_t i = 0; i < pRspObj->rsp.blockNum; ++i) {
    SRetrieveTableRsp* pRetrieve = (SRetrieveTableRsp*)taosArrayGetP(pRspObj->rsp.blockData, i);
    int64_t rows = htobe64(pRetrieve->numOfRows);
    pVg->numOfRows += rows;
1643
    (*numOfRows) += rows;
1644 1645
  }

L
Liu Jicong 已提交
1646
  return pRspObj;
X
Xiaoyu Wang 已提交
1647 1648
}

L
Liu Jicong 已提交
1649 1650
SMqTaosxRspObj* tmqBuildTaosxRspFromWrapper(SMqPollRspWrapper* pWrapper) {
  SMqTaosxRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqTaosxRspObj));
1651
  pRspObj->resType = RES_TYPE__TMQ_METADATA;
L
Liu Jicong 已提交
1652 1653 1654 1655
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;
  pRspObj->resIter = -1;
1656
  memcpy(&pRspObj->rsp, &pWrapper->taosxRsp, sizeof(STaosxRsp));
L
Liu Jicong 已提交
1657 1658 1659

  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;
1660
  if (!pWrapper->taosxRsp.withSchema) {
L
Liu Jicong 已提交
1661 1662 1663 1664 1665 1666
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }

  return pRspObj;
}

1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699
static int32_t handleErrorBeforePoll(SMqClientVg* pVg, tmq_t* pTmq) {
  atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
  tsem_post(&pTmq->rspSem);
  return -1;
}

static int32_t doTmqPollImpl(tmq_t* pTmq, SMqClientTopic* pTopic, SMqClientVg* pVg, int64_t timeout) {
  SMqPollReq req = {0};
  tmqBuildConsumeReqImpl(&req, pTmq, timeout, pTopic, pVg);

  int32_t msgSize = tSerializeSMqPollReq(NULL, 0, &req);
  if (msgSize < 0) {
    return handleErrorBeforePoll(pVg, pTmq);
  }

  char* msg = taosMemoryCalloc(1, msgSize);
  if (NULL == msg) {
    return handleErrorBeforePoll(pVg, pTmq);
  }

  if (tSerializeSMqPollReq(msg, msgSize, &req) < 0) {
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  SMqPollCbParam* pParam = taosMemoryMalloc(sizeof(SMqPollCbParam));
  if (pParam == NULL) {
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  pParam->refId = pTmq->refId;
  pParam->epoch = pTmq->epoch;
X
Xiaoyu Wang 已提交
1700
  pParam->pVg = pVg;  // pVg may be released,fix it
1701 1702
  pParam->pTopic = pTopic;
  pParam->vgId = pVg->vgId;
H
Haojun Liao 已提交
1703
  pParam->requestId = req.reqId;
1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pParam);
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  sendInfo->msgInfo = (SDataBuf){
      .pData = msg,
      .len = msgSize,
      .handle = NULL,
  };

  sendInfo->requestId = req.reqId;
  sendInfo->requestObjRefId = 0;
  sendInfo->param = pParam;
  sendInfo->fp = tmqPollCb;
  sendInfo->msgType = TDMT_VND_TMQ_CONSUME;

  int64_t transporterId = 0;
  char    offsetFormatBuf[80];
  tFormatOffset(offsetFormatBuf, tListLen(offsetFormatBuf), &pVg->currentOffset);

H
Haojun Liao 已提交
1728
  tscDebug("consumer:0x%" PRIx64 " send poll to %s vgId:%d, epoch %d, req:%s, reqId:0x%" PRIx64,
1729 1730 1731 1732 1733 1734 1735 1736 1737
           pTmq->consumerId, pTopic->topicName, pVg->vgId, pTmq->epoch, offsetFormatBuf, req.reqId);
  asyncSendMsgToServer(pTmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, sendInfo);

  pVg->pollCnt++;
  pTmq->pollCnt++;

  return TSDB_CODE_SUCCESS;
}

1738
// broadcast the poll request to all related vnodes
H
Haojun Liao 已提交
1739
static int32_t tmqPollImpl(tmq_t* tmq, int64_t timeout) {
1740
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
X
Xiaoyu Wang 已提交
1741
  tscDebug("consumer:0x%" PRIx64 " start to poll data, numOfTopics:%d", tmq->consumerId, numOfTopics);
1742 1743

  for (int i = 0; i < numOfTopics; i++) {
X
Xiaoyu Wang 已提交
1744
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
X
Xiaoyu Wang 已提交
1745
    int32_t         numOfVg = taosArrayGetSize(pTopic->vgs);
1746 1747

    for (int j = 0; j < numOfVg; j++) {
X
Xiaoyu Wang 已提交
1748
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);
1749
      if (taosGetTimestampMs() - pVg->emptyBlockReceiveTs < EMPTY_BLOCK_POLL_IDLE_DURATION) { // less than 100ms
H
Haojun Liao 已提交
1750 1751
        tscTrace("consumer:0x%" PRIx64 " epoch %d, vgId:%d idle for 100ms before start next poll", tmq->consumerId, tmq->epoch,
                 pVg->vgId);
H
Haojun Liao 已提交
1752 1753 1754
        continue;
      }

1755
      int32_t vgStatus = atomic_val_compare_exchange_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE, TMQ_VG_STATUS__WAIT);
1756
      if (vgStatus == TMQ_VG_STATUS__WAIT) {
L
Liu Jicong 已提交
1757
        int32_t vgSkipCnt = atomic_add_fetch_32(&pVg->vgSkipCnt, 1);
H
Haojun Liao 已提交
1758
        tscTrace("consumer:0x%" PRIx64 " epoch %d wait poll-rsp, skip vgId:%d skip cnt %d", tmq->consumerId, tmq->epoch,
X
Xiaoyu Wang 已提交
1759
                 pVg->vgId, vgSkipCnt);
X
Xiaoyu Wang 已提交
1760
        continue;
L
temp  
Liu Jicong 已提交
1761 1762 1763 1764
#if 0
        if (skipCnt < 30000) {
          continue;
        } else {
1765
        tscDebug("consumer:0x%" PRIx64 ",skip vgId:%d skip too much reset", tmq->consumerId, pVg->vgId);
L
temp  
Liu Jicong 已提交
1766 1767
        }
#endif
X
Xiaoyu Wang 已提交
1768
      }
1769

L
Liu Jicong 已提交
1770
      atomic_store_32(&pVg->vgSkipCnt, 0);
1771 1772 1773
      int32_t code = doTmqPollImpl(tmq, pTopic, pVg, timeout);
      if (code != TSDB_CODE_SUCCESS) {
        return code;
D
dapan1121 已提交
1774
      }
X
Xiaoyu Wang 已提交
1775 1776
    }
  }
1777

1778
  tscDebug("consumer:0x%" PRIx64 " end to poll data", tmq->consumerId);
X
Xiaoyu Wang 已提交
1779 1780 1781
  return 0;
}

H
Haojun Liao 已提交
1782
static int32_t tmqHandleNoPollRsp(tmq_t* tmq, SMqRspWrapper* rspWrapper, bool* pReset) {
L
Liu Jicong 已提交
1783
  if (rspWrapper->tmqRspType == TMQ_MSG_TYPE__EP_RSP) {
L
fix  
Liu Jicong 已提交
1784
    /*printf("ep %d %d\n", rspMsg->head.epoch, tmq->epoch);*/
L
Liu Jicong 已提交
1785 1786
    if (rspWrapper->epoch > atomic_load_32(&tmq->epoch)) {
      SMqAskEpRspWrapper* pEpRspWrapper = (SMqAskEpRspWrapper*)rspWrapper;
L
Liu Jicong 已提交
1787
      SMqAskEpRsp*        rspMsg = &pEpRspWrapper->msg;
L
Liu Jicong 已提交
1788
      tmqUpdateEp(tmq, rspWrapper->epoch, rspMsg);
L
temp  
Liu Jicong 已提交
1789
      /*tmqClearUnhandleMsg(tmq);*/
L
Liu Jicong 已提交
1790
      tDeleteSMqAskEpRsp(rspMsg);
X
Xiaoyu Wang 已提交
1791 1792
      *pReset = true;
    } else {
L
Liu Jicong 已提交
1793
      tmqFreeRspWrapper(rspWrapper);
X
Xiaoyu Wang 已提交
1794 1795 1796 1797 1798 1799 1800 1801
      *pReset = false;
    }
  } else {
    return -1;
  }
  return 0;
}

H
Haojun Liao 已提交
1802
static void* tmqHandleAllRsp(tmq_t* tmq, int64_t timeout, bool pollIfReset) {
H
Haojun Liao 已提交
1803
  tscDebug("consumer:0x%" PRIx64 " start to handle the rsp, total:%d", tmq->consumerId, tmq->qall->numOfItems);
1804

X
Xiaoyu Wang 已提交
1805
  while (1) {
1806 1807
    SMqRspWrapper* pRspWrapper = NULL;
    taosGetQitem(tmq->qall, (void**)&pRspWrapper);
1808

1809
    if (pRspWrapper == NULL) {
L
Liu Jicong 已提交
1810
      taosReadAllQitems(tmq->mqueue, tmq->qall);
1811
      taosGetQitem(tmq->qall, (void**)&pRspWrapper);
L
Liu Jicong 已提交
1812

1813
      if (pRspWrapper == NULL) {
L
Liu Jicong 已提交
1814 1815
        return NULL;
      }
X
Xiaoyu Wang 已提交
1816 1817
    }

1818
    tscDebug("consumer:0x%"PRIx64" handle rsp, type:%d", tmq->consumerId, pRspWrapper->tmqRspType);
H
Haojun Liao 已提交
1819

1820 1821
    if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__END_RSP) {
      taosFreeQitem(pRspWrapper);
L
Liu Jicong 已提交
1822
      terrno = TSDB_CODE_TQ_NO_COMMITTED_OFFSET;
H
Haojun Liao 已提交
1823
      tscError("consumer:0x%" PRIx64 " unexpected rsp from poll, code:%s", tmq->consumerId, tstrerror(terrno));
L
Liu Jicong 已提交
1824
      return NULL;
1825 1826
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
H
Haojun Liao 已提交
1827

1828
      int32_t consumerEpoch = atomic_load_32(&tmq->epoch);
1829 1830 1831 1832
      SMqDataRsp* pDataRsp = &pollRspWrapper->dataRsp;

      if (pDataRsp->head.epoch == consumerEpoch) {
        // todo fix it: race condition
L
Liu Jicong 已提交
1833
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844

        // update the epset
        if (pollRspWrapper->pEpset != NULL) {
          SEp* pEp = GET_ACTIVE_EP(pollRspWrapper->pEpset);
          SEp* pOld = GET_ACTIVE_EP(&(pVg->epSet));
          tscDebug("consumer:0x%" PRIx64 " update epset vgId:%d, ep:%s:%d, old ep:%s:%d", tmq->consumerId,
                   pVg->vgId, pEp->fqdn, pEp->port, pOld->fqdn, pOld->port);
          pVg->epSet = *pollRspWrapper->pEpset;
        }

        pVg->currentOffset = pDataRsp->rspOffset;
X
Xiaoyu Wang 已提交
1845
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
H
Haojun Liao 已提交
1846

1847 1848 1849
        char buf[80];
        tFormatOffset(buf, 80, &pDataRsp->rspOffset);
        if (pDataRsp->blockNum == 0) {
H
Haojun Liao 已提交
1850 1851
          tscDebug("consumer:0x%" PRIx64 " empty block received, vgId:%d, offset:%s, vg total:%"PRId64" total:%"PRId64" reqId:0x%" PRIx64, tmq->consumerId,
                   pVg->vgId, buf, pVg->numOfRows, tmq->totalRows, pollRspWrapper->reqId);
1852
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
L
Liu Jicong 已提交
1853
          taosFreeQitem(pollRspWrapper);
1854
        } else {  // build rsp
1855 1856
          int64_t numOfRows = 0;
          SMqRspObj* pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
H
Haojun Liao 已提交
1857 1858
          tmq->totalRows += numOfRows;

H
Haojun Liao 已提交
1859
          tscDebug("consumer:0x%" PRIx64 " process poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
H
Haojun Liao 已提交
1860
                   " vg total:%" PRId64 " total:%" PRId64 ", reqId:0x%" PRIx64,
H
Haojun Liao 已提交
1861
                   tmq->consumerId, pVg->vgId, buf, pDataRsp->blockNum, numOfRows, pVg->numOfRows, tmq->totalRows,
H
Haojun Liao 已提交
1862
                   pollRspWrapper->reqId);
1863 1864 1865
          taosFreeQitem(pollRspWrapper);
          return pRsp;
        }
X
Xiaoyu Wang 已提交
1866
      } else {
H
Haojun Liao 已提交
1867 1868 1869
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pVg->vgId, pDataRsp->head.epoch, consumerEpoch);
1870
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
L
Liu Jicong 已提交
1871 1872
        taosFreeQitem(pollRspWrapper);
      }
1873 1874
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_META_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
L
Liu Jicong 已提交
1875
      int32_t            consumerEpoch = atomic_load_32(&tmq->epoch);
1876 1877 1878

      tscDebug("consumer:0x%" PRIx64 " process meta rsp", tmq->consumerId);

L
Liu Jicong 已提交
1879
      if (pollRspWrapper->metaRsp.head.epoch == consumerEpoch) {
L
Liu Jicong 已提交
1880
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
wmmhello's avatar
wmmhello 已提交
1881
        pVg->currentOffset = pollRspWrapper->metaRsp.rspOffset;
L
Liu Jicong 已提交
1882 1883
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
        // build rsp
L
Liu Jicong 已提交
1884
        SMqMetaRspObj* pRsp = tmqBuildMetaRspFromWrapper(pollRspWrapper);
L
Liu Jicong 已提交
1885 1886 1887
        taosFreeQitem(pollRspWrapper);
        return pRsp;
      } else {
H
Haojun Liao 已提交
1888 1889
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgHandle->vgId, pollRspWrapper->metaRsp.head.epoch, consumerEpoch);
1890
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
L
Liu Jicong 已提交
1891
        taosFreeQitem(pollRspWrapper);
X
Xiaoyu Wang 已提交
1892
      }
1893 1894
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__TAOSX_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
L
Liu Jicong 已提交
1895
      int32_t consumerEpoch = atomic_load_32(&tmq->epoch);
H
Haojun Liao 已提交
1896

L
Liu Jicong 已提交
1897 1898 1899 1900
      if (pollRspWrapper->taosxRsp.head.epoch == consumerEpoch) {
        SMqClientVg* pVg = pollRspWrapper->vgHandle;
        pVg->currentOffset = pollRspWrapper->taosxRsp.rspOffset;
        atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
H
Haojun Liao 已提交
1901

L
Liu Jicong 已提交
1902
        if (pollRspWrapper->taosxRsp.blockNum == 0) {
H
Haojun Liao 已提交
1903 1904
          tscDebug("consumer:0x%" PRIx64 " taosx empty block received, vgId:%d, vg total:%" PRId64 " reqId:0x%" PRIx64,
                   tmq->consumerId, pVg->vgId, pVg->numOfRows, pollRspWrapper->reqId);
H
Haojun Liao 已提交
1905
          pVg->emptyBlockReceiveTs = taosGetTimestampMs();
1906
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
H
Haojun Liao 已提交
1907
          taosFreeQitem(pollRspWrapper);
L
Liu Jicong 已提交
1908
          continue;
H
Haojun Liao 已提交
1909 1910
        } else {
          pVg->emptyBlockReceiveTs = 0; // reset the ts
L
Liu Jicong 已提交
1911
        }
wmmhello's avatar
wmmhello 已提交
1912

L
Liu Jicong 已提交
1913
        // build rsp
wmmhello's avatar
wmmhello 已提交
1914
        void* pRsp = NULL;
1915
        int64_t numOfRows = 0;
L
Liu Jicong 已提交
1916
        if (pollRspWrapper->taosxRsp.createTableNum == 0) {
1917
          pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
L
Liu Jicong 已提交
1918
        } else {
wmmhello's avatar
wmmhello 已提交
1919 1920
          pRsp = tmqBuildTaosxRspFromWrapper(pollRspWrapper);
        }
H
Haojun Liao 已提交
1921

1922 1923
        tmq->totalRows += numOfRows;

H
Haojun Liao 已提交
1924 1925
        char buf[80];
        tFormatOffset(buf, 80, &pVg->currentOffset);
H
Haojun Liao 已提交
1926
        tscDebug("consumer:0x%" PRIx64 " process taosx poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
H
Haojun Liao 已提交
1927
                 ", vg total:%" PRId64 " total:%"PRId64" reqId:0x%" PRIx64,
H
Haojun Liao 已提交
1928
                 tmq->consumerId, pVg->vgId, buf, pollRspWrapper->dataRsp.blockNum, numOfRows, pVg->numOfRows,
H
Haojun Liao 已提交
1929
                 tmq->totalRows, pollRspWrapper->reqId);
H
Haojun Liao 已提交
1930 1931

        taosFreeQitem(pollRspWrapper);
L
Liu Jicong 已提交
1932
        return pRsp;
H
Haojun Liao 已提交
1933

L
Liu Jicong 已提交
1934
      } else {
H
Haojun Liao 已提交
1935 1936
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
                 tmq->consumerId, pollRspWrapper->vgHandle->vgId, pollRspWrapper->taosxRsp.head.epoch, consumerEpoch);
1937
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
L
Liu Jicong 已提交
1938 1939
        taosFreeQitem(pollRspWrapper);
      }
X
Xiaoyu Wang 已提交
1940
    } else {
H
Haojun Liao 已提交
1941 1942
      tscDebug("consumer:0x%" PRIx64 " not data msg received", tmq->consumerId);

X
Xiaoyu Wang 已提交
1943
      bool reset = false;
1944 1945
      tmqHandleNoPollRsp(tmq, pRspWrapper, &reset);
      taosFreeQitem(pRspWrapper);
X
Xiaoyu Wang 已提交
1946
      if (pollIfReset && reset) {
1947
        tscDebug("consumer:0x%" PRIx64 ", reset and repoll", tmq->consumerId);
1948
        tmqPollImpl(tmq, timeout);
X
Xiaoyu Wang 已提交
1949 1950 1951 1952 1953
      }
    }
  }
}

1954
TAOS_RES* tmq_consumer_poll(tmq_t* tmq, int64_t timeout) {
L
Liu Jicong 已提交
1955 1956
  void*   rspObj;
  int64_t startTime = taosGetTimestampMs();
L
Liu Jicong 已提交
1957

1958
  tscDebug("consumer:0x%" PRIx64 " start to poll at %" PRId64, tmq->consumerId, startTime);
L
Liu Jicong 已提交
1959

1960 1961 1962
#if 0
  tmqHandleAllDelayedTask(tmq);
  tmqPollImpl(tmq, timeout);
1963
  rspObj = tmqHandleAllRsp(tmq, timeout, false);
L
Liu Jicong 已提交
1964 1965
  if (rspObj) {
    return (TAOS_RES*)rspObj;
L
fix  
Liu Jicong 已提交
1966
  }
1967
#endif
X
Xiaoyu Wang 已提交
1968

1969
  // in no topic status, delayed task also need to be processed
L
Liu Jicong 已提交
1970
  if (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__INIT) {
1971
    tscDebug("consumer:0x%" PRIx64 " poll return since consumer is init", tmq->consumerId);
1972
    taosMsleep(500);  //     sleep for a while
1973 1974 1975
    return NULL;
  }

wmmhello's avatar
wmmhello 已提交
1976
  while (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__RECOVER) {
L
Liu Jicong 已提交
1977 1978
    int32_t retryCnt = 0;
    while (TSDB_CODE_MND_CONSUMER_NOT_READY == tmqAskEp(tmq, false)) {
H
Haojun Liao 已提交
1979
      if (retryCnt++ > 40) {
L
Liu Jicong 已提交
1980 1981
        return NULL;
      }
1982

H
Haojun Liao 已提交
1983
      tscDebug("consumer:0x%" PRIx64 " not ready, retry:%d/40 in 500ms", tmq->consumerId, retryCnt);
L
Liu Jicong 已提交
1984 1985 1986 1987
      taosMsleep(500);
    }
  }

X
Xiaoyu Wang 已提交
1988
  while (1) {
L
Liu Jicong 已提交
1989
    tmqHandleAllDelayedTask(tmq);
1990

L
Liu Jicong 已提交
1991
    if (tmqPollImpl(tmq, timeout) < 0) {
1992
      tscDebug("consumer:0x%" PRIx64 " return due to poll error", tmq->consumerId);
L
Liu Jicong 已提交
1993
    }
L
Liu Jicong 已提交
1994

1995
    rspObj = tmqHandleAllRsp(tmq, timeout, false);
L
Liu Jicong 已提交
1996
    if (rspObj) {
1997
      tscDebug("consumer:0x%" PRIx64 " return rsp %p", tmq->consumerId, rspObj);
L
Liu Jicong 已提交
1998
      return (TAOS_RES*)rspObj;
L
Liu Jicong 已提交
1999
    } else if (terrno == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
2000
      tscDebug("consumer:0x%" PRIx64 " return null since no committed offset", tmq->consumerId);
L
Liu Jicong 已提交
2001
      return NULL;
X
Xiaoyu Wang 已提交
2002
    }
2003

2004
    if (timeout >= 0) {
L
Liu Jicong 已提交
2005
      int64_t currentTime = taosGetTimestampMs();
2006 2007 2008
      int64_t elapsedTime = currentTime - startTime;
      if (elapsedTime > timeout) {
        tscDebug("consumer:0x%" PRIx64 " (epoch %d) timeout, no rsp, start time %" PRId64 ", current time %" PRId64,
L
Liu Jicong 已提交
2009
                 tmq->consumerId, tmq->epoch, startTime, currentTime);
X
Xiaoyu Wang 已提交
2010 2011
        return NULL;
      }
2012
      tsem_timewait(&tmq->rspSem, (timeout - elapsedTime));
L
Liu Jicong 已提交
2013 2014
    } else {
      // use tsem_timewait instead of tsem_wait to avoid unexpected stuck
L
Liu Jicong 已提交
2015
      tsem_timewait(&tmq->rspSem, 1000);
X
Xiaoyu Wang 已提交
2016 2017 2018 2019
    }
  }
}

2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033
static void displayConsumeStatistics(const tmq_t* pTmq) {
  int32_t numOfTopics = taosArrayGetSize(pTmq->clientTopics);
  tscDebug("consumer:0x%" PRIx64 " closing poll:%" PRId64 " rows:%" PRId64 " topics:%d, final epoch:%d",
           pTmq->consumerId, pTmq->pollCnt, pTmq->totalRows, numOfTopics, pTmq->epoch);

  tscDebug("consumer:0x%" PRIx64 " rows dist begin: ", pTmq->consumerId);
  for (int32_t i = 0; i < numOfTopics; ++i) {
    SMqClientTopic* pTopics = taosArrayGet(pTmq->clientTopics, i);

    tscDebug("consumer:0x%" PRIx64 " topic:%d", pTmq->consumerId, i);
    int32_t numOfVgs = taosArrayGetSize(pTopics->vgs);
    for (int32_t j = 0; j < numOfVgs; ++j) {
      SMqClientVg* pVg = taosArrayGet(pTopics->vgs, j);
      tscDebug("topic:%s, %d. vgId:%d rows:%" PRId64, pTopics->topicName, j, pVg->vgId, pVg->numOfRows);
2034
    }
2035
  }
2036

2037 2038
  tscDebug("consumer:0x%" PRIx64 " rows dist end", pTmq->consumerId);
}
2039

2040 2041 2042
int32_t tmq_consumer_close(tmq_t* tmq) {
  tscDebug("consumer:0x%" PRIx64" start to close consumer, status:%d", tmq->consumerId, tmq->status);
  displayConsumeStatistics(tmq);
2043

2044 2045 2046 2047 2048 2049
  if (tmq->status == TMQ_CONSUMER_STATUS__READY) {
    // if auto commit is set, commit before close consumer. Otherwise, do nothing.
    if (tmq->autoCommit) {
      int32_t rsp = tmq_commit_sync(tmq, NULL);
      if (rsp != 0) {
        return rsp;
2050 2051 2052
      }
    }

L
Liu Jicong 已提交
2053
    int32_t     retryCnt = 0;
2054
    tmq_list_t* lst = tmq_list_new();
L
Liu Jicong 已提交
2055
    while (1) {
2056
      int32_t rsp = tmq_subscribe(tmq, lst);
L
Liu Jicong 已提交
2057 2058 2059 2060 2061 2062 2063 2064
      if (rsp != TSDB_CODE_MND_CONSUMER_NOT_READY || retryCnt > 5) {
        break;
      } else {
        retryCnt++;
        taosMsleep(500);
      }
    }

2065
    tmq_list_destroy(lst);
2066 2067
  } else {
    tscWarn("consumer:0x%" PRIx64" not in ready state, close it directly", tmq->consumerId);
L
Liu Jicong 已提交
2068
  }
H
Haojun Liao 已提交
2069

2070
  taosRemoveRef(tmqMgmt.rsetId, tmq->refId);
L
Liu Jicong 已提交
2071
  return 0;
2072
}
L
Liu Jicong 已提交
2073

L
Liu Jicong 已提交
2074 2075
const char* tmq_err2str(int32_t err) {
  if (err == 0) {
L
Liu Jicong 已提交
2076
    return "success";
L
Liu Jicong 已提交
2077
  } else if (err == -1) {
L
Liu Jicong 已提交
2078 2079 2080
    return "fail";
  } else {
    return tstrerror(err);
L
Liu Jicong 已提交
2081 2082
  }
}
L
Liu Jicong 已提交
2083

L
Liu Jicong 已提交
2084 2085 2086 2087 2088
tmq_res_t tmq_get_res_type(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    return TMQ_RES_DATA;
  } else if (TD_RES_TMQ_META(res)) {
    return TMQ_RES_TABLE_META;
2089 2090
  } else if (TD_RES_TMQ_METADATA(res)) {
    return TMQ_RES_METADATA;
L
Liu Jicong 已提交
2091 2092 2093 2094 2095
  } else {
    return TMQ_RES_INVALID;
  }
}

L
Liu Jicong 已提交
2096
const char* tmq_get_topic_name(TAOS_RES* res) {
L
Liu Jicong 已提交
2097 2098
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
L
Liu Jicong 已提交
2099
    return strchr(pRspObj->topic, '.') + 1;
L
Liu Jicong 已提交
2100 2101 2102
  } else if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)res;
    return strchr(pMetaRspObj->topic, '.') + 1;
2103 2104 2105
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    return strchr(pRspObj->topic, '.') + 1;
L
Liu Jicong 已提交
2106 2107 2108 2109 2110
  } else {
    return NULL;
  }
}

L
Liu Jicong 已提交
2111 2112 2113 2114
const char* tmq_get_db_name(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
    return strchr(pRspObj->db, '.') + 1;
L
Liu Jicong 已提交
2115 2116 2117
  } else if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)res;
    return strchr(pMetaRspObj->db, '.') + 1;
2118 2119 2120
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    return strchr(pRspObj->db, '.') + 1;
L
Liu Jicong 已提交
2121 2122 2123 2124 2125
  } else {
    return NULL;
  }
}

L
Liu Jicong 已提交
2126 2127 2128 2129
int32_t tmq_get_vgroup_id(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
    return pRspObj->vgId;
L
Liu Jicong 已提交
2130 2131 2132
  } else if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)res;
    return pMetaRspObj->vgId;
2133
  } else if (TD_RES_TMQ_METADATA(res)) {
2134 2135
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    return pRspObj->vgId;
L
Liu Jicong 已提交
2136 2137 2138 2139
  } else {
    return -1;
  }
}
L
Liu Jicong 已提交
2140 2141 2142 2143 2144 2145 2146 2147

const char* tmq_get_table_name(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
    if (!pRspObj->rsp.withTbName || pRspObj->rsp.blockTbName == NULL || pRspObj->resIter < 0 ||
        pRspObj->resIter >= pRspObj->rsp.blockNum) {
      return NULL;
    }
2148
    return (const char*)taosArrayGetP(pRspObj->rsp.blockTbName, pRspObj->resIter);
2149 2150
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
L
Liu Jicong 已提交
2151 2152 2153
    if (!pRspObj->rsp.withTbName || pRspObj->rsp.blockTbName == NULL || pRspObj->resIter < 0 ||
        pRspObj->resIter >= pRspObj->rsp.blockNum) {
      return NULL;
2154
    }
L
Liu Jicong 已提交
2155 2156
    return (const char*)taosArrayGetP(pRspObj->rsp.blockTbName, pRspObj->resIter);
  }
L
Liu Jicong 已提交
2157 2158
  return NULL;
}
2159

L
Liu Jicong 已提交
2160
void tmq_commit_async(tmq_t* tmq, const TAOS_RES* msg, tmq_commit_cb* cb, void* param) {
L
Liu Jicong 已提交
2161
  tmqCommitInner(tmq, msg, 0, 1, cb, param);
L
Liu Jicong 已提交
2162 2163
}

2164
int32_t tmq_commit_sync(tmq_t* tmq, const TAOS_RES* msg) {
L
Liu Jicong 已提交
2165
  return tmqCommitInner(tmq, msg, 0, 0, NULL, NULL);
2166
}
2167 2168 2169 2170 2171 2172 2173 2174 2175 2176 2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190 2191 2192 2193 2194 2195 2196 2197 2198 2199 2200 2201 2202 2203 2204 2205 2206 2207 2208 2209 2210 2211 2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256

int32_t tmqAskEp(tmq_t* tmq, bool async) {
  int32_t code = TSDB_CODE_SUCCESS;
#if 0
  int8_t  epStatus = atomic_val_compare_exchange_8(&tmq->epStatus, 0, 1);
  if (epStatus == 1) {
    int32_t epSkipCnt = atomic_add_fetch_32(&tmq->epSkipCnt, 1);
    tscTrace("consumer:0x%" PRIx64 ", skip ask ep cnt %d", tmq->consumerId, epSkipCnt);
    if (epSkipCnt < 5000) return 0;
  }
  atomic_store_32(&tmq->epSkipCnt, 0);
#endif

  SMqAskEpReq req = {0};
  req.consumerId = tmq->consumerId;
  req.epoch = tmq->epoch;
  strcpy(req.cgroup, tmq->groupId);

  int32_t tlen = tSerializeSMqAskEpReq(NULL, 0, &req);
  if (tlen < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq failed", tmq->consumerId);
    return -1;
  }

  void* pReq = taosMemoryCalloc(1, tlen);
  if (pReq == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc askEpReq msg, size:%d", tmq->consumerId, tlen);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return -1;
  }

  if (tSerializeSMqAskEpReq(pReq, tlen, &req) < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq %d failed", tmq->consumerId, tlen);
    taosMemoryFree(pReq);
    return -1;
  }

  SMqAskEpCbParam* pParam = taosMemoryCalloc(1, sizeof(SMqAskEpCbParam));
  if (pParam == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc subscribe param", tmq->consumerId);
    taosMemoryFree(pReq);
    return -1;
  }

  pParam->refId = tmq->refId;
  pParam->epoch = tmq->epoch;
  pParam->async = async;
  tsem_init(&pParam->rspSem, 0, 0);

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    tsem_destroy(&pParam->rspSem);
    taosMemoryFree(pParam);
    taosMemoryFree(pReq);
    return -1;
  }

  sendInfo->msgInfo = (SDataBuf){
      .pData = pReq,
      .len = tlen,
      .handle = NULL,
  };

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = pParam;
  sendInfo->fp = tmqAskEpCb;
  sendInfo->msgType = TDMT_MND_TMQ_ASK_EP;

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);
  tscDebug("consumer:0x%" PRIx64 " ask ep from mnode, async:%d, reqId:0x%" PRIx64, tmq->consumerId, async,
           sendInfo->requestId);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

  if (!async) {
    tsem_wait(&pParam->rspSem);
    code = pParam->code;
    taosMemoryFree(pParam);
  }

  return code;
}

int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg) {
  return sprintf(dst, "%s:%d", topicName, vg);
}

int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet) {
2257 2258 2259
  int64_t refId = pParamSet->refId;

  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
2260 2261 2262 2263 2264 2265 2266 2267 2268 2269 2270 2271 2272 2273
  if (tmq == NULL) {
    if (!pParamSet->async) {
      tsem_destroy(&pParamSet->rspSem);
    }
    taosMemoryFree(pParamSet);
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

  // if no more waiting rsp
  if (pParamSet->async) {
    // call async cb func
    if (pParamSet->automatic && tmq->commitCb) {
      tmq->commitCb(tmq, pParamSet->rspErr, tmq->commitCbUserParam);
2274
    } else if (!pParamSet->automatic && pParamSet->userCb) { // sem post
2275 2276
      pParamSet->userCb(tmq, pParamSet->rspErr, pParamSet->userParam);
    }
2277

2278 2279 2280 2281 2282 2283 2284 2285 2286
    taosMemoryFree(pParamSet);
  } else {
    tsem_post(&pParamSet->rspSem);
  }

#if 0
  taosArrayDestroyP(pParamSet->successfulOffsets, taosMemoryFree);
    taosArrayDestroyP(pParamSet->failedOffsets, taosMemoryFree);
#endif
2287 2288

  taosReleaseRef(tmqMgmt.rsetId, refId);
2289
  return 0;
2290 2291 2292 2293 2294
}

void tmqCommitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId) {
  int32_t waitingRspNum = atomic_sub_fetch_32(&pParamSet->waitingRspNum, 1);
  if (waitingRspNum == 0) {
H
Haojun Liao 已提交
2295 2296
    tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d all commit-rsp received, commit completed", consumerId, pTopic,
             vgId);
2297
    tmqCommitDone(pParamSet);
H
Haojun Liao 已提交
2298 2299 2300
  } else {
    tscDebug("consumer:0x%" PRIx64 " topic:%s vgId:%d commit-rsp received, remain:%d", consumerId, pTopic, vgId,
             waitingRspNum);
2301 2302
  }
}