clientTmq.c 98.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
 *
 * This program is free software: you can use, redistribute, and/or modify
 * it under the terms of the GNU Affero General Public License, version 3
 * or later ("AGPL"), as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */

L
Liu Jicong 已提交
16
#include "cJSON.h"
17 18 19
#include "clientInt.h"
#include "clientLog.h"
#include "parser.h"
H
Haojun Liao 已提交
20
#include "tdatablock.h"
21 22
#include "tdef.h"
#include "tglobal.h"
X
Xiaoyu Wang 已提交
23
#include "tqueue.h"
24
#include "tref.h"
L
Liu Jicong 已提交
25 26
#include "ttimer.h"

X
Xiaoyu Wang 已提交
27 28
// NOTE(review): the unit is not stated here (presumably milliseconds) — confirm at the use site.
#define EMPTY_BLOCK_POLL_IDLE_DURATION 10
// Default for tmq_conf_t.autoCommitInterval (set in tmq_conf_new); milliseconds, see "auto.commit.interval.ms".
#define DEFAULT_AUTO_COMMIT_INTERVAL   5000
29

30 31
// True when the given offset value is negative.
// NOTE(review): presumably negative values encode the TMQ_OFFSET__RESET_* policies — confirm against their definitions.
#define OFFSET_IS_RESET_OFFSET(_of)  ((_of) < 0)

32 33
// Callback type accepted by asyncAskEp(): receives the consumer, a result code, the response buffer
// and the opaque parameter that was handed to asyncAskEp().
typedef void (*__tmq_askep_fn_t)(tmq_t* pTmq, int32_t code, SDataBuf* pBuf, void* pParam);

X
Xiaoyu Wang 已提交
34
struct SMqMgmt {
35 36 37
  int8_t  inited;
  tmr_h   timer;
  int32_t rsetId;
38
};
L
Liu Jicong 已提交
39

X
Xiaoyu Wang 已提交
40 41
static TdThreadOnce   tmqInit = PTHREAD_ONCE_INIT;  // initialize only once
volatile int32_t      tmqInitRes = 0;               // initialize rsp code
42
static struct SMqMgmt tmqMgmt = {0};
43

L
Liu Jicong 已提交
44 45 46 47 48 49
// Common leading fields of the response wrappers declared in this file
// (SMqAskEpRspWrapper and SMqPollRspWrapper start with the same two members).
typedef struct {
  int8_t  tmqRspType;
  int32_t epoch;
} SMqRspWrapper;

typedef struct {
L
Liu Jicong 已提交
50 51 52
  int8_t      tmqRspType;
  int32_t     epoch;
  SMqAskEpRsp msg;
L
Liu Jicong 已提交
53 54
} SMqAskEpRspWrapper;

L
Liu Jicong 已提交
55
struct tmq_list_t {
L
Liu Jicong 已提交
56
  SArray container;
L
Liu Jicong 已提交
57
};
L
Liu Jicong 已提交
58

L
Liu Jicong 已提交
59
struct tmq_conf_t {
60 61 62 63 64 65 66 67
  char           clientId[256];
  char           groupId[TSDB_CGROUP_LEN];
  int8_t         autoCommit;
  int8_t         resetOffset;
  int8_t         withTbName;
  int8_t         snapEnable;
  int32_t        snapBatchSize;
  bool           hbBgEnable;
68 69 70 71 72
  uint16_t       port;
  int32_t        autoCommitInterval;
  char*          ip;
  char*          user;
  char*          pass;
73
  tmq_commit_cb* commitCb;
L
Liu Jicong 已提交
74
  void*          commitCbUserParam;
L
Liu Jicong 已提交
75 76 77
};

struct tmq_t {
78 79 80 81 82 83 84
  int64_t        refId;
  char           groupId[TSDB_CGROUP_LEN];
  char           clientId[256];
  int8_t         withTbName;
  int8_t         useSnapshot;
  int8_t         autoCommit;
  int32_t        autoCommitInterval;
85
  int8_t         resetOffsetCfg;
86 87
  uint64_t       consumerId;
  bool           hbBgEnable;
L
Liu Jicong 已提交
88 89
  tmq_commit_cb* commitCb;
  void*          commitCbUserParam;
L
Liu Jicong 已提交
90 91

  // status
wmmhello's avatar
wmmhello 已提交
92
  SRWLatch        lock;
L
Liu Jicong 已提交
93 94
  int8_t  status;
  int32_t epoch;
L
Liu Jicong 已提交
95 96
#if 0
  int8_t  epStatus;
L
Liu Jicong 已提交
97
  int32_t epSkipCnt;
L
Liu Jicong 已提交
98
#endif
99
  // poll info
X
Xiaoyu Wang 已提交
100 101
  int64_t pollCnt;
  int64_t totalRows;
wmmhello's avatar
wmmhello 已提交
102
//  bool    needReportOffsetRows;
L
Liu Jicong 已提交
103

L
Liu Jicong 已提交
104
  // timer
X
Xiaoyu Wang 已提交
105 106 107 108 109 110 111 112 113 114
  tmr_h       hbLiveTimer;
  tmr_h       epTimer;
  tmr_h       reportTimer;
  tmr_h       commitTimer;
  STscObj*    pTscObj;       // connection
  SArray*     clientTopics;  // SArray<SMqClientTopic>
  STaosQueue* mqueue;        // queue of rsp
  STaosQall*  qall;
  STaosQueue* delayedTask;  // delayed task queue for heartbeat and auto commit
  tsem_t      rspSem;
L
Liu Jicong 已提交
115 116
};

117 118
typedef struct SAskEpInfo {
  int32_t code;
H
Haojun Liao 已提交
119
  tsem_t  sem;
120 121
} SAskEpInfo;

X
Xiaoyu Wang 已提交
122 123 124 125 126 127 128 129
// Values for SMqClientVg.vgStatus.
enum {
  TMQ_VG_STATUS__IDLE = 0,
  TMQ_VG_STATUS__WAIT,
};

// Consumer status values (numbered 0..3 in declaration order).
// NOTE(review): presumably stored in tmq_t.status — confirm at the use sites.
enum {
  TMQ_CONSUMER_STATUS__INIT = 0,
  TMQ_CONSUMER_STATUS__READY,
  TMQ_CONSUMER_STATUS__NO_TOPIC,
  TMQ_CONSUMER_STATUS__RECOVER,
};

L
Liu Jicong 已提交
134
// Task types written to tmq_t.delayedTask by generateTimedTask(); numbering starts at 1.
enum {
  TMQ_DELAYED_TASK__ASK_EP = 1,
  TMQ_DELAYED_TASK__REPORT,
  TMQ_DELAYED_TASK__COMMIT,
};

H
Haojun Liao 已提交
140
typedef struct SVgOffsetInfo {
L
Liu Jicong 已提交
141
  STqOffsetVal committedOffset;
142 143
  STqOffsetVal endOffset;        // the last version in TAOS_RES + 1
  STqOffsetVal beginOffset;      // the first version in TAOS_RES
H
Haojun Liao 已提交
144 145 146 147 148 149 150 151 152 153
  int64_t      walVerBegin;
  int64_t      walVerEnd;
} SVgOffsetInfo;

typedef struct {
  int64_t       pollCnt;
  int64_t       numOfRows;
  SVgOffsetInfo offsetInfo;
  int32_t       vgId;
  int32_t       vgStatus;
H
Haojun Liao 已提交
154
  int32_t       vgSkipCnt;              // here used to mark the slow vgroups
155
//  bool          receivedInfoFromVnode;  // has already received info from vnode
H
Haojun Liao 已提交
156 157
  int64_t       emptyBlockReceiveTs;    // once empty block is received, idle for ignoreCnt then start to poll data
  bool          seekUpdated;            // offset is updated by seek operator, therefore, not update by vnode rsp.
H
Haojun Liao 已提交
158
  SEpSet        epSet;
159 160
} SMqClientVg;

L
Liu Jicong 已提交
161
typedef struct {
162 163 164
  char           topicName[TSDB_TOPIC_FNAME_LEN];
  char           db[TSDB_DB_FNAME_LEN];
  SArray*        vgs;  // SArray<SMqClientVg>
L
Liu Jicong 已提交
165
  SSchemaWrapper schema;
166 167
} SMqClientTopic;

L
Liu Jicong 已提交
168 169
typedef struct {
  int8_t          tmqRspType;
170
  int32_t         epoch;  // epoch can be used to guard the vgHandle
171
  int32_t         vgId;
wmmhello's avatar
wmmhello 已提交
172
  char            topicName[TSDB_TOPIC_FNAME_LEN];
L
Liu Jicong 已提交
173 174
  SMqClientVg*    vgHandle;
  SMqClientTopic* topicHandle;
H
Haojun Liao 已提交
175
  uint64_t        reqId;
176
  SEpSet*         pEpset;
L
Liu Jicong 已提交
177
  union {
L
Liu Jicong 已提交
178 179
    SMqDataRsp dataRsp;
    SMqMetaRsp metaRsp;
L
Liu Jicong 已提交
180
    STaosxRsp  taosxRsp;
L
Liu Jicong 已提交
181
  };
L
Liu Jicong 已提交
182 183
} SMqPollRspWrapper;

L
Liu Jicong 已提交
184
typedef struct {
wmmhello's avatar
wmmhello 已提交
185 186
//  int64_t refId;
//  int32_t epoch;
L
Liu Jicong 已提交
187 188
  tsem_t  rspSem;
  int32_t rspErr;
L
Liu Jicong 已提交
189
} SMqSubscribeCbParam;
L
Liu Jicong 已提交
190

L
Liu Jicong 已提交
191
typedef struct {
192 193 194 195
  int64_t          refId;
  int32_t          epoch;
  void*            pParam;
  __tmq_askep_fn_t pUserFn;
196 197
} SMqAskEpCbParam;

L
Liu Jicong 已提交
198
typedef struct {
199 200
  int64_t         refId;
  int32_t         epoch;
wmmhello's avatar
wmmhello 已提交
201 202 203
  char            topicName[TSDB_TOPIC_FNAME_LEN];
//  SMqClientVg*    pVg;
//  SMqClientTopic* pTopic;
L
Liu Jicong 已提交
204
  int32_t         vgId;
X
Xiaoyu Wang 已提交
205
  uint64_t        requestId;  // request id for debug purpose
X
Xiaoyu Wang 已提交
206
} SMqPollCbParam;
207

208 209 210 211 212 213 214 215 216 217
// State shared by a group of per-vgroup requests (referenced from SMqVgWalInfoParam.pCommon).
// NOTE(review): presumably `mutex` guards `pList`/`numOfRsp` and `rsp` is posted once all
// responses have arrived — confirm at the use sites.
typedef struct SMqVgCommon {
  tsem_t        rsp;
  int32_t       numOfRsp;
  SArray*       pList;
  TdThreadMutex mutex;
  int64_t       consumerId;
  char*         pTopicName;
  int32_t       code;
} SMqVgCommon;

218 219 220 221 222
// Semaphore plus result code.
// NOTE(review): presumably used to wait for a seek response — confirm at the use site.
typedef struct SMqSeekParam {
  tsem_t        sem;
  int32_t       code;
} SMqSeekParam;

223 224 225 226 227 228 229
// Per-vgroup request context that points at the SMqVgCommon shared by the whole batch.
typedef struct SMqVgWalInfoParam {
  int32_t      vgId;
  int32_t      epoch;
  int32_t      totalReq;
  SMqVgCommon* pCommon;
} SMqVgWalInfoParam;

230
typedef struct {
231 232
  int64_t        refId;
  int32_t        epoch;
L
Liu Jicong 已提交
233 234
  int32_t        waitingRspNum;
  int32_t        totalRspNum;
235
  int32_t        code;
236
  tmq_commit_cb* callbackFn;
L
Liu Jicong 已提交
237 238
  /*SArray*        successfulOffsets;*/
  /*SArray*        failedOffsets;*/
X
Xiaoyu Wang 已提交
239
  void* userParam;
240 241 242 243
} SMqCommitCbParamSet;

typedef struct {
  SMqCommitCbParamSet* params;
244
  SMqVgOffset*         pOffset;
H
Haojun Liao 已提交
245 246 247
  char                 topicName[TSDB_TOPIC_FNAME_LEN];
  int32_t              vgId;
  tmq_t*               pTmq;
248
} SMqCommitCbParam;
249

250 251 252 253 254
// Semaphore plus result code.
// NOTE(review): presumably lets a synchronous commit wait for its callback — confirm at the use site.
typedef struct SSyncCommitInfo {
  tsem_t  sem;
  int32_t code;
} SSyncCommitInfo;

255
static int32_t doAskEp(tmq_t* tmq);
256 257
static int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg);
static int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet);
258
static int32_t doSendCommitMsg(tmq_t* tmq, int32_t vgId, SEpSet* epSet, STqOffsetVal* offset, const char* pTopicName, SMqCommitCbParamSet* pParamSet);
X
Xiaoyu Wang 已提交
259 260 261
static void    commitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId);
static void    asyncAskEp(tmq_t* pTmq, __tmq_askep_fn_t askEpFn, void* param);
static void    addToQueueCallbackFn(tmq_t* pTmq, int32_t code, SDataBuf* pDataBuf, void* param);
262

263
tmq_conf_t* tmq_conf_new() {
wafwerar's avatar
wafwerar 已提交
264
  tmq_conf_t* conf = taosMemoryCalloc(1, sizeof(tmq_conf_t));
265 266 267 268 269
  if (conf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return conf;
  }

270
  conf->withTbName = false;
L
Liu Jicong 已提交
271
  conf->autoCommit = true;
272
  conf->autoCommitInterval = DEFAULT_AUTO_COMMIT_INTERVAL;
273
  conf->resetOffset = TMQ_OFFSET__RESET_EARLIEST;
274
  conf->hbBgEnable = true;
275

276 277 278
  return conf;
}

L
Liu Jicong 已提交
279
/*
 * Release a configuration created by tmq_conf_new(), including the heap copies of the
 * connection ip, user and password. A NULL conf is ignored.
 */
void tmq_conf_destroy(tmq_conf_t* conf) {
  if (conf == NULL) {
    return;
  }

  char* owned[] = {conf->ip, conf->user, conf->pass};
  for (size_t k = 0; k < sizeof(owned) / sizeof(owned[0]); ++k) {
    if (owned[k] != NULL) {
      taosMemoryFree(owned[k]);
    }
  }

  taosMemoryFree(conf);
}

tmq_conf_res_t tmq_conf_set(tmq_conf_t* conf, const char* key, const char* value) {
295
  if (strcasecmp(key, "group.id") == 0) {
L
Liu Jicong 已提交
296
    tstrncpy(conf->groupId, value, TSDB_CGROUP_LEN);
L
Liu Jicong 已提交
297
    return TMQ_CONF_OK;
298
  }
L
Liu Jicong 已提交
299

300
  if (strcasecmp(key, "client.id") == 0) {
L
Liu Jicong 已提交
301
    tstrncpy(conf->clientId, value, 256);
L
Liu Jicong 已提交
302 303
    return TMQ_CONF_OK;
  }
L
Liu Jicong 已提交
304

305 306
  if (strcasecmp(key, "enable.auto.commit") == 0) {
    if (strcasecmp(value, "true") == 0) {
L
Liu Jicong 已提交
307
      conf->autoCommit = true;
L
Liu Jicong 已提交
308
      return TMQ_CONF_OK;
309
    } else if (strcasecmp(value, "false") == 0) {
L
Liu Jicong 已提交
310
      conf->autoCommit = false;
L
Liu Jicong 已提交
311 312 313 314
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
315
  }
L
Liu Jicong 已提交
316

317
  if (strcasecmp(key, "auto.commit.interval.ms") == 0) {
318
    conf->autoCommitInterval = taosStr2int64(value);
L
Liu Jicong 已提交
319 320 321
    return TMQ_CONF_OK;
  }

322 323 324
  if (strcasecmp(key, "auto.offset.reset") == 0) {
    if (strcasecmp(value, "none") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_NONE;
L
Liu Jicong 已提交
325
      return TMQ_CONF_OK;
326
    } else if (strcasecmp(value, "earliest") == 0) {
327
      conf->resetOffset = TMQ_OFFSET__RESET_EARLIEST;
L
Liu Jicong 已提交
328
      return TMQ_CONF_OK;
329 330
    } else if (strcasecmp(value, "latest") == 0) {
      conf->resetOffset = TMQ_OFFSET__RESET_LATEST;
L
Liu Jicong 已提交
331 332 333 334 335
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
  }
L
Liu Jicong 已提交
336

337 338
  if (strcasecmp(key, "msg.with.table.name") == 0) {
    if (strcasecmp(value, "true") == 0) {
339
      conf->withTbName = true;
L
Liu Jicong 已提交
340
      return TMQ_CONF_OK;
341
    } else if (strcasecmp(value, "false") == 0) {
342
      conf->withTbName = false;
L
Liu Jicong 已提交
343
      return TMQ_CONF_OK;
344 345 346 347 348
    } else {
      return TMQ_CONF_INVALID;
    }
  }

349 350
  if (strcasecmp(key, "experimental.snapshot.enable") == 0) {
    if (strcasecmp(value, "true") == 0) {
L
Liu Jicong 已提交
351
      conf->snapEnable = true;
352
      return TMQ_CONF_OK;
353
    } else if (strcasecmp(value, "false") == 0) {
L
Liu Jicong 已提交
354
      conf->snapEnable = false;
355 356 357 358 359 360
      return TMQ_CONF_OK;
    } else {
      return TMQ_CONF_INVALID;
    }
  }

361
  if (strcasecmp(key, "experimental.snapshot.batch.size") == 0) {
362
    conf->snapBatchSize = taosStr2int64(value);
L
Liu Jicong 已提交
363 364 365
    return TMQ_CONF_OK;
  }

366
//  if (strcasecmp(key, "enable.heartbeat.background") == 0) {
X
Xiaoyu Wang 已提交
367 368 369 370 371 372 373
    //    if (strcasecmp(value, "true") == 0) {
    //      conf->hbBgEnable = true;
    //      return TMQ_CONF_OK;
    //    } else if (strcasecmp(value, "false") == 0) {
    //      conf->hbBgEnable = false;
    //      return TMQ_CONF_OK;
    //    } else {
374 375
//    tscError("the default value of enable.heartbeat.background is true, can not be seted");
//    return TMQ_CONF_INVALID;
X
Xiaoyu Wang 已提交
376
    //    }
377
//  }
L
Liu Jicong 已提交
378

379
  if (strcasecmp(key, "td.connect.ip") == 0) {
380
    conf->ip = taosStrdup(value);
L
Liu Jicong 已提交
381 382
    return TMQ_CONF_OK;
  }
383

384
  if (strcasecmp(key, "td.connect.user") == 0) {
385
    conf->user = taosStrdup(value);
L
Liu Jicong 已提交
386 387
    return TMQ_CONF_OK;
  }
388

389
  if (strcasecmp(key, "td.connect.pass") == 0) {
390
    conf->pass = taosStrdup(value);
L
Liu Jicong 已提交
391 392
    return TMQ_CONF_OK;
  }
393

394
  if (strcasecmp(key, "td.connect.port") == 0) {
395
    conf->port = taosStr2int64(value);
L
Liu Jicong 已提交
396 397
    return TMQ_CONF_OK;
  }
398

399
  if (strcasecmp(key, "td.connect.db") == 0) {
L
Liu Jicong 已提交
400 401 402
    return TMQ_CONF_OK;
  }

L
Liu Jicong 已提交
403
  return TMQ_CONF_UNKNOWN;
404 405
}

X
Xiaoyu Wang 已提交
406
/*
 * Create an empty topic list. The list is backed by an array of pointer-sized elements
 * and is released with tmq_list_destroy().
 */
tmq_list_t* tmq_list_new() {
  void* pTopics = taosArrayInit(0, sizeof(void*));
  return (tmq_list_t*)pTopics;
}
407

L
Liu Jicong 已提交
408 409
/*
 * Append a heap copy of the topic name `src` to `list`.
 *
 * Returns 0 on success, -1 when list is NULL, src is NULL or empty, or memory cannot be
 * allocated. On failure nothing is added and nothing is leaked.
 */
int32_t tmq_list_append(tmq_list_t* list, const char* src) {
  if (list == NULL || src == NULL || src[0] == 0) return -1;

  char* topic = taosStrdup(src);
  if (topic == NULL) return -1;

  if (taosArrayPush(&list->container, &topic) == NULL) {
    taosMemoryFree(topic);  // the list did not take ownership
    return -1;
  }
  return 0;
}

L
Liu Jicong 已提交
416
/*
 * Destroy a topic list together with every topic string it holds.
 * A NULL list is ignored.
 */
void tmq_list_destroy(tmq_list_t* list) {
  if (list == NULL) return;

  SArray* container = &list->container;
  taosArrayDestroyP(container, taosMemoryFree);
}

L
Liu Jicong 已提交
421 422 423 424 425 426 427 428 429 430
/* Number of topic names currently stored in `list`. */
int32_t tmq_list_get_size(const tmq_list_t* list) {
  return taosArrayGetSize(&list->container);
}

/*
 * Expose the list's backing storage as an array of C strings. The returned pointer is the
 * list's own buffer (not a copy). Returns NULL when list is NULL.
 */
char** tmq_list_to_c_array(const tmq_list_t* list) {
  if (list == NULL) return NULL;

  const SArray* container = &list->container;
  return container->pData;
}

H
Haojun Liao 已提交
431
/*
 * Response callback for a commit-offset message sent by doSendCommitMsg.
 *
 * Frees the offset payload and the response buffers, then counts this response down on the
 * shared parameter set. `param` itself is not freed here; doSendCommitMsg registers
 * taosMemoryFree as its paramFreeFp. The response `code` is not inspected. Always returns 0.
 */
static int32_t tmqCommitCb(void* param, SDataBuf* pBuf, int32_t code) {
  SMqCommitCbParam*    pParam = (SMqCommitCbParam*)param;
  SMqCommitCbParamSet* pParamSet = (SMqCommitCbParamSet*)pParam->params;

  taosMemoryFree(pParam->pOffset);
  if (pBuf != NULL) {  // same guard as tmqHbCb: tolerate a missing response buffer
    taosMemoryFree(pBuf->pData);
    taosMemoryFree(pBuf->pEpSet);
  }

  commitRspCountDown(pParamSet, pParam->pTmq->consumerId, pParam->topicName, pParam->vgId);
  return 0;
}

443
/*
 * Build and asynchronously send one TDMT_VND_TMQ_COMMIT_OFFSET message.
 *
 * The subscription key is "<groupId><TMQ_SEPARATOR><topic>". On success the message owns
 * `buf`, the callback parameter and the offset payload (released through tmqCommitCb and
 * paramFreeFp), and pParamSet->waitingRspNum/totalRspNum have each been incremented by one.
 *
 * Returns TSDB_CODE_SUCCESS once the message has been handed to the transport,
 * TSDB_CODE_OUT_OF_MEMORY on allocation failure, or TSDB_CODE_INVALID_PARA when the key does
 * not fit or encoding fails. On every error path nothing has been sent and the counters in
 * pParamSet are untouched.
 */
static int32_t doSendCommitMsg(tmq_t* tmq, int32_t vgId, SEpSet* epSet, STqOffsetVal* offset, const char* pTopicName, SMqCommitCbParamSet* pParamSet) {
  int32_t           code = 0;
  int32_t           len = 0;
  void*             buf = NULL;
  SMqCommitCbParam* pParam = NULL;
  SMsgSendInfo*     pMsgSendInfo = NULL;
  SEncoder          encoder;

  SMqVgOffset* pOffset = taosMemoryCalloc(1, sizeof(SMqVgOffset));
  if (pOffset == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  pOffset->consumerId = tmq->consumerId;
  pOffset->offset.val = *offset;

  // Refuse keys that do not fit instead of writing past the end of subKey.
  const size_t keyCap = tListLen(pOffset->offset.subKey);
  const size_t groupLen = strlen(tmq->groupId);
  const size_t topicLen = strlen(pTopicName);
  if (groupLen + 1 + topicLen >= keyCap) {
    code = TSDB_CODE_INVALID_PARA;
    goto _error;
  }
  memcpy(pOffset->offset.subKey, tmq->groupId, groupLen);
  pOffset->offset.subKey[groupLen] = TMQ_SEPARATOR;
  memcpy(pOffset->offset.subKey + groupLen + 1, pTopicName, topicLen + 1);  // includes the terminator

  tEncodeSize(tEncodeMqVgOffset, pOffset, len, code);
  if (code < 0) {
    code = TSDB_CODE_INVALID_PARA;
    goto _error;
  }

  buf = taosMemoryCalloc(1, sizeof(SMsgHead) + len);
  if (buf == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  ((SMsgHead*)buf)->vgId = htonl(vgId);

  void* abuf = POINTER_SHIFT(buf, sizeof(SMsgHead));
  tEncoderInit(&encoder, abuf, len);
  int32_t encRet = tEncodeMqVgOffset(&encoder, pOffset);
  tEncoderClear(&encoder);
  if (encRet < 0) {
    code = TSDB_CODE_INVALID_PARA;
    goto _error;
  }

  // build param
  pParam = taosMemoryCalloc(1, sizeof(SMqCommitCbParam));
  if (pParam == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pParam->params = pParamSet;
  pParam->pOffset = pOffset;
  pParam->vgId = vgId;
  pParam->pTmq = tmq;
  tstrncpy(pParam->topicName, pTopicName, tListLen(pParam->topicName));

  // build send info
  pMsgSendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (pMsgSendInfo == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _error;
  }

  pMsgSendInfo->msgInfo = (SDataBuf) { .pData = buf, .len = sizeof(SMsgHead) + len, .handle = NULL };

  pMsgSendInfo->requestId = generateRequestId();
  pMsgSendInfo->requestObjRefId = 0;
  pMsgSendInfo->param = pParam;
  pMsgSendInfo->paramFreeFp = taosMemoryFree;
  pMsgSendInfo->fp = tmqCommitCb;
  pMsgSendInfo->msgType = TDMT_VND_TMQ_COMMIT_OFFSET;

  // Count the response before the message leaves, so the callback can never see a stale count.
  atomic_add_fetch_32(&pParamSet->waitingRspNum, 1);
  atomic_add_fetch_32(&pParamSet->totalRspNum, 1);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, epSet, &transporterId, pMsgSendInfo);

  return TSDB_CODE_SUCCESS;

_error:
  taosMemoryFree(pParam);
  taosMemoryFree(buf);
  taosMemoryFree(pOffset);
  return code;
}

H
Haojun Liao 已提交
525 526 527 528 529 530 531 532 533 534 535
/*
 * Look up a subscribed topic by exact (case-sensitive) name in tmq->clientTopics.
 * Returns the matching entry, or NULL after logging an error when there is none.
 */
static SMqClientTopic* getTopicByName(tmq_t* tmq, const char* pTopicName) {
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);

  int32_t idx = 0;
  while (idx < numOfTopics) {
    SMqClientTopic* pCandidate = taosArrayGet(tmq->clientTopics, idx);
    if (strcmp(pCandidate->topicName, pTopicName) == 0) {
      return pCandidate;
    }
    ++idx;
  }

  tscError("consumer:0x%" PRIx64 ", total:%d, failed to find topic:%s", tmq->consumerId, numOfTopics, pTopicName);
  return NULL;
}

540
/*
 * Allocate the state shared by all commit messages of one commit operation.
 *
 * rspNum seeds waitingRspNum (callers pass 1 to hold the set alive while they are still
 * sending, 0 otherwise).
 *
 * Returns NULL when out of memory. The commit callback is NOT invoked here: the callers
 * visible in this file (asyncCommitOffset via asyncCommitFromResult, and asyncCommitAllOffsets)
 * report the failure through the callback themselves, so invoking it here as well would
 * notify the user twice.
 */
static SMqCommitCbParamSet* prepareCommitCbParamSet(tmq_t* tmq, tmq_commit_cb* pCommitFp, void* userParam, int32_t rspNum){
  SMqCommitCbParamSet* pParamSet = taosMemoryCalloc(1, sizeof(SMqCommitCbParamSet));
  if (pParamSet == NULL) {
    return NULL;
  }

  pParamSet->refId = tmq->refId;
  pParamSet->epoch = tmq->epoch;
  pParamSet->callbackFn = pCommitFp;
  pParamSet->userParam = userParam;
  pParamSet->waitingRspNum = rspNum;

  return pParamSet;
}
555

556
/*
 * Find the vgroup `vgId` of topic `pTopicName` in the consumer's subscription.
 * Returns NULL (after a warning) when either the topic or the vgroup is unknown.
 */
static SMqClientVg* getClientVg(tmq_t* tmq, char* pTopicName, int32_t vgId){
  SMqClientTopic* pTopic = getTopicByName(tmq, pTopicName);
  if (pTopic == NULL) {
    tscWarn("consumer:0x%" PRIx64 " failed to find the specified topic:%s", tmq->consumerId, pTopicName);
    return NULL;
  }

  int32_t numOfVgroups = taosArrayGetSize(pTopic->vgs);
  for (int32_t idx = 0; idx < numOfVgroups; ++idx) {
    SMqClientVg* pCandidate = (SMqClientVg*)taosArrayGet(pTopic->vgs, idx);
    if (pCandidate->vgId == vgId) {
      return pCandidate;
    }
  }

  tscWarn("consumer:0x%" PRIx64 " failed to find the specified vgId:%d, total Vgs:%d, topic:%s", tmq->consumerId,
          vgId, numOfVgroups, pTopicName);
  return NULL;
}

/*
 * Commit `offsetVal` for one vgroup of one topic.
 *
 * A commit message is sent only when offsetVal->type > 0 and the offset differs from the
 * vgroup's committedOffset; in that case the callback fires later from the response path.
 * When nothing needs to be sent the callback (if any) is invoked here with
 * TSDB_CODE_SUCCESS, so a caller waiting on it is always released.
 *
 * Returns TSDB_CODE_SUCCESS, TSDB_CODE_TMQ_INVALID_VGID when the topic/vgroup is unknown,
 * TSDB_CODE_OUT_OF_MEMORY, or the error from doSendCommitMsg. On a non-success return the
 * callback has not been invoked by this function; reporting is left to the caller.
 */
static int32_t asyncCommitOffset(tmq_t* tmq, char* pTopicName, int32_t vgId, STqOffsetVal* offsetVal, tmq_commit_cb* pCommitFp, void* userParam) {
  int32_t code = 0;
  bool    msgSent = false;

  tscInfo("consumer:0x%" PRIx64 " do manual commit offset for %s, vgId:%d", tmq->consumerId, pTopicName, vgId);
  taosRLockLatch(&tmq->lock);
  SMqClientVg* pVg = getClientVg(tmq, pTopicName, vgId);
  if(pVg == NULL){
    code = TSDB_CODE_TMQ_INVALID_VGID;
    goto end;
  }
  if (offsetVal->type > 0 && !tOffsetEqual(offsetVal, &pVg->offsetInfo.committedOffset)) {
    char offsetBuf[TSDB_OFFSET_LEN] = {0};
    tFormatOffset(offsetBuf, tListLen(offsetBuf), offsetVal);

    char commitBuf[TSDB_OFFSET_LEN] = {0};
    tFormatOffset(commitBuf, tListLen(commitBuf), &pVg->offsetInfo.committedOffset);

    SMqCommitCbParamSet* pParamSet = prepareCommitCbParamSet(tmq, pCommitFp, userParam, 0);
    if (pParamSet == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto end;
    }

    // Send the offset that was requested (and logged), not the vgroup's current endOffset.
    code = doSendCommitMsg(tmq, pVg->vgId, &pVg->epSet, offsetVal, pTopicName, pParamSet);
    if (code != TSDB_CODE_SUCCESS) {
      tscError("consumer:0x%" PRIx64 " topic:%s on vgId:%d end commit msg failed, send offset:%s committed:%s, code:%s",
               tmq->consumerId, pTopicName, pVg->vgId, offsetBuf, commitBuf, tstrerror(code));
      // nothing was sent, so no response callback can still reference the set
      taosMemoryFree(pParamSet);
      goto end;
    }

    tscInfo("consumer:0x%" PRIx64 " topic:%s on vgId:%d send commit msg success, send offset:%s committed:%s",
            tmq->consumerId, pTopicName, pVg->vgId, offsetBuf, commitBuf);
    pVg->offsetInfo.committedOffset = *offsetVal;
    msgSent = true;
  }

end:
  taosRUnLockLatch(&tmq->lock);

  // Nothing to commit: complete immediately (outside the lock) instead of never calling back.
  if (code == TSDB_CODE_SUCCESS && !msgSent && pCommitFp != NULL) {
    pCommitFp(tmq, TSDB_CODE_SUCCESS, userParam);
  }
  return code;
}

622 623 624 625 626 627 628 629 630
/*
 * Commit the offset carried by a poll result.
 *
 * Topic, vgId and response offset are taken from the result object, whose concrete type is
 * selected with TD_RES_TMQ / TD_RES_TMQ_META / TD_RES_TMQ_METADATA, and handed to
 * asyncCommitOffset. If anything fails before a commit message is sent, the callback
 * (when not NULL) is invoked here with the error code:
 * TSDB_CODE_INVALID_PARA for a NULL tmq/pRes, TSDB_CODE_TMQ_INVALID_MSG for an unknown
 * result type, or whatever asyncCommitOffset returned.
 */
static void asyncCommitFromResult(tmq_t* tmq, const TAOS_RES* pRes, tmq_commit_cb* pCommitFp, void* userParam){
  char*        pTopicName = NULL;
  int32_t      vgId = 0;
  STqOffsetVal offsetVal = {0};
  int32_t      code = 0;

  if (pRes == NULL || tmq == NULL) {
    code = TSDB_CODE_INVALID_PARA;
    goto end;
  }

  if (TD_RES_TMQ(pRes)) {
    SMqRspObj* pRspObj = (SMqRspObj*)pRes;
    pTopicName = pRspObj->topic;
    vgId = pRspObj->vgId;
    offsetVal = pRspObj->rsp.rspOffset;
  } else if (TD_RES_TMQ_META(pRes)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)pRes;
    pTopicName = pMetaRspObj->topic;
    vgId = pMetaRspObj->vgId;
    offsetVal = pMetaRspObj->metaRsp.rspOffset;
  } else if (TD_RES_TMQ_METADATA(pRes)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)pRes;
    pTopicName = pRspObj->topic;
    vgId = pRspObj->vgId;
    offsetVal = pRspObj->rsp.rspOffset;
  } else {
    code = TSDB_CODE_TMQ_INVALID_MSG;
    goto end;
  }

  code = asyncCommitOffset(tmq, pTopicName, vgId, &offsetVal, pCommitFp, userParam);

end:
  // Do not call through a NULL callback on the error path.
  if (code != TSDB_CODE_SUCCESS && pCommitFp != NULL) {
    pCommitFp(tmq, code, userParam);
  }
}
660

661 662
/*
 * Commit endOffset for every vgroup of every subscribed topic whose endOffset has
 * type > 0 and differs from its committedOffset.
 *
 * The callback fires exactly once: from the response path when at least one commit message
 * was sent, otherwise directly from here (with success when nothing needed committing, with
 * the last send error when every attempted send failed, or with TSDB_CODE_OUT_OF_MEMORY
 * when the shared state cannot be allocated).
 */
static void asyncCommitAllOffsets(tmq_t* tmq, tmq_commit_cb* pCommitFp, void* userParam) {
  int32_t code = 0;

  // init as 1 to prevent concurrency issue: the extra count is only given back (below) after
  // every message has been issued, so early responses cannot bring the count to zero
  SMqCommitCbParamSet* pParamSet = prepareCommitCbParamSet(tmq, pCommitFp, userParam, 1);
  if (pParamSet == NULL) {
    pCommitFp(tmq, TSDB_CODE_OUT_OF_MEMORY, userParam);
    return;
  }

  taosRLockLatch(&tmq->lock);
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
  tscInfo("consumer:0x%" PRIx64 " start to commit offset for %d topics", tmq->consumerId, numOfTopics);

  for (int32_t i = 0; i < numOfTopics; i++) {
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
    int32_t         numOfVgroups = taosArrayGetSize(pTopic->vgs);

    tscInfo("consumer:0x%" PRIx64 " commit offset for topics:%s, numOfVgs:%d", tmq->consumerId, pTopic->topicName, numOfVgroups);
    for (int32_t j = 0; j < numOfVgroups; j++) {
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);

      if (pVg->offsetInfo.endOffset.type > 0 && !tOffsetEqual(&pVg->offsetInfo.endOffset, &pVg->offsetInfo.committedOffset)) {
        char offsetBuf[TSDB_OFFSET_LEN] = {0};
        tFormatOffset(offsetBuf, tListLen(offsetBuf), &pVg->offsetInfo.endOffset);

        char commitBuf[TSDB_OFFSET_LEN] = {0};
        tFormatOffset(commitBuf, tListLen(commitBuf), &pVg->offsetInfo.committedOffset);

        code = doSendCommitMsg(tmq, pVg->vgId, &pVg->epSet, &pVg->offsetInfo.endOffset, pTopic->topicName, pParamSet);
        if (code != TSDB_CODE_SUCCESS) {
          // report the code that was actually returned rather than whatever terrno holds
          tscError("consumer:0x%" PRIx64 " topic:%s on vgId:%d end commit msg failed, send offset:%s committed:%s, code:%s ordinal:%d/%d",
                   tmq->consumerId, pTopic->topicName, pVg->vgId, offsetBuf, commitBuf, tstrerror(code), j + 1, numOfVgroups);
          continue;
        }

        tscInfo("consumer:0x%" PRIx64 " topic:%s on vgId:%d send commit msg success, send offset:%s committed:%s, ordinal:%d/%d",
                tmq->consumerId, pTopic->topicName, pVg->vgId, offsetBuf, commitBuf, j + 1, numOfVgroups);
        pVg->offsetInfo.committedOffset = pVg->offsetInfo.endOffset;
      } else {
        tscInfo("consumer:0x%" PRIx64 " topic:%s vgId:%d, no commit, current:%" PRId64 ", ordinal:%d/%d",
                 tmq->consumerId, pTopic->topicName, pVg->vgId, pVg->offsetInfo.endOffset.version, j + 1, numOfVgroups);
      }
    }
  }
  taosRUnLockLatch(&tmq->lock);

  // totalRspNum counts messages sent; waitingRspNum may already have been decremented by responses
  tscInfo("consumer:0x%" PRIx64 " total commit:%d for %d topics", tmq->consumerId, pParamSet->totalRspNum, numOfTopics);

  // request is sent
  if (pParamSet->totalRspNum != 0) {
    // count down since waiting rsp num init as 1
    commitRspCountDown(pParamSet, tmq->consumerId, "", 0);
    return;
  }

  // nothing was sent, so no response will ever reference the set: finish here
  taosMemoryFree(pParamSet);
  pCommitFp(tmq, code, userParam);
}

722 723
/*
 * Queue a delayed task of the given type (TMQ_DELAYED_TASK__*) on the consumer identified by
 * refId and post its rspSem.
 *
 * Does nothing when the consumer can no longer be resolved or the queue item cannot be
 * allocated. The reference taken here is always released before returning.
 */
static void generateTimedTask(int64_t refId, int32_t type) {
  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) return;

  int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
  if (pTaskType != NULL) {
    *pTaskType = type;
    taosWriteQitem(tmq->delayedTask, pTaskType);
    tsem_post(&tmq->rspSem);
  }

  // release on every path; skipping this on allocation failure would leak the reference
  taosReleaseRef(tmqMgmt.rsetId, refId);
}

/*
 * Timer callback: queue an ask-ep task for the consumer whose refId is stored in `param`.
 * `param` points to a heap-allocated int64_t and is freed here; `tmrId` is unused.
 */
void tmqAssignAskEpTask(void* param, void* tmrId) {
  const int64_t* pRefId = (const int64_t*)param;
  generateTimedTask(*pRefId, TMQ_DELAYED_TASK__ASK_EP);
  taosMemoryFree(param);
}

void tmqAssignDelayedCommitTask(void* param, void* tmrId) {
742
  int64_t refId = *(int64_t*)param;
743
  generateTimedTask(refId, TMQ_DELAYED_TASK__COMMIT);
744
  taosMemoryFree(param);
L
Liu Jicong 已提交
745 746
}

wmmhello's avatar
wmmhello 已提交
747 748 749 750 751 752 753 754 755 756 757 758 759
//void tmqAssignDelayedReportTask(void* param, void* tmrId) {
//  int64_t refId = *(int64_t*)param;
//  tmq_t*  tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
//  if (tmq != NULL) {
//    int8_t* pTaskType = taosAllocateQitem(sizeof(int8_t), DEF_QITEM, 0);
//    *pTaskType = TMQ_DELAYED_TASK__REPORT;
//    taosWriteQitem(tmq->delayedTask, pTaskType);
//    tsem_post(&tmq->rspSem);
//  }
//
//  taosReleaseRef(tmqMgmt.rsetId, refId);
//  taosMemoryFree(param);
//}
L
Liu Jicong 已提交
760

761
/*
 * Response callback for the heartbeat message: releases the response buffers when a
 * response is present. `param` and `code` are ignored. Always returns 0.
 */
int32_t tmqHbCb(void* param, SDataBuf* pMsg, int32_t code) {
  if (pMsg == NULL) {
    return 0;
  }

  taosMemoryFree(pMsg->pData);
  taosMemoryFree(pMsg->pEpSet);
  return 0;
}

void tmqSendHbReq(void* param, void* tmrId) {
770
  int64_t refId = *(int64_t*)param;
771

X
Xiaoyu Wang 已提交
772
  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
773
  if (tmq == NULL) {
L
Liu Jicong 已提交
774
    taosMemoryFree(param);
775 776
    return;
  }
D
dapan1121 已提交
777 778 779 780

  SMqHbReq req = {0};
  req.consumerId = tmq->consumerId;
  req.epoch = tmq->epoch;
wmmhello's avatar
wmmhello 已提交
781
  taosRLockLatch(&tmq->lock);
wmmhello's avatar
wmmhello 已提交
782
//  if(tmq->needReportOffsetRows){
783 784 785 786 787 788 789 790 791 792 793 794
    req.topics = taosArrayInit(taosArrayGetSize(tmq->clientTopics), sizeof(TopicOffsetRows));
    for(int i = 0; i < taosArrayGetSize(tmq->clientTopics); i++){
      SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
      int32_t         numOfVgroups = taosArrayGetSize(pTopic->vgs);
      TopicOffsetRows* data = taosArrayReserve(req.topics, 1);
      strcpy(data->topicName, pTopic->topicName);
      data->offsetRows = taosArrayInit(numOfVgroups, sizeof(OffsetRows));
      for(int j = 0; j < numOfVgroups; j++){
        SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);
        OffsetRows* offRows = taosArrayReserve(data->offsetRows, 1);
        offRows->vgId = pVg->vgId;
        offRows->rows = pVg->numOfRows;
795
        offRows->offset = pVg->offsetInfo.beginOffset;
796 797
        char buf[TSDB_OFFSET_LEN] = {0};
        tFormatOffset(buf, TSDB_OFFSET_LEN, &offRows->offset);
wmmhello's avatar
wmmhello 已提交
798
        tscInfo("consumer:0x%" PRIx64 ",report offset: vgId:%d, offset:%s, rows:%"PRId64, tmq->consumerId, offRows->vgId, buf, offRows->rows);
799
      }
800
    }
wmmhello's avatar
wmmhello 已提交
801 802
//    tmq->needReportOffsetRows = false;
//  }
wmmhello's avatar
wmmhello 已提交
803
  taosRUnLockLatch(&tmq->lock);
D
dapan1121 已提交
804

L
Liu Jicong 已提交
805
  int32_t tlen = tSerializeSMqHbReq(NULL, 0, &req);
D
dapan1121 已提交
806 807
  if (tlen < 0) {
    tscError("tSerializeSMqHbReq failed");
808
    goto OVER;
D
dapan1121 已提交
809
  }
810

L
Liu Jicong 已提交
811
  void* pReq = taosMemoryCalloc(1, tlen);
D
dapan1121 已提交
812 813
  if (tlen < 0) {
    tscError("failed to malloc MqHbReq msg, size:%d", tlen);
814
    goto OVER;
D
dapan1121 已提交
815
  }
816

D
dapan1121 已提交
817 818 819
  if (tSerializeSMqHbReq(pReq, tlen, &req) < 0) {
    tscError("tSerializeSMqHbReq %d failed", tlen);
    taosMemoryFree(pReq);
820
    goto OVER;
D
dapan1121 已提交
821
  }
822 823 824 825

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pReq);
L
Liu Jicong 已提交
826
    goto OVER;
827
  }
828

829
  sendInfo->msgInfo = (SDataBuf){ .pData = pReq, .len = tlen, .handle = NULL };
830 831 832 833 834

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = NULL;
  sendInfo->fp = tmqHbCb;
L
Liu Jicong 已提交
835
  sendInfo->msgType = TDMT_MND_TMQ_HB;
836 837 838 839 840 841 842

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

OVER:
843
  tDeatroySMqHbReq(&req);
844
  taosTmrReset(tmqSendHbReq, 1000, param, tmqMgmt.timer, &tmq->hbLiveTimer);
845
  taosReleaseRef(tmqMgmt.rsetId, refId);
846 847
}

848 849
// Commit callback used when the consumer has no user-supplied one: it only
// logs a failed offset commit. `param` is not used.
static void defaultCommitCbFn(tmq_t* pTmq, int32_t code, void* param) {
  if (code == 0) {
    return;  // commit succeeded, nothing to report
  }

  tscError("consumer:0x%" PRIx64 ", failed to commit offset, code:%s", pTmq->consumerId, tstrerror(code));
}

854
/*
 * Drain pTmq->delayedTask and run every queued task.
 *
 *  - TMQ_DELAYED_TASK__ASK_EP: issue an async ask-ep request and re-arm the
 *    ep timer to fire again in 1s.
 *  - TMQ_DELAYED_TASK__COMMIT: issue an async commit of all offsets (using the
 *    user callback, or defaultCommitCbFn when none is set) and re-arm the
 *    commit timer with the configured auto-commit interval.
 *  - TMQ_DELAYED_TASK__REPORT: currently a no-op.
 *
 * Each timer receives a heap-allocated copy of the consumer refId as its
 * parameter. If that allocation fails the corresponding timer is NOT re-armed,
 * the remaining tasks are still processed, and TSDB_CODE_OUT_OF_MEMORY is
 * returned.
 *
 * Returns TSDB_CODE_SUCCESS (0) on success, TSDB_CODE_OUT_OF_MEMORY otherwise.
 */
int32_t tmqHandleAllDelayedTask(tmq_t* pTmq) {
  STaosQall* qall = taosAllocateQall();
  if (qall == NULL) {
    tscError("consumer:0x%" PRIx64 " failed to allocate qall for delayed tasks", pTmq->consumerId);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  taosReadAllQitems(pTmq->delayedTask, qall);

  if (qall->numOfItems == 0) {
    taosFreeQall(qall);
    return TSDB_CODE_SUCCESS;
  }

  tscDebug("consumer:0x%" PRIx64 " handle delayed %d tasks before poll data", pTmq->consumerId, qall->numOfItems);

  int32_t code = TSDB_CODE_SUCCESS;
  int8_t* pTaskType = NULL;
  taosGetQitem(qall, (void**)&pTaskType);

  while (pTaskType != NULL) {
    if (*pTaskType == TMQ_DELAYED_TASK__ASK_EP) {
      asyncAskEp(pTmq, addToQueueCallbackFn, NULL);

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
      if (pRefId == NULL) {
        tscError("consumer:0x%" PRIx64 " failed to re-arm ep timer since out of memory", pTmq->consumerId);
        code = TSDB_CODE_OUT_OF_MEMORY;
      } else {
        *pRefId = pTmq->refId;

        tscDebug("consumer:0x%" PRIx64 " retrieve ep from mnode in 1s", pTmq->consumerId);
        taosTmrReset(tmqAssignAskEpTask, 1000, pRefId, tmqMgmt.timer, &pTmq->epTimer);
      }
    } else if (*pTaskType == TMQ_DELAYED_TASK__COMMIT) {
      tmq_commit_cb* pCallbackFn = pTmq->commitCb ? pTmq->commitCb : defaultCommitCbFn;

      asyncCommitAllOffsets(pTmq, pCallbackFn, pTmq->commitCbUserParam);

      int64_t* pRefId = taosMemoryMalloc(sizeof(int64_t));
      if (pRefId == NULL) {
        tscError("consumer:0x%" PRIx64 " failed to re-arm commit timer since out of memory", pTmq->consumerId);
        code = TSDB_CODE_OUT_OF_MEMORY;
      } else {
        *pRefId = pTmq->refId;

        tscDebug("consumer:0x%" PRIx64 " next commit to vnode(s) in %.2fs", pTmq->consumerId,
                 pTmq->autoCommitInterval / 1000.0);
        taosTmrReset(tmqAssignDelayedCommitTask, pTmq->autoCommitInterval, pRefId, tmqMgmt.timer, &pTmq->commitTimer);
      }
    } else if (*pTaskType == TMQ_DELAYED_TASK__REPORT) {
      // nothing to do for report tasks
    }

    taosFreeQitem(pTaskType);
    taosGetQitem(qall, (void**)&pTaskType);
  }

  taosFreeQall(qall);
  return code;
}

897
/*
 * Release the payload owned by a response wrapper, dispatching on its
 * tmqRspType. The wrapper itself is NOT freed here; callers release it with
 * taosFreeQitem(). Always returns NULL.
 */
static void* tmqFreeRspWrapper(SMqRspWrapper* rspWrapper) {
  switch (rspWrapper->tmqRspType) {
    case TMQ_MSG_TYPE__EP_RSP: {
      SMqAskEpRspWrapper* pEpWrapper = (SMqAskEpRspWrapper*)rspWrapper;
      tDeleteSMqAskEpRsp(&pEpWrapper->msg);
      break;
    }

    case TMQ_MSG_TYPE__POLL_RSP: {
      SMqPollRspWrapper* pPoll = (SMqPollRspWrapper*)rspWrapper;
      taosMemoryFreeClear(pPoll->pEpset);

      taosArrayDestroyP(pPoll->dataRsp.blockData, taosMemoryFree);
      taosArrayDestroy(pPoll->dataRsp.blockDataLen);
      taosArrayDestroyP(pPoll->dataRsp.blockTbName, taosMemoryFree);
      taosArrayDestroyP(pPoll->dataRsp.blockSchema, (FDelete)tDeleteSchemaWrapper);
      break;
    }

    case TMQ_MSG_TYPE__POLL_META_RSP: {
      SMqPollRspWrapper* pPoll = (SMqPollRspWrapper*)rspWrapper;
      taosMemoryFreeClear(pPoll->pEpset);

      taosMemoryFree(pPoll->metaRsp.metaRsp);
      break;
    }

    case TMQ_MSG_TYPE__TAOSX_RSP: {
      SMqPollRspWrapper* pPoll = (SMqPollRspWrapper*)rspWrapper;
      taosMemoryFreeClear(pPoll->pEpset);

      taosArrayDestroyP(pPoll->taosxRsp.blockData, taosMemoryFree);
      taosArrayDestroy(pPoll->taosxRsp.blockDataLen);
      taosArrayDestroyP(pPoll->taosxRsp.blockTbName, taosMemoryFree);
      taosArrayDestroyP(pPoll->taosxRsp.blockSchema, (FDelete)tDeleteSchemaWrapper);
      // taosx-only members
      taosArrayDestroy(pPoll->taosxRsp.createTableLen);
      taosArrayDestroyP(pPoll->taosxRsp.createTableReq, taosMemoryFree);
      break;
    }

    case TMQ_MSG_TYPE__END_RSP:
    default:
      // end-of-data marker and unknown types carry no payload to free
      break;
  }

  return NULL;
}

L
Liu Jicong 已提交
932
void tmqClearUnhandleMsg(tmq_t* tmq) {
L
Liu Jicong 已提交
933
  SMqRspWrapper* rspWrapper = NULL;
L
Liu Jicong 已提交
934
  while (1) {
L
Liu Jicong 已提交
935 936 937 938 939
    taosGetQitem(tmq->qall, (void**)&rspWrapper);
    if (rspWrapper) {
      tmqFreeRspWrapper(rspWrapper);
      taosFreeQitem(rspWrapper);
    } else {
L
Liu Jicong 已提交
940
      break;
L
Liu Jicong 已提交
941
    }
L
Liu Jicong 已提交
942 943
  }

L
Liu Jicong 已提交
944
  rspWrapper = NULL;
L
Liu Jicong 已提交
945 946
  taosReadAllQitems(tmq->mqueue, tmq->qall);
  while (1) {
L
Liu Jicong 已提交
947 948 949 950 951
    taosGetQitem(tmq->qall, (void**)&rspWrapper);
    if (rspWrapper) {
      tmqFreeRspWrapper(rspWrapper);
      taosFreeQitem(rspWrapper);
    } else {
L
Liu Jicong 已提交
952
      break;
L
Liu Jicong 已提交
953
    }
L
Liu Jicong 已提交
954 955 956
  }
}

D
dapan1121 已提交
957
/*
 * Response callback for the subscribe request sent by tmq_subscribe().
 *
 * param: SMqSubscribeCbParam* owned by the waiting tmq_subscribe() caller.
 * pMsg:  response buffers; both pData and pEpSet are released here, matching
 *        the other response callbacks in this file (tmqPollCb, askEpCallbackFn).
 * code:  result code of the request, stored in pParam->rspErr.
 *
 * Always returns 0.
 */
int32_t tmqSubscribeCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqSubscribeCbParam* pParam = (SMqSubscribeCbParam*)param;
  pParam->rspErr = code;

  if (pMsg != NULL) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
  }

  // Must be the last access to pParam: tmq_subscribe() keeps it on its stack
  // and may return as soon as the semaphore is posted.
  tsem_post(&pParam->rspSem);
  return 0;
}
965

L
Liu Jicong 已提交
966
/*
 * Append the names of all topics the consumer currently tracks to *topics.
 *
 * If *topics is NULL a new list is created and stored there. Each stored topic
 * name has everything up to and including its first '.' stripped; a name
 * without a '.' is appended unchanged instead of dereferencing an invalid
 * pointer.
 *
 * Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY if the list cannot be created.
 */
int32_t tmq_subscription(tmq_t* tmq, tmq_list_t** topics) {
  if (*topics == NULL) {
    *topics = tmq_list_new();
    if (*topics == NULL) {
      return TSDB_CODE_OUT_OF_MEMORY;
    }
  }

  taosRLockLatch(&tmq->lock);

  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
  for (int32_t i = 0; i < numOfTopics; i++) {
    SMqClientTopic* topic = taosArrayGet(tmq->clientTopics, i);

    char* dot = strchr(topic->topicName, '.');
    tmq_list_append(*topics, (dot != NULL) ? dot + 1 : topic->topicName);
  }

  taosRUnLockLatch(&tmq->lock);
  return 0;
}

L
Liu Jicong 已提交
979
/*
 * Unsubscribe from all topics by subscribing to an empty topic list.
 *
 * When auto-commit is enabled the current offsets are committed synchronously
 * first; a commit failure aborts the call and its code is returned. The
 * subscribe request is retried every 500ms while the mnode answers
 * TSDB_CODE_MND_CONSUMER_NOT_READY, giving up once the retry counter exceeds 5.
 *
 * Returns the result of the last tmq_subscribe() call, the commit error, or
 * TSDB_CODE_OUT_OF_MEMORY if the empty list cannot be allocated.
 */
int32_t tmq_unsubscribe(tmq_t* tmq) {
  if (tmq->autoCommit) {
    int32_t commitCode = tmq_commit_sync(tmq, NULL);
    if (commitCode != 0) {
      return commitCode;
    }
  }
  taosSsleep(2);  // sleep 2s for hb to send offset and rows to server

  tmq_list_t* lst = tmq_list_new();
  if (lst == NULL) {
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  int32_t rsp = 0;
  int32_t retryCnt = 0;
  for (;;) {
    rsp = tmq_subscribe(tmq, lst);
    if (rsp != TSDB_CODE_MND_CONSUMER_NOT_READY || retryCnt > 5) {
      break;
    }

    retryCnt++;
    taosMsleep(500);
  }

  tmq_list_destroy(lst);
  return rsp;
}

1005 1006 1007 1008 1009 1010
static void freeClientVgImpl(void* param) {
  SMqClientTopic* pTopic = param;
  taosMemoryFreeClear(pTopic->schema.pSchema);
  taosArrayDestroy(pTopic->vgs);
}

1011
void tmqFreeImpl(void* handle) {
1012 1013
  tmq_t*  tmq = (tmq_t*)handle;
  int64_t id = tmq->consumerId;
L
Liu Jicong 已提交
1014

1015
  // TODO stop timer
L
Liu Jicong 已提交
1016 1017 1018 1019
  if (tmq->mqueue) {
    tmqClearUnhandleMsg(tmq);
    taosCloseQueue(tmq->mqueue);
  }
L
Liu Jicong 已提交
1020

H
Haojun Liao 已提交
1021 1022 1023 1024 1025
  if (tmq->delayedTask) {
    taosCloseQueue(tmq->delayedTask);
  }

  taosFreeQall(tmq->qall);
1026
  tsem_destroy(&tmq->rspSem);
L
Liu Jicong 已提交
1027

1028
  taosArrayDestroyEx(tmq->clientTopics, freeClientVgImpl);
1029 1030
  taos_close_internal(tmq->pTscObj);
  taosMemoryFree(tmq);
1031 1032

  tscDebug("consumer:0x%" PRIx64 " closed", id);
L
Liu Jicong 已提交
1033 1034
}

1035 1036 1037 1038 1039 1040 1041 1042 1043
static void tmqMgmtInit(void) {
  tmqInitRes = 0;
  tmqMgmt.timer = taosTmrInit(1000, 100, 360000, "TMQ");

  if (tmqMgmt.timer == NULL) {
    tmqInitRes = TSDB_CODE_OUT_OF_MEMORY;
  }

  tmqMgmt.rsetId = taosOpenRef(10000, tmqFreeImpl);
1044
  if (tmqMgmt.rsetId < 0) {
1045 1046 1047 1048
    tmqInitRes = terrno;
  }
}

L
Liu Jicong 已提交
1049
/*
 * Create a new consumer from `conf`.
 *
 * Steps: one-time management init, allocate the consumer, initialise its
 * response semaphore, create its queues, copy the configuration, connect to
 * the server, register the consumer in the reference set and, if background
 * heartbeat is enabled, start the heartbeat timer.
 *
 * errstr / errstrLen are not written by this implementation; failures are
 * reported through the log and, where set, terrno.
 *
 * Returns the new consumer, or NULL on failure.
 */
tmq_t* tmq_consumer_new(tmq_conf_t* conf, char* errstr, int32_t errstrLen) {
  taosThreadOnce(&tmqInit, tmqMgmtInit);
  if (tmqInitRes != 0) {
    terrno = tmqInitRes;
    return NULL;
  }

  tmq_t* pTmq = taosMemoryCalloc(1, sizeof(tmq_t));
  if (pTmq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    tscError("failed to create consumer, groupId:%s, code:%s", conf->groupId, terrstr());
    return NULL;
  }

  // assign consumerId first so that every log line below carries it
  pTmq->consumerId = tGenIdPI64();

  // Initialise the semaphore before anything that can jump to _failed:
  // tmqFreeImpl() destroys it unconditionally, so it has to be valid there and
  // must not be destroyed anywhere else in this function.
  if (tsem_init(&pTmq->rspSem, 0, 0) != 0) {
    terrno = TSDB_CODE_TSC_INTERNAL_ERROR;
    tscError("consumer:0x%" PRIx64 " setup failed since %s, consumer group %s", pTmq->consumerId, terrstr(),
             conf->groupId);
    taosMemoryFree(pTmq);
    return NULL;
  }

  int64_t*    pHbRefId = NULL;  // heartbeat timer parameter, owned by the timer once started
  const char* user = conf->user == NULL ? TSDB_DEFAULT_USER : conf->user;
  const char* pass = conf->pass == NULL ? TSDB_DEFAULT_PASS : conf->pass;

  pTmq->clientTopics = taosArrayInit(0, sizeof(SMqClientTopic));
  pTmq->mqueue = taosOpenQueue();
  pTmq->delayedTask = taosOpenQueue();
  pTmq->qall = taosAllocateQall();

  if (pTmq->clientTopics == NULL || pTmq->mqueue == NULL || pTmq->qall == NULL || pTmq->delayedTask == NULL ||
      conf->groupId[0] == 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    // pTmq->groupId has not been filled in yet, so log the configured one
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(), conf->groupId);
    goto _failed;
  }

  // init status
  pTmq->status = TMQ_CONSUMER_STATUS__INIT;
  pTmq->pollCnt = 0;
  pTmq->epoch = 0;

  // set conf
  strcpy(pTmq->clientId, conf->clientId);
  strcpy(pTmq->groupId, conf->groupId);
  pTmq->withTbName = conf->withTbName;
  pTmq->useSnapshot = conf->snapEnable;
  pTmq->autoCommit = conf->autoCommit;
  pTmq->autoCommitInterval = conf->autoCommitInterval;
  pTmq->commitCb = conf->commitCb;
  pTmq->commitCbUserParam = conf->commitCbUserParam;
  pTmq->resetOffsetCfg = conf->resetOffset;
  taosInitRWLatch(&pTmq->lock);

  pTmq->hbBgEnable = conf->hbBgEnable;

  // init connection
  pTmq->pTscObj = taos_connect_internal(conf->ip, user, pass, NULL, NULL, conf->port, CONN_TYPE__TMQ);
  if (pTmq->pTscObj == NULL) {
    tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(), pTmq->groupId);
    goto _failed;
  }

  // Allocate the heartbeat timer parameter before the consumer is handed to
  // the reference set, so a failure can still be cleaned up via _failed.
  if (pTmq->hbBgEnable) {
    pHbRefId = taosMemoryMalloc(sizeof(int64_t));
    if (pHbRefId == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      tscError("consumer:0x%" PRIx64 " setup failed since %s, groupId:%s", pTmq->consumerId, terrstr(), pTmq->groupId);
      goto _failed;
    }
  }

  pTmq->refId = taosAddRef(tmqMgmt.rsetId, pTmq);
  if (pTmq->refId < 0) {
    goto _failed;
  }

  if (pHbRefId != NULL) {
    *pHbRefId = pTmq->refId;
    pTmq->hbLiveTimer = taosTmrStart(tmqSendHbReq, 1000, pHbRefId, tmqMgmt.timer);
    pHbRefId = NULL;
  }

  char         buf[TSDB_OFFSET_LEN] = {0};
  STqOffsetVal offset = {.type = pTmq->resetOffsetCfg};
  tFormatOffset(buf, tListLen(buf), &offset);
  tscInfo("consumer:0x%" PRIx64 " is setup, refId:%" PRId64
          ", groupId:%s, snapshot:%d, autoCommit:%d, commitInterval:%dms, offset:%s, backgroudHB:%d",
          pTmq->consumerId, pTmq->refId, pTmq->groupId, pTmq->useSnapshot, pTmq->autoCommit, pTmq->autoCommitInterval,
          buf, pTmq->hbBgEnable);

  return pTmq;

_failed:
  taosMemoryFree(pHbRefId);
  tmqFreeImpl(pTmq);
  return NULL;
}

L
Liu Jicong 已提交
1142
/*
 * Subscribe the consumer to the topics in `topic_list` (an empty list
 * unsubscribes from everything).
 *
 * Builds and serialises an SCMSubscribeReq, sends it to the mnode and blocks
 * until tmqSubscribeCb() posts the response. Then it polls doAskEp() every
 * 500ms while the mnode reports TSDB_CODE_MND_CONSUMER_NOT_READY, for at most
 * MAX_RETRY_COUNT retries, and finally starts the ask-ep timer and, with
 * auto-commit enabled, the commit timer if they are not running yet.
 *
 * Returns 0 on success or an error code: TSDB_CODE_OUT_OF_MEMORY for any
 * failed allocation, TSDB_CODE_TSC_INTERNAL_ERROR if the semaphore cannot be
 * created, the server's response code, or TSDB_CODE_MND_CONSUMER_NOT_READY
 * when the retries are exhausted.
 */
int32_t tmq_subscribe(tmq_t* tmq, const tmq_list_t* topic_list) {
  const int32_t   MAX_RETRY_COUNT = 120 * 2;  // let's wait for 2 mins at most
  const SArray*   container = &topic_list->container;
  int32_t         sz = taosArrayGetSize(container);
  void*           buf = NULL;
  SMsgSendInfo*   sendInfo = NULL;
  SCMSubscribeReq req = {0};
  int32_t         code = 0;

  tscInfo("consumer:0x%" PRIx64 " cgroup:%s, subscribe %d topics", tmq->consumerId, tmq->groupId, sz);

  req.consumerId = tmq->consumerId;
  tstrncpy(req.clientId, tmq->clientId, 256);
  tstrncpy(req.cgroup, tmq->groupId, TSDB_CGROUP_LEN);
  req.topicNames = taosArrayInit(sz, sizeof(void*));

  if (req.topicNames == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  req.withTbName = tmq->withTbName;
  req.autoCommit = tmq->autoCommit;
  req.autoCommitInterval = tmq->autoCommitInterval;
  req.resetOffsetCfg = tmq->resetOffsetCfg;

  for (int32_t i = 0; i < sz; i++) {
    char* topic = taosArrayGetP(container, i);

    SName name = {0};
    tNameSetDbName(&name, tmq->pTscObj->acctId, topic, strlen(topic));
    char* topicFName = taosMemoryCalloc(1, TSDB_TOPIC_FNAME_LEN);
    if (topicFName == NULL) {
      // without an error code the caller would see this failure as success
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }

    tNameExtractFullName(&name, topicFName);
    tscInfo("consumer:0x%" PRIx64 " subscribe topic:%s", tmq->consumerId, topicFName);

    taosArrayPush(req.topicNames, &topicFName);
  }

  // first call computes the encoded length, second call fills the buffer
  int32_t tlen = tSerializeSCMSubscribeReq(NULL, &req);

  buf = taosMemoryMalloc(tlen);
  if (buf == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  void* abuf = buf;
  tSerializeSCMSubscribeReq(&abuf, &req);

  sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto FAIL;
  }

  SMqSubscribeCbParam param = {.rspErr = 0};
  if (tsem_init(&param.rspSem, 0, 0) != 0) {
    code = TSDB_CODE_TSC_INTERNAL_ERROR;
    goto FAIL;
  }

  sendInfo->msgInfo = (SDataBuf){.pData = buf, .len = tlen, .handle = NULL};

  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = &param;
  sendInfo->fp = tmqSubscribeCb;
  sendInfo->msgType = TDMT_MND_TMQ_SUBSCRIBE;

  SEpSet epSet = getEpSet_s(&tmq->pTscObj->pAppInfo->mgmtEp);

  int64_t transporterId = 0;
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, sendInfo);

  // avoid double free if msg is sent
  buf = NULL;
  sendInfo = NULL;

  // `param` lives on this stack frame, so wait for the callback before going on
  tsem_wait(&param.rspSem);
  tsem_destroy(&param.rspSem);

  if (param.rspErr != 0) {
    code = param.rspErr;
    goto FAIL;
  }

  int32_t retryCnt = 0;
  while (TSDB_CODE_MND_CONSUMER_NOT_READY == doAskEp(tmq)) {
    if (retryCnt++ > MAX_RETRY_COUNT) {
      tscError("consumer:0x%" PRIx64 ", mnd not ready for subscribe, retry:%d in 500ms", tmq->consumerId, retryCnt);
      code = TSDB_CODE_MND_CONSUMER_NOT_READY;
      goto FAIL;
    }

    tscInfo("consumer:0x%" PRIx64 ", mnd not ready for subscribe, retry:%d in 500ms", tmq->consumerId, retryCnt);
    taosMsleep(500);
  }

  // init ep timer
  if (tmq->epTimer == NULL) {
    int64_t* pRefId1 = taosMemoryMalloc(sizeof(int64_t));
    if (pRefId1 == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }
    *pRefId1 = tmq->refId;
    tmq->epTimer = taosTmrStart(tmqAssignAskEpTask, 1000, pRefId1, tmqMgmt.timer);
  }

  // init auto commit timer
  if (tmq->autoCommit && tmq->commitTimer == NULL) {
    int64_t* pRefId2 = taosMemoryMalloc(sizeof(int64_t));
    if (pRefId2 == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto FAIL;
    }
    *pRefId2 = tmq->refId;
    tmq->commitTimer = taosTmrStart(tmqAssignDelayedCommitTask, tmq->autoCommitInterval, pRefId2, tmqMgmt.timer);
  }

FAIL:
  // shared exit for success and failure; buf/sendInfo are NULL once sent
  taosArrayDestroyP(req.topicNames, taosMemoryFree);
  taosMemoryFree(buf);
  taosMemoryFree(sendInfo);

  return code;
}

L
Liu Jicong 已提交
1266
// Store the commit callback `cb` and its user argument `param` in the
// configuration; tmq_consumer_new() copies both into the consumer.
void tmq_conf_set_auto_commit_cb(tmq_conf_t* conf, tmq_commit_cb* cb, void* param) {
  conf->commitCbUserParam = param;
  conf->commitCb = cb;
}
1270

wmmhello's avatar
wmmhello 已提交
1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298
// Find the vgroup entry `vgId` of topic `topicName` in tmq->clientTopics.
// Returns NULL when no such topic/vgroup pair exists. The function takes no
// lock itself.
static SMqClientVg* getVgInfo(tmq_t* tmq, char* topicName, int32_t vgId) {
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);

  for (int t = 0; t < numOfTopics; ++t) {
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, t);
    if (strcmp(pTopic->topicName, topicName) != 0) {
      continue;
    }

    int32_t numOfVgs = taosArrayGetSize(pTopic->vgs);
    for (int32_t v = 0; v < numOfVgs; ++v) {
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, v);
      if (pVg->vgId == vgId) {
        return pVg;
      }
    }
  }

  return NULL;
}

// Return the first entry of tmq->clientTopics whose topicName equals
// `topicName`, or NULL if there is none.
static SMqClientTopic* getTopicInfo(tmq_t* tmq, char* topicName) {
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);

  int idx = 0;
  while (idx < numOfTopics) {
    SMqClientTopic* pCandidate = taosArrayGet(tmq->clientTopics, idx);
    if (strcmp(pCandidate->topicName, topicName) == 0) {
      return pCandidate;
    }
    ++idx;
  }

  return NULL;
}

D
dapan1121 已提交
1299
/*
 * Response callback of a poll request sent to one vgroup.
 *
 * param: SMqPollCbParam* describing the request (consumer refId, epoch, vgId,
 *        topic name, request id); always freed here.
 * pMsg:  response buffers. pData is always freed here; pEpSet is freed here
 *        unless it is handed over to the queued response wrapper.
 * code:  result code of the request.
 *
 * On success the decoded response is wrapped in an SMqPollRspWrapper and
 * written to tmq->mqueue. On failure the vgroup is put back to
 * TMQ_VG_STATUS__IDLE if the consumer is still in the epoch the request was
 * sent in. Whenever the consumer is still alive, tmq->rspSem is posted.
 *
 * Returns 0 when the response was queued or discarded as stale, -1 otherwise.
 */
int32_t tmqPollCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqPollCbParam* pParam = (SMqPollCbParam*)param;

  int64_t refId = pParam->refId;

  tmq_t* tmq = taosAcquireRef(tmqMgmt.rsetId, refId);
  if (tmq == NULL) {
    // consumer is already gone: only release what this callback owns
    taosMemoryFree(pParam);
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    return -1;
  }

  int32_t  epoch = pParam->epoch;
  int32_t  vgId = pParam->vgId;
  uint64_t requestId = pParam->requestId;

  if (code != 0) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);

    if (code == TSDB_CODE_TMQ_CONSUMER_MISMATCH) {
      // consumer mismatch: switch to RECOVER and let the caller retry
      atomic_store_8(&tmq->status, TMQ_CONSUMER_STATUS__RECOVER);
      tscDebug("consumer:0x%" PRIx64 " wait for the re-balance, wait for 500ms and set status to be RECOVER",
               tmq->consumerId);
    } else if (code == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
      // queue an END_RSP marker for the poller
      SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
      if (pRspWrapper == NULL) {
        tscWarn("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d since out of memory, reqId:0x%" PRIx64,
                tmq->consumerId, vgId, epoch, requestId);
        goto CREATE_MSG_FAIL;
      }

      pRspWrapper->tmqRspType = TMQ_MSG_TYPE__END_RSP;
      taosWriteQitem(tmq->mqueue, pRspWrapper);
    } else {
      tscError("consumer:0x%" PRIx64 " msg from vgId:%d discarded, epoch %d, since %s, reqId:0x%" PRIx64, tmq->consumerId,
               vgId, epoch, tstrerror(code), requestId);
    }

    goto CREATE_MSG_FAIL;
  }

  int32_t msgEpoch = ((SMqRspHead*)pMsg->pData)->epoch;
  int32_t clientEpoch = atomic_load_32(&tmq->epoch);
  if (msgEpoch < clientEpoch) {
    // do not write into queue since updating epoch reset
    tscWarn("consumer:0x%" PRIx64
            " msg discard from vgId:%d since from earlier epoch, rsp epoch %d, current epoch %d, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, msgEpoch, clientEpoch, requestId);

    tsem_post(&tmq->rspSem);
    taosReleaseRef(tmqMgmt.rsetId, refId);

    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    taosMemoryFree(pParam);

    return 0;
  }

  if (msgEpoch != clientEpoch) {
    tscWarn("consumer:0x%" PRIx64 " mismatch rsp from vgId:%d, epoch %d, current epoch %d, reqId:0x%" PRIx64,
            tmq->consumerId, vgId, msgEpoch, clientEpoch, requestId);
  }

  // handle meta rsp
  int8_t rspType = ((SMqRspHead*)pMsg->pData)->mqMsgType;

  SMqPollRspWrapper* pRspWrapper = taosAllocateQitem(sizeof(SMqPollRspWrapper), DEF_QITEM, 0);
  if (pRspWrapper == NULL) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
    tscWarn("consumer:0x%" PRIx64 " msg discard from vgId:%d, epoch %d since out of memory", tmq->consumerId, vgId,
            epoch);
    goto CREATE_MSG_FAIL;
  }

  pRspWrapper->tmqRspType = rspType;
  pRspWrapper->reqId = requestId;
  pRspWrapper->pEpset = pMsg->pEpSet;  // ownership moves to the wrapper
  pRspWrapper->vgId = vgId;
  strcpy(pRspWrapper->topicName, pParam->topicName);

  pMsg->pEpSet = NULL;

  // Each branch decodes the body that follows the SMqRspHead and then copies
  // the head itself over the start of the decoded response structure.
  if (rspType == TMQ_MSG_TYPE__POLL_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeMqDataRsp(&decoder, &pRspWrapper->dataRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->dataRsp, pMsg->pData, sizeof(SMqRspHead));

    char buf[TSDB_OFFSET_LEN] = {0};
    tFormatOffset(buf, TSDB_OFFSET_LEN, &pRspWrapper->dataRsp.rspOffset);
    tscDebug("consumer:0x%" PRIx64 " recv poll rsp, vgId:%d, req ver:%" PRId64 ", rsp:%s type %d, reqId:0x%" PRIx64,
             tmq->consumerId, vgId, pRspWrapper->dataRsp.reqOffset.version, buf, rspType, requestId);
  } else if (rspType == TMQ_MSG_TYPE__POLL_META_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeMqMetaRsp(&decoder, &pRspWrapper->metaRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->metaRsp, pMsg->pData, sizeof(SMqRspHead));
  } else if (rspType == TMQ_MSG_TYPE__TAOSX_RSP) {
    SDecoder decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeSTaosxRsp(&decoder, &pRspWrapper->taosxRsp);
    tDecoderClear(&decoder);
    memcpy(&pRspWrapper->taosxRsp, pMsg->pData, sizeof(SMqRspHead));
  } else {  // invalid rspType
    tscError("consumer:0x%" PRIx64 " invalid rsp msg received, type:%d ignored", tmq->consumerId, rspType);
  }

  taosMemoryFree(pMsg->pData);
  taosWriteQitem(tmq->mqueue, pRspWrapper);

  int32_t total = taosQueueItemSize(tmq->mqueue);
  tscDebug("consumer:0x%" PRIx64 " put poll res into mqueue, type:%d, vgId:%d, total in queue:%d, reqId:0x%" PRIx64,
           tmq->consumerId, rspType, vgId, total, requestId);

  tsem_post(&tmq->rspSem);
  taosReleaseRef(tmqMgmt.rsetId, refId);
  taosMemoryFree(pParam);

  return 0;

CREATE_MSG_FAIL:
  // epoch is written with atomic_store_32 elsewhere, so read it atomically too
  if (epoch == atomic_load_32(&tmq->epoch)) {
    taosWLockLatch(&tmq->lock);
    SMqClientVg* pVg = getVgInfo(tmq, pParam->topicName, vgId);
    if (pVg) {
      atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
    }
    taosWUnLockLatch(&tmq->lock);
  }

  tsem_post(&tmq->rspSem);
  taosReleaseRef(tmqMgmt.rsetId, refId);
  taosMemoryFree(pParam);

  return -1;
}

H
Haojun Liao 已提交
1450
typedef struct SVgroupSaveInfo {
wmmhello's avatar
wmmhello 已提交
1451 1452
  STqOffsetVal currentOffset;
  STqOffsetVal commitOffset;
1453
  STqOffsetVal seekOffset;
H
Haojun Liao 已提交
1454 1455 1456
  int64_t      numOfRows;
} SVgroupSaveInfo;

H
Haojun Liao 已提交
1457 1458 1459 1460 1461 1462
/*
 * Fill the client-side topic `pTopic` from one topic entry of an ask-ep
 * response.
 *
 * The schema is moved out of `pTopicEp` (its copy is cleared), names are
 * copied, and one SMqClientVg is created per vgroup in the response. A vgroup
 * that has an entry in `pVgOffsetHashMap` (keyed by makeTopicVgroupKey) gets
 * its saved offsets and row count back; any other vgroup starts from an offset
 * whose type is tmq->resetOffsetCfg and a row count of 0.
 */
static void initClientTopicFromRsp(SMqClientTopic* pTopic, SMqSubTopicEp* pTopicEp, SHashObj* pVgOffsetHashMap,
                                   tmq_t* tmq) {
  // move the schema: the response must not keep a pointer to it
  pTopic->schema = pTopicEp->schema;
  pTopicEp->schema.nCols = 0;
  pTopicEp->schema.pSchema = NULL;

  char    vgKey[TSDB_TOPIC_FNAME_LEN + 22];
  int32_t vgNumGet = taosArrayGetSize(pTopicEp->vgs);

  tstrncpy(pTopic->topicName, pTopicEp->topic, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pTopic->db, pTopicEp->db, TSDB_DB_FNAME_LEN);

  tscInfo("consumer:0x%" PRIx64 ", update topic:%s, new numOfVgs:%d", tmq->consumerId, pTopic->topicName, vgNumGet);
  pTopic->vgs = taosArrayInit(vgNumGet, sizeof(SMqClientVg));

  for (int32_t idx = 0; idx < vgNumGet; idx++) {
    SMqSubVgEp* pVgEp = taosArrayGet(pTopicEp->vgs, idx);

    makeTopicVgroupKey(vgKey, pTopic->topicName, pVgEp->vgId);
    SVgroupSaveInfo* pSaved = taosHashGet(pVgOffsetHashMap, vgKey, strlen(vgKey));

    // offset used for vgroups that have no saved state
    STqOffsetVal resetOffset = {0};
    resetOffset.type = tmq->resetOffsetCfg;

    SMqClientVg vg = {0};
    vg.pollCnt = 0;
    vg.vgId = pVgEp->vgId;
    vg.epSet = pVgEp->epSet;
    vg.vgStatus = TMQ_VG_STATUS__IDLE;
    vg.vgSkipCnt = 0;
    vg.emptyBlockReceiveTs = 0;

    if (pSaved != NULL) {
      vg.numOfRows = pSaved->numOfRows;
      vg.offsetInfo.endOffset = pSaved->currentOffset;
      vg.offsetInfo.committedOffset = pSaved->commitOffset;
      vg.offsetInfo.beginOffset = pSaved->seekOffset;
    } else {
      vg.numOfRows = 0;
      vg.offsetInfo.endOffset = resetOffset;
      vg.offsetInfo.committedOffset = resetOffset;
      vg.offsetInfo.beginOffset = resetOffset;
    }

    vg.offsetInfo.walVerBegin = -1;
    vg.offsetInfo.walVerEnd = -1;
    vg.seekUpdated = false;

    taosArrayPush(pTopic->vgs, &vg);
  }
}

static void freeClientVgInfo(void* param) {
  SMqClientTopic* pTopic = param;
  if (pTopic->schema.nCols) {
    taosMemoryFreeClear(pTopic->schema.pSchema);
  }

  taosArrayDestroy(pTopic->vgs);
}

1512
/*
 * Replace the consumer's topic/vgroup list with the one from an ask-ep
 * response, if `epoch` is newer than the consumer's current epoch.
 *
 * Under the write lock, the offsets and row counts of all current vgroups are
 * saved in a temporary hash map (keyed by makeTopicVgroupKey), the new topic
 * list is built from `pRsp` with initClientTopicFromRsp(), and the old list is
 * destroyed. Afterwards the consumer status becomes NO_TOPIC (empty response)
 * or READY, and the epoch is advanced to `epoch`.
 *
 * NOTE(review): this function returns false on every path, including after a
 * successful update. Callers are not visible here, so that is left unchanged;
 * confirm whether any caller expects true on success.
 */
static bool doUpdateLocalEp(tmq_t* tmq, int32_t epoch, const SMqAskEpRsp* pRsp) {
  int32_t topicNumGet = taosArrayGetSize(pRsp->topics);

  // epoch is published with atomic_store_32 below, so read it atomically too
  int32_t curEpoch = atomic_load_32(&tmq->epoch);
  if (epoch <= curEpoch) {
    return false;
  }

  SArray* newTopics = taosArrayInit(topicNumGet, sizeof(SMqClientTopic));
  if (newTopics == NULL) {
    return false;
  }

  SHashObj* pVgOffsetHashMap = taosHashInit(64, MurmurHash3_32, false, HASH_NO_LOCK);
  if (pVgOffsetHashMap == NULL) {
    taosArrayDestroy(newTopics);
    return false;
  }

  taosWLockLatch(&tmq->lock);
  int32_t topicNumCur = taosArrayGetSize(tmq->clientTopics);

  char vgKey[TSDB_TOPIC_FNAME_LEN + 22];
  tscInfo("consumer:0x%" PRIx64 " update ep epoch from %d to epoch %d, incoming topics:%d, existed topics:%d",
          tmq->consumerId, curEpoch, epoch, topicNumGet, topicNumCur);

  // todo extract method
  // save the state of every current vgroup so it survives the rebuild
  for (int32_t i = 0; i < topicNumCur; i++) {
    SMqClientTopic* pTopicCur = taosArrayGet(tmq->clientTopics, i);
    if (pTopicCur->vgs == NULL) {
      continue;
    }

    int32_t vgNumCur = taosArrayGetSize(pTopicCur->vgs);
    tscInfo("consumer:0x%" PRIx64 ", current vg num: %d", tmq->consumerId, vgNumCur);
    for (int32_t j = 0; j < vgNumCur; j++) {
      SMqClientVg* pVgCur = taosArrayGet(pTopicCur->vgs, j);
      makeTopicVgroupKey(vgKey, pTopicCur->topicName, pVgCur->vgId);

      char buf[TSDB_OFFSET_LEN] = {0};
      tFormatOffset(buf, TSDB_OFFSET_LEN, &pVgCur->offsetInfo.endOffset);
      tscInfo("consumer:0x%" PRIx64 ", epoch:%d vgId:%d vgKey:%s, offset:%s", tmq->consumerId, epoch, pVgCur->vgId,
              vgKey, buf);

      SVgroupSaveInfo info = {.currentOffset = pVgCur->offsetInfo.endOffset,
                              .seekOffset = pVgCur->offsetInfo.beginOffset,
                              .commitOffset = pVgCur->offsetInfo.committedOffset,
                              .numOfRows = pVgCur->numOfRows};
      taosHashPut(pVgOffsetHashMap, vgKey, strlen(vgKey), &info, sizeof(SVgroupSaveInfo));
    }
  }

  // build the new topic list, restoring saved state where a vgroup is kept
  for (int32_t i = 0; i < topicNumGet; i++) {
    SMqClientTopic topic = {0};
    SMqSubTopicEp* pTopicEp = taosArrayGet(pRsp->topics, i);
    initClientTopicFromRsp(&topic, pTopicEp, pVgOffsetHashMap, tmq);
    taosArrayPush(newTopics, &topic);
  }

  taosHashCleanup(pVgOffsetHashMap);

  // destroy current buffered existed topics info
  if (tmq->clientTopics) {
    taosArrayDestroyEx(tmq->clientTopics, freeClientVgInfo);
  }
  tmq->clientTopics = newTopics;
  taosWUnLockLatch(&tmq->lock);

  int8_t flag = (topicNumGet == 0) ? TMQ_CONSUMER_STATUS__NO_TOPIC : TMQ_CONSUMER_STATUS__READY;
  atomic_store_8(&tmq->status, flag);
  atomic_store_32(&tmq->epoch, epoch);

  tscInfo("consumer:0x%" PRIx64 " update topic info completed", tmq->consumerId);
  return false;
}

1583
/**
 * Callback invoked when the response to an "ask endpoint" request (or an error for it) arrives.
 *
 * @param param  heap-allocated SMqAskEpCbParam; released here on every path.
 * @param pMsg   response buffer; pMsg->pData and pMsg->pEpSet are released here on every path.
 * @param code   result code reported for the request.
 * @return TSDB_CODE_TMQ_CONSUMER_CLOSED when the consumer reference can no longer be acquired,
 *         otherwise the incoming `code`.
 */
int32_t askEpCallbackFn(void* param, SDataBuf* pMsg, int32_t code) {
  SMqAskEpCbParam* pParam = (SMqAskEpCbParam*)param;
  tmq_t*           tmq = taosAcquireRef(tmqMgmt.rsetId, pParam->refId);

  if (tmq == NULL) {
    // the consumer is gone: the user callback is not invoked, only the buffers are released below
    terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
    code = terrno;
  } else {
    if (code != TSDB_CODE_SUCCESS) {
      tscError("consumer:0x%" PRIx64 ", get topic endpoint error, code:%s", tmq->consumerId, tstrerror(code));
      pParam->pUserFn(tmq, code, NULL, pParam->pParam);
    } else {
      // tmq's epoch is monotonically increase,
      // so it's safe to discard any old epoch msg.
      // Epoch will only increase when received newer epoch ep msg
      SMqRspHead* head = pMsg->pData;
      int32_t     epoch = atomic_load_32(&tmq->epoch);

      if (head->epoch <= epoch) {
        tscInfo("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, no need to update local ep",
                tmq->consumerId, head->epoch, epoch);

        // status is read atomically, like every other reader of tmq->status in this file
        if (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__RECOVER) {
          // zero-initialised so that the cleanup below never sees indeterminate fields
          SMqAskEpRsp rsp = {0};
          tDecodeSMqAskEpRsp(POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), &rsp);
          int8_t flag =
              (taosArrayGetSize(rsp.topics) == 0) ? TMQ_CONSUMER_STATUS__NO_TOPIC : TMQ_CONSUMER_STATUS__READY;
          atomic_store_8(&tmq->status, flag);
          tDeleteSMqAskEpRsp(&rsp);
        }
      } else {
        tscInfo("consumer:0x%" PRIx64 ", recv ep, msg epoch %d, current epoch %d, update local ep", tmq->consumerId,
                head->epoch, epoch);
      }

      pParam->pUserFn(tmq, code, pMsg, pParam->pParam);
    }

    taosReleaseRef(tmqMgmt.rsetId, pParam->refId);
  }

  // single cleanup tail shared by all paths
  taosMemoryFree(pMsg->pData);
  taosMemoryFree(pMsg->pEpSet);
  taosMemoryFree(pParam);
  return code;
}

L
Liu Jicong 已提交
1640
/**
 * Fill a poll request for one vgroup of one topic.
 *
 * The subscription key is written as "<groupId><TMQ_SEPARATOR><topicName>"; the remaining
 * fields are copied from the consumer and the vgroup, and a fresh request id is generated.
 */
void tmqBuildConsumeReqImpl(SMqPollReq* pReq, tmq_t* tmq, int64_t timeout, SMqClientTopic* pTopic, SMqClientVg* pVg) {
  // subscription key: group id, separator, topic name
  char*   pKey = pReq->subKey;
  int32_t prefixLen = strlen(tmq->groupId);
  memcpy(pKey, tmq->groupId, prefixLen);
  pKey[prefixLen] = TMQ_SEPARATOR;
  strcpy(pKey + prefixLen + 1, pTopic->topicName);

  // consumer-level settings
  pReq->withTbName = tmq->withTbName;
  pReq->consumerId = tmq->consumerId;
  pReq->timeout = timeout;
  pReq->epoch = tmq->epoch;

  // vgroup-level settings: polling resumes from the end offset recorded for the vgroup
  pReq->reqOffset = pVg->offsetInfo.endOffset;
  pReq->head.vgId = pVg->vgId;

  pReq->useSnapshot = tmq->useSnapshot;
  pReq->reqId = generateRequestId();
}

L
Liu Jicong 已提交
1656 1657
/**
 * Build the user-visible meta response object from a poll response wrapper.
 *
 * The topic name, db name and vgroup id are taken from the handles stored in the wrapper,
 * and the meta response is copied by value (shallow copy).
 *
 * @return the new object, or NULL if it cannot be allocated.
 */
SMqMetaRspObj* tmqBuildMetaRspFromWrapper(SMqPollRspWrapper* pWrapper) {
  SMqMetaRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqMetaRspObj));
  if (pRspObj == NULL) {
    // allocation failed: report it instead of dereferencing NULL below
    tscError("failed to allocate meta rsp object, vgId:%d", pWrapper->vgHandle->vgId);
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ_META;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;

  memcpy(&pRspObj->metaRsp, &pWrapper->metaRsp, sizeof(SMqMetaRsp));
  return pRspObj;
}

1667
/**
 * Build the user-visible data response object from a poll response wrapper.
 *
 * @param pWrapper   poll response; its dataRsp is copied by value (shallow copy) into the result.
 * @param pVg        vgroup whose accumulated row counter is increased by the rows in this packet.
 * @param numOfRows  out: number of rows contained in this packet (0 if allocation fails).
 * @return the new object, or NULL if it cannot be allocated.
 */
SMqRspObj* tmqBuildRspFromWrapper(SMqPollRspWrapper* pWrapper, SMqClientVg* pVg, int64_t* numOfRows) {
  (*numOfRows) = 0;

  SMqRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqRspObj));
  if (pRspObj == NULL) {
    // allocation failed: report it instead of dereferencing NULL below
    tscError("failed to allocate data rsp object, vgId:%d", pWrapper->vgHandle->vgId);
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);

  pRspObj->vgId = pWrapper->vgHandle->vgId;
  pRspObj->resIter = -1;
  memcpy(&pRspObj->rsp, &pWrapper->dataRsp, sizeof(SMqDataRsp));

  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;

  // when the response carries no schema, fall back to the schema stored with the topic
  if (!pWrapper->dataRsp.withSchema) {
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }

  // extract the rows in this data packet
  for (int32_t i = 0; i < pRspObj->rsp.blockNum; ++i) {
    SRetrieveTableRsp* pRetrieve = (SRetrieveTableRsp*)taosArrayGetP(pRspObj->rsp.blockData, i);
    int64_t            rows = htobe64(pRetrieve->numOfRows);
    pVg->numOfRows += rows;
    (*numOfRows) += rows;
  }

  return pRspObj;
}

1697
/**
 * Build the user-visible taosx (meta + data) response object from a poll response wrapper.
 *
 * @param pWrapper   poll response; its taosxRsp is copied by value (shallow copy) into the result.
 * @param pVg        vgroup whose accumulated row counter is increased by the rows in this packet.
 * @param numOfRows  out: number of rows contained in this packet (0 if allocation fails).
 * @return the new object, or NULL if it cannot be allocated.
 */
SMqTaosxRspObj* tmqBuildTaosxRspFromWrapper(SMqPollRspWrapper* pWrapper, SMqClientVg* pVg, int64_t* numOfRows) {
  // start from zero so the result does not depend on what the caller left in *numOfRows
  (*numOfRows) = 0;

  SMqTaosxRspObj* pRspObj = taosMemoryCalloc(1, sizeof(SMqTaosxRspObj));
  if (pRspObj == NULL) {
    // allocation failed: report it instead of dereferencing NULL below
    tscError("failed to allocate taosx rsp object, vgId:%d", pWrapper->vgHandle->vgId);
    return NULL;
  }

  pRspObj->resType = RES_TYPE__TMQ_METADATA;
  tstrncpy(pRspObj->topic, pWrapper->topicHandle->topicName, TSDB_TOPIC_FNAME_LEN);
  tstrncpy(pRspObj->db, pWrapper->topicHandle->db, TSDB_DB_FNAME_LEN);
  pRspObj->vgId = pWrapper->vgHandle->vgId;
  pRspObj->resIter = -1;
  memcpy(&pRspObj->rsp, &pWrapper->taosxRsp, sizeof(STaosxRsp));

  pRspObj->resInfo.totalRows = 0;
  pRspObj->resInfo.precision = TSDB_TIME_PRECISION_MILLI;

  // when the response carries no schema, fall back to the schema stored with the topic
  if (!pWrapper->taosxRsp.withSchema) {
    setResSchemaInfo(&pRspObj->resInfo, pWrapper->topicHandle->schema.pSchema, pWrapper->topicHandle->schema.nCols);
  }

  // extract the rows in this data packet
  for (int32_t i = 0; i < pRspObj->rsp.blockNum; ++i) {
    SRetrieveTableRsp* pRetrieve = (SRetrieveTableRsp*)taosArrayGetP(pRspObj->rsp.blockData, i);
    int64_t            rows = htobe64(pRetrieve->numOfRows);
    pVg->numOfRows += rows;
    (*numOfRows) += rows;
  }

  return pRspObj;
}

1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750 1751 1752 1753 1754
// Failure path used before a poll request has been sent: put the vgroup back into the
// idle state, post the consumer's response semaphore, and report failure (-1).
static int32_t handleErrorBeforePoll(SMqClientVg* pVg, tmq_t* pTmq) {
  const int32_t failed = -1;

  atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);
  tsem_post(&pTmq->rspSem);

  return failed;
}

/**
 * Serialize and asynchronously send one poll request for the given topic/vgroup.
 *
 * On any failure before the request is handed to the transport, everything allocated so far is
 * released and handleErrorBeforePoll() resets the vgroup state; its result (-1) is returned.
 *
 * @return TSDB_CODE_SUCCESS once the request has been handed to asyncSendMsgToServer().
 */
static int32_t doTmqPollImpl(tmq_t* pTmq, SMqClientTopic* pTopic, SMqClientVg* pVg, int64_t timeout) {
  SMqPollReq req = {0};
  tmqBuildConsumeReqImpl(&req, pTmq, timeout, pTopic, pVg);

  // first pass only computes the serialized size
  int32_t msgSize = tSerializeSMqPollReq(NULL, 0, &req);
  if (msgSize < 0) {
    return handleErrorBeforePoll(pVg, pTmq);
  }

  char* msg = taosMemoryCalloc(1, msgSize);
  if (NULL == msg) {
    return handleErrorBeforePoll(pVg, pTmq);
  }

  if (tSerializeSMqPollReq(msg, msgSize, &req) < 0) {
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  SMqPollCbParam* pParam = taosMemoryMalloc(sizeof(SMqPollCbParam));
  if (pParam == NULL) {
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  pParam->refId = pTmq->refId;
  pParam->epoch = pTmq->epoch;
  // the topic is identified by name and vgId rather than by pointer: pVg may be released
  // bounded copy into the inline buffer, consistent with the other topic-name copies in this file
  tstrncpy(pParam->topicName, pTopic->topicName, sizeof(pParam->topicName));
  pParam->vgId = pVg->vgId;
  pParam->requestId = req.reqId;

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(pParam);
    taosMemoryFree(msg);
    return handleErrorBeforePoll(pVg, pTmq);
  }

  sendInfo->msgInfo = (SDataBuf){.pData = msg, .len = msgSize, .handle = NULL};
  sendInfo->requestId = req.reqId;
  sendInfo->requestObjRefId = 0;
  sendInfo->param = pParam;
  sendInfo->fp = tmqPollCb;
  sendInfo->msgType = TDMT_VND_TMQ_CONSUME;

  int64_t transporterId = 0;
  char    offsetFormatBuf[TSDB_OFFSET_LEN] = {0};
  tFormatOffset(offsetFormatBuf, tListLen(offsetFormatBuf), &pVg->offsetInfo.endOffset);

  tscDebug("consumer:0x%" PRIx64 " send poll to %s vgId:%d, epoch %d, req:%s, reqId:0x%" PRIx64, pTmq->consumerId,
           pTopic->topicName, pVg->vgId, pTmq->epoch, offsetFormatBuf, req.reqId);
  asyncSendMsgToServer(pTmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, sendInfo);

  pVg->pollCnt++;
  pVg->seekUpdated = false;  // reset this flag.
  pTmq->pollCnt++;

  return TSDB_CODE_SUCCESS;
}

1790
// broadcast the poll request to all related vnodes
H
Haojun Liao 已提交
1791
static int32_t tmqPollImpl(tmq_t* tmq, int64_t timeout) {
1792 1793 1794
  if(atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__RECOVER){
    return 0;
  }
wmmhello's avatar
wmmhello 已提交
1795 1796 1797
  int32_t code = 0;

  taosWLockLatch(&tmq->lock);
1798
  int32_t numOfTopics = taosArrayGetSize(tmq->clientTopics);
X
Xiaoyu Wang 已提交
1799
  tscDebug("consumer:0x%" PRIx64 " start to poll data, numOfTopics:%d", tmq->consumerId, numOfTopics);
1800 1801

  for (int i = 0; i < numOfTopics; i++) {
X
Xiaoyu Wang 已提交
1802
    SMqClientTopic* pTopic = taosArrayGet(tmq->clientTopics, i);
X
Xiaoyu Wang 已提交
1803
    int32_t         numOfVg = taosArrayGetSize(pTopic->vgs);
1804 1805

    for (int j = 0; j < numOfVg; j++) {
X
Xiaoyu Wang 已提交
1806
      SMqClientVg* pVg = taosArrayGet(pTopic->vgs, j);
wmmhello's avatar
wmmhello 已提交
1807
      if (taosGetTimestampMs() - pVg->emptyBlockReceiveTs < EMPTY_BLOCK_POLL_IDLE_DURATION) {  // less than 10ms
1808
        tscTrace("consumer:0x%" PRIx64 " epoch %d, vgId:%d idle for 10ms before start next poll", tmq->consumerId,
X
Xiaoyu Wang 已提交
1809
                 tmq->epoch, pVg->vgId);
H
Haojun Liao 已提交
1810 1811 1812
        continue;
      }

1813
      int32_t vgStatus = atomic_val_compare_exchange_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE, TMQ_VG_STATUS__WAIT);
1814
      if (vgStatus == TMQ_VG_STATUS__WAIT) {
L
Liu Jicong 已提交
1815
        int32_t vgSkipCnt = atomic_add_fetch_32(&pVg->vgSkipCnt, 1);
1816
        tscTrace("consumer:0x%" PRIx64 " epoch %d wait poll-rsp, skip vgId:%d skip cnt %d", tmq->consumerId, tmq->epoch,
X
Xiaoyu Wang 已提交
1817
                 pVg->vgId, vgSkipCnt);
X
Xiaoyu Wang 已提交
1818 1819
        continue;
      }
1820

L
Liu Jicong 已提交
1821
      atomic_store_32(&pVg->vgSkipCnt, 0);
wmmhello's avatar
wmmhello 已提交
1822
      code = doTmqPollImpl(tmq, pTopic, pVg, timeout);
1823
      if (code != TSDB_CODE_SUCCESS) {
wmmhello's avatar
wmmhello 已提交
1824
        goto end;
D
dapan1121 已提交
1825
      }
X
Xiaoyu Wang 已提交
1826 1827
    }
  }
1828

wmmhello's avatar
wmmhello 已提交
1829 1830 1831 1832
end:
  taosWUnLockLatch(&tmq->lock);
  tscDebug("consumer:0x%" PRIx64 " end to poll data, code:%d", tmq->consumerId, code);
  return code;
X
Xiaoyu Wang 已提交
1833 1834
}

H
Haojun Liao 已提交
1835
// Handle a response that is not a poll response. Only endpoint (EP) responses are accepted:
//  - newer epoch than the consumer's: update the local endpoints, release the decoded
//    response and set *pReset to true;
//  - otherwise: free the wrapper content and set *pReset to false.
// Returns 0 for EP responses and -1 (leaving *pReset untouched) for any other type.
static int32_t tmqHandleNoPollRsp(tmq_t* tmq, SMqRspWrapper* rspWrapper, bool* pReset) {
  if (rspWrapper->tmqRspType != TMQ_MSG_TYPE__EP_RSP) {
    return -1;
  }

  if (!(rspWrapper->epoch > atomic_load_32(&tmq->epoch))) {
    // stale endpoint info, nothing to apply
    tmqFreeRspWrapper(rspWrapper);
    *pReset = false;
    return 0;
  }

  SMqAskEpRsp* pEpRsp = &((SMqAskEpRspWrapper*)rspWrapper)->msg;
  doUpdateLocalEp(tmq, rspWrapper->epoch, pEpRsp);
  tDeleteSMqAskEpRsp(pEpRsp);
  *pReset = true;
  return 0;
}

1855
// Apply the result of a poll response to the local vgroup state:
//  - unless a seek updated the offsets in the meantime, record the request/response offsets
//    as the new begin/end offsets;
//  - mark the vgroup idle again;
//  - store the WAL version range as [sver, ever + 1].
static void updateVgInfo(SMqClientVg* pVg, STqOffsetVal* reqOffset, STqOffsetVal* rspOffset, int64_t sver, int64_t ever, int64_t consumerId){
  if (pVg->seekUpdated) {
    tscDebug("consumer:0x%" PRIx64" local offset is NOT update, since seekupdate is set", consumerId);
  } else {
    tscDebug("consumer:0x%" PRIx64" local offset is update, since seekupdate not set", consumerId);
    pVg->offsetInfo.beginOffset = *reqOffset;
    pVg->offsetInfo.endOffset = *rspOffset;
  }

  // update the status
  atomic_store_32(&pVg->vgStatus, TMQ_VG_STATUS__IDLE);

  // update the valid wal version range
  pVg->offsetInfo.walVerBegin = sver;
  pVg->offsetInfo.walVerEnd = ever + 1;
}

H
Haojun Liao 已提交
1873
static void* tmqHandleAllRsp(tmq_t* tmq, int64_t timeout, bool pollIfReset) {
H
Haojun Liao 已提交
1874
  tscDebug("consumer:0x%" PRIx64 " start to handle the rsp, total:%d", tmq->consumerId, tmq->qall->numOfItems);
1875

X
Xiaoyu Wang 已提交
1876
  while (1) {
1877 1878
    SMqRspWrapper* pRspWrapper = NULL;
    taosGetQitem(tmq->qall, (void**)&pRspWrapper);
1879

1880
    if (pRspWrapper == NULL) {
L
Liu Jicong 已提交
1881
      taosReadAllQitems(tmq->mqueue, tmq->qall);
1882 1883
      taosGetQitem(tmq->qall, (void**)&pRspWrapper);
      if (pRspWrapper == NULL) {
L
Liu Jicong 已提交
1884 1885
        return NULL;
      }
X
Xiaoyu Wang 已提交
1886 1887
    }

X
Xiaoyu Wang 已提交
1888
    tscDebug("consumer:0x%" PRIx64 " handle rsp, type:%d", tmq->consumerId, pRspWrapper->tmqRspType);
H
Haojun Liao 已提交
1889

1890 1891
    if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__END_RSP) {
      taosFreeQitem(pRspWrapper);
L
Liu Jicong 已提交
1892
      terrno = TSDB_CODE_TQ_NO_COMMITTED_OFFSET;
H
Haojun Liao 已提交
1893
      tscError("consumer:0x%" PRIx64 " unexpected rsp from poll, code:%s", tmq->consumerId, tstrerror(terrno));
L
Liu Jicong 已提交
1894
      return NULL;
1895 1896
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
H
Haojun Liao 已提交
1897

X
Xiaoyu Wang 已提交
1898
      int32_t     consumerEpoch = atomic_load_32(&tmq->epoch);
1899 1900 1901
      SMqDataRsp* pDataRsp = &pollRspWrapper->dataRsp;

      if (pDataRsp->head.epoch == consumerEpoch) {
wmmhello's avatar
wmmhello 已提交
1902
        taosWLockLatch(&tmq->lock);
wmmhello's avatar
wmmhello 已提交
1903 1904 1905 1906 1907 1908
        SMqClientVg* pVg = getVgInfo(tmq, pollRspWrapper->topicName, pollRspWrapper->vgId);
        pollRspWrapper->vgHandle = pVg;
        pollRspWrapper->topicHandle = getTopicInfo(tmq, pollRspWrapper->topicName);
        if(pollRspWrapper->vgHandle == NULL || pollRspWrapper->topicHandle == NULL){
          tscError("consumer:0x%" PRIx64 " get vg or topic error, topic:%s vgId:%d", tmq->consumerId,
                   pollRspWrapper->topicName, pollRspWrapper->vgId);
wmmhello's avatar
wmmhello 已提交
1909
          taosWUnLockLatch(&tmq->lock);
wmmhello's avatar
wmmhello 已提交
1910 1911
          return NULL;
        }
1912 1913 1914 1915
        // update the epset
        if (pollRspWrapper->pEpset != NULL) {
          SEp* pEp = GET_ACTIVE_EP(pollRspWrapper->pEpset);
          SEp* pOld = GET_ACTIVE_EP(&(pVg->epSet));
X
Xiaoyu Wang 已提交
1916 1917
          tscDebug("consumer:0x%" PRIx64 " update epset vgId:%d, ep:%s:%d, old ep:%s:%d", tmq->consumerId, pVg->vgId,
                   pEp->fqdn, pEp->port, pOld->fqdn, pOld->port);
1918 1919 1920
          pVg->epSet = *pollRspWrapper->pEpset;
        }

1921
        updateVgInfo(pVg, &pDataRsp->reqOffset, &pDataRsp->rspOffset, pDataRsp->head.walsver, pDataRsp->head.walever, tmq->consumerId);
1922

wmmhello's avatar
wmmhello 已提交
1923
        char buf[TSDB_OFFSET_LEN] = {0};
1924
        tFormatOffset(buf, TSDB_OFFSET_LEN, &pDataRsp->rspOffset);
1925
        if (pDataRsp->blockNum == 0) {
X
Xiaoyu Wang 已提交
1926
          tscDebug("consumer:0x%" PRIx64 " empty block received, vgId:%d, offset:%s, vg total:%" PRId64
wmmhello's avatar
wmmhello 已提交
1927
                   ", total:%" PRId64 ", reqId:0x%" PRIx64,
X
Xiaoyu Wang 已提交
1928
                   tmq->consumerId, pVg->vgId, buf, pVg->numOfRows, tmq->totalRows, pollRspWrapper->reqId);
1929
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
1930
          pVg->emptyBlockReceiveTs = taosGetTimestampMs();
L
Liu Jicong 已提交
1931
          taosFreeQitem(pollRspWrapper);
1932
        } else {  // build rsp
X
Xiaoyu Wang 已提交
1933
          int64_t    numOfRows = 0;
1934
          SMqRspObj* pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
H
Haojun Liao 已提交
1935
          tmq->totalRows += numOfRows;
1936
          pVg->emptyBlockReceiveTs = 0;
H
Haojun Liao 已提交
1937
          tscDebug("consumer:0x%" PRIx64 " process poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
wmmhello's avatar
wmmhello 已提交
1938
                   ", vg total:%" PRId64 ", total:%" PRId64 ", reqId:0x%" PRIx64,
H
Haojun Liao 已提交
1939
                   tmq->consumerId, pVg->vgId, buf, pDataRsp->blockNum, numOfRows, pVg->numOfRows, tmq->totalRows,
H
Haojun Liao 已提交
1940
                   pollRspWrapper->reqId);
1941
          taosFreeQitem(pollRspWrapper);
wmmhello's avatar
wmmhello 已提交
1942
          taosWUnLockLatch(&tmq->lock);
1943 1944
          return pRsp;
        }
wmmhello's avatar
wmmhello 已提交
1945
        taosWUnLockLatch(&tmq->lock);
X
Xiaoyu Wang 已提交
1946
      } else {
H
Haojun Liao 已提交
1947
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
1948
                 tmq->consumerId, pollRspWrapper->vgId, pDataRsp->head.epoch, consumerEpoch);
1949
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
L
Liu Jicong 已提交
1950 1951
        taosFreeQitem(pollRspWrapper);
      }
1952
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__POLL_META_RSP) {
1953
      // todo handle the wal range and epset for each vgroup
1954
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
L
Liu Jicong 已提交
1955
      int32_t            consumerEpoch = atomic_load_32(&tmq->epoch);
1956 1957 1958

      tscDebug("consumer:0x%" PRIx64 " process meta rsp", tmq->consumerId);

L
Liu Jicong 已提交
1959
      if (pollRspWrapper->metaRsp.head.epoch == consumerEpoch) {
wmmhello's avatar
wmmhello 已提交
1960
        taosWLockLatch(&tmq->lock);
wmmhello's avatar
wmmhello 已提交
1961 1962 1963 1964 1965 1966
        SMqClientVg* pVg = getVgInfo(tmq, pollRspWrapper->topicName, pollRspWrapper->vgId);
        pollRspWrapper->vgHandle = pVg;
        pollRspWrapper->topicHandle = getTopicInfo(tmq, pollRspWrapper->topicName);
        if(pollRspWrapper->vgHandle == NULL || pollRspWrapper->topicHandle == NULL){
          tscError("consumer:0x%" PRIx64 " get vg or topic error, topic:%s vgId:%d", tmq->consumerId,
                   pollRspWrapper->topicName, pollRspWrapper->vgId);
wmmhello's avatar
wmmhello 已提交
1967
          taosWUnLockLatch(&tmq->lock);
wmmhello's avatar
wmmhello 已提交
1968 1969
          return NULL;
        }
H
Haojun Liao 已提交
1970

1971
        updateVgInfo(pVg, &pollRspWrapper->metaRsp.rspOffset, &pollRspWrapper->metaRsp.rspOffset, pollRspWrapper->metaRsp.head.walsver, pollRspWrapper->metaRsp.head.walever, tmq->consumerId);
L
Liu Jicong 已提交
1972
        // build rsp
L
Liu Jicong 已提交
1973
        SMqMetaRspObj* pRsp = tmqBuildMetaRspFromWrapper(pollRspWrapper);
L
Liu Jicong 已提交
1974
        taosFreeQitem(pollRspWrapper);
wmmhello's avatar
wmmhello 已提交
1975
        taosWUnLockLatch(&tmq->lock);
L
Liu Jicong 已提交
1976 1977
        return pRsp;
      } else {
H
Haojun Liao 已提交
1978
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
1979
                 tmq->consumerId, pollRspWrapper->vgId, pollRspWrapper->metaRsp.head.epoch, consumerEpoch);
1980
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
L
Liu Jicong 已提交
1981
        taosFreeQitem(pollRspWrapper);
X
Xiaoyu Wang 已提交
1982
      }
1983 1984
    } else if (pRspWrapper->tmqRspType == TMQ_MSG_TYPE__TAOSX_RSP) {
      SMqPollRspWrapper* pollRspWrapper = (SMqPollRspWrapper*)pRspWrapper;
X
Xiaoyu Wang 已提交
1985
      int32_t            consumerEpoch = atomic_load_32(&tmq->epoch);
H
Haojun Liao 已提交
1986

L
Liu Jicong 已提交
1987
      if (pollRspWrapper->taosxRsp.head.epoch == consumerEpoch) {
wmmhello's avatar
wmmhello 已提交
1988
        taosWLockLatch(&tmq->lock);
wmmhello's avatar
wmmhello 已提交
1989 1990 1991 1992 1993 1994
        SMqClientVg* pVg = getVgInfo(tmq, pollRspWrapper->topicName, pollRspWrapper->vgId);
        pollRspWrapper->vgHandle = pVg;
        pollRspWrapper->topicHandle = getTopicInfo(tmq, pollRspWrapper->topicName);
        if(pollRspWrapper->vgHandle == NULL || pollRspWrapper->topicHandle == NULL){
          tscError("consumer:0x%" PRIx64 " get vg or topic error, topic:%s vgId:%d", tmq->consumerId,
                   pollRspWrapper->topicName, pollRspWrapper->vgId);
wmmhello's avatar
wmmhello 已提交
1995
          taosWUnLockLatch(&tmq->lock);
wmmhello's avatar
wmmhello 已提交
1996 1997
          return NULL;
        }
H
Haojun Liao 已提交
1998

1999
        updateVgInfo(pVg, &pollRspWrapper->taosxRsp.reqOffset, &pollRspWrapper->taosxRsp.rspOffset, pollRspWrapper->taosxRsp.head.walsver, pollRspWrapper->taosxRsp.head.walever, tmq->consumerId);
H
Haojun Liao 已提交
2000

L
Liu Jicong 已提交
2001
        if (pollRspWrapper->taosxRsp.blockNum == 0) {
wmmhello's avatar
wmmhello 已提交
2002
          tscDebug("consumer:0x%" PRIx64 " taosx empty block received, vgId:%d, vg total:%" PRId64 ", reqId:0x%" PRIx64,
H
Haojun Liao 已提交
2003
                   tmq->consumerId, pVg->vgId, pVg->numOfRows, pollRspWrapper->reqId);
H
Haojun Liao 已提交
2004
          pVg->emptyBlockReceiveTs = taosGetTimestampMs();
2005
          pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
H
Haojun Liao 已提交
2006
          taosFreeQitem(pollRspWrapper);
H
Haojun Liao 已提交
2007
        } else {
X
Xiaoyu Wang 已提交
2008
          pVg->emptyBlockReceiveTs = 0;  // reset the ts
wmmhello's avatar
wmmhello 已提交
2009 2010 2011 2012 2013 2014 2015 2016
          // build rsp
          void*   pRsp = NULL;
          int64_t numOfRows = 0;
          if (pollRspWrapper->taosxRsp.createTableNum == 0) {
            pRsp = tmqBuildRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
          } else {
            pRsp = tmqBuildTaosxRspFromWrapper(pollRspWrapper, pVg, &numOfRows);
          }
2017

wmmhello's avatar
wmmhello 已提交
2018
          tmq->totalRows += numOfRows;
H
Haojun Liao 已提交
2019

wmmhello's avatar
wmmhello 已提交
2020
          char buf[TSDB_OFFSET_LEN] = {0};
2021
          tFormatOffset(buf, TSDB_OFFSET_LEN, &pVg->offsetInfo.endOffset);
wmmhello's avatar
wmmhello 已提交
2022 2023 2024 2025
          tscDebug("consumer:0x%" PRIx64 " process taosx poll rsp, vgId:%d, offset:%s, blocks:%d, rows:%" PRId64
                       ", vg total:%" PRId64 ", total:%" PRId64 ", reqId:0x%" PRIx64,
                   tmq->consumerId, pVg->vgId, buf, pollRspWrapper->dataRsp.blockNum, numOfRows, pVg->numOfRows,
                   tmq->totalRows, pollRspWrapper->reqId);
H
Haojun Liao 已提交
2026

wmmhello's avatar
wmmhello 已提交
2027 2028 2029 2030 2031
          taosFreeQitem(pollRspWrapper);
          taosWUnLockLatch(&tmq->lock);
          return pRsp;
        }
        taosWUnLockLatch(&tmq->lock);
L
Liu Jicong 已提交
2032
      } else {
H
Haojun Liao 已提交
2033
        tscDebug("consumer:0x%" PRIx64 " vgId:%d msg discard since epoch mismatch: msg epoch %d, consumer epoch %d",
2034
                 tmq->consumerId, pollRspWrapper->vgId, pollRspWrapper->taosxRsp.head.epoch, consumerEpoch);
2035
        pRspWrapper = tmqFreeRspWrapper(pRspWrapper);
L
Liu Jicong 已提交
2036 2037
        taosFreeQitem(pollRspWrapper);
      }
X
Xiaoyu Wang 已提交
2038
    } else {
H
Haojun Liao 已提交
2039 2040
      tscDebug("consumer:0x%" PRIx64 " not data msg received", tmq->consumerId);

X
Xiaoyu Wang 已提交
2041
      bool reset = false;
2042 2043
      tmqHandleNoPollRsp(tmq, pRspWrapper, &reset);
      taosFreeQitem(pRspWrapper);
X
Xiaoyu Wang 已提交
2044
      if (pollIfReset && reset) {
2045
        tscDebug("consumer:0x%" PRIx64 ", reset and repoll", tmq->consumerId);
2046
        tmqPollImpl(tmq, timeout);
X
Xiaoyu Wang 已提交
2047 2048 2049 2050 2051
      }
    }
  }
}

2052
/**
 * Poll the consumer for the next response.
 *
 * @param tmq      consumer handle; NULL yields NULL.
 * @param timeout  maximum time to wait in milliseconds; a negative value waits until a
 *                 response arrives (re-checking every 1000 ms).
 * @return the next response, or NULL when the handle is NULL, the consumer is still in the
 *         init state, recovery does not finish within the retry budget, an END response is
 *         seen, or the timeout elapses.
 */
TAOS_RES* tmq_consumer_poll(tmq_t* tmq, int64_t timeout) {
  // guard the public entry point against a NULL handle instead of crashing on the first access
  if (tmq == NULL) {
    return NULL;
  }

  void*   rspObj = NULL;
  int64_t startTime = taosGetTimestampMs();

  tscInfo("consumer:0x%" PRIx64 " start to poll at %" PRId64 ", timeout:%" PRId64, tmq->consumerId, startTime,
          timeout);

  // in no topic status, delayed task also need to be processed
  if (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__INIT) {
    tscInfo("consumer:0x%" PRIx64 " poll return since consumer is init", tmq->consumerId);
    taosMsleep(500);  //     sleep for a while
    return NULL;
  }

  // while recovering, keep asking for endpoints until the server reports the consumer as ready
  while (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__RECOVER) {
    int32_t retryCnt = 0;
    while (TSDB_CODE_MND_CONSUMER_NOT_READY == doAskEp(tmq)) {
      if (retryCnt++ > 40) {
        return NULL;
      }

      tscInfo("consumer:0x%" PRIx64 " not ready, retry:%d/40 in 500ms", tmq->consumerId, retryCnt);
      taosMsleep(500);
    }
  }

  while (1) {
    tmqHandleAllDelayedTask(tmq);

    // a failed send is only logged; queued responses are still processed below
    if (tmqPollImpl(tmq, timeout) < 0) {
      tscError("consumer:0x%" PRIx64 " return due to poll error", tmq->consumerId);
    }

    rspObj = tmqHandleAllRsp(tmq, timeout, false);
    if (rspObj) {
      tscDebug("consumer:0x%" PRIx64 " return rsp %p", tmq->consumerId, rspObj);
      return (TAOS_RES*)rspObj;
    } else if (terrno == TSDB_CODE_TQ_NO_COMMITTED_OFFSET) {
      // NOTE(review): terrno is not cleared before tmqHandleAllRsp(), so a value left over from
      // an earlier call would also take this branch - confirm whether that is intended.
      tscInfo("consumer:0x%" PRIx64 " return null since no committed offset", tmq->consumerId);
      return NULL;
    }

    if (timeout >= 0) {
      int64_t currentTime = taosGetTimestampMs();
      int64_t elapsedTime = currentTime - startTime;
      if (elapsedTime > timeout) {
        tscInfo("consumer:0x%" PRIx64 " (epoch %d) timeout, no rsp, start time %" PRId64 ", current time %" PRId64,
                tmq->consumerId, tmq->epoch, startTime, currentTime);
        return NULL;
      }
      // wait for the remaining time budget or until a response is signalled
      tsem_timewait(&tmq->rspSem, (timeout - elapsedTime));
    } else {
      // use tsem_timewait instead of tsem_wait to avoid unexpected stuck
      tsem_timewait(&tmq->rspSem, 1000);
    }
  }
}

wmmhello's avatar
wmmhello 已提交
2110 2111
// Log the consumer's totals (poll count, rows, topics, epoch) followed by the number of rows
// received from every vgroup of every subscribed topic. The topic list is read under the
// consumer's read lock.
static void displayConsumeStatistics(tmq_t* pTmq) {
  taosRLockLatch(&pTmq->lock);

  int32_t topicCnt = taosArrayGetSize(pTmq->clientTopics);
  tscDebug("consumer:0x%" PRIx64 " closing poll:%" PRId64 " rows:%" PRId64 " topics:%d, final epoch:%d",
           pTmq->consumerId, pTmq->pollCnt, pTmq->totalRows, topicCnt, pTmq->epoch);

  tscDebug("consumer:0x%" PRIx64 " rows dist begin: ", pTmq->consumerId);
  for (int32_t topicIdx = 0; topicIdx < topicCnt; ++topicIdx) {
    SMqClientTopic* pTopic = taosArrayGet(pTmq->clientTopics, topicIdx);

    tscDebug("consumer:0x%" PRIx64 " topic:%d", pTmq->consumerId, topicIdx);

    int32_t vgCnt = taosArrayGetSize(pTopic->vgs);
    for (int32_t vgIdx = 0; vgIdx < vgCnt; ++vgIdx) {
      SMqClientVg* pVgroup = taosArrayGet(pTopic->vgs, vgIdx);
      tscDebug("topic:%s, %d. vgId:%d rows:%" PRId64, pTopic->topicName, vgIdx, pVgroup->vgId, pVgroup->numOfRows);
    }
  }

  taosRUnLockLatch(&pTmq->lock);
  tscDebug("consumer:0x%" PRIx64 " rows dist end", pTmq->consumerId);
}
2130

2131
/**
 * Close a consumer.
 *
 * When the consumer is in the ready state: commit synchronously if auto commit is enabled,
 * wait 2s, then subscribe to an empty topic list (retried while the server reports "not
 * ready"). In every state the consumer reference is removed at the end.
 *
 * @param tmq  consumer handle.
 * @return 0 on success, -1 when `tmq` is NULL, or the error returned by the synchronous commit
 *         (in which case the consumer is left open).
 */
int32_t tmq_consumer_close(tmq_t* tmq) {
  // guard the public entry point against a NULL handle instead of crashing on the first access
  if (tmq == NULL) {
    return -1;
  }

  tscInfo("consumer:0x%" PRIx64 " start to close consumer, status:%d", tmq->consumerId,
          atomic_load_8(&tmq->status));
  displayConsumeStatistics(tmq);

  // status is read atomically, like the other readers of tmq->status in this file
  if (atomic_load_8(&tmq->status) == TMQ_CONSUMER_STATUS__READY) {
    // if auto commit is set, commit before close consumer. Otherwise, do nothing.
    if (tmq->autoCommit) {
      int32_t rsp = tmq_commit_sync(tmq, NULL);
      if (rsp != 0) {
        return rsp;
      }
    }
    taosSsleep(2);  // sleep 2s for hb to send offset and rows to server

    // subscribing to an empty list; retried while the server is not ready
    int32_t     retryCnt = 0;
    tmq_list_t* lst = tmq_list_new();
    while (1) {
      int32_t rsp = tmq_subscribe(tmq, lst);
      if (rsp != TSDB_CODE_MND_CONSUMER_NOT_READY || retryCnt > 5) {
        break;
      } else {
        retryCnt++;
        taosMsleep(500);
      }
    }

    tmq_list_destroy(lst);
  } else {
    tscInfo("consumer:0x%" PRIx64 " not in ready state, close it directly", tmq->consumerId);
  }

  taosRemoveRef(tmqMgmt.rsetId, tmq->refId);
  return 0;
}
L
Liu Jicong 已提交
2165

L
Liu Jicong 已提交
2166 2167
// Translate a tmq result code into text: 0 -> "success", -1 -> "fail",
// anything else is delegated to tstrerror().
const char* tmq_err2str(int32_t err) {
  switch (err) {
    case 0:
      return "success";
    case -1:
      return "fail";
    default:
      return tstrerror(err);
  }
}
L
Liu Jicong 已提交
2175

L
Liu Jicong 已提交
2176 2177 2178 2179 2180
// Classify a result object as data, table meta or metadata; any other object is reported
// as TMQ_RES_INVALID.
tmq_res_t tmq_get_res_type(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    return TMQ_RES_DATA;
  }
  if (TD_RES_TMQ_META(res)) {
    return TMQ_RES_TABLE_META;
  }
  if (TD_RES_TMQ_METADATA(res)) {
    return TMQ_RES_METADATA;
  }
  return TMQ_RES_INVALID;
}

L
Liu Jicong 已提交
2188
const char* tmq_get_topic_name(TAOS_RES* res) {
L
Liu Jicong 已提交
2189 2190
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pRspObj = (SMqRspObj*)res;
L
Liu Jicong 已提交
2191
    return strchr(pRspObj->topic, '.') + 1;
L
Liu Jicong 已提交
2192 2193 2194
  } else if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMetaRspObj = (SMqMetaRspObj*)res;
    return strchr(pMetaRspObj->topic, '.') + 1;
2195 2196 2197
  } else if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pRspObj = (SMqTaosxRspObj*)res;
    return strchr(pRspObj->topic, '.') + 1;
L
Liu Jicong 已提交
2198 2199 2200 2201 2202
  } else {
    return NULL;
  }
}

L
Liu Jicong 已提交
2203 2204 2205 2206
// Return the database name of a TMQ result with everything up to and including the first
// '.' stripped off.
// Returns NULL when res is NULL, when res is not a data/meta/metadata result, or when the
// stored db name contains no '.' separator.
// The returned pointer refers into the result object's own db buffer.
const char* tmq_get_db_name(TAOS_RES* res) {
  if (res == NULL) {
    return NULL;
  }

  const char* fullName = NULL;
  if (TD_RES_TMQ(res)) {
    fullName = ((SMqRspObj*)res)->db;
  } else if (TD_RES_TMQ_META(res)) {
    fullName = ((SMqMetaRspObj*)res)->db;
  } else if (TD_RES_TMQ_METADATA(res)) {
    fullName = ((SMqTaosxRspObj*)res)->db;
  } else {
    return NULL;
  }

  // strchr() yields NULL when no '.' is present; adding 1 to that would hand the caller
  // an invalid pointer, so the lookup result is checked first.
  const char* dot = strchr(fullName, '.');
  if (dot == NULL) {
    return NULL;
  }
  return dot + 1;
}

L
Liu Jicong 已提交
2218 2219 2220 2221
// Return the vgroup id stored in a TMQ result (data, meta or metadata).
// Returns -1 when res matches none of the three result kinds.
int32_t tmq_get_vgroup_id(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    return ((SMqRspObj*)res)->vgId;
  }
  if (TD_RES_TMQ_META(res)) {
    return ((SMqMetaRspObj*)res)->vgId;
  }
  if (TD_RES_TMQ_METADATA(res)) {
    return ((SMqTaosxRspObj*)res)->vgId;
  }
  return -1;
}
L
Liu Jicong 已提交
2232

2233 2234 2235
// Return the WAL version attached to a TMQ result.
//   - data result:     rsp.reqOffset.version, if the offset type is TMQ_OFFSET__LOG
//   - meta result:     metaRsp.rspOffset.version, if the offset type is TMQ_OFFSET__LOG
//   - metadata result: rsp.reqOffset.version, if the offset type is TMQ_OFFSET__LOG
// Every other case returns -1; a data result with a non-log offset and an unrecognised
// result kind are additionally logged as errors.
int64_t tmq_get_vgroup_offset(TAOS_RES* res) {
  // data from tsdb, no valid offset info
  const int64_t noOffset = -1;

  if (TD_RES_TMQ(res)) {
    SMqRspObj*    pData = (SMqRspObj*)res;
    STqOffsetVal* pReqOffset = &pData->rsp.reqOffset;
    if (pReqOffset->type != TMQ_OFFSET__LOG) {
      tscError("invalid offset type:%d", pReqOffset->type);
      return noOffset;
    }
    return pReqOffset->version;
  }

  if (TD_RES_TMQ_META(res)) {
    SMqMetaRspObj* pMeta = (SMqMetaRspObj*)res;
    return (pMeta->metaRsp.rspOffset.type == TMQ_OFFSET__LOG) ? pMeta->metaRsp.rspOffset.version : noOffset;
  }

  if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pTaosx = (SMqTaosxRspObj*)res;
    return (pTaosx->rsp.reqOffset.type == TMQ_OFFSET__LOG) ? pTaosx->rsp.reqOffset.version : noOffset;
  }

  tscError("invalid tmq type:%d", *(int8_t*)res);
  return noOffset;
}

L
Liu Jicong 已提交
2260 2261 2262 2263 2264 2265 2266
// Return the table name of the block the result iterator (resIter) currently points at.
// Only data and metadata results are handled. NULL is returned when the response carries
// no table names, when blockTbName is NULL, when resIter is outside [0, blockNum), or
// when res is any other kind of result.
const char* tmq_get_table_name(TAOS_RES* res) {
  if (TD_RES_TMQ(res)) {
    SMqRspObj* pData = (SMqRspObj*)res;
    bool       hasNames = pData->rsp.withTbName && pData->rsp.blockTbName != NULL;
    bool       inRange = pData->resIter >= 0 && pData->resIter < pData->rsp.blockNum;
    if (hasNames && inRange) {
      return (const char*)taosArrayGetP(pData->rsp.blockTbName, pData->resIter);
    }
    return NULL;
  }

  if (TD_RES_TMQ_METADATA(res)) {
    SMqTaosxRspObj* pTaosx = (SMqTaosxRspObj*)res;
    bool            hasNames = pTaosx->rsp.withTbName && pTaosx->rsp.blockTbName != NULL;
    bool            inRange = pTaosx->resIter >= 0 && pTaosx->resIter < pTaosx->rsp.blockNum;
    if (hasNames && inRange) {
      return (const char*)taosArrayGetP(pTaosx->rsp.blockTbName, pTaosx->resIter);
    }
    return NULL;
  }

  return NULL;
}
2278

2279 2280 2281 2282
// Start an asynchronous commit; cb is forwarded together with param to the commit routine.
// With a result handle only the offset of that result is committed; with pRes == NULL
// all offsets are committed.
void tmq_commit_async(tmq_t* tmq, const TAOS_RES* pRes, tmq_commit_cb* cb, void* param) {
  if (pRes != NULL) {
    // only commit one offset
    asyncCommitFromResult(tmq, pRes, cb, param);
    return;
  }

  // here needs to commit all offsets.
  asyncCommitAllOffsets(tmq, cb, param);
}

2287
// Commit callback used by the synchronous commit paths: stores the result code in the
// SSyncCommitInfo passed as param and posts its semaphore.
static void commitCallBackFn(tmq_t *UNUSED_PARAM(tmq), int32_t code, void* param) {
  SSyncCommitInfo* pSync = param;

  pSync->code = code;
  tsem_post(&pSync->sem);
}
2292

2293 2294 2295 2296 2297 2298 2299 2300 2301
// Commit offsets and block until the commit callback has fired.
// With pRes == NULL all offsets are committed, otherwise only the offset of pRes.
// Returns TSDB_CODE_INVALID_PARA for a NULL consumer, TSDB_CODE_OUT_OF_MEMORY when the
// wait context cannot be allocated, otherwise the code delivered to the commit callback.
int32_t tmq_commit_sync(tmq_t* tmq, const TAOS_RES* pRes) {
  if (tmq == NULL) {
    tscError("invalid tmq handle, null");
    return TSDB_CODE_INVALID_PARA;
  }

  SSyncCommitInfo* pInfo = taosMemoryMalloc(sizeof(SSyncCommitInfo));
  if (pInfo == NULL) {
    // the semaphore lives inside pInfo, so nothing can be waited on without it
    tscError("consumer:0x%" PRIx64 " failed to prepare sync commit operation", tmq->consumerId);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  tsem_init(&pInfo->sem, 0, 0);
  pInfo->code = 0;

  if (pRes == NULL) {
    asyncCommitAllOffsets(tmq, commitCallBackFn, pInfo);
  } else {
    asyncCommitFromResult(tmq, pRes, commitCallBackFn, pInfo);
  }

  // commitCallBackFn stores the result code and posts the semaphore
  tsem_wait(&pInfo->sem);
  int32_t code = pInfo->code;

  tsem_destroy(&pInfo->sem);
  taosMemoryFree(pInfo);

  tscDebug("consumer:0x%" PRIx64 " sync commit done, code:%s", tmq->consumerId, tstrerror(code));
  return code;
}

2316 2317 2318 2319 2320 2321 2322 2323 2324 2325 2326 2327 2328 2329 2330 2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344 2345 2346 2347 2348 2349 2350 2351 2352 2353 2354 2355 2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396
// Reports whether both WAL bounds of the offset info are set, i.e. neither walVerBegin
// nor walVerEnd is -1. The wal range will be ok after calling tmq_get_topic_assignment
// or the poll interface.
static bool isWalRangeOk(SVgOffsetInfo* offset){
  return offset->walVerBegin != -1 && offset->walVerEnd != -1;
}

// Synchronously commit an explicit WAL offset for one vgroup of a subscribed topic.
//
// The topic is looked up under the name "<acctId>.<pTopicName>". The offset must lie inside
// the vgroup's known WAL range [walVerBegin, walVerEnd]; that range has to have been filled
// in beforehand (see isWalRangeOk).
//
// Returns:
//   TSDB_CODE_INVALID_PARA              tmq or pTopicName is NULL
//   TSDB_CODE_TMQ_INVALID_TOPIC         topic unknown (or its full name does not fit the buffer)
//   TSDB_CODE_TMQ_INVALID_VGID          vgId does not belong to the topic
//   TSDB_CODE_TMQ_NEED_INITIALIZED      WAL range not yet known
//   TSDB_CODE_TMQ_VERSION_OUT_OF_RANGE  offset outside the WAL range
//   TSDB_CODE_OUT_OF_MEMORY             wait context could not be allocated
//   otherwise the code delivered to the commit callback
int32_t tmq_commit_offset_sync(tmq_t *tmq, const char *pTopicName, int32_t vgId, int64_t offset){
  if (tmq == NULL || pTopicName == NULL) {
    tscError("invalid tmq handle, null");
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t accId = tmq->pTscObj->acctId;
  char    tname[TSDB_TOPIC_FNAME_LEN] = {0};
  // bounded formatting: pTopicName comes from the caller and may be longer than the buffer
  int32_t len = snprintf(tname, sizeof(tname), "%d.%s", accId, pTopicName);
  if (len < 0 || len >= (int32_t)sizeof(tname)) {
    tscError("consumer:0x%" PRIx64 " invalid topic name:%s", tmq->consumerId, pTopicName);
    return TSDB_CODE_TMQ_INVALID_TOPIC;
  }

  taosWLockLatch(&tmq->lock);
  SMqClientTopic* pTopic = getTopicByName(tmq, tname);
  if (pTopic == NULL) {
    tscError("consumer:0x%" PRIx64 " invalid topic name:%s", tmq->consumerId, pTopicName);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_INVALID_TOPIC;
  }

  SMqClientVg* pVg = NULL;
  int32_t      numOfVgs = taosArrayGetSize(pTopic->vgs);
  for (int32_t i = 0; i < numOfVgs; ++i) {
    SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, i);
    if (pClientVg->vgId == vgId) {
      pVg = pClientVg;
      break;
    }
  }

  if (pVg == NULL) {
    tscError("consumer:0x%" PRIx64 " invalid vgroup id:%d", tmq->consumerId, vgId);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_INVALID_VGID;
  }

  SVgOffsetInfo* pOffsetInfo = &pVg->offsetInfo;
  if (!isWalRangeOk(pOffsetInfo)) {
    tscError("consumer:0x%" PRIx64 " Assignment or poll interface need to be called first", tmq->consumerId);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_NEED_INITIALIZED;
  }

  if (offset < pOffsetInfo->walVerBegin || offset > pOffsetInfo->walVerEnd) {
    tscError("consumer:0x%" PRIx64 " invalid commit params, offset:%" PRId64 ", valid range:[%" PRId64 ", %" PRId64 "]",
             tmq->consumerId, offset, pOffsetInfo->walVerBegin, pOffsetInfo->walVerEnd);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_VERSION_OUT_OF_RANGE;
  }
  // validation is done; the latch is released before blocking on the commit below
  taosWUnLockLatch(&tmq->lock);

  STqOffsetVal offsetVal = {.type = TMQ_OFFSET__LOG, .version = offset};

  SSyncCommitInfo* pInfo = taosMemoryMalloc(sizeof(SSyncCommitInfo));
  if (pInfo == NULL) {
    tscError("consumer:0x%"PRIx64" failed to prepare commit operation", tmq->consumerId);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  tsem_init(&pInfo->sem, 0, 0);
  pInfo->code = 0;

  asyncCommitOffset(tmq, tname, vgId, &offsetVal, commitCallBackFn, pInfo);

  // commitCallBackFn stores the result code and posts the semaphore
  tsem_wait(&pInfo->sem);
  int32_t code = pInfo->code;

  tsem_destroy(&pInfo->sem);
  taosMemoryFree(pInfo);

  tscInfo("consumer:0x%" PRIx64 " sync commit to vgId:%d, offset:%" PRId64" code:%s", tmq->consumerId, vgId, offset, tstrerror(code));

  return code;
}

2397 2398 2399 2400 2401 2402 2403 2404 2405
// Ask-ep callback used by the blocking path: records the result code in the SAskEpInfo
// passed as param, applies a successful response via doUpdateLocalEp(), and finally posts
// the semaphore inside that SAskEpInfo.
void updateEpCallbackFn(tmq_t* pTmq, int32_t code, SDataBuf* pDataBuf, void* param) {
  SAskEpInfo* pAskInfo = (SAskEpInfo*)param;
  pAskInfo->code = code;

  if (code != TSDB_CODE_SUCCESS) {
    tsem_post(&pAskInfo->sem);
    return;
  }

  // the buffer starts with an SMqRspHead, followed by the encoded SMqAskEpRsp
  SMqRspHead* pHead = pDataBuf->pData;

  SMqAskEpRsp epRsp;
  tDecodeSMqAskEpRsp(POINTER_SHIFT(pDataBuf->pData, sizeof(SMqRspHead)), &epRsp);
  doUpdateLocalEp(pTmq, pHead->epoch, &epRsp);
  tDeleteSMqAskEpRsp(&epRsp);

  tsem_post(&pAskInfo->sem);
}

// Ask-ep callback for the non-blocking path: wraps a successful response in an
// SMqAskEpRspWrapper queue item and writes it to pTmq->mqueue.
// On a failure code, or when the queue item cannot be allocated, only terrno is set.
void addToQueueCallbackFn(tmq_t* pTmq, int32_t code, SDataBuf* pDataBuf, void* param) {
  if (code != TSDB_CODE_SUCCESS) {
    terrno = code;
    return;
  }

  SMqAskEpRspWrapper* pItem = taosAllocateQitem(sizeof(SMqAskEpRspWrapper), DEF_QITEM, 0);
  if (NULL == pItem) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return;
  }

  void*       pRaw = pDataBuf->pData;
  SMqRspHead* pHead = pRaw;

  pItem->tmqRspType = TMQ_MSG_TYPE__EP_RSP;
  pItem->epoch = pHead->epoch;

  // NOTE(review): the response head is copied into msg and msg is then decoded into;
  // kept exactly as in the original - confirm the copy is still needed.
  memcpy(&pItem->msg, pRaw, sizeof(SMqRspHead));
  tDecodeSMqAskEpRsp(POINTER_SHIFT(pRaw, sizeof(SMqRspHead)), &pItem->msg);

  taosWriteQitem(pTmq->mqueue, pItem);
}

// Ask for the endpoint set and block until updateEpCallbackFn has processed the answer.
// Returns TSDB_CODE_OUT_OF_MEMORY when the wait context cannot be allocated, otherwise
// the code that updateEpCallbackFn stored.
int32_t doAskEp(tmq_t* pTmq) {
  SAskEpInfo* pInfo = taosMemoryMalloc(sizeof(SAskEpInfo));
  if (pInfo == NULL) {
    // the semaphore lives inside pInfo, so nothing can be waited on without it
    tscError("consumer:0x%" PRIx64 ", failed to malloc askEp info", pTmq->consumerId);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  pInfo->code = 0;
  tsem_init(&pInfo->sem, 0, 0);

  asyncAskEp(pTmq, updateEpCallbackFn, pInfo);
  // updateEpCallbackFn stores the result code and posts the semaphore
  tsem_wait(&pInfo->sem);

  int32_t code = pInfo->code;
  tsem_destroy(&pInfo->sem);
  taosMemoryFree(pInfo);
  return code;
}

// Build a TDMT_MND_TMQ_ASK_EP request for this consumer and send it asynchronously to the
// mnode endpoint set.
// askEpFn and param are stored in the callback parameter handed to askEpCallbackFn. If
// the request cannot be built, askEpFn is invoked directly with an error code and a NULL
// data buffer.
void asyncAskEp(tmq_t* pTmq, __tmq_askep_fn_t askEpFn, void* param) {
  int32_t          failCode = TSDB_CODE_SUCCESS;
  void*            pBuf = NULL;
  SMqAskEpCbParam* pCbParam = NULL;
  SMsgSendInfo*    pSend = NULL;
  int64_t          transporterId = 0;

  SMqAskEpReq req = {0};
  req.consumerId = pTmq->consumerId;
  req.epoch = pTmq->epoch;
  strcpy(req.cgroup, pTmq->groupId);

  // first pass computes the encoded size only
  int32_t tlen = tSerializeSMqAskEpReq(NULL, 0, &req);
  if (tlen < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq failed", pTmq->consumerId);
    failCode = TSDB_CODE_INVALID_PARA;
    goto _fail;
  }

  pBuf = taosMemoryCalloc(1, tlen);
  if (pBuf == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc askEpReq msg, size:%d", pTmq->consumerId, tlen);
    failCode = TSDB_CODE_OUT_OF_MEMORY;
    goto _fail;
  }

  if (tSerializeSMqAskEpReq(pBuf, tlen, &req) < 0) {
    tscError("consumer:0x%" PRIx64 ", tSerializeSMqAskEpReq %d failed", pTmq->consumerId, tlen);
    failCode = TSDB_CODE_INVALID_PARA;
    goto _fail;
  }

  pCbParam = taosMemoryCalloc(1, sizeof(SMqAskEpCbParam));
  if (pCbParam == NULL) {
    tscError("consumer:0x%" PRIx64 ", failed to malloc subscribe param", pTmq->consumerId);
    failCode = TSDB_CODE_OUT_OF_MEMORY;
    goto _fail;
  }

  pCbParam->refId = pTmq->refId;
  pCbParam->epoch = pTmq->epoch;
  pCbParam->pUserFn = askEpFn;
  pCbParam->pParam = param;

  pSend = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (pSend == NULL) {
    failCode = TSDB_CODE_OUT_OF_MEMORY;
    goto _fail;
  }

  pSend->msgInfo = (SDataBuf){.pData = pBuf, .len = tlen, .handle = NULL};
  pSend->requestId = generateRequestId();
  pSend->requestObjRefId = 0;
  pSend->param = pCbParam;
  pSend->fp = askEpCallbackFn;
  pSend->msgType = TDMT_MND_TMQ_ASK_EP;

  SEpSet epSet = getEpSet_s(&pTmq->pTscObj->pAppInfo->mgmtEp);
  tscInfo("consumer:0x%" PRIx64 " ask ep from mnode, reqId:0x%" PRIx64, pTmq->consumerId, pSend->requestId);

  asyncSendMsgToServer(pTmq->pTscObj->pAppInfo->pTransporter, &epSet, &transporterId, pSend);
  return;

_fail:
  // release whatever was allocated so far (either pointer may still be NULL), then report
  taosMemoryFree(pCbParam);
  taosMemoryFree(pBuf);
  askEpFn(pTmq, failCode, NULL, param);
}

// Format "<topicName>:<vg>" into dst and return the number of characters written
// (excluding the terminating NUL). dst must be large enough; no bound is checked here.
int32_t makeTopicVgroupKey(char* dst, const char* topicName, int32_t vg) {
  const int32_t written = sprintf(dst, "%s:%d", topicName, vg);
  return written;
}

// Finish a commit: invoke the user callback stored in pParamSet and free pParamSet.
// The consumer is looked up through its ref id; when it can no longer be acquired the
// callback is not invoked, pParamSet is still freed, terrno is set to
// TSDB_CODE_TMQ_CONSUMER_CLOSED and -1 is returned. Returns 0 otherwise.
int32_t tmqCommitDone(SMqCommitCbParamSet* pParamSet) {
  const int64_t consumerRef = pParamSet->refId;
  tmq_t*        pConsumer = taosAcquireRef(tmqMgmt.rsetId, consumerRef);

  if (pConsumer != NULL) {
    // if no more waiting rsp
    pParamSet->callbackFn(pConsumer, pParamSet->code, pParamSet->userParam);
    taosMemoryFree(pParamSet);

    taosReleaseRef(tmqMgmt.rsetId, consumerRef);
    return 0;
  }

  taosMemoryFree(pParamSet);
  terrno = TSDB_CODE_TMQ_CONSUMER_CLOSED;
  return -1;
}

2536
// Account for one received commit response: atomically decrement waitingRspNum and, when
// it reaches zero, complete the commit through tmqCommitDone().
// consumerId, pTopic and vgId are used for logging only.
void commitRspCountDown(SMqCommitCbParamSet* pParamSet, int64_t consumerId, const char* pTopic, int32_t vgId) {
  const int32_t remaining = atomic_sub_fetch_32(&pParamSet->waitingRspNum, 1);

  if (remaining != 0) {
    tscInfo("consumer:0x%" PRIx64 " topic:%s vgId:%d commit-rsp received, remain:%d", consumerId, pTopic, vgId, remaining);
    return;
  }

  tscInfo("consumer:0x%" PRIx64 " topic:%s vgId:%d all commit-rsp received, commit completed", consumerId, pTopic, vgId);
  tmqCommitDone(pParamSet);
}
2545 2546 2547 2548 2549 2550 2551 2552 2553 2554 2555 2556 2557 2558 2559 2560 2561 2562 2563 2564 2565 2566

// Advance the block iterator of a data result and load that block into its resInfo.
// resIter is incremented on every call. Returns a pointer to the result's own resInfo,
// or NULL once resIter has reached blockNum.
// When the response carries schemas, the schema of the new block is installed and the
// cached row/column/length/convert buffers are released before the block is loaded.
SReqResultInfo* tmqGetNextResInfo(TAOS_RES* res, bool convertUcs4) {
  SMqRspObj* pObj = (SMqRspObj*)res;

  pObj->resIter += 1;
  if (pObj->resIter >= pObj->rsp.blockNum) {
    return NULL;
  }

  SRetrieveTableRsp* pBlock = (SRetrieveTableRsp*)taosArrayGetP(pObj->rsp.blockData, pObj->resIter);

  if (pObj->rsp.withSchema) {
    SSchemaWrapper* pSchema = (SSchemaWrapper*)taosArrayGetP(pObj->rsp.blockSchema, pObj->resIter);
    setResSchemaInfo(&pObj->resInfo, pSchema->pSchema, pSchema->nCols);

    taosMemoryFreeClear(pObj->resInfo.row);
    taosMemoryFreeClear(pObj->resInfo.pCol);
    taosMemoryFreeClear(pObj->resInfo.length);
    taosMemoryFreeClear(pObj->resInfo.convertBuf);
    taosMemoryFreeClear(pObj->resInfo.convertJson);
  }

  setQueryResultFromRsp(&pObj->resInfo, pBlock, convertUcs4, false);
  return &pObj->resInfo;
}

2569 2570 2571 2572 2573 2574 2575 2576 2577 2578 2579 2580 2581 2582 2583 2584 2585 2586 2587
// Response callback for one TDMT_VND_TMQ_VG_WALINFO request.
// On success the WAL range and current offset of the vgroup are appended to the shared
// pCommon->pList; on failure the error code is stored in pCommon->code. The callback that
// brings the response count up to pParam->totalReq posts pCommon->rsp.
// Frees pMsg->pData, pMsg->pEpSet and pParam before returning 0.
static int32_t tmqGetWalInfoCb(void* param, SDataBuf* pMsg, int32_t code) {
  SMqVgWalInfoParam* pParam = param;
  SMqVgCommon*       pCommon = pParam->pCommon;

  if (code != TSDB_CODE_SUCCESS) {
    tscError("consumer:0x%" PRIx64 " failed to get the wal info from vgId:%d for topic:%s", pCommon->consumerId,
             pParam->vgId, pCommon->pTopicName);
    taosThreadMutexLock(&pCommon->mutex);
    pCommon->code = code;
    taosThreadMutexUnlock(&pCommon->mutex);
  } else {
    SMqDataRsp rsp = {0};
    SDecoder   decoder;
    tDecoderInit(&decoder, POINTER_SHIFT(pMsg->pData, sizeof(SMqRspHead)), pMsg->len - sizeof(SMqRspHead));
    tDecodeMqDataRsp(&decoder, &rsp);
    tDecoderClear(&decoder);

    SMqRspHead* pHead = pMsg->pData;

    tmq_topic_assignment assignment = {.begin = pHead->walsver,
                                       .end = pHead->walever + 1,
                                       .currentOffset = rsp.rspOffset.version,
                                       .vgId = pParam->vgId};

    taosThreadMutexLock(&pCommon->mutex);
    taosArrayPush(pCommon->pList, &assignment);
    taosThreadMutexUnlock(&pCommon->mutex);
  }

  // Count this response only after its result has been recorded. Counting first would let
  // the callback that completes the count post the semaphore while this one is still
  // writing to pCommon, which the woken waiter reads and then destroys.
  int32_t total = atomic_add_fetch_32(&pCommon->numOfRsp, 1);
  if (total == pParam->totalReq) {
    tsem_post(&pCommon->rsp);
  }

  // pCommon must not be touched past this point
  taosMemoryFree(pMsg->pData);
  taosMemoryFree(pMsg->pEpSet);
  taosMemoryFree(pParam);
  return 0;
}

// Release an SMqVgCommon: its result list, semaphore, mutex, topic-name copy and finally
// the structure itself. A NULL argument is ignored.
static void destroyCommonInfo(SMqVgCommon* pCommon) {
  if (pCommon != NULL) {
    taosArrayDestroy(pCommon->pList);
    tsem_destroy(&pCommon->rsp);
    taosThreadMutexDestroy(&pCommon->mutex);
    taosMemoryFree(pCommon->pTopicName);
    taosMemoryFree(pCommon);
  }
}

2618 2619 2620 2621 2622 2623 2624
// Decide from an offset type whether the consumer counts as being in snapshot mode:
//   type >  TMQ_OFFSET__LOG -> true
//   type <  TMQ_OFFSET__LOG -> true only when useSnapshot is set
//   type == TMQ_OFFSET__LOG -> false
static bool isInSnapshotMode(int8_t type, bool useSnapshot){
  if (type > TMQ_OFFSET__LOG) {
    return true;
  }
  if (type < TMQ_OFFSET__LOG) {
    return useSnapshot;
  }
  return false;
}

2625 2626 2627 2628 2629 2630 2631 2632 2633 2634 2635 2636 2637 2638 2639 2640 2641 2642 2643 2644 2645 2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661 2662 2663 2664 2665 2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681 2682 2683 2684 2685 2686 2687
// Return the current consume position (WAL version) of one vgroup of a subscribed topic.
//
// The topic is looked up under the name "<acctId>.<pTopicName>". The position is taken
// from the vgroup's endOffset:
//   TMQ_OFFSET__LOG            -> endOffset.version
//   TMQ_OFFSET__RESET_EARLIEST -> walVerBegin
//   TMQ_OFFSET__RESET_LATEST   -> walVerEnd
//
// Error codes are returned through the same int64_t:
//   TSDB_CODE_INVALID_PARA          tmq or pTopicName is NULL
//   TSDB_CODE_TMQ_INVALID_TOPIC     topic unknown (or its full name does not fit the buffer)
//   TSDB_CODE_TMQ_INVALID_VGID      vgId does not belong to the topic
//   TSDB_CODE_TMQ_SNAPSHOT_ERROR    offset is not a WAL version (snapshot mode)
//   TSDB_CODE_TMQ_NEED_INITIALIZED  WAL range not yet known
int64_t tmq_position(tmq_t *tmq, const char *pTopicName, int32_t vgId){
  if (tmq == NULL || pTopicName == NULL) {
    tscError("invalid tmq handle, null");
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t accId = tmq->pTscObj->acctId;
  char    tname[TSDB_TOPIC_FNAME_LEN] = {0};
  // bounded formatting: pTopicName comes from the caller and may be longer than the buffer
  int32_t len = snprintf(tname, sizeof(tname), "%d.%s", accId, pTopicName);
  if (len < 0 || len >= (int32_t)sizeof(tname)) {
    tscError("consumer:0x%" PRIx64 " invalid topic name:%s", tmq->consumerId, pTopicName);
    return TSDB_CODE_TMQ_INVALID_TOPIC;
  }

  taosWLockLatch(&tmq->lock);
  SMqClientTopic* pTopic = getTopicByName(tmq, tname);
  if (pTopic == NULL) {
    tscError("consumer:0x%" PRIx64 " invalid topic name:%s", tmq->consumerId, pTopicName);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_INVALID_TOPIC;
  }

  SMqClientVg* pVg = NULL;
  int32_t      numOfVgs = taosArrayGetSize(pTopic->vgs);
  for (int32_t i = 0; i < numOfVgs; ++i) {
    SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, i);
    if (pClientVg->vgId == vgId) {
      pVg = pClientVg;
      break;
    }
  }

  if (pVg == NULL) {
    tscError("consumer:0x%" PRIx64 " invalid vgroup id:%d", tmq->consumerId, vgId);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_INVALID_VGID;
  }

  int32_t type = pVg->offsetInfo.endOffset.type;
  if (isInSnapshotMode(type, tmq->useSnapshot)) {
    tscError("consumer:0x%" PRIx64 " offset type:%d not wal version, position error", tmq->consumerId, type);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_SNAPSHOT_ERROR;
  }

  if (!isWalRangeOk(&pVg->offsetInfo)) {
    tscError("consumer:0x%" PRIx64 " Assignment or poll interface need to be called first", tmq->consumerId);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_NEED_INITIALIZED;
  }

  int64_t       position = 0;
  STqOffsetVal* pOffsetInfo = &pVg->offsetInfo.endOffset;
  if (type == TMQ_OFFSET__LOG) {
    position = pOffsetInfo->version;
  } else if (type == TMQ_OFFSET__RESET_EARLIEST) {
    position = pVg->offsetInfo.walVerBegin;
  } else if (type == TMQ_OFFSET__RESET_LATEST) {
    position = pVg->offsetInfo.walVerEnd;
  } else {
    // position stays 0 in this case
    tscError("consumer:0x%" PRIx64 " offset type:%d can not be reach here", tmq->consumerId, type);
  }
  taosWUnLockLatch(&tmq->lock);

  return position;
}

H
Haojun Liao 已提交
2688
// Collect the assignment (vgId, WAL range, current offset) of every vgroup of a topic.
//
// On success *assignment points to a newly allocated array of *numOfAssignment entries
// (release it with tmq_free_assignment) and TSDB_CODE_SUCCESS is returned. On any failure
// *assignment is NULL, *numOfAssignment is 0 and an error code is returned.
//
// If every vgroup already has a TMQ_OFFSET__LOG begin offset the answer is built from the
// local state. Otherwise a TDMT_VND_TMQ_VG_WALINFO request is sent to every vgroup, the
// call blocks until all of them have answered, and the local WAL ranges are refreshed
// from the responses.
//
// NOTE(review): tmq->lock is held in write mode for the whole call, including the wait
// for the vnode responses.
// NOTE(review): if building a request fails after earlier requests of the same loop were
// already sent, the `end` path destroys pCommon while those requests' callbacks may still
// use it - confirm and handle separately.
int32_t tmq_get_topic_assignment(tmq_t* tmq, const char* pTopicName, tmq_topic_assignment** assignment,
                                 int32_t* numOfAssignment) {
  // reset the outputs first so that they are well defined on every return path
  if (numOfAssignment != NULL) {
    *numOfAssignment = 0;
  }
  if (assignment != NULL) {
    *assignment = NULL;
  }
  if (tmq == NULL || pTopicName == NULL || assignment == NULL || numOfAssignment == NULL) {
    tscError("invalid tmq handle, null");
    return TSDB_CODE_INVALID_PARA;
  }

  SMqVgCommon* pCommon = NULL;

  int32_t accId = tmq->pTscObj->acctId;
  char    tname[TSDB_TOPIC_FNAME_LEN] = {0};
  // bounded formatting: pTopicName comes from the caller and may be longer than the buffer
  int32_t len = snprintf(tname, sizeof(tname), "%d.%s", accId, pTopicName);
  if (len < 0 || len >= (int32_t)sizeof(tname)) {
    // same code as for a topic that cannot be found below
    return TSDB_CODE_INVALID_PARA;
  }
  int32_t code = TSDB_CODE_SUCCESS;

  taosWLockLatch(&tmq->lock);
  SMqClientTopic* pTopic = getTopicByName(tmq, tname);
  if (pTopic == NULL) {
    code = TSDB_CODE_INVALID_PARA;
    goto end;
  }

  // in case of snapshot is opened, no valid offset will return
  *numOfAssignment = taosArrayGetSize(pTopic->vgs);
  for (int32_t j = 0; j < (*numOfAssignment); ++j) {
    SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, j);
    int32_t      type = pClientVg->offsetInfo.beginOffset.type;
    if (isInSnapshotMode(type, tmq->useSnapshot)) {
      tscError("consumer:0x%" PRIx64 " offset type:%d not wal version, assignment not allowed", tmq->consumerId, type);
      code = TSDB_CODE_TMQ_SNAPSHOT_ERROR;
      goto end;
    }
  }

  *assignment = taosMemoryCalloc(*numOfAssignment, sizeof(tmq_topic_assignment));
  if (*assignment == NULL) {
    tscError("consumer:0x%" PRIx64 " failed to malloc buffer, size:%" PRIzu, tmq->consumerId,
             (*numOfAssignment) * sizeof(tmq_topic_assignment));
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto end;
  }

  bool needFetch = false;

  // fill from local state; stop at the first vgroup whose begin offset is not a WAL version
  for (int32_t j = 0; j < (*numOfAssignment); ++j) {
    SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, j);
    if (pClientVg->offsetInfo.beginOffset.type != TMQ_OFFSET__LOG) {
      needFetch = true;
      break;
    }

    tmq_topic_assignment* pAssignment = &(*assignment)[j];
    pAssignment->currentOffset = pClientVg->offsetInfo.beginOffset.version;
    pAssignment->begin = pClientVg->offsetInfo.walVerBegin;
    pAssignment->end = pClientVg->offsetInfo.walVerEnd;
    pAssignment->vgId = pClientVg->vgId;
    tscInfo("consumer:0x%" PRIx64 " get assignment from local:%d->%" PRId64, tmq->consumerId,
            pAssignment->vgId, pAssignment->currentOffset);
  }

  if (needFetch) {
    pCommon = taosMemoryCalloc(1, sizeof(SMqVgCommon));
    if (pCommon == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      code = terrno;
      goto end;
    }

    pCommon->pList = taosArrayInit(4, sizeof(tmq_topic_assignment));
    tsem_init(&pCommon->rsp, 0, 0);
    taosThreadMutexInit(&pCommon->mutex, 0);
    pCommon->pTopicName = taosStrdup(pTopic->topicName);
    pCommon->consumerId = tmq->consumerId;

    // the response callbacks push into pList and log pTopicName, so both must exist
    // before any request is sent
    if (pCommon->pList == NULL || pCommon->pTopicName == NULL) {
      terrno = TSDB_CODE_OUT_OF_MEMORY;
      code = terrno;
      goto end;
    }

    terrno = TSDB_CODE_OUT_OF_MEMORY;
    for (int32_t i = 0; i < (*numOfAssignment); ++i) {
      SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, i);

      SMqVgWalInfoParam* pParam = taosMemoryMalloc(sizeof(SMqVgWalInfoParam));
      if (pParam == NULL) {
        code = terrno;
        goto end;
      }

      pParam->epoch = tmq->epoch;
      pParam->vgId = pClientVg->vgId;
      pParam->totalReq = *numOfAssignment;
      pParam->pCommon = pCommon;

      SMqPollReq req = {0};
      tmqBuildConsumeReqImpl(&req, tmq, 10, pTopic, pClientVg);
      req.reqOffset = pClientVg->offsetInfo.beginOffset;

      // first pass computes the encoded size only
      int32_t msgSize = tSerializeSMqPollReq(NULL, 0, &req);
      if (msgSize < 0) {
        taosMemoryFree(pParam);
        code = terrno;
        goto end;
      }

      char* msg = taosMemoryCalloc(1, msgSize);
      if (NULL == msg) {
        taosMemoryFree(pParam);
        code = terrno;
        goto end;
      }

      if (tSerializeSMqPollReq(msg, msgSize, &req) < 0) {
        taosMemoryFree(msg);
        taosMemoryFree(pParam);
        code = terrno;
        goto end;
      }

      SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
      if (sendInfo == NULL) {
        taosMemoryFree(pParam);
        taosMemoryFree(msg);
        code = terrno;
        goto end;
      }

      sendInfo->msgInfo = (SDataBuf){.pData = msg, .len = msgSize, .handle = NULL};
      sendInfo->requestId = req.reqId;
      sendInfo->requestObjRefId = 0;
      sendInfo->param = pParam;
      sendInfo->fp = tmqGetWalInfoCb;
      sendInfo->msgType = TDMT_VND_TMQ_VG_WALINFO;

      int64_t transporterId = 0;
      char    offsetFormatBuf[TSDB_OFFSET_LEN] = {0};
      tFormatOffset(offsetFormatBuf, tListLen(offsetFormatBuf), &pClientVg->offsetInfo.beginOffset);

      tscInfo("consumer:0x%" PRIx64 " %s retrieve wal info vgId:%d, epoch %d, req:%s, reqId:0x%" PRIx64,
              tmq->consumerId, pTopic->topicName, pClientVg->vgId, tmq->epoch, offsetFormatBuf, req.reqId);
      asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &pClientVg->epSet, &transporterId, sendInfo);
    }

    // posted by tmqGetWalInfoCb once all requests have been answered
    tsem_wait(&pCommon->rsp);
    code = pCommon->code;

    terrno = code;
    if (code != TSDB_CODE_SUCCESS) {
      goto end;
    }

    // replace the locally built entries with the ones reported by the vnodes
    int32_t num = taosArrayGetSize(pCommon->pList);
    for (int32_t i = 0; i < num; ++i) {
      (*assignment)[i] = *(tmq_topic_assignment*)taosArrayGet(pCommon->pList, i);
    }
    *numOfAssignment = num;

    // refresh the cached WAL range of every vgroup that answered
    for (int32_t j = 0; j < (*numOfAssignment); ++j) {
      tmq_topic_assignment* p = &(*assignment)[j];

      for (int32_t i = 0; i < taosArrayGetSize(pTopic->vgs); ++i) {
        SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, i);
        if (pClientVg->vgId != p->vgId) {
          continue;
        }

        SVgOffsetInfo* pOffsetInfo = &pClientVg->offsetInfo;
        tscInfo("vgId:%d offset is update to:%"PRId64, p->vgId, p->currentOffset);

        pOffsetInfo->walVerBegin = p->begin;
        pOffsetInfo->walVerEnd = p->end;
      }
    }
  }

end:
  if (code != TSDB_CODE_SUCCESS) {
    taosMemoryFree(*assignment);
    *assignment = NULL;
    *numOfAssignment = 0;
  }
  destroyCommonInfo(pCommon);
  taosWUnLockLatch(&tmq->lock);
  return code;
}

T
t_max 已提交
2864 2865 2866 2867 2868 2869 2870 2871
// Release an assignment array obtained from tmq_get_topic_assignment(). NULL is ignored.
void tmq_free_assignment(tmq_topic_assignment* pAssignment) {
  if (pAssignment != NULL) {
    taosMemoryFree(pAssignment);
  }
}

2872 2873 2874 2875 2876 2877 2878 2879 2880 2881 2882
// Response callback for a seek request: releases the response buffers (when a response
// object is present), stores the result code in the SMqSeekParam passed as param and
// posts its semaphore. Always returns 0.
static int32_t tmqSeekCb(void* param, SDataBuf* pMsg, int32_t code) {
  if (pMsg != NULL) {
    taosMemoryFree(pMsg->pData);
    taosMemoryFree(pMsg->pEpSet);
  }

  SMqSeekParam* pSeek = (SMqSeekParam*)param;
  pSeek->code = code;
  tsem_post(&pSeek->sem);

  return 0;
}

2883
// Move the consume position of one vgroup of a subscribed topic to `offset` and notify
// the vnode with a TDMT_VND_TMQ_SEEK request, blocking until the response arrives.
//
// The topic is looked up under the name "<acctId>.<pTopicName>". The offset must lie inside
// the vgroup's known WAL range [walVerBegin, walVerEnd]. The local begin/end offsets are
// updated before the request is sent.
//
// Returns:
//   TSDB_CODE_INVALID_PARA              tmq or pTopicName is NULL
//   TSDB_CODE_TMQ_INVALID_TOPIC         topic unknown (or its full name does not fit the buffer)
//   TSDB_CODE_TMQ_INVALID_VGID          vgId does not belong to the topic
//   TSDB_CODE_TMQ_SNAPSHOT_ERROR        offset is not a WAL version (snapshot mode)
//   TSDB_CODE_TMQ_NEED_INITIALIZED      WAL range not yet known
//   TSDB_CODE_TMQ_VERSION_OUT_OF_RANGE  offset outside the WAL range
//   TSDB_CODE_PAR_INTERNAL_ERROR        the request could not be serialized
//   TSDB_CODE_OUT_OF_MEMORY             an allocation failed
//   otherwise the code delivered to tmqSeekCb
int32_t tmq_offset_seek(tmq_t* tmq, const char* pTopicName, int32_t vgId, int64_t offset) {
  if (tmq == NULL || pTopicName == NULL) {
    tscError("invalid tmq handle, null");
    return TSDB_CODE_INVALID_PARA;
  }

  int32_t accId = tmq->pTscObj->acctId;
  char    tname[TSDB_TOPIC_FNAME_LEN] = {0};
  // bounded formatting: pTopicName comes from the caller and may be longer than the buffer
  int32_t len = snprintf(tname, sizeof(tname), "%d.%s", accId, pTopicName);
  if (len < 0 || len >= (int32_t)sizeof(tname)) {
    tscError("consumer:0x%" PRIx64 " invalid topic name:%s", tmq->consumerId, pTopicName);
    return TSDB_CODE_TMQ_INVALID_TOPIC;
  }

  taosWLockLatch(&tmq->lock);
  SMqClientTopic* pTopic = getTopicByName(tmq, tname);
  if (pTopic == NULL) {
    tscError("consumer:0x%" PRIx64 " invalid topic name:%s", tmq->consumerId, pTopicName);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_INVALID_TOPIC;
  }

  SMqClientVg* pVg = NULL;
  int32_t      numOfVgs = taosArrayGetSize(pTopic->vgs);
  for (int32_t i = 0; i < numOfVgs; ++i) {
    SMqClientVg* pClientVg = taosArrayGet(pTopic->vgs, i);
    if (pClientVg->vgId == vgId) {
      pVg = pClientVg;
      break;
    }
  }

  if (pVg == NULL) {
    tscError("consumer:0x%" PRIx64 " invalid vgroup id:%d", tmq->consumerId, vgId);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_INVALID_VGID;
  }

  SVgOffsetInfo* pOffsetInfo = &pVg->offsetInfo;

  int32_t type = pOffsetInfo->endOffset.type;
  if (isInSnapshotMode(type, tmq->useSnapshot)) {
    tscError("consumer:0x%" PRIx64 " offset type:%d not wal version, seek not allowed", tmq->consumerId, type);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_SNAPSHOT_ERROR;
  }

  if (!isWalRangeOk(&pVg->offsetInfo)) {
    tscError("consumer:0x%" PRIx64 " Assignment or poll interface need to be called first", tmq->consumerId);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_NEED_INITIALIZED;
  }

  if (offset < pOffsetInfo->walVerBegin || offset > pOffsetInfo->walVerEnd) {
    tscError("consumer:0x%" PRIx64 " invalid seek params, offset:%" PRId64 ", valid range:[%" PRId64 ", %" PRId64 "]",
             tmq->consumerId, offset, pOffsetInfo->walVerBegin, pOffsetInfo->walVerEnd);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_TMQ_VERSION_OUT_OF_RANGE;
  }

  // update the offset, and then commit to vnode
  pOffsetInfo->endOffset.type = TMQ_OFFSET__LOG;
  pOffsetInfo->endOffset.version = offset;
  pOffsetInfo->beginOffset = pOffsetInfo->endOffset;
  pVg->seekUpdated = true;
  tscInfo("consumer:0x%" PRIx64 " seek to %" PRId64 " on vgId:%d", tmq->consumerId, offset, vgId);

  SMqSeekReq req = {0};
  snprintf(req.subKey, TSDB_SUBSCRIBE_KEY_LEN, "%s:%s", tmq->groupId, pTopic->topicName);
  req.head.vgId = pVg->vgId;
  req.consumerId = tmq->consumerId;

  // first pass computes the encoded size only
  int32_t msgSize = tSerializeSMqSeekReq(NULL, 0, &req);
  if (msgSize < 0) {
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_PAR_INTERNAL_ERROR;
  }

  char* msg = taosMemoryCalloc(1, msgSize);
  if (NULL == msg) {
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  if (tSerializeSMqSeekReq(msg, msgSize, &req) < 0) {
    taosMemoryFree(msg);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_PAR_INTERNAL_ERROR;
  }

  SMsgSendInfo* sendInfo = taosMemoryCalloc(1, sizeof(SMsgSendInfo));
  if (sendInfo == NULL) {
    taosMemoryFree(msg);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_OUT_OF_MEMORY;
  }

  SMqSeekParam* pParam = taosMemoryMalloc(sizeof(SMqSeekParam));
  if (pParam == NULL) {
    taosMemoryFree(msg);
    taosMemoryFree(sendInfo);
    taosWUnLockLatch(&tmq->lock);
    return TSDB_CODE_OUT_OF_MEMORY;
  }
  tsem_init(&pParam->sem, 0, 0);

  sendInfo->msgInfo = (SDataBuf){.pData = msg, .len = msgSize, .handle = NULL};
  sendInfo->requestId = generateRequestId();
  sendInfo->requestObjRefId = 0;
  sendInfo->param = pParam;
  sendInfo->fp = tmqSeekCb;
  sendInfo->msgType = TDMT_VND_TMQ_SEEK;

  int64_t transporterId = 0;
  // the format previously ended in a stray PRIx64, which printed literal conversion
  // letters after the epoch value
  tscInfo("consumer:0x%" PRIx64 " %s send seek info vgId:%d, epoch %d",
          tmq->consumerId, pTopic->topicName, vgId, tmq->epoch);
  asyncSendMsgToServer(tmq->pTscObj->pAppInfo->pTransporter, &pVg->epSet, &transporterId, sendInfo);
  // the latch is released before blocking on the response
  taosWUnLockLatch(&tmq->lock);

  // tmqSeekCb stores the result code and posts the semaphore
  tsem_wait(&pParam->sem);
  int32_t code = pParam->code;
  tsem_destroy(&pParam->sem);
  taosMemoryFree(pParam);

  if (code != TSDB_CODE_SUCCESS) {
    tscError("consumer:0x%" PRIx64 " failed to send seek to vgId:%d, code:%s", tmq->consumerId, vgId, tstrerror(code));
  }

  return code;
}