提交 46579b86 作者: Hongqin-Li 提交者: ob-robot

Fix hang when fetching tablet autoinc seq after a leader switch

上级 170ebd9b
...@@ -151,40 +151,31 @@ int ObTabletAutoincMgr::fetch_new_range(const ObTabletAutoincParam &param, ...@@ -151,40 +151,31 @@ int ObTabletAutoincMgr::fetch_new_range(const ObTabletAutoincParam &param,
arg.tenant_id_ = param.tenant_id_; arg.tenant_id_ = param.tenant_id_;
arg.tablet_id_ = tablet_id; arg.tablet_id_ = tablet_id;
arg.ls_id_ = ls_id; arg.ls_id_ = ls_id;
if (OB_FAIL(srv_rpc_proxy->to(leader_addr).fetch_tablet_autoinc_seq_cache(arg, res))) {
LOG_WARN("fail to fetch autoinc cache for tablets", K(ret), K(arg));
}
if (OB_FAIL(ret)) { bool finish = false;
int tmp_ret = OB_SUCCESS; for (int64_t retry_times = 0; OB_SUCC(ret) && !finish; retry_times++) {
int64_t retry_times = 0; if (OB_FAIL(srv_rpc_proxy->to(leader_addr).fetch_tablet_autoinc_seq_cache(arg, res))) {
if (OB_NOT_MASTER == ret) { LOG_WARN("fail to fetch autoinc cache for tablets", K(ret), K(retry_times), K(arg));
if (OB_TMP_FAIL(location_service->get(param.tenant_id_, tablet_id, INT64_MAX/*expire_renew_time*/, is_cache_hit, ls_id))) { } else {
LOG_WARN("fail to get log stream id", K(tmp_ret), K(ret), K(tablet_id)); finish = true;
} else if (OB_TMP_FAIL(location_service->get_leader(GCONF.cluster_id,
param.tenant_id_,
ls_id,
true/*force_renew*/,
leader_addr))) {
LOG_WARN("force get leader failed", K(tmp_ret), K(ret), K(ls_id));
}
} }
if (OB_SUCCESS == tmp_ret) { if (OB_FAIL(ret) && is_retryable(ret)) {
bool worker_err = false; const bool need_refresh_leader = OB_NOT_MASTER == ret;
while (OB_FAIL(ret) && !worker_err && is_retryable(ret)) { ob_usleep<common::ObWaitEventIds::STORAGE_AUTOINC_FETCH_RETRY_SLEEP>(RETRY_INTERVAL);
++retry_times; res.reset();
ob_usleep<common::ObWaitEventIds::STORAGE_AUTOINC_FETCH_RETRY_SLEEP>(RETRY_INTERVAL); if (OB_FAIL(THIS_WORKER.check_status())) { // overwrite ret
res.reset(); LOG_WARN("failed to check status", K(ret));
if (OB_FAIL(THIS_WORKER.check_status())) { } else if (need_refresh_leader) {
worker_err = true; if (OB_FAIL(location_service->get(param.tenant_id_, tablet_id, INT64_MAX/*expire_renew_time*/, is_cache_hit, ls_id))) {
LOG_WARN("failed to check status", K(ret)); LOG_WARN("fail to get log stream id", K(ret), K(ret), K(tablet_id));
} else if (OB_FAIL(srv_rpc_proxy->to(leader_addr).fetch_tablet_autoinc_seq_cache(arg, res))) { } else if (OB_FAIL(location_service->get_leader(GCONF.cluster_id,
LOG_WARN("fail to fetch autoinc cache for tablets", K(ret), K(retry_times), K(arg)); param.tenant_id_,
ls_id,
true/*force_renew*/,
leader_addr))) {
LOG_WARN("force get leader failed", K(ret), K(ret), K(ls_id));
} }
} }
} else {
LOG_WARN("fetch new range from leader failed", K(ret), K(tmp_ret));
ret = tmp_ret;
} }
} }
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册