提交 bc70c292 编写于 作者: H Huazhong Tan 提交者: Xie XiuQi

net: hns3: add some DFX info for reset issue

driver inclusion
category: bugfix
bugzilla: NA
CVE: NA

This patch adds more information to the reset DFX dump. It also cleans
up the reset info: it moves reset_fail_cnt into struct hclge_rst_stats
and changes some print formats (%d to %u for the unsigned counters).

Feature or Bugfix:Bugfix
Signed-off-by: Huazhong Tan <tanhuazhong@huawei.com>
Reviewed-by: shenjian <shenjian15@huawei.com>
Reviewed-by: linyunsheng <linyunsheng@huawei.com>
Reviewed-by: Yang Yingliang <yangyingliang@huawei.com>
Signed-off-by: Yang Yingliang <yangyingliang@huawei.com>
上级 f46b2cbb
...@@ -1022,18 +1022,33 @@ static void hclge_dbg_fd_tcam(struct hclge_dev *hdev) ...@@ -1022,18 +1022,33 @@ static void hclge_dbg_fd_tcam(struct hclge_dev *hdev)
static void hclge_dbg_dump_rst_info(struct hclge_dev *hdev) static void hclge_dbg_dump_rst_info(struct hclge_dev *hdev)
{ {
dev_info(&hdev->pdev->dev, "PF reset count: %d\n", dev_info(&hdev->pdev->dev, "PF reset count: %u\n",
hdev->rst_stats.pf_rst_cnt); hdev->rst_stats.pf_rst_cnt);
dev_info(&hdev->pdev->dev, "FLR reset count: %d\n", dev_info(&hdev->pdev->dev, "FLR reset count: %u\n",
hdev->rst_stats.flr_rst_cnt); hdev->rst_stats.flr_rst_cnt);
dev_info(&hdev->pdev->dev, "GLOBAL reset count: %d\n", dev_info(&hdev->pdev->dev, "GLOBAL reset count: %u\n",
hdev->rst_stats.global_rst_cnt); hdev->rst_stats.global_rst_cnt);
dev_info(&hdev->pdev->dev, "IMP reset count: %d\n", dev_info(&hdev->pdev->dev, "IMP reset count: %u\n",
hdev->rst_stats.imp_rst_cnt); hdev->rst_stats.imp_rst_cnt);
dev_info(&hdev->pdev->dev, "reset done count: %d\n", dev_info(&hdev->pdev->dev, "reset done count: %u\n",
hdev->rst_stats.reset_done_cnt); hdev->rst_stats.reset_done_cnt);
dev_info(&hdev->pdev->dev, "reset count: %d\n", dev_info(&hdev->pdev->dev, "reset count: %u\n",
hdev->rst_stats.reset_cnt); hdev->rst_stats.reset_cnt);
dev_info(&hdev->pdev->dev, "reset fail count: %u\n",
hdev->rst_stats.reset_fail_cnt);
dev_info(&hdev->pdev->dev, "vector0 interrupt enable status: 0x%x\n",
hclge_read_dev(&hdev->hw, HCLGE_MISC_VECTOR_REG_BASE));
dev_info(&hdev->pdev->dev, "reset interrupt source: 0x%x\n",
hclge_read_dev(&hdev->hw, HCLGE_MISC_RESET_STS_REG));
dev_info(&hdev->pdev->dev, "reset interrupt status: 0x%x\n",
hclge_read_dev(&hdev->hw, HCLGE_MISC_VECTOR_INT_STS));
dev_info(&hdev->pdev->dev, "hardware reset status: 0x%x\n",
hclge_read_dev(&hdev->hw, HCLGE_GLOBAL_RESET_REG));
dev_info(&hdev->pdev->dev, "handshake status: 0x%x\n",
hclge_read_dev(&hdev->hw, HCLGE_NIC_CSQ_DEPTH_REG));
dev_info(&hdev->pdev->dev, "function reset status: 0x%x\n",
hclge_read_dev(&hdev->hw, HCLGE_FUN_RST_ING));
dev_info(&hdev->pdev->dev, "hdev state: 0x%lx\n", hdev->state);
} }
static void hclge_dbg_get_m7_stats_info(struct hclge_dev *hdev) static void hclge_dbg_get_m7_stats_info(struct hclge_dev *hdev)
......
...@@ -3517,12 +3517,12 @@ static bool hclge_reset_err_handle(struct hclge_dev *hdev) ...@@ -3517,12 +3517,12 @@ static bool hclge_reset_err_handle(struct hclge_dev *hdev)
"reset failed because new reset interrupt\n"); "reset failed because new reset interrupt\n");
hclge_clear_reset_cause(hdev); hclge_clear_reset_cause(hdev);
return false; return false;
} else if (hdev->reset_fail_cnt < HCLGE_RESET_MAX_FAIL_CNT) { } else if (hdev->rst_stats.reset_fail_cnt < HCLGE_RESET_MAX_FAIL_CNT) {
hdev->reset_fail_cnt++; hdev->rst_stats.reset_fail_cnt++;
set_bit(hdev->reset_type, &hdev->reset_pending); set_bit(hdev->reset_type, &hdev->reset_pending);
dev_info(&hdev->pdev->dev, dev_info(&hdev->pdev->dev,
"re-schedule reset task(%d)\n", "re-schedule reset task(%d)\n",
hdev->reset_fail_cnt); hdev->rst_stats.reset_fail_cnt);
return true; return true;
} }
...@@ -3651,7 +3651,8 @@ static void hclge_reset(struct hclge_dev *hdev) ...@@ -3651,7 +3651,8 @@ static void hclge_reset(struct hclge_dev *hdev)
/* ignore RoCE notify error if it fails HCLGE_RESET_MAX_FAIL_CNT - 1 /* ignore RoCE notify error if it fails HCLGE_RESET_MAX_FAIL_CNT - 1
* times * times
*/ */
if (ret && hdev->reset_fail_cnt < HCLGE_RESET_MAX_FAIL_CNT - 1) if (ret &&
hdev->rst_stats.reset_fail_cnt < HCLGE_RESET_MAX_FAIL_CNT - 1)
goto err_reset; goto err_reset;
rtnl_lock(); rtnl_lock();
...@@ -3667,7 +3668,7 @@ static void hclge_reset(struct hclge_dev *hdev) ...@@ -3667,7 +3668,7 @@ static void hclge_reset(struct hclge_dev *hdev)
goto err_reset; goto err_reset;
hdev->last_reset_time = jiffies; hdev->last_reset_time = jiffies;
hdev->reset_fail_cnt = 0; hdev->rst_stats.reset_fail_cnt = 0;
hdev->rst_stats.reset_done_cnt++; hdev->rst_stats.reset_done_cnt++;
ae_dev->reset_type = HNAE3_NONE_RESET; ae_dev->reset_type = HNAE3_NONE_RESET;
...@@ -3768,7 +3769,7 @@ static bool hclge_reset_done(struct hnae3_handle *handle, bool done) ...@@ -3768,7 +3769,7 @@ static bool hclge_reset_done(struct hnae3_handle *handle, bool done)
struct hclge_vport *vport = hclge_get_vport(handle); struct hclge_vport *vport = hclge_get_vport(handle);
struct hclge_dev *hdev = vport->back; struct hclge_dev *hdev = vport->back;
if (hdev->reset_fail_cnt >= HCLGE_RESET_MAX_FAIL_CNT) if (hdev->rst_stats.reset_fail_cnt >= HCLGE_RESET_MAX_FAIL_CNT)
dev_err(&hdev->pdev->dev, "Reset fail!\n"); dev_err(&hdev->pdev->dev, "Reset fail!\n");
return done; return done;
......
...@@ -712,6 +712,7 @@ struct hclge_rst_stats { ...@@ -712,6 +712,7 @@ struct hclge_rst_stats {
u32 global_rst_cnt; /* the number of GLOBAL */ u32 global_rst_cnt; /* the number of GLOBAL */
u32 imp_rst_cnt; /* the number of IMP reset */ u32 imp_rst_cnt; /* the number of IMP reset */
u32 reset_cnt; /* the number of reset has been done */ u32 reset_cnt; /* the number of reset has been done */
u32 reset_fail_cnt; /* the number of reset fail */
}; };
/* time and register status when mac tunnel interruption occur */ /* time and register status when mac tunnel interruption occur */
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册