提交 09e0dbbe 编写于 作者: D Danil Kipnis 提交者: Jason Gunthorpe

RDMA/rtrs-clt: add an additional random 8 seconds before reconnecting

In order to avoid all the clients to start reconnecting at the same time
schedule the reconnect dwork with a random jitter of +[0,8] seconds.

Fixes: 6a98d71d ("RDMA/rtrs: client: main functionality")
Link: https://lore.kernel.org/r/20200724111508.15734-2-haris.iqbal@cloud.ionos.comSigned-off-by: NDanil Kipnis <danil.kipnis@cloud.ionos.com>
Signed-off-by: NMd Haris Iqbal <haris.iqbal@cloud.ionos.com>
Signed-off-by: NJason Gunthorpe <jgg@nvidia.com>
上级 f6a9d47a
...@@ -12,6 +12,7 @@ ...@@ -12,6 +12,7 @@
#include <linux/module.h> #include <linux/module.h>
#include <linux/rculist.h> #include <linux/rculist.h>
#include <linux/random.h>
#include "rtrs-clt.h" #include "rtrs-clt.h"
#include "rtrs-log.h" #include "rtrs-log.h"
...@@ -23,6 +24,12 @@ ...@@ -23,6 +24,12 @@
* leads to "false positives" failed reconnect attempts * leads to "false positives" failed reconnect attempts
*/ */
#define RTRS_RECONNECT_BACKOFF 1000 #define RTRS_RECONNECT_BACKOFF 1000
/*
* Wait for additional random time between 0 and 8 seconds
* before starting to reconnect to avoid clients reconnecting
* all at once in case of a major network outage
*/
#define RTRS_RECONNECT_SEED 8
MODULE_DESCRIPTION("RDMA Transport Client"); MODULE_DESCRIPTION("RDMA Transport Client");
MODULE_LICENSE("GPL"); MODULE_LICENSE("GPL");
...@@ -306,7 +313,8 @@ static void rtrs_rdma_error_recovery(struct rtrs_clt_con *con) ...@@ -306,7 +313,8 @@ static void rtrs_rdma_error_recovery(struct rtrs_clt_con *con)
*/ */
delay_ms = clt->reconnect_delay_sec * 1000; delay_ms = clt->reconnect_delay_sec * 1000;
queue_delayed_work(rtrs_wq, &sess->reconnect_dwork, queue_delayed_work(rtrs_wq, &sess->reconnect_dwork,
msecs_to_jiffies(delay_ms)); msecs_to_jiffies(delay_ms +
prandom_u32() % RTRS_RECONNECT_SEED));
} else { } else {
/* /*
* Error can happen just on establishing new connection, * Error can happen just on establishing new connection,
...@@ -2503,7 +2511,9 @@ static void rtrs_clt_reconnect_work(struct work_struct *work) ...@@ -2503,7 +2511,9 @@ static void rtrs_clt_reconnect_work(struct work_struct *work)
sess->stats->reconnects.fail_cnt++; sess->stats->reconnects.fail_cnt++;
delay_ms = clt->reconnect_delay_sec * 1000; delay_ms = clt->reconnect_delay_sec * 1000;
queue_delayed_work(rtrs_wq, &sess->reconnect_dwork, queue_delayed_work(rtrs_wq, &sess->reconnect_dwork,
msecs_to_jiffies(delay_ms)); msecs_to_jiffies(delay_ms +
prandom_u32() %
RTRS_RECONNECT_SEED));
} }
} }
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册