提交 2c97cf13 编写于 作者: G Guoqing Jiang 提交者: Shaohua Li

md-cluser: make resync_finish only called after pers->sync_request

It is not reasonable that cluster raid to release resync
lock before the last pers->sync_request has finished.

As the metadata will be changed when node performs resync,
we need to inform other nodes to update metadata, so the
MD_CHANGE_PENDING flag is set before finish resync.

Then metadata_update_finish is move ahead to ensure that
METADATA_UPDATED msg is sent before finish resync, and
metadata_update_start need to be run after "repeat:" label
accordingly.
Reviewed-by: NNeilBrown <neilb@suse.com>
Signed-off-by: NGuoqing Jiang <gqjiang@suse.com>
Signed-off-by: NShaohua Li <shli@fb.com>
上级 41a9a0dc
...@@ -2291,6 +2291,7 @@ void md_update_sb(struct mddev *mddev, int force_change) ...@@ -2291,6 +2291,7 @@ void md_update_sb(struct mddev *mddev, int force_change)
return; return;
} }
repeat:
if (mddev_is_clustered(mddev)) { if (mddev_is_clustered(mddev)) {
if (test_and_clear_bit(MD_CHANGE_DEVS, &mddev->flags)) if (test_and_clear_bit(MD_CHANGE_DEVS, &mddev->flags))
force_change = 1; force_change = 1;
...@@ -2303,7 +2304,7 @@ void md_update_sb(struct mddev *mddev, int force_change) ...@@ -2303,7 +2304,7 @@ void md_update_sb(struct mddev *mddev, int force_change)
return; return;
} }
} }
repeat:
/* First make sure individual recovery_offsets are correct */ /* First make sure individual recovery_offsets are correct */
rdev_for_each(rdev, mddev) { rdev_for_each(rdev, mddev) {
if (rdev->raid_disk >= 0 && if (rdev->raid_disk >= 0 &&
...@@ -2430,6 +2431,9 @@ void md_update_sb(struct mddev *mddev, int force_change) ...@@ -2430,6 +2431,9 @@ void md_update_sb(struct mddev *mddev, int force_change)
md_super_wait(mddev); md_super_wait(mddev);
/* if there was a failure, MD_CHANGE_DEVS was set, and we re-write super */ /* if there was a failure, MD_CHANGE_DEVS was set, and we re-write super */
if (mddev_is_clustered(mddev) && ret == 0)
md_cluster_ops->metadata_update_finish(mddev);
spin_lock(&mddev->lock); spin_lock(&mddev->lock);
if (mddev->in_sync != sync_req || if (mddev->in_sync != sync_req ||
test_bit(MD_CHANGE_DEVS, &mddev->flags)) { test_bit(MD_CHANGE_DEVS, &mddev->flags)) {
...@@ -2452,9 +2456,6 @@ void md_update_sb(struct mddev *mddev, int force_change) ...@@ -2452,9 +2456,6 @@ void md_update_sb(struct mddev *mddev, int force_change)
clear_bit(BlockedBadBlocks, &rdev->flags); clear_bit(BlockedBadBlocks, &rdev->flags);
wake_up(&rdev->blocked_wait); wake_up(&rdev->blocked_wait);
} }
if (mddev_is_clustered(mddev) && ret == 0)
md_cluster_ops->metadata_update_finish(mddev);
} }
EXPORT_SYMBOL(md_update_sb); EXPORT_SYMBOL(md_update_sb);
...@@ -7785,7 +7786,6 @@ void md_do_sync(struct md_thread *thread) ...@@ -7785,7 +7786,6 @@ void md_do_sync(struct md_thread *thread)
struct md_rdev *rdev; struct md_rdev *rdev;
char *desc, *action = NULL; char *desc, *action = NULL;
struct blk_plug plug; struct blk_plug plug;
bool cluster_resync_finished = false;
int ret; int ret;
/* just incase thread restarts... */ /* just incase thread restarts... */
...@@ -8103,11 +8103,6 @@ void md_do_sync(struct md_thread *thread) ...@@ -8103,11 +8103,6 @@ void md_do_sync(struct md_thread *thread)
mddev->curr_resync_completed = mddev->curr_resync; mddev->curr_resync_completed = mddev->curr_resync;
sysfs_notify(&mddev->kobj, NULL, "sync_completed"); sysfs_notify(&mddev->kobj, NULL, "sync_completed");
} }
/* tell personality and other nodes that we are finished */
if (mddev_is_clustered(mddev)) {
md_cluster_ops->resync_finish(mddev);
cluster_resync_finished = true;
}
mddev->pers->sync_request(mddev, max_sectors, &skipped); mddev->pers->sync_request(mddev, max_sectors, &skipped);
if (!test_bit(MD_RECOVERY_CHECK, &mddev->recovery) && if (!test_bit(MD_RECOVERY_CHECK, &mddev->recovery) &&
...@@ -8147,9 +8142,15 @@ void md_do_sync(struct md_thread *thread) ...@@ -8147,9 +8142,15 @@ void md_do_sync(struct md_thread *thread)
set_bit(MD_CHANGE_DEVS, &mddev->flags); set_bit(MD_CHANGE_DEVS, &mddev->flags);
if (mddev_is_clustered(mddev) && if (mddev_is_clustered(mddev) &&
test_bit(MD_RECOVERY_INTR, &mddev->recovery) && ret == 0) {
!cluster_resync_finished) /* set CHANGE_PENDING here since maybe another
* update is needed, so other nodes are informed */
set_bit(MD_CHANGE_PENDING, &mddev->flags);
md_wakeup_thread(mddev->thread);
wait_event(mddev->sb_wait,
!test_bit(MD_CHANGE_PENDING, &mddev->flags));
md_cluster_ops->resync_finish(mddev); md_cluster_ops->resync_finish(mddev);
}
spin_lock(&mddev->lock); spin_lock(&mddev->lock);
if (!test_bit(MD_RECOVERY_INTR, &mddev->recovery)) { if (!test_bit(MD_RECOVERY_INTR, &mddev->recovery)) {
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册