md/raid10: Fix raid10 replace hang when new added disk faulty

author Alex Wu <alexwu@synology.com>

Fri, 21 Sep 2018 08:05:03 +0000 (16:05 +0800)

committer Shaohua Li <shli@fb.com>

Fri, 28 Sep 2018 18:42:47 +0000 (11:42 -0700)
author Alex Wu <alexwu@synology.com>
Fri, 21 Sep 2018 08:05:03 +0000 (16:05 +0800)
committer Shaohua Li <shli@fb.com>
Fri, 28 Sep 2018 18:42:47 +0000 (11:42 -0700)
diff --git a/drivers/md/raid10.c b/drivers/md/raid10.c
index d6f7978..749848b 100644
--- a/drivers/md/raid10.c
+++ b/drivers/md/raid10.c
@@ -3079,6 +3079,8 @@ static sector_t raid10_sync_request(struct mddev *mddev, sector_t sector_nr,
                         sector_t sect;
                         int must_sync;
                         int any_working;
+                       int need_recover = 0;
+                       int need_replace = 0;
                         struct raid10_info *mirror = &conf->mirrors[i];
                         struct md_rdev *mrdev, *mreplace;
  
@@ -3086,11 +3088,15 @@ static sector_t raid10_sync_request(struct mddev *mddev, sector_t sector_nr,
                         mrdev = rcu_dereference(mirror->rdev);
                         mreplace = rcu_dereference(mirror->replacement);
  
-                       if ((mrdev == NULL ||
-                            test_bit(Faulty, &mrdev->flags) ||
-                            test_bit(In_sync, &mrdev->flags)) &&
-                           (mreplace == NULL ||
-                            test_bit(Faulty, &mreplace->flags))) {
+                       if (mrdev != NULL &&
+                           !test_bit(Faulty, &mrdev->flags) &&
+                           !test_bit(In_sync, &mrdev->flags))
+                               need_recover = 1;
+                       if (mreplace != NULL &&
+                           !test_bit(Faulty, &mreplace->flags))
+                               need_replace = 1;
+
+                       if (!need_recover && !need_replace) {
                                 rcu_read_unlock();
                                 continue;
                         }
@@ -3213,7 +3219,7 @@ static sector_t raid10_sync_request(struct mddev *mddev, sector_t sector_nr,
                                 r10_bio->devs[1].devnum = i;
                                 r10_bio->devs[1].addr = to_addr;
  
-                               if (!test_bit(In_sync, &mrdev->flags)) {
+                               if (need_recover) {
                                         bio = r10_bio->devs[1].bio;
                                         bio->bi_next = biolist;
                                         biolist = bio;
@@ -3230,16 +3236,11 @@ static sector_t raid10_sync_request(struct mddev *mddev, sector_t sector_nr,
                                 bio = r10_bio->devs[1].repl_bio;
                                 if (bio)
                                         bio->bi_end_io = NULL;
-                               /* Note: if mreplace != NULL, then bio
+                               /* Note: if need_replace, then bio
                                  * cannot be NULL as r10buf_pool_alloc will
                                  * have allocated it.
-                                * So the second test here is pointless.
-                                * But it keeps semantic-checkers happy, and
-                                * this comment keeps human reviewers
-                                * happy.
                                  */
-                               if (mreplace == NULL || bio == NULL ||
-                                   test_bit(Faulty, &mreplace->flags))
+                               if (!need_replace)
                                         break;
                                 bio->bi_next = biolist;
                                 biolist = bio;
author	Alex Wu <alexwu@synology.com>
	Fri, 21 Sep 2018 08:05:03 +0000 (16:05 +0800)
committer	Shaohua Li <shli@fb.com>
	Fri, 28 Sep 2018 18:42:47 +0000 (11:42 -0700)