Skip to content

Commit dfcc34c

Browse files
nhdaileyliu-song-6
authored andcommitted
md/raid1: don't clear bitmap bits on interrupted recovery.
sync_request_write no longer submits writes to a Faulty device. This has the unfortunate side effect that bitmap bits can be incorrectly cleared if a recovery is interrupted (previously, end_sync_write would have prevented this). This means the next recovery may not copy everything it should, potentially corrupting data. Add a function for doing the proper md_bitmap_end_sync, called from end_sync_write and the Faulty case in sync_request_write. backport note to 4.14: s/md_bitmap_end_sync/bitmap_end_sync Cc: stable@vger.kernel.org 4.14+ Fixes: 0c9d5b1 ("md/raid1: avoid reusing a resync bio after error handling.") Reviewed-by: Jack Wang <jinpu.wang@cloud.ionos.com> Tested-by: Jack Wang <jinpu.wang@cloud.ionos.com> Signed-off-by: Nate Dailey <nate.dailey@stratus.com> Signed-off-by: Song Liu <songliubraving@fb.com>
1 parent 96d7cb9 commit dfcc34c

File tree

1 file changed

+18
-10
lines changed

1 file changed

+18
-10
lines changed

drivers/md/raid1.c

Lines changed: 18 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1863,6 +1863,20 @@ static void end_sync_read(struct bio *bio)
18631863
reschedule_retry(r1_bio);
18641864
}
18651865

1866+
static void abort_sync_write(struct mddev *mddev, struct r1bio *r1_bio)
1867+
{
1868+
sector_t sync_blocks = 0;
1869+
sector_t s = r1_bio->sector;
1870+
long sectors_to_go = r1_bio->sectors;
1871+
1872+
/* make sure these bits don't get cleared. */
1873+
do {
1874+
md_bitmap_end_sync(mddev->bitmap, s, &sync_blocks, 1);
1875+
s += sync_blocks;
1876+
sectors_to_go -= sync_blocks;
1877+
} while (sectors_to_go > 0);
1878+
}
1879+
18661880
static void end_sync_write(struct bio *bio)
18671881
{
18681882
int uptodate = !bio->bi_status;
@@ -1874,15 +1888,7 @@ static void end_sync_write(struct bio *bio)
18741888
struct md_rdev *rdev = conf->mirrors[find_bio_disk(r1_bio, bio)].rdev;
18751889

18761890
if (!uptodate) {
1877-
sector_t sync_blocks = 0;
1878-
sector_t s = r1_bio->sector;
1879-
long sectors_to_go = r1_bio->sectors;
1880-
/* make sure these bits doesn't get cleared. */
1881-
do {
1882-
md_bitmap_end_sync(mddev->bitmap, s, &sync_blocks, 1);
1883-
s += sync_blocks;
1884-
sectors_to_go -= sync_blocks;
1885-
} while (sectors_to_go > 0);
1891+
abort_sync_write(mddev, r1_bio);
18861892
set_bit(WriteErrorSeen, &rdev->flags);
18871893
if (!test_and_set_bit(WantReplacement, &rdev->flags))
18881894
set_bit(MD_RECOVERY_NEEDED, &
@@ -2172,8 +2178,10 @@ static void sync_request_write(struct mddev *mddev, struct r1bio *r1_bio)
21722178
(i == r1_bio->read_disk ||
21732179
!test_bit(MD_RECOVERY_SYNC, &mddev->recovery))))
21742180
continue;
2175-
if (test_bit(Faulty, &conf->mirrors[i].rdev->flags))
2181+
if (test_bit(Faulty, &conf->mirrors[i].rdev->flags)) {
2182+
abort_sync_write(mddev, r1_bio);
21762183
continue;
2184+
}
21772185

21782186
bio_set_op_attrs(wbio, REQ_OP_WRITE, 0);
21792187
if (test_bit(FailFast, &conf->mirrors[i].rdev->flags))

0 commit comments

Comments
 (0)