dcavalca / rpms / mdadm

Forked from rpms/mdadm 3 years ago
Clone

Blame SOURCES/Retry-HOT_REMOVE_DISK-a-few-times.patch

2c1b57
From 2dd271fe7041c2f7036939cf6917c0578b92fefe Mon Sep 17 00:00:00 2001
2c1b57
From: NeilBrown <neilb@suse.com>
2c1b57
Date: Mon, 27 Mar 2017 12:50:16 +1100
2c1b57
Subject: [RHEL7.5 PATCH 020/169] Retry HOT_REMOVE_DISK a few times.
2c1b57
2c1b57
HOT_REMOVE_DISK can fail with EBUSY if there are outstanding
2c1b57
IO requests that have not completed yet.  It can sometimes
2c1b57
be helpful to wait a little while for these to complete.
2c1b57
2c1b57
We already do this in impose_level() when reshaping a device,
2c1b57
but not in Manage.c in response to an explicit --remove request.
2c1b57
2c1b57
So create hot_remove_disk() to centralize this code, and call it
2c1b57
wherever it makes sense to wait for a HOT_REMOVE_DISK to succeed.
2c1b57
2c1b57
Signed-off-by: NeilBrown <neilb@suse.com>
2c1b57
Signed-off-by: Jes Sorensen <Jes.Sorensen@gmail.com>
2c1b57
---
2c1b57
 Grow.c   |  9 +--------
2c1b57
 Manage.c |  4 ++--
2c1b57
 mdadm.h  |  1 +
2c1b57
 util.c   | 18 ++++++++++++++++++
2c1b57
 4 files changed, 22 insertions(+), 10 deletions(-)
2c1b57
2c1b57
diff --git a/Grow.c b/Grow.c
2c1b57
index 455c5f9..218a706 100755
2c1b57
--- a/Grow.c
2c1b57
+++ b/Grow.c
2c1b57
@@ -2736,7 +2736,6 @@ static int impose_level(int fd, int level, char *devname, int verbose)
2c1b57
 		for (d = 0, found = 0;
2c1b57
 		     d < MAX_DISKS && found < array.nr_disks;
2c1b57
 		     d++) {
2c1b57
-			int cnt;
2c1b57
 			mdu_disk_info_t disk;
2c1b57
 			disk.number = d;
2c1b57
 			if (ioctl(fd, GET_DISK_INFO, &disk) < 0)
2c1b57
@@ -2750,13 +2749,7 @@ static int impose_level(int fd, int level, char *devname, int verbose)
2c1b57
 				continue;
2c1b57
 			ioctl(fd, SET_DISK_FAULTY,
2c1b57
 			      makedev(disk.major, disk.minor));
2c1b57
-			cnt = 5;
2c1b57
-			while (ioctl(fd, HOT_REMOVE_DISK,
2c1b57
-				     makedev(disk.major, disk.minor)) < 0
2c1b57
-			       && errno == EBUSY
2c1b57
-			       && cnt--) {
2c1b57
-				usleep(10000);
2c1b57
-			}
2c1b57
+			hot_remove_disk(fd, makedev(disk.major, disk.minor));
2c1b57
 		}
2c1b57
 	}
2c1b57
 	c = map_num(pers, level);
2c1b57
diff --git a/Manage.c b/Manage.c
2c1b57
index 5c3d2b9..9139f96 100644
2c1b57
--- a/Manage.c
2c1b57
+++ b/Manage.c
2c1b57
@@ -1183,7 +1183,7 @@ int Manage_remove(struct supertype *tst, int fd, struct mddev_dev *dv,
2c1b57
 		else
2c1b57
 			err = 0;
2c1b57
 	} else {
2c1b57
-		err = ioctl(fd, HOT_REMOVE_DISK, rdev);
2c1b57
+		err = hot_remove_disk(fd, rdev);
2c1b57
 		if (err && errno == ENODEV) {
2c1b57
 			/* Old kernels rejected this if no personality
2c1b57
 			 * is registered */
2c1b57
@@ -1607,7 +1607,7 @@ int Manage_subdevs(char *devname, int fd,
2c1b57
 
2c1b57
 			if (dv->disposition == 'F')
2c1b57
 				/* Need to remove first */
2c1b57
-				ioctl(fd, HOT_REMOVE_DISK, rdev);
2c1b57
+				hot_remove_disk(fd, rdev);
2c1b57
 			/* Make sure it isn't in use (in 2.6 or later) */
2c1b57
 			tfd = dev_open(dv->devname, O_RDONLY|O_EXCL);
2c1b57
 			if (tfd >= 0) {
2c1b57
diff --git a/mdadm.h b/mdadm.h
2c1b57
index 91fd9eb..5bcfb86 100644
2c1b57
--- a/mdadm.h
2c1b57
+++ b/mdadm.h
2c1b57
@@ -1476,6 +1476,7 @@ extern int add_disk(int mdfd, struct supertype *st,
2c1b57
 		    struct mdinfo *sra, struct mdinfo *info);
2c1b57
 extern int remove_disk(int mdfd, struct supertype *st,
2c1b57
 		       struct mdinfo *sra, struct mdinfo *info);
2c1b57
+extern int hot_remove_disk(int mdfd, unsigned long dev);
2c1b57
 extern int set_array_info(int mdfd, struct supertype *st, struct mdinfo *info);
2c1b57
 unsigned long long min_recovery_start(struct mdinfo *array);
2c1b57
 
2c1b57
diff --git a/util.c b/util.c
2c1b57
index 32bd909..d09a7e2 100644
2c1b57
--- a/util.c
2c1b57
+++ b/util.c
2c1b57
@@ -1795,6 +1795,24 @@ int remove_disk(int mdfd, struct supertype *st,
2c1b57
 	return rv;
2c1b57
 }
2c1b57
 
2c1b57
+int hot_remove_disk(int mdfd, unsigned long dev)
2c1b57
+{
2c1b57
+	int cnt = 5;
2c1b57
+	int ret;
2c1b57
+
2c1b57
+	/* HOT_REMOVE_DISK can fail with EBUSY if there are
2c1b57
+	 * outstanding IO requests to the device.
2c1b57
+	 * In this case, it can be helpful to wait a little while,
2c1b57
+	 * up to 50 msec (5 retries of 10 msec each), for that IO to flush.
2c1b57
+	 */
2c1b57
+	while ((ret = ioctl(mdfd, HOT_REMOVE_DISK, dev)) == -1 &&
2c1b57
+	       errno == EBUSY &&
2c1b57
+	       cnt-- > 0)
2c1b57
+		usleep(10000);
2c1b57
+
2c1b57
+	return ret;
2c1b57
+}
2c1b57
+
2c1b57
 int set_array_info(int mdfd, struct supertype *st, struct mdinfo *info)
2c1b57
 {
2c1b57
 	/* Initialise kernel's knowledge of array.
2c1b57
-- 
2c1b57
2.7.4
2c1b57