Blame SOURCES/Retry-HOT_REMOVE_DISK-a-few-times.patch

b7f731
From 2dd271fe7041c2f7036939cf6917c0578b92fefe Mon Sep 17 00:00:00 2001
b7f731
From: NeilBrown <neilb@suse.com>
b7f731
Date: Mon, 27 Mar 2017 12:50:16 +1100
b7f731
Subject: [RHEL7.5 PATCH 020/169] Retry HOT_REMOVE_DISK a few times.
b7f731
b7f731
HOT_REMOVE_DISK can fail with EBUSY if there are outstanding
b7f731
IO requests that have not completed yet.  It can sometimes
b7f731
be helpful to wait a little while for these to complete.
b7f731
b7f731
We already do this in impose_level() when reshaping a device,
b7f731
but not in Manage.c in response to an explicit --remove request.
b7f731
b7f731
So create hot_remove_disk() to centralise this code, and call it
b7f731
wherever it makes sense to wait for a HOT_REMOVE_DISK to succeed.
b7f731
b7f731
Signed-off-by: NeilBrown <neilb@suse.com>
b7f731
Signed-off-by: Jes Sorensen <Jes.Sorensen@gmail.com>
b7f731
---
b7f731
 Grow.c   |  9 +--------
b7f731
 Manage.c |  4 ++--
b7f731
 mdadm.h  |  1 +
b7f731
 util.c   | 18 ++++++++++++++++++
b7f731
 4 files changed, 22 insertions(+), 10 deletions(-)
b7f731
b7f731
diff --git a/Grow.c b/Grow.c
b7f731
index 455c5f9..218a706 100755
b7f731
--- a/Grow.c
b7f731
+++ b/Grow.c
b7f731
@@ -2736,7 +2736,6 @@ static int impose_level(int fd, int level, char *devname, int verbose)
b7f731
 		for (d = 0, found = 0;
b7f731
 		     d < MAX_DISKS && found < array.nr_disks;
b7f731
 		     d++) {
b7f731
-			int cnt;
b7f731
 			mdu_disk_info_t disk;
b7f731
 			disk.number = d;
b7f731
 			if (ioctl(fd, GET_DISK_INFO, &disk) < 0)
b7f731
@@ -2750,13 +2749,7 @@ static int impose_level(int fd, int level, char *devname, int verbose)
b7f731
 				continue;
b7f731
 			ioctl(fd, SET_DISK_FAULTY,
b7f731
 			      makedev(disk.major, disk.minor));
b7f731
-			cnt = 5;
b7f731
-			while (ioctl(fd, HOT_REMOVE_DISK,
b7f731
-				     makedev(disk.major, disk.minor)) < 0
b7f731
-			       && errno == EBUSY
b7f731
-			       && cnt--) {
b7f731
-				usleep(10000);
b7f731
-			}
b7f731
+			hot_remove_disk(fd, makedev(disk.major, disk.minor));
b7f731
 		}
b7f731
 	}
b7f731
 	c = map_num(pers, level);
b7f731
diff --git a/Manage.c b/Manage.c
b7f731
index 5c3d2b9..9139f96 100644
b7f731
--- a/Manage.c
b7f731
+++ b/Manage.c
b7f731
@@ -1183,7 +1183,7 @@ int Manage_remove(struct supertype *tst, int fd, struct mddev_dev *dv,
b7f731
 		else
b7f731
 			err = 0;
b7f731
 	} else {
b7f731
-		err = ioctl(fd, HOT_REMOVE_DISK, rdev);
b7f731
+		err = hot_remove_disk(fd, rdev);
b7f731
 		if (err && errno == ENODEV) {
b7f731
 			/* Old kernels rejected this if no personality
b7f731
 			 * is registered */
b7f731
@@ -1607,7 +1607,7 @@ int Manage_subdevs(char *devname, int fd,
b7f731
 
b7f731
 			if (dv->disposition == 'F')
b7f731
 				/* Need to remove first */
b7f731
-				ioctl(fd, HOT_REMOVE_DISK, rdev);
b7f731
+				hot_remove_disk(fd, rdev);
b7f731
 			/* Make sure it isn't in use (in 2.6 or later) */
b7f731
 			tfd = dev_open(dv->devname, O_RDONLY|O_EXCL);
b7f731
 			if (tfd >= 0) {
b7f731
diff --git a/mdadm.h b/mdadm.h
b7f731
index 91fd9eb..5bcfb86 100644
b7f731
--- a/mdadm.h
b7f731
+++ b/mdadm.h
b7f731
@@ -1476,6 +1476,7 @@ extern int add_disk(int mdfd, struct supertype *st,
b7f731
 		    struct mdinfo *sra, struct mdinfo *info);
b7f731
 extern int remove_disk(int mdfd, struct supertype *st,
b7f731
 		       struct mdinfo *sra, struct mdinfo *info);
b7f731
+extern int hot_remove_disk(int mdfd, unsigned long dev);
b7f731
 extern int set_array_info(int mdfd, struct supertype *st, struct mdinfo *info);
b7f731
 unsigned long long min_recovery_start(struct mdinfo *array);
b7f731
 
b7f731
diff --git a/util.c b/util.c
b7f731
index 32bd909..d09a7e2 100644
b7f731
--- a/util.c
b7f731
+++ b/util.c
b7f731
@@ -1795,6 +1795,24 @@ int remove_disk(int mdfd, struct supertype *st,
b7f731
 	return rv;
b7f731
 }
b7f731
 
b7f731
+int hot_remove_disk(int mdfd, unsigned long dev)
b7f731
+{
b7f731
+	int cnt = 5;
b7f731
+	int ret;
b7f731
+
b7f731
+	/* HOT_REMOVE_DISK can fail with EBUSY if there are
b7f731
+	 * outstanding IO requests to the device.
b7f731
+	 * In this case, it can be helpful to wait a little while,
b7f731
+	 * up to 50 msec (five 10 msec sleeps), for that IO to flush.
b7f731
+	 */
b7f731
+	while ((ret = ioctl(mdfd, HOT_REMOVE_DISK, dev)) == -1 &&
b7f731
+	       errno == EBUSY &&
b7f731
+	       cnt-- > 0)
b7f731
+		usleep(10000);
b7f731
+
b7f731
+	return ret;
b7f731
+}
b7f731
+
b7f731
 int set_array_info(int mdfd, struct supertype *st, struct mdinfo *info)
b7f731
 {
b7f731
 	/* Initialise kernel's knowledge of array.
b7f731
-- 
b7f731
2.7.4
b7f731