|
|
e3c68b |
From 9912a432dc3493007462f76c5933d04a160814ae Mon Sep 17 00:00:00 2001
|
|
|
e3c68b |
From: Pranith Kumar K <pkarampu@redhat.com>
|
|
|
e3c68b |
Date: Thu, 20 Jun 2019 17:05:49 +0530
|
|
|
e3c68b |
Subject: [PATCH 198/221] cluster/ec: Prevent double pre-op xattrops
|
|
|
e3c68b |
|
|
|
e3c68b |
Problem:
|
|
|
e3c68b |
Race:
|
|
|
e3c68b |
Thread-1 Thread-2
|
|
|
e3c68b |
1) Does ec_get_size_version() to perform
|
|
|
e3c68b |
pre-op fxattrop as part of write-1
|
|
|
e3c68b |
2) Calls ec_set_dirty_flag() in
|
|
|
e3c68b |
ec_get_size_version() for write-2.
|
|
|
e3c68b |
This sets dirty[] to 1
|
|
|
e3c68b |
3) Completes executing
|
|
|
e3c68b |
ec_prepare_update_cbk leading to
|
|
|
e3c68b |
ctx->dirty[] = '1'
|
|
|
e3c68b |
4) Takes LOCK(inode->lock) to check if there are
|
|
|
e3c68b |
any flags and sets dirty-flag because
|
|
|
e3c68b |
lock->waiting_flag is 0 now. This leads to
|
|
|
e3c68b |
fxattrop to increment on-disk dirty[] to '2'
|
|
|
e3c68b |
|
|
|
e3c68b |
At the end of the writes the file will be marked for heal even when it doesn't need heal.
|
|
|
e3c68b |
|
|
|
e3c68b |
Fix:
|
|
|
e3c68b |
Perform ec_set_dirty_flag() and other checks inside LOCK() to prevent dirty[] to be marked
|
|
|
e3c68b |
as '1' in step 2) above
|
|
|
e3c68b |
|
|
|
e3c68b |
> Upstream-patch: https://review.gluster.org/c/glusterfs/+/22907
|
|
|
e3c68b |
|
|
|
e3c68b |
fixes: bz#1600918
|
|
|
e3c68b |
Change-Id: Icac2ab39c0b1e7e154387800fbededc561612865
|
|
|
e3c68b |
Signed-off-by: Pranith Kumar K <pkarampu@redhat.com>
|
|
|
e3c68b |
Reviewed-on: https://code.engineering.redhat.com/gerrit/174385
|
|
|
e3c68b |
Reviewed-by: Atin Mukherjee <amukherj@redhat.com>
|
|
|
e3c68b |
Tested-by: Atin Mukherjee <amukherj@redhat.com>
|
|
|
e3c68b |
---
|
|
|
e3c68b |
tests/basic/ec/ec-dirty-flags.t | 23 +++++++++++++++++++++++
|
|
|
e3c68b |
xlators/cluster/ec/src/ec-common.c | 13 +++++++------
|
|
|
e3c68b |
2 files changed, 30 insertions(+), 6 deletions(-)
|
|
|
e3c68b |
create mode 100644 tests/basic/ec/ec-dirty-flags.t
|
|
|
e3c68b |
|
|
|
e3c68b |
diff --git a/tests/basic/ec/ec-dirty-flags.t b/tests/basic/ec/ec-dirty-flags.t
|
|
|
e3c68b |
new file mode 100644
|
|
|
e3c68b |
index 0000000..68e6610
|
|
|
e3c68b |
--- /dev/null
|
|
|
e3c68b |
+++ b/tests/basic/ec/ec-dirty-flags.t
|
|
|
e3c68b |
@@ -0,0 +1,23 @@
|
|
|
e3c68b |
+#!/bin/bash
|
|
|
e3c68b |
+
|
|
|
e3c68b |
+. $(dirname $0)/../../include.rc
|
|
|
e3c68b |
+. $(dirname $0)/../../volume.rc
|
|
|
e3c68b |
+
|
|
|
e3c68b |
+# This checks if the fop keeps the dirty flags settings correctly after
|
|
|
e3c68b |
+# finishing the fop.
|
|
|
e3c68b |
+
|
|
|
e3c68b |
+cleanup
|
|
|
e3c68b |
+TEST glusterd
|
|
|
e3c68b |
+TEST pidof glusterd
|
|
|
e3c68b |
+TEST $CLI volume create $V0 disperse 3 redundancy 1 $H0:$B0/${V0}{0..2}
|
|
|
e3c68b |
+TEST $CLI volume heal $V0 disable
|
|
|
e3c68b |
+TEST $CLI volume start $V0
|
|
|
e3c68b |
+
|
|
|
e3c68b |
+TEST $GFS --volfile-id=/$V0 --volfile-server=$H0 $M0;
|
|
|
e3c68b |
+EXPECT_WITHIN $CHILD_UP_TIMEOUT "3" ec_child_up_count $V0 0
|
|
|
e3c68b |
+cd $M0
|
|
|
e3c68b |
+for i in {1..1000}; do dd if=/dev/zero of=file-${i} bs=512k count=2; done
|
|
|
e3c68b |
+cd -
|
|
|
e3c68b |
+EXPECT "^0$" get_pending_heal_count $V0
|
|
|
e3c68b |
+
|
|
|
e3c68b |
+cleanup
|
|
|
e3c68b |
diff --git a/xlators/cluster/ec/src/ec-common.c b/xlators/cluster/ec/src/ec-common.c
|
|
|
e3c68b |
index 9cc6395..35c2256 100644
|
|
|
e3c68b |
--- a/xlators/cluster/ec/src/ec-common.c
|
|
|
e3c68b |
+++ b/xlators/cluster/ec/src/ec-common.c
|
|
|
e3c68b |
@@ -1405,6 +1405,10 @@ ec_get_size_version(ec_lock_link_t *link)
|
|
|
e3c68b |
!ec_is_data_fop(fop->id))
|
|
|
e3c68b |
link->optimistic_changelog = _gf_true;
|
|
|
e3c68b |
|
|
|
e3c68b |
+ memset(&loc, 0, sizeof(loc));
|
|
|
e3c68b |
+
|
|
|
e3c68b |
+ LOCK(&lock->loc.inode->lock);
|
|
|
e3c68b |
+
|
|
|
e3c68b |
set_dirty = ec_set_dirty_flag(link, ctx, dirty);
|
|
|
e3c68b |
|
|
|
e3c68b |
/* If ec metadata has already been retrieved, do not try again. */
|
|
|
e3c68b |
@@ -1412,20 +1416,16 @@ ec_get_size_version(ec_lock_link_t *link)
|
|
|
e3c68b |
if (ec_is_data_fop(fop->id)) {
|
|
|
e3c68b |
fop->healing |= lock->healing;
|
|
|
e3c68b |
}
|
|
|
e3c68b |
- return;
|
|
|
e3c68b |
+ goto unlock;
|
|
|
e3c68b |
}
|
|
|
e3c68b |
|
|
|
e3c68b |
/* Determine if there's something we need to retrieve for the current
|
|
|
e3c68b |
* operation. */
|
|
|
e3c68b |
if (!set_dirty && !lock->query && (lock->loc.inode->ia_type != IA_IFREG) &&
|
|
|
e3c68b |
(lock->loc.inode->ia_type != IA_INVAL)) {
|
|
|
e3c68b |
- return;
|
|
|
e3c68b |
+ goto unlock;
|
|
|
e3c68b |
}
|
|
|
e3c68b |
|
|
|
e3c68b |
- memset(&loc, 0, sizeof(loc));
|
|
|
e3c68b |
-
|
|
|
e3c68b |
- LOCK(&lock->loc.inode->lock);
|
|
|
e3c68b |
-
|
|
|
e3c68b |
changed_flags = ec_set_xattrop_flags_and_params(lock, link, dirty);
|
|
|
e3c68b |
if (link->waiting_flags) {
|
|
|
e3c68b |
/* This fop needs to wait until all its flags are cleared which
|
|
|
e3c68b |
@@ -1436,6 +1436,7 @@ ec_get_size_version(ec_lock_link_t *link)
|
|
|
e3c68b |
GF_ASSERT(!changed_flags);
|
|
|
e3c68b |
}
|
|
|
e3c68b |
|
|
|
e3c68b |
+unlock:
|
|
|
e3c68b |
UNLOCK(&lock->loc.inode->lock);
|
|
|
e3c68b |
|
|
|
e3c68b |
if (!changed_flags)
|
|
|
e3c68b |
--
|
|
|
e3c68b |
1.8.3.1
|
|
|
e3c68b |
|