|
|
21ab4e |
From 2588152f410c133c408d182f04b8cc5759c1af3e Mon Sep 17 00:00:00 2001
|
|
|
21ab4e |
From: Ravishankar N <ravishankar@redhat.com>
|
|
|
21ab4e |
Date: Wed, 10 May 2017 10:03:08 +0530
|
|
|
21ab4e |
Subject: [PATCH 437/473] afr: propagate correct errno for fop failures in
|
|
|
21ab4e |
arbiter
|
|
|
21ab4e |
|
|
|
21ab4e |
Backport of: https://review.gluster.org/17235
|
|
|
21ab4e |
|
|
|
21ab4e |
Problem:
|
|
|
21ab4e |
If quorum is not met in fop cbk, arbiter sends an ENOTCONN error to the
|
|
|
21ab4e |
upper xlators. In a VM workload with sharding enabled, this was leading
|
|
|
21ab4e |
to the VM pausing when replace-brick was performed as described in the BZ.
|
|
|
21ab4e |
|
|
|
21ab4e |
Fix:
|
|
|
21ab4e |
Move the fop cbk arbitration logic to afr_handle_quorum() because in
|
|
|
21ab4e |
normal replica volumes, that is the function that has the quorum and
|
|
|
21ab4e |
errno checks in the fop cbk path before doing a post-op.
|
|
|
21ab4e |
|
|
|
21ab4e |
Thanks to Pranith for suggesting this approach.
|
|
|
21ab4e |
|
|
|
21ab4e |
Change-Id: I4fffa3b34a4017eb950b4e1c55b943441eacee21
|
|
|
21ab4e |
BUG: 1443980
|
|
|
21ab4e |
Signed-off-by: Ravishankar N <ravishankar@redhat.com>
|
|
|
21ab4e |
Reviewed-on: https://code.engineering.redhat.com/gerrit/106202
|
|
|
21ab4e |
---
|
|
|
21ab4e |
xlators/cluster/afr/src/afr-dir-write.c | 1 -
|
|
|
21ab4e |
xlators/cluster/afr/src/afr-inode-write.c | 1 -
|
|
|
21ab4e |
xlators/cluster/afr/src/afr-transaction.c | 23 ++++++++++++-----------
|
|
|
21ab4e |
xlators/cluster/afr/src/afr-transaction.h | 2 --
|
|
|
21ab4e |
4 files changed, 12 insertions(+), 15 deletions(-)
|
|
|
21ab4e |
|
|
|
21ab4e |
diff --git a/xlators/cluster/afr/src/afr-dir-write.c b/xlators/cluster/afr/src/afr-dir-write.c
|
|
|
21ab4e |
index 8e483c3..9099b8c 100644
|
|
|
21ab4e |
--- a/xlators/cluster/afr/src/afr-dir-write.c
|
|
|
21ab4e |
+++ b/xlators/cluster/afr/src/afr-dir-write.c
|
|
|
21ab4e |
@@ -183,7 +183,6 @@ __afr_dir_write_finalize (call_frame_t *frame, xlator_t *this)
|
|
|
21ab4e |
}
|
|
|
21ab4e |
}
|
|
|
21ab4e |
|
|
|
21ab4e |
- afr_txn_arbitrate_fop_cbk (frame, this);
|
|
|
21ab4e |
}
|
|
|
21ab4e |
|
|
|
21ab4e |
|
|
|
21ab4e |
diff --git a/xlators/cluster/afr/src/afr-inode-write.c b/xlators/cluster/afr/src/afr-inode-write.c
|
|
|
21ab4e |
index 200b420..04bbf21 100644
|
|
|
21ab4e |
--- a/xlators/cluster/afr/src/afr-inode-write.c
|
|
|
21ab4e |
+++ b/xlators/cluster/afr/src/afr-inode-write.c
|
|
|
21ab4e |
@@ -131,7 +131,6 @@ __afr_inode_write_finalize (call_frame_t *frame, xlator_t *this)
|
|
|
21ab4e |
}
|
|
|
21ab4e |
}
|
|
|
21ab4e |
|
|
|
21ab4e |
- afr_txn_arbitrate_fop_cbk (frame, this);
|
|
|
21ab4e |
afr_set_in_flight_sb_status (this, local, local->inode);
|
|
|
21ab4e |
}
|
|
|
21ab4e |
|
|
|
21ab4e |
diff --git a/xlators/cluster/afr/src/afr-transaction.c b/xlators/cluster/afr/src/afr-transaction.c
|
|
|
21ab4e |
index a3cb766..644ebe2 100644
|
|
|
21ab4e |
--- a/xlators/cluster/afr/src/afr-transaction.c
|
|
|
21ab4e |
+++ b/xlators/cluster/afr/src/afr-transaction.c
|
|
|
21ab4e |
@@ -303,22 +303,21 @@ afr_compute_pre_op_sources (call_frame_t *frame, xlator_t *this)
|
|
|
21ab4e |
}
|
|
|
21ab4e |
}
|
|
|
21ab4e |
|
|
|
21ab4e |
-void
|
|
|
21ab4e |
-afr_txn_arbitrate_fop_cbk (call_frame_t *frame, xlator_t *this)
|
|
|
21ab4e |
+gf_boolean_t
|
|
|
21ab4e |
+afr_has_arbiter_fop_cbk_quorum (call_frame_t *frame)
|
|
|
21ab4e |
{
|
|
|
21ab4e |
afr_local_t *local = NULL;
|
|
|
21ab4e |
afr_private_t *priv = NULL;
|
|
|
21ab4e |
+ xlator_t *this = NULL;
|
|
|
21ab4e |
gf_boolean_t fop_failed = _gf_false;
|
|
|
21ab4e |
unsigned char *pre_op_sources = NULL;
|
|
|
21ab4e |
int i = 0;
|
|
|
21ab4e |
|
|
|
21ab4e |
local = frame->local;
|
|
|
21ab4e |
+ this = frame->this;
|
|
|
21ab4e |
priv = this->private;
|
|
|
21ab4e |
pre_op_sources = local->transaction.pre_op_sources;
|
|
|
21ab4e |
|
|
|
21ab4e |
- if (priv->arbiter_count != 1 || local->op_ret < 0)
|
|
|
21ab4e |
- return;
|
|
|
21ab4e |
-
|
|
|
21ab4e |
/* If the fop failed on the brick, it is not a source. */
|
|
|
21ab4e |
for (i = 0; i < priv->child_count; i++)
|
|
|
21ab4e |
if (local->transaction.failed_subvols[i])
|
|
|
21ab4e |
@@ -334,12 +333,10 @@ afr_txn_arbitrate_fop_cbk (call_frame_t *frame, xlator_t *this)
|
|
|
21ab4e |
break;
|
|
|
21ab4e |
}
|
|
|
21ab4e |
|
|
|
21ab4e |
- if (fop_failed) {
|
|
|
21ab4e |
- local->op_ret = -1;
|
|
|
21ab4e |
- local->op_errno = ENOTCONN;
|
|
|
21ab4e |
- }
|
|
|
21ab4e |
+ if (fop_failed)
|
|
|
21ab4e |
+ return _gf_false;
|
|
|
21ab4e |
|
|
|
21ab4e |
- return;
|
|
|
21ab4e |
+ return _gf_true;
|
|
|
21ab4e |
}
|
|
|
21ab4e |
|
|
|
21ab4e |
void
|
|
|
21ab4e |
@@ -787,8 +784,12 @@ afr_handle_quorum (call_frame_t *frame)
|
|
|
21ab4e |
* no split-brain with the fix. The problem is eliminated completely.
|
|
|
21ab4e |
*/
|
|
|
21ab4e |
|
|
|
21ab4e |
- if (afr_has_fop_cbk_quorum (frame))
|
|
|
21ab4e |
+ if (priv->arbiter_count) {
|
|
|
21ab4e |
+ if (afr_has_arbiter_fop_cbk_quorum (frame))
|
|
|
21ab4e |
+ return;
|
|
|
21ab4e |
+ } else if (afr_has_fop_cbk_quorum (frame)) {
|
|
|
21ab4e |
return;
|
|
|
21ab4e |
+ }
|
|
|
21ab4e |
|
|
|
21ab4e |
for (i = 0; i < priv->child_count; i++) {
|
|
|
21ab4e |
if (local->transaction.pre_op[i])
|
|
|
21ab4e |
diff --git a/xlators/cluster/afr/src/afr-transaction.h b/xlators/cluster/afr/src/afr-transaction.h
|
|
|
21ab4e |
index db82456..dd19e5b 100644
|
|
|
21ab4e |
--- a/xlators/cluster/afr/src/afr-transaction.h
|
|
|
21ab4e |
+++ b/xlators/cluster/afr/src/afr-transaction.h
|
|
|
21ab4e |
@@ -16,8 +16,6 @@
|
|
|
21ab4e |
void
|
|
|
21ab4e |
afr_transaction_fop_failed (call_frame_t *frame, xlator_t *this,
|
|
|
21ab4e |
int child_index);
|
|
|
21ab4e |
-void
|
|
|
21ab4e |
-afr_txn_arbitrate_fop_cbk (call_frame_t *frame, xlator_t *this);
|
|
|
21ab4e |
|
|
|
21ab4e |
int
|
|
|
21ab4e |
afr_lock_server_count (afr_private_t *priv, afr_transaction_type type);
|
|
|
21ab4e |
--
|
|
|
21ab4e |
1.8.3.1
|
|
|
21ab4e |
|