Tree - rpms/glusterfs - CentOS Git server

rpms / glusterfs

Blame SOURCES/0300-glusterd-Don-t-allow-remove-brick-start-commit-if-gl.patch

Blob History Raw

		cb8e9e	`From 84007736637b8278858401d1988c1ea39df530d0 Mon Sep 17 00:00:00 2001`
		cb8e9e	`From: Atin Mukherjee <amukherj@redhat.com>`
		cb8e9e	`Date: Tue, 21 Jul 2015 09:57:43 +0530`
		cb8e9e	`Subject: [PATCH 300/304] glusterd: Don't allow remove brick start/commit if glusterd is down of the host of the brick`
		cb8e9e
		cb8e9e	`Backport of http://review.gluster.org/#/c/11726/`
		cb8e9e
		cb8e9e	`remove brick stage blindly starts the remove brick operation even if the`
		cb8e9e	`glusterd instance of the node hosting the brick is down. Operationally its`
		cb8e9e	`incorrect and this could result into a inconsistent rebalance status across all`
		cb8e9e	`the nodes as the originator of this command will always have the rebalance`
		cb8e9e	`status to 'DEFRAG_NOT_STARTED', however when the glusterd instance on the other`
		cb8e9e	`nodes comes up, will trigger rebalance and make the status to completed once the`
		cb8e9e	`rebalance is finished.`
		cb8e9e
		cb8e9e	`This patch fixes two things:`
		cb8e9e	`1. Add a validation in remove brick to check whether all the peers hosting the`
		cb8e9e	`bricks to be removed are up.`
		cb8e9e
		cb8e9e	`2. Don't copy volinfo->rebal.dict from stale volinfo during restore as this`
		cb8e9e	`might end up in a incosistent node_state.info file resulting into volume status`
		cb8e9e	`command failure.`
		cb8e9e
		cb8e9e	`Change-Id: Ia4a76865c05037d49eec5e3bbfaf68c1567f1f81`
		cb8e9e	`BUG: 1236038`
		cb8e9e	`Signed-off-by: Atin Mukherjee <amukherj@redhat.com>`
		cb8e9e	`Reviewed-on: http://review.gluster.org/11726`
		cb8e9e	`Tested-by: NetBSD Build System <jenkins@build.gluster.org>`
		cb8e9e	`Reviewed-by: N Balachandran <nbalacha@redhat.com>`
		cb8e9e	`Reviewed-by: Krishnan Parthasarathi <kparthas@redhat.com>`
		cb8e9e	`Reviewed-on: https://code.engineering.redhat.com/gerrit/56353`
		cb8e9e	`Tested-by: Krishnan Parthasarathi <kparthas@redhat.com>`
		cb8e9e	`---`
		cb8e9e	`.../glusterd/bug-1245045-remove-brick-validation.t \| 54 +++++++++`
		cb8e9e	`xlators/mgmt/glusterd/src/glusterd-brick-ops.c \| 119 +++++++++++++++-----`
		cb8e9e	`xlators/mgmt/glusterd/src/glusterd-utils.c \| 1 -`
		cb8e9e	`3 files changed, 143 insertions(+), 31 deletions(-)`
		cb8e9e	`create mode 100644 tests/bugs/glusterd/bug-1245045-remove-brick-validation.t`
		cb8e9e
		cb8e9e	`diff --git a/tests/bugs/glusterd/bug-1245045-remove-brick-validation.t b/tests/bugs/glusterd/bug-1245045-remove-brick-validation.t`
		cb8e9e	`new file mode 100644`
		cb8e9e	`index 0000000..22a8d55`
		cb8e9e	`--- /dev/null`
		cb8e9e	`+++ b/tests/bugs/glusterd/bug-1245045-remove-brick-validation.t`
		cb8e9e	`@@ -0,0 +1,54 @@`
		cb8e9e	`+#!/bin/bash`
		cb8e9e	`+`
		cb8e9e	`+. $(dirname $0)/../../include.rc`
		cb8e9e	`+. $(dirname $0)/../../cluster.rc`
		cb8e9e	`+`
		cb8e9e	`+cleanup`
		cb8e9e	`+`
		cb8e9e	`+TEST launch_cluster 3;`
		cb8e9e	`+TEST $CLI_1 peer probe $H2;`
		cb8e9e	`+TEST $CLI_1 peer probe $H3;`
		cb8e9e	`+EXPECT_WITHIN $PROBE_TIMEOUT 2 peer_count`
		cb8e9e	`+`
		cb8e9e	`+TEST $CLI_1 volume create $V0 $H1:$B1/$V0 $H2:$B2/$V0`
		cb8e9e	`+TEST $CLI_1 volume start $V0`
		cb8e9e	`+`
		cb8e9e	`+kill_glusterd 2`
		cb8e9e	`+`
		cb8e9e	`+#remove-brick should fail as the peer hosting the brick is down`
		cb8e9e	`+TEST ! $CLI_1 volume remove-brick $V0 $H2:$B2/${V0} start`
		cb8e9e	`+`
		cb8e9e	`+TEST start_glusterd 2`
		cb8e9e	`+`
		cb8e9e	`+EXPECT_WITHIN $PROBE_TIMEOUT 2 peer_count`
		cb8e9e	`+`
		cb8e9e	`+#volume status should work`
		cb8e9e	`+TEST $CLI_2 volume status`
		cb8e9e	`+`
		cb8e9e	`+`
		cb8e9e	`+TEST $CLI_1 volume remove-brick $V0 $H2:$B2/${V0} start`
		cb8e9e	`+kill_glusterd 2`
		cb8e9e	`+`
		cb8e9e	`+#remove-brick commit should fail as the peer hosting the brick is down`
		cb8e9e	`+TEST ! $CLI_1 volume remove-brick $V0 $H2:$B2/${V0} commit`
		cb8e9e	`+`
		cb8e9e	`+TEST start_glusterd 2`
		cb8e9e	`+`
		cb8e9e	`+EXPECT_WITHIN $PROBE_TIMEOUT 2 peer_count`
		cb8e9e	`+`
		cb8e9e	`+#volume status should work`
		cb8e9e	`+TEST $CLI_2 volume status`
		cb8e9e	`+`
		cb8e9e	`+TEST $CLI_1 volume remove-brick $V0 $H2:$B2/${V0} stop`
		cb8e9e	`+`
		cb8e9e	`+kill_glusterd 3`
		cb8e9e	`+EXPECT_WITHIN $PROBE_TIMEOUT 1 peer_count`
		cb8e9e	`+`
		cb8e9e	`+TEST $CLI_1 volume remove-brick $V0 $H2:$B2/${V0} start`
		cb8e9e	`+`
		cb8e9e	`+TEST start_glusterd 3`
		cb8e9e	`+EXPECT_WITHIN $PROBE_TIMEOUT 2 peer_count`
		cb8e9e	`+`
		cb8e9e	`+TEST $CLI_3 volume status`
		cb8e9e	`+`
		cb8e9e	`+cleanup`
		cb8e9e	`diff --git a/xlators/mgmt/glusterd/src/glusterd-brick-ops.c b/xlators/mgmt/glusterd/src/glusterd-brick-ops.c`
		cb8e9e	`index caf51a4..e1a0397 100644`
		cb8e9e	`--- a/xlators/mgmt/glusterd/src/glusterd-brick-ops.c`
		cb8e9e	`+++ b/xlators/mgmt/glusterd/src/glusterd-brick-ops.c`
		cb8e9e	`@@ -1661,6 +1661,83 @@ out:`
		cb8e9e	`return ret;`
		cb8e9e	`}`
		cb8e9e
		cb8e9e	`+static int`
		cb8e9e	`+glusterd_remove_brick_validate_bricks (gf1_op_commands cmd, int32_t brick_count,`
		cb8e9e	`+ dict_t *dict,`
		cb8e9e	`+ glusterd_volinfo_t *volinfo,`
		cb8e9e	`+ char **errstr)`
		cb8e9e	`+{`
		cb8e9e	`+ char *brick = NULL;`
		cb8e9e	`+ char msg[2048] = {0,};`
		cb8e9e	`+ char key[256] = {0,};`
		cb8e9e	`+ glusterd_brickinfo_t *brickinfo = NULL;`
		cb8e9e	`+ glusterd_peerinfo_t *peerinfo = NULL;`
		cb8e9e	`+ int i = 0;`
		cb8e9e	`+ int ret = -1;`
		cb8e9e	`+`
		cb8e9e	`+ /* Check whether all the nodes of the bricks to be removed are`
		cb8e9e	`+ * up, if not fail the operation */`
		cb8e9e	`+ for (i = 1; i <= brick_count; i++) {`
		cb8e9e	`+ snprintf (key, sizeof (key), "brick%d", i);`
		cb8e9e	`+ ret = dict_get_str (dict, key, &brick);`
		cb8e9e	`+ if (ret) {`
		cb8e9e	`+ snprintf (msg, sizeof (msg),`
		cb8e9e	`+ "Unable to get %s", key);`
		cb8e9e	`+ *errstr = gf_strdup (msg);`
		cb8e9e	`+ goto out;`
		cb8e9e	`+ }`
		cb8e9e	`+`
		cb8e9e	`+ ret =`
		cb8e9e	`+ glusterd_volume_brickinfo_get_by_brick(brick, volinfo,`
		cb8e9e	`+ &brickinfo);`
		cb8e9e	`+ if (ret) {`
		cb8e9e	`+ snprintf (msg, sizeof (msg), "Incorrect brick "`
		cb8e9e	`+ "%s for volume %s", brick, volinfo->volname);`
		cb8e9e	`+ *errstr = gf_strdup (msg);`
		cb8e9e	`+ goto out;`
		cb8e9e	`+ }`
		cb8e9e	`+ /* Do not allow commit if the bricks are not decommissioned`
		cb8e9e	`+ * if its a remove brick commit`
		cb8e9e	`+ */`
		cb8e9e	`+ if (cmd == GF_OP_CMD_COMMIT && !brickinfo->decommissioned) {`
		cb8e9e	`+ snprintf (msg, sizeof (msg), "Brick %s "`
		cb8e9e	`+ "is not decommissioned. "`
		cb8e9e	`+ "Use start or force option",`
		cb8e9e	`+ brick);`
		cb8e9e	`+ *errstr = gf_strdup (msg);`
		cb8e9e	`+ ret = -1;`
		cb8e9e	`+ goto out;`
		cb8e9e	`+ }`
		cb8e9e	`+`
		cb8e9e	`+ if (glusterd_is_local_brick (THIS, volinfo, brickinfo))`
		cb8e9e	`+ continue;`
		cb8e9e	`+`
		cb8e9e	`+ rcu_read_lock ();`
		cb8e9e	`+ peerinfo = glusterd_peerinfo_find_by_uuid`
		cb8e9e	`+ (brickinfo->uuid);`
		cb8e9e	`+ if (!peerinfo) {`
		cb8e9e	`+ snprintf (msg, sizeof(msg), "Host node of the "`
		cb8e9e	`+ "brick %s is not in cluster", brick);`
		cb8e9e	`+ *errstr = gf_strdup (msg);`
		cb8e9e	`+ ret = -1;`
		cb8e9e	`+ rcu_read_unlock ();`
		cb8e9e	`+ goto out;`
		cb8e9e	`+ }`
		cb8e9e	`+ if (!peerinfo->connected) {`
		cb8e9e	`+ snprintf (msg, sizeof(msg), "Host node of the "`
		cb8e9e	`+ "brick %s is down", brick);`
		cb8e9e	`+ *errstr = gf_strdup (msg);`
		cb8e9e	`+ ret = -1;`
		cb8e9e	`+ rcu_read_unlock ();`
		cb8e9e	`+ goto out;`
		cb8e9e	`+ }`
		cb8e9e	`+ rcu_read_unlock ();`
		cb8e9e	`+ }`
		cb8e9e	`+`
		cb8e9e	`+out:`
		cb8e9e	`+ return ret;`
		cb8e9e	`+}`
		cb8e9e	`+`
		cb8e9e	`int`
		cb8e9e	`glusterd_op_stage_remove_brick (dict_t dict, char *op_errstr)`
		cb8e9e	`{`
		cb8e9e	`@@ -1679,6 +1756,7 @@ glusterd_op_stage_remove_brick (dict_t dict, char *op_errstr)`
		cb8e9e	`char *brick = NULL;`
		cb8e9e	`glusterd_brickinfo_t *brickinfo = NULL;`
		cb8e9e	`gsync_status_param_t param = {0,};`
		cb8e9e	`+ glusterd_peerinfo_t *peerinfo = NULL;`
		cb8e9e
		cb8e9e	`this = THIS;`
		cb8e9e	`GF_ASSERT (this);`
		cb8e9e	`@@ -1817,6 +1895,12 @@ glusterd_op_stage_remove_brick (dict_t dict, char *op_errstr)`
		cb8e9e	`goto out;`
		cb8e9e	`}`
		cb8e9e
		cb8e9e	`+ ret = glusterd_remove_brick_validate_bricks (cmd, brick_count,`
		cb8e9e	`+ dict, volinfo,`
		cb8e9e	`+ &errstr);`
		cb8e9e	`+ if (ret)`
		cb8e9e	`+ goto out;`
		cb8e9e	`+`
		cb8e9e	`if (is_origin_glusterd (dict)) {`
		cb8e9e	`ret = glusterd_generate_and_set_task_id`
		cb8e9e	`(dict, GF_REMOVE_BRICK_TID_KEY);`
		cb8e9e	`@@ -1861,36 +1945,11 @@ glusterd_op_stage_remove_brick (dict_t dict, char *op_errstr)`
		cb8e9e	`goto out;`
		cb8e9e	`}`
		cb8e9e
		cb8e9e	`- /* Do not allow commit if the bricks are not decommissioned */`
		cb8e9e	`- for ( i = 1; i <= brick_count; i++ ) {`
		cb8e9e	`- snprintf (key, sizeof (key), "brick%d", i);`
		cb8e9e	`- ret = dict_get_str (dict, key, &brick);`
		cb8e9e	`- if (ret) {`
		cb8e9e	`- snprintf (msg, sizeof (msg),`
		cb8e9e	`- "Unable to get %s", key);`
		cb8e9e	`- errstr = gf_strdup (msg);`
		cb8e9e	`- goto out;`
		cb8e9e	`- }`
		cb8e9e	`-`
		cb8e9e	`- ret =`
		cb8e9e	`- glusterd_volume_brickinfo_get_by_brick(brick, volinfo,`
		cb8e9e	`- &brickinfo);`
		cb8e9e	`- if (ret) {`
		cb8e9e	`- snprintf (msg, sizeof (msg), "Incorrect brick "`
		cb8e9e	`- "%s for volume %s", brick, volname);`
		cb8e9e	`- errstr = gf_strdup (msg);`
		cb8e9e	`- goto out;`
		cb8e9e	`- }`
		cb8e9e	`- if ( !brickinfo->decommissioned ) {`
		cb8e9e	`- snprintf (msg, sizeof (msg), "Brick %s "`
		cb8e9e	`- "is not decommissioned. "`
		cb8e9e	`- "Use start or force option",`
		cb8e9e	`- brick);`
		cb8e9e	`- errstr = gf_strdup (msg);`
		cb8e9e	`- ret = -1;`
		cb8e9e	`- goto out;`
		cb8e9e	`- }`
		cb8e9e	`- }`
		cb8e9e	`+ ret = glusterd_remove_brick_validate_bricks (cmd, brick_count,`
		cb8e9e	`+ dict, volinfo,`
		cb8e9e	`+ &errstr);`
		cb8e9e	`+ if (ret)`
		cb8e9e	`+ goto out;`
		cb8e9e
		cb8e9e	`/* If geo-rep is configured, for this volume, it should be`
		cb8e9e	`* stopped.`
		cb8e9e	`diff --git a/xlators/mgmt/glusterd/src/glusterd-utils.c b/xlators/mgmt/glusterd/src/glusterd-utils.c`
		cb8e9e	`index 4982828..0f0ca27 100644`
		cb8e9e	`--- a/xlators/mgmt/glusterd/src/glusterd-utils.c`
		cb8e9e	`+++ b/xlators/mgmt/glusterd/src/glusterd-utils.c`
		cb8e9e	`@@ -3739,7 +3739,6 @@ gd_check_and_update_rebalance_info (glusterd_volinfo_t *old_volinfo,`
		cb8e9e	`new->skipped_files = old->skipped_files;`
		cb8e9e	`new->rebalance_failures = old->rebalance_failures;`
		cb8e9e	`new->rebalance_time = old->rebalance_time;`
		cb8e9e	`- new->dict = (old->dict ? dict_ref (old->dict) : NULL);`
		cb8e9e
		cb8e9e	`/* glusterd_rebalance_t.{op, id, defrag_cmd} are copied during volume`
		cb8e9e	`* import`
		cb8e9e	`--`
		cb8e9e	`1.7.1`
		cb8e9e

rpms / glusterfs

Source Code

Blame SOURCES/0300-glusterd-Don-t-allow-remove-brick-start-commit-if-gl.patch