|
|
17b94a |
From 11b64d494c52004002f900888694d20ef8af6df6 Mon Sep 17 00:00:00 2001
|
|
|
17b94a |
From: Mohammed Rafi KC <rkavunga@redhat.com>
|
|
|
17b94a |
Date: Sat, 11 May 2019 22:40:22 +0530
|
|
|
17b94a |
Subject: [PATCH 158/169] glusterfsd/cleanup: Protect graph object under a lock
|
|
|
17b94a |
|
|
|
17b94a |
While processing a cleanup_and_exit function, we are
|
|
|
17b94a |
accessing a graph object, but this access has not been protected
|
|
|
17b94a |
under a lock. A parallel cleanup of a graph is quite
|
|
|
17b94a |
possible, which might lead to an invalid memory access.
|
|
|
17b94a |
|
|
|
17b94a |
Upstream patch: https://review.gluster.org/#/c/glusterfs/+/22709/
|
|
|
17b94a |
|
|
|
17b94a |
>Change-Id: Id05ca70d5b57e172b0401d07b6a1f5386c044e79
|
|
|
17b94a |
>fixes: bz#1708926
|
|
|
17b94a |
>Signed-off-by: Mohammed Rafi KC <rkavunga@redhat.com>
|
|
|
17b94a |
|
|
|
17b94a |
Change-Id: I55ab0525c79baa99a3bd929ee979c5519be5ab21
|
|
|
17b94a |
BUG: 1716626
|
|
|
17b94a |
Signed-off-by: Mohammed Rafi KC <rkavunga@redhat.com>
|
|
|
17b94a |
Reviewed-on: https://code.engineering.redhat.com/gerrit/172283
|
|
|
17b94a |
Reviewed-by: Atin Mukherjee <amukherj@redhat.com>
|
|
|
17b94a |
Tested-by: RHGS Build Bot <nigelb@redhat.com>
|
|
|
17b94a |
---
|
|
|
17b94a |
libglusterfs/src/graph.c | 58 +++++++++++++++----------
|
|
|
17b94a |
libglusterfs/src/statedump.c | 16 +++++--
|
|
|
17b94a |
tests/bugs/glusterd/optimized-basic-testcases.t | 4 +-
|
|
|
17b94a |
3 files changed, 50 insertions(+), 28 deletions(-)
|
|
|
17b94a |
|
|
|
17b94a |
diff --git a/libglusterfs/src/graph.c b/libglusterfs/src/graph.c
|
|
|
17b94a |
index 4c8b02d..18fb2d9 100644
|
|
|
17b94a |
--- a/libglusterfs/src/graph.c
|
|
|
17b94a |
+++ b/libglusterfs/src/graph.c
|
|
|
17b94a |
@@ -1392,8 +1392,12 @@ glusterfs_graph_cleanup(void *arg)
|
|
|
17b94a |
}
|
|
|
17b94a |
pthread_mutex_unlock(&ctx->notify_lock);
|
|
|
17b94a |
|
|
|
17b94a |
- glusterfs_graph_fini(graph);
|
|
|
17b94a |
- glusterfs_graph_destroy(graph);
|
|
|
17b94a |
+ pthread_mutex_lock(&ctx->cleanup_lock);
|
|
|
17b94a |
+ {
|
|
|
17b94a |
+ glusterfs_graph_fini(graph);
|
|
|
17b94a |
+ glusterfs_graph_destroy(graph);
|
|
|
17b94a |
+ }
|
|
|
17b94a |
+ pthread_mutex_unlock(&ctx->cleanup_lock);
|
|
|
17b94a |
out:
|
|
|
17b94a |
return NULL;
|
|
|
17b94a |
}
|
|
|
17b94a |
@@ -1468,31 +1472,37 @@ glusterfs_process_svc_detach(glusterfs_ctx_t *ctx, gf_volfile_t *volfile_obj)
|
|
|
17b94a |
|
|
|
17b94a |
if (!ctx || !ctx->active || !volfile_obj)
|
|
|
17b94a |
goto out;
|
|
|
17b94a |
- parent_graph = ctx->active;
|
|
|
17b94a |
- graph = volfile_obj->graph;
|
|
|
17b94a |
- if (!graph)
|
|
|
17b94a |
- goto out;
|
|
|
17b94a |
- if (graph->first)
|
|
|
17b94a |
- xl = graph->first;
|
|
|
17b94a |
|
|
|
17b94a |
- last_xl = graph->last_xl;
|
|
|
17b94a |
- if (last_xl)
|
|
|
17b94a |
- last_xl->next = NULL;
|
|
|
17b94a |
- if (!xl || xl->cleanup_starting)
|
|
|
17b94a |
- goto out;
|
|
|
17b94a |
+ pthread_mutex_lock(&ctx->cleanup_lock);
|
|
|
17b94a |
+ {
|
|
|
17b94a |
+ parent_graph = ctx->active;
|
|
|
17b94a |
+ graph = volfile_obj->graph;
|
|
|
17b94a |
+ if (!graph)
|
|
|
17b94a |
+ goto unlock;
|
|
|
17b94a |
+ if (graph->first)
|
|
|
17b94a |
+ xl = graph->first;
|
|
|
17b94a |
+
|
|
|
17b94a |
+ last_xl = graph->last_xl;
|
|
|
17b94a |
+ if (last_xl)
|
|
|
17b94a |
+ last_xl->next = NULL;
|
|
|
17b94a |
+ if (!xl || xl->cleanup_starting)
|
|
|
17b94a |
+ goto unlock;
|
|
|
17b94a |
|
|
|
17b94a |
- xl->cleanup_starting = 1;
|
|
|
17b94a |
- gf_msg("mgmt", GF_LOG_INFO, 0, LG_MSG_GRAPH_DETACH_STARTED,
|
|
|
17b94a |
- "detaching child %s", volfile_obj->vol_id);
|
|
|
17b94a |
+ xl->cleanup_starting = 1;
|
|
|
17b94a |
+ gf_msg("mgmt", GF_LOG_INFO, 0, LG_MSG_GRAPH_DETACH_STARTED,
|
|
|
17b94a |
+ "detaching child %s", volfile_obj->vol_id);
|
|
|
17b94a |
|
|
|
17b94a |
- list_del_init(&volfile_obj->volfile_list);
|
|
|
17b94a |
- glusterfs_mux_xlator_unlink(parent_graph->top, xl);
|
|
|
17b94a |
- parent_graph->last_xl = glusterfs_get_last_xlator(parent_graph);
|
|
|
17b94a |
- parent_graph->xl_count -= graph->xl_count;
|
|
|
17b94a |
- parent_graph->leaf_count -= graph->leaf_count;
|
|
|
17b94a |
- default_notify(xl, GF_EVENT_PARENT_DOWN, xl);
|
|
|
17b94a |
- parent_graph->id++;
|
|
|
17b94a |
- ret = 0;
|
|
|
17b94a |
+ list_del_init(&volfile_obj->volfile_list);
|
|
|
17b94a |
+ glusterfs_mux_xlator_unlink(parent_graph->top, xl);
|
|
|
17b94a |
+ parent_graph->last_xl = glusterfs_get_last_xlator(parent_graph);
|
|
|
17b94a |
+ parent_graph->xl_count -= graph->xl_count;
|
|
|
17b94a |
+ parent_graph->leaf_count -= graph->leaf_count;
|
|
|
17b94a |
+ default_notify(xl, GF_EVENT_PARENT_DOWN, xl);
|
|
|
17b94a |
+ parent_graph->id++;
|
|
|
17b94a |
+ ret = 0;
|
|
|
17b94a |
+ }
|
|
|
17b94a |
+unlock:
|
|
|
17b94a |
+ pthread_mutex_unlock(&ctx->cleanup_lock);
|
|
|
17b94a |
out:
|
|
|
17b94a |
if (!ret) {
|
|
|
17b94a |
list_del_init(&volfile_obj->volfile_list);
|
|
|
17b94a |
diff --git a/libglusterfs/src/statedump.c b/libglusterfs/src/statedump.c
|
|
|
17b94a |
index 0cf80c0..0d58f8f 100644
|
|
|
17b94a |
--- a/libglusterfs/src/statedump.c
|
|
|
17b94a |
+++ b/libglusterfs/src/statedump.c
|
|
|
17b94a |
@@ -805,11 +805,17 @@ gf_proc_dump_info(int signum, glusterfs_ctx_t *ctx)
|
|
|
17b94a |
int brick_count = 0;
|
|
|
17b94a |
int len = 0;
|
|
|
17b94a |
|
|
|
17b94a |
- gf_proc_dump_lock();
|
|
|
17b94a |
-
|
|
|
17b94a |
if (!ctx)
|
|
|
17b94a |
goto out;
|
|
|
17b94a |
|
|
|
17b94a |
+ /*
|
|
|
17b94a |
+ * Multiplexed daemons can change the active graph when attach/detach
|
|
|
17b94a |
+ * is called. So this has to be protected with the cleanup lock.
|
|
|
17b94a |
+ */
|
|
|
17b94a |
+ if (mgmt_is_multiplexed_daemon(ctx->cmd_args.process_name))
|
|
|
17b94a |
+ pthread_mutex_lock(&ctx->cleanup_lock);
|
|
|
17b94a |
+ gf_proc_dump_lock();
|
|
|
17b94a |
+
|
|
|
17b94a |
if (!mgmt_is_multiplexed_daemon(ctx->cmd_args.process_name) &&
|
|
|
17b94a |
(ctx && ctx->active)) {
|
|
|
17b94a |
top = ctx->active->first;
|
|
|
17b94a |
@@ -923,7 +929,11 @@ gf_proc_dump_info(int signum, glusterfs_ctx_t *ctx)
|
|
|
17b94a |
out:
|
|
|
17b94a |
GF_FREE(dump_options.dump_path);
|
|
|
17b94a |
dump_options.dump_path = NULL;
|
|
|
17b94a |
- gf_proc_dump_unlock();
|
|
|
17b94a |
+ if (ctx) {
|
|
|
17b94a |
+ gf_proc_dump_unlock();
|
|
|
17b94a |
+ if (mgmt_is_multiplexed_daemon(ctx->cmd_args.process_name))
|
|
|
17b94a |
+ pthread_mutex_unlock(&ctx->cleanup_lock);
|
|
|
17b94a |
+ }
|
|
|
17b94a |
|
|
|
17b94a |
return;
|
|
|
17b94a |
}
|
|
|
17b94a |
diff --git a/tests/bugs/glusterd/optimized-basic-testcases.t b/tests/bugs/glusterd/optimized-basic-testcases.t
|
|
|
17b94a |
index d700b5e..110f1b9 100644
|
|
|
17b94a |
--- a/tests/bugs/glusterd/optimized-basic-testcases.t
|
|
|
17b94a |
+++ b/tests/bugs/glusterd/optimized-basic-testcases.t
|
|
|
17b94a |
@@ -289,7 +289,9 @@ mkdir -p /xyz/var/lib/glusterd/abc
|
|
|
17b94a |
TEST $CLI volume create "test" $H0:/xyz/var/lib/glusterd/abc
|
|
|
17b94a |
EXPECT 'Created' volinfo_field "test" 'Status';
|
|
|
17b94a |
|
|
|
17b94a |
-EXPECT "1" generate_statedump_and_check_for_glusterd_info
|
|
|
17b94a |
+#While taking a statedump, there is a TRY_LOCK on call_frame, which might cause
|
|
|
17b94a |
+#failure. So adding an EXPECT_WITHIN
|
|
|
17b94a |
+EXPECT_WITHIN $PROCESS_UP_TIMEOUT "^1$" generate_statedump_and_check_for_glusterd_info
|
|
|
17b94a |
|
|
|
17b94a |
cleanup_statedump `pidof glusterd`
|
|
|
17b94a |
cleanup
|
|
|
17b94a |
--
|
|
|
17b94a |
1.8.3.1
|
|
|
17b94a |
|