17b94a
From 998d9b8b5e271f407e1c654c34f45f0db36abc71 Mon Sep 17 00:00:00 2001
17b94a
From: Mohammed Rafi KC <rkavunga@redhat.com>
17b94a
Date: Tue, 21 May 2019 17:15:07 +0530
17b94a
Subject: [PATCH 172/178] ec/fini: Fix race with ec_fini and ec_notify
17b94a
17b94a
During a graph cleanup, we first send a PARENT_DOWN and wait for
17b94a
a child down to ultimately free the xlator and the graph.
17b94a
17b94a
In the ec xlator, we clean up the threads when we get a PARENT_DOWN event.
17b94a
But a racing event like CHILD_UP or even an xl_op may trigger healing threads
17b94a
after threads cleanup.
17b94a
17b94a
So there is a chance that the threads might access a freed private variable.
17b94a
17b94a
Upstream patch: https://review.gluster.org/#/c/glusterfs/+/22758/
17b94a
17b94a
>Change-Id: I252d10181bb67b95900c903d479de707a8489532
17b94a
>fixes: bz#1703948
17b94a
>Signed-off-by: Mohammed Rafi KC <rkavunga@redhat.com>
17b94a
17b94a
Change-Id: I84a10352d9fb3e68d4147b3791e3af45ab79050e
17b94a
BUG: 1703434
17b94a
Signed-off-by: Mohammed Rafi KC <rkavunga@redhat.com>
17b94a
Reviewed-on: https://code.engineering.redhat.com/gerrit/172285
17b94a
Tested-by: RHGS Build Bot <nigelb@redhat.com>
17b94a
Reviewed-by: Atin Mukherjee <amukherj@redhat.com>
17b94a
---
17b94a
 libglusterfs/src/glusterfs/xlator.h |  3 +++
17b94a
 libglusterfs/src/libglusterfs.sym   |  1 +
17b94a
 libglusterfs/src/xlator.c           | 21 +++++++++++++++++++++
17b94a
 xlators/cluster/ec/src/ec-heal.c    |  4 ++++
17b94a
 xlators/cluster/ec/src/ec-heald.c   |  6 ++++++
17b94a
 xlators/cluster/ec/src/ec.c         |  3 +++
17b94a
 6 files changed, 38 insertions(+)
17b94a
17b94a
diff --git a/libglusterfs/src/glusterfs/xlator.h b/libglusterfs/src/glusterfs/xlator.h
17b94a
index 8998976..09e463e 100644
17b94a
--- a/libglusterfs/src/glusterfs/xlator.h
17b94a
+++ b/libglusterfs/src/glusterfs/xlator.h
17b94a
@@ -1092,4 +1092,7 @@ gluster_graph_take_reference(xlator_t *tree);
17b94a
 
17b94a
 gf_boolean_t
17b94a
 mgmt_is_multiplexed_daemon(char *name);
17b94a
+
17b94a
+gf_boolean_t
17b94a
+xlator_is_cleanup_starting(xlator_t *this);
17b94a
 #endif /* _XLATOR_H */
17b94a
diff --git a/libglusterfs/src/libglusterfs.sym b/libglusterfs/src/libglusterfs.sym
17b94a
index ec474e7..7a2edef 100644
17b94a
--- a/libglusterfs/src/libglusterfs.sym
17b94a
+++ b/libglusterfs/src/libglusterfs.sym
17b94a
@@ -1161,3 +1161,4 @@ glusterfs_process_svc_attach_volfp
17b94a
 glusterfs_mux_volfile_reconfigure
17b94a
 glusterfs_process_svc_detach
17b94a
 mgmt_is_multiplexed_daemon
17b94a
+xlator_is_cleanup_starting
17b94a
diff --git a/libglusterfs/src/xlator.c b/libglusterfs/src/xlator.c
17b94a
index 022c3ed..fbfbbe2 100644
17b94a
--- a/libglusterfs/src/xlator.c
17b94a
+++ b/libglusterfs/src/xlator.c
17b94a
@@ -1486,3 +1486,24 @@ mgmt_is_multiplexed_daemon(char *name)
17b94a
     }
17b94a
     return _gf_false;
17b94a
 }
17b94a
+
17b94a
+gf_boolean_t
17b94a
+xlator_is_cleanup_starting(xlator_t *this)
17b94a
+{
17b94a
+    gf_boolean_t cleanup = _gf_false;
17b94a
+    glusterfs_graph_t *graph = NULL;
17b94a
+    xlator_t *xl = NULL;
17b94a
+
17b94a
+    if (!this)
17b94a
+        goto out;
17b94a
+    graph = this->graph;
17b94a
+
17b94a
+    if (!graph)
17b94a
+        goto out;
17b94a
+
17b94a
+    xl = graph->first;
17b94a
+    if (xl && xl->cleanup_starting)
17b94a
+        cleanup = _gf_true;
17b94a
+out:
17b94a
+    return cleanup;
17b94a
+}
17b94a
diff --git a/xlators/cluster/ec/src/ec-heal.c b/xlators/cluster/ec/src/ec-heal.c
17b94a
index 2fa1f11..8844c29 100644
17b94a
--- a/xlators/cluster/ec/src/ec-heal.c
17b94a
+++ b/xlators/cluster/ec/src/ec-heal.c
17b94a
@@ -2855,6 +2855,10 @@ ec_replace_brick_heal_wrap(void *opaque)
17b94a
         itable = ec->xl->itable;
17b94a
     else
17b94a
         goto out;
17b94a
+
17b94a
+    if (xlator_is_cleanup_starting(ec->xl))
17b94a
+        goto out;
17b94a
+
17b94a
     ret = ec_replace_heal(ec, itable->root);
17b94a
 out:
17b94a
     return ret;
17b94a
diff --git a/xlators/cluster/ec/src/ec-heald.c b/xlators/cluster/ec/src/ec-heald.c
17b94a
index edf5e11..91512d7 100644
17b94a
--- a/xlators/cluster/ec/src/ec-heald.c
17b94a
+++ b/xlators/cluster/ec/src/ec-heald.c
17b94a
@@ -444,6 +444,9 @@ unlock:
17b94a
 int
17b94a
 ec_shd_full_healer_spawn(xlator_t *this, int subvol)
17b94a
 {
17b94a
+    if (xlator_is_cleanup_starting(this))
17b94a
+        return -1;
17b94a
+
17b94a
     return ec_shd_healer_spawn(this, NTH_FULL_HEALER(this, subvol),
17b94a
                                ec_shd_full_healer);
17b94a
 }
17b94a
@@ -451,6 +454,9 @@ ec_shd_full_healer_spawn(xlator_t *this, int subvol)
17b94a
 int
17b94a
 ec_shd_index_healer_spawn(xlator_t *this, int subvol)
17b94a
 {
17b94a
+    if (xlator_is_cleanup_starting(this))
17b94a
+        return -1;
17b94a
+
17b94a
     return ec_shd_healer_spawn(this, NTH_INDEX_HEALER(this, subvol),
17b94a
                                ec_shd_index_healer);
17b94a
 }
17b94a
diff --git a/xlators/cluster/ec/src/ec.c b/xlators/cluster/ec/src/ec.c
17b94a
index 264582a..df5912c 100644
17b94a
--- a/xlators/cluster/ec/src/ec.c
17b94a
+++ b/xlators/cluster/ec/src/ec.c
17b94a
@@ -486,6 +486,9 @@ ec_set_up_state(ec_t *ec, uintptr_t index_mask, uintptr_t new_state)
17b94a
 {
17b94a
     uintptr_t current_state = 0;
17b94a
 
17b94a
+    if (xlator_is_cleanup_starting(ec->xl))
17b94a
+        return _gf_false;
17b94a
+
17b94a
     if ((ec->xl_notify & index_mask) == 0) {
17b94a
         ec->xl_notify |= index_mask;
17b94a
         ec->xl_notify_count++;
17b94a
-- 
17b94a
1.8.3.1
17b94a