Blob Blame History Raw
From 1de7497540b8428187df5048a1b8e82c2feec604 Mon Sep 17 00:00:00 2001
From: Mohit Agrawal <moagrawa@redhat.com>
Date: Mon, 19 Nov 2018 13:00:57 +0530
Subject: [PATCH 446/450] core: Portmap entries showing stale brick entries
 when bricks are down

Problem: pmap is showing stale brick entries after down the brick
         because of glusterd_brick_rpc_notify call gf_is_service_running
         before call pmap_registry_remove to ensure about brick instance.

Solutiom: 1) Change the condition in gf_is_pid_running to ensure about
             process existence, use open instead of access to achieve
             the same
          2) Call search_brick_path_from_proc in __glusterd_brick_rpc_notify
             along with gf_is_service_running

> Change-Id: Ia663ac61c01fdee6c12f47c0300cdf93f19b6a19
> fixes: bz#1646892
> Signed-off-by: Mohit Agrawal <moagrawal@redhat.com>
> (Cherry picked from commit bcf1e8b07491b48c5372924dbbbad5b8391c6d81)
> (Reviwed on upstream link https://review.gluster.org/#/c/glusterfs/+/21568/)

BUG: 1649651
Change-Id: I06b0842d5e3ffc909304529311709064237ccc94
Signed-off-by: Mohit Agrawal <moagrawa@redhat.com>
Reviewed-on: https://code.engineering.redhat.com/gerrit/156326
Tested-by: RHGS Build Bot <nigelb@redhat.com>
Reviewed-by: Atin Mukherjee <amukherj@redhat.com>
---
 libglusterfs/src/common-utils.c              | 5 ++++-
 xlators/mgmt/glusterd/src/glusterd-handler.c | 7 +++++--
 xlators/mgmt/glusterd/src/glusterd-utils.h   | 2 ++
 3 files changed, 11 insertions(+), 3 deletions(-)

diff --git a/libglusterfs/src/common-utils.c b/libglusterfs/src/common-utils.c
index 54ef875..dd6cdb3 100644
--- a/libglusterfs/src/common-utils.c
+++ b/libglusterfs/src/common-utils.c
@@ -3986,13 +3986,16 @@ gf_boolean_t
 gf_is_pid_running (int pid)
 {
         char fname[32] = {0,};
+        int fd = -1;
 
         snprintf(fname, sizeof(fname), "/proc/%d/cmdline", pid);
 
-        if (sys_access (fname , R_OK) != 0) {
+        fd = sys_open(fname, O_RDONLY, 0);
+        if (fd < 0) {
                 return _gf_false;
         }
 
+        sys_close(fd);
         return _gf_true;
 
 }
diff --git a/xlators/mgmt/glusterd/src/glusterd-handler.c b/xlators/mgmt/glusterd/src/glusterd-handler.c
index bf37e70..a129afc 100644
--- a/xlators/mgmt/glusterd/src/glusterd-handler.c
+++ b/xlators/mgmt/glusterd/src/glusterd-handler.c
@@ -6193,11 +6193,14 @@ __glusterd_brick_rpc_notify (struct rpc_clnt *rpc, void *mydata,
                         /* In case of an abrupt shutdown of a brick PMAP_SIGNOUT
                          * event is not received by glusterd which can lead to a
                          * stale port entry in glusterd, so forcibly clean up
-                         * the same if the process is not running
+                         * the same if the process is not running sometime
+                         * gf_is_service_running true so to ensure about brick instance
+                         * call search_brick_path_from_proc
                          */
                         GLUSTERD_GET_BRICK_PIDFILE (pidfile, volinfo,
                                                     brickinfo, conf);
-                        if (!gf_is_service_running (pidfile, &pid)) {
+                        if (!gf_is_service_running (pidfile, &pid) ||
+                            !search_brick_path_from_proc(pid, brickinfo->path)) {
                                 ret = pmap_registry_remove (
                                                       THIS, brickinfo->port,
                                                       brickinfo->path,
diff --git a/xlators/mgmt/glusterd/src/glusterd-utils.h b/xlators/mgmt/glusterd/src/glusterd-utils.h
index ffcc636..8e5320d 100644
--- a/xlators/mgmt/glusterd/src/glusterd-utils.h
+++ b/xlators/mgmt/glusterd/src/glusterd-utils.h
@@ -897,4 +897,6 @@ glusterd_get_index_basepath (glusterd_brickinfo_t *brickinfo, char *buffer,
 gf_boolean_t
 glusterd_is_profile_on (glusterd_volinfo_t *volinfo);
 
+char *
+search_brick_path_from_proc(pid_t brick_pid, char *brickpath);
 #endif
-- 
1.8.3.1