|
|
17b94a |
From 4d95e271a9042bf2d789a4d900ad263b6ea47681 Mon Sep 17 00:00:00 2001
|
|
|
17b94a |
From: Mohammed Rafi KC <rkavunga@redhat.com>
|
|
|
17b94a |
Date: Wed, 23 Jan 2019 21:55:01 +0530
|
|
|
17b94a |
Subject: [PATCH 100/124] clnt/rpc: ref leak during disconnect.
|
|
|
17b94a |
|
|
|
17b94a |
During disconnect cleanup, we are not cancelling reconnect
|
|
|
17b94a |
timer, which causes a ref leak each time a disconnect
|
|
|
17b94a |
happens.
|
|
|
17b94a |
|
|
|
17b94a |
Backport of: https://review.gluster.org/#/c/glusterfs/+/22087/
|
|
|
17b94a |
|
|
|
17b94a |
>Change-Id: I9d05d1f368d080e04836bf6a0bb018bf8f7b5b8a
|
|
|
17b94a |
>updates: bz#1659708
|
|
|
17b94a |
>Signed-off-by: Mohammed Rafi KC <rkavunga@redhat.com>
|
|
|
17b94a |
|
|
|
17b94a |
Change-Id: I5a2dbb17e663a4809bb4c435cacadbf0ab694a76
|
|
|
17b94a |
BUG: 1471742
|
|
|
17b94a |
Signed-off-by: Mohammed Rafi KC <rkavunga@redhat.com>
|
|
|
17b94a |
Reviewed-on: https://code.engineering.redhat.com/gerrit/167844
|
|
|
17b94a |
Tested-by: RHGS Build Bot <nigelb@redhat.com>
|
|
|
17b94a |
Reviewed-by: Atin Mukherjee <amukherj@redhat.com>
|
|
|
17b94a |
---
|
|
|
17b94a |
libglusterfs/src/timer.c | 16 +++++++----
|
|
|
17b94a |
rpc/rpc-lib/src/rpc-clnt.c | 11 +++++++-
|
|
|
17b94a |
.../mgmt/glusterd/src/glusterd-snapshot-utils.c | 32 ++++++++++++++++++----
|
|
|
17b94a |
3 files changed, 47 insertions(+), 12 deletions(-)
|
|
|
17b94a |
|
|
|
17b94a |
diff --git a/libglusterfs/src/timer.c b/libglusterfs/src/timer.c
|
|
|
17b94a |
index d882543..2643c07 100644
|
|
|
17b94a |
--- a/libglusterfs/src/timer.c
|
|
|
17b94a |
+++ b/libglusterfs/src/timer.c
|
|
|
17b94a |
@@ -75,13 +75,13 @@ gf_timer_call_cancel(glusterfs_ctx_t *ctx, gf_timer_t *event)
|
|
|
17b94a |
if (ctx == NULL || event == NULL) {
|
|
|
17b94a |
gf_msg_callingfn("timer", GF_LOG_ERROR, EINVAL, LG_MSG_INVALID_ARG,
|
|
|
17b94a |
"invalid argument");
|
|
|
17b94a |
- return 0;
|
|
|
17b94a |
+ return -1;
|
|
|
17b94a |
}
|
|
|
17b94a |
|
|
|
17b94a |
if (ctx->cleanup_started) {
|
|
|
17b94a |
gf_msg_callingfn("timer", GF_LOG_INFO, 0, LG_MSG_CTX_CLEANUP_STARTED,
|
|
|
17b94a |
"ctx cleanup started");
|
|
|
17b94a |
- return 0;
|
|
|
17b94a |
+ return -1;
|
|
|
17b94a |
}
|
|
|
17b94a |
|
|
|
17b94a |
LOCK(&ctx->lock);
|
|
|
17b94a |
@@ -93,10 +93,9 @@ gf_timer_call_cancel(glusterfs_ctx_t *ctx, gf_timer_t *event)
|
|
|
17b94a |
if (!reg) {
|
|
|
17b94a |
/* This can happen when cleanup may have just started and
|
|
|
17b94a |
* gf_timer_registry_destroy() sets ctx->timer to NULL.
|
|
|
17b94a |
- * Just bail out as success as gf_timer_proc() takes
|
|
|
17b94a |
- * care of cleaning up the events.
|
|
|
17b94a |
+ * gf_timer_proc() takes care of cleaning up the events.
|
|
|
17b94a |
*/
|
|
|
17b94a |
- return 0;
|
|
|
17b94a |
+ return -1;
|
|
|
17b94a |
}
|
|
|
17b94a |
|
|
|
17b94a |
LOCK(&reg->lock);
|
|
|
17b94a |
@@ -203,6 +202,13 @@ gf_timer_proc(void *data)
|
|
|
17b94a |
list_for_each_entry_safe(event, tmp, &reg->active, list)
|
|
|
17b94a |
{
|
|
|
17b94a |
list_del(&event->list);
|
|
|
17b94a |
+ /* TODO Possible resource leak
|
|
|
17b94a |
+ * Before freeing the event, we need to call the respective
|
|
|
17b94a |
+ * event functions and free any resources.
|
|
|
17b94a |
+ * For example, in case of rpc_clnt_reconnect, we need to
|
|
|
17b94a |
+ * unref rpc object which was taken when added to timer
|
|
|
17b94a |
+ * wheel.
|
|
|
17b94a |
+ */
|
|
|
17b94a |
GF_FREE(event);
|
|
|
17b94a |
}
|
|
|
17b94a |
}
|
|
|
17b94a |
diff --git a/rpc/rpc-lib/src/rpc-clnt.c b/rpc/rpc-lib/src/rpc-clnt.c
|
|
|
17b94a |
index 3f7bb3c..6f47515 100644
|
|
|
17b94a |
--- a/rpc/rpc-lib/src/rpc-clnt.c
|
|
|
17b94a |
+++ b/rpc/rpc-lib/src/rpc-clnt.c
|
|
|
17b94a |
@@ -495,6 +495,7 @@ rpc_clnt_connection_cleanup(rpc_clnt_connection_t *conn)
|
|
|
17b94a |
int unref = 0;
|
|
|
17b94a |
int ret = 0;
|
|
|
17b94a |
gf_boolean_t timer_unref = _gf_false;
|
|
|
17b94a |
+ gf_boolean_t reconnect_unref = _gf_false;
|
|
|
17b94a |
|
|
|
17b94a |
if (!conn) {
|
|
|
17b94a |
goto out;
|
|
|
17b94a |
@@ -514,6 +515,12 @@ rpc_clnt_connection_cleanup(rpc_clnt_connection_t *conn)
|
|
|
17b94a |
timer_unref = _gf_true;
|
|
|
17b94a |
conn->timer = NULL;
|
|
|
17b94a |
}
|
|
|
17b94a |
+ if (conn->reconnect) {
|
|
|
17b94a |
+ ret = gf_timer_call_cancel(clnt->ctx, conn->reconnect);
|
|
|
17b94a |
+ if (!ret)
|
|
|
17b94a |
+ reconnect_unref = _gf_true;
|
|
|
17b94a |
+ conn->reconnect = NULL;
|
|
|
17b94a |
+ }
|
|
|
17b94a |
|
|
|
17b94a |
conn->connected = 0;
|
|
|
17b94a |
conn->disconnected = 1;
|
|
|
17b94a |
@@ -533,6 +540,8 @@ rpc_clnt_connection_cleanup(rpc_clnt_connection_t *conn)
|
|
|
17b94a |
if (timer_unref)
|
|
|
17b94a |
rpc_clnt_unref(clnt);
|
|
|
17b94a |
|
|
|
17b94a |
+ if (reconnect_unref)
|
|
|
17b94a |
+ rpc_clnt_unref(clnt);
|
|
|
17b94a |
out:
|
|
|
17b94a |
return 0;
|
|
|
17b94a |
}
|
|
|
17b94a |
@@ -830,7 +839,7 @@ rpc_clnt_handle_disconnect(struct rpc_clnt *clnt, rpc_clnt_connection_t *conn)
|
|
|
17b94a |
pthread_mutex_lock(&conn->lock);
|
|
|
17b94a |
{
|
|
|
17b94a |
if (!conn->rpc_clnt->disabled && (conn->reconnect == NULL)) {
|
|
|
17b94a |
- ts.tv_sec = 10;
|
|
|
17b94a |
+ ts.tv_sec = 3;
|
|
|
17b94a |
ts.tv_nsec = 0;
|
|
|
17b94a |
|
|
|
17b94a |
rpc_clnt_ref(clnt);
|
|
|
17b94a |
diff --git a/xlators/mgmt/glusterd/src/glusterd-snapshot-utils.c b/xlators/mgmt/glusterd/src/glusterd-snapshot-utils.c
|
|
|
17b94a |
index 041946d..b3c4158 100644
|
|
|
17b94a |
--- a/xlators/mgmt/glusterd/src/glusterd-snapshot-utils.c
|
|
|
17b94a |
+++ b/xlators/mgmt/glusterd/src/glusterd-snapshot-utils.c
|
|
|
17b94a |
@@ -3364,6 +3364,25 @@ out:
|
|
|
17b94a |
return ret;
|
|
|
17b94a |
}
|
|
|
17b94a |
|
|
|
17b94a |
+int
|
|
|
17b94a |
+glusterd_is_path_mounted(const char *path)
|
|
|
17b94a |
+{
|
|
|
17b94a |
+ FILE *mtab = NULL;
|
|
|
17b94a |
+ struct mntent *part = NULL;
|
|
|
17b94a |
+ int is_mounted = 0;
|
|
|
17b94a |
+
|
|
|
17b94a |
+ if ((mtab = setmntent("/etc/mtab", "r")) != NULL) {
|
|
|
17b94a |
+ while ((part = getmntent(mtab)) != NULL) {
|
|
|
17b94a |
+ if ((part->mnt_fsname != NULL) &&
|
|
|
17b94a |
+ (strcmp(part->mnt_dir, path)) == 0) {
|
|
|
17b94a |
+ is_mounted = 1;
|
|
|
17b94a |
+ break;
|
|
|
17b94a |
+ }
|
|
|
17b94a |
+ }
|
|
|
17b94a |
+ endmntent(mtab);
|
|
|
17b94a |
+ }
|
|
|
17b94a |
+ return is_mounted;
|
|
|
17b94a |
+}
|
|
|
17b94a |
/* This function will do unmount for snaps.
|
|
|
17b94a |
*/
|
|
|
17b94a |
int32_t
|
|
|
17b94a |
@@ -3388,14 +3407,11 @@ glusterd_snap_unmount(xlator_t *this, glusterd_volinfo_t *volinfo)
|
|
|
17b94a |
continue;
|
|
|
17b94a |
}
|
|
|
17b94a |
|
|
|
17b94a |
- /* Fetch the brick mount path from the brickinfo->path */
|
|
|
17b94a |
- ret = glusterd_get_brick_root(brickinfo->path, &brick_mount_path);
|
|
|
17b94a |
+ ret = glusterd_find_brick_mount_path(brickinfo->path,
|
|
|
17b94a |
+ &brick_mount_path);
|
|
|
17b94a |
if (ret) {
|
|
|
17b94a |
- gf_msg(this->name, GF_LOG_INFO, 0, GD_MSG_BRICK_PATH_UNMOUNTED,
|
|
|
17b94a |
+ gf_msg(this->name, GF_LOG_ERROR, 0, GD_MSG_BRK_MNTPATH_GET_FAIL,
|
|
|
17b94a |
"Failed to find brick_mount_path for %s", brickinfo->path);
|
|
|
17b94a |
- /* There is chance that brick path is already
|
|
|
17b94a |
- * unmounted. */
|
|
|
17b94a |
- ret = 0;
|
|
|
17b94a |
goto out;
|
|
|
17b94a |
}
|
|
|
17b94a |
/* unmount cannot be done when the brick process is still in
|
|
|
17b94a |
@@ -3440,6 +3456,10 @@ glusterd_umount(const char *path)
|
|
|
17b94a |
GF_ASSERT(this);
|
|
|
17b94a |
GF_ASSERT(path);
|
|
|
17b94a |
|
|
|
17b94a |
+ if (!glusterd_is_path_mounted(path)) {
|
|
|
17b94a |
+ return 0;
|
|
|
17b94a |
+ }
|
|
|
17b94a |
+
|
|
|
17b94a |
runinit(&runner);
|
|
|
17b94a |
snprintf(msg, sizeof(msg), "umount path %s", path);
|
|
|
17b94a |
runner_add_args(&runner, _PATH_UMOUNT, "-f", path, NULL);
|
|
|
17b94a |
--
|
|
|
17b94a |
1.8.3.1
|
|
|
17b94a |
|