d1681e
From dbf993f9c56c7ee995e9054b09c5552f88253bb3 Mon Sep 17 00:00:00 2001
d1681e
From: Ashish Pandey <aspandey@redhat.com>
d1681e
Date: Mon, 31 Jul 2017 12:45:21 +0530
d1681e
Subject: [PATCH 100/128] cluster/ec: Improve heal info command to handle
d1681e
 obvious cases
d1681e
d1681e
Problem:
d1681e
1 - If a brick is down and we see an index entry in
d1681e
.glusterfs/indices, we should show it in heal info
d1681e
output as it most certainly needs heal.
d1681e
d1681e
2 - The first problem is also not getting handled after
d1681e
ec_heal_inspect. Even if in ec_heal_inspect, lookup will
d1681e
mark need_heal as true, we don't handle it properly in
d1681e
ec_get_heal_info and continue with locked inspect which
d1681e
takes a lot of time.
d1681e
d1681e
Solution:
d1681e
1 - In the first case we need not do any further investigation.
d1681e
As soon as we see that a brick is down, we should say that
d1681e
this index entry needs heal for sure.
d1681e
d1681e
2 - In second case, if we have need_heal as _gf_true after
d1681e
ec_heal_inspect, we should show it as requiring heal.
d1681e
d1681e
>Change-Id: Ibe7f9d7602cc0b382ba53bddaf75a2a2c3326aa6
d1681e
>BUG: 1476668
d1681e
>Signed-off-by: Ashish Pandey <aspandey@redhat.com>
d1681e
Upstream Patch: https://review.gluster.org/#/c/17923/
d1681e
d1681e
BUG: 1509833
d1681e
Change-Id: Ibe7f9d7602cc0b382ba53bddaf75a2a2c3326aa6
d1681e
Signed-off-by: Sunil Kumar Acharya <sheggodu@redhat.com>
d1681e
Reviewed-on: https://code.engineering.redhat.com/gerrit/125194
d1681e
Tested-by: RHGS Build Bot <nigelb@redhat.com>
d1681e
---
d1681e
 xlators/cluster/ec/src/ec-common.h |  2 +-
d1681e
 xlators/cluster/ec/src/ec-heal.c   | 54 ++++++++++++++++++++++----------------
d1681e
 xlators/cluster/ec/src/ec-types.h  |  9 +++++++
d1681e
 3 files changed, 41 insertions(+), 24 deletions(-)
d1681e
d1681e
diff --git a/xlators/cluster/ec/src/ec-common.h b/xlators/cluster/ec/src/ec-common.h
d1681e
index 0f7a252..dec81ca 100644
d1681e
--- a/xlators/cluster/ec/src/ec-common.h
d1681e
+++ b/xlators/cluster/ec/src/ec-common.h
d1681e
@@ -132,7 +132,7 @@ int32_t
d1681e
 ec_heal_inspect (call_frame_t *frame, ec_t *ec,
d1681e
                  inode_t *inode, unsigned char *locked_on,
d1681e
                  gf_boolean_t self_locked, gf_boolean_t thorough,
d1681e
-                 gf_boolean_t *need_heal);
d1681e
+                 ec_heal_need_t *need_heal);
d1681e
 int32_t
d1681e
 ec_get_heal_info (xlator_t *this, loc_t *loc, dict_t **dict);
d1681e
 #endif /* __EC_COMMON_H__ */
d1681e
diff --git a/xlators/cluster/ec/src/ec-heal.c b/xlators/cluster/ec/src/ec-heal.c
d1681e
index bc25015..fd8c902 100644
d1681e
--- a/xlators/cluster/ec/src/ec-heal.c
d1681e
+++ b/xlators/cluster/ec/src/ec-heal.c
d1681e
@@ -2421,9 +2421,9 @@ ec_heal_do (xlator_t *this, void *data, loc_t *loc, int32_t partial)
d1681e
         intptr_t      bad            = 0;
d1681e
         ec_fop_data_t *fop           = data;
d1681e
         gf_boolean_t  blocking       = _gf_false;
d1681e
-        gf_boolean_t  need_heal      = _gf_false;
d1681e
+        ec_heal_need_t  need_heal    = EC_HEAL_NONEED;
d1681e
         unsigned char *up_subvols    = NULL;
d1681e
-	char up_bricks[32];
d1681e
+        char up_bricks[32];
d1681e
 
d1681e
         ec = this->private;
d1681e
 
d1681e
@@ -2470,7 +2470,8 @@ ec_heal_do (xlator_t *this, void *data, loc_t *loc, int32_t partial)
d1681e
          * triggers heals periodically which need not be thorough*/
d1681e
         ec_heal_inspect (frame, ec, loc->inode, up_subvols, _gf_false,
d1681e
                          !ec->shd.iamshd, &need_heal);
d1681e
-        if (!need_heal) {
d1681e
+
d1681e
+        if (need_heal == EC_HEAL_NONEED)  {
d1681e
                 gf_msg (ec->xl->name, GF_LOG_DEBUG, 0,
d1681e
                         EC_MSG_HEAL_FAIL, "Heal is not required for : %s ",
d1681e
                         uuid_utoa(loc->gfid));
d1681e
@@ -2776,18 +2777,18 @@ out:
d1681e
 static int32_t
d1681e
 _need_heal_calculate (ec_t *ec, uint64_t *dirty, unsigned char *sources,
d1681e
                       gf_boolean_t self_locked, int32_t lock_count,
d1681e
-                      gf_boolean_t *need_heal)
d1681e
+                      ec_heal_need_t *need_heal)
d1681e
 {
d1681e
         int i = 0;
d1681e
         int source_count = 0;
d1681e
 
d1681e
         source_count = EC_COUNT (sources, ec->nodes);
d1681e
         if (source_count == ec->nodes) {
d1681e
-                *need_heal = _gf_false;
d1681e
+                *need_heal = EC_HEAL_NONEED;
d1681e
                 if (self_locked || lock_count == 0) {
d1681e
                         for (i = 0; i < ec->nodes; i++) {
d1681e
                                 if (dirty[i]) {
d1681e
-                                        *need_heal = _gf_true;
d1681e
+                                        *need_heal = EC_HEAL_MUST;
d1681e
                                         goto out;
d1681e
                                 }
d1681e
                         }
d1681e
@@ -2799,13 +2800,13 @@ _need_heal_calculate (ec_t *ec, uint64_t *dirty, unsigned char *sources,
d1681e
                                  * set and this indicates a problem in the
d1681e
                                  * inode.*/
d1681e
                                 if (dirty[i] > 1) {
d1681e
-                                        *need_heal = _gf_true;
d1681e
+                                        *need_heal = EC_HEAL_MUST;
d1681e
                                         goto out;
d1681e
                                 }
d1681e
                         }
d1681e
                 }
d1681e
         } else {
d1681e
-                *need_heal = _gf_true;
d1681e
+                *need_heal = EC_HEAL_MUST;
d1681e
         }
d1681e
 
d1681e
 out:
d1681e
@@ -2815,7 +2816,7 @@ out:
d1681e
 static int32_t
d1681e
 ec_need_metadata_heal (ec_t *ec, inode_t *inode, default_args_cbk_t *replies,
d1681e
                        int32_t lock_count, gf_boolean_t self_locked,
d1681e
-                       gf_boolean_t thorough, gf_boolean_t *need_heal)
d1681e
+                       gf_boolean_t thorough, ec_heal_need_t *need_heal)
d1681e
 {
d1681e
         uint64_t           *dirty         = NULL;
d1681e
         unsigned char      *sources       = NULL;
d1681e
@@ -2836,10 +2837,10 @@ ec_need_metadata_heal (ec_t *ec, inode_t *inode, default_args_cbk_t *replies,
d1681e
 
d1681e
         ret = _need_heal_calculate (ec, dirty, sources, self_locked, lock_count,
d1681e
                                     need_heal);
d1681e
-        if (ret == ec->nodes && !(*need_heal)) {
d1681e
+        if (ret == ec->nodes && *need_heal == EC_HEAL_NONEED) {
d1681e
                 for (i = 1; i < ec->nodes; i++) {
d1681e
                         if (meta_versions[i] != meta_versions[0]) {
d1681e
-                                *need_heal = _gf_true;
d1681e
+                                *need_heal = EC_HEAL_MUST;
d1681e
                                 goto out;
d1681e
                         }
d1681e
                 }
d1681e
@@ -2851,7 +2852,7 @@ out:
d1681e
 static int32_t
d1681e
 ec_need_data_heal (ec_t *ec, inode_t *inode, default_args_cbk_t *replies,
d1681e
                    int32_t lock_count, gf_boolean_t self_locked,
d1681e
-                   gf_boolean_t thorough, gf_boolean_t *need_heal)
d1681e
+                   gf_boolean_t thorough, ec_heal_need_t *need_heal)
d1681e
 {
d1681e
         uint64_t           *dirty         = NULL;
d1681e
         unsigned char      *sources       = NULL;
d1681e
@@ -2888,7 +2889,7 @@ out:
d1681e
 static int32_t
d1681e
 ec_need_entry_heal (ec_t *ec, inode_t *inode, default_args_cbk_t *replies,
d1681e
                     int32_t lock_count, gf_boolean_t self_locked,
d1681e
-                    gf_boolean_t thorough, gf_boolean_t *need_heal)
d1681e
+                    gf_boolean_t thorough, ec_heal_need_t *need_heal)
d1681e
 {
d1681e
         uint64_t           *dirty         = NULL;
d1681e
         unsigned char      *sources       = NULL;
d1681e
@@ -2916,7 +2917,7 @@ out:
d1681e
 static int32_t
d1681e
 ec_need_heal (ec_t *ec, inode_t *inode, default_args_cbk_t *replies,
d1681e
               int32_t lock_count, gf_boolean_t self_locked,
d1681e
-              gf_boolean_t thorough, gf_boolean_t *need_heal)
d1681e
+              gf_boolean_t thorough, ec_heal_need_t *need_heal)
d1681e
 {
d1681e
         int                ret            = 0;
d1681e
 
d1681e
@@ -2926,7 +2927,7 @@ ec_need_heal (ec_t *ec, inode_t *inode, default_args_cbk_t *replies,
d1681e
         if (ret < 0)
d1681e
                 goto out;
d1681e
 
d1681e
-        if (*need_heal)
d1681e
+        if (*need_heal == EC_HEAL_MUST)
d1681e
                 goto out;
d1681e
 
d1681e
         if (inode->ia_type == IA_IFREG) {
d1681e
@@ -2945,7 +2946,7 @@ int32_t
d1681e
 ec_heal_inspect (call_frame_t *frame, ec_t *ec,
d1681e
                  inode_t *inode, unsigned char *locked_on,
d1681e
                  gf_boolean_t self_locked, gf_boolean_t thorough,
d1681e
-                 gf_boolean_t *need_heal)
d1681e
+                 ec_heal_need_t *need_heal)
d1681e
 {
d1681e
         loc_t              loc           = {0};
d1681e
         int                i             = 0;
d1681e
@@ -2989,7 +2990,7 @@ ec_heal_inspect (call_frame_t *frame, ec_t *ec,
d1681e
 
d1681e
         if (ret != ec->nodes) {
d1681e
                 ret = ec->nodes;
d1681e
-                *need_heal = _gf_true;
d1681e
+                *need_heal = EC_HEAL_MUST;
d1681e
                 goto out;
d1681e
         }
d1681e
 
d1681e
@@ -3009,6 +3010,9 @@ need_heal:
d1681e
         ret = ec_need_heal (ec, inode, replies, lock_count,
d1681e
                             self_locked, thorough, need_heal);
d1681e
 
d1681e
+        if (!self_locked && *need_heal == EC_HEAL_MUST) {
d1681e
+                *need_heal = EC_HEAL_MAYBE;
d1681e
+        }
d1681e
 out:
d1681e
         cluster_replies_wipe (replies, ec->nodes);
d1681e
         loc_wipe (&loc);
d1681e
@@ -3020,7 +3024,7 @@ out:
d1681e
 
d1681e
 int32_t
d1681e
 ec_heal_locked_inspect (call_frame_t *frame, ec_t *ec, inode_t *inode,
d1681e
-                        gf_boolean_t *need_heal)
d1681e
+                        ec_heal_need_t *need_heal)
d1681e
 {
d1681e
         unsigned char      *locked_on  = NULL;
d1681e
         unsigned char      *up_subvols = NULL;
d1681e
@@ -3038,7 +3042,7 @@ ec_heal_locked_inspect (call_frame_t *frame, ec_t *ec, inode_t *inode,
d1681e
                                replies, locked_on, frame, ec->xl,
d1681e
                                ec->xl->name, inode, 0, 0);
d1681e
         if (ret != ec->nodes) {
d1681e
-                *need_heal = _gf_true;
d1681e
+                *need_heal = EC_HEAL_MUST;
d1681e
                 goto unlock;
d1681e
         }
d1681e
         ret = ec_heal_inspect (frame, ec, inode, locked_on, _gf_true, _gf_true,
d1681e
@@ -3055,7 +3059,7 @@ int32_t
d1681e
 ec_get_heal_info (xlator_t *this, loc_t *entry_loc, dict_t **dict_rsp)
d1681e
 {
d1681e
         int             ret             = -ENOMEM;
d1681e
-        gf_boolean_t    need_heal       = _gf_false;
d1681e
+        ec_heal_need_t  need_heal       = EC_HEAL_NONEED;
d1681e
         call_frame_t    *frame          = NULL;
d1681e
         ec_t            *ec             = NULL;
d1681e
         unsigned char   *up_subvols     = NULL;
d1681e
@@ -3068,6 +3072,10 @@ ec_get_heal_info (xlator_t *this, loc_t *entry_loc, dict_t **dict_rsp)
d1681e
         up_subvols = alloca0(ec->nodes);
d1681e
         ec_mask_to_char_array (ec->xl_up, up_subvols, ec->nodes);
d1681e
 
d1681e
+        if (EC_COUNT (up_subvols, ec->nodes) != ec->nodes) {
d1681e
+                need_heal = EC_HEAL_MUST;
d1681e
+                goto set_heal;
d1681e
+        }
d1681e
         frame = create_frame (this, this->ctx->pool);
d1681e
         if (!frame) {
d1681e
                 goto out;
d1681e
@@ -3092,16 +3100,16 @@ ec_get_heal_info (xlator_t *this, loc_t *entry_loc, dict_t **dict_rsp)
d1681e
 
d1681e
         ret = ec_heal_inspect (frame, ec, loc.inode, up_subvols, _gf_false,
d1681e
                                _gf_false, &need_heal);
d1681e
-        if (ret == ec->nodes && !need_heal) {
d1681e
+        if (ret == ec->nodes && need_heal == EC_HEAL_NONEED) {
d1681e
                 goto set_heal;
d1681e
         }
d1681e
-        need_heal = _gf_false;
d1681e
+        need_heal = EC_HEAL_NONEED;
d1681e
         ret = ec_heal_locked_inspect (frame, ec, loc.inode,
d1681e
                                       &need_heal);
d1681e
         if (ret < 0)
d1681e
                 goto out;
d1681e
 set_heal:
d1681e
-        if (need_heal) {
d1681e
+        if (need_heal == EC_HEAL_MUST) {
d1681e
                 ret =  ec_set_heal_info (dict_rsp, "heal");
d1681e
         } else {
d1681e
                 ret =  ec_set_heal_info (dict_rsp, "no-heal");
d1681e
diff --git a/xlators/cluster/ec/src/ec-types.h b/xlators/cluster/ec/src/ec-types.h
d1681e
index 354b4ed..a891ff5 100644
d1681e
--- a/xlators/cluster/ec/src/ec-types.h
d1681e
+++ b/xlators/cluster/ec/src/ec-types.h
d1681e
@@ -17,6 +17,9 @@
d1681e
 
d1681e
 #define EC_GF_MAX_REGS 16
d1681e
 
d1681e
+enum _ec_heal_need;
d1681e
+typedef enum _ec_heal_need ec_heal_need_t;
d1681e
+
d1681e
 enum _ec_read_policy;
d1681e
 typedef enum _ec_read_policy ec_read_policy_t;
d1681e
 
d1681e
@@ -115,6 +118,12 @@ enum _ec_read_policy {
d1681e
         EC_READ_POLICY_MAX
d1681e
 };
d1681e
 
d1681e
+enum _ec_heal_need {
d1681e
+        EC_HEAL_NONEED,
d1681e
+        EC_HEAL_MAYBE,
d1681e
+        EC_HEAL_MUST
d1681e
+};
d1681e
+
d1681e
 struct _ec_config {
d1681e
     uint32_t version;
d1681e
     uint8_t  algorithm;
d1681e
-- 
d1681e
1.8.3.1
d1681e