anitazha / rpms / ndctl

Forked from rpms/ndctl 2 years ago
Clone

Blame SOURCES/aa99000-libndctl-papr-Add-support-for-reporting-shutdown-count.patch

0dc130
libndctl/papr: Add support for reporting shutdown-count
0dc130
0dc130
BZ: 
0dc130
Brew: 
0dc130
0dc130
commit aa990008f48f21121474a411d829f24e832c89a2
0dc130
Author: Vaibhav Jain <vaibhav@linux.ibm.com>
0dc130
Date:   Tue Jan 25 00:26:05 2022 +0530
0dc130
0dc130
    libndctl/papr: Add support for reporting shutdown-count
0dc130
    
0dc130
    Add support for reporting dirty-shutdown-count (DSC) for PAPR based
0dc130
    NVDIMMs. The sysfs attribute exposing this value is located at
0dc130
    nmemX/papr/dirty_shutdown.
0dc130
    
0dc130
    This counter is also returned in the payload for PAPR_PDSM_HEALTH as the newly
0dc130
    introduced member 'dimm_dsc' in 'struct nd_papr_pdsm_health'. Presence
0dc130
    of 'DSC' is indicated by the PDSM_DIMM_DSC_VALID extension flag.
0dc130
    
0dc130
    The patch implements 'ndctl_dimm_ops.smart_get_shutdown_count'
0dc130
    callback as papr_smart_get_shutdown_count().
0dc130
    
0dc130
    Kernel-side changes to support reporting DSC have been merged into the Linux kernel
0dc130
    via the patch proposed at [1]. With an updated kernel, 'ndctl list -DH' reports the
0dc130
    following output on PPC64:
0dc130
    
0dc130
    $ sudo ndctl list -DH
0dc130
    [
0dc130
      {
0dc130
        "dev":"nmem0",
0dc130
        "health":{
0dc130
          "health_state":"ok",
0dc130
          "life_used_percentage":50,
0dc130
          "shutdown_state":"clean",
0dc130
          "shutdown_count":10
0dc130
        }
0dc130
      }
0dc130
    ]
0dc130
    
0dc130
    [1] http://patchwork.ozlabs.org/project/linuxppc-dev/patch/20210624080621.252038-1-vaibhav@linux.ibm.com
0dc130
    
0dc130
    Link: https://lore.kernel.org/r/20220124185605.1465681-1-vaibhav@linux.ibm.com
0dc130
    Signed-off-by: Vaibhav Jain <vaibhav@linux.ibm.com>
0dc130
    Signed-off-by: Vishal Verma <vishal.l.verma@intel.com>
0dc130
0dc130
diff --git a/ndctl/lib/libndctl.c b/ndctl/lib/libndctl.c
0dc130
index 47a234c..5979a92 100644
0dc130
--- a/ndctl/lib/libndctl.c
0dc130
+++ b/ndctl/lib/libndctl.c
0dc130
@@ -1819,8 +1819,12 @@ static int add_papr_dimm(struct ndctl_dimm *dimm, const char *dimm_base)
0dc130
 
0dc130
 		/* Allocate monitor mode fd */
0dc130
 		dimm->health_eventfd = open(path, O_RDONLY|O_CLOEXEC);
0dc130
-		rc = 0;
0dc130
+		/* Get the dirty shutdown counter value */
0dc130
+		sprintf(path, "%s/papr/dirty_shutdown", dimm_base);
0dc130
+		if (sysfs_read_attr(ctx, path, buf) == 0)
0dc130
+			dimm->dirty_shutdown = strtoll(buf, NULL, 0);
0dc130
 
0dc130
+		rc = 0;
0dc130
 	} else if (strcmp(buf, "nvdimm_test") == 0) {
0dc130
 		/* probe via common populate_dimm_attributes() */
0dc130
 		rc = populate_dimm_attributes(dimm, dimm_base, "papr");
0dc130
diff --git a/ndctl/lib/papr.c b/ndctl/lib/papr.c
0dc130
index 43b8412..46cf9c1 100644
0dc130
--- a/ndctl/lib/papr.c
0dc130
+++ b/ndctl/lib/papr.c
0dc130
@@ -165,6 +165,9 @@ static unsigned int papr_smart_get_flags(struct ndctl_cmd *cmd)
0dc130
 		if (health.extension_flags & PDSM_DIMM_HEALTH_RUN_GAUGE_VALID)
0dc130
 			flags |= ND_SMART_USED_VALID;
0dc130
 
0dc130
+		if (health.extension_flags &  PDSM_DIMM_DSC_VALID)
0dc130
+			flags |= ND_SMART_SHUTDOWN_COUNT_VALID;
0dc130
+
0dc130
 		return flags;
0dc130
 	}
0dc130
 
0dc130
@@ -236,6 +239,25 @@ static unsigned int papr_smart_get_life_used(struct ndctl_cmd *cmd)
0dc130
 		(100 - health.dimm_fuel_gauge) : 0;
0dc130
 }
0dc130
 
0dc130
+static unsigned int papr_smart_get_shutdown_count(struct ndctl_cmd *cmd)
0dc130
+{
0dc130
+
0dc130
+	struct nd_papr_pdsm_health health;
0dc130
+
0dc130
+	/* Ignore in case of error or invalid pdsm */
0dc130
+	if (!cmd_is_valid(cmd) ||
0dc130
+	    to_pdsm(cmd)->cmd_status != 0 ||
0dc130
+	    to_pdsm_cmd(cmd) != PAPR_PDSM_HEALTH)
0dc130
+		return 0;
0dc130
+
0dc130
+	/* get the payload from command */
0dc130
+	health = to_payload(cmd)->health;
0dc130
+
0dc130
+	return (health.extension_flags & PDSM_DIMM_DSC_VALID) ?
0dc130
+		(health.dimm_dsc) : 0;
0dc130
+
0dc130
+}
0dc130
+
0dc130
 struct ndctl_dimm_ops * const papr_dimm_ops = &(struct ndctl_dimm_ops) {
0dc130
 	.cmd_is_supported = papr_cmd_is_supported,
0dc130
 	.smart_get_flags = papr_smart_get_flags,
0dc130
@@ -245,4 +267,5 @@ struct ndctl_dimm_ops * const papr_dimm_ops = &(struct ndctl_dimm_ops) {
0dc130
 	.smart_get_health = papr_smart_get_health,
0dc130
 	.smart_get_shutdown_state = papr_smart_get_shutdown_state,
0dc130
 	.smart_get_life_used = papr_smart_get_life_used,
0dc130
+	.smart_get_shutdown_count = papr_smart_get_shutdown_count,
0dc130
 };
0dc130
diff --git a/ndctl/lib/papr_pdsm.h b/ndctl/lib/papr_pdsm.h
0dc130
index 1bac8a7..f45b1e4 100644
0dc130
--- a/ndctl/lib/papr_pdsm.h
0dc130
+++ b/ndctl/lib/papr_pdsm.h
0dc130
@@ -75,6 +75,9 @@
0dc130
 /* Indicate that the 'dimm_fuel_gauge' field is valid */
0dc130
 #define PDSM_DIMM_HEALTH_RUN_GAUGE_VALID 1
0dc130
 
0dc130
+/* Indicate that the 'dimm_dsc' field is valid */
0dc130
+#define PDSM_DIMM_DSC_VALID 2
0dc130
+
0dc130
 /*
0dc130
  * Struct exchanged between kernel & ndctl in for PAPR_PDSM_HEALTH
0dc130
  * Various flags indicate the health status of the dimm.
0dc130
@@ -103,6 +106,9 @@ struct nd_papr_pdsm_health {
0dc130
 
0dc130
 			/* Extension flag PDSM_DIMM_HEALTH_RUN_GAUGE_VALID */
0dc130
 			__u16 dimm_fuel_gauge;
0dc130
+
0dc130
+			/* Extension flag PDSM_DIMM_DSC_VALID */
0dc130
+			__u64 dimm_dsc;
0dc130
 		};
0dc130
 		__u8 buf[ND_PDSM_PAYLOAD_MAX_SIZE];
0dc130
 	};