Hi Vishal,

The corresponding kernel patch for this functionality has been merged
into the upstream ppc-next tree via the following commit:

de21e1377c4f("powerpc/papr_scm: Add support for reporting dirty-shutdown-count")

[Link] https://git.kernel.org/powerpc/c/de21e1377c4fe65bfd8d31e446482c1bc2232997

So the corresponding ndctl patch can now be merged.

Thanks,
~ Vaibhav

Vaibhav Jain <[email protected]> writes:

> Hi Vishal,
>
> Thanks for looking into this patch.
>
> "Verma, Vishal L" <[email protected]> writes:
>
>> On Fri, 2021-05-21 at 16:56 +0530, Vaibhav Jain wrote:
>>> Add support for reporting dirty-shutdown-count (DSC) for PAPR based
>>> NVDIMMs. The sysfs attribute exposing this value is located at
>>> nmemX/papr/dirty_shutdown.
>>> 
>>> This counter is also returned in payload for PAPR_PDSM_HEALTH as newly
>>> introduced member 'dimm_dsc' in 'struct nd_papr_pdsm_health'. Presence
>>> of 'DSC' is indicated by the PDSM_DIMM_DSC_VALID extension flag.
>>> 
>>> The patch implements the 'ndctl_dimm_ops.smart_get_shutdown_count'
>>> callback as papr_smart_get_shutdown_count().
>>> 
>>> Kernel side changes to support reporting DSC have been proposed at
>>> [1]. With updated kernel 'ndctl list -DH' reports following output on
>>> PPC64:
>>> 
>>> $ sudo ndctl list -DH
>>> [
>>>   {
>>>     "dev":"nmem0",
>>>     "health":{
>>>       "health_state":"ok",
>>>       "life_used_percentage":50,
>>>       "shutdown_state":"clean",
>>>       "shutdown_count":10
>>>     }
>>>   }
>>> ]
>>> 
>>> Link: 
>>> https://lore.kernel.org/nvdimm/[email protected]
>>
>> I'd suggest just using '[1]: <https://lore....'  for this. The Link:
>> trailer is added by 'b4' when I apply this patch, and points to this
>> patch on lore. It would be confusing to have two Link: trailers
>> pointing to different things.
>>
> Thanks for pointing this out. Will use your suggested format going
> forward.
>
>>> Signed-off-by: Vaibhav Jain <[email protected]>
>>> ---
>>>  ndctl/lib/libndctl.c  |  6 +++++-
>>>  ndctl/lib/papr.c      | 23 +++++++++++++++++++++++
>>>  ndctl/lib/papr_pdsm.h |  6 ++++++
>>>  3 files changed, 34 insertions(+), 1 deletion(-)
>>
>> The patch looks okay to me - but I assume it depends on the kernel
>> interfaces not changing in the patch referenced above. Should I put
>> this on hold until the kernel side is accepted?
>>
> Yes, it would be better to hold this until the corresponding kernel patch
> is merged.
>
>>> 
>>> diff --git a/ndctl/lib/libndctl.c b/ndctl/lib/libndctl.c
>>> index aa36a3c87c57..6ee426ae30e1 100644
>>> --- a/ndctl/lib/libndctl.c
>>> +++ b/ndctl/lib/libndctl.c
>>> @@ -1795,8 +1795,12 @@ static int add_papr_dimm(struct ndctl_dimm *dimm, 
>>> const char *dimm_base)
>>>  
>>>             /* Allocate monitor mode fd */
>>>             dimm->health_eventfd = open(path, O_RDONLY|O_CLOEXEC);
>>> -           rc = 0;
>>> +           /* Get the dirty shutdown counter value */
>>> +           sprintf(path, "%s/papr/dirty_shutdown", dimm_base);
>>> +           if (sysfs_read_attr(ctx, path, buf) == 0)
>>> +                   dimm->dirty_shutdown = strtoll(buf, NULL, 0);
>>>  
>>> +           rc = 0;
>>>     } else if (strcmp(buf, "nvdimm_test") == 0) {
>>>             /* probe via common populate_dimm_attributes() */
>>>             rc = populate_dimm_attributes(dimm, dimm_base, "papr");
>>> diff --git a/ndctl/lib/papr.c b/ndctl/lib/papr.c
>>> index 9c6f2f045fc2..42ff200dc588 100644
>>> --- a/ndctl/lib/papr.c
>>> +++ b/ndctl/lib/papr.c
>>> @@ -165,6 +165,9 @@ static unsigned int papr_smart_get_flags(struct 
>>> ndctl_cmd *cmd)
>>>             if (health.extension_flags & PDSM_DIMM_HEALTH_RUN_GAUGE_VALID)
>>>                     flags |= ND_SMART_USED_VALID;
>>>  
>>> +           if (health.extension_flags &  PDSM_DIMM_DSC_VALID)
>>> +                   flags |= ND_SMART_SHUTDOWN_COUNT_VALID;
>>> +
>>>             return flags;
>>>     }
>>>  
>>> @@ -236,6 +239,25 @@ static unsigned int papr_smart_get_life_used(struct 
>>> ndctl_cmd *cmd)
>>>             (100 - health.dimm_fuel_gauge) : 0;
>>>  }
>>>  
>>> +static unsigned int papr_smart_get_shutdown_count(struct ndctl_cmd *cmd)
>>> +{
>>> +
>>> +   struct nd_papr_pdsm_health health;
>>> +
>>> +   /* Ignore in case of error or invalid pdsm */
>>> +   if (!cmd_is_valid(cmd) ||
>>> +       to_pdsm(cmd)->cmd_status != 0 ||
>>> +       to_pdsm_cmd(cmd) != PAPR_PDSM_HEALTH)
>>> +           return 0;
>>> +
>>> +   /* get the payload from command */
>>> +   health = to_payload(cmd)->health;
>>> +
>>> +   return (health.extension_flags & PDSM_DIMM_DSC_VALID) ?
>>> +           (health.dimm_dsc) : 0;
>>> +
>>> +}
>>> +
>>>  struct ndctl_dimm_ops * const papr_dimm_ops = &(struct ndctl_dimm_ops) {
>>>     .cmd_is_supported = papr_cmd_is_supported,
>>>     .smart_get_flags = papr_smart_get_flags,
>>> @@ -245,4 +267,5 @@ struct ndctl_dimm_ops * const papr_dimm_ops = &(struct 
>>> ndctl_dimm_ops) {
>>>     .smart_get_health = papr_smart_get_health,
>>>     .smart_get_shutdown_state = papr_smart_get_shutdown_state,
>>>     .smart_get_life_used = papr_smart_get_life_used,
>>> +   .smart_get_shutdown_count = papr_smart_get_shutdown_count,
>>>  };
>>> diff --git a/ndctl/lib/papr_pdsm.h b/ndctl/lib/papr_pdsm.h
>>> index 1bac8a7fc933..f45b1e40c075 100644
>>> --- a/ndctl/lib/papr_pdsm.h
>>> +++ b/ndctl/lib/papr_pdsm.h
>>> @@ -75,6 +75,9 @@
>>>  /* Indicate that the 'dimm_fuel_gauge' field is valid */
>>>  #define PDSM_DIMM_HEALTH_RUN_GAUGE_VALID 1
>>>  
>>> +/* Indicate that the 'dimm_dsc' field is valid */
>>> +#define PDSM_DIMM_DSC_VALID 2
>>> +
>>>  /*
>>>   * Struct exchanged between kernel & ndctl in for PAPR_PDSM_HEALTH
>>>   * Various flags indicate the health status of the dimm.
>>> @@ -103,6 +106,9 @@ struct nd_papr_pdsm_health {
>>>  
>>>                     /* Extension flag PDSM_DIMM_HEALTH_RUN_GAUGE_VALID */
>>>                     __u16 dimm_fuel_gauge;
>>> +
>>> +                   /* Extension flag PDSM_DIMM_DSC_VALID */
>>> +                   __u64 dimm_dsc;
>>>             };
>>>             __u8 buf[ND_PDSM_PAYLOAD_MAX_SIZE];
>>>     };
>>

Reply via email to