On Thu, Nov 05, 2020 at 04:47:25PM +1100, Brad Campbell wrote:
> Commit fff2d0f701e6 ("hwmon: (applesmc) avoid overlong udelay()") introduced
> an issue whereby communication with the SMC became unreliable with write
> errors :
> 
> [  120.378614] applesmc: send_byte(0x00, 0x0300) fail: 0x40
> [  120.378621] applesmc: LKSB: write data fail
> [  120.512782] applesmc: send_byte(0x00, 0x0300) fail: 0x40
> [  120.512787] applesmc: LKSB: write data fail
> 
> The original code appeared to be timing sensitive and was not reliable with
> the timing changes in the aforementioned commit.
> 
> This patch re-factors the SMC communication to remove the timing 
> dependencies and restore function with the changes previously committed.
> 
> Reported-by: Andreas Kemnade <andr...@kemnade.info>

Add

Fixes: fff2d0f701e6 ("hwmon: (applesmc) avoid overlong udelay()")

> Signed-off-by: Brad Campbell <b...@fnarfbargle.com>
> 
> ---
> diff --git a/drivers/hwmon/applesmc.c b/drivers/hwmon/applesmc.c
> index a18887990f4a..22cc5122ce9a 100644
> --- a/drivers/hwmon/applesmc.c
> +++ b/drivers/hwmon/applesmc.c
> @@ -42,6 +42,11 @@
>  
>  #define APPLESMC_MAX_DATA_LENGTH 32
>  
> +/* Apple SMC status bits from VirtualSMC */
> +#define SMC_STATUS_AWAITING_DATA  0x01  ///< Data waiting to be read
> +#define SMC_STATUS_IB_CLOSED      0x02  /// A write is pending / will ignore 
> input
> +#define SMC_STATUS_BUSY           0x04  ///< Busy in the middle of a command.
> +

Maybe consider using BIT() while at it.

/* Please use standard comments */

Also, what does the "<" mean ? Is that supposed to be negated 
(ie bit set means not busy) ? If so, that isn't a standard notation
that I am aware of. Maybe "not set if busy in the middle of a command"
would be better in this case.

>  /* wait up to 128 ms for a status change. */
>  #define APPLESMC_MIN_WAIT    0x0010
>  #define APPLESMC_RETRY_WAIT  0x0100
> @@ -151,65 +156,77 @@ static unsigned int key_at_index;
>  static struct workqueue_struct *applesmc_led_wq;
>  
>  /*
> - * wait_read - Wait for a byte to appear on SMC port. Callers must
> - * hold applesmc_lock.
> + * Wait for specific status bits with a mask on the SMC
> + * Used before and after writes, and before reads
>   */
> -static int wait_read(void)
> +
> +static int wait_status(u8 val, u8 mask)
>  {
>       unsigned long end = jiffies + (APPLESMC_MAX_WAIT * HZ) / USEC_PER_SEC;
>       u8 status;
>       int us;
>  
>       for (us = APPLESMC_MIN_WAIT; us < APPLESMC_MAX_WAIT; us <<= 1) {
> -             usleep_range(us, us * 16);
>               status = inb(APPLESMC_CMD_PORT);
> -             /* read: wait for smc to settle */
> -             if (status & 0x01)
> +             if ((status & mask) == val)
>                       return 0;
>               /* timeout: give up */
>               if (time_after(jiffies, end))
>                       break;
> -     }
> -
> -     pr_warn("wait_read() fail: 0x%02x\n", status);
> +             usleep_range(us, us * 16);
> +             }
> +     pr_warn("wait_status timeout: 0x%02x, 0x%02x, 0x%02x\n", status, val, 
> mask);
>       return -EIO;
>  }
>  
>  /*
> - * send_byte - Write to SMC port, retrying when necessary. Callers
> + * send_byte_data - Write to SMC data port. Callers
>   * must hold applesmc_lock.
> + * Parameter skip must be true on the last write of any
> + * command or it'll time out.
>   */
> -static int send_byte(u8 cmd, u16 port)

I would suggest to keep send_byte() and change it to the following.

static int send_byte(u8 cmd, u16 port)
{
        return send_byte_data(cmd, port, false);
}

That would limit the number of changes needed later in the code
(it is never called with a hard 'true' as parameter).

> +
> +static int send_byte_data(u8 cmd, u16 port, bool skip)
>  {
> -     u8 status;
> -     int us;
> -     unsigned long end = jiffies + (APPLESMC_MAX_WAIT * HZ) / USEC_PER_SEC;
> +     u8 wstat = SMC_STATUS_BUSY;
>  
> +     if (skip)
> +             wstat = 0;

        u8 wstat = skip ? 0 : SMC_STATUS_BUSY;

> +     if (wait_status(SMC_STATUS_BUSY,
> +     SMC_STATUS_BUSY | SMC_STATUS_IB_CLOSED))

This fits one line, and the error code
should really not be overwritten.

        ret = wait_status(SMC_STATUS_BUSY, SMC_STATUS_BUSY | 
SMC_STATUS_IB_CLOSED);
        if (ret)
                return ret;

> +             goto fail;
>       outb(cmd, port);
> -     for (us = APPLESMC_MIN_WAIT; us < APPLESMC_MAX_WAIT; us <<= 1) {
> -             usleep_range(us, us * 16);
> -             status = inb(APPLESMC_CMD_PORT);
> -             /* write: wait for smc to settle */
> -             if (status & 0x02)
> -                     continue;
> -             /* ready: cmd accepted, return */
> -             if (status & 0x04)
> -                     return 0;
> -             /* timeout: give up */
> -             if (time_after(jiffies, end))
> -                     break;
> -             /* busy: long wait and resend */
> -             udelay(APPLESMC_RETRY_WAIT);
> -             outb(cmd, port);
> -     }
> -
> -     pr_warn("send_byte(0x%02x, 0x%04x) fail: 0x%02x\n", cmd, port, status);
> +     if (!wait_status(wstat,
> +     SMC_STATUS_BUSY))

That really fits into one line.

> +             return 0;
> +fail:
> +     pr_warn("send_byte_data(0x%02x, 0x%04x) fail\n", cmd, 
> APPLESMC_CMD_PORT);

Can you drop this message ? wait_status() already displays a message,
after all. Also, please reverse error handling, and don't overwrite
error codes.

        ret = wait_status(wstat, SMC_STATUS_BUSY)
        if (ret)
                return ret;

Actually, this can be simplified to
        return wait_status(wstat, SMC_STATUS_BUSY);
or, since wstat is only used once,
        return wait_status(skip ? 0 : SMC_STATUS_BUSY, SMC_STATUS_BUSY);

>       return -EIO;
>  }
>  
> +/*
> + * send_command - Write a command to the SMC. Callers must hold 
> applesmc_lock.
> + * If SMC is in undefined state, any new command write resets the state 
> machine.
> + */
> +
>  static int send_command(u8 cmd)
>  {
> -     return send_byte(cmd, APPLESMC_CMD_PORT);
> +     u8 status;
> +
> +     if (wait_status(0,
> +     SMC_STATUS_IB_CLOSED)) {

Another one of those odd continuation lines.

> +             pr_warn("send_command SMC was busy\n");

and logging noise. As for error handling, same as above, please

        ret = wait_status(0, SMC_STATUS_IB_CLOSED);
        if (ret)
                return ret;

> +             goto fail; }
> +
> +     status = inb(APPLESMC_CMD_PORT);
> +
> +     outb(cmd, APPLESMC_CMD_PORT);
> +     if (!wait_status(SMC_STATUS_BUSY,
> +     SMC_STATUS_BUSY))

Odd/unnecessary continuation line again.

> +             return 0;
> +fail:
> +     pr_warn("send_cmd(0x%02x, 0x%04x) fail\n", cmd, APPLESMC_CMD_PORT);

Wow, up to three messages on failure. Please, don't do that.
One message per failure is really enough. Please simplify to

        return wait_status(SMC_STATUS_BUSY, SMC_STATUS_BUSY);

Actually, I notice that the callers of send_command()
log yet again. Maybe it is time to drop all the messages
from here and from send_argument() and only log in the
calling code.

> +     return -EIO;
>  }
>  
>  static int send_argument(const char *key)
> @@ -217,7 +234,8 @@ static int send_argument(const char *key)
>       int i;
>  
>       for (i = 0; i < 4; i++)
> -             if (send_byte(key[i], APPLESMC_DATA_PORT))
> +     /* Parameter skip is false as we always send data after an argument */

Please align comments with code. Maybe move the comment ahead
of the for statement. Or drop it entirely - it doesn't add that
much value. Actually, this blob would go away if you keep
send_byte().

> +             if (send_byte_data(key[i], APPLESMC_DATA_PORT, false))
>                       return -EIO;
>       return 0;
>  }
> @@ -233,13 +251,15 @@ static int read_smc(u8 cmd, const char *key, u8 
> *buffer, u8 len)
>       }
>  
>       /* This has no effect on newer (2012) SMCs */
> -     if (send_byte(len, APPLESMC_DATA_PORT)) {
> +     if (send_byte_data(len, APPLESMC_DATA_PORT, false)) {
>               pr_warn("%.4s: read len fail\n", key);
>               return -EIO;
>       }
>  
>       for (i = 0; i < len; i++) {
> -             if (wait_read()) {
> +             if (wait_status(SMC_STATUS_AWAITING_DATA | SMC_STATUS_BUSY,
> +             SMC_STATUS_AWAITING_DATA | SMC_STATUS_BUSY |
> +             SMC_STATUS_IB_CLOSED)) {

Align continuatiuon lines with preceding '('. "checkpatch --strict"
reports all those alignment issues.

>                       pr_warn("%.4s: read data[%d] fail\n", key, i);
>                       return -EIO;
>               }
> @@ -250,7 +270,7 @@ static int read_smc(u8 cmd, const char *key, u8 *buffer, 
> u8 len)
>       for (i = 0; i < 16; i++) {
>               udelay(APPLESMC_MIN_WAIT);
>               status = inb(APPLESMC_CMD_PORT);
> -             if (!(status & 0x01))
> +             if (!(status & SMC_STATUS_AWAITING_DATA))
>                       break;
>               data = inb(APPLESMC_DATA_PORT);
>       }
> @@ -263,20 +283,21 @@ static int read_smc(u8 cmd, const char *key, u8 
> *buffer, u8 len)
>  static int write_smc(u8 cmd, const char *key, const u8 *buffer, u8 len)
>  {
>       int i;
> +     u8 end = len-1;

space before and after '-', please. checkpatch --strict will tell.

>  
>       if (send_command(cmd) || send_argument(key)) {
>               pr_warn("%s: write arg fail\n", key);
>               return -EIO;

I notice the driver keeps overwriting error codes. Oh well.
I can't expect you to fix that, and it should not be fixed as part
of this patch, but please don't make it worse (not here, but above
where calls are changed).

>       }
>  
> -     if (send_byte(len, APPLESMC_DATA_PORT)) {
> +     if (send_byte_data(len, APPLESMC_DATA_PORT, false)) {
>               pr_warn("%.4s: write len fail\n", key);
>               return -EIO;
>       }
>  
>       for (i = 0; i < len; i++) {
> -             if (send_byte(buffer[i], APPLESMC_DATA_PORT)) {
> -                     pr_warn("%s: write data fail\n", key);
> +             if (send_byte_data(buffer[i], APPLESMC_DATA_PORT, (i == end))) {

Unnecessary ( ) around i == end. Not sure if the 'end' variable
is worth it. Might as well make it "i == len - 1" and let the compiler
optimize it at will.

> +                     pr_warn("%s: write data fail at %i\n", key, i);
>                       return -EIO;
>               }
>       }

Reply via email to