Hi Rob, a couple of suggestions for the way this erratum is gated, but I
haven't delved into the details of the erratum itself.

On Fri, Jul 17, 2020 at 02:52:33PM -0600, Rob Herring wrote:
> On Cortex-A77 r0p0 and r1p0, a sequence of a non-cacheable or device load
> and a store exclusive or PAR_EL1 read can cause a deadlock.
> 
> The workaround requires a DMB SY before and after a PAR_EL1 register read.
> A deadlock is still possible with the workaround as KVM guests must also
> have the workaround. IOW, a malicious guest can deadlock an affected
> system.
> 
> This workaround also depends on a firmware counterpart to enable the h/w
> to insert DMB SY after load and store exclusive instructions. See the
> errata document SDEN-1152370 v10 [1] for more information.
> 
> [1] https://static.docs.arm.com/101992/0010/Arm_Cortex_A77_MP074_Software_Developer_Errata_Notice_v10.pdf
> 
> Cc: Catalin Marinas <[email protected]>
> Cc: James Morse <[email protected]>
> Cc: Suzuki K Poulose <[email protected]>
> Cc: Will Deacon <[email protected]>
> Cc: Marc Zyngier <[email protected]>
> Cc: Julien Thierry <[email protected]>
> Cc: [email protected]
> Signed-off-by: Rob Herring <[email protected]>
> ---
> v3:
> - Add dmbs around PAR reads in KVM code
> - Clean-up 'work-around' and 'errata'
> 
> v2:
> - Don't disable KVM, just print warning
> ---
>  Documentation/arm64/silicon-errata.rst |  2 ++
>  arch/arm64/Kconfig                     | 19 +++++++++++++++++++
>  arch/arm64/include/asm/cpucaps.h       |  3 ++-
>  arch/arm64/include/asm/kvm_hyp.h       | 11 +++++++++++
>  arch/arm64/kernel/cpu_errata.c         | 10 ++++++++++
>  arch/arm64/kvm/arm.c                   |  3 ++-
>  arch/arm64/kvm/hyp/switch.c            |  7 ++++---
>  arch/arm64/kvm/hyp/sysreg-sr.c         |  2 +-
>  arch/arm64/kvm/sys_regs.c              |  8 +++++++-
>  arch/arm64/mm/fault.c                  | 10 ++++++++++
>  10 files changed, 68 insertions(+), 7 deletions(-)
> 
> diff --git a/Documentation/arm64/silicon-errata.rst b/Documentation/arm64/silicon-errata.rst
> index 936cf2a59ca4..716b279e3b33 100644
> --- a/Documentation/arm64/silicon-errata.rst
> +++ b/Documentation/arm64/silicon-errata.rst
> @@ -90,6 +90,8 @@ stable kernels.
>  
> +----------------+-----------------+-----------------+-----------------------------+
>  | ARM            | Cortex-A76      | #1463225        | ARM64_ERRATUM_1463225       |
>  
> +----------------+-----------------+-----------------+-----------------------------+
> +| ARM            | Cortex-A77      | #1508412        | ARM64_ERRATUM_1508412       |
> ++----------------+-----------------+-----------------+-----------------------------+
>  | ARM            | Neoverse-N1     | #1188873,1418040| ARM64_ERRATUM_1418040       |
>  
> +----------------+-----------------+-----------------+-----------------------------+
>  | ARM            | Neoverse-N1     | #1349291        | N/A                         |
> diff --git a/arch/arm64/Kconfig b/arch/arm64/Kconfig
> index a4a094bedcb2..6638444ce0d8 100644
> --- a/arch/arm64/Kconfig
> +++ b/arch/arm64/Kconfig
> @@ -626,6 +626,25 @@ config ARM64_ERRATUM_1542419
>  
>         If unsure, say Y.
>  
> +config ARM64_ERRATUM_1508412
> +     bool "Cortex-A77: 1508412: workaround deadlock on sequence of NC/Device load and store exclusive or PAR read"
> +     default y
> +     help
> +       This option adds a workaround for Arm Cortex-A77 erratum 1508412.
> +
> +       Affected Cortex-A77 cores (r0p0, r1p0) could deadlock on a sequence
> +       of a store-exclusive or read of PAR_EL1 and a load with device or
> +       non-cacheable memory attributes. The workaround depends on a firmware
> +       counterpart.
> +
> +       KVM guests must also have the workaround implemented or they can
> +       deadlock the system.
> +
> +       Work around the issue by inserting DMB SY barriers around PAR_EL1
> +       register reads and warning KVM users.
> +
> +       If unsure, say Y.
> +
>  config CAVIUM_ERRATUM_22375
>       bool "Cavium erratum 22375, 24313"
>       default y
> diff --git a/arch/arm64/include/asm/cpucaps.h b/arch/arm64/include/asm/cpucaps.h
> index d7b3bb0cb180..2a2cdb4ced8b 100644
> --- a/arch/arm64/include/asm/cpucaps.h
> +++ b/arch/arm64/include/asm/cpucaps.h
> @@ -62,7 +62,8 @@
>  #define ARM64_HAS_GENERIC_AUTH                       52
>  #define ARM64_HAS_32BIT_EL1                  53
>  #define ARM64_BTI                            54
> +#define ARM64_WORKAROUND_1508412             55
>  
> -#define ARM64_NCAPS                          55
> +#define ARM64_NCAPS                          56
>  
>  #endif /* __ASM_CPUCAPS_H */
> diff --git a/arch/arm64/include/asm/kvm_hyp.h b/arch/arm64/include/asm/kvm_hyp.h
> index ce3080834bfa..ce5b0d9b12bf 100644
> --- a/arch/arm64/include/asm/kvm_hyp.h
> +++ b/arch/arm64/include/asm/kvm_hyp.h
> @@ -46,6 +46,17 @@
>  #define read_sysreg_el2(r)   read_sysreg_elx(r, _EL2, _EL1)
>  #define write_sysreg_el2(v,r)        write_sysreg_elx(v, r, _EL2, _EL1)
>  
> +static inline u64 __hyp_text read_sysreg_par(void)
> +{
> +     u64 par;
> +     if (cpus_have_const_cap(ARM64_WORKAROUND_1508412))
> +             dmb(sy);
> +     par = read_sysreg(par_el1);
> +     if (cpus_have_const_cap(ARM64_WORKAROUND_1508412))
> +             dmb(sy);
> +     return par;
> +}
> +
>  /*
>   * Without an __arch_swab32(), we fall back to ___constant_swab32(), but the
>   * static inline can allow the compiler to out-of-line this. KVM always wants
> diff --git a/arch/arm64/kernel/cpu_errata.c b/arch/arm64/kernel/cpu_errata.c
> index ad06d6802d2e..5eee8a75540c 100644
> --- a/arch/arm64/kernel/cpu_errata.c
> +++ b/arch/arm64/kernel/cpu_errata.c
> @@ -938,6 +938,16 @@ const struct arm64_cpu_capabilities arm64_errata[] = {
>               .matches = has_neoverse_n1_erratum_1542419,
>               .cpu_enable = cpu_enable_trap_ctr_access,
>       },
> +#endif
> +#ifdef CONFIG_ARM64_ERRATUM_1508412
> +     {
> +             /* we depend on the firmware portion for correctness */
> +             .desc = "ARM erratum 1508412 (kernel portion)",
> +             .capability = ARM64_WORKAROUND_1508412,
> +             ERRATA_MIDR_RANGE(MIDR_CORTEX_A77,
> +                               0, 0,
> +                               1, 0),
> +     },
>  #endif
>       {
>       }
> diff --git a/arch/arm64/kvm/arm.c b/arch/arm64/kvm/arm.c
> index 9b070b5e212b..21d8b3ca5bd7 100644
> --- a/arch/arm64/kvm/arm.c
> +++ b/arch/arm64/kvm/arm.c
> @@ -1653,7 +1653,8 @@ int kvm_arch_init(void *opaque)
>               return -ENODEV;
>       }
>  
> -     if (cpus_have_const_cap(ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE))
> +     if (cpus_have_const_cap(ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE) ||
> +         cpus_have_const_cap(ARM64_WORKAROUND_1508412))

By the time KVM is initialized, it's safe to use cpus_have_final_cap()
rather than cpus_have_const_cap(), as the capabilities will have been
finalized by then.

It looks as though the other places where this capability is checked
all run after this point, so they can also use cpus_have_final_cap().
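
For example, the check above would then read (a sketch of the same
logic, just with the final-cap accessor; untested):

	if (cpus_have_final_cap(ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE) ||
	    cpus_have_final_cap(ARM64_WORKAROUND_1508412))

As a bonus, cpus_have_final_cap() BUGs if it is called before the
capabilities are finalized, so it also documents the ordering
requirement.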

>               kvm_info("Guests without required CPU erratum workarounds can deadlock system!\n" \
>                        "Only trusted guests should be used on this system.\n");
>  
> diff --git a/arch/arm64/kvm/hyp/switch.c b/arch/arm64/kvm/hyp/switch.c
> index db1c4487d95d..d76b6638b705 100644
> --- a/arch/arm64/kvm/hyp/switch.c
> +++ b/arch/arm64/kvm/hyp/switch.c
> @@ -298,11 +298,12 @@ static bool __hyp_text __translate_far_to_hpfar(u64 far, u64 *hpfar)
>        * We do need to save/restore PAR_EL1 though, as we haven't
>        * saved the guest context yet, and we may return early...
>        */
> -     par = read_sysreg(par_el1);
> +     par = read_sysreg_par();
> +
>       asm volatile("at s1e1r, %0" : : "r" (far));
>       isb();
>  
> -     tmp = read_sysreg(par_el1);
> +     tmp = read_sysreg_par();
>       write_sysreg(par, par_el1);
>  
>       if (unlikely(tmp & SYS_PAR_EL1_F))
> @@ -925,7 +926,7 @@ void __hyp_text __noreturn hyp_panic(struct kvm_cpu_context *host_ctxt)
>  {
>       u64 spsr = read_sysreg_el2(SYS_SPSR);
>       u64 elr = read_sysreg_el2(SYS_ELR);
> -     u64 par = read_sysreg(par_el1);
> +     u64 par = read_sysreg_par();
>  
>       if (!has_vhe())
>               __hyp_call_panic_nvhe(spsr, elr, par, host_ctxt);
> diff --git a/arch/arm64/kvm/hyp/sysreg-sr.c b/arch/arm64/kvm/hyp/sysreg-sr.c
> index cc7e957f5b2c..f522cbff291d 100644
> --- a/arch/arm64/kvm/hyp/sysreg-sr.c
> +++ b/arch/arm64/kvm/hyp/sysreg-sr.c
> @@ -52,7 +52,7 @@ static void __hyp_text __sysreg_save_el1_state(struct kvm_cpu_context *ctxt)
>       ctxt->sys_regs[CONTEXTIDR_EL1]  = read_sysreg_el1(SYS_CONTEXTIDR);
>       ctxt->sys_regs[AMAIR_EL1]       = read_sysreg_el1(SYS_AMAIR);
>       ctxt->sys_regs[CNTKCTL_EL1]     = read_sysreg_el1(SYS_CNTKCTL);
> -     ctxt->sys_regs[PAR_EL1]         = read_sysreg(par_el1);
> +     ctxt->sys_regs[PAR_EL1]         = read_sysreg_par();
>       ctxt->sys_regs[TPIDR_EL1]       = read_sysreg(tpidr_el1);
>  
>       ctxt->gp_regs.sp_el1            = read_sysreg(sp_el1);
> diff --git a/arch/arm64/kvm/sys_regs.c b/arch/arm64/kvm/sys_regs.c
> index baf5ce9225ce..3f798e0f1419 100644
> --- a/arch/arm64/kvm/sys_regs.c
> +++ b/arch/arm64/kvm/sys_regs.c
> @@ -94,10 +94,16 @@ static bool __vcpu_read_sys_reg_from_cpu(int reg, u64 *val)
>       case TPIDR_EL1:         *val = read_sysreg_s(SYS_TPIDR_EL1);    break;
>       case AMAIR_EL1:         *val = read_sysreg_s(SYS_AMAIR_EL12);   break;
>       case CNTKCTL_EL1:       *val = read_sysreg_s(SYS_CNTKCTL_EL12); break;
> -     case PAR_EL1:           *val = read_sysreg_s(SYS_PAR_EL1);      break;
>       case DACR32_EL2:        *val = read_sysreg_s(SYS_DACR32_EL2);   break;
>       case IFSR32_EL2:        *val = read_sysreg_s(SYS_IFSR32_EL2);   break;
>       case DBGVCR32_EL2:      *val = read_sysreg_s(SYS_DBGVCR32_EL2); break;
> +     case PAR_EL1:
> +             if (cpus_have_const_cap(ARM64_WORKAROUND_1508412))
> +                     dmb(sy);
> +             *val = read_sysreg_s(SYS_PAR_EL1);
> +             if (cpus_have_const_cap(ARM64_WORKAROUND_1508412))
> +                     dmb(sy);
> +             break;
>       default:                return false;
>       }
>  
> diff --git a/arch/arm64/mm/fault.c b/arch/arm64/mm/fault.c
> index 8afb238ff335..98609532e61a 100644
> --- a/arch/arm64/mm/fault.c
> +++ b/arch/arm64/mm/fault.c
> @@ -260,7 +260,17 @@ static bool __kprobes is_spurious_el1_translation_fault(unsigned long addr,
>       local_irq_save(flags);
>       asm volatile("at s1e1r, %0" :: "r" (addr));
>       isb();
> +     /*
> +      * Arm Erratum 1508412 requires dmb(sy) before and after reads of
> +      * PAR_EL1.
> +      * As this location is not a hot path, just condition it on the config
> +      * option.
> +      */
> +     if (IS_ENABLED(CONFIG_ARM64_ERRATUM_1508412))
> +             dmb(sy);
>       par = read_sysreg(par_el1);
> +     if (IS_ENABLED(CONFIG_ARM64_ERRATUM_1508412))
> +             dmb(sy);

Having the condition based simply on the config option brings in the
additional DMBs even when the CPU isn't affected by this erratum. The
config is default y, so this doesn't seem like an unlikely situation.

The comment mentions that this is not a hot path, but would an
alternative be applicable anyway? That's the approach taken for the
speculative AT errata:

  asm(ALTERNATIVE("nop", "dmb sy", ARM64_WORKAROUND_1508412));
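
With that, read_sysreg_par() could lose its branches too. A rough,
untested sketch, using the cpucap added by this patch:

  static inline u64 __hyp_text read_sysreg_par(void)
  {
  	u64 par;

  	/* Erratum 1508412: DMB SY before and after the PAR_EL1 read */
  	asm(ALTERNATIVE("nop", "dmb sy", ARM64_WORKAROUND_1508412));
  	par = read_sysreg(par_el1);
  	asm(ALTERNATIVE("nop", "dmb sy", ARM64_WORKAROUND_1508412));
  	return par;
  }

and a similar helper could be shared with the fault handling code
instead of open-coding the barriers there.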

>       local_irq_restore(flags);
>  
>       /*
> -- 
> 2.25.1
> 