apply_core_errata() currently runs both Cortex A53 and A57 part
checks even when no matching erratum is built in. For boards with no
ARM core errata, that means two MIDR_EL1 reads and two comparisons
on every CPU entry before lowlevel_init().

Only build the dispatch code when one of the supported errata is
enabled. When A57 errata are enabled, read MIDR_EL1 once and reuse
the extracted part number.

Measured on qemu_arm64_defconfig and ls2080aqds_qspi_defconfig:

Case                         before   after
qemu start.o text bytes      392      336
qemu linked text bytes       1437007  1436963
qemu dispatch instructions   15       1
ls2080 start.o text bytes    600      576
ls2080 dispatch instructions 33       26

A KVM virt microbench using the same dispatch instruction sequences
and one million calls gave:

Case            before ticks/call  after ticks/call  speedup
no errata path  27.09              20.78             1.30x
A57 miss path   28.93              26.50             1.09x

Signed-off-by: Josh Law <[email protected]>
---
 arch/arm/cpu/armv8/start.S | 35 ++++++++++++++++++++++++-----------
 1 file changed, 24 insertions(+), 11 deletions(-)

diff --git a/arch/arm/cpu/armv8/start.S b/arch/arm/cpu/armv8/start.S
index 40c342e97e9..5c847ed0f85 100644
--- a/arch/arm/cpu/armv8/start.S
+++ b/arch/arm/cpu/armv8/start.S
@@ -209,30 +209,41 @@ master_cpu:
 
 /*-----------------------------------------------------------------------*/
 
+#if defined(CONFIG_ARM_ERRATA_826974) || defined(CONFIG_ARM_ERRATA_828024) || \
+       defined(CONFIG_ARM_ERRATA_829520) || defined(CONFIG_ARM_ERRATA_833069) 
|| \
+       defined(CONFIG_ARM_ERRATA_833471)
+#define ARMV8_CORTEX_A57_ERRATA
+#endif
+
 WEAK(apply_core_errata)
 
+#if defined(CONFIG_ARM_ERRATA_855873) || defined(ARMV8_CORTEX_A57_ERRATA)
        mov     x29, lr                 /* Save LR */
        /* For now, we support Cortex-A53, Cortex-A57 specific errata */
+       mrs     x0, midr_el1
+       ubfx    x1, x0, #4, #12         /* CPU part number */
 
-       /* Check if we are running on a Cortex-A53 core */
-       branch_if_a53_core x0, apply_a53_core_errata
+#ifdef CONFIG_ARM_ERRATA_855873
+       cmp     x1, #0xD03              /* Cortex-A53 MPCore processor */
+       b.eq    apply_a53_core_errata
+#endif
 
-       /* Check if we are running on a Cortex-A57 core */
-       branch_if_a57_core x0, apply_a57_core_errata
+#ifdef ARMV8_CORTEX_A57_ERRATA
+       cmp     x1, #0xD07              /* Cortex-A57 MPCore processor */
+       b.eq    apply_a57_core_errata
+#endif
 0:
        mov     lr, x29                 /* Restore LR */
+#endif
        ret
 
-apply_a53_core_errata:
-
 #ifdef CONFIG_ARM_ERRATA_855873
-       mrs     x0, midr_el1
+apply_a53_core_errata:
        tst     x0, #(0xf << 20)
        b.ne    0b
 
-       mrs     x0, midr_el1
-       and     x0, x0, #0xf
-       cmp     x0, #3
+       and     x1, x0, #0xf
+       cmp     x1, #3
        b.lt    0b
 
        mrs     x0, S3_1_c15_c2_0       /* cpuactlr_el1 */
@@ -240,9 +251,10 @@ apply_a53_core_errata:
        orr     x0, x0, #1 << 44
        msr     S3_1_c15_c2_0, x0       /* cpuactlr_el1 */
        isb
-#endif
        b 0b
+#endif
 
+#ifdef ARMV8_CORTEX_A57_ERRATA
 apply_a57_core_errata:
 
 #ifdef CONFIG_ARM_ERRATA_828024
@@ -294,6 +306,7 @@ apply_a57_core_errata:
        isb
 #endif
        b 0b
+#endif
 ENDPROC(apply_core_errata)
 
 /*-----------------------------------------------------------------------*/
-- 
2.47.3

Reply via email to