Hi Casey,

On Tue, 12 May 2026 at 14:13, Casey Connolly <[email protected]> wrote:
>
> Implement a super basic software TLB walk which can look up a single
> address in the TLB and print each stage of the translation. This is
> helpful for debugging TLB issues and will be compiled out if unused.
>
> Signed-off-by: Casey Connolly <[email protected]>
> ---
>  arch/arm/cpu/armv8/cache_v8.c    | 49 
> ++++++++++++++++++++++++++++++++++++++++
>  arch/arm/include/asm/armv8/mmu.h |  7 ++++++
>  2 files changed, 56 insertions(+)
>
> diff --git a/arch/arm/cpu/armv8/cache_v8.c b/arch/arm/cpu/armv8/cache_v8.c
> index 39479df7b21f..368c622cd18e 100644
> --- a/arch/arm/cpu/armv8/cache_v8.c
> +++ b/arch/arm/cpu/armv8/cache_v8.c
> @@ -733,8 +733,57 @@ void dump_pagetable(u64 ttbr, u64 tcr)
>                va_bits, va_bits < 39 ? 3 : 4);
>         walk_pagetable(ttbr, tcr, pagetable_print_entry, NULL);
>  }
>
> +/* Do a software pagetable walk for the given address */
> +void tlb_debug_lookup(u64 addr)
> +{
> +       u64 tcr = get_tcr(NULL, NULL);
> +       u64 va_bits = 64 - (tcr & (BIT(6) - 1));

Any reason you can't use va_bits from get_tcr?

> +       u64 ttbr = gd->arch.tlb_addr, *pte;
> +       int lshift, level = va_bits < 39 ? 1 : 0;
> +
> +       printf("Performing software TLB lookup of address %#010llx va_bits: 
> %lld\n", addr, va_bits);
> +
> +       addr = ALIGN_DOWN(addr, 0x1000);
> +       pte = ((u64 *)ttbr);
> +       for (int i = level; i < 4; i++) {
> +               int indent = (i - level + 1) * 2;
> +               lshift = level2shift(i);
> +               u32 idx = (addr >> lshift) & 0x1FF;
> +               u64 _addr;
> +
> +               printf("%*sPTE: %#010llx. addr[%d:%d]: %#05x (offset 
> %#07x)\n", indent, "", (u64)pte,
> +                      lshift + 8, lshift, idx, idx * 8);
> +               printf("%*sL%d: %#010llx -> ", indent, "", i, 
> (u64)(&pte[idx]));
> +
> +               pte = &pte[idx];
> +               _addr = *pte & GENMASK_ULL(va_bits, PAGE_SHIFT);
> +
> +               switch (pte_type(pte)) {
> +               case PTE_TYPE_FAULT:
> +                       printf("UNMAPPED!\n");
> +                       return;
> +               case PTE_TYPE_BLOCK:
> +                       printf("BLOCK (%#010llx)\n", _addr);
> +                       break;
> +               case PTE_TYPE_TABLE: // || PTE_TYPE_PAGE

Get rid of comments with // etc

> +                       if (i < 3) {
> +                               printf("TABLE (%#010llx)\n", _addr);
> +                               pte = (u64 *)_addr;
> +                               continue;
> +                       } else { // Page
> +                               printf("PAGE (%#010llx)\n", _addr);
> +                       }
> +                       break;

I think we should add a default here, so people can add more cases if
they need them

> +               }
> +
> +               // We did the lookup!
> +               printf("%*s[%#010llx - %#010llx]\n", indent + 2, "", _addr, 
> _addr + (1 << lshift));
> +               return;
> +       }
> +}
> +
>  /* Returns the estimated required size of all page tables */
>  __weak u64 get_page_table_size(void)
>  {
>         u64 one_pt = MAX_PTE_ENTRIES * sizeof(u64);
> diff --git a/arch/arm/include/asm/armv8/mmu.h 
> b/arch/arm/include/asm/armv8/mmu.h
> index 8aa5f9721c4a..ee81619a1843 100644
> --- a/arch/arm/include/asm/armv8/mmu.h
> +++ b/arch/arm/include/asm/armv8/mmu.h
> @@ -186,8 +186,15 @@ void walk_pagetable(u64 ttbr, u64 tcr, pte_walker_cb_t 
> cb, void *priv);
>   * @tcr: TCR value to use
>   */
>  void dump_pagetable(u64 ttbr, u64 tcr);
>
> +/**
> + * tlb_debug_lookup() - Perform a software TLB walk printing each stage
> + *
> + * @addr: the address to look-up in the TLB.
> + */
> +void tlb_debug_lookup(u64 addr);
> +
>  struct mm_region {
>         u64 virt;
>         u64 phys;
>         u64 size;
>
> --
> 2.53.0
>

Reply via email to