Hi Casey,
On Tue, 12 May 2026 at 14:13, Casey Connolly <[email protected]> wrote:
>
> Implement a super basic software TLB walk which can look up a single
> address in the TLB and print each stage of the translation. This is
> helpful for debugging TLB issues and will be compiled out if unused.
>
> Signed-off-by: Casey Connolly <[email protected]>
> ---
> arch/arm/cpu/armv8/cache_v8.c | 49
> ++++++++++++++++++++++++++++++++++++++++
> arch/arm/include/asm/armv8/mmu.h | 7 ++++++
> 2 files changed, 56 insertions(+)
>
> diff --git a/arch/arm/cpu/armv8/cache_v8.c b/arch/arm/cpu/armv8/cache_v8.c
> index 39479df7b21f..368c622cd18e 100644
> --- a/arch/arm/cpu/armv8/cache_v8.c
> +++ b/arch/arm/cpu/armv8/cache_v8.c
> @@ -733,8 +733,57 @@ void dump_pagetable(u64 ttbr, u64 tcr)
> va_bits, va_bits < 39 ? 3 : 4);
> walk_pagetable(ttbr, tcr, pagetable_print_entry, NULL);
> }
>
> +/* Do a software pagetable walk for the given address */
> +void tlb_debug_lookup(u64 addr)
> +{
> + u64 tcr = get_tcr(NULL, NULL);
> + u64 va_bits = 64 - (tcr & (BIT(6) - 1));
Any reason you can't use va_bits from get_tcr?
> + u64 ttbr = gd->arch.tlb_addr, *pte;
> + int lshift, level = va_bits < 39 ? 1 : 0;
> +
> + printf("Performing software TLB lookup of address %#010llx va_bits:
> %lld\n", addr, va_bits);
> +
> + addr = ALIGN_DOWN(addr, 0x1000);
> + pte = ((u64 *)ttbr);
> + for (int i = level; i < 4; i++) {
> + int indent = (i - level + 1) * 2;
> + lshift = level2shift(i);
> + u32 idx = (addr >> lshift) & 0x1FF;
> + u64 _addr;
> +
> + printf("%*sPTE: %#010llx. addr[%d:%d]: %#05x (offset
> %#07x)\n", indent, "", (u64)pte,
> + lshift + 8, lshift, idx, idx * 8);
> + printf("%*sL%d: %#010llx -> ", indent, "", i,
> (u64)(&pte[idx]));
> +
> + pte = &pte[idx];
> + _addr = *pte & GENMASK_ULL(va_bits, PAGE_SHIFT);
> +
> + switch (pte_type(pte)) {
> + case PTE_TYPE_FAULT:
> + printf("UNMAPPED!\n");
> + return;
> + case PTE_TYPE_BLOCK:
> + printf("BLOCK (%#010llx)\n", _addr);
> + break;
> + case PTE_TYPE_TABLE: // || PTE_TYPE_PAGE
Get rid of comments with // etc
> + if (i < 3) {
> + printf("TABLE (%#010llx)\n", _addr);
> + pte = (u64 *)_addr;
> + continue;
> + } else { // Page
> + printf("PAGE (%#010llx)\n", _addr);
> + }
> + break;
I think we should add a default here, so people can add more cases if
they need them
> + }
> +
> + // We did the lookup!
> + printf("%*s[%#010llx - %#010llx]\n", indent + 2, "", _addr,
> _addr + (1 << lshift));
> + return;
> + }
> +}
> +
> /* Returns the estimated required size of all page tables */
> __weak u64 get_page_table_size(void)
> {
> u64 one_pt = MAX_PTE_ENTRIES * sizeof(u64);
> diff --git a/arch/arm/include/asm/armv8/mmu.h
> b/arch/arm/include/asm/armv8/mmu.h
> index 8aa5f9721c4a..ee81619a1843 100644
> --- a/arch/arm/include/asm/armv8/mmu.h
> +++ b/arch/arm/include/asm/armv8/mmu.h
> @@ -186,8 +186,15 @@ void walk_pagetable(u64 ttbr, u64 tcr, pte_walker_cb_t
> cb, void *priv);
> * @tcr: TCR value to use
> */
> void dump_pagetable(u64 ttbr, u64 tcr);
>
> +/**
> + * tlb_debug_lookup() - Perform a software TLB walk printing each stage
> + *
> + * @addr: the address to look-up in the TLB.
> + */
> +void tlb_debug_lookup(u64 addr);
> +
> struct mm_region {
> u64 virt;
> u64 phys;
> u64 size;
>
> --
> 2.53.0
>