> diff --git a/arch/powerpc/net/bpf_jit_comp64.c 
> b/arch/powerpc/net/bpf_jit_comp64.c
> index d7cd8ab6559c..cbaf811e1a35 100644
> --- a/arch/powerpc/net/bpf_jit_comp64.c
> +++ b/arch/powerpc/net/bpf_jit_comp64.c

[ ... ]

> @@ -245,9 +302,25 @@ static void bpf_jit_emit_common_epilogue(u32 *image, 
> struct codegen_context *ctx
>               EMIT(PPC_RAW_LD(bpf_to_ppc(ARENA_VM_START), _R1,
>                               bpf_jit_stack_offsetof(ctx, 
> bpf_to_ppc(ARENA_VM_START))));
>
> +     if (ctx->exception_cb) {
> +             /*
> +              * Recover additionally saved non volatile registers from stack
> +              * frame of exception boundary program.
> +              */
> +             for (i = _R14; i <= _R25; i++)
> +                     EMIT(PPC_RAW_LD(i, _R1, bpf_jit_stack_offsetof(ctx, 
> i)));
> +
> +             /*
> +              * LR value from boundary-frame is received as second parameter
> +              * in exception callback.
> +              */
> +             EMIT(PPC_RAW_MTLR(_R4));
                ^^^^^^^^^^^^^^^^^^^

This sets LR from R4 (the boundary's LR passed as second parameter).

> +     }
> +
>       /* Tear down our stack frame */
>       if (bpf_has_stack_frame(ctx)) {
> -             EMIT(PPC_RAW_ADDI(_R1, _R1, BPF_PPC_STACKFRAME + 
> ctx->stack_size));
> +             EMIT(PPC_RAW_ADDI(_R1, _R1, bpf_jit_stack_size(ctx) + 
> ctx->stack_size));
> +
>               if (ctx->seen & SEEN_FUNC || ctx->exception_cb) {
                                          ^^^^^^^^^^^^^^^^^^^^^
>                       EMIT(PPC_RAW_LD(_R0, _R1, PPC_LR_STKOFF));
>                       EMIT(PPC_RAW_MTLR(_R0));
                        ^^^^^^^^^^^^^^^^^^^

For exception_cb programs, bpf_has_stack_frame() returns true (the function
explicitly checks ctx->exception_cb). The condition on the inner if statement
also evaluates true because of "|| ctx->exception_cb".

This means for exception_cb programs, LR is first set correctly from R4,
but then immediately overwritten by loading from the stack and issuing a
second MTLR.

The comment above the EMIT(PPC_RAW_MTLR(_R4)) states that LR is received as
the second parameter, suggesting R4 is the authoritative source. If
exception_cb and exception_boundary have different stack_depth values, the
stack-loaded LR value after the ADDI may point to an incorrect location.

Should the inner condition exclude exception_cb, perhaps something like:

    if (ctx->seen & SEEN_FUNC && !ctx->exception_cb) {

Or alternatively, should the EMIT(PPC_RAW_MTLR(_R4)) be moved after the
stack teardown code to ensure it takes precedence?


---
AI reviewed your patch. Please fix the bug or email reply why it's not a bug.
See: https://github.com/kernel-patches/vmtest/blob/master/ci/claude/README.md

CI run summary: https://github.com/kernel-patches/bpf/actions/runs/21257691486

Reply via email to