On Mon, Jun 22, 2026 at 12:02 AM Charlie Jenkins via B4 Relay
<[email protected]> wrote:
>
> From: Charlie Jenkins <[email protected]>
>
> Migrate the alternatives patching code to use the generated instruction
> headers instead of the hand-written instruction composition functions.
>
> Signed-off-by: Charlie Jenkins <[email protected]>

Reviewed-by: Jesse Taube <[email protected]>
> ---
>
> These function expansions are very simple and almost expand to the same
> thing in the new and old version. The main difference is
> riscv_insn_auipc_extract_imm() in the new version expands to:
>
> ((_insn >> 12 & GENMASK(19, 0)) << 12)
>
> while it expands to the following in the old version:
>
> ((_insn >> 0) & GENMASK(31, 12))
>
> These are the same thing, but GCC is unable to properly optimize the
> second one so the first one ends up using almost half as many
> instructions. With this finding and other similar examples, I made
> the generated headers construct in the first way to help GCC optimize
> all of these functions.
>
> Brute force can also be checked with this code:
>
> void check_auipc_jalr() {
>         for (unsigned int auipc = 0; auipc < ((1ULL << 12) - 1); auipc++) {
>                 for (unsigned int jalr = 0; jalr < ((1ULL << 20) - 1); 
> jalr++) {
>                         unsigned int auipc_t=riscv_insn_auipc(auipc, 0), 
> jalr_t=riscv_insn_jalr(jalr, 0, 0), auipc_t2=riscv_insn_auipc(auipc, 0), 
> jalr_t2=riscv_insn_jalr(jalr, 0, 0);
>                         riscv_alternative_fix_auipc_jalr(&auipc_t, &jalr_t, 
> 0);
>                         riscv_alternative_fix_auipc_jalr2(&auipc_t2, 
> &jalr_t2, 0);
>
>                         if (auipc_t != auipc_t2) {
>                                 printf("auipcs don't match %u, %u: %u != 
> %u\n", auipc, jalr, auipc_t, auipc_t2);
>                                 return;
>                         }
>
>                         if (jalr_t != jalr_t2) {
>                                 printf("jalrs don't match %u: %u != %u\n", i, 
> jalr_t, jalr_t2);
>                         }
>                 }
>         }
> }
> ---
>  arch/riscv/include/asm/insn.h   | 74 
> -----------------------------------------
>  arch/riscv/kernel/alternative.c | 23 +++++++++----
>  2 files changed, 17 insertions(+), 80 deletions(-)
>
> diff --git a/arch/riscv/include/asm/insn.h b/arch/riscv/include/asm/insn.h
> index d562b2b40ba1..d0e137f9bcd7 100644
> --- a/arch/riscv/include/asm/insn.h
> +++ b/arch/riscv/include/asm/insn.h
> @@ -514,78 +514,4 @@ static __always_inline bool riscv_insn_is_branch(u32 
> code)
>
>  #define RVV_EXTRACT_VL_VS_WIDTH(x) RVFDQ_EXTRACT_FL_FS_WIDTH(x)
>
> -/*
> - * Get the immediate from a J-type instruction.
> - *
> - * @insn: instruction to process
> - * Return: immediate
> - */
> -static inline s32 riscv_insn_extract_jtype_imm(u32 insn)
> -{
> -       return RV_EXTRACT_JTYPE_IMM(insn);
> -}
> -
> -/*
> - * Update a J-type instruction with an immediate value.
> - *
> - * @insn: pointer to the jtype instruction
> - * @imm: the immediate to insert into the instruction
> - */
> -static inline void riscv_insn_insert_jtype_imm(u32 *insn, s32 imm)
> -{
> -       /* drop the old IMMs, all jal IMM bits sit at 31:12 */
> -       *insn &= ~GENMASK(31, 12);
> -       *insn |= (RV_X_MASK(imm, RV_J_IMM_10_1_OFF, RV_J_IMM_10_1_MASK) << 
> RV_J_IMM_10_1_OPOFF) |
> -                (RV_X_MASK(imm, RV_J_IMM_11_OFF, RV_J_IMM_11_MASK) << 
> RV_J_IMM_11_OPOFF) |
> -                (RV_X_MASK(imm, RV_J_IMM_19_12_OFF, RV_J_IMM_19_12_MASK) << 
> RV_J_IMM_19_12_OPOFF) |
> -                (RV_X_MASK(imm, RV_J_IMM_SIGN_OFF, 1) << 
> RV_J_IMM_SIGN_OPOFF);
> -}
> -
> -/*
> - * Put together one immediate from a U-type and I-type instruction pair.
> - *
> - * The U-type contains an upper immediate, meaning bits[31:12] with [11:0]
> - * being zero, while the I-type contains a 12bit immediate.
> - * Combined these can encode larger 32bit values and are used for example
> - * in auipc + jalr pairs to allow larger jumps.
> - *
> - * @utype_insn: instruction containing the upper immediate
> - * @itype_insn: instruction
> - * Return: combined immediate
> - */
> -static inline s32 riscv_insn_extract_utype_itype_imm(u32 utype_insn, u32 
> itype_insn)
> -{
> -       s32 imm;
> -
> -       imm = RV_EXTRACT_UTYPE_IMM(utype_insn);
> -       imm += RV_EXTRACT_ITYPE_IMM(itype_insn);
> -
> -       return imm;
> -}
> -
> -/*
> - * Update a set of two instructions (U-type + I-type) with an immediate 
> value.
> - *
> - * Used for example in auipc+jalrs pairs the U-type instructions contains
> - * a 20bit upper immediate representing bits[31:12], while the I-type
> - * instruction contains a 12bit immediate representing bits[11:0].
> - *
> - * This also takes into account that both separate immediates are
> - * considered as signed values, so if the I-type immediate becomes
> - * negative (BIT(11) set) the U-type part gets adjusted.
> - *
> - * @utype_insn: pointer to the utype instruction of the pair
> - * @itype_insn: pointer to the itype instruction of the pair
> - * @imm: the immediate to insert into the two instructions
> - */
> -static inline void riscv_insn_insert_utype_itype_imm(u32 *utype_insn, u32 
> *itype_insn, s32 imm)
> -{
> -       /* drop possible old IMM values */
> -       *utype_insn &= ~(RV_U_IMM_31_12_MASK);
> -       *itype_insn &= ~(RV_I_IMM_11_0_MASK << RV_I_IMM_11_0_OPOFF);
> -
> -       /* add the adapted IMMs */
> -       *utype_insn |= (imm & RV_U_IMM_31_12_MASK) + ((imm & BIT(11)) << 1);
> -       *itype_insn |= ((imm & RV_I_IMM_11_0_MASK) << RV_I_IMM_11_0_OPOFF);
> -}
>  #endif /* _ASM_RISCV_INSN_H */
> diff --git a/arch/riscv/kernel/alternative.c b/arch/riscv/kernel/alternative.c
> index 7642704c7f18..b26a90eb65cc 100644
> --- a/arch/riscv/kernel/alternative.c
> +++ b/arch/riscv/kernel/alternative.c
> @@ -11,6 +11,7 @@
>  #include <linux/cpu.h>
>  #include <linux/uaccess.h>
>  #include <asm/alternative.h>
> +#include <asm/insn.h>
>  #include <asm/module.h>
>  #include <asm/sections.h>
>  #include <asm/vdso.h>
> @@ -78,14 +79,24 @@ static void riscv_alternative_fix_auipc_jalr(void *ptr, 
> u32 auipc_insn,
>                                              u32 jalr_insn, int patch_offset)
>  {
>         u32 call[2] = { auipc_insn, jalr_insn };
> +       u32 auipc_imm;
>         s32 imm;
>
>         /* get and adjust new target address */
> -       imm = riscv_insn_extract_utype_itype_imm(auipc_insn, jalr_insn);
> +       imm = riscv_insn_auipc_extract_imm(auipc_insn) + 
> riscv_insn_jalr_extract_imm(jalr_insn);
>         imm -= patch_offset;
>
> +       /*
> +        * When the 32-bit immediate is split across auipc and jalr, the
> +        * constructed immediates need to be treated as individually sign
> +        * extended numbers. Add the sign bit of the lower 12 bits to the 
> upper
> +        * 20 bits to undo the bleeding of the sign.
> +        */
> +       auipc_imm = imm + (BIT(11) << 1);
> +
>         /* update instructions */
> -       riscv_insn_insert_utype_itype_imm(&call[0], &call[1], imm);
> +       riscv_insn_auipc_insert_imm(&call[0], auipc_imm);
> +       riscv_insn_jalr_insert_imm(&call[1], imm);
>
>         /* patch the call place again */
>         patch_text_nosync(ptr, call, sizeof(u32) * 2);
> @@ -96,11 +107,11 @@ static void riscv_alternative_fix_jal(void *ptr, u32 
> jal_insn, int patch_offset)
>         s32 imm;
>
>         /* get and adjust new target address */
> -       imm = riscv_insn_extract_jtype_imm(jal_insn);
> +       imm = riscv_insn_jal_extract_imm(jal_insn);
>         imm -= patch_offset;
>
>         /* update instruction */
> -       riscv_insn_insert_jtype_imm(&jal_insn, imm);
> +       riscv_insn_jal_insert_imm(&jal_insn, imm);
>
>         /* patch the call place again */
>         patch_text_nosync(ptr, &jal_insn, sizeof(u32));
> @@ -127,7 +138,7 @@ void riscv_alternative_fix_offsets(void *alt_ptr, 
> unsigned int len,
>                                 continue;
>
>                         /* if instruction pair is a call, it will use the ra 
> register */
> -                       if (RV_EXTRACT_RD_REG(insn) != 1)
> +                       if (riscv_insn_jalr_extract_xd(insn) != 1)
>                                 continue;
>
>                         riscv_alternative_fix_auipc_jalr(alt_ptr + i * 
> sizeof(u32),
> @@ -136,7 +147,7 @@ void riscv_alternative_fix_offsets(void *alt_ptr, 
> unsigned int len,
>                 }
>
>                 if (riscv_insn_is_jal(insn)) {
> -                       s32 imm = riscv_insn_extract_jtype_imm(insn);
> +                       s32 imm = riscv_insn_jal_extract_imm(insn);
>
>                         /* Don't modify jumps inside the alternative block */
>                         if ((alt_ptr + i * sizeof(u32) + imm) >= alt_ptr &&
>
> --
> 2.54.0
>
>
>
> _______________________________________________
> linux-riscv mailing list
> [email protected]
> http://lists.infradead.org/mailman/listinfo/linux-riscv
>


Reply via email to