Re: [PATCH 07/12] aarch64: Use VNx16BI for svac*

Kyrylo Tkachov Thu, 31 Jul 2025 09:55:51 -0700

> On 29 Jul 2025, at 18:41, Richard Sandiford <richard.sandif...@arm.com> wrote:
> 
> This patch continues the work of making ACLE intrinsics use VNx16BI
> for svbool_t results.  It deals with the svac* intrinsics (floating-
> point compare absolute).

Ok.
Thanks,
Kyrill

> 
> gcc/
> * config/aarch64/aarch64-sve.md (@aarch64_pred_fac<cmp_op><mode>):
> Replace with...
> (@aarch64_pred_fac<cmp_op><mode>_acle): ...this new expander.
> (*aarch64_pred_fac<cmp_op><mode>_strict_acle): New pattern.
> * config/aarch64/aarch64-sve-builtins-base.cc
> (svac_impl::expand): Update accordingly.
> 
> gcc/testsuite/
> * gcc.target/aarch64/sve/acle/general/acge_1.c: New test.
> * gcc.target/aarch64/sve/acle/general/acgt_1.c: Likewise.
> * gcc.target/aarch64/sve/acle/general/acle_1.c: Likewise.
> * gcc.target/aarch64/sve/acle/general/aclt_1.c: Likewise.
> ---
> .../aarch64/aarch64-sve-builtins-base.cc      |   3 +-
> gcc/config/aarch64/aarch64-sve.md             |  63 ++++++++---
> .../aarch64/sve/acle/general/acge_1.c         | 104 ++++++++++++++++++
> .../aarch64/sve/acle/general/acgt_1.c         | 104 ++++++++++++++++++
> .../aarch64/sve/acle/general/acle_1.c         | 104 ++++++++++++++++++
> .../aarch64/sve/acle/general/aclt_1.c         | 104 ++++++++++++++++++
> 6 files changed, 465 insertions(+), 17 deletions(-)
> create mode 100644 gcc/testsuite/gcc.target/aarch64/sve/acle/general/acge_1.c
> create mode 100644 gcc/testsuite/gcc.target/aarch64/sve/acle/general/acgt_1.c
> create mode 100644 gcc/testsuite/gcc.target/aarch64/sve/acle/general/acle_1.c
> create mode 100644 gcc/testsuite/gcc.target/aarch64/sve/acle/general/aclt_1.c
> 
> diff --git a/gcc/config/aarch64/aarch64-sve-builtins-base.cc 
> b/gcc/config/aarch64/aarch64-sve-builtins-base.cc
> index 79b5d570694..d58d5972baf 100644
> --- a/gcc/config/aarch64/aarch64-sve-builtins-base.cc
> +++ b/gcc/config/aarch64/aarch64-sve-builtins-base.cc
> @@ -214,7 +214,8 @@ public:
>   expand (function_expander &e) const override
>   {
>     e.add_ptrue_hint (0, e.gp_mode (0));
> -    insn_code icode = code_for_aarch64_pred_fac (m_unspec, e.vector_mode 
> (0));
> +    insn_code icode = code_for_aarch64_pred_fac_acle (m_unspec,
> +      e.vector_mode (0));
>     return e.use_exact_insn (icode);
>   }
> 
> diff --git a/gcc/config/aarch64/aarch64-sve.md 
> b/gcc/config/aarch64/aarch64-sve.md
> index 70fbc5ce2df..b881ba851b6 100644
> --- a/gcc/config/aarch64/aarch64-sve.md
> +++ b/gcc/config/aarch64/aarch64-sve.md
> @@ -9306,23 +9306,30 @@ (define_insn_and_split "*fcmuo<mode>_nor_combine"
> ;; -------------------------------------------------------------------------
> 
> ;; Predicated floating-point absolute comparisons.
> -(define_expand "@aarch64_pred_fac<cmp_op><mode>"
> -  [(set (match_operand:<VPRED> 0 "register_operand")
> - (unspec:<VPRED>
> -  [(match_operand:<VPRED> 1 "register_operand")
> -   (match_operand:SI 2 "aarch64_sve_ptrue_flag")
> -   (unspec:SVE_FULL_F
> -     [(match_dup 1)
> -      (match_dup 2)
> -      (match_operand:SVE_FULL_F 3 "register_operand")]
> -     UNSPEC_COND_FABS)
> -   (unspec:SVE_FULL_F
> -     [(match_dup 1)
> -      (match_dup 2)
> -      (match_operand:SVE_FULL_F 4 "register_operand")]
> -     UNSPEC_COND_FABS)]
> -  SVE_COND_FP_ABS_CMP))]
> +(define_expand "@aarch64_pred_fac<cmp_op><mode>_acle"
> +  [(set (match_operand:VNx16BI 0 "register_operand")
> + (and:VNx16BI
> +  (subreg:VNx16BI
> +    (unspec:<VPRED>
> +      [(match_operand:<VPRED> 1 "register_operand")
> +       (match_operand:SI 2 "aarch64_sve_ptrue_flag")
> +       (unspec:SVE_FULL_F
> + [(match_dup 1)
> +  (match_dup 2)
> +  (match_operand:SVE_FULL_F 3 "register_operand")]
> + UNSPEC_COND_FABS)
> +       (unspec:SVE_FULL_F
> + [(match_dup 1)
> +  (match_dup 2)
> +  (match_operand:SVE_FULL_F 4 "register_operand")]
> + UNSPEC_COND_FABS)]
> +      SVE_COND_FP_ABS_CMP)
> +    0)
> +  (match_dup 5)))]
>   "TARGET_SVE"
> +  {
> +    operands[5] = aarch64_ptrue_all (GET_MODE_UNIT_SIZE (<MODE>mode));
> +  }
> )
> 
> (define_insn_and_rewrite "*aarch64_pred_fac<cmp_op><mode>_relaxed"
> @@ -9371,6 +9378,30 @@ (define_insn "*aarch64_pred_fac<cmp_op><mode>_strict"
>   "fac<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, %3.<Vetype>"
> )
> 
> +(define_insn "*aarch64_pred_fac<cmp_op><mode>_strict_acle"
> +  [(set (match_operand:VNx16BI 0 "register_operand" "=Upa")
> + (and:VNx16BI
> +  (subreg:VNx16BI
> +    (unspec:<VPRED>
> +      [(match_operand:<VPRED> 1 "register_operand" "Upl")
> +       (match_operand:SI 4 "aarch64_sve_ptrue_flag")
> +       (unspec:SVE_FULL_F
> + [(match_dup 1)
> +  (match_operand:SI 5 "aarch64_sve_gp_strictness")
> +  (match_operand:SVE_FULL_F 2 "register_operand" "w")]
> + UNSPEC_COND_FABS)
> +       (unspec:SVE_FULL_F
> + [(match_dup 1)
> +  (match_operand:SI 6 "aarch64_sve_gp_strictness")
> +  (match_operand:SVE_FULL_F 3 "register_operand" "w")]
> + UNSPEC_COND_FABS)]
> +      SVE_COND_FP_ABS_CMP)
> +    0)
> +  (match_operand:<VPRED> 7 "aarch64_ptrue_all_operand")))]
> +  "TARGET_SVE"
> +  "fac<cmp_op>\t%0.<Vetype>, %1/z, %2.<Vetype>, %3.<Vetype>"
> +)
> +
> ;; -------------------------------------------------------------------------
> ;; ---- [PRED] Select
> ;; -------------------------------------------------------------------------
> diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acge_1.c 
> b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acge_1.c
> new file mode 100644
> index 00000000000..37428a86700
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acge_1.c
> @@ -0,0 +1,104 @@
> +/* { dg-do compile } */
> +/* { dg-options "-O2" } */
> +/* { dg-final { check-function-bodies "**" "" } } */
> +
> +#include <arm_sve.h>
> +
> +#ifdef __cplusplus
> +extern "C" {
> +#endif
> +
> +/*
> +** test1:
> +** facge p0\.h, p0/z, z0\.h, z1\.h
> +** ret
> +*/
> +svbool_t
> +test1 (svbool_t pg, svfloat16_t x, svfloat16_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacge (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test2:
> +** facge p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test2 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacge (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test3:
> +** facge p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test3 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacge (pg, x, y),
> +  svptrue_b32 ());
> +}
> +
> +/*
> +** test4:
> +** facge p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test4 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacge (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test5:
> +** facge p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test5 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svacge (pg, x, y),
> +  svptrue_b8 ());
> +}
> +
> +/*
> +** test6:
> +** facge p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test6 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacge (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +/*
> +** test7:
> +** facge p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test7 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svacge (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +#ifdef __cplusplus
> +}
> +#endif
> diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acgt_1.c 
> b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acgt_1.c
> new file mode 100644
> index 00000000000..5829369a479
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acgt_1.c
> @@ -0,0 +1,104 @@
> +/* { dg-do compile } */
> +/* { dg-options "-O2" } */
> +/* { dg-final { check-function-bodies "**" "" } } */
> +
> +#include <arm_sve.h>
> +
> +#ifdef __cplusplus
> +extern "C" {
> +#endif
> +
> +/*
> +** test1:
> +** facgt p0\.h, p0/z, z0\.h, z1\.h
> +** ret
> +*/
> +svbool_t
> +test1 (svbool_t pg, svfloat16_t x, svfloat16_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacgt (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test2:
> +** facgt p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test2 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacgt (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test3:
> +** facgt p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test3 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacgt (pg, x, y),
> +  svptrue_b32 ());
> +}
> +
> +/*
> +** test4:
> +** facgt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test4 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacgt (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test5:
> +** facgt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test5 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svacgt (pg, x, y),
> +  svptrue_b8 ());
> +}
> +
> +/*
> +** test6:
> +** facgt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test6 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacgt (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +/*
> +** test7:
> +** facgt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test7 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svacgt (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +#ifdef __cplusplus
> +}
> +#endif
> diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acle_1.c 
> b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acle_1.c
> new file mode 100644
> index 00000000000..bd5200e94b7
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/acle_1.c
> @@ -0,0 +1,104 @@
> +/* { dg-do compile } */
> +/* { dg-options "-O2" } */
> +/* { dg-final { check-function-bodies "**" "" } } */
> +
> +#include <arm_sve.h>
> +
> +#ifdef __cplusplus
> +extern "C" {
> +#endif
> +
> +/*
> +** test1:
> +** facle p0\.h, p0/z, z0\.h, z1\.h
> +** ret
> +*/
> +svbool_t
> +test1 (svbool_t pg, svfloat16_t x, svfloat16_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacle (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test2:
> +** facle p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test2 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacle (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test3:
> +** facle p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test3 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacle (pg, x, y),
> +  svptrue_b32 ());
> +}
> +
> +/*
> +** test4:
> +** facle p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test4 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacle (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test5:
> +** facle p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test5 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svacle (pg, x, y),
> +  svptrue_b8 ());
> +}
> +
> +/*
> +** test6:
> +** facle p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test6 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svacle (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +/*
> +** test7:
> +** facle p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test7 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svacle (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +#ifdef __cplusplus
> +}
> +#endif
> diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/general/aclt_1.c 
> b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/aclt_1.c
> new file mode 100644
> index 00000000000..876aba965e2
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/general/aclt_1.c
> @@ -0,0 +1,104 @@
> +/* { dg-do compile } */
> +/* { dg-options "-O2" } */
> +/* { dg-final { check-function-bodies "**" "" } } */
> +
> +#include <arm_sve.h>
> +
> +#ifdef __cplusplus
> +extern "C" {
> +#endif
> +
> +/*
> +** test1:
> +** faclt p0\.h, p0/z, z0\.h, z1\.h
> +** ret
> +*/
> +svbool_t
> +test1 (svbool_t pg, svfloat16_t x, svfloat16_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svaclt (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test2:
> +** faclt p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test2 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svaclt (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test3:
> +** faclt p0\.s, p0/z, z0\.s, z1\.s
> +** ret
> +*/
> +svbool_t
> +test3 (svbool_t pg, svfloat32_t x, svfloat32_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svaclt (pg, x, y),
> +  svptrue_b32 ());
> +}
> +
> +/*
> +** test4:
> +** faclt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test4 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svaclt (pg, x, y),
> +  svptrue_b16 ());
> +}
> +
> +/*
> +** test5:
> +** faclt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test5 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svaclt (pg, x, y),
> +  svptrue_b8 ());
> +}
> +
> +/*
> +** test6:
> +** faclt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test6 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b8 (),
> +  svaclt (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +/*
> +** test7:
> +** faclt p0\.d, p0/z, z0\.d, z1\.d
> +** ret
> +*/
> +svbool_t
> +test7 (svbool_t pg, svfloat64_t x, svfloat64_t y)
> +{
> +  return svand_z (svptrue_b32 (),
> +  svaclt (pg, x, y),
> +  svptrue_b64 ());
> +}
> +
> +#ifdef __cplusplus
> +}
> +#endif
> -- 
> 2.43.0
>
Re: [PATCH 07/12] aarch64: Use VNx16BI for svac*

Reply via email to