Re: [PATCH] RISC-V: Support combine extend and reduce sum to widen reduce sum

Kito Cheng via Gcc-patches Thu, 14 Sep 2023 09:05:27 -0700

LGTM


On Thu, Sep 14, 2023 at 11:51 PM Lehua Ding <lehua.d...@rivai.ai> wrote:
>
> This patch add combine pattern to combine extend and reduce sum
> to widen reduce sum. The pattern in autovec.md was adjusted as
> needed. Note that the current vectorization cannot generate reduce
> openrand which is LMUL=M8, because this means that we need an LMUL=M16
> for the extended openrand, which is currently not possible. So I've
> added VI_QHS_NO_M8 and VF_HS_NO_M8 mode iterator, which exclude
> mode which is LMUL=M8.
>
>         PR target/111381
>
> gcc/ChangeLog:
>
>         * config/riscv/autovec-opt.md (*reduc_plus_scal_<mode>):
>         New combine pattern.
>         (*fold_left_widen_plus_<mode>): Ditto.
>         (*mask_len_fold_left_widen_plus_<mode>): Ditto.
>         * config/riscv/autovec.md (reduc_plus_scal_<mode>):
>         Change from define_expand to define_insn_and_split.
>         (fold_left_plus_<mode>): Ditto.
>         (mask_len_fold_left_plus_<mode>): Ditto.
>         * config/riscv/riscv-v.cc (expand_reduction):
>         Support widen reduction.
>         * config/riscv/vector-iterators.md (UNSPEC_WREDUC_SUM):
>         Add new iterators and attrs.
>
> gcc/testsuite/ChangeLog:
>
>         * gcc.target/riscv/rvv/autovec/widen/widen_reduc-1.c: New test.
>         * gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-1.c: New test.
>         * gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-2.c: New test.
>         * gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-1.c: New 
> test.
>         * gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-2.c: New 
> test.
>         * gcc.target/riscv/rvv/autovec/widen/widen_reduc_run-1.c: New test.
>
> ---
>  gcc/config/riscv/autovec-opt.md               | 82 +++++++++++++++++++
>  gcc/config/riscv/autovec.md                   | 74 +++++++++++------
>  gcc/config/riscv/riscv-v.cc                   |  7 +-
>  gcc/config/riscv/vector-iterators.md          | 51 ++++++++++++
>  .../riscv/rvv/autovec/widen/widen_reduc-1.c   | 27 ++++++
>  .../rvv/autovec/widen/widen_reduc_order-1.c   | 20 +++++
>  .../rvv/autovec/widen/widen_reduc_order-2.c   | 19 +++++
>  .../autovec/widen/widen_reduc_order_run-1.c   | 24 ++++++
>  .../autovec/widen/widen_reduc_order_run-2.c   | 22 +++++
>  .../rvv/autovec/widen/widen_reduc_run-1.c     | 22 +++++
>  10 files changed, 321 insertions(+), 27 deletions(-)
>  create mode 100644 
> gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc-1.c
>  create mode 100644 
> gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-1.c
>  create mode 100644 
> gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-2.c
>  create mode 100644 
> gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-1.c
>  create mode 100644 
> gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-2.c
>  create mode 100644 
> gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_run-1.c
>
> diff --git a/gcc/config/riscv/autovec-opt.md b/gcc/config/riscv/autovec-opt.md
> index 22ab8afc994..df516849527 100644
> --- a/gcc/config/riscv/autovec-opt.md
> +++ b/gcc/config/riscv/autovec-opt.md
> @@ -1196,6 +1196,88 @@
>  }
>  [(set_attr "type" "vfwmul")])
>
> +;; Combine extend + vredsum to vwredsum[u]
> +(define_insn_and_split "*reduc_plus_scal_<mode>"
> +  [(set (match_operand:<V_DOUBLE_EXTEND_VEL> 0 "register_operand")
> +        (unspec:<V_DOUBLE_EXTEND_VEL> [
> +          (any_extend:<V_DOUBLE_EXTEND>
> +            (match_operand:VI_QHS_NO_M8 1 "register_operand"))
> +        ] UNSPEC_REDUC_SUM))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
> +{
> +  riscv_vector::expand_reduction (<WREDUC_UNSPEC>, operands,
> +                                  CONST0_RTX (<V_DOUBLE_EXTEND_VEL>mode));
> +  DONE;
> +}
> +[(set_attr "type" "vector")])
> +
> +;; Combine extend + vfredusum to vfwredusum
> +(define_insn_and_split "*reduc_plus_scal_<mode>"
> +  [(set (match_operand:<V_DOUBLE_EXTEND_VEL> 0 "register_operand")
> +        (unspec:<V_DOUBLE_EXTEND_VEL> [
> +          (float_extend:<V_DOUBLE_EXTEND>
> +            (match_operand:VF_HS_NO_M8 1 "register_operand"))
> +        ] UNSPEC_REDUC_SUM_UNORDERED))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
> +{
> +  riscv_vector::expand_reduction (UNSPEC_WREDUC_SUM_UNORDERED, operands,
> +                                  CONST0_RTX (<V_DOUBLE_EXTEND_VEL>mode));
> +  DONE;
> +}
> +[(set_attr "type" "vector")])
> +
> +;; Combine extend + vfredosum to vfwredosum
> +(define_insn_and_split "*fold_left_widen_plus_<mode>"
> +  [(set (match_operand:<V_DOUBLE_EXTEND_VEL> 0 "register_operand")
> +        (unspec:<V_DOUBLE_EXTEND_VEL> [
> +          (float_extend:<V_DOUBLE_EXTEND>
> +            (match_operand:VF_HS_NO_M8 2 "register_operand"))
> +          (match_operand:<V_DOUBLE_EXTEND_VEL> 1 "register_operand")
> +        ] UNSPEC_REDUC_SUM_ORDERED))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
> +{
> +  riscv_vector::expand_reduction (UNSPEC_WREDUC_SUM_ORDERED, operands,
> +                                 operands[1],
> +                                 riscv_vector::reduction_type::FOLD_LEFT);
> +  DONE;
> +}
> +[(set_attr "type" "vector")])
> +
> +;; Combine extend + mask vfredosum to mask vfwredosum
> +(define_insn_and_split "*mask_len_fold_left_widen_plus_<mode>"
> +  [(set (match_operand:<V_DOUBLE_EXTEND_VEL> 0 "register_operand")
> +        (unspec:<V_DOUBLE_EXTEND_VEL> [
> +          (float_extend:<V_DOUBLE_EXTEND>
> +            (match_operand:VF_HS_NO_M8 2 "register_operand"))
> +          (match_operand:<V_DOUBLE_EXTEND_VEL> 1 "register_operand")
> +          (match_operand:<VM> 3 "vector_mask_operand")
> +          (match_operand 4 "autovec_length_operand")
> +          (match_operand 5 "const_0_operand")
> +        ] UNSPEC_REDUC_SUM_ORDERED))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
> +{
> +  if (rtx_equal_p (operands[4], const0_rtx))
> +    emit_move_insn (operands[0], operands[1]);
> +  else
> +    riscv_vector::expand_reduction (UNSPEC_WREDUC_SUM_ORDERED, operands,
> +                                   operands[1],
> +                                   
> riscv_vector::reduction_type::MASK_LEN_FOLD_LEFT);
> +  DONE;
> +}
> +[(set_attr "type" "vector")])
> +
>  ;; 
> =============================================================================
>  ;; Misc combine patterns
>  ;; 
> =============================================================================
> diff --git a/gcc/config/riscv/autovec.md b/gcc/config/riscv/autovec.md
> index 9e05afddd29..4a5f4fd3716 100644
> --- a/gcc/config/riscv/autovec.md
> +++ b/gcc/config/riscv/autovec.md
> @@ -2086,14 +2086,20 @@
>  ;; - vredxor.vs
>  ;; -------------------------------------------------------------------------
>
> -(define_expand "reduc_plus_scal_<mode>"
> -  [(match_operand:<VEL> 0 "register_operand")
> -   (match_operand:VI 1 "register_operand")]
> -  "TARGET_VECTOR"
> +(define_insn_and_split "reduc_plus_scal_<mode>"
> +  [(set (match_operand:<VEL> 0 "register_operand")
> +        (unspec:<VEL> [
> +             (match_operand:VI 1 "register_operand")
> +        ] UNSPEC_REDUC_SUM))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
>  {
>    riscv_vector::expand_reduction (UNSPEC_REDUC_SUM, operands, CONST0_RTX 
> (<VEL>mode));
>    DONE;
> -})
> +}
> +[(set_attr "type" "vector")])
>
>  (define_expand "reduc_smax_scal_<mode>"
>    [(match_operand:<VEL> 0 "register_operand")
> @@ -2173,15 +2179,21 @@
>  ;; - vfredmin.vs
>  ;; -------------------------------------------------------------------------
>
> -(define_expand "reduc_plus_scal_<mode>"
> -  [(match_operand:<VEL> 0 "register_operand")
> -   (match_operand:VF 1 "register_operand")]
> -  "TARGET_VECTOR"
> +(define_insn_and_split "reduc_plus_scal_<mode>"
> +  [(set (match_operand:<VEL> 0 "register_operand")
> +        (unspec:<VEL> [
> +             (match_operand:VF 1 "register_operand")
> +        ] UNSPEC_REDUC_SUM_UNORDERED))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
>  {
>    riscv_vector::expand_reduction (UNSPEC_REDUC_SUM_UNORDERED, operands,
>                                    CONST0_RTX (<VEL>mode));
>    DONE;
> -})
> +}
> +[(set_attr "type" "vector")])
>
>  (define_expand "reduc_smax_scal_<mode>"
>    [(match_operand:<VEL> 0 "register_operand")
> @@ -2215,27 +2227,38 @@
>  ;; -------------------------------------------------------------------------
>
>  ;; Unpredicated in-order FP reductions.
> -(define_expand "fold_left_plus_<mode>"
> -  [(match_operand:<VEL> 0 "register_operand")
> -   (match_operand:<VEL> 1 "register_operand")
> -   (match_operand:VF 2 "register_operand")]
> -  "TARGET_VECTOR"
> +(define_insn_and_split "fold_left_plus_<mode>"
> +  [(set (match_operand:<VEL> 0 "register_operand")
> +        (unspec:<VEL> [
> +             (match_operand:VF 2 "register_operand")
> +             (match_operand:<VEL> 1 "register_operand")
> +        ] UNSPEC_REDUC_SUM_ORDERED))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
>  {
>    riscv_vector::expand_reduction (UNSPEC_REDUC_SUM_ORDERED, operands,
>                                   operands[1],
>                                   riscv_vector::reduction_type::FOLD_LEFT);
>    DONE;
> -})
> +}
> +[(set_attr "type" "vector")])
>
>  ;; Predicated in-order FP reductions.
> -(define_expand "mask_len_fold_left_plus_<mode>"
> -  [(match_operand:<VEL> 0 "register_operand")
> -   (match_operand:<VEL> 1 "register_operand")
> -   (match_operand:VF 2 "register_operand")
> -   (match_operand:<VM> 3 "vector_mask_operand")
> -   (match_operand 4 "autovec_length_operand")
> -   (match_operand 5 "const_0_operand")]
> -  "TARGET_VECTOR"
> +(define_insn_and_split "mask_len_fold_left_plus_<mode>"
> +  [(set (match_operand:<VEL> 0 "register_operand")
> +        (unspec:<VEL> [
> +          (match_operand:VF 2 "register_operand")
> +          (match_operand:<VEL> 1 "register_operand")
> +          (match_operand:<VM> 3 "vector_mask_operand")
> +          (match_operand 4 "autovec_length_operand")
> +          (match_operand 5 "const_0_operand")
> +        ] UNSPEC_REDUC_SUM_ORDERED))]
> +  "TARGET_VECTOR && can_create_pseudo_p ()"
> +  "#"
> +  "&& 1"
> +  [(const_int 0)]
>  {
>    if (rtx_equal_p (operands[4], const0_rtx))
>      emit_move_insn (operands[0], operands[1]);
> @@ -2244,7 +2267,8 @@
>                                     operands[1],
>                                     
> riscv_vector::reduction_type::MASK_LEN_FOLD_LEFT);
>    DONE;
> -})
> +}
> +[(set_attr "type" "vector")])
>
>  ;; -------------------------------------------------------------------------
>  ;; ---- [INT,FP] Extract active element
> diff --git a/gcc/config/riscv/riscv-v.cc b/gcc/config/riscv/riscv-v.cc
> index 1bf5471beaf..668594b65ed 100644
> --- a/gcc/config/riscv/riscv-v.cc
> +++ b/gcc/config/riscv/riscv-v.cc
> @@ -3212,7 +3212,8 @@ expand_reduction (unsigned unspec, rtx *ops, rtx init, 
> reduction_type type)
>  {
>    rtx vector = type == reduction_type::UNORDERED ? ops[1] : ops[2];
>    machine_mode vmode = GET_MODE (vector);
> -  machine_mode m1_mode = get_m1_mode (vmode).require ();
> +  machine_mode vel_mode = GET_MODE (ops[0]);
> +  machine_mode m1_mode = get_m1_mode (vel_mode).require ();
>
>    rtx m1_tmp = gen_reg_rtx (m1_mode);
>    rtx scalar_move_ops[] = {m1_tmp, init};
> @@ -3225,7 +3226,9 @@ expand_reduction (unsigned unspec, rtx *ops, rtx init, 
> reduction_type type)
>    rtx reduc_ops[] = {m1_tmp2, vector, m1_tmp};
>
>    if (unspec == UNSPEC_REDUC_SUM_ORDERED
> -      || unspec == UNSPEC_REDUC_SUM_UNORDERED)
> +      || unspec == UNSPEC_WREDUC_SUM_ORDERED
> +      || unspec == UNSPEC_REDUC_SUM_UNORDERED
> +      || unspec == UNSPEC_WREDUC_SUM_UNORDERED)
>      {
>        insn_code icode = code_for_pred (unspec, vmode);
>        if (type == reduction_type::MASK_LEN_FOLD_LEFT)
> diff --git a/gcc/config/riscv/vector-iterators.md 
> b/gcc/config/riscv/vector-iterators.md
> index c9d0a501910..fa9892cebc1 100644
> --- a/gcc/config/riscv/vector-iterators.md
> +++ b/gcc/config/riscv/vector-iterators.md
> @@ -686,6 +686,14 @@
>    RVVM8SI RVVM4SI RVVM2SI RVVM1SI (RVVMF2SI "TARGET_MIN_VLEN > 32")
>  ])
>
> +(define_mode_iterator VI_QHS_NO_M8 [
> +  RVVM4QI RVVM2QI RVVM1QI RVVMF2QI RVVMF4QI (RVVMF8QI "TARGET_MIN_VLEN > 32")
> +
> +  RVVM4HI RVVM2HI RVVM1HI RVVMF2HI (RVVMF4HI "TARGET_MIN_VLEN > 32")
> +
> +  RVVM4SI RVVM2SI RVVM1SI (RVVMF2SI "TARGET_MIN_VLEN > 32")
> +])
> +
>  (define_mode_iterator VF_HS [
>    (RVVM8HF "TARGET_ZVFH") (RVVM4HF "TARGET_ZVFH") (RVVM2HF "TARGET_ZVFH")
>    (RVVM1HF "TARGET_ZVFH") (RVVMF2HF "TARGET_ZVFH")
> @@ -695,6 +703,23 @@
>    (RVVM1SF "TARGET_VECTOR_ELEN_FP_32") (RVVMF2SF "TARGET_VECTOR_ELEN_FP_32 
> && TARGET_MIN_VLEN > 32")
>  ])
>
> +(define_mode_iterator VF_HS_NO_M8 [
> +  (RVVM4HF "TARGET_ZVFH")
> +  (RVVM2HF "TARGET_ZVFH")
> +  (RVVM1HF "TARGET_ZVFH")
> +  (RVVMF2HF "TARGET_ZVFH")
> +  (RVVMF4HF "TARGET_ZVFH && TARGET_MIN_VLEN > 32")
> +  (RVVM4SF "TARGET_VECTOR_ELEN_FP_32")
> +  (RVVM2SF "TARGET_VECTOR_ELEN_FP_32")
> +  (RVVM1SF "TARGET_VECTOR_ELEN_FP_32")
> +  (RVVMF2SF "TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN > 32")
> +])
> +
> +(define_mode_iterator VF_HS_M8 [
> +  (RVVM8HF "TARGET_ZVFH")
> +  (RVVM8SF "TARGET_VECTOR_ELEN_FP_32")
> +])
> +
>  (define_mode_iterator V_VLSI_QHS [
>    RVVM8QI RVVM4QI RVVM2QI RVVM1QI RVVMF2QI RVVMF4QI (RVVMF8QI 
> "TARGET_MIN_VLEN > 32")
>
> @@ -1319,6 +1344,8 @@
>    (UNSPEC_WREDUC_SUM_ORDERED "wredosum") (UNSPEC_WREDUC_SUM_UNORDERED 
> "wredusum")
>  ])
>
> +(define_code_attr WREDUC_UNSPEC [(zero_extend "UNSPEC_WREDUC_SUMU") 
> (sign_extend "UNSPEC_WREDUC_SUM")])
> +
>  (define_mode_attr VINDEX [
>    (RVVM8QI "RVVM8QI") (RVVM4QI "RVVM4QI") (RVVM2QI "RVVM2QI") (RVVM1QI 
> "RVVM1QI")
>    (RVVMF2QI "RVVMF2QI") (RVVMF4QI "RVVMF4QI") (RVVMF8QI "RVVMF8QI")
> @@ -1743,6 +1770,18 @@
>    (V1DF "DF") (V2DF "DF") (V4DF "DF") (V8DF "DF") (V16DF "DF") (V32DF "DF") 
> (V64DF "DF") (V128DF "DF") (V256DF "DF") (V512DF "DF")
>  ])
>
> +(define_mode_attr V_DOUBLE_EXTEND_VEL [
> +  (RVVM4QI "HI") (RVVM2QI "HI") (RVVM1QI "HI") (RVVMF2QI "HI") (RVVMF4QI 
> "HI") (RVVMF8QI "HI")
> +
> +  (RVVM4HI "SI") (RVVM2HI "SI") (RVVM1HI "SI") (RVVMF2HI "SI") (RVVMF4HI 
> "SI")
> +
> +  (RVVM4SI "DI") (RVVM2SI "DI") (RVVM1SI "DI") (RVVMF2SI "DI")
> +
> +  (RVVM4HF "SF") (RVVM2HF "SF") (RVVM1HF "SF") (RVVMF2HF "SF") (RVVMF4HF 
> "SF")
> +
> +  (RVVM4SF "DF") (RVVM2SF "DF") (RVVM1SF "DF") (RVVMF2SF "DF")
> +])
> +
>  (define_mode_attr vel [
>    (RVVM8QI "qi") (RVVM4QI "qi") (RVVM2QI "qi") (RVVM1QI "qi") (RVVMF2QI 
> "qi") (RVVMF4QI "qi") (RVVMF8QI "qi")
>
> @@ -2101,6 +2140,18 @@
>    (RVVM1QI "64") (RVVMF2QI "64") (RVVMF4QI "64") (RVVMF8QI "64")
>  ])
>
> +(define_mode_attr V_DOUBLE_EXTEND [
> +  (RVVM4QI "RVVM8HI") (RVVM2QI "RVVM4HI") (RVVM1QI "RVVM2HI") (RVVMF2QI 
> "RVVM1HI") (RVVMF4QI "RVVMF2HI") (RVVMF8QI "RVVMF4HI")
> +
> +  (RVVM4HI "RVVM8SI") (RVVM2HI "RVVM4SI") (RVVM1HI "RVVM2SI") (RVVMF2HI 
> "RVVM1SI") (RVVMF4HI "RVVMF2SI")
> +
> +  (RVVM4SI "RVVM8DI") (RVVM2SI "RVVM4DI") (RVVM1SI "RVVM2DI") (RVVMF2SI 
> "RVVM1DI")
> +
> +  (RVVM4HF "RVVM8SF") (RVVM2HF "RVVM4SF") (RVVM1HF "RVVM2SF") (RVVMF2HF 
> "RVVM1SF") (RVVMF4HF "RVVMF2SF")
> +
> +  (RVVM4SF "RVVM8DF") (RVVM2SF "RVVM4DF") (RVVM1SF "RVVM2DF") (RVVMF2SF 
> "RVVM1DF")
> +])
> +
>  (define_mode_attr V_DOUBLE_TRUNC [
>    (RVVM8HI "RVVM4QI") (RVVM4HI "RVVM2QI") (RVVM2HI "RVVM1QI") (RVVM1HI 
> "RVVMF2QI") (RVVMF2HI "RVVMF4QI") (RVVMF4HI "RVVMF8QI")
>
> diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc-1.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc-1.c
> new file mode 100644
> index 00000000000..80756468ec1
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc-1.c
> @@ -0,0 +1,27 @@
> +/* { dg-do compile } */
> +/* { dg-additional-options "-march=rv64gcv_zvfh_zvl128b -mabi=lp64d --param 
> riscv-autovec-preference=fixed-vlmax --param riscv-autovec-lmul=m2 
> -fno-vect-cost-model -ffast-math" } */
> +#include <stdint-gcc.h>
> +
> +#define TEST_TYPE(TYPE1, TYPE2, N)                                           
>   \
> +  __attribute__((noipa)) TYPE1 reduc_##TYPE1##_##TYPE2(TYPE2 *restrict a) {  
>   \
> +    TYPE1 sum = 0;                                                           
>   \
> +    for (int i = 0; i < N; i += 1)                                           
>   \
> +      sum += a[i];                                                           
>   \
> +    return sum;                                                              
>   \
> +  }
> +
> +#define TEST_ALL(TEST)                                                       
>   \
> +  TEST(int16_t, int8_t, 16)                                                  
>   \
> +  TEST(int32_t, int16_t, 8)                                                  
>   \
> +  TEST(int64_t, int32_t, 4)                                                  
>   \
> +  TEST(uint16_t, uint8_t, 16)                                                
>   \
> +  TEST(uint32_t, uint16_t, 8)                                                
>   \
> +  TEST(uint64_t, uint32_t, 4)                                                
>   \
> +  TEST(float, _Float16, 8)                                                   
>   \
> +  TEST(double, float, 4)
> +
> +TEST_ALL(TEST_TYPE)
> +
> +/* { dg-final { scan-assembler-times {\tvfwredusum\.vs} 2 } } */
> +/* { dg-final { scan-assembler-times {\tvwredsum\.vs} 3 } } */
> +/* { dg-final { scan-assembler-times {\tvwredsumu\.vs} 3 } } */
> diff --git 
> a/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-1.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-1.c
> new file mode 100644
> index 00000000000..7ae508096e7
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-1.c
> @@ -0,0 +1,20 @@
> +/* { dg-do compile } */
> +/* { dg-additional-options "-march=rv64gcv_zvfh -mabi=lp64d --param 
> riscv-autovec-preference=scalable -fno-vect-cost-model" } */
> +#include <stdint-gcc.h>
> +
> +#define TEST_TYPE(TYPE1, TYPE2)                                              
>   \
> +  __attribute__((noipa))                                                     
>   \
> +  TYPE1 reduc_##TYPE1##_##TYPE2(TYPE2 *restrict a, int n) {                  
>   \
> +    TYPE1 sum = 0;                                                           
>   \
> +    for (int i = 0; i < n; i += 1)                                           
>   \
> +      sum += a[i];                                                           
>   \
> +    return sum;                                                              
>   \
> +  }
> +
> +#define TEST_ALL(TEST)                                                       
>   \
> +  TEST(float, _Float16)                                                      
>   \
> +  TEST(double, float)
> +
> +TEST_ALL(TEST_TYPE)
> +
> +/* { dg-final { scan-assembler-times {\tvfwredosum\.vs} 2 } } */
> diff --git 
> a/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-2.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-2.c
> new file mode 100644
> index 00000000000..a922aa71279
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order-2.c
> @@ -0,0 +1,19 @@
> +/* { dg-do compile } */
> +/* { dg-additional-options "-march=rv64gcv_zvfh -mabi=lp64d --param 
> riscv-autovec-preference=scalable --param riscv-autovec-lmul=m2 
> -fno-vect-cost-model" } */
> +#include <stdint-gcc.h>
> +
> +#define TEST_TYPE(TYPE1, TYPE2, N)                                           
>   \
> +  __attribute__((noipa)) TYPE1 reduc_##TYPE1##_##TYPE2(TYPE2 *restrict a) {  
>   \
> +    TYPE1 sum = 0;                                                           
>   \
> +    for (int i = 0; i < N; i += 1)                                           
>   \
> +      sum += a[i];                                                           
>   \
> +    return sum;                                                              
>   \
> +  }
> +
> +#define TEST_ALL(TEST)                                                       
>   \
> +  TEST(float, _Float16, 8)                                                   
>   \
> +  TEST(double, float, 4)
> +
> +TEST_ALL(TEST_TYPE)
> +
> +/* { dg-final { scan-assembler-times {\tvfwredosum\.vs} 2 } } */
> diff --git 
> a/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-1.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-1.c
> new file mode 100644
> index 00000000000..d4ba4f50285
> --- /dev/null
> +++ 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-1.c
> @@ -0,0 +1,24 @@
> +/* { dg-do run { target { riscv_vector } } } */
> +/* { dg-additional-options "--param=riscv-autovec-preference=scalable 
> -fno-vect-cost-model" } */
> +
> +#include "widen_reduc_order-1.c"
> +
> +#define N 99
> +
> +#define RUN(TYPE1, TYPE2)                                                    
>   \
> +  {                                                                          
>   \
> +    TYPE2 a[N];                                                              
>   \
> +    TYPE1 r = 0;                                                             
>   \
> +    for (int i = 0; i < N; i++) {                                            
>   \
> +      a[i] = (i * 0.1) * (i & 1 ? 1 : -1);                                   
>   \
> +      r += a[i];                                                             
>   \
> +      asm volatile("" ::: "memory");                                         
>   \
> +    }                                                                        
>   \
> +    if (r != reduc_##TYPE1##_##TYPE2(a, N))                                  
>   \
> +      __builtin_abort();                                                     
>   \
> +  }
> +
> +int __attribute__((optimize(1))) main() {
> +  TEST_ALL(RUN)
> +  return 0;
> +}
> diff --git 
> a/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-2.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-2.c
> new file mode 100644
> index 00000000000..6ac676245dc
> --- /dev/null
> +++ 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_order_run-2.c
> @@ -0,0 +1,22 @@
> +/* { dg-do run { target { riscv_vector } } } */
> +/* { dg-additional-options "--param=riscv-autovec-preference=scalable 
> -fno-vect-cost-model" } */
> +
> +#include "widen_reduc_order-2.c"
> +
> +#define RUN(TYPE1, TYPE2, N)                                                 
>   \
> +  {                                                                          
>   \
> +    TYPE2 a[N];                                                              
>   \
> +    TYPE1 r = 0;                                                             
>   \
> +    for (int i = 0; i < N; i++) {                                            
>   \
> +      a[i] = (i * 0.1) * (i & 1 ? 1 : -1);                                   
>   \
> +      r += a[i];                                                             
>   \
> +      asm volatile("" ::: "memory");                                         
>   \
> +    }                                                                        
>   \
> +    if (r != reduc_##TYPE1##_##TYPE2(a))                                     
>   \
> +      __builtin_abort();                                                     
>   \
> +  }
> +
> +int __attribute__((optimize(1))) main() {
> +  TEST_ALL(RUN)
> +  return 0;
> +}
> diff --git 
> a/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_run-1.c 
> b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_run-1.c
> new file mode 100644
> index 00000000000..d70a652a56a
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/widen/widen_reduc_run-1.c
> @@ -0,0 +1,22 @@
> +/* { dg-do run { target { riscv_vector } } } */
> +/* { dg-additional-options "--param=riscv-autovec-preference=scalable 
> -fno-vect-cost-model" } */
> +
> +#include "widen_reduc-1.c"
> +
> +#define RUN(TYPE1, TYPE2, N)                                                 
>   \
> +  {                                                                          
>   \
> +    TYPE2 a[N];                                                              
>   \
> +    TYPE1 r = 0;                                                             
>   \
> +    for (int i = 0; i < N; i++) {                                            
>   \
> +      a[i] = (i * 0.1) * (i & 1 ? 1 : -1);                                   
>   \
> +      r += a[i];                                                             
>   \
> +      asm volatile("" ::: "memory");                                         
>   \
> +    }                                                                        
>   \
> +    if (r != reduc_##TYPE1##_##TYPE2(a))                                     
>   \
> +      __builtin_abort();                                                     
>   \
> +  }
> +
> +int __attribute__((optimize(1))) main() {
> +  TEST_ALL(RUN)
> +  return 0;
> +}
> --
> 2.36.3
>

Re: [PATCH] RISC-V: Support combine extend and reduce sum to widen reduce sum

Reply via email to