Hi,
We're missing some VLS BF modes, e.g. for gathers. This patch adds them.
While at it, it adds some documentation to the iterators and corrects
the vec_set iterator (for the time being).
Regtested on rv64gcv_zvl512b but curious what the CI says.
Regards
Robin
PR/target 121582
gcc/ChangeLog:
* config/riscv/autovec.md: Use V_VLS_ZVFH for vec_set.
* config/riscv/riscv-modes.def (RVV_NF4_MODES): Add BF mdoes.
(ADJUST_PRECISION): Ditto.
(VECTOR_MODE_WITH_PREFIX): Ditto.
(VLS_MODES): Ditto.
* config/riscv/riscv-v.cc (can_be_broadcast_p): Add BF handling.
* config/riscv/riscv-vector-switch.def (VLS_ENTRY): Add BF
modes.
* config/riscv/riscv.md: Ditto.
* config/riscv/vector-iterators.md: Document modes.
* config/riscv/vector.md: Add BF modes.
gcc/testsuite/ChangeLog:
* gcc.target/riscv/rvv/autovec/pr121582.c: New test.
---
gcc/config/riscv/autovec.md | 6 +-
gcc/config/riscv/riscv-modes.def | 24 ++--
gcc/config/riscv/riscv-v.cc | 8 ++
gcc/config/riscv/riscv-vector-switch.def | 12 ++
gcc/config/riscv/riscv.md | 1 +
gcc/config/riscv/vector-iterators.md | 121 +++++++++++++++++-
gcc/config/riscv/vector.md | 50 ++++++--
.../gcc.target/riscv/rvv/autovec/pr121582.c | 6 +
8 files changed, 200 insertions(+), 28 deletions(-)
create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/pr121582.c
diff --git a/gcc/config/riscv/autovec.md b/gcc/config/riscv/autovec.md
index e69a3a33db1..95ab3694920 100644
--- a/gcc/config/riscv/autovec.md
+++ b/gcc/config/riscv/autovec.md
@@ -1350,9 +1350,9 @@ (define_expand "select_vl<mode>"
;; -------------------------------------------------------------------------
(define_expand "vec_set<mode>"
- [(match_operand:V_VLS 0 "register_operand")
- (match_operand:<VEL> 1 "register_operand")
- (match_operand 2 "nonmemory_operand")]
+ [(match_operand:V_VLS_ZVFH 0 "register_operand")
+ (match_operand:<VEL> 1 "register_operand")
+ (match_operand 2 "nonmemory_operand")]
"TARGET_VECTOR"
{
/* If we set the first element, emit an v(f)mv.s.[xf]. */
diff --git a/gcc/config/riscv/riscv-modes.def b/gcc/config/riscv/riscv-modes.def
index 55f7fd08c4d..f3d987e698f 100644
--- a/gcc/config/riscv/riscv-modes.def
+++ b/gcc/config/riscv/riscv-modes.def
@@ -331,7 +331,7 @@ RVV_NF4_MODES (4)
\
ADJUST_ALIGNMENT (RVVM4x##NF##QI, 1);
\
ADJUST_ALIGNMENT (RVVM4x##NF##HI, 2);
\
- ADJUST_ALIGNMENT (RVVM4x##NF##BF, 2);
\
+ ADJUST_ALIGNMENT (RVVM4x##NF##BF, 2);
\
ADJUST_ALIGNMENT (RVVM4x##NF##HF, 2);
\
ADJUST_ALIGNMENT (RVVM4x##NF##SI, 4);
\
ADJUST_ALIGNMENT (RVVM4x##NF##SF, 4);
\
@@ -395,6 +395,7 @@ ADJUST_PRECISION (V4096BI, 4096);
VECTOR_MODE_WITH_PREFIX (V, INT, SI, NBYTES / 4, 1);
\
VECTOR_MODE_WITH_PREFIX (V, INT, DI, NBYTES / 8, 1);
\
VECTOR_MODE_WITH_PREFIX (V, FLOAT, HF, NBYTES / 2, 1);
\
+ VECTOR_MODE_WITH_PREFIX (V, FLOAT, BF, NBYTES / 2, 1);
\
VECTOR_MODE_WITH_PREFIX (V, FLOAT, SF, NBYTES / 4, 1);
\
VECTOR_MODE_WITH_PREFIX (V, FLOAT, DF, NBYTES / 8, 1);
@@ -403,6 +404,7 @@ VECTOR_MODE_WITH_PREFIX (V, INT, HI, 1, 1); /* V1HI */
VECTOR_MODE_WITH_PREFIX (V, INT, SI, 1, 1); /* V1SI */
VECTOR_MODE_WITH_PREFIX (V, INT, DI, 1, 1); /* V1DI */
VECTOR_MODE_WITH_PREFIX (V, FLOAT, HF, 1, 1); /* V1HF */
+VECTOR_MODE_WITH_PREFIX (V, FLOAT, BF, 1, 1); /* V1BF */
VECTOR_MODE_WITH_PREFIX (V, FLOAT, SF, 1, 1); /* V1SF */
VECTOR_MODE_WITH_PREFIX (V, FLOAT, DF, 1, 1); /* V1DF */
VECTOR_MODE_WITH_PREFIX (V, INT, QI, 2, 1); /* V2QI */
@@ -411,18 +413,20 @@ VECTOR_MODE_WITH_PREFIX (V, INT, QI, 8, 1); /* V8QI */
VECTOR_MODE_WITH_PREFIX (V, INT, HI, 2, 1); /* V2HI */
VECTOR_MODE_WITH_PREFIX (V, INT, HI, 4, 1); /* V4HI */
VECTOR_MODE_WITH_PREFIX (V, FLOAT, HF, 2, 1); /* V2HF */
+VECTOR_MODE_WITH_PREFIX (V, FLOAT, BF, 2, 1); /* V2BF */
VECTOR_MODE_WITH_PREFIX (V, FLOAT, HF, 4, 1); /* V4HF */
+VECTOR_MODE_WITH_PREFIX (V, FLOAT, BF, 4, 1); /* V4BF */
VECTOR_MODE_WITH_PREFIX (V, INT, SI, 2, 1); /* V2SI */
VECTOR_MODE_WITH_PREFIX (V, FLOAT, SF, 2, 1); /* V2SF */
-VLS_MODES (16); /* V16QI V8HI V4SI V2DI V8HF V4SF
V2DF */
-VLS_MODES (32); /* V32QI V16HI V8SI V4DI V16HF V8SF
V4DF */
-VLS_MODES (64); /* V64QI V32HI V16SI V8DI V32HF V16SF
V8DF */
-VLS_MODES (128); /* V128QI V64HI V32SI V16DI V64HF V32SF V16DF */
-VLS_MODES (256); /* V256QI V128HI V64SI V32DI V128HF V64SF V32DF */
-VLS_MODES (512); /* V512QI V256HI V128SI V64DI V256HF V128SF V64DF */
-VLS_MODES (1024); /* V1024QI V512HI V256SI V128DI V512HF V256SF V128DF */
-VLS_MODES (2048); /* V2048QI V1024HI V512SI V256DI V1024HF V512SF V256DF */
-VLS_MODES (4096); /* V4096QI V2048HI V1024SI V512DI V2048HF V1024SF V512DF */
+VLS_MODES (16); /* V16QI V8HI V4SI V2DI V8HF V8BF
V4SF V2DF */
+VLS_MODES (32); /* V32QI V16HI V8SI V4DI V16HF V16BF
V8SF V4DF */
+VLS_MODES (64); /* V64QI V32HI V16SI V8DI V32HF V32BF
V16SF V8DF */
+VLS_MODES (128); /* V128QI V64HI V32SI V16DI V64HF V64BF V32SF
V16DF */
+VLS_MODES (256); /* V256QI V128HI V64SI V32DI V128HF V128BF V64SF
V32DF */
+VLS_MODES (512); /* V512QI V256HI V128SI V64DI V256HF V256BF V128SF
V64DF */
+VLS_MODES (1024); /* V1024QI V512HI V256SI V128DI V512HF V512BF V256SF
V128DF */
+VLS_MODES (2048); /* V2048QI V1024HI V512SI V256DI V1024HF V1024BF V512SF
V256DF */
+VLS_MODES (4096); /* V4096QI V2048HI V1024SI V512DI V2048HF V2048BF V1024SF
V512DF */
/* TODO: According to RISC-V 'V' ISA spec, the maximum vector length can
be 65536 for a single vector register which means the vector mode in
diff --git a/gcc/config/riscv/riscv-v.cc b/gcc/config/riscv/riscv-v.cc
index 7ca183cde22..120e59d5dad 100644
--- a/gcc/config/riscv/riscv-v.cc
+++ b/gcc/config/riscv/riscv-v.cc
@@ -6181,6 +6181,10 @@ can_be_broadcast_p (rtx op)
if (mode == HFmode && !TARGET_ZVFH)
return false;
+ /* We don't have a vfmv.bf16.v.f. */
+ if (mode == BFmode)
+ return false;
+
/* Same for float, just that we can always handle 64-bit doubles
even on !TARGET_64BIT. We have ruled out 16-bit HF already
above. */
@@ -6220,6 +6224,10 @@ strided_broadcast_p (rtx op)
if (!TARGET_ZVFH && mode == HFmode)
return true;
+ /* We don't have a vfmv.bf16.v.f. */
+ if (mode == BFmode)
+ return true;
+
return false;
}
diff --git a/gcc/config/riscv/riscv-vector-switch.def
b/gcc/config/riscv/riscv-vector-switch.def
index 1b0d61940a6..6b71ab61223 100644
--- a/gcc/config/riscv/riscv-vector-switch.def
+++ b/gcc/config/riscv/riscv-vector-switch.def
@@ -401,6 +401,18 @@ VLS_ENTRY (V256HF, riscv_vector::vls_mode_valid_p
(V256HFmode) && TARGET_VECTOR_
VLS_ENTRY (V512HF, riscv_vector::vls_mode_valid_p (V512HFmode) &&
TARGET_VECTOR_ELEN_FP_16 && TARGET_MIN_VLEN >= 1024)
VLS_ENTRY (V1024HF, riscv_vector::vls_mode_valid_p (V1024HFmode) &&
TARGET_VECTOR_ELEN_FP_16 && TARGET_MIN_VLEN >= 2048)
VLS_ENTRY (V2048HF, riscv_vector::vls_mode_valid_p (V2048HFmode) &&
TARGET_VECTOR_ELEN_FP_16 && TARGET_MIN_VLEN >= 4096)
+VLS_ENTRY (V1BF, riscv_vector::vls_mode_valid_p (V1BFmode) &&
TARGET_VECTOR_ELEN_BF_16)
+VLS_ENTRY (V2BF, riscv_vector::vls_mode_valid_p (V2BFmode) &&
TARGET_VECTOR_ELEN_BF_16)
+VLS_ENTRY (V4BF, riscv_vector::vls_mode_valid_p (V4BFmode) &&
TARGET_VECTOR_ELEN_BF_16)
+VLS_ENTRY (V8BF, riscv_vector::vls_mode_valid_p (V8BFmode) &&
TARGET_VECTOR_ELEN_BF_16)
+VLS_ENTRY (V16BF, riscv_vector::vls_mode_valid_p (V16BFmode) &&
TARGET_VECTOR_ELEN_BF_16)
+VLS_ENTRY (V32BF, riscv_vector::vls_mode_valid_p (V32BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 64)
+VLS_ENTRY (V64BF, riscv_vector::vls_mode_valid_p (V64BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 128)
+VLS_ENTRY (V128BF, riscv_vector::vls_mode_valid_p (V128BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 256)
+VLS_ENTRY (V256BF, riscv_vector::vls_mode_valid_p (V256BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 512)
+VLS_ENTRY (V512BF, riscv_vector::vls_mode_valid_p (V512BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 1024)
+VLS_ENTRY (V1024BF, riscv_vector::vls_mode_valid_p (V1024BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 2048)
+VLS_ENTRY (V2048BF, riscv_vector::vls_mode_valid_p (V2048BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 4096)
VLS_ENTRY (V1SF, riscv_vector::vls_mode_valid_p (V1SFmode) &&
TARGET_VECTOR_ELEN_FP_32)
VLS_ENTRY (V2SF, riscv_vector::vls_mode_valid_p (V2SFmode) &&
TARGET_VECTOR_ELEN_FP_32)
VLS_ENTRY (V4SF, riscv_vector::vls_mode_valid_p (V4SFmode) &&
TARGET_VECTOR_ELEN_FP_32)
diff --git a/gcc/config/riscv/riscv.md b/gcc/config/riscv/riscv.md
index 640ca5f9b0e..8a4c6d8ddea 100644
--- a/gcc/config/riscv/riscv.md
+++ b/gcc/config/riscv/riscv.md
@@ -273,6 +273,7 @@ (define_attr "mode"
"unknown,none,QI,HI,SI,DI,TI,HF,BF,SF,DF,TF,
V1SI,V2SI,V4SI,V8SI,V16SI,V32SI,V64SI,V128SI,V256SI,V512SI,V1024SI,
V1DI,V2DI,V4DI,V8DI,V16DI,V32DI,V64DI,V128DI,V256DI,V512DI,
V1HF,V2HF,V4HF,V8HF,V16HF,V32HF,V64HF,V128HF,V256HF,V512HF,V1024HF,V2048HF,
+ V1BF,V2BF,V4BF,V8BF,V16BF,V32BF,V64BF,V128BF,V256BF,V512BF,V1024BF,V2048BF,
V1SF,V2SF,V4SF,V8SF,V16SF,V32SF,V64SF,V128SF,V256SF,V512SF,V1024SF,
V1DF,V2DF,V4DF,V8DF,V16DF,V32DF,V64DF,V128DF,V256DF,V512DF,
V1BI,V2BI,V4BI,V8BI,V16BI,V32BI,V64BI,V128BI,V256BI,V512BI,V1024BI,V2048BI,V4096BI"
diff --git a/gcc/config/riscv/vector-iterators.md
b/gcc/config/riscv/vector-iterators.md
index 45af65642cd..81276a8e3f5 100644
--- a/gcc/config/riscv/vector-iterators.md
+++ b/gcc/config/riscv/vector-iterators.md
@@ -173,6 +173,21 @@ (define_mode_iterator VF_ZVFBF16 [
(RVVMF4BF "TARGET_VECTOR_ELEN_BF_16 && TARGET_VECTOR_ELEN_64")
])
+(define_mode_iterator VLSF_ZVFBF16 [
+ (V1BF "riscv_vector::vls_mode_valid_p (V1BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V2BF "riscv_vector::vls_mode_valid_p (V2BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V4BF "riscv_vector::vls_mode_valid_p (V4BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V8BF "riscv_vector::vls_mode_valid_p (V8BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V16BF "riscv_vector::vls_mode_valid_p (V16BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V32BF "riscv_vector::vls_mode_valid_p (V32BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 64")
+ (V64BF "riscv_vector::vls_mode_valid_p (V64BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 128")
+ (V128BF "riscv_vector::vls_mode_valid_p (V128BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 256")
+ (V256BF "riscv_vector::vls_mode_valid_p (V256BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 512")
+ (V512BF "riscv_vector::vls_mode_valid_p (V512BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 1024")
+ (V1024BF "riscv_vector::vls_mode_valid_p (V1024BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 2048")
+ (V2048BF "riscv_vector::vls_mode_valid_p (V2048BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 4096")
+])
+
(define_mode_iterator VF_ZVFHMIN [
(RVVM8HF "TARGET_VECTOR_ELEN_FP_16") (RVVM4HF "TARGET_VECTOR_ELEN_FP_16")
(RVVM2HF "TARGET_VECTOR_ELEN_FP_16")
(RVVM1HF "TARGET_VECTOR_ELEN_FP_16") (RVVMF2HF "TARGET_VECTOR_ELEN_FP_16")
@@ -1646,6 +1661,18 @@ (define_mode_iterator VINDEXED [
(V512HF "riscv_vector::vls_mode_valid_p (V512HFmode) && TARGET_ZVFH &&
TARGET_MIN_VLEN >= 1024")
(V1024HF "riscv_vector::vls_mode_valid_p (V1024HFmode) && TARGET_ZVFH &&
TARGET_MIN_VLEN >= 2048")
(V2048HF "riscv_vector::vls_mode_valid_p (V2048HFmode) && TARGET_ZVFH &&
TARGET_MIN_VLEN >= 4096")
+ (V1BF "riscv_vector::vls_mode_valid_p (V1BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V2BF "riscv_vector::vls_mode_valid_p (V2BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V4BF "riscv_vector::vls_mode_valid_p (V4BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V8BF "riscv_vector::vls_mode_valid_p (V8BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V16BF "riscv_vector::vls_mode_valid_p (V16BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V32BF "riscv_vector::vls_mode_valid_p (V32BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 64")
+ (V64BF "riscv_vector::vls_mode_valid_p (V64BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 128")
+ (V128BF "riscv_vector::vls_mode_valid_p (V128BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 256")
+ (V256BF "riscv_vector::vls_mode_valid_p (V256BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 512")
+ (V512BF "riscv_vector::vls_mode_valid_p (V512BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 1024")
+ (V1024BF "riscv_vector::vls_mode_valid_p (V1024BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 2048")
+ (V2048BF "riscv_vector::vls_mode_valid_p (V2048BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 4096")
(V1SF "riscv_vector::vls_mode_valid_p (V1SFmode) &&
TARGET_VECTOR_ELEN_FP_32")
(V2SF "riscv_vector::vls_mode_valid_p (V2SFmode) &&
TARGET_VECTOR_ELEN_FP_32")
(V4SF "riscv_vector::vls_mode_valid_p (V4SFmode) &&
TARGET_VECTOR_ELEN_FP_32")
@@ -1671,23 +1698,39 @@ (define_mode_iterator VINDEXED [
(define_mode_iterator VB_VLS [VB VLSB])
-(define_mode_iterator VLS [VLSI VLSF_ZVFHMIN])
+;; VLSI + VLSF but including half-float modes for Zvfhmin and Zvfbf16,
+;; to be used for loads/stores.
+(define_mode_iterator VLS [VLSI VLSF_ZVFHMIN VLSF_ZVFBF16])
+;; VLSI + VLSF but including half-float modes iff TARGET_ZVFH.
(define_mode_iterator VLS_ZVFH [VLSI VLSF])
-(define_mode_iterator V [VI VF_ZVFBF16 VF_ZVFHMIN])
+;; VI + VF but including half-float modes for Zvfhmin and Zvfbf16,
+;; to be used for loads/stores.
+(define_mode_iterator V [VI VF_ZVFHMIN VF_ZVFBF16])
+;; VI + VF but including half-float modes iff TARGET_ZVFH.
(define_mode_iterator V_ZVFH [VI VF])
+;; Used for permutes and loads/stores, i.e. operations that are int/float
+;; agnostic. Some loads/stores still only use V for now but we can change
+;; that.
(define_mode_iterator V_VLS [V VLS])
+;; Same as V_VLS but with ZVFH instead of ZVFHMIN. Currently only used for
+;; vec_extract and vec_set because those use vm(f)v. As those are just
+;; permutes we could pun with an integer type when the actual mode is
+;; not supported. (Just as we already do for broadcasting unsupported
+;; modes, see V_VLSF_FALLBACK).
(define_mode_iterator V_VLS_ZVFH [V_ZVFH VLS_ZVFH])
(define_mode_iterator V_VLSI [VI VLSI])
(define_mode_iterator V_VLSF [VF VLSF])
-(define_mode_iterator V_VLSF_ZVFHMIN [VF_ZVFBF16 VF_ZVFHMIN VLSF_ZVFHMIN])
+;; All modes that cannot be broadcast directly so we either use strided
+;; broadcast or gather broadcast.
+(define_mode_iterator V_VLSF_FALLBACK [VF_ZVFBF16 VLSF_ZVFBF16 VF_ZVFHMIN
VLSF_ZVFHMIN])
(define_mode_iterator VT [V1T V2T V4T V8T V16T V32T])
@@ -1842,6 +1885,18 @@ (define_mode_attr VINDEX [
(V512HF "V512HI")
(V1024HF "V1024HI")
(V2048HF "V2048HI")
+ (V1BF "V1HI")
+ (V2BF "V2HI")
+ (V4BF "V4HI")
+ (V8BF "V8HI")
+ (V16BF "V16HI")
+ (V32BF "V32HI")
+ (V64BF "V64HI")
+ (V128BF "V128HI")
+ (V256BF "V256HI")
+ (V512BF "V512HI")
+ (V1024BF "V1024HI")
+ (V2048BF "V2048HI")
(V1SF "V1SI")
(V2SF "V2SI")
(V4SF "V4SI")
@@ -2064,6 +2119,9 @@ (define_mode_attr VM [
(V1HF "V1BI") (V2HF "V2BI") (V4HF "V4BI") (V8HF "V8BI") (V16HF "V16BI")
(V32HF "V32BI") (V64HF "V64BI") (V128HF "V128BI") (V256HF "V256BI")
(V512HF "V512BI") (V1024HF "V1024BI") (V2048HF "V2048BI")
+ (V1BF "V1BI") (V2BF "V2BI") (V4BF "V4BI") (V8BF "V8BI") (V16BF "V16BI")
+ (V32BF "V32BI") (V64BF "V64BI") (V128BF "V128BI") (V256BF "V256BI")
+ (V512BF "V512BI") (V1024BF "V1024BI") (V2048BF "V2048BI")
(V1SF "V1BI") (V2SF "V2BI") (V4SF "V4BI") (V8SF "V8BI")
(V16SF "V16BI") (V32SF "V32BI") (V64SF "V64BI")
(V128SF "V128BI") (V256SF "V256BI") (V512SF "V512BI") (V1024SF "V1024BI")
@@ -2175,6 +2233,9 @@ (define_mode_attr vm [
(V1HF "v1bi") (V2HF "v2bi") (V4HF "v4bi") (V8HF "v8bi") (V16HF "v16bi")
(V32HF "v32bi") (V64HF "v64bi") (V128HF "v128bi") (V256HF "v256bi")
(V512HF "v512bi") (V1024HF "v1024bi") (V2048HF "v2048bi")
+ (V1BF "v1bi") (V2BF "v2bi") (V4BF "v4bi") (V8BF "v8bi") (V16BF "v16bi")
+ (V32BF "v32bi") (V64BF "v64bi") (V128BF "v128bi") (V256BF "v256bi")
+ (V512BF "v512bi") (V1024BF "v1024bi") (V2048BF "v2048bi")
(V1SF "v1bi") (V2SF "v2bi") (V4SF "v4bi") (V8SF "v8bi")
(V16SF "v16bi") (V32SF "v32bi") (V64SF "v64bi")
(V128SF "v128bi") (V256SF "v256bi") (V512SF "v512bi") (V1024SF "v1024bi")
@@ -2209,6 +2270,8 @@ (define_mode_attr VEL [
(V1DI "DI") (V2DI "DI") (V4DI "DI") (V8DI "DI") (V16DI "DI") (V32DI "DI")
(V64DI "DI") (V128DI "DI") (V256DI "DI") (V512DI "DI")
(V1HF "HF") (V2HF "HF") (V4HF "HF") (V8HF "HF") (V16HF "HF") (V32HF "HF")
(V64HF "HF") (V128HF "HF") (V256HF "HF")
(V512HF "HF") (V1024HF "HF") (V2048HF "HF")
+ (V1BF "BF") (V2BF "BF") (V4BF "BF") (V8BF "BF") (V16BF "BF") (V32BF "BF")
(V64BF "BF") (V128BF "BF") (V256BF "BF")
+ (V512BF "BF") (V1024BF "BF") (V2048BF "BF")
(V1SF "SF") (V2SF "SF") (V4SF "SF") (V8SF "SF") (V16SF "SF") (V32SF "SF")
(V64SF "SF") (V128SF "SF") (V256SF "SF")
(V512SF "SF") (V1024SF "SF")
(V1DF "DF") (V2DF "DF") (V4DF "DF") (V8DF "DF") (V16DF "DF") (V32DF "DF")
(V64DF "DF") (V128DF "DF") (V256DF "DF") (V512DF "DF")
@@ -2308,6 +2371,8 @@ (define_mode_attr vel [
(V1DI "di") (V2DI "di") (V4DI "di") (V8DI "di") (V16DI "di") (V32DI "di")
(V64DI "di") (V128DI "di") (V256DI "di") (V512DI "di")
(V1HF "hf") (V2HF "hf") (V4HF "hf") (V8HF "hf") (V16HF "hf") (V32HF "hf")
(V64HF "hf") (V128HF "hf") (V256HF "hf")
(V512HF "hf") (V1024HF "hf") (V2048HF "hf")
+ (V1BF "BF") (V2BF "BF") (V4BF "BF") (V8BF "BF") (V16BF "BF") (V32BF "BF")
(V64BF "BF") (V128BF "BF") (V256BF "BF")
+ (V512BF "BF") (V1024BF "BF") (V2048BF "BF")
(V1SF "sf") (V2SF "sf") (V4SF "sf") (V8SF "sf") (V16SF "sf") (V32SF "sf")
(V64SF "sf") (V128SF "sf") (V256SF "sf")
(V512SF "sf") (V1024SF "sf")
(V1DF "df") (V2DF "df") (V4DF "df") (V8DF "df") (V16DF "df") (V32DF "df")
(V64DF "df") (V128DF "df") (V256DF "df") (V512DF "df")
@@ -2689,6 +2754,8 @@ (define_mode_attr sew [
(V1DI "64") (V2DI "64") (V4DI "64") (V8DI "64") (V16DI "64") (V32DI "64")
(V64DI "64") (V128DI "64") (V256DI "64") (V512DI "64")
(V1HF "16") (V2HF "16") (V4HF "16") (V8HF "16") (V16HF "16") (V32HF "16")
(V64HF "16") (V128HF "16") (V256HF "16")
(V512HF "16") (V1024HF "16") (V2048HF "16")
+ (V1BF "16") (V2BF "16") (V4BF "16") (V8BF "16") (V16BF "16") (V32BF "16")
(V64BF "16") (V128BF "16") (V256BF "16")
+ (V512BF "16") (V1024BF "16") (V2048BF "16")
(V1SF "32") (V2SF "32") (V4SF "32") (V8SF "32") (V16SF "32") (V32SF "32")
(V64SF "32") (V128SF "32") (V256SF "32")
(V512SF "32") (V1024SF "32")
(V1DF "64") (V2DF "64") (V4DF "64") (V8DF "64") (V16DF "64") (V32DF "64")
(V64DF "64") (V128DF "64") (V256DF "64") (V512DF "64")
@@ -3702,6 +3769,18 @@ (define_mode_attr stride_predicate [
(V512HF "vector_eew16_stride_operand")
(V1024HF "vector_eew16_stride_operand")
(V2048HF "vector_eew16_stride_operand")
+ (V1BF "vector_eew16_stride_operand")
+ (V2BF "vector_eew16_stride_operand")
+ (V4BF "vector_eew16_stride_operand")
+ (V8BF "vector_eew16_stride_operand")
+ (V16BF "vector_eew16_stride_operand")
+ (V32BF "vector_eew16_stride_operand")
+ (V64BF "vector_eew16_stride_operand")
+ (V128BF "vector_eew16_stride_operand")
+ (V256BF "vector_eew16_stride_operand")
+ (V512BF "vector_eew16_stride_operand")
+ (V1024BF "vector_eew16_stride_operand")
+ (V2048BF "vector_eew16_stride_operand")
(V1SF "vector_eew32_stride_operand")
(V2SF "vector_eew32_stride_operand")
(V4SF "vector_eew32_stride_operand")
@@ -3816,6 +3895,18 @@ (define_mode_attr stride_load_constraint [
(V512HF "rJ,rJ,rJ,k02,k02,k02")
(V1024HF "rJ,rJ,rJ,k02,k02,k02")
(V2048HF "rJ,rJ,rJ,k02,k02,k02")
+ (V1BF "rJ,rJ,rJ,k02,k02,k02")
+ (V2BF "rJ,rJ,rJ,k02,k02,k02")
+ (V4BF "rJ,rJ,rJ,k02,k02,k02")
+ (V8BF "rJ,rJ,rJ,k02,k02,k02")
+ (V16BF "rJ,rJ,rJ,k02,k02,k02")
+ (V32BF "rJ,rJ,rJ,k02,k02,k02")
+ (V64BF "rJ,rJ,rJ,k02,k02,k02")
+ (V128BF "rJ,rJ,rJ,k02,k02,k02")
+ (V256BF "rJ,rJ,rJ,k02,k02,k02")
+ (V512BF "rJ,rJ,rJ,k02,k02,k02")
+ (V1024BF "rJ,rJ,rJ,k02,k02,k02")
+ (V2048BF "rJ,rJ,rJ,k02,k02,k02")
(V1SF "rJ,rJ,rJ,k04,k04,k04")
(V2SF "rJ,rJ,rJ,k04,k04,k04")
(V4SF "rJ,rJ,rJ,k04,k04,k04")
@@ -3930,6 +4021,18 @@ (define_mode_attr stride_store_constraint [
(V512HF "rJ,k02")
(V1024HF "rJ,k02")
(V2048HF "rJ,k02")
+ (V1BF "rJ,k02")
+ (V2BF "rJ,k02")
+ (V4BF "rJ,k02")
+ (V8BF "rJ,k02")
+ (V16BF "rJ,k02")
+ (V32BF "rJ,k02")
+ (V64BF "rJ,k02")
+ (V128BF "rJ,k02")
+ (V256BF "rJ,k02")
+ (V512BF "rJ,k02")
+ (V1024BF "rJ,k02")
+ (V2048BF "rJ,k02")
(V1SF "rJ,k04")
(V2SF "rJ,k04")
(V4SF "rJ,k04")
@@ -4409,6 +4512,11 @@ (define_mode_iterator VLS_AVL_IMM [
(V4HF "riscv_vector::vls_mode_valid_p (V4HFmode) &&
TARGET_VECTOR_ELEN_FP_16")
(V8HF "riscv_vector::vls_mode_valid_p (V8HFmode) &&
TARGET_VECTOR_ELEN_FP_16")
(V16HF "riscv_vector::vls_mode_valid_p (V16HFmode) &&
TARGET_VECTOR_ELEN_FP_16")
+ (V1BF "riscv_vector::vls_mode_valid_p (V1BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V2BF "riscv_vector::vls_mode_valid_p (V2BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V4BF "riscv_vector::vls_mode_valid_p (V4BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V8BF "riscv_vector::vls_mode_valid_p (V8BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
+ (V16BF "riscv_vector::vls_mode_valid_p (V16BFmode) &&
TARGET_VECTOR_ELEN_BF_16")
(V1SF "riscv_vector::vls_mode_valid_p (V1SFmode) &&
TARGET_VECTOR_ELEN_FP_32")
(V2SF "riscv_vector::vls_mode_valid_p (V2SFmode) &&
TARGET_VECTOR_ELEN_FP_32")
(V4SF "riscv_vector::vls_mode_valid_p (V4SFmode) &&
TARGET_VECTOR_ELEN_FP_32")
@@ -4461,6 +4569,13 @@ (define_mode_iterator VLS_AVL_REG [
(V512HF "riscv_vector::vls_mode_valid_p (V512HFmode) &&
TARGET_VECTOR_ELEN_FP_16 && TARGET_MIN_VLEN >= 1024")
(V1024HF "riscv_vector::vls_mode_valid_p (V1024HFmode) &&
TARGET_VECTOR_ELEN_FP_16 && TARGET_MIN_VLEN >= 2048")
(V2048HF "riscv_vector::vls_mode_valid_p (V2048HFmode) &&
TARGET_VECTOR_ELEN_FP_16 && TARGET_MIN_VLEN >= 4096")
+ (V32BF "riscv_vector::vls_mode_valid_p (V32BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 64")
+ (V64BF "riscv_vector::vls_mode_valid_p (V64BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 128")
+ (V128BF "riscv_vector::vls_mode_valid_p (V128BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 256")
+ (V256BF "riscv_vector::vls_mode_valid_p (V256BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 512")
+ (V512BF "riscv_vector::vls_mode_valid_p (V512BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 1024")
+ (V1024BF "riscv_vector::vls_mode_valid_p (V1024BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 2048")
+ (V2048BF "riscv_vector::vls_mode_valid_p (V2048BFmode) &&
TARGET_VECTOR_ELEN_BF_16 && TARGET_MIN_VLEN >= 4096")
(V32SF "riscv_vector::vls_mode_valid_p (V32SFmode) &&
TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 128")
(V64SF "riscv_vector::vls_mode_valid_p (V64SFmode) &&
TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 256")
(V128SF "riscv_vector::vls_mode_valid_p (V128SFmode) &&
TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 512")
diff --git a/gcc/config/riscv/vector.md b/gcc/config/riscv/vector.md
index 3cb87bf4eae..fc91e265fef 100644
--- a/gcc/config/riscv/vector.md
+++ b/gcc/config/riscv/vector.md
@@ -139,7 +139,8 @@ (define_attr "sew" ""
RVVM2x3HF,RVVM1x3HF,RVVMF2x3HF,RVVMF4x3HF,\
RVVM4x2HF,RVVM2x2HF,RVVM1x2HF,RVVMF2x2HF,RVVMF4x2HF,\
V1HI,V2HI,V4HI,V8HI,V16HI,V32HI,V64HI,V128HI,V256HI,V512HI,V1024HI,V2048HI,\
-
V1HF,V2HF,V4HF,V8HF,V16HF,V32HF,V64HF,V128HF,V256HF,V512HF,V1024HF,V2048HF")
+
V1HF,V2HF,V4HF,V8HF,V16HF,V32HF,V64HF,V128HF,V256HF,V512HF,V1024HF,V2048HF,\
+
V1BF,V2BF,V4BF,V8BF,V16BF,V32BF,V64BF,V128BF,V256BF,V512BF,V1024BF,V2048BF")
(const_int 16)
(eq_attr "mode" "RVVM8SI,RVVM4SI,RVVM2SI,RVVM1SI,RVVMF2SI,\
RVVM8SF,RVVM4SF,RVVM2SF,RVVM1SF,RVVMF2SF,\
@@ -446,6 +447,18 @@ (define_attr "vlmul" ""
(eq_attr "mode" "V512HF") (symbol_ref
"riscv_vector::get_vlmul(E_V512HFmode)")
(eq_attr "mode" "V1024HF") (symbol_ref
"riscv_vector::get_vlmul(E_V1024HFmode)")
(eq_attr "mode" "V2048HF") (symbol_ref
"riscv_vector::get_vlmul(E_V2048HFmode)")
+ (eq_attr "mode" "V1BF") (symbol_ref
"riscv_vector::get_vlmul(E_V1BFmode)")
+ (eq_attr "mode" "V2BF") (symbol_ref
"riscv_vector::get_vlmul(E_V2BFmode)")
+ (eq_attr "mode" "V4BF") (symbol_ref
"riscv_vector::get_vlmul(E_V4BFmode)")
+ (eq_attr "mode" "V8BF") (symbol_ref
"riscv_vector::get_vlmul(E_V8BFmode)")
+ (eq_attr "mode" "V16BF") (symbol_ref
"riscv_vector::get_vlmul(E_V16BFmode)")
+ (eq_attr "mode" "V32BF") (symbol_ref
"riscv_vector::get_vlmul(E_V32BFmode)")
+ (eq_attr "mode" "V64BF") (symbol_ref
"riscv_vector::get_vlmul(E_V64BFmode)")
+ (eq_attr "mode" "V128BF") (symbol_ref
"riscv_vector::get_vlmul(E_V128BFmode)")
+ (eq_attr "mode" "V256BF") (symbol_ref
"riscv_vector::get_vlmul(E_V256BFmode)")
+ (eq_attr "mode" "V512BF") (symbol_ref
"riscv_vector::get_vlmul(E_V512BFmode)")
+ (eq_attr "mode" "V1024BF") (symbol_ref
"riscv_vector::get_vlmul(E_V1024BFmode)")
+ (eq_attr "mode" "V2048BF") (symbol_ref
"riscv_vector::get_vlmul(E_V2048BFmode)")
(eq_attr "mode" "V1SF") (symbol_ref
"riscv_vector::get_vlmul(E_V1SFmode)")
(eq_attr "mode" "V2SF") (symbol_ref
"riscv_vector::get_vlmul(E_V2SFmode)")
(eq_attr "mode" "V4SF") (symbol_ref
"riscv_vector::get_vlmul(E_V4SFmode)")
@@ -762,6 +775,18 @@ (define_attr "ratio" ""
(eq_attr "mode" "V512HF") (symbol_ref
"riscv_vector::get_ratio(E_V512HFmode)")
(eq_attr "mode" "V1024HF") (symbol_ref
"riscv_vector::get_ratio(E_V1024HFmode)")
(eq_attr "mode" "V2048HF") (symbol_ref
"riscv_vector::get_ratio(E_V2048HFmode)")
+ (eq_attr "mode" "V1BF") (symbol_ref
"riscv_vector::get_ratio(E_V1BFmode)")
+ (eq_attr "mode" "V2BF") (symbol_ref
"riscv_vector::get_ratio(E_V2BFmode)")
+ (eq_attr "mode" "V4BF") (symbol_ref
"riscv_vector::get_ratio(E_V4BFmode)")
+ (eq_attr "mode" "V8BF") (symbol_ref
"riscv_vector::get_ratio(E_V8BFmode)")
+ (eq_attr "mode" "V16BF") (symbol_ref
"riscv_vector::get_ratio(E_V16BFmode)")
+ (eq_attr "mode" "V32BF") (symbol_ref
"riscv_vector::get_ratio(E_V32BFmode)")
+ (eq_attr "mode" "V64BF") (symbol_ref
"riscv_vector::get_ratio(E_V64BFmode)")
+ (eq_attr "mode" "V128BF") (symbol_ref
"riscv_vector::get_ratio(E_V128BFmode)")
+ (eq_attr "mode" "V256BF") (symbol_ref
"riscv_vector::get_ratio(E_V256BFmode)")
+ (eq_attr "mode" "V512BF") (symbol_ref
"riscv_vector::get_ratio(E_V512BFmode)")
+ (eq_attr "mode" "V1024BF") (symbol_ref
"riscv_vector::get_ratio(E_V1024BFmode)")
+ (eq_attr "mode" "V2048BF") (symbol_ref
"riscv_vector::get_ratio(E_V2048BFmode)")
(eq_attr "mode" "V1SF") (symbol_ref
"riscv_vector::get_ratio(E_V1SFmode)")
(eq_attr "mode" "V2SF") (symbol_ref
"riscv_vector::get_ratio(E_V2SFmode)")
(eq_attr "mode" "V4SF") (symbol_ref
"riscv_vector::get_ratio(E_V4SFmode)")
@@ -2402,19 +2427,19 @@ (define_insn_and_split "*pred_strided_broadcast<mode>"
(set_attr "mode" "<MODE>")])
(define_insn_and_split "*pred_strided_broadcast<mode>_zvfhmin"
- [(set (match_operand:V_VLSF_ZVFHMIN 0 "register_operand"
"=vr, vr, vr, vr")
- (if_then_else:V_VLSF_ZVFHMIN
+ [(set (match_operand:V_VLSF_FALLBACK 0 "register_operand"
"=vr, vr, vr, vr")
+ (if_then_else:V_VLSF_FALLBACK
(unspec:<VM>
- [(match_operand:<VM> 1 "strided_broadcast_mask_operand" "
vm, vm, Wc1, Wc1")
- (match_operand 4 "vector_length_operand"
"rvl, rvl, rvl, rvl")
- (match_operand 5 "const_int_operand" "
i, i, i, i")
- (match_operand 6 "const_int_operand" "
i, i, i, i")
- (match_operand 7 "const_int_operand" "
i, i, i, i")
+ [(match_operand:<VM> 1 "strided_broadcast_mask_operand" "
vm, vm, Wc1, Wc1")
+ (match_operand 4 "vector_length_operand"
"rvl, rvl, rvl, rvl")
+ (match_operand 5 "const_int_operand" "
i, i, i, i")
+ (match_operand 6 "const_int_operand" "
i, i, i, i")
+ (match_operand 7 "const_int_operand" "
i, i, i, i")
(reg:SI VL_REGNUM)
(reg:SI VTYPE_REGNUM)] UNSPEC_VPREDICATE)
- (vec_duplicate:V_VLSF_ZVFHMIN
- (match_operand:<VEL> 3 "strided_broadcast_operand" "
A, A, A, A"))
- (match_operand:V_VLSF_ZVFHMIN 2 "vector_merge_operand" "
vu, 0, vu, 0")))]
+ (vec_duplicate:V_VLSF_FALLBACK
+ (match_operand:<VEL> 3 "strided_broadcast_operand" "
A, A, A, A"))
+ (match_operand:V_VLSF_FALLBACK 2 "vector_merge_operand" "
vu, 0, vu, 0")))]
"TARGET_VECTOR"
"@
vlse<sew>.v\t%0,%3,zero,%1.t
@@ -2422,7 +2447,8 @@ (define_insn_and_split
"*pred_strided_broadcast<mode>_zvfhmin"
vlse<sew>.v\t%0,%3,zero
vlse<sew>.v\t%0,%3,zero"
"&& !strided_load_broadcast_p ()
- && <VEL>mode == HFmode
+ && (<VEL>mode == HFmode
+ || <VEL>mode == BFmode)
&& can_create_pseudo_p ()"
[(const_int 0)]
{
diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr121582.c
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr121582.c
new file mode 100644
index 00000000000..0e991c03e52
--- /dev/null
+++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/pr121582.c
@@ -0,0 +1,6 @@
+/* { dg-do compile } */
+/* { dg-options "-O3 -march=rv64gcv_zvfbfmin -mabi=lp64d" } */
+
+typedef __attribute__((__vector_size__(8))) __bf16 V;
+V v, w;
+void foo() { v -= w; }
--
2.51.0