This properly updates invariant SLP nodes vector types for bswap
vectorization.

Bootstrapped / tested on x86_64-unknown-linux-gnu, applied.

2020-05-25  Richard Biener  <rguent...@suse.de>

        PR tree-optimization/95271
        * tree-vect-stmts.c (vectorizable_bswap): Update invariant SLP
        children vector type.
        (vectorizable_call): Pass down slp ops.

        * gcc.dg/vect/bb-slp-pr95271.c: New testcase.
---
 gcc/testsuite/gcc.dg/vect/bb-slp-pr95271.c | 19 +++++++++++++++++++
 gcc/tree-vect-stmts.c                      | 12 +++++++++++-
 2 files changed, 30 insertions(+), 1 deletion(-)
 create mode 100644 gcc/testsuite/gcc.dg/vect/bb-slp-pr95271.c

diff --git a/gcc/testsuite/gcc.dg/vect/bb-slp-pr95271.c 
b/gcc/testsuite/gcc.dg/vect/bb-slp-pr95271.c
new file mode 100644
index 00000000000..2f235980405
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/bb-slp-pr95271.c
@@ -0,0 +1,19 @@
+/* { dg-do compile } */
+/* { dg-additional-options "-march=cooperlake" { target x86_64-*-* i?86-*-* } 
} */
+
+int a;
+struct b c;
+long d;
+struct b {
+  unsigned long address;
+  unsigned long e;
+};
+void f()
+{
+  d = (long)(&a)[0] << 56 | (long)((unsigned char *)&a)[1] << 48 |
+      (long)((unsigned char *)&a)[2] << 40 |
+      (long)((unsigned char *)&a)[3] << 32 |
+      (long)((unsigned char *)&a)[4] << 24 | ((unsigned char *)&a)[5] << 16 |
+      ((unsigned char *)&a)[6] << 8 | ((unsigned char *)&a)[7];
+  c.address = c.e = d;
+}
diff --git a/gcc/tree-vect-stmts.c b/gcc/tree-vect-stmts.c
index e7822c44951..9023dd4c216 100644
--- a/gcc/tree-vect-stmts.c
+++ b/gcc/tree-vect-stmts.c
@@ -3009,6 +3009,7 @@ static bool
 vectorizable_bswap (vec_info *vinfo,
                    stmt_vec_info stmt_info, gimple_stmt_iterator *gsi,
                    stmt_vec_info *vec_stmt, slp_tree slp_node,
+                   slp_tree *slp_op,
                    tree vectype_in, stmt_vector_for_cost *cost_vec)
 {
   tree op, vectype;
@@ -3051,6 +3052,15 @@ vectorizable_bswap (vec_info *vinfo,
 
   if (! vec_stmt)
     {
+      if (slp_node
+         && !vect_maybe_update_slp_op_vectype (slp_op[0], vectype_in))
+       {
+         if (dump_enabled_p ())
+           dump_printf_loc (MSG_MISSED_OPTIMIZATION, vect_location,
+                            "incompatible vector types for invariants\n");
+         return false;
+       }
+
       STMT_VINFO_TYPE (stmt_info) = call_vec_info_type;
       DUMP_VECT_SCOPE ("vectorizable_bswap");
       if (! slp_node)
@@ -3377,7 +3387,7 @@ vectorizable_call (vec_info *vinfo,
                   || gimple_call_builtin_p (stmt, BUILT_IN_BSWAP32)
                   || gimple_call_builtin_p (stmt, BUILT_IN_BSWAP64)))
        return vectorizable_bswap (vinfo, stmt_info, gsi, vec_stmt, slp_node,
-                                  vectype_in, cost_vec);
+                                  slp_op, vectype_in, cost_vec);
       else
        {
          if (dump_enabled_p ())
-- 
2.25.1

Reply via email to