tree-optimization/108724 - vectorized code getting piecewise expanded

author Richard Biener <rguenther@suse.de>

Fri, 10 Feb 2023 10:07:30 +0000 (11:07 +0100)

committer Richard Biener <rguenther@suse.de>

Wed, 15 Mar 2023 09:07:42 +0000 (10:07 +0100)
author Richard Biener <rguenther@suse.de>
Fri, 10 Feb 2023 10:07:30 +0000 (11:07 +0100)
committer Richard Biener <rguenther@suse.de>
Wed, 15 Mar 2023 09:07:42 +0000 (10:07 +0100)
diff --git a/gcc/testsuite/gcc.target/i386/pr108724.c b/gcc/testsuite/gcc.target/i386/pr108724.c

new file mode 100644 (file)

index 0000000..c4e0e91
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr108724.c
@@ -0,0 +1,15 @@
+/* { dg-do compile } */
+/* { dg-options "-O3 -mno-sse" } */
+
+int a[16], b[16], c[16];
+void foo()  /* Store the element-wise sum b[i] + c[i] into a[i] for all 16 ints.  */
+{
+  for (int i = 0; i < 16; i++) {
+    a[i] = b[i] + c[i];
+  }
+}
+
+/* When this is vectorized it shouldn't be expanded piecewise again,
+   as that results in spilling for the upper half access.  */
+
+/* { dg-final { scan-assembler-not "\\\[er\\\]sp" } } */
diff --git a/gcc/tree-vect-stmts.cc b/gcc/tree-vect-stmts.cc

index 2498948fad2c59f729a3b7a9279fda2386ef831d..1cc3e00f0a6bdaf8d7e5e8b9596a3ffd11f0ae08 100644 (file)
--- a/gcc/tree-vect-stmts.cc
+++ b/gcc/tree-vect-stmts.cc
@@ -6274,6 +6274,20 @@ vectorizable_operation (vec_info *vinfo,
        return false;
      }
  
+  /* ???  We should expand the operations here instead of relying
+     on vector lowering, which has a hard cap on the number of vector
+     elements below which it performs elementwise operations.  */
+  if (using_emulated_vectors_p
+      && (code == PLUS_EXPR || code == MINUS_EXPR || code == NEGATE_EXPR)
+      && ((BITS_PER_WORD / vector_element_bits (vectype)) < 4
+         || maybe_lt (nunits_out, 4U)))
+    {
+      if (dump_enabled_p ())
+       dump_printf (MSG_NOTE, "not using word mode for +- and less than "
+                    "four vector elements\n");
+      return false;
+    }
+
    int reduc_idx = STMT_VINFO_REDUC_IDX (stmt_info);
    vec_loop_masks *masks = (loop_vinfo ? &LOOP_VINFO_MASKS (loop_vinfo) : NULL);
    internal_fn cond_fn = get_conditional_internal_fn (code);
author	Richard Biener <rguenther@suse.de>
	Fri, 10 Feb 2023 10:07:30 +0000 (11:07 +0100)
committer	Richard Biener <rguenther@suse.de>
	Wed, 15 Mar 2023 09:07:42 +0000 (10:07 +0100)
gcc/testsuite/gcc.target/i386/pr108724.c	[new file with mode: 0644]	patch \| blob
gcc/tree-vect-stmts.cc		patch \| blob \| blame \| history