[PATCH] Handle vector COND_EXPRs in vector genericization (PR tree-optimization/65427)

Richard Biener rguenther@suse.de
Mon Mar 16 18:16:00 GMT 2015


On March 16, 2015 5:21:02 PM GMT+01:00, Jakub Jelinek <jakub@redhat.com> wrote:
>Hi!
>
>On the following testcase, gimple LIM creates a vector COND_EXPR (scalar
>condition, vector lhs, rhs2 and rhs3), but if we don't have corresponding
>vector mode for it, we ICE trying to expand the BLKmode COND_EXPR, as it is
>unprepared for that.
>
>This patch lowers those (parallel or piecewise).
>Bootstrapped/regtested on x86_64-linux and i686-linux, ok for trunk?

OK.  Though maybe LIM should not create these for cost reasons? I also wonder if we should lower them to control flow?

Thanks,
Richard.

>2015-03-16  Jakub Jelinek  <jakub@redhat.com>
>
>	PR tree-optimization/65427
>	* tree-vect-generic.c (do_cond, expand_vector_scalar_condition): New
>	functions.
>	(expand_vector_operations_1): Handle BLKmode vector COND_EXPR.
>
>	* gcc.c-torture/execute/pr65427.c: New test.
>
>--- gcc/tree-vect-generic.c.jj	2015-01-15 20:25:40.000000000 +0100
>+++ gcc/tree-vect-generic.c	2015-03-16 14:25:37.391932269 +0100
>@@ -1417,6 +1417,57 @@ count_type_subparts (tree type)
>   return VECTOR_TYPE_P (type) ? TYPE_VECTOR_SUBPARTS (type) : 1;
> }
> 
>+static tree
>+do_cond (gimple_stmt_iterator *gsi, tree inner_type, tree a, tree b,
>+	 tree bitpos, tree bitsize, enum tree_code code)
>+{
>+  if (TREE_CODE (TREE_TYPE (a)) == VECTOR_TYPE)
>+    a = tree_vec_extract (gsi, inner_type, a, bitsize, bitpos);
>+  if (TREE_CODE (TREE_TYPE (b)) == VECTOR_TYPE)
>+    b = tree_vec_extract (gsi, inner_type, b, bitsize, bitpos);
>+  tree cond = gimple_assign_rhs1 (gsi_stmt (*gsi));
>+  return gimplify_build3 (gsi, code, inner_type, cond, a, b);
>+}
>+
>+/* Expand a vector COND_EXPR to scalars, piecewise.  */
>+static void
>+expand_vector_scalar_condition (gimple_stmt_iterator *gsi)
>+{
>+  gassign *stmt = as_a <gassign *> (gsi_stmt (*gsi));
>+  tree type = gimple_expr_type (stmt);
>+  tree compute_type = get_compute_type (COND_EXPR, mov_optab, type);
>+  machine_mode compute_mode = TYPE_MODE (compute_type);
>+  gcc_assert (compute_mode != BLKmode);
>+  tree lhs = gimple_assign_lhs (stmt);
>+  tree rhs2 = gimple_assign_rhs2 (stmt);
>+  tree rhs3 = gimple_assign_rhs3 (stmt);
>+  tree new_rhs;
>+
>+  /* If the compute mode is not a vector mode (hence we are not decomposing
>+     a BLKmode vector to smaller, hardware-supported vectors), we may want
>+     to expand the operations in parallel.  */
>+  if (GET_MODE_CLASS (compute_mode) != MODE_VECTOR_INT
>+      && GET_MODE_CLASS (compute_mode) != MODE_VECTOR_FLOAT
>+      && GET_MODE_CLASS (compute_mode) != MODE_VECTOR_FRACT
>+      && GET_MODE_CLASS (compute_mode) != MODE_VECTOR_UFRACT
>+      && GET_MODE_CLASS (compute_mode) != MODE_VECTOR_ACCUM
>+      && GET_MODE_CLASS (compute_mode) != MODE_VECTOR_UACCUM)
>+    new_rhs = expand_vector_parallel (gsi, do_cond, type, rhs2, rhs3,
>+				      COND_EXPR);
>+  else
>+    new_rhs = expand_vector_piecewise (gsi, do_cond, type, compute_type,
>+				       rhs2, rhs3, COND_EXPR);
>+  if (!useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (new_rhs)))
>+    new_rhs = gimplify_build1 (gsi, VIEW_CONVERT_EXPR, TREE_TYPE (lhs),
>+			       new_rhs);
>+
>+  /* NOTE:  We should avoid using gimple_assign_set_rhs_from_tree. One
>+     way to do it is change expand_vector_operation and its callees to
>+     return a tree_code, RHS1 and RHS2 instead of a tree. */
>+  gimple_assign_set_rhs_from_tree (gsi, new_rhs);
>+  update_stmt (gsi_stmt (*gsi));
>+}
>+
> /* Process one statement.  If we identify a vector operation, expand it.  */
> 
> static void
>@@ -1449,6 +1500,14 @@ expand_vector_operations_1 (gimple_stmt_
>       return;
>     }
> 
>+  if (code == COND_EXPR
>+      && TREE_CODE (TREE_TYPE (gimple_assign_lhs (stmt))) == VECTOR_TYPE
>+      && TYPE_MODE (TREE_TYPE (gimple_assign_lhs (stmt))) == BLKmode)
>+    {
>+      expand_vector_scalar_condition (gsi);
>+      return;
>+    }
>+
>   if (code == CONSTRUCTOR
>       && TREE_CODE (lhs) == SSA_NAME
>       && VECTOR_MODE_P (TYPE_MODE (TREE_TYPE (lhs)))
>--- gcc/testsuite/gcc.c-torture/execute/pr65427.c.jj	2015-03-16 14:36:29.489254701 +0100
>+++ gcc/testsuite/gcc.c-torture/execute/pr65427.c	2015-03-16 14:40:58.789851433 +0100
>@@ -0,0 +1,34 @@
>+/* PR tree-optimization/65427 */
>+
>+typedef int V __attribute__ ((vector_size (8 * sizeof (int))));
>+V a, b, c, d, e, f;
>+
>+__attribute__((noinline, noclone)) void
>+foo (int x, int y)
>+{
>+  do
>+    {
>+      if (x)
>+	d = a ^ c;
>+      else
>+	d = a ^ b;
>+    }
>+  while (y);
>+}
>+
>+int
>+main ()
>+{
>+  a = (V) { 1, 2, 3, 4, 5, 6, 7, 8 };
>+  b = (V) { 0x40, 0x80, 0x40, 0x80, 0x40, 0x80, 0x40, 0x80 };
>+  e = (V) { 0x41, 0x82, 0x43, 0x84, 0x45, 0x86, 0x47, 0x88 };
>+  foo (0, 0);
>+  if (__builtin_memcmp (&d, &e, sizeof (V)) != 0)
>+    __builtin_abort ();
>+  c = (V) { 0x80, 0x40, 0x80, 0x40, 0x80, 0x40, 0x80, 0x40 };
>+  f = (V) { 0x81, 0x42, 0x83, 0x44, 0x85, 0x46, 0x87, 0x48 };
>+  foo (1, 0);
>+  if (__builtin_memcmp (&d, &f, sizeof (V)) != 0)
>+    __builtin_abort ();
>+  return 0;
>+}
>
>	Jakub




More information about the Gcc-patches mailing list