Patchwork Fix PR49483

login
register
mail settings
Submitter Richard Guenther
Date June 21, 2011, 11 a.m.
Message ID <alpine.LNX.2.00.1106211259360.810@zhemvz.fhfr.qr>
Download mbox | patch
Permalink /patch/101273/
State New
Headers show

Comments

Richard Guenther - June 21, 2011, 11 a.m.
This fixes a missed vectorization of bitwise int<->float conversions, i.e. assignments whose right-hand side is a VIEW_CONVERT_EXPR.

Bootstrapped and tested on x86_64-unknown-linux-gnu; applied to trunk.

Richard.

2011-06-21  Richard Guenther  <rguenther@suse.de>

	PR tree-optimization/49483
	* tree-vect-stmts.c (vectorizable_assignment): Also handle
	VIEW_CONVERT_EXPR conversions.

	* gcc.dg/vect/vect-120.c: New testcase.

Patch

Index: gcc/tree-vect-stmts.c
===================================================================
--- gcc/tree-vect-stmts.c	(revision 175205)
+++ gcc/tree-vect-stmts.c	(working copy)
@@ -2089,6 +2089,9 @@  vectorizable_assignment (gimple stmt, gi
   else
     return false;
 
+  if (code == VIEW_CONVERT_EXPR)
+    op = TREE_OPERAND (op, 0);
+
   if (!vect_is_simple_use_1 (op, loop_vinfo, bb_vinfo,
 			     &def_stmt, &def, &dt[0], &vectype_in))
     {
@@ -2099,7 +2102,8 @@  vectorizable_assignment (gimple stmt, gi
 
   /* We can handle NOP_EXPR conversions that do not change the number
      of elements or the vector size.  */
-  if (CONVERT_EXPR_CODE_P (code)
+  if ((CONVERT_EXPR_CODE_P (code)
+       || code == VIEW_CONVERT_EXPR)
       && (!vectype_in
 	  || TYPE_VECTOR_SUBPARTS (vectype_in) != nunits
 	  || (GET_MODE_SIZE (TYPE_MODE (vectype))
@@ -2134,7 +2138,8 @@  vectorizable_assignment (gimple stmt, gi
       /* Arguments are ready. create the new vector stmt.  */
       FOR_EACH_VEC_ELT (tree, vec_oprnds, i, vop)
        {
-	 if (CONVERT_EXPR_CODE_P (code))
+	 if (CONVERT_EXPR_CODE_P (code)
+	     || code == VIEW_CONVERT_EXPR)
 	   vop = build1 (VIEW_CONVERT_EXPR, vectype, vop);
          new_stmt = gimple_build_assign (vec_dest, vop);
          new_temp = make_ssa_name (vec_dest, new_stmt);
Index: gcc/testsuite/gcc.dg/vect/vect-120.c
===================================================================
--- gcc/testsuite/gcc.dg/vect/vect-120.c	(revision 0)
+++ gcc/testsuite/gcc.dg/vect/vect-120.c	(revision 0)
@@ -0,0 +1,36 @@ 
+/* { dg-do compile } */
+/* { dg-require-effective-target vect_float } */
+/* { dg-require-effective-target vect_shift } */
+
+static inline float
+i2f(int x)
+{
+  union { float f; int i; } tmp;
+  tmp.i=x;
+  return tmp.f;
+}
+static inline float
+vect_ldexpf(float x, int n)
+{
+  n = (n+0x7f)<<23;
+  return x * i2f(n);
+}
+
+float __attribute__ ((aligned(16))) a[1024];
+float __attribute__ ((aligned(16))) b[1024];
+float __attribute__ ((aligned(16))) c[1024];
+
+void
+tV()
+{
+  int i;
+  for (i=0; i!=1024; ++i)
+    {
+      float z = a[i];
+      int n = b[i];
+      c[i] = vect_ldexpf(z,n);
+    }
+}
+
+/* { dg-final { scan-tree-dump-times "vectorized 1 loops" 1 "vect" } } */
+/* { dg-final { cleanup-tree-dump "vect" } } */