This fixes a missed vectorization of loops that reinterpret the bits of an int as a float (or vice versa), which the vectorizer sees as VIEW_CONVERT_EXPR assignments.

Bootstrapped and tested on x86_64-unknown-linux-gnu, applied to trunk.

Richard.

2011-06-21  Richard Guenther  <rguent...@suse.de>

        PR tree-optimization/49483
        * tree-vect-stmts.c (vectorizable_assignment): Also handle
        VIEW_CONVERT_EXPR conversions.

        * gcc.dg/vect/vect-120.c: New testcase.

Index: gcc/tree-vect-stmts.c
===================================================================
--- gcc/tree-vect-stmts.c       (revision 175205)
+++ gcc/tree-vect-stmts.c       (working copy)
@@ -2089,6 +2089,9 @@ vectorizable_assignment (gimple stmt, gi
   else
     return false;
 
+  if (code == VIEW_CONVERT_EXPR)
+    op = TREE_OPERAND (op, 0);
+
   if (!vect_is_simple_use_1 (op, loop_vinfo, bb_vinfo,
                             &def_stmt, &def, &dt[0], &vectype_in))
     {
@@ -2099,7 +2102,8 @@ vectorizable_assignment (gimple stmt, gi
 
   /* We can handle NOP_EXPR conversions that do not change the number
      of elements or the vector size.  */
-  if (CONVERT_EXPR_CODE_P (code)
+  if ((CONVERT_EXPR_CODE_P (code)
+       || code == VIEW_CONVERT_EXPR)
       && (!vectype_in
          || TYPE_VECTOR_SUBPARTS (vectype_in) != nunits
          || (GET_MODE_SIZE (TYPE_MODE (vectype))
@@ -2134,7 +2138,8 @@ vectorizable_assignment (gimple stmt, gi
       /* Arguments are ready. create the new vector stmt.  */
       FOR_EACH_VEC_ELT (tree, vec_oprnds, i, vop)
        {
-        if (CONVERT_EXPR_CODE_P (code))
+        if (CONVERT_EXPR_CODE_P (code)
+            || code == VIEW_CONVERT_EXPR)
           vop = build1 (VIEW_CONVERT_EXPR, vectype, vop);
          new_stmt = gimple_build_assign (vec_dest, vop);
          new_temp = make_ssa_name (vec_dest, new_stmt);
Index: gcc/testsuite/gcc.dg/vect/vect-120.c
===================================================================
--- gcc/testsuite/gcc.dg/vect/vect-120.c        (revision 0)
+++ gcc/testsuite/gcc.dg/vect/vect-120.c        (revision 0)
@@ -0,0 +1,36 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target vect_float } */
+/* { dg-require-effective-target vect_shift } */
+
+static inline float
+i2f(int x)
+{
+  union { float f; int i; } tmp;
+  tmp.i=x;
+  return tmp.f;
+}
+static inline float
+vect_ldexpf(float x, int n)
+{
+  n = (n+0x7f)<<23;
+  return x * i2f(n);
+}
+
+float __attribute__ ((aligned(16))) a[1024];
+float __attribute__ ((aligned(16))) b[1024];
+float __attribute__ ((aligned(16))) c[1024];
+
+void
+tV()
+{
+  int i;
+  for (i=0; i!=1024; ++i)
+    {
+      float z = a[i];
+      int n = b[i];
+      c[i] = vect_ldexpf(z,n);
+    }
+}
+
+/* { dg-final { scan-tree-dump-times "vectorized 1 loops" 1 "vect" } } */
+/* { dg-final { cleanup-tree-dump "vect" } } */

Reply via email to