PR67218: Fix invalid removal of FP cast

Richard Sandiford Tue, 18 Aug 2015 08:12:25 -0700

simplify_unary_operation_1 has:

      /*  (float_truncate (float x)) is (float x)  */
      if ((GET_CODE (op) == FLOAT || GET_CODE (op) == UNSIGNED_FLOAT)
         && (flag_unsafe_math_optimizations
             || (SCALAR_FLOAT_MODE_P (GET_MODE (op))
                 && ((unsigned)significand_size (GET_MODE (op))
                     >= (GET_MODE_PRECISION (GET_MODE (XEXP (op, 0)))
                         - num_sign_bit_copies (XEXP (op, 0),
                                                GET_MODE (XEXP (op, 0))))))))
       return simplify_gen_unary (GET_CODE (op), mode,
                                  XEXP (op, 0),
                                  GET_MODE (XEXP (op, 0)));


where the !flag_unsafe_math_optimizations alternative is trying to check
that the int->float conversion is exact.  Using num_sign_bit_copies is
only correct for signed inputs though; for UNSIGNED_FLOAT we need to
check whether the upper bits are zero.

Also, for both cases we can discount known trailing zeros.  It might not
be a particularly exciting thing to check on its own, but since we're
calling nonzero_bits for UNSIGNED_FLOAT anyway...  It does mean calling
nonzero_bits as well as num_sign_bit_copies for FLOAT, but this is very
rarely executed code.

I noticed this while trying to generalise some of the simplify-rtx.c
patterns so that they applied to vectors as well as scalars.  (Dave's
recent GET_MODE_INNER changes make this easier and cheaper to do.)
The patch does that here too for completeness.  I think any code
in simplify-rtx.c that handles GET_MODE_PRECISION for scalars only
is suspect.

Tested on x86_64-linux-gnu and aarch64-linux-gnu.  OK to install?

This is a gcc 6 regression so no backport is needed.

Thanks,
Richard


gcc/
        PR rtl-optimization/67218
        * simplify-rtx.c (exact_int_to_float_conversion_p): New function.
        (simplify_unary_operation_1): Use it.

gcc/testsuite/
        PR rtl-optimization/67218
        * gcc.c-torture/execute/ieee/pr67218.c,
        gcc.target/aarch64/fcvt_int_float_double1.c,
        gcc.target/aarch64/fcvt_int_float_double2.c,
        gcc.target/aarch64/fcvt_int_float_double3.c,
        gcc.target/aarch64/fcvt_int_float_double4.c,
        gcc.target/aarch64/fcvt_uint_float_double1.c,
        gcc.target/aarch64/fcvt_uint_float_double2.c,
        gcc.target/aarch64/fcvt_uint_float_double3.c,
        gcc.target/aarch64/fcvt_uint_float_double4.c: New tests.

diff --git a/gcc/simplify-rtx.c b/gcc/simplify-rtx.c
index f9352a1..8d86e57 100644
--- a/gcc/simplify-rtx.c
+++ b/gcc/simplify-rtx.c
@@ -829,6 +829,32 @@ simplify_unary_operation (enum rtx_code code, machine_mode 
mode,
   return simplify_unary_operation_1 (code, mode, op);
 }
 
+/* Return true if FLOAT or UNSIGNED_FLOAT operation OP is known
+   to be exact.  */
+
+static bool
+exact_int_to_float_conversion_p (const_rtx op)
+{
+  int out_bits = significand_size (GET_MODE_INNER (GET_MODE (op)));
+  machine_mode op0_mode = GET_MODE (XEXP (op, 0));
+  /* Constants shouldn't reach here.  */
+  gcc_assert (op0_mode != VOIDmode);
+  int in_prec = GET_MODE_UNIT_PRECISION (op0_mode);
+  int in_bits = in_prec;
+  if (HWI_COMPUTABLE_MODE_P (op0_mode))
+    {
+      unsigned HOST_WIDE_INT nonzero = nonzero_bits (XEXP (op, 0), op0_mode);
+      if (GET_CODE (op) == FLOAT)
+       in_bits -= num_sign_bit_copies (XEXP (op, 0), op0_mode);
+      else if (GET_CODE (op) == UNSIGNED_FLOAT)
+       in_bits = wi::min_precision (wi::uhwi (nonzero, in_prec), UNSIGNED);
+      else
+       gcc_unreachable ();
+      in_bits -= wi::ctz (wi::uhwi (nonzero, in_prec));
+    }
+  return in_bits <= out_bits;
+}
+
 /* Perform some simplifications we can do even if the operands
    aren't constant.  */
 static rtx
@@ -1190,11 +1216,7 @@ simplify_unary_operation_1 (enum rtx_code code, 
machine_mode mode, rtx op)
       /*  (float_truncate (float x)) is (float x)  */
       if ((GET_CODE (op) == FLOAT || GET_CODE (op) == UNSIGNED_FLOAT)
          && (flag_unsafe_math_optimizations
-             || (SCALAR_FLOAT_MODE_P (GET_MODE (op))
-                 && ((unsigned)significand_size (GET_MODE (op))
-                     >= (GET_MODE_PRECISION (GET_MODE (XEXP (op, 0)))
-                         - num_sign_bit_copies (XEXP (op, 0),
-                                                GET_MODE (XEXP (op, 0))))))))
+             || exact_int_to_float_conversion_p (op)))
        return simplify_gen_unary (GET_CODE (op), mode,
                                   XEXP (op, 0),
                                   GET_MODE (XEXP (op, 0)));
@@ -1227,11 +1249,7 @@ simplify_unary_operation_1 (enum rtx_code code, 
machine_mode mode, rtx op)
           */
       if (GET_CODE (op) == FLOAT_EXTEND
          || ((GET_CODE (op) == FLOAT || GET_CODE (op) == UNSIGNED_FLOAT)
-             && SCALAR_FLOAT_MODE_P (GET_MODE (op))
-             && ((unsigned)significand_size (GET_MODE (op))
-                 >= (GET_MODE_PRECISION (GET_MODE (XEXP (op, 0)))
-                     - num_sign_bit_copies (XEXP (op, 0),
-                                            GET_MODE (XEXP (op, 0)))))))
+             && exact_int_to_float_conversion_p (op)))
        return simplify_gen_unary (GET_CODE (op), mode,
                                   XEXP (op, 0),
                                   GET_MODE (XEXP (op, 0)));
diff --git a/gcc/testsuite/gcc.c-torture/execute/ieee/pr67218.c 
b/gcc/testsuite/gcc.c-torture/execute/ieee/pr67218.c
new file mode 100644
index 0000000..2a1260a
--- /dev/null
+++ b/gcc/testsuite/gcc.c-torture/execute/ieee/pr67218.c
@@ -0,0 +1,15 @@
+extern void abort (void) __attribute__ ((noreturn));
+
+double __attribute__ ((noinline, noclone))
+foo (unsigned int x)
+{
+  return (double) (float) (x | 0xffff0000);
+}
+
+int
+main ()
+{
+  if (foo (1) != 0x1.fffep31)
+    abort ();
+  return 0;
+}
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double1.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double1.c
new file mode 100644
index 0000000..e555b2c
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double1.c
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+  return (double) (float) (x | (int) 0xff000000);
+}
+
+/* { dg-final { scan-assembler {\tscvtf\td0, w[0-9]*} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double2.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double2.c
new file mode 100644
index 0000000..7791b22
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double2.c
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+  return (double) (float) (x | (int) 0xfe000000);
+}
+
+/* { dg-final { scan-assembler {\tscvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double3.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double3.c
new file mode 100644
index 0000000..c647742
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double3.c
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+  return (double) (float) ((x & -16) | (int) 0xf0000000);
+}
+
+/* { dg-final { scan-assembler {\tscvtf\td0, w[0-9]*} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double4.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double4.c
new file mode 100644
index 0000000..88a5242
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_int_float_double4.c
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+  return (double) (float) ((x & -16) | (int) 0xfe00000);
+}
+
+/* { dg-final { scan-assembler {\tscvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double1.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double1.c
new file mode 100644
index 0000000..c1c4920
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double1.c
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+  return (double) (float) (x & 0xffffff);
+}
+
+/* { dg-final { scan-assembler {\t[su]cvtf\td0, w[0-9]*} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double2.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double2.c
new file mode 100644
index 0000000..334aae8
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double2.c
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+  return (double) (float) (x & 0x1ffffff);
+}
+
+/* { dg-final { scan-assembler {\t[su]cvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double3.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double3.c
new file mode 100644
index 0000000..deb4578
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double3.c
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+  return (double) (float) (x & 0xffffff00);
+}
+
+/* { dg-final { scan-assembler {\tucvtf\td0, w[0-9]*} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double4.c 
b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double4.c
new file mode 100644
index 0000000..8f0955c
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/fcvt_uint_float_double4.c
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+  return (double) (float) (x & 0xffffff80);
+}
+
+/* { dg-final { scan-assembler {\tucvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */

PR67218: Fix invalid removal of FP cast

Reply via email to