@@ -829,6 +829,32 @@ simplify_unary_operation (enum rtx_code code, machine_mode mode,
return simplify_unary_operation_1 (code, mode, op);
}
+/* Return true if FLOAT or UNSIGNED_FLOAT operation OP is known
+ to be exact, i.e. if the integer operand XEXP (OP, 0) needs no more
+ significant bits than significand_size reports for the (inner)
+ mode of OP.
+
+ The operand's width starts as its unit precision and, when its mode
+ is HWI_COMPUTABLE_MODE_P, is narrowed using what is known about the
+ value: redundant sign-bit copies for FLOAT, known-zero high bits for
+ UNSIGNED_FLOAT, and known-zero low bits for both.  Any other code
+ for OP is treated as unreachable in that case. */
+
+static bool
+exact_int_to_float_conversion_p (const_rtx op)
+{
+ int out_bits = significand_size (GET_MODE_INNER (GET_MODE (op)));
+ machine_mode op0_mode = GET_MODE (XEXP (op, 0));
+ /* Constants shouldn't reach here: the operand's mode is needed below
+ to find the input precision. */
+ gcc_assert (op0_mode != VOIDmode);
+ int in_prec = GET_MODE_UNIT_PRECISION (op0_mode);
+ int in_bits = in_prec; /* Worst case: every input bit is significant. */
+ if (HWI_COMPUTABLE_MODE_P (op0_mode))
+ {
+ unsigned HOST_WIDE_INT nonzero = nonzero_bits (XEXP (op, 0), op0_mode);
+ if (GET_CODE (op) == FLOAT)
+ in_bits -= num_sign_bit_copies (XEXP (op, 0), op0_mode); /* Signed: discount the known sign-bit copies. */
+ else if (GET_CODE (op) == UNSIGNED_FLOAT)
+ in_bits = wi::min_precision (wi::uhwi (nonzero, in_prec), UNSIGNED); /* Unsigned: width up to the highest possibly-set bit. */
+ else
+ gcc_unreachable ();
+ in_bits -= wi::ctz (wi::uhwi (nonzero, in_prec)); /* Either signedness: discount known-zero low bits. */
+ }
+ return in_bits <= out_bits;
+}
+
/* Perform some simplifications we can do even if the operands
aren't constant. */
static rtx
@@ -1190,11 +1216,7 @@ simplify_unary_operation_1 (enum rtx_code code, machine_mode mode, rtx op)
/* (float_truncate (float x)) is (float x) */
if ((GET_CODE (op) == FLOAT || GET_CODE (op) == UNSIGNED_FLOAT)
&& (flag_unsafe_math_optimizations
- || (SCALAR_FLOAT_MODE_P (GET_MODE (op))
- && ((unsigned)significand_size (GET_MODE (op))
- >= (GET_MODE_PRECISION (GET_MODE (XEXP (op, 0)))
- - num_sign_bit_copies (XEXP (op, 0),
- GET_MODE (XEXP (op, 0))))))))
+ || exact_int_to_float_conversion_p (op)))
return simplify_gen_unary (GET_CODE (op), mode,
XEXP (op, 0),
GET_MODE (XEXP (op, 0)));
@@ -1227,11 +1249,7 @@ simplify_unary_operation_1 (enum rtx_code code, machine_mode mode, rtx op)
*/
if (GET_CODE (op) == FLOAT_EXTEND
|| ((GET_CODE (op) == FLOAT || GET_CODE (op) == UNSIGNED_FLOAT)
- && SCALAR_FLOAT_MODE_P (GET_MODE (op))
- && ((unsigned)significand_size (GET_MODE (op))
- >= (GET_MODE_PRECISION (GET_MODE (XEXP (op, 0)))
- - num_sign_bit_copies (XEXP (op, 0),
- GET_MODE (XEXP (op, 0)))))))
+ && exact_int_to_float_conversion_p (op)))
return simplify_gen_unary (GET_CODE (op), mode,
XEXP (op, 0),
GET_MODE (XEXP (op, 0)));
new file mode 100644
@@ -0,0 +1,15 @@
+extern void abort (void) __attribute__ ((noreturn));
+
+double __attribute__ ((noinline, noclone))
+foo (unsigned int x)
+{
+ return (double) (float) (x | 0xffff0000); /* Unsigned value with the high 16 bits always set: it can need all 32 bits, so the float step may round and must not be dropped. */
+}
+
+int
+main ()
+{
+ if (foo (1) != 0x1.fffep31) /* foo (1) converts 0xffff0001; rounded to a 24-bit float significand that is 0xffff0000, i.e. 0x1.fffep31. */
+ abort ();
+ return 0;
+}
new file mode 100644
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+ return (double) (float) (x | (int) 0xff000000); /* Top 8 bits forced to 1: at most 32 - 8 = 24 significant bits, which fits float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\tscvtf\td0, w[0-9]*} } } */
new file mode 100644
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+ return (double) (float) (x | (int) 0xfe000000); /* Only the top 7 bits are forced to 1: up to 32 - 7 = 25 significant bits, one too many for float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\tscvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */
new file mode 100644
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+ return (double) (float) ((x & -16) | (int) 0xf0000000); /* Top 4 bits forced to 1 and low 4 bits cleared: at most 32 - 4 - 4 = 24 significant bits, which fits float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\tscvtf\td0, w[0-9]*} } } */
new file mode 100644
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (int x)
+{
+ return (double) (float) ((x & -16) | (int) 0xfe00000); /* 0xfe00000 has seven hex digits (0x0fe00000), so the top 4 bits stay unknown; only the low 4 bits are cleared, leaving up to 32 - 1 - 4 = 27 significant bits, too many for float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\tscvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */
new file mode 100644
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+ return (double) (float) (x & 0xffffff); /* Only the low 24 bits can be set, so the value fits float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\t[su]cvtf\td0, w[0-9]*} } } */
new file mode 100644
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+ return (double) (float) (x & 0x1ffffff); /* Up to 25 bits can be set: one too many for float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\t[su]cvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */
new file mode 100644
@@ -0,0 +1,10 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+ return (double) (float) (x & 0xffffff00); /* Low 8 bits cleared: at most 32 - 8 = 24 significant bits, which fits float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\tucvtf\td0, w[0-9]*} } } */
new file mode 100644
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+double
+foo (unsigned int x)
+{
+ return (double) (float) (x & 0xffffff80); /* Only the low 7 bits are cleared: up to 32 - 7 = 25 significant bits, one too many for float's 24-bit significand. */
+}
+
+/* { dg-final { scan-assembler {\tucvtf\ts[0-9]*, w[0-9]*} } } */
+/* { dg-final { scan-assembler {\tfcvt\td0, s[0-9]*} } } */
simplify_unary_operation_1 has:

      /* (float_truncate (float x)) is (float x)  */
      if ((GET_CODE (op) == FLOAT || GET_CODE (op) == UNSIGNED_FLOAT)
          && (flag_unsafe_math_optimizations
              || (SCALAR_FLOAT_MODE_P (GET_MODE (op))
                  && ((unsigned)significand_size (GET_MODE (op))
                      >= (GET_MODE_PRECISION (GET_MODE (XEXP (op, 0)))
                          - num_sign_bit_copies (XEXP (op, 0),
                                                 GET_MODE (XEXP (op, 0))))))))
        return simplify_gen_unary (GET_CODE (op), mode,
                                   XEXP (op, 0),
                                   GET_MODE (XEXP (op, 0)));

where the !flag_unsafe_math_optimizations alternative is trying to
check that the int->float conversion is exact.  Using
num_sign_bit_copies is only correct for signed inputs though; for
UNSIGNED_FLOAT we need to check whether the upper bits are zero.

Also, for both cases we can discount known trailing zeros.  It might
not be a particularly exciting thing to check on its own, but since
we're calling nonzero_bits for UNSIGNED_FLOAT anyway...  It does mean
calling nonzero_bits as well as num_sign_bit_copies for FLOAT, but
this is very rarely executed code.

I noticed this while trying to generalise some of the simplify-rtx.c
patterns so that they applied to vectors as well as scalars.  (Dave's
recent GET_MODE_INNER changes make this easier and cheaper to do.)
The patch does that here too for completeness.  I think any code in
simplify-rtx.c that handles GET_MODE_PRECISION for scalars only is
suspect.

Tested on x86_64-linux-gnu and aarch64-linux-gnu.  OK to install?
This is a gcc 6 regression so no backport is needed.

Thanks,
Richard

gcc/
	PR rtl-optimization/67218
	* simplify-rtx.c (exact_int_to_float_conversion_p): New function.
	(simplify_unary_operation_1): Use it.

gcc/testsuite/
	PR rtl-optimization/67218
	* gcc.c-torture/execute/ieee/pr67218.c,
	gcc.target/aarch64/fcvt_int_float_double1.c,
	gcc.target/aarch64/fcvt_int_float_double2.c,
	gcc.target/aarch64/fcvt_int_float_double3.c,
	gcc.target/aarch64/fcvt_int_float_double4.c,
	gcc.target/aarch64/fcvt_uint_float_double1.c,
	gcc.target/aarch64/fcvt_uint_float_double2.c,
	gcc.target/aarch64/fcvt_uint_float_double3.c,
	gcc.target/aarch64/fcvt_uint_float_double4.c: New tests.