MATCH: [PR111109] Fix bit_ior(cond,cond) when comparisons are fp

author Andrew Pinski <apinski@marvell.com>

Wed, 23 Aug 2023 16:46:10 +0000 (16:46 +0000)

committer Andrew Pinski <apinski@marvell.com>

Thu, 24 Aug 2023 07:20:50 +0000 (07:20 +0000)
author Andrew Pinski <apinski@marvell.com>
Wed, 23 Aug 2023 16:46:10 +0000 (16:46 +0000)
committer Andrew Pinski <apinski@marvell.com>
Thu, 24 Aug 2023 07:20:50 +0000 (07:20 +0000)
diff --git a/gcc/match.pd b/gcc/match.pd

index 890f050cbad467eb0c5f8368588814225211d4d6..cf0bb3a42170459ad54b5734b5ce04c21f581683 100644 (file)
--- a/gcc/match.pd
+++ b/gcc/match.pd
@@ -2087,6 +2087,7 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT)
     (bit_and:c (convert? (cmp@0  @01 @02)) @3)
     (bit_and:c (convert? (icmp@4 @01 @02)) @5))
      (if (INTEGRAL_TYPE_P (type)
+        && invert_tree_comparison (cmp, HONOR_NANS (@01)) == icmp
          /* The scalar version has to be canonicalized after vectorization
             because it makes unconditional loads conditional ones, which
             means we lose vectorization because the loads may trap.  */
@@ -2101,6 +2102,7 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT)
     (cond (cmp@0  @01 @02) @3 zerop)
     (cond (icmp@4 @01 @02) @5 zerop))
      (if (INTEGRAL_TYPE_P (type)
+        && invert_tree_comparison (cmp, HONOR_NANS (@01)) == icmp
          /* The scalar version has to be canonicalized after vectorization
             because it makes unconditional loads conditional ones, which
             means we lose vectorization because the loads may trap.  */
@@ -2113,13 +2115,15 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT)
    (bit_ior
     (bit_and:c (vec_cond:s (cmp@0 @6 @7) @4 @5) @2)
     (bit_and:c (vec_cond:s (icmp@1 @6 @7) @4 @5) @3))
-    (if (integer_zerop (@5))
+    (if (integer_zerop (@5)
+        && invert_tree_comparison (cmp, HONOR_NANS (@6)) == icmp)
       (switch
        (if (integer_onep (@4))
         (bit_and (vec_cond @0 @2 @3) @4))
         (if (integer_minus_onep (@4))
          (vec_cond @0 @2 @3)))
-    (if (integer_zerop (@4))
+    (if (integer_zerop (@4)
+        && invert_tree_comparison (cmp, HONOR_NANS (@6)) == icmp)
       (switch
        (if (integer_onep (@5))
         (bit_and (vec_cond @0 @3 @2) @5))
@@ -2132,7 +2136,8 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT)
    (bit_ior
     (vec_cond:s (cmp@0 @4 @5) @2 integer_zerop)
     (vec_cond:s (icmp@1 @4 @5) @3 integer_zerop))
-    (vec_cond @0 @2 @3)))
+  (if (invert_tree_comparison (cmp, HONOR_NANS (@4)) == icmp)
+   (vec_cond @0 @2 @3))))
  
  /* Transform X & -Y into X * Y when Y is { 0 or 1 }.  */
  (simplify
diff --git a/gcc/testsuite/gcc.c-torture/execute/ieee/fp-cmp-cond-1.c b/gcc/testsuite/gcc.c-torture/execute/ieee/fp-cmp-cond-1.c

new file mode 100644 (file)

index 0000000..4a3c4b0
--- /dev/null
+++ b/gcc/testsuite/gcc.c-torture/execute/ieee/fp-cmp-cond-1.c
@@ -0,0 +1,78 @@
+/* PR tree-optimization/111109 */
+
+/*
+   f should return 0 if either fa or fb is a NaN,
+   rather than the value of a or b.
+*/
+__attribute__((noipa))
+int f(int a, int b, float fa, float fb) {
+  const _Bool c = fa < fb;
+  const _Bool c1 = fa >= fb;  /* the inverse of c only for ordered operands; with a NaN both must be 0 */
+  return (c * a) | (c1 * b);  /* multiply form: c and c1 are 0/1, so each product is the operand or 0 */
+}
+
+/*
+   f1 should return 0 if either fa or fb is a NaN,
+   rather than the value of a&1 or b&1.
+*/
+__attribute__((noipa))
+int f1(int a, int b, float fa, float fb) {
+  const _Bool c = fa < fb;
+  const _Bool c1 = fa >= fb;  /* the inverse of c only for ordered operands; with a NaN both must be 0 */
+  return (c & a) | (c1 & b);  /* bit_and form: c and c1 are 0/1, so each term is the operand's low bit or 0 */
+}
+
+#if __SIZEOF_INT__ == __SIZEOF_FLOAT__  /* NOTE(review): presumably needed so the float-vector compare result fits v4si -- confirm */
+typedef int v4si __attribute__ ((vector_size (1*sizeof(int))));  /* one int wide: a single-element vector despite the v4 prefix */
+typedef float v4sf __attribute__ ((vector_size (1*sizeof(float))));  /* one float wide: likewise a single element */
+/*
+   vf0 should return {0} if either fa or fb is a NaN,
+   rather than the value of a or b.
+*/
+__attribute__((noipa))
+v4si vf0(v4si a, v4si b, v4sf fa, v4sf fb) {
+  const v4si c = fa < fb;
+  const v4si c1 = fa >= fb;  /* the inverse of c only for ordered operands; with a NaN both masks must be 0 */
+  return (c & a) | (c1 & b);  /* vector counterpart of f1: each compare result masks its operand */
+}
+
+
+#endif
+
+int main(void)
+{
+  float a = __builtin_nan("");  /* NaN operand used for the unordered cases below */
+
+  if (f(-1,-1, a, a) != 0)  /* both operands NaN */
+    __builtin_abort();
+  if (f(-1,-1, a, 0) != 0)  /* only fa is NaN */
+    __builtin_abort();
+  if (f(-1,-1, 0, a) != 0)  /* only fb is NaN */
+    __builtin_abort();
+  if (f(-1,-1, 0, 0) != -1)  /* ordered and equal: fa >= fb holds, so b is selected */
+    __builtin_abort();
+
+
+  if (f1(1,1, a, a) != 0)  /* both operands NaN */
+    __builtin_abort();
+  if (f1(1,1, a, 0) != 0)  /* only fa is NaN */
+    __builtin_abort();
+  if (f1(1,1, 0, a) != 0)  /* only fb is NaN */
+    __builtin_abort();
+  if (f1(1,1, 0, 0) != 1)  /* ordered and equal: fa >= fb holds, so b&1 is selected */
+        __builtin_abort();
+
+#if __SIZEOF_INT__ == __SIZEOF_FLOAT__
+  v4si b = {-1};  /* all-ones lane, so any wrongly selected operand is visible */
+  v4sf c = {a};  /* NaN lane */
+  v4sf d = {0.0};  /* ordered lane */
+  if (vf0(b,b, c, c)[0] != 0)  /* both operands NaN */
+    __builtin_abort();
+  if (vf0(b,b, c, d)[0] != 0)  /* only fa is NaN */
+    __builtin_abort();
+  if (vf0(b,b, d, c)[0] != 0)  /* only fb is NaN */
+    __builtin_abort();
+  if (vf0(b,b, d, d)[0] != b[0])  /* ordered and equal: fa >= fb holds, so b is selected */
+        __builtin_abort();
+#endif
+}
author	Andrew Pinski <apinski@marvell.com>
	Wed, 23 Aug 2023 16:46:10 +0000 (16:46 +0000)
committer	Andrew Pinski <apinski@marvell.com>
	Thu, 24 Aug 2023 07:20:50 +0000 (07:20 +0000)
gcc/match.pd		patch \| blob \| blame \| history
gcc/testsuite/gcc.c-torture/execute/ieee/fp-cmp-cond-1.c	[new file with mode: 0644]	patch \| blob