PR target/113560: Enhance is_widening_mult_rhs_p.

author Roger Sayle <roger@nextmovesoftware.com>

Thu, 1 Feb 2024 06:10:42 +0000 (06:10 +0000)

committer Roger Sayle <roger@nextmovesoftware.com>

Thu, 1 Feb 2024 06:10:42 +0000 (06:10 +0000)
author Roger Sayle <roger@nextmovesoftware.com>
Thu, 1 Feb 2024 06:10:42 +0000 (06:10 +0000)
committer Roger Sayle <roger@nextmovesoftware.com>
Thu, 1 Feb 2024 06:10:42 +0000 (06:10 +0000)
diff --git a/gcc/testsuite/g++.target/i386/pr113560.C b/gcc/testsuite/g++.target/i386/pr113560.C

new file mode 100644 (file)

index 0000000..179b68f
--- /dev/null
+++ b/gcc/testsuite/g++.target/i386/pr113560.C
@@ -0,0 +1,19 @@
+/* { dg-do compile { target { ! ia32 } } } */
+/* { dg-options "-Ofast -std=c++23 -march=znver4" } */
+
+#include <immintrin.h>
+auto f(char *buf, unsigned long long in) noexcept
+{
+    unsigned long long hi{};
+    auto lo{_mulx_u64(in, 0x2af31dc462ull, &hi)};
+    lo = _mulx_u64(lo, 100, &hi);
+    __builtin_memcpy(buf + 2, &hi, 2);
+    return buf + 10;
+}
+
+/* { dg-final { scan-assembler-times "mulx" 1 } } */
+/* { dg-final { scan-assembler-times "mulq" 1 } } */
+/* { dg-final { scan-assembler-not "addq" } } */
+/* { dg-final { scan-assembler-not "adcq" } } */
+/* { dg-final { scan-assembler-not "salq" } } */
+/* { dg-final { scan-assembler-not "shldq" } } */
diff --git a/gcc/testsuite/gcc.dg/pr87954.c b/gcc/testsuite/gcc.dg/pr87954.c

index 620657cb1f5d3dc507eb1972074dd5b04b9924e2..80d0543bbb389f1188fc56e8acd1dead3383fd63 100644 (file)
--- a/gcc/testsuite/gcc.dg/pr87954.c
+++ b/gcc/testsuite/gcc.dg/pr87954.c
@@ -18,4 +18,4 @@ imul(unsigned int flags)
    return type_dma + (is_rec * !is_dma) * KMALLOC_RECLAIM;
  }
  
-/* { dg-final { scan-tree-dump-times { \* } 1 "optimized" } } */
+/* { dg-final { scan-tree-dump-times { \*w? |WIDEN_MULT_PLUS_EXPR} 1 "optimized" } } */
diff --git a/gcc/testsuite/gcc.target/i386/pr113560.c b/gcc/testsuite/gcc.target/i386/pr113560.c

new file mode 100644 (file)

index 0000000..ac2e01a
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr113560.c
@@ -0,0 +1,17 @@
+/* { dg-do compile { target int128 } } */
+/* { dg-options "-O2" } */
+
+unsigned __int128 foo(unsigned __int128 x, unsigned __int128 y)
+{
+  return (x & 1000) * (y & 1000);
+}
+
+__int128 bar(__int128 x, __int128 y)
+{
+  return (x & 1000) * (y & 1000);
+}
+
+/* { dg-final { scan-assembler-times "\tmulq" 1 } } */
+/* { dg-final { scan-assembler-times "\timulq" 1 } } */
+/* { dg-final { scan-assembler-not "addq" } } */
+/* { dg-final { scan-assembler-not "xorl" } } */
diff --git a/gcc/tree-ssa-math-opts.cc b/gcc/tree-ssa-math-opts.cc

index 2db26e4ed4868aa1baf2fa88a0f327f0bd4ea56f..cffe7573f794731629335965eb2a0f45b4d47857 100644 (file)
--- a/gcc/tree-ssa-math-opts.cc
+++ b/gcc/tree-ssa-math-opts.cc
@@ -2552,12 +2552,47 @@ is_widening_mult_rhs_p (tree type, tree rhs, tree *type_out,
  
    if (TREE_CODE (rhs) == SSA_NAME)
      {
+      /* Use tree_nonzero_bits to see if this operand is zero-extended
+        for unsigned widening multiplications or non-negative for
+        signed widening multiplications.  */
+      if (TREE_CODE (type) == INTEGER_TYPE
+         && (TYPE_PRECISION (type) & 1) == 0
+         && int_mode_for_size (TYPE_PRECISION (type) / 2, 1).exists ())
+       {
+         unsigned int prec = TYPE_PRECISION (type);
+         unsigned int hprec = prec / 2;
+         wide_int bits = wide_int::from (tree_nonzero_bits (rhs), prec,
+                                         TYPE_SIGN (TREE_TYPE (rhs)));
+         if (TYPE_UNSIGNED (type)
+             && wi::bit_and (bits, wi::mask (hprec, true, prec)) == 0)
+           {
+             *type_out = build_nonstandard_integer_type (hprec, true);
+             /* X & MODE_MASK can be simplified to (T)X.  */
+             stmt = SSA_NAME_DEF_STMT (rhs);
+             if (is_gimple_assign (stmt)
+                 && gimple_assign_rhs_code (stmt) == BIT_AND_EXPR
+                 && TREE_CODE (gimple_assign_rhs2 (stmt)) == INTEGER_CST
+                 && wi::to_wide (gimple_assign_rhs2 (stmt))
+                    == wi::mask (hprec, false, prec))
+               *new_rhs_out = gimple_assign_rhs1 (stmt);
+             else
+               *new_rhs_out = rhs;
+             return true;
+           }
+         else if (!TYPE_UNSIGNED (type)
+                  && wi::bit_and (bits, wi::mask (hprec - 1, true, prec)) == 0)
+           {
+             *type_out = build_nonstandard_integer_type (hprec, false);
+             *new_rhs_out = rhs;
+             return true;
+           }
+       }
+
        stmt = SSA_NAME_DEF_STMT (rhs);
        if (is_gimple_assign (stmt))
         {
-         if (! widening_mult_conversion_strippable_p (type, stmt))
-           rhs1 = rhs;
-         else
+
+         if (widening_mult_conversion_strippable_p (type, stmt))
             {
               rhs1 = gimple_assign_rhs1 (stmt);
  
@@ -2568,6 +2603,8 @@ is_widening_mult_rhs_p (tree type, tree rhs, tree *type_out,
                   return true;
                 }
             }
+         else
+           rhs1 = rhs;
         }
        else
         rhs1 = rhs;
@@ -2827,12 +2864,16 @@ convert_mult_to_widen (gimple *stmt, gimple_stmt_iterator *gsi)
    if (2 * actual_precision > TYPE_PRECISION (type))
      return false;
    if (actual_precision != TYPE_PRECISION (type1)
-      || from_unsigned1 != TYPE_UNSIGNED (type1))
+      || from_unsigned1 != TYPE_UNSIGNED (type1)
+      || (TREE_TYPE (rhs1) != type1
+         && TREE_CODE (rhs1) != INTEGER_CST))
      rhs1 = build_and_insert_cast (gsi, loc,
                                   build_nonstandard_integer_type
                                     (actual_precision, from_unsigned1), rhs1);
    if (actual_precision != TYPE_PRECISION (type2)
-      || from_unsigned2 != TYPE_UNSIGNED (type2))
+      || from_unsigned2 != TYPE_UNSIGNED (type2)
+      || (TREE_TYPE (rhs2) != type2
+         && TREE_CODE (rhs2) != INTEGER_CST))
      rhs2 = build_and_insert_cast (gsi, loc,
                                   build_nonstandard_integer_type
                                     (actual_precision, from_unsigned2), rhs2);
@@ -3046,7 +3087,7 @@ convert_plusminus_to_widen (gimple_stmt_iterator *gsi, gimple *stmt,
        || from_unsigned1 != TYPE_UNSIGNED (type1))
      mult_rhs1 = build_and_insert_cast (gsi, loc,
                                        build_nonstandard_integer_type
-                                        (actual_precision, from_unsigned1),
+                                        (actual_precision, from_unsigned1),
                                        mult_rhs1);
    if (actual_precision != TYPE_PRECISION (type2)
        || from_unsigned2 != TYPE_UNSIGNED (type2))
author	Roger Sayle <roger@nextmovesoftware.com>
	Thu, 1 Feb 2024 06:10:42 +0000 (06:10 +0000)
committer	Roger Sayle <roger@nextmovesoftware.com>
	Thu, 1 Feb 2024 06:10:42 +0000 (06:10 +0000)
gcc/testsuite/g++.target/i386/pr113560.C	[new file with mode: 0644]	patch \| blob
gcc/testsuite/gcc.dg/pr87954.c		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/i386/pr113560.c	[new file with mode: 0644]	patch \| blob
gcc/tree-ssa-math-opts.cc		patch \| blob \| blame \| history