gimple: allow more folding of memcpy [PR102125]

author Richard Earnshaw <rearnsha@arm.com>

Fri, 3 Sep 2021 16:06:15 +0000 (17:06 +0100)

committer Richard Earnshaw <rearnsha@arm.com>

Mon, 13 Sep 2021 10:26:48 +0000 (11:26 +0100)
author Richard Earnshaw <rearnsha@arm.com>
Fri, 3 Sep 2021 16:06:15 +0000 (17:06 +0100)
committer Richard Earnshaw <rearnsha@arm.com>
Mon, 13 Sep 2021 10:26:48 +0000 (11:26 +0100)
diff --git a/gcc/gimple-fold.c b/gcc/gimple-fold.c

index dd0e6b5daffa7ff7ce3f2acd67fd734a832b2ab4..6fea8a6f9fdb51d5dd717a28f3d2f49efbf59d75 100644 (file)
--- a/gcc/gimple-fold.c
+++ b/gcc/gimple-fold.c
@@ -67,6 +67,8 @@ along with GCC; see the file COPYING3.  If not see
  #include "tree-vector-builder.h"
  #include "tree-ssa-strlen.h"
  #include "varasm.h"
+#include "memmodel.h"
+#include "optabs.h"
  
  enum strlen_range_kind {
    /* Compute the exact constant string length.  */
@@ -957,14 +959,17 @@ gimple_fold_builtin_memory_op (gimple_stmt_iterator *gsi,
         = build_int_cst (build_pointer_type_for_mode (char_type_node,
                                                       ptr_mode, true), 0);
  
-      /* If we can perform the copy efficiently with first doing all loads
-         and then all stores inline it that way.  Currently efficiently
-        means that we can load all the memory into a single integer
-        register which is what MOVE_MAX gives us.  */
+      /* If we can perform the copy efficiently with first doing all loads and
+        then all stores inline it that way.  Currently efficiently means that
+        we can load all the memory with a single set operation and that the
+        total size is less than MOVE_MAX * MOVE_RATIO.  */
        src_align = get_pointer_alignment (src);
        dest_align = get_pointer_alignment (dest);
        if (tree_fits_uhwi_p (len)
-         && compare_tree_int (len, MOVE_MAX) <= 0
+         && (compare_tree_int
+             (len, (MOVE_MAX
+                    * MOVE_RATIO (optimize_function_for_size_p (cfun))))
+             <= 0)
           /* FIXME: Don't transform copies from strings with known length.
              Until GCC 9 this prevented a case in gcc.dg/strlenopt-8.c
              from being handled, and the case was XFAILed for that reason.
@@ -1000,6 +1005,7 @@ gimple_fold_builtin_memory_op (gimple_stmt_iterator *gsi,
               if (type
                   && is_a <scalar_int_mode> (TYPE_MODE (type), &mode)
                   && GET_MODE_SIZE (mode) * BITS_PER_UNIT == ilen * 8
+                 && have_insn_for (SET, mode)
                   /* If the destination pointer is not aligned we must be able
                      to emit an unaligned store.  */
                   && (dest_align >= GET_MODE_ALIGNMENT (mode)
author	Richard Earnshaw <rearnsha@arm.com>
	Fri, 3 Sep 2021 16:06:15 +0000 (17:06 +0100)
committer	Richard Earnshaw <rearnsha@arm.com>
	Mon, 13 Sep 2021 10:26:48 +0000 (11:26 +0100)