vect: Fix insufficient alignment requirement for speculative loads [PR121190]

author Pengfei Li <Pengfei.Li2@arm.com>

Wed, 30 Jul 2025 09:51:11 +0000 (10:51 +0100)

committer Tamar Christina <tamar.christina@arm.com>

Thu, 31 Jul 2025 05:01:42 +0000 (06:01 +0100)
author Pengfei Li <Pengfei.Li2@arm.com>
Wed, 30 Jul 2025 09:51:11 +0000 (10:51 +0100)
committer Tamar Christina <tamar.christina@arm.com>
Thu, 31 Jul 2025 05:01:42 +0000 (06:01 +0100)
diff --git a/gcc/testsuite/gcc.dg/vect/vect-early-break_137-pr121190.c b/gcc/testsuite/gcc.dg/vect/vect-early-break_137-pr121190.c

new file mode 100644 (file)

index 0000000..e6b071c
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/vect-early-break_137-pr121190.c
@@ -0,0 +1,62 @@
+/* PR tree-optimization/121190 */
+/* { dg-options "-O3" } */
+/* { dg-additional-options "-march=znver2" { target x86_64-*-* i?86-*-* } } */
+/* { dg-require-effective-target mmap } */
+/* { dg-require-effective-target vect_early_break } */
+
+#include <stdint.h>
+#include <string.h>
+#include <stdio.h>
+#include <sys/mman.h>
+#include <unistd.h>
+#include "tree-vect.h"
+
+#define MAX_COMPARE 5000
+
+__attribute__((noipa))
+int diff (uint64_t *restrict p, uint64_t *restrict q)  /* Index of the first element where p and q differ, or -1.  */
+{
+  int i = 0;
+  while (i < MAX_COMPARE) {  /* Compare at most MAX_COMPARE elements.  */
+    if (*(p + i) != *(q + i))
+      return i;  /* Early exit: nothing past the first mismatch needs to be read.  */
+    i++;
+  }
+  return -1;  /* The first MAX_COMPARE elements are all equal.  */
+}
+
+int main ()
+{
+  check_vect ();
+
+  long pgsz = sysconf (_SC_PAGESIZE);
+  if (pgsz == -1) {
+    fprintf (stderr, "sysconf failed\n");
+    return 0;  /* Exit with status 0 without running the checks.  */
+  }
+
+  /* Allocate 2 consecutive pages of memory and let p1 and p2 point to the
+     beginning of each.  */
+  void *mem = mmap (NULL, pgsz * 2, PROT_READ | PROT_WRITE,
+                   MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
+  if (mem == MAP_FAILED) {
+    fprintf (stderr, "mmap failed\n");
+    return 0;  /* Exit with status 0 without running the checks.  */
+  }
+  uint64_t *p1 = (uint64_t *) mem;
+  uint64_t *p2 = (uint64_t *) mem + pgsz / sizeof (uint64_t);
+
+  /* Fill the first page with zeros, except for its last 64 bits.  */
+  memset (p1, 0, pgsz);
+  *(p2 - 1) = -1;  /* The last 64-bit word of the first page becomes all-ones.  */
+
+  /* Make the 2nd page inaccessible.  */
+  mprotect (p2, pgsz, PROT_NONE);  /* NOTE(review): return value is not checked; if this fails, reads of the 2nd page would go undetected.  */
+
+  /* Calls to diff should not read the 2nd page.  */
+  for (int i = 1; i <= 20; i++) {  /* Start the first operand 1 to 20 elements before the page boundary.  */
+    if (diff (p2 - i, p1) != i - 1)  /* The first mismatch is the all-ones word, at index i - 1.  */
+      __builtin_abort ();
+  }
+}
+
diff --git a/gcc/testsuite/gcc.dg/vect/vect-early-break_52.c b/gcc/testsuite/gcc.dg/vect/vect-early-break_52.c

index 86a632f2a82291b3063a57cd62f2310ed6d5c747..6abfcd6580e4a5b4213efc31ecba1beb483f3d98 100644 (file)
--- a/gcc/testsuite/gcc.dg/vect/vect-early-break_52.c
+++ b/gcc/testsuite/gcc.dg/vect/vect-early-break_52.c
@@ -18,4 +18,4 @@ int main1 (short X)
      }
  }
  
-/* { dg-final { scan-tree-dump "vectorized 1 loops in function" "vect" { target { ! "x86_64-*-* i?86-*-*" } } } } */
+/* { dg-final { scan-tree-dump "vectorized 1 loops in function" "vect" { target { ! "x86_64-*-* i?86-*-* arm*-*-*" } } } } */
diff --git a/gcc/tree-vect-data-refs.cc b/gcc/tree-vect-data-refs.cc

index 85145f94516a5261dabdeb234c0e6ab67d0972a6..abb76b641838d52294bf1ed6bb1ea498b44f7f32 100644 (file)
--- a/gcc/tree-vect-data-refs.cc
+++ b/gcc/tree-vect-data-refs.cc
@@ -2758,12 +2758,14 @@ vect_enhance_data_refs_alignment (loop_vec_info loop_vinfo)
       2) there is at least one unsupported misaligned data ref with an unknown
          misalignment, and
       3) all misaligned data refs with a known misalignment are supported, and
-     4) the number of runtime alignment checks is within reason.  */
+     4) the number of runtime alignment checks is within reason, and
+     5) the vectorization factor is a constant.  */
  
    do_versioning
      = (optimize_loop_nest_for_speed_p (loop)
         && !loop->inner /* FORNOW */
-       && loop_cost_model (loop) > VECT_COST_MODEL_CHEAP);
+       && loop_cost_model (loop) > VECT_COST_MODEL_CHEAP)
+       && LOOP_VINFO_VECT_FACTOR (loop_vinfo).is_constant ();
  
    if (do_versioning)
      {
@@ -2804,17 +2806,6 @@ vect_enhance_data_refs_alignment (loop_vec_info loop_vinfo)
                    break;
                  }
  
-             /* At present we don't support versioning for alignment
-                with variable VF, since there's no guarantee that the
-                VF is a power of two.  We could relax this if we added
-                a way of enforcing a power-of-two size.  */
-             unsigned HOST_WIDE_INT size;
-             if (!GET_MODE_SIZE (TYPE_MODE (vectype)).is_constant (&size))
-               {
-                 do_versioning = false;
-                 break;
-               }
-
               /* Forcing alignment in the first iteration is no good if
                  we don't keep it across iterations.  For now, just disable
                  versioning in this case.
@@ -2833,7 +2824,8 @@ vect_enhance_data_refs_alignment (loop_vec_info loop_vinfo)
                   Construct the mask needed for this test.  For example,
                   GET_MODE_SIZE for the vector mode V4SI is 16 bytes so the
                   mask must be 15 = 0xf. */
-             int mask = size - 1;
+             gcc_assert (DR_TARGET_ALIGNMENT (dr_info).is_constant ());
+             int mask = DR_TARGET_ALIGNMENT (dr_info).to_constant () - 1;
  
               /* FORNOW: use the same mask to test all potentially unaligned
                  references in the loop.  */
author	Pengfei Li <Pengfei.Li2@arm.com>
	Wed, 30 Jul 2025 09:51:11 +0000 (10:51 +0100)
committer	Tamar Christina <tamar.christina@arm.com>
	Thu, 31 Jul 2025 05:01:42 +0000 (06:01 +0100)
gcc/testsuite/gcc.dg/vect/vect-early-break_137-pr121190.c	[new file with mode: 0644]	patch \| blob
gcc/testsuite/gcc.dg/vect/vect-early-break_52.c		patch \| blob \| blame \| history
gcc/tree-vect-data-refs.cc		patch \| blob \| blame \| history