[i386] Reject too large vectors for partial vector vectorization

author Richard Biener <rguenther@suse.de>

Mon, 19 Jun 2023 10:28:32 +0000 (12:28 +0200)

committer Richard Biener <rguenther@suse.de>

Wed, 21 Jun 2023 07:10:13 +0000 (09:10 +0200)
author Richard Biener <rguenther@suse.de>
Mon, 19 Jun 2023 10:28:32 +0000 (12:28 +0200)
committer Richard Biener <rguenther@suse.de>
Wed, 21 Jun 2023 07:10:13 +0000 (09:10 +0200)
diff --git a/gcc/config/i386/i386.cc b/gcc/config/i386/i386.cc

index b20cb86b822e2e1ccb49c8f3f82fadf97e36afe8..32851a514a92e2aa45c1c35fae9458830e089815 100644 (file)
--- a/gcc/config/i386/i386.cc
+++ b/gcc/config/i386/i386.cc
@@ -23666,6 +23666,7 @@ class ix86_vector_costs : public vector_costs
                               stmt_vec_info stmt_info, slp_tree node,
                               tree vectype, int misalign,
                               vect_cost_model_location where) override;
+  void finish_cost (const vector_costs *) override;
  };
  
  /* Implement targetm.vectorize.create_costs.  */
@@ -23918,6 +23919,31 @@ ix86_vector_costs::add_stmt_cost (int count, vect_cost_for_stmt kind,
    return retval;
  }
  
+void
+ix86_vector_costs::finish_cost (const vector_costs *scalar_costs)
+{
+  loop_vec_info loop_vinfo = dyn_cast<loop_vec_info> (m_vinfo);
+  if (loop_vinfo && !m_costing_for_scalar)
+    {
+      /* We are currently not asking the vectorizer to compare costs
+        between different vector mode sizes.  When using predication
+        that will end up always choosing the preferred mode size even
+        if there's a smaller mode covering all lanes.  Test for this
+        situation and artificially reject the larger mode attempt.
+        ???  We currently lack masked ops for sub-SSE sized modes,
+        so we could restrict this rejection to AVX and AVX512 modes
+        but err on the safe side for now.  */
+      if (LOOP_VINFO_USING_PARTIAL_VECTORS_P (loop_vinfo)
+         && !LOOP_VINFO_EPILOGUE_P (loop_vinfo)
+         && LOOP_VINFO_NITERS_KNOWN_P (loop_vinfo)
+         && (exact_log2 (LOOP_VINFO_VECT_FACTOR (loop_vinfo).to_constant ())
+             > ceil_log2 (LOOP_VINFO_INT_NITERS (loop_vinfo))))
+       m_costs[vect_body] = INT_MAX;
+    }
+
+  vector_costs::finish_cost (scalar_costs);
+}
+
  /* Validate target specific memory model bits in VAL. */
  
  static unsigned HOST_WIDE_INT
diff --git a/gcc/testsuite/gcc.target/i386/vect-partial-vectors-1.c b/gcc/testsuite/gcc.target/i386/vect-partial-vectors-1.c

new file mode 100644 (file)

index 0000000..3834720
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/vect-partial-vectors-1.c
@@ -0,0 +1,13 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -mavx512f -mavx512vl -mprefer-vector-width=512 --param vect-partial-vector-usage=1" } */
+
+void foo (int * __restrict a, int *b)
+{
+  for (int i = 0; i < 4; ++i)
+    a[i] = b[i] + 42;
+}
+
+/* We do not want to optimize this using masked AVX or AVX512
+   but unmasked SSE.  */
+/* { dg-final { scan-assembler-not "\[yz\]mm" } } */
+/* { dg-final { scan-assembler "xmm" } } */
diff --git a/gcc/testsuite/gcc.target/i386/vect-partial-vectors-2.c b/gcc/testsuite/gcc.target/i386/vect-partial-vectors-2.c

new file mode 100644 (file)

index 0000000..4ab2cbc
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/vect-partial-vectors-2.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -mavx512f -mavx512vl -mprefer-vector-width=512 --param vect-partial-vector-usage=1" } */
+
+void foo (int * __restrict a, int *b)
+{
+  for (int i = 0; i < 7; ++i)
+    a[i] = b[i] + 42;
+}
+
+/* We want to optimize this using masked AVX, not AVX512 or SSE.  */
+/* { dg-final { scan-assembler-not "zmm" } } */
+/* { dg-final { scan-assembler "ymm\[^\r\n\]*\{%k" } } */
author	Richard Biener <rguenther@suse.de>
	Mon, 19 Jun 2023 10:28:32 +0000 (12:28 +0200)
committer	Richard Biener <rguenther@suse.de>
	Wed, 21 Jun 2023 07:10:13 +0000 (09:10 +0200)
gcc/config/i386/i386.cc		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/i386/vect-partial-vectors-1.c	[new file with mode: 0644]	patch \| blob
gcc/testsuite/gcc.target/i386/vect-partial-vectors-2.c	[new file with mode: 0644]	patch \| blob