[x86] override vector_costs::better_main_loop_than_p

author Richard Biener <rguenther@suse.de>

Tue, 28 Apr 2026 09:00:38 +0000 (11:00 +0200)

committer Richard Biener <rguenth@gcc.gnu.org>

Thu, 30 Apr 2026 06:12:46 +0000 (08:12 +0200)
author Richard Biener <rguenther@suse.de>
Tue, 28 Apr 2026 09:00:38 +0000 (11:00 +0200)
committer Richard Biener <rguenth@gcc.gnu.org>
Thu, 30 Apr 2026 06:12:46 +0000 (08:12 +0200)
diff --git a/gcc/config/i386/i386.cc b/gcc/config/i386/i386.cc

index cfec6845c1688661bd6e0adb8843bb76087fd5ab..b92338bc6dd091d54369939b97ed82425a4f4be0 100644 (file)
--- a/gcc/config/i386/i386.cc
+++ b/gcc/config/i386/i386.cc
@@ -26128,6 +26128,7 @@ public:
                               tree vectype, int misalign,
                               vect_cost_model_location where) override;
    void finish_cost (const vector_costs *) override;
+  bool better_main_loop_than_p (const vector_costs *) const override;
  
  private:
  
@@ -26987,6 +26988,28 @@ ix86_vector_costs::finish_cost (const vector_costs *scalar_costs)
    vector_costs::finish_cost (scalar_costs);
  }
  
+/* Return true if THIS should be preferred over OTHER as main vector loop.  */
+
+bool
+ix86_vector_costs::better_main_loop_than_p (const vector_costs *other) const
+{
+  loop_vec_info this_loop_vinfo = as_a<loop_vec_info> (this->vinfo ());
+  loop_vec_info other_loop_vinfo = as_a<loop_vec_info> (other->vinfo ());
+
+  /* If the other loop is masked it does not need an epilogue.  Prefer that
+     if the current loop, even with vector epilogues, cannot be vectorized
+     such that at most one scalar iteration is left.  */
+  if (LOOP_VINFO_NITERS_KNOWN_P (this_loop_vinfo)
+      && LOOP_VINFO_USING_PARTIAL_VECTORS_P (other_loop_vinfo)
+      && known_gt (LOOP_VINFO_VECT_FACTOR (other_loop_vinfo),
+                  LOOP_VINFO_INT_NITERS (this_loop_vinfo))
+      && (popcount_hwi (LOOP_VINFO_INT_NITERS (this_loop_vinfo) & ~1)
+         > (param_vect_epilogues_nomask != 0)))
+    return false;
+
+  return vector_costs::better_main_loop_than_p (other);
+}
+
  /* Validate target specific memory model bits in VAL. */
  
  static unsigned HOST_WIDE_INT
diff --git a/gcc/tree-vectorizer.h b/gcc/tree-vectorizer.h

index c01b17b3ee69e08f46e7fbe22fa5aacff13255d2..de50ed3277c475c130cbe223ade6501a7bb22045 100644 (file)
--- a/gcc/tree-vectorizer.h
+++ b/gcc/tree-vectorizer.h
@@ -1804,8 +1804,11 @@ public:
    unsigned int epilogue_cost () const;
    unsigned int outside_cost () const;
    unsigned int total_cost () const;
+
    unsigned int suggested_unroll_factor () const;
    machine_mode suggested_epilogue_mode (int &masked) const;
+
+  vec_info *vinfo () const { return m_vinfo; }
    bool costing_for_scalar () const { return m_costing_for_scalar; }
  
  protected:
author	Richard Biener <rguenther@suse.de>
	Tue, 28 Apr 2026 09:00:38 +0000 (11:00 +0200)
committer	Richard Biener <rguenth@gcc.gnu.org>
	Thu, 30 Apr 2026 06:12:46 +0000 (08:12 +0200)
gcc/config/i386/i386.cc		patch \| blob \| blame \| history
gcc/tree-vectorizer.h		patch \| blob \| blame \| history