]> git.ipfire.org Git - thirdparty/gcc.git/commitdiff
aarch64: Set loop_align to 64:16 for NVIDIA Olympus
author Kyrylo Tkachov <ktkachov@nvidia.com>
Tue, 17 Mar 2026 08:48:01 +0000 (01:48 -0700)
committer Kyrylo Tkachov <ktkachov@nvidia.com>
Fri, 20 Mar 2026 15:50:34 +0000 (16:50 +0100)
The Olympus core benefits from a larger, more relaxed alignment on hot loops.

Bootstrapped and tested on aarch64-none-linux-gnu.
Pushing to trunk.

Signed-off-by: Kyrylo Tkachov <ktkachov@nvidia.com>
gcc/ChangeLog

* config/aarch64/tuning_models/olympus.h (olympus_tunings): Set
loop_align to 64:16.

gcc/config/aarch64/tuning_models/olympus.h

index 29b87a40f68f548c9c0f0d523514992142b7d9bf..745a5ff064970cb795abfce57333174834057329 100644 (file)
@@ -547,7 +547,7 @@ static struct tune_params olympus_tunings =
   AARCH64_FUSE_NEOVERSE_BASE, /* fusible_ops  */
   "32:16",     /* function_align.  */
   "4",         /* jump_align.  */
-  "32:16",     /* loop_align.  */
+  "64:16",     /* loop_align.  */
   8,   /* int_reassoc_width.  */
   6,   /* fp_reassoc_width.  */
   4,   /* fma_reassoc_width.  */