aarch64: PR target/123584 - Fix expansion of SHA3 XAR with 0 amount

author Kyrylo Tkachov <ktkachov@nvidia.com>

Thu, 15 Jan 2026 13:10:31 +0000 (05:10 -0800)

committer Kyrylo Tkachov <ktkachov@nvidia.com>

Tue, 20 Jan 2026 12:55:34 +0000 (13:55 +0100)
author Kyrylo Tkachov <ktkachov@nvidia.com>
Thu, 15 Jan 2026 13:10:31 +0000 (05:10 -0800)
committer Kyrylo Tkachov <ktkachov@nvidia.com>
Tue, 20 Jan 2026 12:55:34 +0000 (13:55 +0100)
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md

index 7a38310efce85b60236dabe51d4d239e936238f9..0ef7339a40a77be91200af3aa3230f41821fa626 100644 (file)
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -9579,9 +9579,13 @@
          (match_operand:V2DI 3 "aarch64_simd_lshift_imm" "Dl")))]
    "TARGET_SHA3"
    {
+    /* Translate the RTL left-rotate amount into the assembly right-rotate
+       amount.  Modulo by 64 to ensure that a left-rotate of 0 is emitted
+       as a right-rotate of 0 as accepted by the assembly instruction.  */
      operands[3]
-      = GEN_INT (64 - INTVAL (unwrap_const_vec_duplicate (operands[3])));
-    return "xar\\t%0.2d, %1.2d, %2.2d, %3";
+      = GEN_INT ((64 - INTVAL (unwrap_const_vec_duplicate (operands[3])))
+                 % 64);
+    return "xar\\t%0.2d, %1.2d, %2.2d, #%3";
    }
    [(set_attr "type" "crypto_sha3")]
  )
@@ -9601,9 +9605,12 @@
          (match_operand:SI 3 "aarch64_simd_shift_imm_di")))]
    "TARGET_SHA3"
    {
-    operands[3]
-      = aarch64_simd_gen_const_vector_dup (V2DImode,
-                                          64 - INTVAL (operands[3]));
+      operands[3]
+        = aarch64_simd_gen_const_vector_dup (V2DImode,
+                                            /* In the edge case of a 0 rotate
+                                               amount leave as is.  */
+                                            operands[3] == CONST0_RTX (SImode)
+                                              ? 0 : 64 - INTVAL (operands[3]));
    }
  )
  
diff --git a/gcc/testsuite/gcc.target/aarch64/torture/xar-zero.c b/gcc/testsuite/gcc.target/aarch64/torture/xar-zero.c

new file mode 100644 (file)

index 0000000..379c5b7
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/torture/xar-zero.c
@@ -0,0 +1,9 @@
+/* PR target/123584: check that vxarq_u64 with a rotate amount of 0 compiles.  */
+/* { dg-do compile } */
+/* { dg-options "-march=armv8.2-a+sha3" } */
+
+#include <arm_neon.h>
+uint64x2_t
+simde_vld1q_u64(uint64x2_t simde_vld1q_u64_a, uint64x2_t simde_vld1q_u64_b) {
+  return vxarq_u64(simde_vld1q_u64_a, simde_vld1q_u64_b, 0);
+}
author	Kyrylo Tkachov <ktkachov@nvidia.com>
	Thu, 15 Jan 2026 13:10:31 +0000 (05:10 -0800)
committer	Kyrylo Tkachov <ktkachov@nvidia.com>
	Tue, 20 Jan 2026 12:55:34 +0000 (13:55 +0100)
gcc/config/aarch64/aarch64-simd.md		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/torture/xar-zero.c	[new file with mode: 0644]	patch | blob