aarch64: PR target/121749: Use correct predicate for narrowing shift amounts

author Kyrylo Tkachov <ktkachov@nvidia.com>

Tue, 2 Sep 2025 07:43:14 +0000 (00:43 -0700)

committer Kyrylo Tkachov <ktkachov@nvidia.com>

Mon, 15 Sep 2025 14:13:14 +0000 (16:13 +0200)
author Kyrylo Tkachov <ktkachov@nvidia.com>
Tue, 2 Sep 2025 07:43:14 +0000 (00:43 -0700)
committer Kyrylo Tkachov <ktkachov@nvidia.com>
Mon, 15 Sep 2025 14:13:14 +0000 (16:13 +0200)
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md

index e2afe87e5130cc066b8348659209ab40747327e5..97558c9687cea40f4ccb905774150baa61d5df4d 100644 (file)
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -6678,7 +6678,7 @@
         (SAT_TRUNC:<VNARROWQ>
           (<TRUNC_SHIFT>:SD_HSDI
             (match_operand:SD_HSDI 1 "register_operand" "w")
-           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))))]
+           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))))]
    "TARGET_SIMD"
    "<shrn_op>shrn\t%<vn2>0<Vmntype>, %<v>1<Vmtype>, %2"
    [(set_attr "type" "neon_shift_imm_narrow_q")]
@@ -6700,7 +6700,7 @@
         (ALL_TRUNC:<VNARROWQ>
           (<TRUNC_SHIFT>:VQN
             (match_operand:VQN 1 "register_operand")
-           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))))]
+           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))))]
    "TARGET_SIMD"
    {
      operands[2] = aarch64_simd_gen_const_vector_dup (<MODE>mode,
@@ -6731,7 +6731,7 @@
               (<TRUNCEXTEND>:<DWI>
                 (match_operand:SD_HSDI 1 "register_operand" "w"))
               (match_operand:<DWI> 3 "aarch64_int_rnd_operand"))
-           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))))]
+           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))))]
    "TARGET_SIMD
     && aarch64_const_vec_rnd_cst_p (operands[3], operands[2])"
    "<shrn_op>rshrn\t%<vn2>0<Vmntype>, %<v>1<Vmtype>, %2"
@@ -6746,7 +6746,7 @@
               (<TRUNCEXTEND>:<V2XWIDE>
                 (match_operand:SD_HSDI 1 "register_operand"))
               (match_dup 3))
-           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))))]
+           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))))]
    "TARGET_SIMD"
    {
      /* Use this expander to create the rounding constant vector, which is
@@ -6766,7 +6766,7 @@
               (<TRUNCEXTEND>:<V2XWIDE>
                 (match_operand:VQN 1 "register_operand"))
               (match_dup 3))
-           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))))]
+           (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))))]
    "TARGET_SIMD"
    {
      if (<CODE> == TRUNCATE
@@ -6808,7 +6808,7 @@
           (smax:SD_HSDI
             (ashiftrt:SD_HSDI
               (match_operand:SD_HSDI 1 "register_operand" "w")
-             (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))
+             (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))
             (const_int 0))
           (const_int <half_mask>)))]
    "TARGET_SIMD"
@@ -6819,7 +6819,7 @@
  (define_expand "aarch64_sqshrun_n<mode>"
    [(match_operand:<VNARROWQ> 0 "register_operand")
     (match_operand:SD_HSDI 1 "register_operand")
-   (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>")]
+   (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>")]
    "TARGET_SIMD"
    {
      rtx dst = gen_reg_rtx (<MODE>mode);
@@ -6837,7 +6837,7 @@
             (smax:VQN
               (ashiftrt:VQN
                 (match_operand:VQN 1 "register_operand")
-               (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))
+               (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))
               (match_dup 3))
             (match_dup 4))))]
    "TARGET_SIMD"
@@ -6879,7 +6879,7 @@
                 (sign_extend:<DWI>
                   (match_operand:SD_HSDI 1 "register_operand" "w"))
                 (match_operand:<DWI> 3 "aarch64_int_rnd_operand"))
-             (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))
+             (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))
             (const_int 0))
           (const_int <half_mask>)))]
    "TARGET_SIMD
@@ -6891,7 +6891,7 @@
  (define_expand "aarch64_sqrshrun_n<mode>"
    [(match_operand:<VNARROWQ> 0 "register_operand")
     (match_operand:SD_HSDI 1 "register_operand")
-   (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>")]
+   (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>")]
    "TARGET_SIMD"
    {
      int prec = GET_MODE_UNIT_PRECISION (<DWI>mode);
@@ -6914,7 +6914,7 @@
                   (sign_extend:<V2XWIDE>
                     (match_operand:VQN 1 "register_operand"))
                   (match_dup 3))
-               (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<ve_mode>"))
+               (match_operand:SI 2 "aarch64_simd_shift_imm_offset_<vn_mode>"))
               (match_dup 4))
             (match_dup 5))))]
    "TARGET_SIMD"
diff --git a/gcc/config/aarch64/iterators.md b/gcc/config/aarch64/iterators.md

index 47a9bdf2d038b7e7d0211a5c4ed9d3b3e3b1fa5e..4d60322b45ddb310a83375c2817a8a95b6c7d4b4 100644 (file)
--- a/gcc/config/aarch64/iterators.md
+++ b/gcc/config/aarch64/iterators.md
@@ -2126,7 +2126,8 @@
                            (SI   "si")])
  
  ;; Like ve_mode but for the half-width modes.
-(define_mode_attr vn_mode [(V8HI  "qi") (V4SI  "hi") (V2DI  "si")])
+(define_mode_attr vn_mode [(V8HI  "qi") (V4SI  "hi") (V2DI  "si") (DI "si")
+                          (SI "hi") (HI "qi")])
  
  ;; Vm for lane instructions is restricted to FP_LO_REGS.
  (define_mode_attr vwx [(V4HI "x") (V8HI "x") (HI "x")
diff --git a/gcc/testsuite/gcc.target/aarch64/simd/pr121749.c b/gcc/testsuite/gcc.target/aarch64/simd/pr121749.c

new file mode 100644 (file)

index 0000000..c4e1a2d
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/simd/pr121749.c
@@ -0,0 +1,11 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+#include <arm_neon.h>
+/* PR target/121749: narrowing shift of an already right-shifted value.  */
+uint32_t
+foo (uint64_t v0)
+{
+  return vqshrnd_n_u64 (vshrd_n_u64 (v0, 26), 7);
+}
+
author	Kyrylo Tkachov <ktkachov@nvidia.com>
	Tue, 2 Sep 2025 07:43:14 +0000 (00:43 -0700)
committer	Kyrylo Tkachov <ktkachov@nvidia.com>
	Mon, 15 Sep 2025 14:13:14 +0000 (16:13 +0200)
gcc/config/aarch64/aarch64-simd.md		patch | blob | blame | history
gcc/config/aarch64/iterators.md		patch | blob | blame | history
gcc/testsuite/gcc.target/aarch64/simd/pr121749.c	[new file with mode: 0644]	patch | blob