aarch64: Emit ADD X, Y, Y instead of SHL X, Y, #1 for Advanced SIMD

author Kyrylo Tkachov <ktkachov@nvidia.com>

Mon, 5 Aug 2024 18:29:44 +0000 (11:29 -0700)

committer Kyrylo Tkachov <ktkachov@nvidia.com>

Mon, 12 Aug 2024 09:41:04 +0000 (11:41 +0200)
author Kyrylo Tkachov <ktkachov@nvidia.com>
Mon, 5 Aug 2024 18:29:44 +0000 (11:29 -0700)
committer Kyrylo Tkachov <ktkachov@nvidia.com>
Mon, 12 Aug 2024 09:41:04 +0000 (11:41 +0200)
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md

index cc612ec2ca0e3d84df410242c48ff60211ae7613..475f19766c38e38bff7ea683c98165629e9f02c5 100644 (file)
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -1352,12 +1352,14 @@
  )
  
  (define_insn "aarch64_simd_imm_shl<mode><vczle><vczbe>"
- [(set (match_operand:VDQ_I 0 "register_operand" "=w")
-       (ashift:VDQ_I (match_operand:VDQ_I 1 "register_operand" "w")
-                  (match_operand:VDQ_I  2 "aarch64_simd_lshift_imm" "Dl")))]
+ [(set (match_operand:VDQ_I 0 "register_operand")
+       (ashift:VDQ_I (match_operand:VDQ_I 1 "register_operand")
+                  (match_operand:VDQ_I  2 "aarch64_simd_lshift_imm")))]
   "TARGET_SIMD"
-  "shl\t%0.<Vtype>, %1.<Vtype>, %2"
-  [(set_attr "type" "neon_shift_imm<q>")]
+  {@ [ cons: =0, 1,  2   ; attrs: type       ]
+     [ w       , w,  vs1 ; neon_add<q>       ] add\t%0.<Vtype>, %1.<Vtype>, %1.<Vtype>
+     [ w       , w,  Dl  ; neon_shift_imm<q> ] shl\t%0.<Vtype>, %1.<Vtype>, %2
+  }
  )
  
  (define_insn "aarch64_simd_reg_sshl<mode><vczle><vczbe>"
diff --git a/gcc/config/aarch64/constraints.md b/gcc/config/aarch64/constraints.md

index a2878f580d909d694a55b3d0e2b2c78d7abe2930..f491e4bd6a069bc9f8a3c71bdec14496c862a94d 100644 (file)
--- a/gcc/config/aarch64/constraints.md
+++ b/gcc/config/aarch64/constraints.md
@@ -667,6 +667,12 @@
     SMAX and SMIN operations."
   (match_operand 0 "aarch64_sve_vsm_immediate"))
  
+(define_constraint "vs1"
+  "@internal
+ A constraint that matches a vector of immediate one."
+ (and (match_code "const,const_vector")
+      (match_test "op == CONST1_RTX (GET_MODE (op))")))
+
  (define_constraint "vsA"
    "@internal
     A constraint that matches an immediate operand valid for SVE FADD
diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd_shl_add.c b/gcc/testsuite/gcc.target/aarch64/advsimd_shl_add.c

new file mode 100644 (file)

index 0000000..a161f89
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/advsimd_shl_add.c
@@ -0,0 +1,64 @@
+/* { dg-do compile } */
+/* { dg-additional-options "--save-temps -O1" } */
+/* { dg-final { check-function-bodies "**" "" "" } } */
+
+typedef __INT64_TYPE__ __attribute__ ((vector_size (16))) v2di;
+typedef int __attribute__ ((vector_size (16))) v4si;
+typedef short __attribute__ ((vector_size (16))) v8hi;
+typedef char __attribute__ ((vector_size (16))) v16qi;
+typedef short __attribute__ ((vector_size (8))) v4hi;
+typedef char __attribute__ ((vector_size (8))) v8qi;
+
+#define FUNC(S) \
+S               \
+foo_##S (S a)   \
+{ return a << 1; }
+
+/*
+** foo_v2di:
+**      add    v0.2d, v0.2d, v0.2d
+**      ret
+*/
+
+FUNC (v2di)
+
+/*
+** foo_v4si:
+**      add    v0.4s, v0.4s, v0.4s
+**      ret
+*/
+
+FUNC (v4si)
+
+/*
+** foo_v8hi:
+**      add    v0.8h, v0.8h, v0.8h
+**      ret
+*/
+
+FUNC (v8hi)
+
+/*
+** foo_v16qi:
+**      add    v0.16b, v0.16b, v0.16b
+**      ret
+*/
+
+FUNC (v16qi)
+
+/*
+** foo_v4hi:
+**      add    v0.4h, v0.4h, v0.4h
+**      ret
+*/
+
+FUNC (v4hi)
+
+/*
+** foo_v8qi:
+**      add    v0.8b, v0.8b, v0.8b
+**      ret
+*/
+
+FUNC (v8qi)
+
author	Kyrylo Tkachov <ktkachov@nvidia.com>
	Mon, 5 Aug 2024 18:29:44 +0000 (11:29 -0700)
committer	Kyrylo Tkachov <ktkachov@nvidia.com>
	Mon, 12 Aug 2024 09:41:04 +0000 (11:41 +0200)
gcc/config/aarch64/aarch64-simd.md		patch \| blob \| blame \| history
gcc/config/aarch64/constraints.md		patch \| blob \| blame \| history
gcc/testsuite/gcc.target/aarch64/advsimd_shl_add.c	[new file with mode: 0644]	patch \| blob