From: Kyrylo Tkachov
Date: Sun, 23 Apr 2023 13:44:13 +0000 (+0100)
Subject: aarch64: Annotate fcvtn pattern for vec_concat with zeroes
X-Git-Tag: basepoints/gcc-15~9960
X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=7e26fd6bcd39f53bc917f55f8cce6101180c1dcd;p=thirdparty%2Fgcc.git

aarch64: Annotate fcvtn pattern for vec_concat with zeroes

Using the define_substs in aarch64-simd.md this is a straightforward
annotation to remove a redundant fmov insn.
So the codegen goes from:
foo_d:
        fcvtn   v0.2s, v0.2d
        fmov    d0, d0
        ret

to the simple:
foo_d:
        fcvtn   v0.2s, v0.2d
        ret

Bootstrapped and tested on aarch64-none-linux-gnu.

gcc/ChangeLog:

	* config/aarch64/aarch64-simd.md (aarch64_float_truncate_lo_<mode>):
	Rename to...
	(aarch64_float_truncate_lo_<mode><vczle><vczbe>): ... This.

gcc/testsuite/ChangeLog:

	* gcc.target/aarch64/float_truncate_zero.c: New test.
---

diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md
index 4a1ec71995da..7bd4362318b6 100644
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -3331,7 +3331,7 @@
   }
 )
 
-(define_insn "aarch64_float_truncate_lo_<mode>"
+(define_insn "aarch64_float_truncate_lo_<mode><vczle><vczbe>"
   [(set (match_operand:VDF 0 "register_operand" "=w")
       (float_truncate:VDF
 	(match_operand:<VWIDE> 1 "register_operand" "w")))]
diff --git a/gcc/testsuite/gcc.target/aarch64/float_truncate_zero.c b/gcc/testsuite/gcc.target/aarch64/float_truncate_zero.c
new file mode 100644
index 000000000000..41775d164a50
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/float_truncate_zero.c
@@ -0,0 +1,32 @@
+/* { dg-do compile } */
+/* { dg-additional-options "--save-temps -O1" } */
+/* { dg-final { check-function-bodies "**" "" "" } } */
+
+#include <arm_neon.h>
+
+/*
+** foo:
+**	fcvtn	v0.4h, v0.4s
+**	ret
+*/
+
+float16x8_t
+foo (float32x4_t a)
+{
+  float16x4_t b = vcvt_f16_f32 (a);
+  return vcombine_f16 (b, vdup_n_f16 (0.0));
+}
+
+/*
+** foo_d:
+**	fcvtn	v0.2s, v0.2d
+**	ret
+*/
+
+float32x4_t
+foo_d (float64x2_t a)
+{
+  float32x2_t b = vcvt_f32_f64 (a);
+  return vcombine_f32 (b, vdup_n_f32 (0.0));
+}
+