From: Jonathan Wright Date: Mon, 8 Nov 2021 17:31:30 +0000 (+0000) Subject: aarch64: Use type-qualified builtins for PMUL[L] Neon intrinsics X-Git-Tag: basepoints/gcc-13~3151 X-Git-Url: http://git.ipfire.org/?a=commitdiff_plain;h=a2590b545ee76867f3843749e38233f2887ce3ad;p=thirdparty%2Fgcc.git aarch64: Use type-qualified builtins for PMUL[L] Neon intrinsics Declare poly type-qualified builtins and use them for PMUL[L] Neon intrinsics. This removes the need for casts in arm_neon.h. gcc/ChangeLog: 2021-11-08 Jonathan Wright * config/aarch64/aarch64-simd-builtins.def: Use poly type qualifier in builtin generator macros. * config/aarch64/arm_neon.h (vmul_p8): Use type-qualified builtin and remove casts. (vmulq_p8): Likewise. (vmull_high_p8): Likewise. (vmull_p8): Likewise. --- diff --git a/gcc/config/aarch64/aarch64-simd-builtins.def b/gcc/config/aarch64/aarch64-simd-builtins.def index c39f172513fb..4e298de5646c 100644 --- a/gcc/config/aarch64/aarch64-simd-builtins.def +++ b/gcc/config/aarch64/aarch64-simd-builtins.def @@ -45,9 +45,9 @@ BUILTIN_VDC (COMBINE, combine, 0, AUTO_FP) VAR1 (COMBINEP, combine, 0, NONE, di) - BUILTIN_VB (BINOP, pmul, 0, NONE) - VAR1 (BINOP, pmull, 0, NONE, v8qi) - VAR1 (BINOP, pmull_hi, 0, NONE, v16qi) + BUILTIN_VB (BINOPP, pmul, 0, NONE) + VAR1 (BINOPP, pmull, 0, NONE, v8qi) + VAR1 (BINOPP, pmull_hi, 0, NONE, v16qi) BUILTIN_VHSDF_HSDF (BINOP, fmulx, 0, FP) BUILTIN_VHSDF_DF (UNOP, sqrt, 2, FP) BUILTIN_VDQ_I (BINOP, addp, 0, NONE) diff --git a/gcc/config/aarch64/arm_neon.h b/gcc/config/aarch64/arm_neon.h index 538fc3cddffd..236358774abd 100644 --- a/gcc/config/aarch64/arm_neon.h +++ b/gcc/config/aarch64/arm_neon.h @@ -1007,8 +1007,7 @@ __extension__ extern __inline poly8x8_t __attribute__ ((__always_inline__, __gnu_inline__, __artificial__)) vmul_p8 (poly8x8_t __a, poly8x8_t __b) { - return (poly8x8_t) __builtin_aarch64_pmulv8qi ((int8x8_t) __a, - (int8x8_t) __b); + return __builtin_aarch64_pmulv8qi_ppp (__a, __b); } __extension__ extern __inline int8x16_t @@ -1071,8 +1070,7 @@ __extension__ extern __inline poly8x16_t __attribute__ ((__always_inline__, __gnu_inline__, __artificial__)) vmulq_p8 (poly8x16_t __a, poly8x16_t __b) { - return (poly8x16_t) __builtin_aarch64_pmulv16qi ((int8x16_t) __a, - (int8x16_t) __b); + return __builtin_aarch64_pmulv16qi_ppp (__a, __b); } __extension__ extern __inline int8x8_t @@ -7716,8 +7714,7 @@ __extension__ extern __inline poly16x8_t __attribute__ ((__always_inline__, __gnu_inline__, __artificial__)) vmull_high_p8 (poly8x16_t __a, poly8x16_t __b) { - return (poly16x8_t) __builtin_aarch64_pmull_hiv16qi ((int8x16_t) __a, - (int8x16_t) __b); + return __builtin_aarch64_pmull_hiv16qi_ppp (__a, __b); } __extension__ extern __inline int16x8_t @@ -7850,8 +7847,7 @@ __extension__ extern __inline poly16x8_t __attribute__ ((__always_inline__, __gnu_inline__, __artificial__)) vmull_p8 (poly8x8_t __a, poly8x8_t __b) { - return (poly16x8_t) __builtin_aarch64_pmullv8qi ((int8x8_t) __a, - (int8x8_t) __b); + return __builtin_aarch64_pmullv8qi_ppp (__a, __b); } __extension__ extern __inline int16x8_t