Aarch64: Add simd exp/expf ABI symbols

author Szabolcs Nagy <szabolcs.nagy@arm.com>

Fri, 28 Jun 2019 10:29:19 +0000 (11:29 +0100)

committer Szabolcs Nagy <szabolcs.nagy@arm.com>

Tue, 16 Jul 2019 10:01:46 +0000 (11:01 +0100)
author Szabolcs Nagy <szabolcs.nagy@arm.com>
Fri, 28 Jun 2019 10:29:19 +0000 (11:29 +0100)
committer Szabolcs Nagy <szabolcs.nagy@arm.com>
Tue, 16 Jul 2019 10:01:46 +0000 (11:01 +0100)
diff --git a/sysdeps/aarch64/configure b/sysdeps/aarch64/configure

index 5bd355a6917df365a71b2518b5d5590444463cd6..df15cdb02aa4dbd4a65353e1aca500d1f7f00aba 100644 (file)
--- a/sysdeps/aarch64/configure
+++ b/sysdeps/aarch64/configure
@@ -172,3 +172,34 @@ else
    config_vars="$config_vars
  default-abi = lp64"
  fi
+
+{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for pcs attribute support" >&5
+$as_echo_n "checking for pcs attribute support... " >&6; }
+if ${libc_cv_gcc_pcs_attribute+:} false; then :
+  $as_echo_n "(cached) " >&6
+else
+  cat > conftest.c <<EOF
+__attribute__((aarch64_vector_pcs)) extern void foo (void);
+EOF
+libc_cv_gcc_pcs_attribute=no
+if ${CC-cc} -c -Wall -Werror conftest.c -o conftest.o 1>&5 \
+   2>&5 ; then
+  libc_cv_gcc_pcs_attribute=yes
+fi
+rm -f conftest*
+fi
+{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $libc_cv_gcc_pcs_attribute" >&5
+$as_echo "$libc_cv_gcc_pcs_attribute" >&6; }
+
+# Enable libmvec by default.
+if test x"$build_mathvec" = xnotset; then
+  build_mathvec=yes
+fi
+
+# Only test libmvec if the compiler supports aarch64_vector_pcs.
+if test x"$build_mathvec" = xyes; then
+  if test $libc_cv_gcc_pcs_attribute = yes; then
+    config_vars="$config_vars
+test-mathvec = yes"
+  fi
+fi
diff --git a/sysdeps/aarch64/configure.ac b/sysdeps/aarch64/configure.ac

index 7851dd4dac345b2aab7d29e33d1b63051a66b2f4..eab411cad4c975b7d1eb529cbeee3e4a62f8c4ac 100644 (file)
--- a/sysdeps/aarch64/configure.ac
+++ b/sysdeps/aarch64/configure.ac
@@ -20,3 +20,27 @@ if test $libc_cv_aarch64_be = yes; then
  else
    LIBC_CONFIG_VAR([default-abi], [lp64])
  fi
+
+AC_CACHE_CHECK([for pcs attribute support],
+               libc_cv_gcc_pcs_attribute, [dnl
+cat > conftest.c <<EOF
+__attribute__((aarch64_vector_pcs)) extern void foo (void);
+EOF
+libc_cv_gcc_pcs_attribute=no
+if ${CC-cc} -c -Wall -Werror conftest.c -o conftest.o 1>&AS_MESSAGE_LOG_FD \
+   2>&AS_MESSAGE_LOG_FD ; then
+  libc_cv_gcc_pcs_attribute=yes
+fi
+rm -f conftest*])
+
+# Enable libmvec by default.
+if test x"$build_mathvec" = xnotset; then
+  build_mathvec=yes
+fi
+
+# Only test libmvec if the compiler supports aarch64_vector_pcs.
+if test x"$build_mathvec" = xyes; then
+  if test $libc_cv_gcc_pcs_attribute = yes; then
+    LIBC_CONFIG_VAR([test-mathvec], [yes])
+  fi
+fi
diff --git a/sysdeps/aarch64/fpu/Makefile b/sysdeps/aarch64/fpu/Makefile

index 4a182bd6d6886387816e97128524957504e37595..2841c03c14311ec5bb5f9b1546851951857c14ee 100644 (file)
--- a/sysdeps/aarch64/fpu/Makefile
+++ b/sysdeps/aarch64/fpu/Makefile
@@ -12,3 +12,22 @@ CFLAGS-s_fmaxf.c += -ffinite-math-only
  CFLAGS-s_fmin.c += -ffinite-math-only
  CFLAGS-s_fminf.c += -ffinite-math-only
  endif
+
+ifeq ($(subdir),mathvec)
+libmvec-support += \
+  libmvec_double_vlen2_exp \
+  libmvec_float_vlen4_expf \
+
+install-lib += libmvec_nonshared.a
+$(objpfx)libmvec_nonshared.a: $(dep-dummy-lib); $(make-dummy-lib)
+endif
+
+ifeq ($(subdir),math)
+ifeq ($(build-mathvec),yes)
+double-vlen2-funcs = exp
+float-vlen4-funcs = exp
+ifeq ($(test-mathvec),yes)
+libmvec-tests += double-vlen2 float-vlen4
+endif
+endif
+endif
diff --git a/sysdeps/aarch64/fpu/Versions b/sysdeps/aarch64/fpu/Versions

new file mode 100644 (file)

index 0000000..da36f3c
--- /dev/null
+++ b/sysdeps/aarch64/fpu/Versions
@@ -0,0 +1,5 @@
+libmvec {
+  GLIBC_2.30 {
+    _ZGVnN2v_exp; _ZGVnN4v_expf;
+  }
+}
diff --git a/sysdeps/aarch64/fpu/libmvec_double_vlen2.h b/sysdeps/aarch64/fpu/libmvec_double_vlen2.h

new file mode 100644 (file)

index 0000000..383980d
--- /dev/null
+++ b/sysdeps/aarch64/fpu/libmvec_double_vlen2.h
@@ -0,0 +1,59 @@
+/* Double-precision 2 element vector function template.
+   Copyright (C) 2019 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <http://www.gnu.org/licenses/>.  */
+
+#include <sysdep.h>
+
+ENTRY (VECTOR_FUNCTION)
+       stp     x29, x30, [sp, -288]!
+       cfi_adjust_cfa_offset (288)
+       cfi_rel_offset (x29, 0)
+       cfi_rel_offset (x30, 8)
+       mov     x29, sp
+       stp      q8,  q9, [sp, 16]
+       stp     q10, q11, [sp, 48]
+       stp     q12, q13, [sp, 80]
+       stp     q14, q15, [sp, 112]
+       stp     q16, q17, [sp, 144]
+       stp     q18, q19, [sp, 176]
+       stp     q20, q21, [sp, 208]
+       stp     q22, q23, [sp, 240]
+
+       // Use per lane load/store to avoid endianness issues.
+       str     q0, [sp, 272]
+       ldr     d0, [sp, 272]
+       bl SCALAR_FUNCTION
+       str     d0, [sp, 272]
+       ldr     d0, [sp, 280]
+       bl SCALAR_FUNCTION
+       str     d0, [sp, 280]
+       ldr     q0, [sp, 272]
+
+       ldp     q8, q9, [sp, 16]
+       ldp     q10, q11, [sp, 48]
+       ldp     q12, q13, [sp, 80]
+       ldp     q14, q15, [sp, 112]
+       ldp     q16, q17, [sp, 144]
+       ldp     q18, q19, [sp, 176]
+       ldp     q20, q21, [sp, 208]
+       ldp     q22, q23, [sp, 240]
+       ldp     x29, x30, [sp], 288
+       cfi_adjust_cfa_offset (288)
+       cfi_restore (x29)
+       cfi_restore (x30)
+       ret
+END (VECTOR_FUNCTION)
diff --git a/sysdeps/aarch64/fpu/libmvec_double_vlen2_exp.S b/sysdeps/aarch64/fpu/libmvec_double_vlen2_exp.S

new file mode 100644 (file)

index 0000000..644405c
--- /dev/null
+++ b/sysdeps/aarch64/fpu/libmvec_double_vlen2_exp.S
@@ -0,0 +1,21 @@
+/* Double-precision 2 element vector e^x function.
+   Copyright (C) 2019 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <http://www.gnu.org/licenses/>.  */
+
+#define SCALAR_FUNCTION exp
+#define VECTOR_FUNCTION _ZGVnN2v_exp
+#include "libmvec_double_vlen2.h"
diff --git a/sysdeps/aarch64/fpu/libmvec_float_vlen4.h b/sysdeps/aarch64/fpu/libmvec_float_vlen4.h

new file mode 100644 (file)

index 0000000..2450309
--- /dev/null
+++ b/sysdeps/aarch64/fpu/libmvec_float_vlen4.h
@@ -0,0 +1,65 @@
+/* Single-precision 4 element vector function template.
+   Copyright (C) 2019 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <http://www.gnu.org/licenses/>.  */
+
+#include <sysdep.h>
+
+ENTRY (VECTOR_FUNCTION)
+       stp     x29, x30, [sp, -288]!
+       cfi_adjust_cfa_offset (288)
+       cfi_rel_offset (x29, 0)
+       cfi_rel_offset (x30, 8)
+       mov     x29, sp
+       stp      q8,  q9, [sp, 16]
+       stp     q10, q11, [sp, 48]
+       stp     q12, q13, [sp, 80]
+       stp     q14, q15, [sp, 112]
+       stp     q16, q17, [sp, 144]
+       stp     q18, q19, [sp, 176]
+       stp     q20, q21, [sp, 208]
+       stp     q22, q23, [sp, 240]
+
+       // Use per lane load/store to avoid endianness issues.
+       str     q0, [sp, 272]
+       ldr     s0, [sp, 272]
+       bl SCALAR_FUNCTION
+       str     s0, [sp, 272]
+       ldr     s0, [sp, 276]
+       bl SCALAR_FUNCTION
+       str     s0, [sp, 276]
+       ldr     s0, [sp, 280]
+       bl SCALAR_FUNCTION
+       str     s0, [sp, 280]
+       ldr     s0, [sp, 284]
+       bl SCALAR_FUNCTION
+       str     s0, [sp, 284]
+       ldr     q0, [sp, 272]
+
+       ldp     q8, q9, [sp, 16]
+       ldp     q10, q11, [sp, 48]
+       ldp     q12, q13, [sp, 80]
+       ldp     q14, q15, [sp, 112]
+       ldp     q16, q17, [sp, 144]
+       ldp     q18, q19, [sp, 176]
+       ldp     q20, q21, [sp, 208]
+       ldp     q22, q23, [sp, 240]
+       ldp     x29, x30, [sp], 288
+       cfi_adjust_cfa_offset (288)
+       cfi_restore (x29)
+       cfi_restore (x30)
+       ret
+END (VECTOR_FUNCTION)
diff --git a/sysdeps/aarch64/fpu/libmvec_float_vlen4_expf.S b/sysdeps/aarch64/fpu/libmvec_float_vlen4_expf.S

new file mode 100644 (file)

index 0000000..ab76ea0
--- /dev/null
+++ b/sysdeps/aarch64/fpu/libmvec_float_vlen4_expf.S
@@ -0,0 +1,21 @@
+/* Single-precision 4 element vector e^x function.
+   Copyright (C) 2019 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <http://www.gnu.org/licenses/>.  */
+
+#define SCALAR_FUNCTION expf
+#define VECTOR_FUNCTION _ZGVnN4v_expf
+#include "libmvec_float_vlen4.h"
diff --git a/sysdeps/aarch64/fpu/test-double-vlen2-wrappers.c b/sysdeps/aarch64/fpu/test-double-vlen2-wrappers.c

new file mode 100644 (file)

index 0000000..6c6c44d
--- /dev/null
+++ b/sysdeps/aarch64/fpu/test-double-vlen2-wrappers.c
@@ -0,0 +1,28 @@
+/* Wrapper part of tests for aarch64 double vector math functions.
+   Copyright (C) 2019 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <http://www.gnu.org/licenses/>.  */
+
+#include <arm_neon.h>
+#include "test-double-vlen2.h"
+
+#define VEC_TYPE float64x2_t
+
+/* Hack: VECTOR_WRAPPER declares the vector function without the pcs attribute,
+   placing it here happens to work, should be fixed in test-math-vector.h.  */
+__attribute__ ((aarch64_vector_pcs))
+
+VECTOR_WRAPPER (WRAPPER_NAME (exp), _ZGVnN2v_exp)
diff --git a/sysdeps/aarch64/fpu/test-float-vlen4-wrappers.c b/sysdeps/aarch64/fpu/test-float-vlen4-wrappers.c

new file mode 100644 (file)

index 0000000..5117633
--- /dev/null
+++ b/sysdeps/aarch64/fpu/test-float-vlen4-wrappers.c
@@ -0,0 +1,28 @@
+/* Wrapper part of tests for float aarch64 vector math functions.
+   Copyright (C) 2019 Free Software Foundation, Inc.
+   This file is part of the GNU C Library.
+
+   The GNU C Library is free software; you can redistribute it and/or
+   modify it under the terms of the GNU Lesser General Public
+   License as published by the Free Software Foundation; either
+   version 2.1 of the License, or (at your option) any later version.
+
+   The GNU C Library is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public
+   License along with the GNU C Library; if not, see
+   <http://www.gnu.org/licenses/>.  */
+
+#include <arm_neon.h>
+#include "test-float-vlen4.h"
+
+#define VEC_TYPE float32x4_t
+
+/* Hack: VECTOR_WRAPPER declares the vector function without the pcs attribute,
+   placing it here happens to work, should be fixed in test-math-vector.h.  */
+__attribute__ ((aarch64_vector_pcs))
+
+VECTOR_WRAPPER (WRAPPER_NAME (expf), _ZGVnN4v_expf)
diff --git a/sysdeps/aarch64/libm-test-ulps b/sysdeps/aarch64/libm-test-ulps

index 585e5bbce7a537c2543e9f1563b46d9ca359c53f..1ed4af9e552ac07f9f5e0fd855417edd3e55caef 100644 (file)
--- a/sysdeps/aarch64/libm-test-ulps
+++ b/sysdeps/aarch64/libm-test-ulps
@@ -1601,6 +1601,12 @@ float: 1
  idouble: 1
  ifloat: 1
  
+Function: "exp_vlen2":
+double: 1
+
+Function: "exp_vlen4":
+float: 1
+
  Function: "expm1":
  double: 1
  float: 1
diff --git a/sysdeps/unix/sysv/linux/aarch64/libmvec.abilist b/sysdeps/unix/sysv/linux/aarch64/libmvec.abilist

new file mode 100644 (file)

index 0000000..9e17825
--- /dev/null
+++ b/sysdeps/unix/sysv/linux/aarch64/libmvec.abilist
@@ -0,0 +1,2 @@
+GLIBC_2.30 _ZGVnN2v_exp F
+GLIBC_2.30 _ZGVnN4v_expf F
author	Szabolcs Nagy <szabolcs.nagy@arm.com>
	Fri, 28 Jun 2019 10:29:19 +0000 (11:29 +0100)
committer	Szabolcs Nagy <szabolcs.nagy@arm.com>
	Tue, 16 Jul 2019 10:01:46 +0000 (11:01 +0100)
sysdeps/aarch64/configure		patch \| blob \| blame \| history
sysdeps/aarch64/configure.ac		patch \| blob \| blame \| history
sysdeps/aarch64/fpu/Makefile		patch \| blob \| blame \| history
sysdeps/aarch64/fpu/Versions	[new file with mode: 0644]	patch \| blob
sysdeps/aarch64/fpu/libmvec_double_vlen2.h	[new file with mode: 0644]	patch \| blob
sysdeps/aarch64/fpu/libmvec_double_vlen2_exp.S	[new file with mode: 0644]	patch \| blob
sysdeps/aarch64/fpu/libmvec_float_vlen4.h	[new file with mode: 0644]	patch \| blob
sysdeps/aarch64/fpu/libmvec_float_vlen4_expf.S	[new file with mode: 0644]	patch \| blob
sysdeps/aarch64/fpu/test-double-vlen2-wrappers.c	[new file with mode: 0644]	patch \| blob
sysdeps/aarch64/fpu/test-float-vlen4-wrappers.c	[new file with mode: 0644]	patch \| blob
sysdeps/aarch64/libm-test-ulps		patch \| blob \| blame \| history
sysdeps/unix/sysv/linux/aarch64/libmvec.abilist	[new file with mode: 0644]	patch \| blob