/* Function acosf vectorized with SSE4.
   Copyright (C) 2021-2024 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   https://www.gnu.org/licenses/.  */

/*
 * ALGORITHM DESCRIPTION:
 *
 *      SelMask = (|x| >= 0.5) ? 1 : 0;
 *      R = SelMask ? sqrt(0.5 - 0.5*|x|) : |x|
 *      acos(|x|) = SelMask ? 2*Poly(R) : (Pi/2 - Poly(R))
 *      acos(x) = sign(x) ? (Pi - acos(|x|)) : acos(|x|)
 *
 * Both branches are consistent with Poly(R) standing in for asin(R):
 *      |x| <  0.5:  acos(|x|) = Pi/2 - asin(|x|)
 *      |x| >= 0.5:  acos(|x|) = 2*asin(sqrt((1 - |x|)/2))
 * A negative argument is handled last through acos(-t) = Pi - acos(t).
 *
 */

/* Offsets for data table __svml_sacos_data_internal.
   The table itself is not defined in this part of the file.  Every
   offset is a multiple of 16; sqrt_coeff and poly_coeff are followed
   by larger gaps (32 and 80), presumably because each names several
   consecutive entries -- confirm against the table definition.  */
#define SgnBit 0
#define OneHalf 16
#define SmallNorm 32
#define MOne 48
#define Two 64
#define sqrt_coeff 80
#define poly_coeff 112
#define Pi2H 192
#define PiH 208

/* NOTE(review): the #include directive below carries no header name in
   this view.  It looks like the operand was lost (possibly an
   angle-bracketed name stripped during extraction) -- restore it from
   the upstream file before assembling.  */
#include

	/* Emit the code that follows into the allocatable, executable
	   section .text.sse4.  */
	.section .text.sse4, "ax", @progbits

/* Entry point of the routine.  ENTRY is a macro that is not defined in
   this view; presumably it comes from the header named on the #include
   line above -- confirm.  */
ENTRY(_ZGVbN4v_acosf_sse4)
	/* Reserve 72 bytes of stack for this routine.  */
	subq $72, %rsp
	/* Unwind info: the CFA is now 80 bytes above %rsp, i.e. the 72
	   bytes just reserved plus the 8-byte return address.  */
	cfi_def_cfa_offset(80)

	/* X