]>
Commit | Line | Data |
---|---|---|
c9bfaa1b AJ |
1 | /* |
2 | * ==================================================== | |
3 | * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved. | |
4 | * | |
5 | * Developed at SunPro, a Sun Microsystems, Inc. business. | |
6 | * Permission to use, copy, modify, and distribute this | |
7 | * software is freely granted, provided that this notice | |
8 | * is preserved. | |
9 | * ==================================================== | |
10 | */ | |
11 | ||
12 | /* | |
cc7375ce RM |
13 | Long double expansions are |
14 | Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov> | |
9cd2726c RM |
15 | and are incorporated herein by permission of the author. The author |
16 | reserves the right to distribute this material elsewhere under different | |
17 | copying permissions. These modifications are distributed here under | |
18 | the following terms: | |
cc7375ce RM |
19 | |
20 | This library is free software; you can redistribute it and/or | |
21 | modify it under the terms of the GNU Lesser General Public | |
22 | License as published by the Free Software Foundation; either | |
23 | version 2.1 of the License, or (at your option) any later version. | |
24 | ||
25 | This library is distributed in the hope that it will be useful, | |
26 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
27 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
28 | Lesser General Public License for more details. | |
29 | ||
30 | You should have received a copy of the GNU Lesser General Public | |
31 | License along with this library; if not, write to the Free Software | |
32 | Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ | |
c9bfaa1b AJ |
33 | |
34 | /* __ieee754_acosl(x) | |
35 | * Method : | |
36 | * acos(x) = pi/2 - asin(x) | |
37 | * acos(-x) = pi/2 + asin(x) | |
38 | * For |x| <= 0.375 | |
39 | * acos(x) = pi/2 - asin(x) | |
40 | * Between .375 and .5 the approximation is | |
41 | * acos(0.4375 + x) = acos(0.4375) + x P(x) / Q(x) | |
42 | * Between .5 and .625 the approximation is | |
43 | * acos(0.5625 + x) = acos(0.5625) + x rS(x) / sS(x) | |
44 | * For x > 0.625, | |
45 | * acos(x) = 2 asin(sqrt((1-x)/2)) | |
46 | * computed with an extended precision square root in the leading term. | |
47 | * For x < -0.625 | |
48 | * acos(x) = pi - 2 asin(sqrt((1-|x|)/2)) | |
49 | * | |
50 | * Special cases: | |
51 | * if x is NaN, return x itself; | |
52 | * if |x|>1, return NaN with invalid signal. | |
53 | * | |
54 | * Functions needed: __ieee754_sqrtl. | |
55 | */ | |
56 | ||
57 | #include "math.h" | |
58 | #include "math_private.h" | |
59 | ||
60 | #ifdef __STDC__ | |
61 | static const long double | |
62 | #else | |
63 | static long double | |
64 | #endif | |
65 | one = 1.0L, | |
66 | pio2_hi = 1.5707963267948966192313216916397514420986L, | |
67 | pio2_lo = 4.3359050650618905123985220130216759843812E-35L, | |
68 | ||
69 | /* acos(0.5625 + x) = acos(0.5625) + x rS(x) / sS(x) | |
70 | -0.0625 <= x <= 0.0625 | |
71 | peak relative error 3.3e-35 */ | |
72 | ||
73 | rS0 = 5.619049346208901520945464704848780243887E0L, | |
74 | rS1 = -4.460504162777731472539175700169871920352E1L, | |
75 | rS2 = 1.317669505315409261479577040530751477488E2L, | |
76 | rS3 = -1.626532582423661989632442410808596009227E2L, | |
77 | rS4 = 3.144806644195158614904369445440583873264E1L, | |
78 | rS5 = 9.806674443470740708765165604769099559553E1L, | |
79 | rS6 = -5.708468492052010816555762842394927806920E1L, | |
80 | rS7 = -1.396540499232262112248553357962639431922E1L, | |
81 | rS8 = 1.126243289311910363001762058295832610344E1L, | |
82 | rS9 = 4.956179821329901954211277873774472383512E-1L, | |
83 | rS10 = -3.313227657082367169241333738391762525780E-1L, | |
84 | ||
85 | sS0 = -4.645814742084009935700221277307007679325E0L, | |
86 | sS1 = 3.879074822457694323970438316317961918430E1L, | |
87 | sS2 = -1.221986588013474694623973554726201001066E2L, | |
88 | sS3 = 1.658821150347718105012079876756201905822E2L, | |
89 | sS4 = -4.804379630977558197953176474426239748977E1L, | |
90 | sS5 = -1.004296417397316948114344573811562952793E2L, | |
91 | sS6 = 7.530281592861320234941101403870010111138E1L, | |
92 | sS7 = 1.270735595411673647119592092304357226607E1L, | |
93 | sS8 = -1.815144839646376500705105967064792930282E1L, | |
94 | sS9 = -7.821597334910963922204235247786840828217E-2L, | |
95 | /* 1.000000000000000000000000000000000000000E0 */ | |
96 | ||
97 | acosr5625 = 9.7338991014954640492751132535550279812151E-1L, | |
98 | pimacosr5625 = 2.1682027434402468335351320579240000860757E0L, | |
99 | ||
100 | /* acos(0.4375 + x) = acos(0.4375) + x rS(x) / sS(x) | |
101 | -0.0625 <= x <= 0.0625 | |
102 | peak relative error 2.1e-35 */ | |
103 | ||
104 | P0 = 2.177690192235413635229046633751390484892E0L, | |
105 | P1 = -2.848698225706605746657192566166142909573E1L, | |
106 | P2 = 1.040076477655245590871244795403659880304E2L, | |
107 | P3 = -1.400087608918906358323551402881238180553E2L, | |
108 | P4 = 2.221047917671449176051896400503615543757E1L, | |
109 | P5 = 9.643714856395587663736110523917499638702E1L, | |
110 | P6 = -5.158406639829833829027457284942389079196E1L, | |
111 | P7 = -1.578651828337585944715290382181219741813E1L, | |
112 | P8 = 1.093632715903802870546857764647931045906E1L, | |
113 | P9 = 5.448925479898460003048760932274085300103E-1L, | |
114 | P10 = -3.315886001095605268470690485170092986337E-1L, | |
115 | Q0 = -1.958219113487162405143608843774587557016E0L, | |
116 | Q1 = 2.614577866876185080678907676023269360520E1L, | |
117 | Q2 = -9.990858606464150981009763389881793660938E1L, | |
118 | Q3 = 1.443958741356995763628660823395334281596E2L, | |
119 | Q4 = -3.206441012484232867657763518369723873129E1L, | |
120 | Q5 = -1.048560885341833443564920145642588991492E2L, | |
121 | Q6 = 6.745883931909770880159915641984874746358E1L, | |
122 | Q7 = 1.806809656342804436118449982647641392951E1L, | |
123 | Q8 = -1.770150690652438294290020775359580915464E1L, | |
124 | Q9 = -5.659156469628629327045433069052560211164E-1L, | |
125 | /* 1.000000000000000000000000000000000000000E0 */ | |
126 | ||
127 | acosr4375 = 1.1179797320499710475919903296900511518755E0L, | |
128 | pimacosr4375 = 2.0236129215398221908706530535894517323217E0L, | |
129 | ||
130 | /* asin(x) = x + x^3 pS(x^2) / qS(x^2) | |
131 | 0 <= x <= 0.5 | |
132 | peak relative error 1.9e-35 */ | |
133 | pS0 = -8.358099012470680544198472400254596543711E2L, | |
134 | pS1 = 3.674973957689619490312782828051860366493E3L, | |
135 | pS2 = -6.730729094812979665807581609853656623219E3L, | |
136 | pS3 = 6.643843795209060298375552684423454077633E3L, | |
137 | pS4 = -3.817341990928606692235481812252049415993E3L, | |
138 | pS5 = 1.284635388402653715636722822195716476156E3L, | |
139 | pS6 = -2.410736125231549204856567737329112037867E2L, | |
140 | pS7 = 2.219191969382402856557594215833622156220E1L, | |
141 | pS8 = -7.249056260830627156600112195061001036533E-1L, | |
142 | pS9 = 1.055923570937755300061509030361395604448E-3L, | |
143 | ||
144 | qS0 = -5.014859407482408326519083440151745519205E3L, | |
145 | qS1 = 2.430653047950480068881028451580393430537E4L, | |
146 | qS2 = -4.997904737193653607449250593976069726962E4L, | |
147 | qS3 = 5.675712336110456923807959930107347511086E4L, | |
148 | qS4 = -3.881523118339661268482937768522572588022E4L, | |
149 | qS5 = 1.634202194895541569749717032234510811216E4L, | |
150 | qS6 = -4.151452662440709301601820849901296953752E3L, | |
151 | qS7 = 5.956050864057192019085175976175695342168E2L, | |
152 | qS8 = -4.175375777334867025769346564600396877176E1L; | |
153 | /* 1.000000000000000000000000000000000000000E0 */ | |
154 | ||
155 | #ifdef __STDC__ | |
156 | long double | |
157 | __ieee754_acosl (long double x) | |
158 | #else | |
159 | long double | |
160 | __ieee754_acosl (x) | |
161 | long double x; | |
162 | #endif | |
163 | { | |
164 | long double z, r, w, p, q, s, t, f2; | |
165 | int32_t ix, sign; | |
166 | ieee854_long_double_shape_type u; | |
167 | ||
168 | u.value = x; | |
169 | sign = u.parts32.w0; | |
170 | ix = sign & 0x7fffffff; | |
171 | u.parts32.w0 = ix; /* |x| */ | |
172 | if (ix >= 0x3fff0000) /* |x| >= 1 */ | |
173 | { | |
174 | if (ix == 0x3fff0000 | |
175 | && (u.parts32.w1 | u.parts32.w2 | u.parts32.w3) == 0) | |
176 | { /* |x| == 1 */ | |
0e2bd6fd | 177 | if ((sign & 0x80000000) == 0) |
c9bfaa1b AJ |
178 | return 0.0; /* acos(1) = 0 */ |
179 | else | |
180 | return (2.0 * pio2_hi) + (2.0 * pio2_lo); /* acos(-1)= pi */ | |
181 | } | |
182 | return (x - x) / (x - x); /* acos(|x| > 1) is NaN */ | |
183 | } | |
184 | else if (ix < 0x3ffe0000) /* |x| < 0.5 */ | |
185 | { | |
186 | if (ix < 0x3fc60000) /* |x| < 2**-57 */ | |
187 | return pio2_hi + pio2_lo; | |
188 | if (ix < 0x3ffde000) /* |x| < .4375 */ | |
189 | { | |
190 | /* Arcsine of x. */ | |
191 | z = x * x; | |
192 | p = (((((((((pS9 * z | |
193 | + pS8) * z | |
194 | + pS7) * z | |
195 | + pS6) * z | |
196 | + pS5) * z | |
197 | + pS4) * z | |
198 | + pS3) * z | |
199 | + pS2) * z | |
200 | + pS1) * z | |
201 | + pS0) * z; | |
202 | q = (((((((( z | |
203 | + qS8) * z | |
204 | + qS7) * z | |
205 | + qS6) * z | |
206 | + qS5) * z | |
207 | + qS4) * z | |
208 | + qS3) * z | |
209 | + qS2) * z | |
210 | + qS1) * z | |
211 | + qS0; | |
212 | r = x + x * p / q; | |
213 | z = pio2_hi - (r - pio2_lo); | |
214 | return z; | |
215 | } | |
216 | /* .4375 <= |x| < .5 */ | |
217 | t = u.value - 0.4375L; | |
218 | p = ((((((((((P10 * t | |
219 | + P9) * t | |
220 | + P8) * t | |
221 | + P7) * t | |
222 | + P6) * t | |
223 | + P5) * t | |
224 | + P4) * t | |
225 | + P3) * t | |
226 | + P2) * t | |
227 | + P1) * t | |
228 | + P0) * t; | |
229 | ||
230 | q = (((((((((t | |
231 | + Q9) * t | |
232 | + Q8) * t | |
233 | + Q7) * t | |
234 | + Q6) * t | |
235 | + Q5) * t | |
236 | + Q4) * t | |
237 | + Q3) * t | |
238 | + Q2) * t | |
239 | + Q1) * t | |
240 | + Q0; | |
241 | r = p / q; | |
242 | if (sign & 0x80000000) | |
243 | r = pimacosr4375 - r; | |
244 | else | |
245 | r = acosr4375 + r; | |
246 | return r; | |
247 | } | |
248 | else if (ix < 0x3ffe4000) /* |x| < 0.625 */ | |
249 | { | |
250 | t = u.value - 0.5625L; | |
251 | p = ((((((((((rS10 * t | |
252 | + rS9) * t | |
253 | + rS8) * t | |
254 | + rS7) * t | |
255 | + rS6) * t | |
256 | + rS5) * t | |
257 | + rS4) * t | |
258 | + rS3) * t | |
259 | + rS2) * t | |
260 | + rS1) * t | |
261 | + rS0) * t; | |
262 | ||
263 | q = (((((((((t | |
264 | + sS9) * t | |
265 | + sS8) * t | |
266 | + sS7) * t | |
267 | + sS6) * t | |
268 | + sS5) * t | |
269 | + sS4) * t | |
270 | + sS3) * t | |
271 | + sS2) * t | |
272 | + sS1) * t | |
273 | + sS0; | |
274 | if (sign & 0x80000000) | |
275 | r = pimacosr5625 - p / q; | |
276 | else | |
277 | r = acosr5625 + p / q; | |
278 | return r; | |
279 | } | |
280 | else | |
281 | { /* |x| >= .625 */ | |
282 | z = (one - u.value) * 0.5; | |
283 | s = __ieee754_sqrtl (z); | |
284 | /* Compute an extended precision square root from | |
285 | the Newton iteration s -> 0.5 * (s + z / s). | |
286 | The change w from s to the improved value is | |
287 | w = 0.5 * (s + z / s) - s = (s^2 + z)/2s - s = (z - s^2)/2s. | |
288 | Express s = f1 + f2 where f1 * f1 is exactly representable. | |
289 | w = (z - s^2)/2s = (z - f1^2 - 2 f1 f2 - f2^2)/2s . | |
290 | s + w has extended precision. */ | |
291 | u.value = s; | |
292 | u.parts32.w2 = 0; | |
293 | u.parts32.w3 = 0; | |
294 | f2 = s - u.value; | |
295 | w = z - u.value * u.value; | |
296 | w = w - 2.0 * u.value * f2; | |
297 | w = w - f2 * f2; | |
298 | w = w / (2.0 * s); | |
299 | /* Arcsine of s. */ | |
300 | p = (((((((((pS9 * z | |
301 | + pS8) * z | |
302 | + pS7) * z | |
303 | + pS6) * z | |
304 | + pS5) * z | |
305 | + pS4) * z | |
306 | + pS3) * z | |
307 | + pS2) * z | |
308 | + pS1) * z | |
309 | + pS0) * z; | |
310 | q = (((((((( z | |
311 | + qS8) * z | |
312 | + qS7) * z | |
313 | + qS6) * z | |
314 | + qS5) * z | |
315 | + qS4) * z | |
316 | + qS3) * z | |
317 | + qS2) * z | |
318 | + qS1) * z | |
319 | + qS0; | |
320 | r = s + (w + s * p / q); | |
321 | ||
322 | if (sign & 0x80000000) | |
323 | w = pio2_hi + (pio2_lo - r); | |
324 | else | |
325 | w = r; | |
326 | return 2.0 * w; | |
327 | } | |
328 | } |