More strict check of AVX512 support in assembler.
[glibc.git] / sysdeps / ieee754 / ldbl-96 / e_jnl.c
bloba6668089dd52c4ad21185ba793406cfbc790d9bc
1 /*
2 * ====================================================
3 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
5 * Developed at SunPro, a Sun Microsystems, Inc. business.
6 * Permission to use, copy, modify, and distribute this
7 * software is freely granted, provided that this notice
8 * is preserved.
9 * ====================================================
12 /* Modifications for long double are
13 Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov>
14 and are incorporated herein by permission of the author. The author
15 reserves the right to distribute this material elsewhere under different
16 copying permissions. These modifications are distributed here under
17 the following terms:
19 This library is free software; you can redistribute it and/or
20 modify it under the terms of the GNU Lesser General Public
21 License as published by the Free Software Foundation; either
22 version 2.1 of the License, or (at your option) any later version.
24 This library is distributed in the hope that it will be useful,
25 but WITHOUT ANY WARRANTY; without even the implied warranty of
26 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
27 Lesser General Public License for more details.
29 You should have received a copy of the GNU Lesser General Public
30 License along with this library; if not, see
31 <http://www.gnu.org/licenses/>. */
34 * __ieee754_jn(n, x), __ieee754_yn(n, x)
35 * floating point Bessel's function of the 1st and 2nd kind
36 * of order n
38 * Special cases:
39 * y0(0)=y1(0)=yn(n,0) = -inf with overflow signal;
40 * y0(-ve)=y1(-ve)=yn(n,-ve) are NaN with invalid signal.
41 * Note 2. About jn(n,x), yn(n,x)
42 * For n=0, j0(x) is called,
43 * for n=1, j1(x) is called,
44 * for n<x, forward recursion us used starting
45 * from values of j0(x) and j1(x).
46 * for n>x, a continued fraction approximation to
47 * j(n,x)/j(n-1,x) is evaluated and then backward
48 * recursion is used starting from a supposed value
49 * for j(n,x). The resulting value of j(0,x) is
50 * compared with the actual value to correct the
51 * supposed value of j(n,x).
53 * yn(n,x) is similar in all respects, except
54 * that forward recursion is used for all
55 * values of n>1.
59 #include <errno.h>
60 #include <float.h>
61 #include <math.h>
62 #include <math_private.h>
64 static const long double
65 invsqrtpi = 5.64189583547756286948079e-1L, two = 2.0e0L, one = 1.0e0L;
67 static const long double zero = 0.0L;
69 long double
70 __ieee754_jnl (int n, long double x)
72 u_int32_t se, i0, i1;
73 int32_t i, ix, sgn;
74 long double a, b, temp, di;
75 long double z, w;
77 /* J(-n,x) = (-1)^n * J(n, x), J(n, -x) = (-1)^n * J(n, x)
78 * Thus, J(-n,x) = J(n,-x)
81 GET_LDOUBLE_WORDS (se, i0, i1, x);
82 ix = se & 0x7fff;
84 /* if J(n,NaN) is NaN */
85 if (__glibc_unlikely ((ix == 0x7fff) && ((i0 & 0x7fffffff) != 0)))
86 return x + x;
87 if (n < 0)
89 n = -n;
90 x = -x;
91 se ^= 0x8000;
93 if (n == 0)
94 return (__ieee754_j0l (x));
95 if (n == 1)
96 return (__ieee754_j1l (x));
97 sgn = (n & 1) & (se >> 15); /* even n -- 0, odd n -- sign(x) */
98 x = fabsl (x);
99 if (__glibc_unlikely ((ix | i0 | i1) == 0 || ix >= 0x7fff))
100 /* if x is 0 or inf */
101 b = zero;
102 else if ((long double) n <= x)
104 /* Safe to use J(n+1,x)=2n/x *J(n,x)-J(n-1,x) */
105 if (ix >= 0x412D)
106 { /* x > 2**302 */
108 /* ??? This might be a futile gesture.
109 If x exceeds X_TLOSS anyway, the wrapper function
110 will set the result to zero. */
112 /* (x >> n**2)
113 * Jn(x) = cos(x-(2n+1)*pi/4)*sqrt(2/x*pi)
114 * Yn(x) = sin(x-(2n+1)*pi/4)*sqrt(2/x*pi)
115 * Let s=sin(x), c=cos(x),
116 * xn=x-(2n+1)*pi/4, sqt2 = sqrt(2),then
118 * n sin(xn)*sqt2 cos(xn)*sqt2
119 * ----------------------------------
120 * 0 s-c c+s
121 * 1 -s-c -c+s
122 * 2 -s+c -c-s
123 * 3 s+c c-s
125 long double s;
126 long double c;
127 __sincosl (x, &s, &c);
128 switch (n & 3)
130 case 0:
131 temp = c + s;
132 break;
133 case 1:
134 temp = -c + s;
135 break;
136 case 2:
137 temp = -c - s;
138 break;
139 case 3:
140 temp = c - s;
141 break;
143 b = invsqrtpi * temp / __ieee754_sqrtl (x);
145 else
147 a = __ieee754_j0l (x);
148 b = __ieee754_j1l (x);
149 for (i = 1; i < n; i++)
151 temp = b;
152 b = b * ((long double) (i + i) / x) - a; /* avoid underflow */
153 a = temp;
157 else
159 if (ix < 0x3fde)
160 { /* x < 2**-33 */
161 /* x is tiny, return the first Taylor expansion of J(n,x)
162 * J(n,x) = 1/n!*(x/2)^n - ...
164 if (n >= 400) /* underflow, result < 10^-4952 */
165 b = zero;
166 else
168 temp = x * 0.5;
169 b = temp;
170 for (a = one, i = 2; i <= n; i++)
172 a *= (long double) i; /* a = n! */
173 b *= temp; /* b = (x/2)^n */
175 b = b / a;
178 else
180 /* use backward recurrence */
181 /* x x^2 x^2
182 * J(n,x)/J(n-1,x) = ---- ------ ------ .....
183 * 2n - 2(n+1) - 2(n+2)
185 * 1 1 1
186 * (for large x) = ---- ------ ------ .....
187 * 2n 2(n+1) 2(n+2)
188 * -- - ------ - ------ -
189 * x x x
191 * Let w = 2n/x and h=2/x, then the above quotient
192 * is equal to the continued fraction:
194 * = -----------------------
196 * w - -----------------
198 * w+h - ---------
199 * w+2h - ...
201 * To determine how many terms needed, let
202 * Q(0) = w, Q(1) = w(w+h) - 1,
203 * Q(k) = (w+k*h)*Q(k-1) - Q(k-2),
204 * When Q(k) > 1e4 good for single
205 * When Q(k) > 1e9 good for double
206 * When Q(k) > 1e17 good for quadruple
208 /* determine k */
209 long double t, v;
210 long double q0, q1, h, tmp;
211 int32_t k, m;
212 w = (n + n) / (long double) x;
213 h = 2.0L / (long double) x;
214 q0 = w;
215 z = w + h;
216 q1 = w * z - 1.0L;
217 k = 1;
218 while (q1 < 1.0e11L)
220 k += 1;
221 z += h;
222 tmp = z * q1 - q0;
223 q0 = q1;
224 q1 = tmp;
226 m = n + n;
227 for (t = zero, i = 2 * (n + k); i >= m; i -= 2)
228 t = one / (i / x - t);
229 a = t;
230 b = one;
231 /* estimate log((2/x)^n*n!) = n*log(2/x)+n*ln(n)
232 * Hence, if n*(log(2n/x)) > ...
233 * single 8.8722839355e+01
234 * double 7.09782712893383973096e+02
235 * long double 1.1356523406294143949491931077970765006170e+04
236 * then recurrent value may overflow and the result is
237 * likely underflow to zero
239 tmp = n;
240 v = two / x;
241 tmp = tmp * __ieee754_logl (fabsl (v * tmp));
243 if (tmp < 1.1356523406294143949491931077970765006170e+04L)
245 for (i = n - 1, di = (long double) (i + i); i > 0; i--)
247 temp = b;
248 b *= di;
249 b = b / x - a;
250 a = temp;
251 di -= two;
254 else
256 for (i = n - 1, di = (long double) (i + i); i > 0; i--)
258 temp = b;
259 b *= di;
260 b = b / x - a;
261 a = temp;
262 di -= two;
263 /* scale b to avoid spurious overflow */
264 if (b > 1e100L)
266 a /= b;
267 t /= b;
268 b = one;
272 /* j0() and j1() suffer enormous loss of precision at and
273 * near zero; however, we know that their zero points never
274 * coincide, so just choose the one further away from zero.
276 z = __ieee754_j0l (x);
277 w = __ieee754_j1l (x);
278 if (fabsl (z) >= fabsl (w))
279 b = (t * z / b);
280 else
281 b = (t * w / a);
284 if (sgn == 1)
285 return -b;
286 else
287 return b;
289 strong_alias (__ieee754_jnl, __jnl_finite)
291 long double
292 __ieee754_ynl (int n, long double x)
294 u_int32_t se, i0, i1;
295 int32_t i, ix;
296 int32_t sign;
297 long double a, b, temp, ret;
300 GET_LDOUBLE_WORDS (se, i0, i1, x);
301 ix = se & 0x7fff;
302 /* if Y(n,NaN) is NaN */
303 if (__builtin_expect ((ix == 0x7fff) && ((i0 & 0x7fffffff) != 0), 0))
304 return x + x;
305 if (__builtin_expect ((ix | i0 | i1) == 0, 0))
306 /* -inf or inf and divide-by-zero exception. */
307 return ((n < 0 && (n & 1) != 0) ? 1.0L : -1.0L) / 0.0L;
308 if (__builtin_expect (se & 0x8000, 0))
309 return zero / (zero * x);
310 sign = 1;
311 if (n < 0)
313 n = -n;
314 sign = 1 - ((n & 1) << 1);
316 if (n == 0)
317 return (__ieee754_y0l (x));
319 SET_RESTORE_ROUNDL (FE_TONEAREST);
320 if (n == 1)
322 ret = sign * __ieee754_y1l (x);
323 goto out;
325 if (__glibc_unlikely (ix == 0x7fff))
326 return zero;
327 if (ix >= 0x412D)
328 { /* x > 2**302 */
330 /* ??? See comment above on the possible futility of this. */
332 /* (x >> n**2)
333 * Jn(x) = cos(x-(2n+1)*pi/4)*sqrt(2/x*pi)
334 * Yn(x) = sin(x-(2n+1)*pi/4)*sqrt(2/x*pi)
335 * Let s=sin(x), c=cos(x),
336 * xn=x-(2n+1)*pi/4, sqt2 = sqrt(2),then
338 * n sin(xn)*sqt2 cos(xn)*sqt2
339 * ----------------------------------
340 * 0 s-c c+s
341 * 1 -s-c -c+s
342 * 2 -s+c -c-s
343 * 3 s+c c-s
345 long double s;
346 long double c;
347 __sincosl (x, &s, &c);
348 switch (n & 3)
350 case 0:
351 temp = s - c;
352 break;
353 case 1:
354 temp = -s - c;
355 break;
356 case 2:
357 temp = -s + c;
358 break;
359 case 3:
360 temp = s + c;
361 break;
363 b = invsqrtpi * temp / __ieee754_sqrtl (x);
365 else
367 a = __ieee754_y0l (x);
368 b = __ieee754_y1l (x);
369 /* quit if b is -inf */
370 GET_LDOUBLE_WORDS (se, i0, i1, b);
371 /* Use 0xffffffff since GET_LDOUBLE_WORDS sign-extends SE. */
372 for (i = 1; i < n && se != 0xffffffff; i++)
374 temp = b;
375 b = ((long double) (i + i) / x) * b - a;
376 GET_LDOUBLE_WORDS (se, i0, i1, b);
377 a = temp;
380 /* If B is +-Inf, set up errno accordingly. */
381 if (! isfinite (b))
382 __set_errno (ERANGE);
383 if (sign > 0)
384 ret = b;
385 else
386 ret = -b;
388 out:
389 if (isinf (ret))
390 ret = __copysignl (LDBL_MAX, ret) * LDBL_MAX;
391 return ret;
393 strong_alias (__ieee754_ynl, __ynl_finite)