2 * ====================================================
3 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
5 * Developed at SunPro, a Sun Microsystems, Inc. business.
6 * Permission to use, copy, modify, and distribute this
7 * software is freely granted, provided that this notice
9 * ====================================================
12 /* Expansions and modifications for 128-bit long double are
13 Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov>
14 and are incorporated herein by permission of the author. The author
15 reserves the right to distribute this material elsewhere under different
16 copying permissions. These modifications are distributed here under
19 This library is free software; you can redistribute it and/or
20 modify it under the terms of the GNU Lesser General Public
21 License as published by the Free Software Foundation; either
22 version 2.1 of the License, or (at your option) any later version.
24 This library is distributed in the hope that it will be useful,
25 but WITHOUT ANY WARRANTY; without even the implied warranty of
26 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
27 Lesser General Public License for more details.
29 You should have received a copy of the GNU Lesser General Public
30 License along with this library; if not, see
31 <http://www.gnu.org/licenses/>. */
33 /* powq(x,y) return x**y
36 * Method: Let x = 2 * (1+f)
37 * 1. Compute and return log2(x) in two pieces:
39 * where w1 has 113-53 = 60 bit trailing zeros.
40 * 2. Perform y*log2(x) = n+y' by simulating muti-precision
41 * arithmetic, where |y'|<=0.5.
42 * 3. Return x**y = 2**n*exp(y'*log2)
45 * 1. (anything) ** 0 is 1
46 * 2. (anything) ** 1 is itself
47 * 3. (anything) ** NAN is NAN
48 * 4. NAN ** (anything except 0) is NAN
49 * 5. +-(|x| > 1) ** +INF is +INF
50 * 6. +-(|x| > 1) ** -INF is +0
51 * 7. +-(|x| < 1) ** +INF is +0
52 * 8. +-(|x| < 1) ** -INF is +INF
53 * 9. +-1 ** +-INF is NAN
54 * 10. +0 ** (+anything except 0, NAN) is +0
55 * 11. -0 ** (+anything except 0, NAN, odd integer) is +0
56 * 12. +0 ** (-anything except 0, NAN) is +INF
57 * 13. -0 ** (-anything except 0, NAN, odd integer) is +INF
58 * 14. -0 ** (odd integer) = -( +0 ** (odd integer) )
59 * 15. +INF ** (+anything except 0,NAN) is +INF
60 * 16. +INF ** (-anything except 0,NAN) is +0
61 * 17. -INF ** (anything) = -0 ** (-anything)
62 * 18. (-anything) ** (integer) is (-1)**(integer)*(+anything**integer)
63 * 19. (-anything except 0 and inf) ** (non-integer) is NAN
67 #include "quadmath-imp.h"
69 static const __float128 bp
[] = {
75 static const __float128 dp_h
[] = {
77 5.8496250072115607565592654282227158546448E-1Q
80 /* Low part of log_2(1.5) */
81 static const __float128 dp_l
[] = {
83 1.0579781240112554492329533686862998106046E-16Q
86 static const __float128 zero
= 0,
89 two113
= 1.0384593717069655257060992658440192E34Q
,
93 /* 3/2 log x = 3 z + z^3 + z^3 (z^2 R(z^2))
96 Peak relative error 2.3e-37 */
97 static const __float128 LN
[] =
99 -3.0779177200290054398792536829702930623200E1Q
,
100 6.5135778082209159921251824580292116201640E1Q
,
101 -4.6312921812152436921591152809994014413540E1Q
,
102 1.2510208195629420304615674658258363295208E1Q
,
103 -9.9266909031921425609179910128531667336670E-1Q
105 static const __float128 LD
[] =
107 -5.129862866715009066465422805058933131960E1Q
,
108 1.452015077564081884387441590064272782044E2Q
,
109 -1.524043275549860505277434040464085593165E2Q
,
110 7.236063513651544224319663428634139768808E1Q
,
111 -1.494198912340228235853027849917095580053E1Q
115 /* exp(x) = 1 + x - x / (1 - 2 / (x - x^2 R(x^2)))
117 Peak relative error 5.7e-38 */
118 static const __float128 PN
[] =
120 5.081801691915377692446852383385968225675E8Q
,
121 9.360895299872484512023336636427675327355E6Q
,
122 4.213701282274196030811629773097579432957E4Q
,
123 5.201006511142748908655720086041570288182E1Q
,
124 9.088368420359444263703202925095675982530E-3Q
,
126 static const __float128 PD
[] =
128 3.049081015149226615468111430031590411682E9Q
,
129 1.069833887183886839966085436512368982758E8Q
,
130 8.259257717868875207333991924545445705394E5Q
,
131 1.872583833284143212651746812884298360922E3Q
,
135 static const __float128
137 lg2
= 6.9314718055994530941723212145817656807550E-1Q
,
138 lg2_h
= 6.9314718055994528622676398299518041312695E-1Q
,
139 lg2_l
= 2.3190468138462996154948554638754786504121E-17Q
,
140 ovt
= 8.0085662595372944372e-0017Q
,
142 cp
= 9.6179669392597560490661645400126142495110E-1Q
,
143 cp_h
= 9.6179669392597555432899980587535537779331E-1Q
,
144 cp_l
= 5.0577616648125906047157785230014751039424E-17Q
;
147 powq (__float128 x
, __float128 y
)
149 __float128 z
, ax
, z_h
, z_l
, p_h
, p_l
;
150 __float128 y1
, t1
, t2
, r
, s
, sgn
, t
, u
, v
, w
;
151 __float128 s2
, s_h
, s_l
, t_h
, t_l
, ay
;
152 int32_t i
, j
, k
, yisint
, n
;
155 ieee854_float128 o
, p
, q
;
159 ix
= hx
& 0x7fffffff;
163 iy
= hy
& 0x7fffffff;
166 /* y==zero: x**0 = 1 */
167 if ((iy
| q
.words32
.w1
| q
.words32
.w2
| q
.words32
.w3
) == 0
168 && !issignalingq (x
))
171 /* 1.0**y = 1; -1.0**+-Inf = 1 */
172 if (x
== one
&& !issignalingq (y
))
174 if (x
== -1 && iy
== 0x7fff0000
175 && (q
.words32
.w1
| q
.words32
.w2
| q
.words32
.w3
) == 0)
178 /* +-NaN return x+y */
179 if ((ix
> 0x7fff0000)
180 || ((ix
== 0x7fff0000)
181 && ((p
.words32
.w1
| p
.words32
.w2
| p
.words32
.w3
) != 0))
183 || ((iy
== 0x7fff0000)
184 && ((q
.words32
.w1
| q
.words32
.w2
| q
.words32
.w3
) != 0)))
187 /* determine if y is an odd int when x < 0
188 * yisint = 0 ... y is not an integer
189 * yisint = 1 ... y is an odd int
190 * yisint = 2 ... y is an even int
195 if (iy
>= 0x40700000) /* 2^113 */
196 yisint
= 2; /* even integer y */
197 else if (iy
>= 0x3fff0000) /* 1.0 */
210 /* special value of y */
211 if ((q
.words32
.w1
| q
.words32
.w2
| q
.words32
.w3
) == 0)
213 if (iy
== 0x7fff0000) /* y is +-inf */
215 if (((ix
- 0x3fff0000) | p
.words32
.w1
| p
.words32
.w2
| p
.words32
.w3
)
217 return y
- y
; /* +-1**inf is NaN */
218 else if (ix
>= 0x3fff0000) /* (|x|>1)**+-inf = inf,0 */
219 return (hy
>= 0) ? y
: zero
;
220 else /* (|x|<1)**-,+inf = inf,0 */
221 return (hy
< 0) ? -y
: zero
;
223 if (iy
== 0x3fff0000)
230 if (hy
== 0x40000000)
231 return x
* x
; /* y is 2 */
232 if (hy
== 0x3ffe0000)
234 if (hx
>= 0) /* x >= +0 */
240 /* special value of x */
241 if ((p
.words32
.w1
| p
.words32
.w2
| p
.words32
.w3
) == 0)
243 if (ix
== 0x7fff0000 || ix
== 0 || ix
== 0x3fff0000)
245 z
= ax
; /*x is +-0,+-inf,+-1 */
247 z
= one
/ z
; /* z = (1/|x|) */
250 if (((ix
- 0x3fff0000) | yisint
) == 0)
252 z
= (z
- z
) / (z
- z
); /* (-1)**non-int is NaN */
254 else if (yisint
== 1)
255 z
= -z
; /* (x<0)**odd = -(|x|**odd) */
261 /* (x<0)**(non-int) is NaN */
262 if (((((uint32_t) hx
>> 31) - 1) | yisint
) == 0)
263 return (x
- x
) / (x
- x
);
265 /* sgn (sign of result -ve**odd) = -1 else = 1 */
267 if (((((uint32_t) hx
>> 31) - 1) | (yisint
- 1)) == 0)
268 sgn
= -one
; /* (-ve)**(odd int) */
271 2^-16495 = 1/2 of smallest representable value.
272 If (1 - 1/131072)^y underflows, y > 1.4986e9 */
275 /* if (1 - 2^-113)^y underflows, y > 1.1873e38 */
278 if (ix
<= 0x3ffeffff)
279 return (hy
< 0) ? huge
* huge
: tiny
* tiny
;
280 if (ix
>= 0x3fff0000)
281 return (hy
> 0) ? huge
* huge
: tiny
* tiny
;
283 /* over/underflow if x is not close to one */
285 return (hy
< 0) ? sgn
* huge
* huge
: sgn
* tiny
* tiny
;
287 return (hy
> 0) ? sgn
* huge
* huge
: sgn
* tiny
* tiny
;
292 y
= y
< 0 ? -0x1p
-128 : 0x1p
-128;
295 /* take care subnormal number */
303 n
+= ((ix
) >> 16) - 0x3fff;
305 /* determine interval */
306 ix
= j
| 0x3fff0000; /* normalize ix */
308 k
= 0; /* |x|<sqrt(3/2) */
310 k
= 1; /* |x|<sqrt(3) */
322 /* compute s = s_h+s_l = (x-1)/(x+1) or (x-1.5)/(x+1.5) */
323 u
= ax
- bp
[k
]; /* bp[0]=1.0, bp[1]=1.5 */
324 v
= one
/ (ax
+ bp
[k
]);
330 o
.words32
.w2
&= 0xf8000000;
332 /* t_h=ax+bp[k] High */
336 o
.words32
.w2
&= 0xf8000000;
338 t_l
= ax
- (t_h
- bp
[k
]);
339 s_l
= v
* ((u
- s_h
* t_h
) - s_h
* t_l
);
340 /* compute log(ax) */
342 u
= LN
[0] + s2
* (LN
[1] + s2
* (LN
[2] + s2
* (LN
[3] + s2
* LN
[4])));
343 v
= LD
[0] + s2
* (LD
[1] + s2
* (LD
[2] + s2
* (LD
[3] + s2
* (LD
[4] + s2
))));
345 r
+= s_l
* (s_h
+ s
);
350 o
.words32
.w2
&= 0xf8000000;
352 t_l
= r
- ((t_h
- 3.0) - s2
);
353 /* u+v = s*(1+...) */
355 v
= s_l
* t_h
+ t_l
* s
;
356 /* 2/(3log2)*(s+...) */
360 o
.words32
.w2
&= 0xf8000000;
363 z_h
= cp_h
* p_h
; /* cp_h+cp_l = 2/(3*log2) */
364 z_l
= cp_l
* p_h
+ p_l
* cp
+ dp_l
[k
];
365 /* log2(ax) = (s+..)*2/(3*log2) = n + dp_h + z_h + z_l */
367 t1
= (((z_h
+ z_l
) + dp_h
[k
]) + t
);
370 o
.words32
.w2
&= 0xf8000000;
372 t2
= z_l
- (((t1
- t
) - dp_h
[k
]) - z_h
);
374 /* split up y into y1+y2 and compute (y1+y2)*(t1+t2) */
378 o
.words32
.w2
&= 0xf8000000;
380 p_l
= (y
- y1
) * t1
+ y
* t2
;
385 if (j
>= 0x400d0000) /* z >= 16384 */
388 if (((j
- 0x400d0000) | o
.words32
.w1
| o
.words32
.w2
| o
.words32
.w3
) != 0)
389 return sgn
* huge
* huge
; /* overflow */
392 if (p_l
+ ovt
> z
- p_h
)
393 return sgn
* huge
* huge
; /* overflow */
396 else if ((j
& 0x7fffffff) >= 0x400d01b9) /* z <= -16495 */
399 if (((j
- 0xc00d01bc) | o
.words32
.w1
| o
.words32
.w2
| o
.words32
.w3
)
401 return sgn
* tiny
* tiny
; /* underflow */
405 return sgn
* tiny
* tiny
; /* underflow */
408 /* compute 2**(p_h+p_l) */
410 k
= (i
>> 16) - 0x3fff;
413 { /* if |z| > 0.5, set n = [z+0.5] */
414 n
= floorq (z
+ 0.5Q
);
421 o
.words32
.w2
&= 0xf8000000;
424 v
= (p_l
- (t
- p_h
)) * lg2
+ t
* lg2_l
;
429 u
= PN
[0] + t
* (PN
[1] + t
* (PN
[2] + t
* (PN
[3] + t
* PN
[4])));
430 v
= PD
[0] + t
* (PD
[1] + t
* (PD
[2] + t
* (PD
[3] + t
)));
432 r
= (z
* t1
) / (t1
- two
) - (w
+ z
* w
);
439 z
= scalbnq (z
, n
); /* subnormal output */
440 __float128 force_underflow
= z
* z
;
441 math_force_eval (force_underflow
);