sysdeps/ieee754/ldbl-96/e_lgammal_r.c

   1 /*
   2  * ====================================================
   3  * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
   4  *
   5  * Developed at SunPro, a Sun Microsystems, Inc. business.
   6  * Permission to use, copy, modify, and distribute this
   7  * software is freely granted, provided that this notice
   8  * is preserved.
   9  * ====================================================
  10  */
  11
  12 /* Long double expansions are
  13   Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov>
  14   and are incorporated herein by permission of the author.  The author
  15   reserves the right to distribute this material elsewhere under different
  16   copying permissions.  These modifications are distributed here under
  17   the following terms:
  18
  19     This library is free software; you can redistribute it and/or
  20     modify it under the terms of the GNU Lesser General Public
  21     License as published by the Free Software Foundation; either
  22     version 2.1 of the License, or (at your option) any later version.
  23
  24     This library is distributed in the hope that it will be useful,
  25     but WITHOUT ANY WARRANTY; without even the implied warranty of
  26     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  27     Lesser General Public License for more details.
  28
  29     You should have received a copy of the GNU Lesser General Public
  30     License along with this library; if not, see
  31     <http://www.gnu.org/licenses/>.  */
  32
  33 /* __ieee754_lgammal_r(x, signgamp)
  34  * Reentrant version of the logarithm of the Gamma function
  35  * with user provide pointer for the sign of Gamma(x).
  36  *
  37  * Method:
  38  *   1. Argument Reduction for 0 < x <= 8
  39  *      Since gamma(1+s)=s*gamma(s), for x in [0,8], we may
  40  *      reduce x to a number in [1.5,2.5] by
  41  *              lgamma(1+s) = log(s) + lgamma(s)
  42  *      for example,
  43  *              lgamma(7.3) = log(6.3) + lgamma(6.3)
  44  *                          = log(6.3*5.3) + lgamma(5.3)
  45  *                          = log(6.3*5.3*4.3*3.3*2.3) + lgamma(2.3)
  46  *   2. Polynomial approximation of lgamma around its
  47  *      minimun ymin=1.461632144968362245 to maintain monotonicity.
  48  *      On [ymin-0.23, ymin+0.27] (i.e., [1.23164,1.73163]), use
  49  *              Let z = x-ymin;
  50  *              lgamma(x) = -1.214862905358496078218 + z^2*poly(z)
  51  *   2. Rational approximation in the primary interval [2,3]
  52  *      We use the following approximation:
  53  *              s = x-2.0;
  54  *              lgamma(x) = 0.5*s + s*P(s)/Q(s)
  55  *      Our algorithms are based on the following observation
  56  *
  57  *                             zeta(2)-1    2    zeta(3)-1    3
  58  * lgamma(2+s) = s*(1-Euler) + --------- * s  -  --------- * s  + ...
  59  *                                 2                 3
  60  *
  61  *      where Euler = 0.5771... is the Euler constant, which is very
  62  *      close to 0.5.
  63  *
  64  *   3. For x>=8, we have
  65  *      lgamma(x)~(x-0.5)log(x)-x+0.5*log(2pi)+1/(12x)-1/(360x**3)+....
  66  *      (better formula:
  67  *         lgamma(x)~(x-0.5)*(log(x)-1)-.5*(log(2pi)-1) + ...)
  68  *      Let z = 1/x, then we approximation
  69  *              f(z) = lgamma(x) - (x-0.5)(log(x)-1)
  70  *      by
  71  *                                  3       5             11
  72  *              w = w0 + w1*z + w2*z  + w3*z  + ... + w6*z
  73  *
  74  *   4. For negative x, since (G is gamma function)
  75  *              -x*G(-x)*G(x) = pi/sin(pi*x),
  76  *      we have
  77  *              G(x) = pi/(sin(pi*x)*(-x)*G(-x))
  78  *      since G(-x) is positive, sign(G(x)) = sign(sin(pi*x)) for x<0
  79  *      Hence, for x<0, signgam = sign(sin(pi*x)) and
  80  *              lgamma(x) = log(|Gamma(x)|)
  81  *                        = log(pi/(|x*sin(pi*x)|)) - lgamma(-x);
  82  *      Note: one should avoid compute pi*(-x) directly in the
  83  *            computation of sin(pi*(-x)).
  84  *
  85  *   5. Special Cases
  86  *              lgamma(2+s) ~ s*(1-Euler) for tiny s
  87  *              lgamma(1)=lgamma(2)=0
  88  *              lgamma(x) ~ -log(x) for tiny x
  89  *              lgamma(0) = lgamma(inf) = inf
  90  *              lgamma(-integer) = +-inf
  91  *
  92  */
  93
  94 #include <math.h>
  95 #include <math_private.h>
  96 #include <libc-diag.h>
  97
  98 static const long double
  99   half = 0.5L,
 100   one = 1.0L,
 101   pi = 3.14159265358979323846264L,
 102   two63 = 9.223372036854775808e18L,
 103
 104   /* lgam(1+x) = 0.5 x + x a(x)/b(x)
 105      -0.268402099609375 <= x <= 0
 106      peak relative error 6.6e-22 */
 107   a0 = -6.343246574721079391729402781192128239938E2L,
 108   a1 =  1.856560238672465796768677717168371401378E3L,
 109   a2 =  2.404733102163746263689288466865843408429E3L,
 110   a3 =  8.804188795790383497379532868917517596322E2L,
 111   a4 =  1.135361354097447729740103745999661157426E2L,
 112   a5 =  3.766956539107615557608581581190400021285E0L,
 113
 114   b0 =  8.214973713960928795704317259806842490498E3L,
 115   b1 =  1.026343508841367384879065363925870888012E4L,
 116   b2 =  4.553337477045763320522762343132210919277E3L,
 117   b3 =  8.506975785032585797446253359230031874803E2L,
 118   b4 =  6.042447899703295436820744186992189445813E1L,
 119   /* b5 =  1.000000000000000000000000000000000000000E0 */
 120
 121
 122   tc =  1.4616321449683623412626595423257213284682E0L,
 123   tf = -1.2148629053584961146050602565082954242826E-1,/* double precision */
 124 /* tt = (tail of tf), i.e. tf + tt has extended precision. */
 125   tt = 3.3649914684731379602768989080467587736363E-18L,
 126   /* lgam ( 1.4616321449683623412626595423257213284682E0 ) =
 127 -1.2148629053584960809551455717769158215135617312999903886372437313313530E-1 */
 128
 129   /* lgam (x + tc) = tf + tt + x g(x)/h(x)
 130      - 0.230003726999612341262659542325721328468 <= x
 131      <= 0.2699962730003876587373404576742786715318
 132      peak relative error 2.1e-21 */
 133   g0 = 3.645529916721223331888305293534095553827E-18L,
 134   g1 = 5.126654642791082497002594216163574795690E3L,
 135   g2 = 8.828603575854624811911631336122070070327E3L,
 136   g3 = 5.464186426932117031234820886525701595203E3L,
 137   g4 = 1.455427403530884193180776558102868592293E3L,
 138   g5 = 1.541735456969245924860307497029155838446E2L,
 139   g6 = 4.335498275274822298341872707453445815118E0L,
 140
 141   h0 = 1.059584930106085509696730443974495979641E4L,
 142   h1 =  2.147921653490043010629481226937850618860E4L,
 143   h2 = 1.643014770044524804175197151958100656728E4L,
 144   h3 =  5.869021995186925517228323497501767586078E3L,
 145   h4 =  9.764244777714344488787381271643502742293E2L,
 146   h5 =  6.442485441570592541741092969581997002349E1L,
 147   /* h6 = 1.000000000000000000000000000000000000000E0 */
 148
 149
 150   /* lgam (x+1) = -0.5 x + x u(x)/v(x)
 151      -0.100006103515625 <= x <= 0.231639862060546875
 152      peak relative error 1.3e-21 */
 153   u0 = -8.886217500092090678492242071879342025627E1L,
 154   u1 =  6.840109978129177639438792958320783599310E2L,
 155   u2 =  2.042626104514127267855588786511809932433E3L,
 156   u3 =  1.911723903442667422201651063009856064275E3L,
 157   u4 =  7.447065275665887457628865263491667767695E2L,
 158   u5 =  1.132256494121790736268471016493103952637E2L,
 159   u6 =  4.484398885516614191003094714505960972894E0L,
 160
 161   v0 =  1.150830924194461522996462401210374632929E3L,
 162   v1 =  3.399692260848747447377972081399737098610E3L,
 163   v2 =  3.786631705644460255229513563657226008015E3L,
 164   v3 =  1.966450123004478374557778781564114347876E3L,
 165   v4 =  4.741359068914069299837355438370682773122E2L,
 166   v5 =  4.508989649747184050907206782117647852364E1L,
 167   /* v6 =  1.000000000000000000000000000000000000000E0 */
 168
 169
 170   /* lgam (x+2) = .5 x + x s(x)/r(x)
 171      0 <= x <= 1
 172      peak relative error 7.2e-22 */
 173   s0 =  1.454726263410661942989109455292824853344E6L,
 174   s1 = -3.901428390086348447890408306153378922752E6L,
 175   s2 = -6.573568698209374121847873064292963089438E6L,
 176   s3 = -3.319055881485044417245964508099095984643E6L,
 177   s4 = -7.094891568758439227560184618114707107977E5L,
 178   s5 = -6.263426646464505837422314539808112478303E4L,
 179   s6 = -1.684926520999477529949915657519454051529E3L,
 180
 181   r0 = -1.883978160734303518163008696712983134698E7L,
 182   r1 = -2.815206082812062064902202753264922306830E7L,
 183   r2 = -1.600245495251915899081846093343626358398E7L,
 184   r3 = -4.310526301881305003489257052083370058799E6L,
 185   r4 = -5.563807682263923279438235987186184968542E5L,
 186   r5 = -3.027734654434169996032905158145259713083E4L,
 187   r6 = -4.501995652861105629217250715790764371267E2L,
 188   /* r6 =  1.000000000000000000000000000000000000000E0 */
 189
 190
 191 /* lgam(x) = ( x - 0.5 ) * log(x) - x + LS2PI + 1/x w(1/x^2)
 192    x >= 8
 193    Peak relative error 1.51e-21
 194    w0 = LS2PI - 0.5 */
 195   w0 =  4.189385332046727417803e-1L,
 196   w1 =  8.333333333333331447505E-2L,
 197   w2 = -2.777777777750349603440E-3L,
 198   w3 =  7.936507795855070755671E-4L,
 199   w4 = -5.952345851765688514613E-4L,
 200   w5 =  8.412723297322498080632E-4L,
 201   w6 = -1.880801938119376907179E-3L,
 202   w7 =  4.885026142432270781165E-3L;
 203
 204 static const long double zero = 0.0L;
 205
 206 static long double
 207 sin_pi (long double x)
 208 {
 209   long double y, z;
 210   int n, ix;
 211   uint32_t se, i0, i1;
 212
 213   GET_LDOUBLE_WORDS (se, i0, i1, x);
 214   ix = se & 0x7fff;
 215   ix = (ix << 16) | (i0 >> 16);
 216   if (ix < 0x3ffd8000) /* 0.25 */
 217     return __sinl (pi * x);
 218   y = -x;                       /* x is assume negative */
 219
 220   /*
 221    * argument reduction, make sure inexact flag not raised if input
 222    * is an integer
 223    */
 224   z = __floorl (y);
 225   if (z != y)
 226     {                           /* inexact anyway */
 227       y  *= 0.5;
 228       y = 2.0*(y - __floorl(y));                /* y = |x| mod 2.0 */
 229       n = (int) (y*4.0);
 230     }
 231   else
 232     {
 233       if (ix >= 0x403f8000)  /* 2^64 */
 234         {
 235           y = zero; n = 0;                 /* y must be even */
 236         }
 237       else
 238         {
 239         if (ix < 0x403e8000)  /* 2^63 */
 240           z = y + two63;        /* exact */
 241         GET_LDOUBLE_WORDS (se, i0, i1, z);
 242         n = i1 & 1;
 243         y  = n;
 244         n <<= 2;
 245       }
 246     }
 247
 248   switch (n)
 249     {
 250     case 0:
 251       y = __sinl (pi * y);
 252       break;
 253     case 1:
 254     case 2:
 255       y = __cosl (pi * (half - y));
 256       break;
 257     case 3:
 258     case 4:
 259       y = __sinl (pi * (one - y));
 260       break;
 261     case 5:
 262     case 6:
 263       y = -__cosl (pi * (y - 1.5));
 264       break;
 265     default:
 266       y = __sinl (pi * (y - 2.0));
 267       break;
 268     }
 269   return -y;
 270 }
 271
 272
 273 long double
 274 __ieee754_lgammal_r (long double x, int *signgamp)
 275 {
 276   long double t, y, z, nadj, p, p1, p2, q, r, w;
 277   int i, ix;
 278   uint32_t se, i0, i1;
 279
 280   *signgamp = 1;
 281   GET_LDOUBLE_WORDS (se, i0, i1, x);
 282   ix = se & 0x7fff;
 283
 284   if (__builtin_expect((ix | i0 | i1) == 0, 0))
 285     {
 286       if (se & 0x8000)
 287         *signgamp = -1;
 288       return one / fabsl (x);
 289     }
 290
 291   ix = (ix << 16) | (i0 >> 16);
 292
 293   /* purge off +-inf, NaN, +-0, and negative arguments */
 294   if (__builtin_expect(ix >= 0x7fff0000, 0))
 295     return x * x;
 296
 297   if (__builtin_expect(ix < 0x3fc08000, 0)) /* 2^-63 */
 298     {                           /* |x|<2**-63, return -log(|x|) */
 299       if (se & 0x8000)
 300         {
 301           *signgamp = -1;
 302           return -__ieee754_logl (-x);
 303         }
 304       else
 305         return -__ieee754_logl (x);
 306     }
 307   if (se & 0x8000)
 308     {
 309       if (x < -2.0L && x > -33.0L)
 310         return __lgamma_negl (x, signgamp);
 311       t = sin_pi (x);
 312       if (t == zero)
 313         return one / fabsl (t); /* -integer */
 314       nadj = __ieee754_logl (pi / fabsl (t * x));
 315       if (t < zero)
 316         *signgamp = -1;
 317       x = -x;
 318     }
 319
 320   /* purge off 1 and 2 */
 321   if ((((ix - 0x3fff8000) | i0 | i1) == 0)
 322       || (((ix - 0x40008000) | i0 | i1) == 0))
 323     r = 0;
 324   else if (ix < 0x40008000) /* 2.0 */
 325     {
 326       /* x < 2.0 */
 327       if (ix <= 0x3ffee666) /* 8.99993896484375e-1 */
 328         {
 329           /* lgamma(x) = lgamma(x+1) - log(x) */
 330           r = -__ieee754_logl (x);
 331           if (ix >= 0x3ffebb4a) /* 7.31597900390625e-1 */
 332             {
 333               y = x - one;
 334               i = 0;
 335             }
 336           else if (ix >= 0x3ffced33)/* 2.31639862060546875e-1 */
 337             {
 338               y = x - (tc - one);
 339               i = 1;
 340             }
 341           else
 342             {
 343               /* x < 0.23 */
 344               y = x;
 345               i = 2;
 346             }
 347         }
 348       else
 349         {
 350           r = zero;
 351           if (ix >= 0x3fffdda6) /* 1.73162841796875 */
 352             {
 353               /* [1.7316,2] */
 354               y = x - 2.0;
 355               i = 0;
 356             }
 357           else if (ix >= 0x3fff9da6)/* 1.23162841796875 */
 358             {
 359               /* [1.23,1.73] */
 360               y = x - tc;
 361               i = 1;
 362             }
 363           else
 364             {
 365               /* [0.9, 1.23] */
 366               y = x - one;
 367               i = 2;
 368             }
 369         }
 370       switch (i)
 371         {
 372         case 0:
 373           p1 = a0 + y * (a1 + y * (a2 + y * (a3 + y * (a4 + y * a5))));
 374           p2 = b0 + y * (b1 + y * (b2 + y * (b3 + y * (b4 + y))));
 375           r += half * y + y * p1/p2;
 376           break;
 377         case 1:
 378     p1 = g0 + y * (g1 + y * (g2 + y * (g3 + y * (g4 + y * (g5 + y * g6)))));
 379     p2 = h0 + y * (h1 + y * (h2 + y * (h3 + y * (h4 + y * (h5 + y)))));
 380     p = tt + y * p1/p2;
 381           r += (tf + p);
 382           break;
 383         case 2:
 384  p1 = y * (u0 + y * (u1 + y * (u2 + y * (u3 + y * (u4 + y * (u5 + y * u6))))));
 385       p2 = v0 + y * (v1 + y * (v2 + y * (v3 + y * (v4 + y * (v5 + y)))));
 386           r += (-half * y + p1 / p2);
 387         }
 388     }
 389   else if (ix < 0x40028000) /* 8.0 */
 390     {
 391       /* x < 8.0 */
 392       i = (int) x;
 393       t = zero;
 394       y = x - (double) i;
 395   p = y *
 396      (s0 + y * (s1 + y * (s2 + y * (s3 + y * (s4 + y * (s5 + y * s6))))));
 397   q = r0 + y * (r1 + y * (r2 + y * (r3 + y * (r4 + y * (r5 + y * (r6 + y))))));
 398       r = half * y + p / q;
 399       z = one;                  /* lgamma(1+s) = log(s) + lgamma(s) */
 400       switch (i)
 401         {
 402         case 7:
 403           z *= (y + 6.0);       /* FALLTHRU */
 404         case 6:
 405           z *= (y + 5.0);       /* FALLTHRU */
 406         case 5:
 407           z *= (y + 4.0);       /* FALLTHRU */
 408         case 4:
 409           z *= (y + 3.0);       /* FALLTHRU */
 410         case 3:
 411           z *= (y + 2.0);       /* FALLTHRU */
 412           r += __ieee754_logl (z);
 413           break;
 414         }
 415     }
 416   else if (ix < 0x40418000) /* 2^66 */
 417     {
 418       /* 8.0 <= x < 2**66 */
 419       t = __ieee754_logl (x);
 420       z = one / x;
 421       y = z * z;
 422       w = w0 + z * (w1
 423           + y * (w2 + y * (w3 + y * (w4 + y * (w5 + y * (w6 + y * w7))))));
 424       r = (x - half) * (t - one) + w;
 425     }
 426   else
 427     /* 2**66 <= x <= inf */
 428     r = x * (__ieee754_logl (x) - one);
 429   /* NADJ is set for negative arguments but not otherwise, resulting
 430      in warnings that it may be used uninitialized although in the
 431      cases where it is used it has always been set.  */
 432   DIAG_PUSH_NEEDS_COMMENT;
 433   DIAG_IGNORE_NEEDS_COMMENT (4.9, "-Wmaybe-uninitialized");
 434   if (se & 0x8000)
 435     r = nadj - r;
 436   DIAG_POP_NEEDS_COMMENT;
 437   return r;
 438 }
 439 strong_alias (__ieee754_lgammal_r, __lgammal_r_finite)