Update copyright notices with scripts/update-copyrights.
[glibc.git] / sysdeps / ieee754 / dbl-64 / mpsqrt.c
blob65df9fd0673896512d91d9f9a3c6b27e21b4a70d
1 /*
2 * IBM Accurate Mathematical Library
3 * written by International Business Machines Corp.
4 * Copyright (C) 2001-2013 Free Software Foundation, Inc.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU Lesser General Public License as published by
8 * the Free Software Foundation; either version 2.1 of the License, or
9 * (at your option) any later version.
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU Lesser General Public License for more details.
16 * You should have received a copy of the GNU Lesser General Public License
17 * along with this program; if not, see <http://www.gnu.org/licenses/>.
19 /****************************************************************************/
20 /* MODULE_NAME:mpsqrt.c */
21 /* */
22 /* FUNCTION:mpsqrt */
23 /* fastiroot */
24 /* */
25 /* FILES NEEDED:endian.h mpa.h mpsqrt.h */
26 /* mpa.c */
27 /* Multi-Precision square root function subroutine for precision p >= 4. */
28 /* The relative error is bounded by 3.501*r**(1-p), where r=2**24. */
29 /* */
30 /****************************************************************************/
31 #include "endian.h"
32 #include "mpa.h"
34 #ifndef SECTION
35 # define SECTION
36 #endif
38 #include "mpsqrt.h"
40 /****************************************************************************/
41 /* Multi-Precision square root function subroutine for precision p >= 4. */
42 /* The relative error is bounded by 3.501*r**(1-p), where r=2**24. */
43 /* Routine receives two pointers to Multi Precision numbers: */
44 /* x (left argument) and y (next argument). Routine also receives precision */
45 /* p as integer. Routine computes sqrt(*x) and stores result in *y */
46 /****************************************************************************/
48 static double fastiroot(double);
50 void
51 SECTION
52 __mpsqrt(mp_no *x, mp_no *y, int p) {
53 int i,m,ey;
54 double dx,dy;
55 static const mp_no
56 mphalf = {0,{1.0,8388608.0 /* 2^23 */}},
57 mp3halfs = {1,{1.0,1.0,8388608.0 /* 2^23 */}};
58 mp_no mpxn,mpz,mpu,mpt1,mpt2;
60 ey=EX/2; __cpy(x,&mpxn,p); mpxn.e -= (ey+ey);
61 __mp_dbl(&mpxn,&dx,p); dy=fastiroot(dx); __dbl_mp(dy,&mpu,p);
62 __mul(&mpxn,&mphalf,&mpz,p);
64 m=__mpsqrt_mp[p];
65 for (i=0; i<m; i++) {
66 __mul(&mpu,&mpu,&mpt1,p);
67 __mul(&mpt1,&mpz,&mpt2,p);
68 __sub(&mp3halfs,&mpt2,&mpt1,p);
69 __mul(&mpu,&mpt1,&mpt2,p);
70 __cpy(&mpt2,&mpu,p);
72 __mul(&mpxn,&mpu,y,p); EY += ey;
74 return;
77 /***********************************************************/
78 /* Compute a double precision approximation for 1/sqrt(x) */
79 /* with the relative error bounded by 2**-51. */
80 /***********************************************************/
81 static double
82 SECTION
83 fastiroot(double x) {
84 union {int i[2]; double d;} p,q;
85 double y,z, t;
86 int n;
87 static const double c0 = 0.99674, c1 = -0.53380, c2 = 0.45472, c3 = -0.21553;
89 p.d = x;
90 p.i[HIGH_HALF] = (p.i[HIGH_HALF] & 0x3FFFFFFF ) | 0x3FE00000 ;
91 q.d = x;
92 y = p.d;
93 z = y -1.0;
94 n = (q.i[HIGH_HALF] - p.i[HIGH_HALF])>>1;
95 z = ((c3*z + c2)*z + c1)*z + c0; /* 2**-7 */
96 z = z*(1.5 - 0.5*y*z*z); /* 2**-14 */
97 p.d = z*(1.5 - 0.5*y*z*z); /* 2**-28 */
98 p.i[HIGH_HALF] -= n;
99 t = x*p.d;
100 return p.d*(1.5 - 0.5*p.d*t);