1*81418a27Smrg /*
2*81418a27Smrg  * ====================================================
3*81418a27Smrg  * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
4*81418a27Smrg  *
5*81418a27Smrg  * Developed at SunPro, a Sun Microsystems, Inc. business.
6*81418a27Smrg  * Permission to use, copy, modify, and distribute this
7*81418a27Smrg  * software is freely granted, provided that this notice
8*81418a27Smrg  * is preserved.
9*81418a27Smrg  * ====================================================
10*81418a27Smrg  */
11*81418a27Smrg 
12*81418a27Smrg /*
13*81418a27Smrg   Long double expansions are
14*81418a27Smrg   Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov>
15*81418a27Smrg   and are incorporated herein by permission of the author.  The author
16*81418a27Smrg   reserves the right to distribute this material elsewhere under different
17*81418a27Smrg   copying permissions.  These modifications are distributed here under the
18*81418a27Smrg   following terms:
19*81418a27Smrg 
20*81418a27Smrg     This library is free software; you can redistribute it and/or
21*81418a27Smrg     modify it under the terms of the GNU Lesser General Public
22*81418a27Smrg     License as published by the Free Software Foundation; either
23*81418a27Smrg     version 2.1 of the License, or (at your option) any later version.
24*81418a27Smrg 
25*81418a27Smrg     This library is distributed in the hope that it will be useful,
26*81418a27Smrg     but WITHOUT ANY WARRANTY; without even the implied warranty of
27*81418a27Smrg     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
28*81418a27Smrg     Lesser General Public License for more details.
29*81418a27Smrg 
30*81418a27Smrg     You should have received a copy of the GNU Lesser General Public
31*81418a27Smrg     License along with this library; if not, see
32*81418a27Smrg     <http://www.gnu.org/licenses/>.  */
33*81418a27Smrg 
34*81418a27Smrg /* __ieee754_asin(x)
35*81418a27Smrg  * Method :
36*81418a27Smrg  *	Since  asin(x) = x + x^3/6 + x^5*3/40 + x^7*15/336 + ...
37*81418a27Smrg  *	we approximate asin(x) on [0,0.5] by
38*81418a27Smrg  *		asin(x) = x + x*x^2*R(x^2)
39*81418a27Smrg  *      Between .5 and .625 the approximation is
40*81418a27Smrg  *              asin(0.5625 + x) = asin(0.5625) + x rS(x) / sS(x)
41*81418a27Smrg  *	For x in [0.625,1]
42*81418a27Smrg  *		asin(x) = pi/2-2*asin(sqrt((1-x)/2))
43*81418a27Smrg  *	Let y = (1-x), z = y/2, s := sqrt(z), and pio2_hi+pio2_lo=pi/2;
44*81418a27Smrg  *	then for x>0.98
45*81418a27Smrg  *		asin(x) = pi/2 - 2*(s+s*z*R(z))
46*81418a27Smrg  *			= pio2_hi - (2*(s+s*z*R(z)) - pio2_lo)
47*81418a27Smrg  *	For x<=0.98, let pio4_hi = pio2_hi/2, then
48*81418a27Smrg  *		f = hi part of s;
49*81418a27Smrg  *		c = sqrt(z) - f = (z-f*f)/(s+f) 	...f+c=sqrt(z)
50*81418a27Smrg  *	and
51*81418a27Smrg  *		asin(x) = pi/2 - 2*(s+s*z*R(z))
52*81418a27Smrg  *			= pio4_hi+(pio4-2s)-(2s*z*R(z)-pio2_lo)
53*81418a27Smrg  *			= pio4_hi+(pio4-2f)-(2s*z*R(z)-(pio2_lo+2c))
54*81418a27Smrg  *
55*81418a27Smrg  * Special cases:
56*81418a27Smrg  *	if x is NaN, return x itself;
57*81418a27Smrg  *	if |x|>1, return NaN with invalid signal.
58*81418a27Smrg  *
59*81418a27Smrg  */
60*81418a27Smrg 
61*81418a27Smrg #include "quadmath-imp.h"
62*81418a27Smrg 
63*81418a27Smrg static const __float128
64*81418a27Smrg   one = 1,
65*81418a27Smrg   huge = 1.0e+4932Q,
66*81418a27Smrg   pio2_hi = 1.5707963267948966192313216916397514420986Q,
67*81418a27Smrg   pio2_lo = 4.3359050650618905123985220130216759843812E-35Q,
68*81418a27Smrg   pio4_hi = 7.8539816339744830961566084581987569936977E-1Q,
69*81418a27Smrg 
70*81418a27Smrg 	/* coefficient for R(x^2) */
71*81418a27Smrg 
72*81418a27Smrg   /* asin(x) = x + x^3 pS(x^2) / qS(x^2)
73*81418a27Smrg      0 <= x <= 0.5
74*81418a27Smrg      peak relative error 1.9e-35  */
75*81418a27Smrg   pS0 = -8.358099012470680544198472400254596543711E2Q,
76*81418a27Smrg   pS1 =  3.674973957689619490312782828051860366493E3Q,
77*81418a27Smrg   pS2 = -6.730729094812979665807581609853656623219E3Q,
78*81418a27Smrg   pS3 =  6.643843795209060298375552684423454077633E3Q,
79*81418a27Smrg   pS4 = -3.817341990928606692235481812252049415993E3Q,
80*81418a27Smrg   pS5 =  1.284635388402653715636722822195716476156E3Q,
81*81418a27Smrg   pS6 = -2.410736125231549204856567737329112037867E2Q,
82*81418a27Smrg   pS7 =  2.219191969382402856557594215833622156220E1Q,
83*81418a27Smrg   pS8 = -7.249056260830627156600112195061001036533E-1Q,
84*81418a27Smrg   pS9 =  1.055923570937755300061509030361395604448E-3Q,
85*81418a27Smrg 
86*81418a27Smrg   qS0 = -5.014859407482408326519083440151745519205E3Q,
87*81418a27Smrg   qS1 =  2.430653047950480068881028451580393430537E4Q,
88*81418a27Smrg   qS2 = -4.997904737193653607449250593976069726962E4Q,
89*81418a27Smrg   qS3 =  5.675712336110456923807959930107347511086E4Q,
90*81418a27Smrg   qS4 = -3.881523118339661268482937768522572588022E4Q,
91*81418a27Smrg   qS5 =  1.634202194895541569749717032234510811216E4Q,
92*81418a27Smrg   qS6 = -4.151452662440709301601820849901296953752E3Q,
93*81418a27Smrg   qS7 =  5.956050864057192019085175976175695342168E2Q,
94*81418a27Smrg   qS8 = -4.175375777334867025769346564600396877176E1Q,
95*81418a27Smrg   /* 1.000000000000000000000000000000000000000E0 */
96*81418a27Smrg 
97*81418a27Smrg   /* asin(0.5625 + x) = asin(0.5625) + x rS(x) / sS(x)
98*81418a27Smrg      -0.0625 <= x <= 0.0625
99*81418a27Smrg      peak relative error 3.3e-35  */
100*81418a27Smrg   rS0 = -5.619049346208901520945464704848780243887E0Q,
101*81418a27Smrg   rS1 =  4.460504162777731472539175700169871920352E1Q,
102*81418a27Smrg   rS2 = -1.317669505315409261479577040530751477488E2Q,
103*81418a27Smrg   rS3 =  1.626532582423661989632442410808596009227E2Q,
104*81418a27Smrg   rS4 = -3.144806644195158614904369445440583873264E1Q,
105*81418a27Smrg   rS5 = -9.806674443470740708765165604769099559553E1Q,
106*81418a27Smrg   rS6 =  5.708468492052010816555762842394927806920E1Q,
107*81418a27Smrg   rS7 =  1.396540499232262112248553357962639431922E1Q,
108*81418a27Smrg   rS8 = -1.126243289311910363001762058295832610344E1Q,
109*81418a27Smrg   rS9 = -4.956179821329901954211277873774472383512E-1Q,
110*81418a27Smrg   rS10 =  3.313227657082367169241333738391762525780E-1Q,
111*81418a27Smrg 
112*81418a27Smrg   sS0 = -4.645814742084009935700221277307007679325E0Q,
113*81418a27Smrg   sS1 =  3.879074822457694323970438316317961918430E1Q,
114*81418a27Smrg   sS2 = -1.221986588013474694623973554726201001066E2Q,
115*81418a27Smrg   sS3 =  1.658821150347718105012079876756201905822E2Q,
116*81418a27Smrg   sS4 = -4.804379630977558197953176474426239748977E1Q,
117*81418a27Smrg   sS5 = -1.004296417397316948114344573811562952793E2Q,
118*81418a27Smrg   sS6 =  7.530281592861320234941101403870010111138E1Q,
119*81418a27Smrg   sS7 =  1.270735595411673647119592092304357226607E1Q,
120*81418a27Smrg   sS8 = -1.815144839646376500705105967064792930282E1Q,
121*81418a27Smrg   sS9 = -7.821597334910963922204235247786840828217E-2Q,
122*81418a27Smrg   /*  1.000000000000000000000000000000000000000E0 */
123*81418a27Smrg 
124*81418a27Smrg  asinr5625 =  5.9740641664535021430381036628424864397707E-1Q;
125*81418a27Smrg 
126*81418a27Smrg 
127*81418a27Smrg 
128*81418a27Smrg __float128
asinq(__float128 x)129*81418a27Smrg asinq (__float128 x)
130*81418a27Smrg {
131*81418a27Smrg   __float128 t, w, p, q, c, r, s;
132*81418a27Smrg   int32_t ix, sign, flag;
133*81418a27Smrg   ieee854_float128 u;
134*81418a27Smrg 
135*81418a27Smrg   flag = 0;
136*81418a27Smrg   u.value = x;
137*81418a27Smrg   sign = u.words32.w0;
138*81418a27Smrg   ix = sign & 0x7fffffff;
139*81418a27Smrg   u.words32.w0 = ix;    /* |x| */
140*81418a27Smrg   if (ix >= 0x3fff0000)	/* |x|>= 1 */
141*81418a27Smrg     {
142*81418a27Smrg       if (ix == 0x3fff0000
143*81418a27Smrg 	  && (u.words32.w1 | u.words32.w2 | u.words32.w3) == 0)
144*81418a27Smrg 	/* asin(1)=+-pi/2 with inexact */
145*81418a27Smrg 	return x * pio2_hi + x * pio2_lo;
146*81418a27Smrg       return (x - x) / (x - x);	/* asin(|x|>1) is NaN */
147*81418a27Smrg     }
148*81418a27Smrg   else if (ix < 0x3ffe0000) /* |x| < 0.5 */
149*81418a27Smrg     {
150*81418a27Smrg       if (ix < 0x3fc60000) /* |x| < 2**-57 */
151*81418a27Smrg 	{
152*81418a27Smrg 	  math_check_force_underflow (x);
153*81418a27Smrg 	  __float128 force_inexact = huge + x;
154*81418a27Smrg 	  math_force_eval (force_inexact);
155*81418a27Smrg 	  return x;		/* return x with inexact if x!=0 */
156*81418a27Smrg 	}
157*81418a27Smrg       else
158*81418a27Smrg 	{
159*81418a27Smrg 	  t = x * x;
160*81418a27Smrg 	  /* Mark to use pS, qS later on.  */
161*81418a27Smrg 	  flag = 1;
162*81418a27Smrg 	}
163*81418a27Smrg     }
164*81418a27Smrg   else if (ix < 0x3ffe4000) /* 0.625 */
165*81418a27Smrg     {
166*81418a27Smrg       t = u.value - 0.5625;
167*81418a27Smrg       p = ((((((((((rS10 * t
168*81418a27Smrg 		    + rS9) * t
169*81418a27Smrg 		   + rS8) * t
170*81418a27Smrg 		  + rS7) * t
171*81418a27Smrg 		 + rS6) * t
172*81418a27Smrg 		+ rS5) * t
173*81418a27Smrg 	       + rS4) * t
174*81418a27Smrg 	      + rS3) * t
175*81418a27Smrg 	     + rS2) * t
176*81418a27Smrg 	    + rS1) * t
177*81418a27Smrg 	   + rS0) * t;
178*81418a27Smrg 
179*81418a27Smrg       q = ((((((((( t
180*81418a27Smrg 		    + sS9) * t
181*81418a27Smrg 		  + sS8) * t
182*81418a27Smrg 		 + sS7) * t
183*81418a27Smrg 		+ sS6) * t
184*81418a27Smrg 	       + sS5) * t
185*81418a27Smrg 	      + sS4) * t
186*81418a27Smrg 	     + sS3) * t
187*81418a27Smrg 	    + sS2) * t
188*81418a27Smrg 	   + sS1) * t
189*81418a27Smrg 	+ sS0;
190*81418a27Smrg       t = asinr5625 + p / q;
191*81418a27Smrg       if ((sign & 0x80000000) == 0)
192*81418a27Smrg 	return t;
193*81418a27Smrg       else
194*81418a27Smrg 	return -t;
195*81418a27Smrg     }
196*81418a27Smrg   else
197*81418a27Smrg     {
198*81418a27Smrg       /* 1 > |x| >= 0.625 */
199*81418a27Smrg       w = one - u.value;
200*81418a27Smrg       t = w * 0.5;
201*81418a27Smrg     }
202*81418a27Smrg 
203*81418a27Smrg   p = (((((((((pS9 * t
204*81418a27Smrg 	       + pS8) * t
205*81418a27Smrg 	      + pS7) * t
206*81418a27Smrg 	     + pS6) * t
207*81418a27Smrg 	    + pS5) * t
208*81418a27Smrg 	   + pS4) * t
209*81418a27Smrg 	  + pS3) * t
210*81418a27Smrg 	 + pS2) * t
211*81418a27Smrg 	+ pS1) * t
212*81418a27Smrg        + pS0) * t;
213*81418a27Smrg 
214*81418a27Smrg   q = (((((((( t
215*81418a27Smrg 	      + qS8) * t
216*81418a27Smrg 	     + qS7) * t
217*81418a27Smrg 	    + qS6) * t
218*81418a27Smrg 	   + qS5) * t
219*81418a27Smrg 	  + qS4) * t
220*81418a27Smrg 	 + qS3) * t
221*81418a27Smrg 	+ qS2) * t
222*81418a27Smrg        + qS1) * t
223*81418a27Smrg     + qS0;
224*81418a27Smrg 
225*81418a27Smrg   if (flag) /* 2^-57 < |x| < 0.5 */
226*81418a27Smrg     {
227*81418a27Smrg       w = p / q;
228*81418a27Smrg       return x + x * w;
229*81418a27Smrg     }
230*81418a27Smrg 
231*81418a27Smrg   s = sqrtq (t);
232*81418a27Smrg   if (ix >= 0x3ffef333) /* |x| > 0.975 */
233*81418a27Smrg     {
234*81418a27Smrg       w = p / q;
235*81418a27Smrg       t = pio2_hi - (2.0 * (s + s * w) - pio2_lo);
236*81418a27Smrg     }
237*81418a27Smrg   else
238*81418a27Smrg     {
239*81418a27Smrg       u.value = s;
240*81418a27Smrg       u.words32.w3 = 0;
241*81418a27Smrg       u.words32.w2 = 0;
242*81418a27Smrg       w = u.value;
243*81418a27Smrg       c = (t - w * w) / (s + w);
244*81418a27Smrg       r = p / q;
245*81418a27Smrg       p = 2.0 * s * r - (pio2_lo - 2.0 * c);
246*81418a27Smrg       q = pio4_hi - 2.0 * w;
247*81418a27Smrg       t = pio4_hi - (p - q);
248*81418a27Smrg     }
249*81418a27Smrg 
250*81418a27Smrg   if ((sign & 0x80000000) == 0)
251*81418a27Smrg     return t;
252*81418a27Smrg   else
253*81418a27Smrg     return -t;
254*81418a27Smrg }
255