/* xref: /freebsd/lib/msun/src/e_lgammaf_r.c (revision a4e4b355) */
/* e_lgammaf_r.c -- float version of e_lgamma_r.c.
 * Conversion to float by Ian Lance Taylor, Cygnus Support, ian@cygnus.com.
 * Conversion to float fixed by Steven G. Kargl.
 */
5 
/*
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 *
 * Developed at SunPro, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 */
16 
17 #include <sys/cdefs.h>
18 __FBSDID("$FreeBSD$");
19 
20 #include "math.h"
21 #include "math_private.h"
22 
/*
 * A zero that the compiler must load at run time.  It is used as the
 * divisor in `one/vzero' on the pole paths of __ieee754_lgammaf_r();
 * the volatile qualifier is presumably there so that the division is
 * actually performed (and can signal) instead of being constant-folded.
 */
static const volatile float vzero = 0;
24 
/*
 * Constants and minimax coefficients used by sin_pif() and
 * __ieee754_lgammaf_r().  The hexadecimal value in each trailing comment
 * is the float bit pattern the decimal literal is meant to round to.
 * The literals are deliberately left unsuffixed and unchanged.
 */
static const float
zero=  0,
half=  0.5,
one =  1,
pi  =  3.1415927410e+00, /* 0x40490fdb */
/*
 * Domain y in [0x1p-27, 0.27], range ~[-3.4599e-10, 3.4590e-10]:
 * |(lgamma(2 - y) + 0.5 * y) / y - a(y)| < 2**-31.4
 *
 * a(y) = a0 + a1*y + ... + a5*y**5; the code evaluates y*a(y) split
 * into even and odd parts (the "case 0" branch for x < 2).
 */
a0  =  7.72156641e-02, /* 0x3d9e233f */
a1  =  3.22467119e-01, /* 0x3ea51a69 */
a2  =  6.73484802e-02, /* 0x3d89ee00 */
a3  =  2.06395667e-02, /* 0x3ca9144f */
a4  =  6.98275631e-03, /* 0x3be4cf9b */
a5  =  4.11768444e-03, /* 0x3b86eda4 */
/*
 * Domain x in [tc-0.24, tc+0.28], range ~[-5.6577e-10, 5.5677e-10]:
 * |(lgamma(x) - tf) - t(x - tc)| < 2**-30.8.
 *
 * t(y) = t0 + t1*y + ... + t7*y**7 with y = x - tc (the "case 1"
 * branch for x < 2); tf is added back after the polynomial.
 */
tc  =  1.46163213e+00, /* 0x3fbb16c3 */
tf  = -1.21486291e-01, /* 0xbdf8cdce */
t0  = -2.94064460e-11, /* 0xae0154b7 */
t1  = -2.35939837e-08, /* 0xb2caabb8 */
t2  =  4.83836412e-01, /* 0x3ef7b968 */
t3  = -1.47586212e-01, /* 0xbe1720d7 */
t4  =  6.46013096e-02, /* 0x3d844db1 */
t5  = -3.28450352e-02, /* 0xbd068884 */
t6  =  1.86483748e-02, /* 0x3c98c47a */
t7  = -9.89206228e-03, /* 0xbc221251 */
/*
 * Domain y in [-0.1, 0.232], range ~[-8.4931e-10, 8.7794e-10]:
 * |(lgamma(1 + y) + 0.5 * y) / y - u(y) / v(y)| < 2**-31.2
 *
 * u(y) = u0 + u1*y + u2*y**2, v(y) = 1 + v1*y + v2*y**2 + v3*y**3
 * (the "case 2" branch for x < 2).
 */
u0  = -7.72156641e-02, /* 0xbd9e233f */
u1  =  7.36789703e-01, /* 0x3f3c9e40 */
u2  =  4.95649040e-01, /* 0x3efdc5b6 */
v1  =  1.10958421e+00, /* 0x3f8e06db */
v2  =  2.10598111e-01, /* 0x3e57a708 */
v3  = -1.02995494e-02, /* 0xbc28bf71 */
/*
 * Domain x in (2, 3], range ~[-5.5189e-11, 5.2317e-11]:
 * |(lgamma(y+2) - 0.5 * y) / y - s(y)/r(y)| < 2**-35.0
 * with y = x - 2.
 *
 * s(y) = s0 + s1*y + s2*y**2 + s3*y**3,
 * r(y) = 1 + r1*y + r2*y**2 + r3*y**3 (the 2 <= x < 8 branch, where y
 * is the fractional part of x).
 */
s0 = -7.72156641e-02, /* 0xbd9e233f */
s1 =  2.69987404e-01, /* 0x3e8a3bca */
s2 =  1.42851010e-01, /* 0x3e124789 */
s3 =  1.19389519e-02, /* 0x3c439b98 */
r1 =  6.79650068e-01, /* 0x3f2dfd8c */
r2 =  1.16058730e-01, /* 0x3dedb033 */
r3 =  3.75673687e-03, /* 0x3b763396 */
/*
 * Domain z in [8, 0x1p24], range ~[-1.2640e-09, 1.2640e-09]:
 * |lgamma(x) - (x - 0.5) * (log(x) - 1) - w(1/x)| < 2**-29.6.
 *
 * NOTE(review): the "z" in the domain line appears to denote the
 * lgamma argument x; the code evaluates w at 1/x as
 * w0 + w1/x + w2/x**3 (the 8 <= x < 2**27 branch).
 */
w0 =  4.18938547e-01, /* 0x3ed67f1d */
w1 =  8.33332464e-02, /* 0x3daaaa9f */
w2 = -2.76129087e-03; /* 0xbb34f6c6 */
83 
84 static float
85 sin_pif(float x)
86 {
87 	volatile float vz;
88 	float y,z;
89 	int n;
90 
91 	y = -x;
92 
93 	vz = y+0x1p23F;			/* depend on 0 <= y < 0x1p23 */
94 	z = vz-0x1p23F;			/* rintf(y) for the above range */
95 	if (z == y)
96 	    return zero;
97 
98 	vz = y+0x1p21F;
99 	GET_FLOAT_WORD(n,vz);		/* bits for rounded y (units 0.25) */
100 	z = vz-0x1p21F;			/* y rounded to a multiple of 0.25 */
101 	if (z > y) {
102 	    z -= 0.25F;			/* adjust to round down */
103 	    n--;
104 	}
105 	n &= 7;				/* octant of y mod 2 */
106 	y = y - z + n * 0.25F;		/* y mod 2 */
107 
108 	switch (n) {
109 	    case 0:   y =  __kernel_sindf(pi*y); break;
110 	    case 1:
111 	    case 2:   y =  __kernel_cosdf(pi*((float)0.5-y)); break;
112 	    case 3:
113 	    case 4:   y =  __kernel_sindf(pi*(one-y)); break;
114 	    case 5:
115 	    case 6:   y = -__kernel_cosdf(pi*(y-(float)1.5)); break;
116 	    default:  y =  __kernel_sindf(pi*(y-(float)2.0)); break;
117 	    }
118 	return -y;
119 }
120 
121 
122 float
123 __ieee754_lgammaf_r(float x, int *signgamp)
124 {
125 	float nadj,p,p1,p2,p3,q,r,t,w,y,z;
126 	int32_t hx;
127 	int i,ix;
128 
129 	GET_FLOAT_WORD(hx,x);
130 
131     /* purge +-Inf and NaNs */
132 	*signgamp = 1;
133 	ix = hx&0x7fffffff;
134 	if(ix>=0x7f800000) return x*x;
135 
136     /* purge +-0 and tiny arguments */
137 	*signgamp = 1-2*((uint32_t)hx>>31);
138 	if(ix<0x32000000) {		/* |x|<2**-27, return -log(|x|) */
139 	    if(ix==0)
140 	        return one/vzero;
141 	    return -__ieee754_logf(fabsf(x));
142 	}
143 
144     /* purge negative integers and start evaluation for other x < 0 */
145 	if(hx<0) {
146 	    *signgamp = 1;
147 	    if(ix>=0x4b000000) 		/* |x|>=2**23, must be -integer */
148 		return one/vzero;
149 	    t = sin_pif(x);
150 	    if(t==zero) return one/vzero; /* -integer */
151 	    nadj = __ieee754_logf(pi/fabsf(t*x));
152 	    if(t<zero) *signgamp = -1;
153 	    x = -x;
154 	}
155 
156     /* purge 1 and 2 */
157 	if (ix==0x3f800000||ix==0x40000000) r = 0;
158     /* for x < 2.0 */
159 	else if(ix<0x40000000) {
160 	    if(ix<=0x3f666666) { 	/* lgamma(x) = lgamma(x+1)-log(x) */
161 		r = -__ieee754_logf(x);
162 		if(ix>=0x3f3b4a20) {y = one-x; i= 0;}
163 		else if(ix>=0x3e6d3308) {y= x-(tc-one); i=1;}
164 	  	else {y = x; i=2;}
165 	    } else {
166 	  	r = zero;
167 	        if(ix>=0x3fdda618) {y=2-x;i=0;} /* [1.7316,2] */
168 	        else if(ix>=0x3F9da620) {y=x-tc;i=1;} /* [1.23,1.73] */
169 		else {y=x-one;i=2;}
170 	    }
171 	    switch(i) {
172 	      case 0:
173 		z = y*y;
174 		p1 = a0+z*(a2+z*a4);
175 		p2 = z*(a1+z*(a3+z*a5));
176 		p  = y*p1+p2;
177 		r  += p-y/2; break;
178 	      case 1:
179 		p = t0+y*t1+y*y*(t2+y*(t3+y*(t4+y*(t5+y*(t6+y*t7)))));
180 		r += tf + p; break;
181 	      case 2:
182 		p1 = y*(u0+y*(u1+y*u2));
183 		p2 = one+y*(v1+y*(v2+y*v3));
184 		r += p1/p2-y/2;
185 	    }
186 	}
187     /* x < 8.0 */
188 	else if(ix<0x41000000) {
189 	    i = x;
190 	    y = x-i;
191 	    p = y*(s0+y*(s1+y*(s2+y*s3)));
192 	    q = one+y*(r1+y*(r2+y*r3));
193 	    r = y/2+p/q;
194 	    z = one;	/* lgamma(1+s) = log(s) + lgamma(s) */
195 	    switch(i) {
196 	    case 7: z *= (y+6);		/* FALLTHRU */
197 	    case 6: z *= (y+5);		/* FALLTHRU */
198 	    case 5: z *= (y+4);		/* FALLTHRU */
199 	    case 4: z *= (y+3);		/* FALLTHRU */
200 	    case 3: z *= (y+2);		/* FALLTHRU */
201 		    r += __ieee754_logf(z); break;
202 	    }
203     /* 8.0 <= x < 2**27 */
204 	} else if (ix < 0x4d000000) {
205 	    t = __ieee754_logf(x);
206 	    z = one/x;
207 	    y = z*z;
208 	    w = w0+z*(w1+y*w2);
209 	    r = (x-half)*(t-one)+w;
210 	} else
211     /* 2**27 <= x <= inf */
212 	    r =  x*(__ieee754_logf(x)-one);
213 	if(hx<0) r = nadj - r;
214 	return r;
215 }
216