e_lgamma_r.c source code [glibc/sysdeps/ieee754/dbl-64/e_lgamma_r.c]

1	/ @(#)er_lgamma.c 5.1 93/09/24 /
2	/*
3	* ====================================================
4	* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
5	*
6	* Developed at SunPro, a Sun Microsystems, Inc. business.
7	* Permission to use, copy, modify, and distribute this
8	* software is freely granted, provided that this notice
9	* is preserved.
10	* ====================================================
11	*/
12
13	/ __ieee754_lgamma_r(x, signgamp)*
14	* Reentrant version of the logarithm of the Gamma function
15	* with user provide pointer for the sign of Gamma(x).
16	*
17	* Method:
18	* 1. Argument Reduction for 0 < x <= 8
19	* Since gamma(1+s)=s*gamma(s), for x in [0,8], we may
20	* reduce x to a number in [1.5,2.5] by
21	* lgamma(1+s) = log(s) + lgamma(s)
22	* for example,
23	* lgamma(7.3) = log(6.3) + lgamma(6.3)
24	* = log(6.3*5.3) + lgamma(5.3)
25	* = log(6.35.34.33.32.3) + lgamma(2.3)
26	* 2. Polynomial approximation of lgamma around its
27	* minimun ymin=1.461632144968362245 to maintain monotonicity.
28	* On [ymin-0.23, ymin+0.27] (i.e., [1.23164,1.73163]), use
29	* Let z = x-ymin;
30	* lgamma(x) = -1.214862905358496078218 + z^2*poly(z)
31	* where
32	* poly(z) is a 14 degree polynomial.
33	* 2. Rational approximation in the primary interval [2,3]
34	* We use the following approximation:
35	* s = x-2.0;
36	* lgamma(x) = 0.5s + sP(s)/Q(s)
37	* with accuracy
38	* \|P/Q - (lgamma(x)-0.5s)\| < 2**-61.71
39	* Our algorithms are based on the following observation
40	*
41	* zeta(2)-1 2 zeta(3)-1 3
42	* lgamma(2+s) = s(1-Euler) + --------- s - --------- * s + ...
43	* 2 3
44	*
45	* where Euler = 0.5771... is the Euler constant, which is very
46	* close to 0.5.
47	*
48	* 3. For x>=8, we have
49	* lgamma(x)~(x-0.5)log(x)-x+0.5log(2pi)+1/(12x)-1/(360x*3)+....
50	* (better formula:
51	* lgamma(x)~(x-0.5)(log(x)-1)-.5(log(2pi)-1) + ...)
52	* Let z = 1/x, then we approximation
53	* f(z) = lgamma(x) - (x-0.5)(log(x)-1)
54	* by
55	* 3 5 11
56	* w = w0 + w1z + w2z + w3z + ... + w6z
57	* where
58	* \|w - f(z)\| < 2**-58.74
59	*
60	* 4. For negative x, since (G is gamma function)
61	* -xG(-x)G(x) = pi/sin(pi*x),
62	* we have
63	* G(x) = pi/(sin(pix)(-x)*G(-x))
64	* since G(-x) is positive, sign(G(x)) = sign(sin(pi*x)) for x<0
65	* Hence, for x<0, signgam = sign(sin(pi*x)) and
66	* lgamma(x) = log(\|Gamma(x)\|)
67	* = log(pi/(\|xsin(pix)\|)) - lgamma(-x);
68	* Note: one should avoid compute pi*(-x) directly in the
69	* computation of sin(pi*(-x)).
70	*
71	* 5. Special Cases
72	* lgamma(2+s) ~ s*(1-Euler) for tiny s
73	* lgamma(1)=lgamma(2)=0
74	* lgamma(x) ~ -log(x) for tiny x
75	* lgamma(0) = lgamma(inf) = inf
76	* lgamma(-integer) = +-inf
77	*
78	*/
79
80	#include <math.h>
81	#include <math-narrow-eval.h>
82	#include <math_private.h>
83	#include <libc-diag.h>
84
85	static const double
86	two52= `4.50359962737049600000e+15`, / 0x43300000, 0x00000000 /
87	half= `5.00000000000000000000e-01`, / 0x3FE00000, 0x00000000 /
88	one = `1.00000000000000000000e+00`, / 0x3FF00000, 0x00000000 /
89	pi = `3.14159265358979311600e+00`, / 0x400921FB, 0x54442D18 /
90	a0 = `7.72156649015328655494e-02`, / 0x3FB3C467, 0xE37DB0C8 /
91	a1 = `3.22467033424113591611e-01`, / 0x3FD4A34C, 0xC4A60FAD /
92	a2 = `6.73523010531292681824e-02`, / 0x3FB13E00, 0x1A5562A7 /
93	a3 = `2.05808084325167332806e-02`, / 0x3F951322, 0xAC92547B /
94	a4 = `7.38555086081402883957e-03`, / 0x3F7E404F, 0xB68FEFE8 /
95	a5 = `2.89051383673415629091e-03`, / 0x3F67ADD8, 0xCCB7926B /
96	a6 = `1.19270763183362067845e-03`, / 0x3F538A94, 0x116F3F5D /
97	a7 = `5.10069792153511336608e-04`, / 0x3F40B6C6, 0x89B99C00 /
98	a8 = `2.20862790713908385557e-04`, / 0x3F2CF2EC, 0xED10E54D /
99	a9 = `1.08011567247583939954e-04`, / 0x3F1C5088, 0x987DFB07 /
100	a10 = `2.52144565451257326939e-05`, / 0x3EFA7074, 0x428CFA52 /
101	a11 = `4.48640949618915160150e-05`, / 0x3F07858E, 0x90A45837 /
102	tc = `1.46163214496836224576e+00`, / 0x3FF762D8, 0x6356BE3F /
103	tf = -`1.21486290535849611461e-01`, / 0xBFBF19B9, 0xBCC38A42 /
104	/ tt = -(tail of tf) /
105	tt = -`3.63867699703950536541e-18`, / 0xBC50C7CA, 0xA48A971F /
106	t0 = `4.83836122723810047042e-01`, / 0x3FDEF72B, 0xC8EE38A2 /
107	t1 = -`1.47587722994593911752e-01`, / 0xBFC2E427, 0x8DC6C509 /
108	t2 = `6.46249402391333854778e-02`, / 0x3FB08B42, 0x94D5419B /
109	t3 = -`3.27885410759859649565e-02`, / 0xBFA0C9A8, 0xDF35B713 /
110	t4 = `1.79706750811820387126e-02`, / 0x3F9266E7, 0x970AF9EC /
111	t5 = -`1.03142241298341437450e-02`, / 0xBF851F9F, 0xBA91EC6A /
112	t6 = `6.10053870246291332635e-03`, / 0x3F78FCE0, 0xE370E344 /
113	t7 = -`3.68452016781138256760e-03`, / 0xBF6E2EFF, 0xB3E914D7 /
114	t8 = `2.25964780900612472250e-03`, / 0x3F6282D3, 0x2E15C915 /
115	t9 = -`1.40346469989232843813e-03`, / 0xBF56FE8E, 0xBF2D1AF1 /
116	t10 = `8.81081882437654011382e-04`, / 0x3F4CDF0C, 0xEF61A8E9 /
117	t11 = -`5.38595305356740546715e-04`, / 0xBF41A610, 0x9C73E0EC /
118	t12 = `3.15632070903625950361e-04`, / 0x3F34AF6D, 0x6C0EBBF7 /
119	t13 = -`3.12754168375120860518e-04`, / 0xBF347F24, 0xECC38C38 /
120	t14 = `3.35529192635519073543e-04`, / 0x3F35FD3E, 0xE8C2D3F4 /
121	u0 = -`7.72156649015328655494e-02`, / 0xBFB3C467, 0xE37DB0C8 /
122	u1 = `6.32827064025093366517e-01`, / 0x3FE4401E, 0x8B005DFF /
123	u2 = `1.45492250137234768737e+00`, / 0x3FF7475C, 0xD119BD6F /
124	u3 = `9.77717527963372745603e-01`, / 0x3FEF4976, 0x44EA8450 /
125	u4 = `2.28963728064692451092e-01`, / 0x3FCD4EAE, 0xF6010924 /
126	u5 = `1.33810918536787660377e-02`, / 0x3F8B678B, 0xBF2BAB09 /
127	v1 = `2.45597793713041134822e+00`, / 0x4003A5D7, 0xC2BD619C /
128	v2 = `2.12848976379893395361e+00`, / 0x40010725, 0xA42B18F5 /
129	v3 = `7.69285150456672783825e-01`, / 0x3FE89DFB, 0xE45050AF /
130	v4 = `1.04222645593369134254e-01`, / 0x3FBAAE55, 0xD6537C88 /
131	v5 = `3.21709242282423911810e-03`, / 0x3F6A5ABB, 0x57D0CF61 /
132	s0 = -`7.72156649015328655494e-02`, / 0xBFB3C467, 0xE37DB0C8 /
133	s1 = `2.14982415960608852501e-01`, / 0x3FCB848B, 0x36E20878 /
134	s2 = `3.25778796408930981787e-01`, / 0x3FD4D98F, 0x4F139F59 /
135	s3 = `1.46350472652464452805e-01`, / 0x3FC2BB9C, 0xBEE5F2F7 /
136	s4 = `2.66422703033638609560e-02`, / 0x3F9B481C, 0x7E939961 /
137	s5 = `1.84028451407337715652e-03`, / 0x3F5E26B6, 0x7368F239 /
138	s6 = `3.19475326584100867617e-05`, / 0x3F00BFEC, 0xDD17E945 /
139	r1 = `1.39200533467621045958e+00`, / 0x3FF645A7, 0x62C4AB74 /
140	r2 = `7.21935547567138069525e-01`, / 0x3FE71A18, 0x93D3DCDC /
141	r3 = `1.71933865632803078993e-01`, / 0x3FC601ED, 0xCCFBDF27 /
142	r4 = `1.86459191715652901344e-02`, / 0x3F9317EA, 0x742ED475 /
143	r5 = `7.77942496381893596434e-04`, / 0x3F497DDA, 0xCA41A95B /
144	r6 = `7.32668430744625636189e-06`, / 0x3EDEBAF7, 0xA5B38140 /
145	w0 = `4.18938533204672725052e-01`, / 0x3FDACFE3, 0x90C97D69 /
146	w1 = `8.33333333333329678849e-02`, / 0x3FB55555, 0x5555553B /
147	w2 = -`2.77777777728775536470e-03`, / 0xBF66C16C, 0x16B02E5C /
148	w3 = `7.93650558643019558500e-04`, / 0x3F4A019F, 0x98CF38B6 /
149	w4 = -`5.95187557450339963135e-04`, / 0xBF4380CB, 0x8C0FE741 /
150	w5 = `8.36339918996282139126e-04`, / 0x3F4B67BA, 0x4CDAD5D1 /
151	w6 = -`1.63092934096575273989e-03`; / 0xBF5AB89D, 0x0B9E43E4 /
152
153	static const double zero= `0.00000000000000000000e+00`;
154
155	static double
156	sin_pi(double x)
157	{
158	double y,z;
159	int n,ix;
160
161	GET_HIGH_WORD(ix,x);
162	ix &= `0x7fffffff`;
163
164	if(ix<`0x3fd00000`) return __sin(pi*x);
165	y = -x; / x is assume negative /
166
167	/*
168	* argument reduction, make sure inexact flag not raised if input
169	* is an integer
170	*/
171	z = __floor(y);
172	if(z!=y) { / inexact anyway /
173	y *= `0.5`;
174	y = `2.0`(y - __floor(y)); /* y = \|x\| mod 2.0 /
175	n = (int) (y*`4.0`);
176	} else {
177	if(ix>=`0x43400000`) {
178	y = zero; n = `0`; / y must be even /
179	} else {
180	if(ix<`0x43300000`) z = y+two52; / exact /
181	GET_LOW_WORD(n,z);
182	n &= `1`;
183	y = n;
184	n<<= `2`;
185	}
186	}
187	switch (n) {
188	case `0`: y = __sin(piy); break*;
189	case `1`:
190	case `2`: y = __cos(pi(`0.5`-y)); break*;
191	case `3`:
192	case `4`: y = __sin(pi(one-y)); break*;
193	case `5`:
194	case `6`: y = -__cos(pi(y-`1.5`)); break*;
195	default: y = __sin(pi(y-`2.0`)); break*;
196	}
197	return -y;
198	}
199
200
201	double
202	__ieee754_lgamma_r(double x, int *signgamp)
203	{
204	double t,y,z,nadj,p,p1,p2,p3,q,r,w;
205	int i,hx,lx,ix;
206
207	EXTRACT_WORDS(hx,lx,x);
208
209	/ purge off +-inf, NaN, +-0, and negative arguments /
210	*signgamp = `1`;
211	ix = hx&`0x7fffffff`;
212	if(__builtin_expect(ix>=`0x7ff00000`, `0`)) return x*x;
213	if(__builtin_expect((ix\|lx)==`0`, `0`))
214	{
215	if (hx < `0`)
216	*signgamp = -`1`;
217	return one/fabs(x);
218	}
219	if(__builtin_expect(ix<`0x3b900000`, `0`)) {
220	/ \|x\|<2*-70, return -log(\|x\|) /*
221	if(hx<`0`) {
222	*signgamp = -`1`;
223	return -__ieee754_log(-x);
224	} else return -__ieee754_log(x);
225	}
226	if(hx<`0`) {
227	if(__builtin_expect(ix>=`0x43300000`, `0`))
228	/ \|x\|>=2*52, must be -integer /*
229	return fabs (x)/zero;
230	if (x < -`2.0` && x > -`28.0`)
231	return __lgamma_neg (x, signgamp);
232	t = sin_pi(x);
233	if(t==zero) return one/fabsf(t); / -integer /
234	nadj = __ieee754_log(pi/fabs(t*x));
235	if(t<zero) *signgamp = -`1`;
236	x = -x;
237	}
238
239	/ purge off 1 and 2 /
240	if((((ix-`0x3ff00000`)\|lx)==`0`)\|\|(((ix-`0x40000000`)\|lx)==`0`)) r = `0`;
241	/ for x < 2.0 /
242	else if(ix<`0x40000000`) {
243	if(ix<=`0x3feccccc`) { / lgamma(x) = lgamma(x+1)-log(x) /
244	r = -__ieee754_log(x);
245	if(ix>=`0x3FE76944`) {y = one-x; i= `0`;}
246	else if(ix>=`0x3FCDA661`) {y= x-(tc-one); i=`1`;}
247	else {y = x; i=`2`;}
248	} else {
249	r = zero;
250	if(ix>=`0x3FFBB4C3`) {y=`2.0`-x;i=`0`;} / [1.7316,2] /
251	else if(ix>=`0x3FF3B4C4`) {y=x-tc;i=`1`;} / [1.23,1.73] /
252	else {y=x-one;i=`2`;}
253	}
254	switch(i) {
255	case `0`:
256	z = y*y;
257	p1 = a0+z(a2+z(a4+z(a6+z(a8+z*a10))));
258	p2 = z(a1+z(a3+z(a5+z(a7+z(a9+za11)))));
259	p = y*p1+p2;
260	r += (p-`0.5`y); break*;
261	case `1`:
262	z = y*y;
263	w = z*y;
264	p1 = t0+w(t3+w(t6+w(t9 +wt12))); / parallel comp /
265	p2 = t1+w(t4+w(t7+w(t10+wt13)));
266	p3 = t2+w(t5+w(t8+w(t11+wt14)));
267	p = zp1-(tt-w(p2+y*p3));
268	r += (tf + p); break;
269	case `2`:
270	p1 = y(u0+y(u1+y(u2+y(u3+y(u4+yu5)))));
271	p2 = one+y(v1+y(v2+y(v3+y(v4+y*v5))));
272	r += (-`0.5`*y + p1/p2);
273	}
274	}
275	else if(ix<`0x40200000`) { / x < 8.0 /
276	i = (int)x;
277	t = zero;
278	y = x-(double)i;
279	p = y(s0+y(s1+y(s2+y(s3+y(s4+y(s5+y*s6))))));
280	q = one+y(r1+y(r2+y(r3+y(r4+y(r5+yr6)))));
281	r = half*y+p/q;
282	z = one; / lgamma(1+s) = log(s) + lgamma(s) /
283	switch(i) {
284	case `7`: z = (y+`6.0`); /* FALLTHRU /
285	case `6`: z = (y+`5.0`); /* FALLTHRU /
286	case `5`: z = (y+`4.0`); /* FALLTHRU /
287	case `4`: z = (y+`3.0`); /* FALLTHRU /
288	case `3`: z = (y+`2.0`); /* FALLTHRU /
289	r += __ieee754_log(z); break;
290	}
291	/ 8.0 <= x < 2*58 /*
292	} else if (ix < `0x43900000`) {
293	t = __ieee754_log(x);
294	z = one/x;
295	y = z*z;
296	w = w0+z(w1+y(w2+y(w3+y(w4+y(w5+yw6)))));
297	r = (x-half)*(t-one)+w;
298	} else
299	/ 2*58 <= x <= inf /*
300	r = math_narrow_eval (x*(__ieee754_log(x)-one));
301	/ NADJ is set for negative arguments but not otherwise,*
302	resulting in warnings that it may be used uninitialized
303	although in the cases where it is used it has always been
304	set. /*
305	DIAG_PUSH_NEEDS_COMMENT;
306	DIAG_IGNORE_NEEDS_COMMENT (`4.9`, "-Wmaybe-uninitialized");
307	if(hx<`0`) r = nadj - r;
308	DIAG_POP_NEEDS_COMMENT;
309	return r;
310	}
311	strong_alias (__ieee754_lgamma_r, __lgamma_r_finite)
312

Browse the source code of glibc/sysdeps/ieee754/dbl-64/e_lgamma_r.c