e_lgammal_r.c source code [glibc_src_2.27/sysdeps/ieee754/ldbl-96/e_lgammal_r.c]

1	/*
2	* ====================================================
3	* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
4	*
5	* Developed at SunPro, a Sun Microsystems, Inc. business.
6	* Permission to use, copy, modify, and distribute this
7	* software is freely granted, provided that this notice
8	* is preserved.
9	* ====================================================
10	*/
11
12	/* Long double expansions are
13	Copyright (C) 2001 Stephen L. Moshier <moshier@na-net.ornl.gov>
14	and are incorporated herein by permission of the author. The author
15	reserves the right to distribute this material elsewhere under different
16	copying permissions. These modifications are distributed here under
17	the following terms:
18
19	This library is free software; you can redistribute it and/or
20	modify it under the terms of the GNU Lesser General Public
21	License as published by the Free Software Foundation; either
22	version 2.1 of the License, or (at your option) any later version.
23
24	This library is distributed in the hope that it will be useful,
25	but WITHOUT ANY WARRANTY; without even the implied warranty of
26	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
27	Lesser General Public License for more details.
28
29	You should have received a copy of the GNU Lesser General Public
30	License along with this library; if not, see
31	<http://www.gnu.org/licenses/>.  */
32
33	/* __ieee754_lgammal_r(x, signgamp)
34	* Reentrant version of the logarithm of the Gamma function
35	* with a user-provided pointer for the sign of Gamma(x).
36	*
37	* Method:
38	* 1. Argument Reduction for 0 < x <= 8
39	* Since gamma(1+s)=s*gamma(s), for x in [0,8], we may
40	* reduce x to a number in [1.5,2.5] by
41	* lgamma(1+s) = log(s) + lgamma(s)
42	* for example,
43	* lgamma(7.3) = log(6.3) + lgamma(6.3)
44	* = log(6.3*5.3) + lgamma(5.3)
45	* = log(6.3*5.3*4.3*3.3*2.3) + lgamma(2.3)
46	* 2. Polynomial approximation of lgamma around its
47	* minimum ymin=1.461632144968362245 to maintain monotonicity.
48	* On [ymin-0.23, ymin+0.27] (i.e., [1.23164,1.73163]), use
49	* Let z = x-ymin;
50	* lgamma(x) = -1.214862905358496078218 + z^2*poly(z)
51	* 2. Rational approximation in the primary interval [2,3]
52	* We use the following approximation:
53	* s = x-2.0;
54	* lgamma(x) = 0.5*s + s*P(s)/Q(s)
55	* Our algorithms are based on the following observation
56	*
57	*
58	* lgamma(2+s) = s*(1-Euler) + (zeta(2)-1)/2 * s^2 - (zeta(3)-1)/3 * s^3 + ...
59	*
60	*
61	* where Euler = 0.5771... is the Euler constant, which is very
62	* close to 0.5.
63	*
64	* 3. For x>=8, we have
65	* lgamma(x)~(x-0.5)*log(x)-x+0.5*log(2*pi)+1/(12*x)-1/(360*x^3)+....
66	* (better formula:
67	* lgamma(x)~(x-0.5)*(log(x)-1)+0.5*(log(2*pi)-1) + ...)
68	* Let z = 1/x, then we approximate
69	* f(z) = lgamma(x) - (x-0.5)*(log(x)-1)
70	* by
71	*
72	* w = w0 + w1*z + w2*z^3 + w3*z^5 + ... + w7*z^13
71	* 3 5 11
72	* w = w0 + w1z + w2z + w3z + ... + w6z
73	*
74	* 4. For negative x, since (G is gamma function)
75	* -x*G(-x)*G(x) = pi/sin(pi*x),
76	* we have
77	* G(x) = pi/(sin(pi*x)*(-x)*G(-x))
78	* since G(-x) is positive, sign(G(x)) = sign(sin(pi*x)) for x<0
79	* Hence, for x<0, signgam = sign(sin(pi*x)) and
80	* lgamma(x) = log(|Gamma(x)|)
81	* = log(pi/(|x*sin(pi*x)|)) - lgamma(-x);
82	* Note: one should avoid compute pi*(-x) directly in the
83	* computation of sin(pi*(-x)).
84	*
85	* 5. Special Cases
86	* lgamma(2+s) ~ s*(1-Euler) for tiny s
87	* lgamma(1)=lgamma(2)=0
88	* lgamma(x) ~ -log(x) for tiny x
89	* lgamma(0) = lgamma(inf) = inf
90	* lgamma(-integer) = +-inf
91	*
92	*/
93
94	#include <math.h>
95	#include <math_private.h>
96	#include <libc-diag.h>
97
/* Constants and rational-approximation coefficients used by
   __ieee754_lgammal_r and sin_pi.  All are long double except TF,
   which is deliberately a double-precision literal; TT carries its
   low-order tail.  */
static const long double
  half = 0.5L,
  one = 1.0L,
  pi = 3.14159265358979323846264L,
  two63 = 9.223372036854775808e18L,

  /* lgam(1+x) = 0.5 x + x a(x)/b(x)
     -0.268402099609375 <= x <= 0
     peak relative error 6.6e-22 */
  a0 = -6.343246574721079391729402781192128239938E2L,
  a1 =  1.856560238672465796768677717168371401378E3L,
  a2 =  2.404733102163746263689288466865843408429E3L,
  a3 =  8.804188795790383497379532868917517596322E2L,
  a4 =  1.135361354097447729740103745999661157426E2L,
  a5 =  3.766956539107615557608581581190400021285E0L,

  b0 =  8.214973713960928795704317259806842490498E3L,
  b1 =  1.026343508841367384879065363925870888012E4L,
  b2 =  4.553337477045763320522762343132210919277E3L,
  b3 =  8.506975785032585797446253359230031874803E2L,
  b4 =  6.042447899703295436820744186992189445813E1L,
  /* b5 =  1.000000000000000000000000000000000000000E0 */


  tc =  1.4616321449683623412626595423257213284682E0L,
  tf = -1.2148629053584961146050602565082954242826E-1, /* double precision */
  /* tt = (tail of tf), i.e. tf + tt has extended precision. */
  tt =  3.3649914684731379602768989080467587736363E-18L,
  /* lgam ( 1.4616321449683623412626595423257213284682E0 ) =
     -1.2148629053584960809551455717769158215135617312999903886372437313313530E-1 */

  /* lgam (x + tc) = tf + tt + x g(x)/h(x)
     -0.230003726999612341262659542325721328468 <= x
     <= 0.2699962730003876587373404576742786715318
     peak relative error 2.1e-21 */
  g0 = 3.645529916721223331888305293534095553827E-18L,
  g1 = 5.126654642791082497002594216163574795690E3L,
  g2 = 8.828603575854624811911631336122070070327E3L,
  g3 = 5.464186426932117031234820886525701595203E3L,
  g4 = 1.455427403530884193180776558102868592293E3L,
  g5 = 1.541735456969245924860307497029155838446E2L,
  g6 = 4.335498275274822298341872707453445815118E0L,

  h0 = 1.059584930106085509696730443974495979641E4L,
  h1 = 2.147921653490043010629481226937850618860E4L,
  h2 = 1.643014770044524804175197151958100656728E4L,
  h3 = 5.869021995186925517228323497501767586078E3L,
  h4 = 9.764244777714344488787381271643502742293E2L,
  h5 = 6.442485441570592541741092969581997002349E1L,
  /* h6 = 1.000000000000000000000000000000000000000E0 */


  /* lgam (x+1) = -0.5 x + x u(x)/v(x)
     -0.100006103515625 <= x <= 0.231639862060546875
     peak relative error 1.3e-21 */
  u0 = -8.886217500092090678492242071879342025627E1L,
  u1 =  6.840109978129177639438792958320783599310E2L,
  u2 =  2.042626104514127267855588786511809932433E3L,
  u3 =  1.911723903442667422201651063009856064275E3L,
  u4 =  7.447065275665887457628865263491667767695E2L,
  u5 =  1.132256494121790736268471016493103952637E2L,
  u6 =  4.484398885516614191003094714505960972894E0L,

  v0 =  1.150830924194461522996462401210374632929E3L,
  v1 =  3.399692260848747447377972081399737098610E3L,
  v2 =  3.786631705644460255229513563657226008015E3L,
  v3 =  1.966450123004478374557778781564114347876E3L,
  v4 =  4.741359068914069299837355438370682773122E2L,
  v5 =  4.508989649747184050907206782117647852364E1L,
  /* v6 =  1.000000000000000000000000000000000000000E0 */


  /* lgam (x+2) = .5 x + x s(x)/r(x)
     0 <= x <= 1
     peak relative error 7.2e-22 */
  s0 =  1.454726263410661942989109455292824853344E6L,
  s1 = -3.901428390086348447890408306153378922752E6L,
  s2 = -6.573568698209374121847873064292963089438E6L,
  s3 = -3.319055881485044417245964508099095984643E6L,
  s4 = -7.094891568758439227560184618114707107977E5L,
  s5 = -6.263426646464505837422314539808112478303E4L,
  s6 = -1.684926520999477529949915657519454051529E3L,

  r0 = -1.883978160734303518163008696712983134698E7L,
  r1 = -2.815206082812062064902202753264922306830E7L,
  r2 = -1.600245495251915899081846093343626358398E7L,
  r3 = -4.310526301881305003489257052083370058799E6L,
  r4 = -5.563807682263923279438235987186184968542E5L,
  r5 = -3.027734654434169996032905158145259713083E4L,
  r6 = -4.501995652861105629217250715790764371267E2L,
  /* r7 =  1.000000000000000000000000000000000000000E0 */


  /* lgam(x) = ( x - 0.5 ) * log(x) - x + LS2PI + 1/x w(1/x^2)
     x >= 8
     Peak relative error 1.51e-21
     w0 = LS2PI - 0.5 */
  w0 =  4.189385332046727417803e-1L,
  w1 =  8.333333333333331447505E-2L,
  w2 = -2.777777777750349603440E-3L,
  w3 =  7.936507795855070755671E-4L,
  w4 = -5.952345851765688514613E-4L,
  w5 =  8.412723297322498080632E-4L,
  w6 = -1.880801938119376907179E-3L,
  w7 =  4.885026142432270781165E-3L;
203
/* Named zero, used for comparisons and as an exact-zero result.  */
static const long double zero = 0.0L;
205
206	static long double
207	sin_pi (long double x)
208	{
209	long double y, z;
210	int n, ix;
211	uint32_t se, i0, i1;
212
213	GET_LDOUBLE_WORDS (se, i0, i1, x);
214	ix = se & `0x7fff`;
215	ix = (ix << `16`) \| (i0 >> `16`);
216	if (ix < `0x3ffd8000`) / 0.25 /
217	return __sinl (pi * x);
218	y = -x; / x is assume negative /
219
220	/*
221	* argument reduction, make sure inexact flag not raised if input
222	* is an integer
223	*/
224	z = __floorl (y);
225	if (z != y)
226	{ / inexact anyway /
227	y *= `0.5`;
228	y = `2.0`(y - __floorl(y)); /* y = \|x\| mod 2.0 /
229	n = (int) (y*`4.0`);
230	}
231	else
232	{
233	if (ix >= `0x403f8000`) / 2^64 /
234	{
235	y = zero; n = `0`; / y must be even /
236	}
237	else
238	{
239	if (ix < `0x403e8000`) / 2^63 /
240	z = y + two63; / exact /
241	GET_LDOUBLE_WORDS (se, i0, i1, z);
242	n = i1 & `1`;
243	y = n;
244	n <<= `2`;
245	}
246	}
247
248	switch (n)
249	{
250	case `0`:
251	y = __sinl (pi * y);
252	break;
253	case `1`:
254	case `2`:
255	y = __cosl (pi * (half - y));
256	break;
257	case `3`:
258	case `4`:
259	y = __sinl (pi * (one - y));
260	break;
261	case `5`:
262	case `6`:
263	y = -__cosl (pi * (y - `1.5`));
264	break;
265	default:
266	y = __sinl (pi * (y - `2.0`));
267	break;
268	}
269	return -y;
270	}
271
272
273	long double
274	__ieee754_lgammal_r (long double x, int *signgamp)
275	{
276	long double t, y, z, nadj, p, p1, p2, q, r, w;
277	int i, ix;
278	uint32_t se, i0, i1;
279
280	*signgamp = `1`;
281	GET_LDOUBLE_WORDS (se, i0, i1, x);
282	ix = se & `0x7fff`;
283
284	if (__builtin_expect((ix \| i0 \| i1) == `0`, `0`))
285	{
286	if (se & `0x8000`)
287	*signgamp = -`1`;
288	return one / fabsl (x);
289	}
290
291	ix = (ix << `16`) \| (i0 >> `16`);
292
293	/ purge off +-inf, NaN, +-0, and negative arguments /
294	if (__builtin_expect(ix >= `0x7fff0000`, `0`))
295	return x * x;
296
297	if (__builtin_expect(ix < `0x3fc08000`, `0`)) / 2^-63 /
298	{ / \|x\|<2*-63, return -log(\|x\|) /*
299	if (se & `0x8000`)
300	{
301	*signgamp = -`1`;
302	return -__ieee754_logl (-x);
303	}
304	else
305	return -__ieee754_logl (x);
306	}
307	if (se & `0x8000`)
308	{
309	if (x < -`2.0L` && x > -`33.0L`)
310	return __lgamma_negl (x, signgamp);
311	t = sin_pi (x);
312	if (t == zero)
313	return one / fabsl (t); / -integer /
314	nadj = __ieee754_logl (pi / fabsl (t * x));
315	if (t < zero)
316	*signgamp = -`1`;
317	x = -x;
318	}
319
320	/ purge off 1 and 2 /
321	if ((((ix - `0x3fff8000`) \| i0 \| i1) == `0`)
322	\|\| (((ix - `0x40008000`) \| i0 \| i1) == `0`))
323	r = `0`;
324	else if (ix < `0x40008000`) / 2.0 /
325	{
326	/ x < 2.0 /
327	if (ix <= `0x3ffee666`) / 8.99993896484375e-1 /
328	{
329	/ lgamma(x) = lgamma(x+1) - log(x) /
330	r = -__ieee754_logl (x);
331	if (ix >= `0x3ffebb4a`) / 7.31597900390625e-1 /
332	{
333	y = x - one;
334	i = `0`;
335	}
336	else if (ix >= `0x3ffced33`)/ 2.31639862060546875e-1 /
337	{
338	y = x - (tc - one);
339	i = `1`;
340	}
341	else
342	{
343	/ x < 0.23 /
344	y = x;
345	i = `2`;
346	}
347	}
348	else
349	{
350	r = zero;
351	if (ix >= `0x3fffdda6`) / 1.73162841796875 /
352	{
353	/ [1.7316,2] /
354	y = x - `2.0`;
355	i = `0`;
356	}
357	else if (ix >= `0x3fff9da6`)/ 1.23162841796875 /
358	{
359	/ [1.23,1.73] /
360	y = x - tc;
361	i = `1`;
362	}
363	else
364	{
365	/ [0.9, 1.23] /
366	y = x - one;
367	i = `2`;
368	}
369	}
370	switch (i)
371	{
372	case `0`:
373	p1 = a0 + y * (a1 + y * (a2 + y * (a3 + y * (a4 + y * a5))));
374	p2 = b0 + y * (b1 + y * (b2 + y * (b3 + y * (b4 + y))));
375	r += half * y + y * p1/p2;
376	break;
377	case `1`:
378	p1 = g0 + y * (g1 + y * (g2 + y * (g3 + y * (g4 + y * (g5 + y * g6)))));
379	p2 = h0 + y * (h1 + y * (h2 + y * (h3 + y * (h4 + y * (h5 + y)))));
380	p = tt + y * p1/p2;
381	r += (tf + p);
382	break;
383	case `2`:
384	p1 = y * (u0 + y * (u1 + y * (u2 + y * (u3 + y * (u4 + y * (u5 + y * u6))))));
385	p2 = v0 + y * (v1 + y * (v2 + y * (v3 + y * (v4 + y * (v5 + y)))));
386	r += (-half * y + p1 / p2);
387	}
388	}
389	else if (ix < `0x40028000`) / 8.0 /
390	{
391	/ x < 8.0 /
392	i = (int) x;
393	t = zero;
394	y = x - (double) i;
395	p = y *
396	(s0 + y * (s1 + y * (s2 + y * (s3 + y * (s4 + y * (s5 + y * s6))))));
397	q = r0 + y * (r1 + y * (r2 + y * (r3 + y * (r4 + y * (r5 + y * (r6 + y))))));
398	r = half * y + p / q;
399	z = one; / lgamma(1+s) = log(s) + lgamma(s) /
400	switch (i)
401	{
402	case `7`:
403	z = (y + `6.0`); /* FALLTHRU /
404	case `6`:
405	z = (y + `5.0`); /* FALLTHRU /
406	case `5`:
407	z = (y + `4.0`); /* FALLTHRU /
408	case `4`:
409	z = (y + `3.0`); /* FALLTHRU /
410	case `3`:
411	z = (y + `2.0`); /* FALLTHRU /
412	r += __ieee754_logl (z);
413	break;
414	}
415	}
416	else if (ix < `0x40418000`) / 2^66 /
417	{
418	/ 8.0 <= x < 2*66 /*
419	t = __ieee754_logl (x);
420	z = one / x;
421	y = z * z;
422	w = w0 + z * (w1
423	+ y * (w2 + y * (w3 + y * (w4 + y * (w5 + y * (w6 + y * w7))))));
424	r = (x - half) * (t - one) + w;
425	}
426	else
427	/ 2*66 <= x <= inf /*
428	r = x * (__ieee754_logl (x) - one);
429	/ NADJ is set for negative arguments but not otherwise, resulting*
430	in warnings that it may be used uninitialized although in the
431	cases where it is used it has always been set. /*
432	DIAG_PUSH_NEEDS_COMMENT;
433	DIAG_IGNORE_NEEDS_COMMENT (`4.9`, "-Wmaybe-uninitialized");
434	if (se & `0x8000`)
435	r = nadj - r;
436	DIAG_POP_NEEDS_COMMENT;
437	return r;
438	}
439	strong_alias (__ieee754_lgammal_r, __lgammal_r_finite)
440

Browse the source code of glibc_src_2.27/sysdeps/ieee754/ldbl-96/e_lgammal_r.c