lgammaf_r.rs source code [crates/libm/src/math/lgammaf_r.rs]

1	/ origin: FreeBSD /usr/src/lib/msun/src/e_lgammaf_r.c /
2	/*
3	* Conversion to float by Ian Lance Taylor, Cygnus Support, ian@cygnus.com.
4	*/
5	/*
6	* ====================================================
7	* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
8	*
9	* Developed at SunPro, a Sun Microsystems, Inc. business.
10	* Permission to use, copy, modify, and distribute this
11	* software is freely granted, provided that this notice
12	* is preserved.
13	* ====================================================
14	*/
15
16	use super::{floorf, k_cosf, k_sinf, logf};
17
18	const PI: f32 = `3.1415927410e+00`; / 0x40490fdb /
19	const A0: f32 = `7.7215664089e-02`; / 0x3d9e233f /
20	const A1: f32 = `3.2246702909e-01`; / 0x3ea51a66 /
21	const A2: f32 = `6.7352302372e-02`; / 0x3d89f001 /
22	const A3: f32 = `2.0580807701e-02`; / 0x3ca89915 /
23	const A4: f32 = `7.3855509982e-03`; / 0x3bf2027e /
24	const A5: f32 = `2.8905137442e-03`; / 0x3b3d6ec6 /
25	const A6: f32 = `1.1927076848e-03`; / 0x3a9c54a1 /
26	const A7: f32 = `5.1006977446e-04`; / 0x3a05b634 /
27	const A8: f32 = `2.2086278477e-04`; / 0x39679767 /
28	const A9: f32 = `1.0801156895e-04`; / 0x38e28445 /
29	const A10: f32 = `2.5214456400e-05`; / 0x37d383a2 /
30	const A11: f32 = `4.4864096708e-05`; / 0x383c2c75 /
31	const TC: f32 = `1.4616321325e+00`; / 0x3fbb16c3 /
32	const TF: f32 = `-1.2148628384e-01`; / 0xbdf8cdcd /
33	/ TT = -(tail of TF) /
34	const TT: f32 = `6.6971006518e-09`; / 0x31e61c52 /
35	const T0: f32 = `4.8383611441e-01`; / 0x3ef7b95e /
36	const T1: f32 = `-1.4758771658e-01`; / 0xbe17213c /
37	const T2: f32 = `6.4624942839e-02`; / 0x3d845a15 /
38	const T3: f32 = `-3.2788541168e-02`; / 0xbd064d47 /
39	const T4: f32 = `1.7970675603e-02`; / 0x3c93373d /
40	const T5: f32 = `-1.0314224288e-02`; / 0xbc28fcfe /
41	const T6: f32 = `6.1005386524e-03`; / 0x3bc7e707 /
42	const T7: f32 = `-3.6845202558e-03`; / 0xbb7177fe /
43	const T8: f32 = `2.2596477065e-03`; / 0x3b141699 /
44	const T9: f32 = `-1.4034647029e-03`; / 0xbab7f476 /
45	const T10: f32 = `8.8108185446e-04`; / 0x3a66f867 /
46	const T11: f32 = `-5.3859531181e-04`; / 0xba0d3085 /
47	const T12: f32 = `3.1563205994e-04`; / 0x39a57b6b /
48	const T13: f32 = `-3.1275415677e-04`; / 0xb9a3f927 /
49	const T14: f32 = `3.3552918467e-04`; / 0x39afe9f7 /
50	const U0: f32 = `-7.7215664089e-02`; / 0xbd9e233f /
51	const U1: f32 = `6.3282704353e-01`; / 0x3f2200f4 /
52	const U2: f32 = `1.4549225569e+00`; / 0x3fba3ae7 /
53	const U3: f32 = `9.7771751881e-01`; / 0x3f7a4bb2 /
54	const U4: f32 = `2.2896373272e-01`; / 0x3e6a7578 /
55	const U5: f32 = `1.3381091878e-02`; / 0x3c5b3c5e /
56	const V1: f32 = `2.4559779167e+00`; / 0x401d2ebe /
57	const V2: f32 = `2.1284897327e+00`; / 0x4008392d /
58	const V3: f32 = `7.6928514242e-01`; / 0x3f44efdf /
59	const V4: f32 = `1.0422264785e-01`; / 0x3dd572af /
60	const V5: f32 = `3.2170924824e-03`; / 0x3b52d5db /
61	const S0: f32 = `-7.7215664089e-02`; / 0xbd9e233f /
62	const S1: f32 = `2.1498242021e-01`; / 0x3e5c245a /
63	const S2: f32 = `3.2577878237e-01`; / 0x3ea6cc7a /
64	const S3: f32 = `1.4635047317e-01`; / 0x3e15dce6 /
65	const S4: f32 = `2.6642270386e-02`; / 0x3cda40e4 /
66	const S5: f32 = `1.8402845599e-03`; / 0x3af135b4 /
67	const S6: f32 = `3.1947532989e-05`; / 0x3805ff67 /
68	const R1: f32 = `1.3920053244e+00`; / 0x3fb22d3b /
69	const R2: f32 = `7.2193557024e-01`; / 0x3f38d0c5 /
70	const R3: f32 = `1.7193385959e-01`; / 0x3e300f6e /
71	const R4: f32 = `1.8645919859e-02`; / 0x3c98bf54 /
72	const R5: f32 = `7.7794247773e-04`; / 0x3a4beed6 /
73	const R6: f32 = `7.3266842264e-06`; / 0x36f5d7bd /
74	const W0: f32 = `4.1893854737e-01`; / 0x3ed67f1d /
75	const W1: f32 = `8.3333335817e-02`; / 0x3daaaaab /
76	const W2: f32 = `-2.7777778450e-03`; / 0xbb360b61 /
77	const W3: f32 = `7.9365057172e-04`; / 0x3a500cfd /
78	const W4: f32 = `-5.9518753551e-04`; / 0xba1c065c /
79	const W5: f32 = `8.3633989561e-04`; / 0x3a5b3dd2 /
80	const W6: f32 = `-1.6309292987e-03`; / 0xbad5c4e8 /
81
82	/ sin(PIx) assuming x > 2^-100, if sin(PIx)==0 the sign is arbitrary /
83	fn sin_pi(mut x: f32) -> f32 {
84	let mut y: f64;
85	let mut n: isize;
86
87	/ spurious inexact if odd int /
88	x = `2.0` * (x * `0.5` - floorf(x * `0.5`)); / x mod 2.0 /
89
90	n = (x * `4.0`) as isize;
91	n = div!(n + `1`, `2`);
92	y = (x as f64) - (n as f64) * `0.5`;
93	y *= `3.14159265358979323846`;
94	match n {
95	`1` => k_cosf(y),
96	`2` => k_sinf(-y),
97	`3` => -k_cosf(y),
98	// 0
99	_ => k_sinf(y),
100	}
101	}
102
103	#[cfg_attr(assert_no_panic, no_panic::no_panic)]
104	pub fn lgammaf_r(mut x: f32) -> (f32, i32) {
105	let u = x.to_bits();
106	let mut t: f32;
107	let y: f32;
108	let mut z: f32;
109	let nadj: f32;
110	let p: f32;
111	let p1: f32;
112	let p2: f32;
113	let p3: f32;
114	let q: f32;
115	let mut r: f32;
116	let w: f32;
117	let ix: u32;
118	let i: i32;
119	let sign: bool;
120	let mut signgam: i32;
121
122	/ purge off +-inf, NaN, +-0, tiny and negative arguments /
123	signgam = `1`;
124	sign = (u >> `31`) != `0`;
125	ix = u & `0x7fffffff`;
126	if ix >= `0x7f800000` {
127	return (x * x, signgam);
128	}
129	if ix < `0x35000000` {
130	/ \|x\| < 2*-21, return -log(\|x\|) /*
131	if sign {
132	signgam = `-1`;
133	x = -x;
134	}
135	return (-logf(x), signgam);
136	}
137	if sign {
138	x = -x;
139	t = sin_pi(x);
140	if t == `0.0` {
141	/ -integer /
142	return (`1.0` / (x - x), signgam);
143	}
144	if t > `0.0` {
145	signgam = `-1`;
146	} else {
147	t = -t;
148	}
149	nadj = logf(PI / (t * x));
150	} else {
151	nadj = `0.0`;
152	}
153
154	/ purge off 1 and 2 /
155	if ix == `0x3f800000` \|\| ix == `0x40000000` {
156	r = `0.0`;
157	}
158	/ for x < 2.0 /
159	else if ix < `0x40000000` {
160	if ix <= `0x3f666666` {
161	/ lgamma(x) = lgamma(x+1)-log(x) /
162	r = -logf(x);
163	if ix >= `0x3f3b4a20` {
164	y = `1.0` - x;
165	i = `0`;
166	} else if ix >= `0x3e6d3308` {
167	y = x - (TC - `1.0`);
168	i = `1`;
169	} else {
170	y = x;
171	i = `2`;
172	}
173	} else {
174	r = `0.0`;
175	if ix >= `0x3fdda618` {
176	/ [1.7316,2] /
177	y = `2.0` - x;
178	i = `0`;
179	} else if ix >= `0x3F9da620` {
180	/ [1.23,1.73] /
181	y = x - TC;
182	i = `1`;
183	} else {
184	y = x - `1.0`;
185	i = `2`;
186	}
187	}
188	match i {
189	`0` => {
190	z = y * y;
191	p1 = A0 + z * (A2 + z * (A4 + z * (A6 + z * (A8 + z * A10))));
192	p2 = z * (A1 + z * (A3 + z * (A5 + z * (A7 + z * (A9 + z * A11)))));
193	p = y * p1 + p2;
194	r += p - `0.5` * y;
195	}
196	`1` => {
197	z = y * y;
198	w = z * y;
199	p1 = T0 + w * (T3 + w * (T6 + w * (T9 + w * T12))); / parallel comp /
200	p2 = T1 + w * (T4 + w * (T7 + w * (T10 + w * T13)));
201	p3 = T2 + w * (T5 + w * (T8 + w * (T11 + w * T14)));
202	p = z * p1 - (TT - w * (p2 + y * p3));
203	r += TF + p;
204	}
205	`2` => {
206	p1 = y * (U0 + y * (U1 + y * (U2 + y * (U3 + y * (U4 + y * U5)))));
207	p2 = `1.0` + y * (V1 + y * (V2 + y * (V3 + y * (V4 + y * V5))));
208	r += `-0.5` * y + p1 / p2;
209	}
210	#[cfg(debug_assertions)]
211	_ => unreachable!(),
212	#[cfg(not(debug_assertions))]
213	_ => {}
214	}
215	} else if ix < `0x41000000` {
216	/ x < 8.0 /
217	i = x as i32;
218	y = x - (i as f32);
219	p = y * (S0 + y * (S1 + y * (S2 + y * (S3 + y * (S4 + y * (S5 + y * S6))))));
220	q = `1.0` + y * (R1 + y * (R2 + y * (R3 + y * (R4 + y * (R5 + y * R6)))));
221	r = `0.5` * y + p / q;
222	z = `1.0`; / lgamma(1+s) = log(s) + lgamma(s) /
223	// TODO: In C, this was implemented using switch jumps with fallthrough.
224	// Does this implementation have performance problems?
225	if i >= `7` {
226	z *= y + `6.0`;
227	}
228	if i >= `6` {
229	z *= y + `5.0`;
230	}
231	if i >= `5` {
232	z *= y + `4.0`;
233	}
234	if i >= `4` {
235	z *= y + `3.0`;
236	}
237	if i >= `3` {
238	z *= y + `2.0`;
239	r += logf(z);
240	}
241	} else if ix < `0x5c800000` {
242	/ 8.0 <= x < 2*58 /*
243	t = logf(x);
244	z = `1.0` / x;
245	y = z * z;
246	w = W0 + z * (W1 + y * (W2 + y * (W3 + y * (W4 + y * (W5 + y * W6)))));
247	r = (x - `0.5`) * (t - `1.0`) + w;
248	} else {
249	/ 2*58 <= x <= inf /*
250	r = x * (logf(x) - `1.0`);
251	}
252	if sign {
253	r = nadj - r;
254	}
255	return (r, signgam);
256	}
257