float_to_string.h source code [libc/src/__support/float_to_string.h]

Warning: This file is not a C or C++ file. It does not have highlighting.

1	//===-- Utilities to convert floating point values to string ----- C++ --===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8
9	#ifndef LLVM_LIBC_SRC___SUPPORT_FLOAT_TO_STRING_H
10	#define LLVM_LIBC_SRC___SUPPORT_FLOAT_TO_STRING_H
11
12	#include <stdint.h>
13
14	#include "src/__support/CPP/limits.h"
15	#include "src/__support/CPP/type_traits.h"
16	#include "src/__support/FPUtil/FPBits.h"
17	#include "src/__support/FPUtil/dyadic_float.h"
18	#include "src/__support/big_int.h"
19	#include "src/__support/common.h"
20	#include "src/__support/libc_assert.h"
21	#include "src/__support/macros/attributes.h"
22	#include "src/__support/macros/config.h"
23	#include "src/__support/sign.h"
24
25	// This file has 5 compile-time flags to allow the user to configure the float
26	// to string behavior. These were used to explore tradeoffs during the design
27	// phase, and can still be used to gain specific properties. Unless you
28	// specifically know what you're doing, you should leave all these flags off.
29
30	// LIBC_COPT_FLOAT_TO_STR_NO_SPECIALIZE_LD
31	// This flag disables the separate long double conversion implementation. It is
32	// not based on the Ryu algorithm, instead generating the digits by
33	// multiplying/dividing the written-out number by 10^9 to get blocks. It's
34	// significantly faster than INT_CALC, only about 10x slower than MEGA_TABLE,
35	// and is small in binary size. Its downside is that it always calculates all
36	// of the digits above the decimal point, making it inefficient for %e calls
37	// with large exponents. This specialization overrides other flags, so this
38	// flag must be set for other flags to affect the long double behavior.
39
40	// LIBC_COPT_FLOAT_TO_STR_USE_MEGA_LONG_DOUBLE_TABLE
41	// The Mega Table is ~5 megabytes when compiled. It lists the constants needed
42	// to perform the Ryu Printf algorithm (described below) for all long double
43	// values. This makes it extremely fast for both doubles and long doubles, in
44	// exchange for large binary size.
45
46	// LIBC_COPT_FLOAT_TO_STR_USE_DYADIC_FLOAT
47	// Dyadic floats are software floating point numbers, and their accuracy can be
48	// as high as necessary. This option uses 256 bit dyadic floats to calculate
49	// the table values that Ryu Printf needs. This is reasonably fast and very
50	// small compared to the Mega Table, but the 256 bit floats only give accurate
51	// results for the first ~50 digits of the output. In practice this shouldn't
52	// be a problem since long doubles are only accurate for ~35 digits, but the
53	// trailing values all being 0s may cause brittle tests to fail.
54
55	// LIBC_COPT_FLOAT_TO_STR_USE_INT_CALC
56	// Integer Calculation uses wide integers to do the calculations for the Ryu
57	// Printf table, which is just as accurate as the Mega Table without requiring
58	// as much code size. These integers can be very large (~32KB at max, though
59	// always on the stack) to handle the edges of the long double range. They are
60	// also very slow, taking multiple seconds on a powerful CPU to calculate the
61	// values at the end of the range. If no flag is set, this is used for long
62	// doubles, the flag only changes the double behavior.
63
64	// LIBC_COPT_FLOAT_TO_STR_NO_TABLE
65	// This flag doesn't change the actual calculation method, instead it is used
66	// to disable the normal Ryu Printf table for configurations that don't use any
67	// table at all.
68
69	// Default Config:
70	// If no flags are set, doubles use the normal (and much more reasonably sized)
71	// Ryu Printf table and long doubles use their specialized implementation. This
72	// provides good performance and binary size.
73
74	#ifdef LIBC_COPT_FLOAT_TO_STR_USE_MEGA_LONG_DOUBLE_TABLE
75	#include "src/__support/ryu_long_double_constants.h"
76	#elif !defined(LIBC_COPT_FLOAT_TO_STR_NO_TABLE)
77	#include "src/__support/ryu_constants.h"
78	#else
79	constexpr size_t IDX_SIZE = 1;
80	constexpr size_t MID_INT_SIZE = 192;
81	#endif
82
83	// This implementation is based on the Ryu Printf algorithm by Ulf Adams:
84	// Ulf Adams. 2019. Ryū revisited: printf floating point conversion.
85	// Proc. ACM Program. Lang. 3, OOPSLA, Article 169 (October 2019), 23 pages.
86	// https://doi.org/10.1145/3360595
87
88	// This version is modified to require significantly less memory (it doesn't use
89	// a large buffer to store the result).
90
91	// The general concept of this algorithm is as follows:
92	// We want to calculate a 9 digit segment of a floating point number using this
93	// formula: floor((mantissa * 2^exponent)/10^i) % 10^9.
94	// To do so normally would involve large integers (~1000 bits for doubles), so
95	// we use a shortcut. We can avoid calculating 2^exponent / 10^i by using a
96	// lookup table. The resulting intermediate value needs to be about 192 bits to
97	// store the result with enough precision. Since this is all being done with
98	// integers for appropriate precision, we would run into a problem if
99	// i > exponent since then 2^exponent / 10^i would be less than 1. To correct
100	// for this, the actual calculation done is 2^(exponent + c) / 10^i, and then
101	// when multiplying by the mantissa we reverse this by dividing by 2^c, like so:
102	// floor((mantissa * table[exponent][i])/(2^c)) % 10^9.
103	// This gives a 9 digit value, which is small enough to fit in a 32 bit integer,
104	// and that integer is converted into a string as normal, and called a block. In
105	// this implementation, the most recent block is buffered, so that if rounding
106	// is necessary the block can be adjusted before being written to the output.
107	// Any block that is all 9s adds one to the max block counter and doesn't clear
108	// the buffer because they can cause the block above them to be rounded up.
109
110	namespace LIBC_NAMESPACE_DECL {
111
112	using BlockInt = uint32_t;
113	constexpr uint32_t BLOCK_SIZE = 9;
114	constexpr uint64_t EXP5_9 = 1953125;
115	constexpr uint64_t EXP10_9 = 1000000000;
116
117	using FPBits = fputil::FPBits<long double>;
118
119	// Larger numbers prefer a slightly larger constant than is used for the smaller
120	// numbers.
121	constexpr size_t CALC_SHIFT_CONST = 128;
122
123	namespace internal {
124
125	// Returns floor(log_10(2^e)); requires 0 <= e <= 42039.
126	LIBC_INLINE constexpr uint32_t log10_pow2(uint64_t e) {
127	LIBC_ASSERT(e <= 42039 &&
128	"Incorrect exponent to perform log10_pow2 approximation.");
129	// This approximation is based on the float value for log_10(2). It first
130	// gives an incorrect result for our purposes at 42039 (well beyond the 16383
131	// maximum for long doubles).
132
133	// To get these constants I first evaluated log_10(2) to get an approximation
134	// of 0.301029996. Next I passed that value through a string to double
135	// conversion to get an explicit mantissa of 0x13441350fbd738 and an exponent
136	// of -2 (which becomes -54 when we shift the mantissa to be a non-fractional
137	// number). Next I shifted the mantissa right 12 bits to create more space for
138	// the multiplication result, adding 12 to the exponent to compensate. To
139	// check that this approximation works for our purposes I used the following
140	// python code:
141	// for i in range(16384):
142	// if(len(str(2*i)) != (((i0x13441350fbd)>>42)+1)):
143	// print(i)
144	// The reason we add 1 is because this evaluation truncates the result, giving
145	// us the floor, whereas counting the digits of the power of 2 gives us the
146	// ceiling. With a similar loop I checked the maximum valid value and found
147	// 42039.
148	return static_cast<uint32_t>((e * 0x13441350fbdll) >> 42);
149	}
150
151	// Same as above, but with different constants.
152	LIBC_INLINE constexpr uint32_t log2_pow5(uint64_t e) {
153	return static_cast<uint32_t>((e * 0x12934f0979bll) >> 39);
154	}
155
156	// Returns 1 + floor(log_10(2^e). This could technically be off by 1 if any
157	// power of 2 was also a power of 10, but since that doesn't exist this is
158	// always accurate. This is used to calculate the maximum number of base-10
159	// digits a given e-bit number could have.
160	LIBC_INLINE constexpr uint32_t ceil_log10_pow2(uint32_t e) {
161	return log10_pow2(e) + 1;
162	}
163
164	LIBC_INLINE constexpr uint32_t div_ceil(uint32_t num, uint32_t denom) {
165	return (num + (denom - 1)) / denom;
166	}
167
168	// Returns the maximum number of 9 digit blocks a number described by the given
169	// index (which is ceil(exponent/16)) and mantissa width could need.
170	LIBC_INLINE constexpr uint32_t length_for_num(uint32_t idx,
171	uint32_t mantissa_width) {
172	return div_ceil(ceil_log10_pow2(idx) + ceil_log10_pow2(mantissa_width + 1),
173	BLOCK_SIZE);
174	}
175
176	// The formula for the table when i is positive (or zero) is as follows:
177	// floor(10^(-9i) * 2^(e + c_1) + 1) % (10^9 * 2^c_1)
178	// Rewritten slightly we get:
179	// floor(5^(-9i) * 2^(e + c_1 - 9i) + 1) % (10^9 * 2^c_1)
180
181	// TODO: Fix long doubles (needs bigger table or alternate algorithm.)
182	// Currently the table values are generated, which is very slow.
183	template <size_t INT_SIZE>
184	LIBC_INLINE constexpr UInt<MID_INT_SIZE> get_table_positive(int exponent,
185	size_t i) {
186	// INT_SIZE is the size of int that is used for the internal calculations of
187	// this function. It should be large enough to hold 2^(exponent+constant), so
188	// ~1000 for double and ~16000 for long double. Be warned that the time
189	// complexity of exponentiation is O(n^2 * log_2(m)) where n is the number of
190	// bits in the number being exponentiated and m is the exponent.
191	const int shift_amount =
192	static_cast<int>(exponent + CALC_SHIFT_CONST - (BLOCK_SIZE * i));
193	if (shift_amount < 0) {
194	return 1;
195	}
196	UInt<INT_SIZE> num(0);
197	// MOD_SIZE is one of the limiting factors for how big the constant argument
198	// can get, since it needs to be small enough to fit in the result UInt,
199	// otherwise we'll get truncation on return.
200	constexpr UInt<INT_SIZE> MOD_SIZE =
201	(UInt<INT_SIZE>(EXP10_9)
202	<< (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
203
204	num = UInt<INT_SIZE>(1) << (shift_amount);
205	if (i > 0) {
206	UInt<INT_SIZE> fives(EXP5_9);
207	fives.pow_n(i);
208	num = num / fives;
209	}
210
211	num = num + 1;
212	if (num > MOD_SIZE) {
213	auto rem = num.div_uint_half_times_pow_2(
214	EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
215	.value();
216	num = rem;
217	}
218	return num;
219	}
220
221	template <size_t INT_SIZE>
222	LIBC_INLINE UInt<MID_INT_SIZE> get_table_positive_df(int exponent, size_t i) {
223	static_assert(INT_SIZE == 256,
224	"Only 256 is supported as an int size right now.");
225	// This version uses dyadic floats with 256 bit mantissas to perform the same
226	// calculation as above. Due to floating point imprecision it is only accurate
227	// for the first 50 digits, but it's much faster. Since even 128 bit long
228	// doubles are only accurate to ~35 digits, the 50 digits of accuracy are
229	// enough for these floats to be converted back and forth safely. This is
230	// ideal for avoiding the size of the long double table.
231	const int shift_amount =
232	static_cast<int>(exponent + CALC_SHIFT_CONST - (9 * i));
233	if (shift_amount < 0) {
234	return 1;
235	}
236	fputil::DyadicFloat<INT_SIZE> num(Sign::POS, 0, 1);
237	constexpr UInt<INT_SIZE> MOD_SIZE =
238	(UInt<INT_SIZE>(EXP10_9)
239	<< (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
240
241	constexpr UInt<INT_SIZE> FIVE_EXP_MINUS_NINE_MANT{
242	{0xf387295d242602a7, 0xfdd7645e011abac9, 0x31680a88f8953030,
243	0x89705f4136b4a597}};
244
245	static const fputil::DyadicFloat<INT_SIZE> FIVE_EXP_MINUS_NINE(
246	Sign::POS, -276, FIVE_EXP_MINUS_NINE_MANT);
247
248	if (i > 0) {
249	fputil::DyadicFloat<INT_SIZE> fives =
250	fputil::pow_n(FIVE_EXP_MINUS_NINE, static_cast<uint32_t>(i));
251	num = fives;
252	}
253	num = mul_pow_2(num, shift_amount);
254
255	// Adding one is part of the formula.
256	UInt<INT_SIZE> int_num = num.as_mantissa_type() + 1;
257	if (int_num > MOD_SIZE) {
258	auto rem =
259	int_num
260	.div_uint_half_times_pow_2(
261	EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
262	.value();
263	int_num = rem;
264	}
265
266	UInt<MID_INT_SIZE> result = int_num;
267
268	return result;
269	}
270
271	// The formula for the table when i is negative (or zero) is as follows:
272	// floor(10^(-9i) * 2^(c_0 - e)) % (10^9 * 2^c_0)
273	// Since we know i is always negative, we just take it as unsigned and treat it
274	// as negative. We do the same with exponent, while they're both always negative
275	// in theory, in practice they're converted to positive for simpler
276	// calculations.
277	// The formula being used looks more like this:
278	// floor(10^(9(-i)) 2^(c_0 + (-e))) % (10^9 * 2^c_0)
279	template <size_t INT_SIZE>
280	LIBC_INLINE UInt<MID_INT_SIZE> get_table_negative(int exponent, size_t i) {
281	int shift_amount = CALC_SHIFT_CONST - exponent;
282	UInt<INT_SIZE> num(1);
283	constexpr UInt<INT_SIZE> MOD_SIZE =
284	(UInt<INT_SIZE>(EXP10_9)
285	<< (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
286
287	size_t ten_blocks = i;
288	size_t five_blocks = 0;
289	if (shift_amount < 0) {
290	int block_shifts = (-shift_amount) / static_cast<int>(BLOCK_SIZE);
291	if (block_shifts < static_cast<int>(ten_blocks)) {
292	ten_blocks = ten_blocks - block_shifts;
293	five_blocks = block_shifts;
294	shift_amount = shift_amount + (block_shifts * BLOCK_SIZE);
295	} else {
296	ten_blocks = 0;
297	five_blocks = i;
298	shift_amount = shift_amount + (static_cast<int>(i) * BLOCK_SIZE);
299	}
300	}
301
302	if (five_blocks > 0) {
303	UInt<INT_SIZE> fives(EXP5_9);
304	fives.pow_n(five_blocks);
305	num = fives;
306	}
307	if (ten_blocks > 0) {
308	UInt<INT_SIZE> tens(EXP10_9);
309	tens.pow_n(ten_blocks);
310	if (five_blocks <= 0) {
311	num = tens;
312	} else {
313	num *= tens;
314	}
315	}
316
317	if (shift_amount > 0) {
318	num = num << shift_amount;
319	} else {
320	num = num >> (-shift_amount);
321	}
322	if (num > MOD_SIZE) {
323	auto rem = num.div_uint_half_times_pow_2(
324	EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
325	.value();
326	num = rem;
327	}
328	return num;
329	}
330
331	template <size_t INT_SIZE>
332	LIBC_INLINE UInt<MID_INT_SIZE> get_table_negative_df(int exponent, size_t i) {
333	static_assert(INT_SIZE == 256,
334	"Only 256 is supported as an int size right now.");
335	// This version uses dyadic floats with 256 bit mantissas to perform the same
336	// calculation as above. Due to floating point imprecision it is only accurate
337	// for the first 50 digits, but it's much faster. Since even 128 bit long
338	// doubles are only accurate to ~35 digits, the 50 digits of accuracy are
339	// enough for these floats to be converted back and forth safely. This is
340	// ideal for avoiding the size of the long double table.
341
342	int shift_amount = CALC_SHIFT_CONST - exponent;
343
344	fputil::DyadicFloat<INT_SIZE> num(Sign::POS, 0, 1);
345	constexpr UInt<INT_SIZE> MOD_SIZE =
346	(UInt<INT_SIZE>(EXP10_9)
347	<< (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
348
349	constexpr UInt<INT_SIZE> TEN_EXP_NINE_MANT(EXP10_9);
350
351	static const fputil::DyadicFloat<INT_SIZE> TEN_EXP_NINE(Sign::POS, 0,
352	TEN_EXP_NINE_MANT);
353
354	if (i > 0) {
355	fputil::DyadicFloat<INT_SIZE> tens =
356	fputil::pow_n(TEN_EXP_NINE, static_cast<uint32_t>(i));
357	num = tens;
358	}
359	num = mul_pow_2(num, shift_amount);
360
361	UInt<INT_SIZE> int_num = num.as_mantissa_type();
362	if (int_num > MOD_SIZE) {
363	auto rem =
364	int_num
365	.div_uint_half_times_pow_2(
366	EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
367	.value();
368	int_num = rem;
369	}
370
371	UInt<MID_INT_SIZE> result = int_num;
372
373	return result;
374	}
375
376	LIBC_INLINE uint32_t mul_shift_mod_1e9(const FPBits::StorageType mantissa,
377	const UInt<MID_INT_SIZE> &large,
378	const int32_t shift_amount) {
379	// make sure the number of bits is always divisible by 64
380	UInt<internal::div_ceil(MID_INT_SIZE + FPBits::STORAGE_LEN, 64) * 64> val(
381	large);
382	val = (val * mantissa) >> shift_amount;
383	return static_cast<uint32_t>(
384	val.div_uint_half_times_pow_2(static_cast<uint32_t>(EXP10_9), 0).value());
385	}
386
387	} // namespace internal
388
389	// Convert floating point values to their string representation.
390	// Because the result may not fit in a reasonably sized array, the caller must
391	// request blocks of digits and convert them from integers to strings themselves.
392	// Blocks contain the most digits that can be stored in a BlockInt. This is 9
393	// digits for a 32 bit int and 18 digits for a 64 bit int.
394	// The intended use pattern is to create a FloatToString object of the
395	// appropriate type, then call get_positive_blocks to get an approximate number
396	// of blocks there are before the decimal point. Now the client code can start
397	// calling get_positive_block in a loop from the number of positive blocks to
398	// zero. This will give all digits before the decimal point. Then the user can
399	// start calling get_negative_block in a loop from 0 until the number of digits
400	// they need is reached. As an optimization, the client can use
401	// zero_blocks_after_point to find the number of blocks that are guaranteed to
402	// be zero after the decimal point and before the non-zero digits. Additionally,
403	// is_lowest_block will return if the current block is the lowest non-zero
404	// block.
405	template <typename T, cpp::enable_if_t<cpp::is_floating_point_v<T>, int> = 0>
406	class FloatToString {
407	fputil::FPBits<T> float_bits;
408	int exponent;
409	FPBits::StorageType mantissa;
410
411	static constexpr int FRACTION_LEN = fputil::FPBits<T>::FRACTION_LEN;
412	static constexpr int EXP_BIAS = fputil::FPBits<T>::EXP_BIAS;
413
414	public:
415	LIBC_INLINE constexpr FloatToString(T init_float) : float_bits(init_float) {
416	exponent = float_bits.get_explicit_exponent();
417	mantissa = float_bits.get_explicit_mantissa();
418
419	// Adjust for the width of the mantissa.
420	exponent -= FRACTION_LEN;
421	}
422
423	LIBC_INLINE constexpr bool is_nan() { return float_bits.is_nan(); }
424	LIBC_INLINE constexpr bool is_inf() { return float_bits.is_inf(); }
425	LIBC_INLINE constexpr bool is_inf_or_nan() {
426	return float_bits.is_inf_or_nan();
427	}
428
429	// get_block returns an integer that represents the digits in the requested
430	// block.
431	LIBC_INLINE constexpr BlockInt get_positive_block(int block_index) {
432	if (exponent >= -FRACTION_LEN) {
433	// idx is ceil(exponent/16) or 0 if exponent is negative. This is used to
434	// find the coarse section of the POW10_SPLIT table that will be used to
435	// calculate the 9 digit window, as well as some other related values.
436	const uint32_t idx =
437	exponent < 0
438	? 0
439	: static_cast<uint32_t>(exponent + (IDX_SIZE - 1)) / IDX_SIZE;
440
441	// shift_amount = -(c0 - exponent) = c_0 + 16 * ceil(exponent/16) -
442	// exponent
443
444	const uint32_t pos_exp = idx * IDX_SIZE;
445
446	UInt<MID_INT_SIZE> val;
447
448	#if defined(LIBC_COPT_FLOAT_TO_STR_USE_DYADIC_FLOAT)
449	// ----------------------- DYADIC FLOAT CALC MODE ------------------------
450	const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
451	val = internal::get_table_positive_df<256>(IDX_SIZE * idx, block_index);
452	#elif defined(LIBC_COPT_FLOAT_TO_STR_USE_INT_CALC)
453
454	// ---------------------------- INT CALC MODE ----------------------------
455	const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
456	const uint64_t MAX_POW_2_SIZE =
457	pos_exp + CALC_SHIFT_CONST - (BLOCK_SIZE * block_index);
458	const uint64_t MAX_POW_5_SIZE =
459	internal::log2_pow5(BLOCK_SIZE * block_index);
460	const uint64_t MAX_INT_SIZE =
461	(MAX_POW_2_SIZE > MAX_POW_5_SIZE) ? MAX_POW_2_SIZE : MAX_POW_5_SIZE;
462
463	if (MAX_INT_SIZE < 1024) {
464	val = internal::get_table_positive<1024>(pos_exp, block_index);
465	} else if (MAX_INT_SIZE < 2048) {
466	val = internal::get_table_positive<2048>(pos_exp, block_index);
467	} else if (MAX_INT_SIZE < 4096) {
468	val = internal::get_table_positive<4096>(pos_exp, block_index);
469	} else if (MAX_INT_SIZE < 8192) {
470	val = internal::get_table_positive<8192>(pos_exp, block_index);
471	} else if (MAX_INT_SIZE < 16384) {
472	val = internal::get_table_positive<16384>(pos_exp, block_index);
473	} else {
474	val = internal::get_table_positive<16384 + 128>(pos_exp, block_index);
475	}
476	#else
477	// ----------------------------- TABLE MODE ------------------------------
478	const int32_t SHIFT_CONST = TABLE_SHIFT_CONST;
479
480	val = POW10_SPLIT[POW10_OFFSET[idx] + block_index];
481	#endif
482	const uint32_t shift_amount = SHIFT_CONST + pos_exp - exponent;
483
484	const BlockInt digits =
485	internal::mul_shift_mod_1e9(mantissa, val, (int32_t)(shift_amount));
486	return digits;
487	} else {
488	return 0;
489	}
490	}
491
492	LIBC_INLINE constexpr BlockInt get_negative_block(int block_index) {
493	if (exponent < 0) {
494	const int32_t idx = -exponent / static_cast<int32_t>(IDX_SIZE);
495
496	UInt<MID_INT_SIZE> val;
497
498	const uint32_t pos_exp = static_cast<uint32_t>(idx * IDX_SIZE);
499
500	#if defined(LIBC_COPT_FLOAT_TO_STR_USE_DYADIC_FLOAT)
501	// ----------------------- DYADIC FLOAT CALC MODE ------------------------
502	const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
503	val = internal::get_table_negative_df<256>(pos_exp, block_index + 1);
504	#elif defined(LIBC_COPT_FLOAT_TO_STR_USE_INT_CALC)
505	// ---------------------------- INT CALC MODE ----------------------------
506	const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
507
508	const uint64_t NUM_FIVES = (block_index + 1) * BLOCK_SIZE;
509	// Round MAX_INT_SIZE up to the nearest 64 (adding 1 because log2_pow5
510	// implicitly rounds down).
511	const uint64_t MAX_INT_SIZE =
512	((internal::log2_pow5(NUM_FIVES) / 64) + 1) * 64;
513
514	if (MAX_INT_SIZE < 1024) {
515	val = internal::get_table_negative<1024>(pos_exp, block_index + 1);
516	} else if (MAX_INT_SIZE < 2048) {
517	val = internal::get_table_negative<2048>(pos_exp, block_index + 1);
518	} else if (MAX_INT_SIZE < 4096) {
519	val = internal::get_table_negative<4096>(pos_exp, block_index + 1);
520	} else if (MAX_INT_SIZE < 8192) {
521	val = internal::get_table_negative<8192>(pos_exp, block_index + 1);
522	} else if (MAX_INT_SIZE < 16384) {
523	val = internal::get_table_negative<16384>(pos_exp, block_index + 1);
524	} else {
525	val = internal::get_table_negative<16384 + 8192>(pos_exp,
526	block_index + 1);
527	}
528	#else
529	// ----------------------------- TABLE MODE ------------------------------
530	// if the requested block is zero
531	const int32_t SHIFT_CONST = TABLE_SHIFT_CONST;
532	if (block_index < MIN_BLOCK_2[idx]) {
533	return 0;
534	}
535	const uint32_t p = POW10_OFFSET_2[idx] + block_index - MIN_BLOCK_2[idx];
536	// If every digit after the requested block is zero.
537	if (p >= POW10_OFFSET_2[idx + 1]) {
538	return 0;
539	}
540
541	val = POW10_SPLIT_2[p];
542	#endif
543	const int32_t shift_amount =
544	SHIFT_CONST + (-exponent - static_cast<int32_t>(pos_exp));
545	BlockInt digits =
546	internal::mul_shift_mod_1e9(mantissa, val, shift_amount);
547	return digits;
548	} else {
549	return 0;
550	}
551	}
552
553	LIBC_INLINE constexpr BlockInt get_block(int block_index) {
554	if (block_index >= 0) {
555	return get_positive_block(block_index);
556	} else {
557	return get_negative_block(-1 - block_index);
558	}
559	}
560
561	LIBC_INLINE constexpr size_t get_positive_blocks() {
562	if (exponent < -FRACTION_LEN)
563	return 0;
564	const uint32_t idx =
565	exponent < 0
566	? 0
567	: static_cast<uint32_t>(exponent + (IDX_SIZE - 1)) / IDX_SIZE;
568	return internal::length_for_num(idx * IDX_SIZE, FRACTION_LEN);
569	}
570
571	// This takes the index of a block after the decimal point (a negative block)
572	// and return if it's sure that all of the digits after it are zero.
573	LIBC_INLINE constexpr bool is_lowest_block(size_t negative_block_index) {
574	#ifdef LIBC_COPT_FLOAT_TO_STR_NO_TABLE
575	// The decimal representation of 2**(-i) will have exactly i digits after
576	// the decimal point.
577	int num_requested_digits =
578	static_cast<int>((negative_block_index + 1) * BLOCK_SIZE);
579
580	return num_requested_digits > -exponent;
581	#else
582	const int32_t idx = -exponent / static_cast<int32_t>(IDX_SIZE);
583	const size_t p =
584	POW10_OFFSET_2[idx] + negative_block_index - MIN_BLOCK_2[idx];
585	// If the remaining digits are all 0, then this is the lowest block.
586	return p >= POW10_OFFSET_2[idx + 1];
587	#endif
588	}
589
590	LIBC_INLINE constexpr size_t zero_blocks_after_point() {
591	#ifdef LIBC_COPT_FLOAT_TO_STR_NO_TABLE
592	if (exponent < -FRACTION_LEN) {
593	const int pos_exp = -exponent - 1;
594	const uint32_t pos_idx =
595	static_cast<uint32_t>(pos_exp + (IDX_SIZE - 1)) / IDX_SIZE;
596	const int32_t pos_len = ((internal::ceil_log10_pow2(pos_idx * IDX_SIZE) -
597	internal::ceil_log10_pow2(FRACTION_LEN + 1)) /
598	BLOCK_SIZE) -
599	1;
600	return static_cast<uint32_t>(pos_len > 0 ? pos_len : 0);
601	}
602	return 0;
603	#else
604	return MIN_BLOCK_2[-exponent / static_cast<int32_t>(IDX_SIZE)];
605	#endif
606	}
607	};
608
609	#if !defined(LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64) && \
610	!defined(LIBC_COPT_FLOAT_TO_STR_NO_SPECIALIZE_LD)
611	// --------------------------- LONG DOUBLE FUNCTIONS ---------------------------
612
613	// this algorithm will work exactly the same for 80 bit and 128 bit long
614	// doubles. They have the same max exponent, but even if they didn't the
615	// constants should be calculated to be correct for any provided floating point
616	// type.
617
618	template <> class FloatToString<long double> {
619	fputil::FPBits<long double> float_bits;
620	bool is_negative = 0;
621	int exponent = 0;
622	FPBits::StorageType mantissa = 0;
623
624	static constexpr int FRACTION_LEN = fputil::FPBits<long double>::FRACTION_LEN;
625	static constexpr int EXP_BIAS = fputil::FPBits<long double>::EXP_BIAS;
626	static constexpr size_t UINT_WORD_SIZE = 64;
627
628	static constexpr size_t FLOAT_AS_INT_WIDTH =
629	internal::div_ceil(fputil::FPBits<long double>::MAX_BIASED_EXPONENT -
630	FPBits::EXP_BIAS,
631	UINT_WORD_SIZE) *
632	UINT_WORD_SIZE;
633	static constexpr size_t EXTRA_INT_WIDTH =
634	internal::div_ceil(sizeof(long double) * CHAR_BIT, UINT_WORD_SIZE) *
635	UINT_WORD_SIZE;
636
637	using wide_int = UInt<FLOAT_AS_INT_WIDTH + EXTRA_INT_WIDTH>;
638
639	// float_as_fixed represents the floating point number as a fixed point number
640	// with the point EXTRA_INT_WIDTH bits from the left of the number. This can
641	// store any number with a negative exponent.
642	wide_int float_as_fixed = 0;
643	int int_block_index = 0;
644
645	static constexpr size_t BLOCK_BUFFER_LEN =
646	internal::div_ceil(internal::log10_pow2(FLOAT_AS_INT_WIDTH), BLOCK_SIZE) +
647	1;
648	BlockInt block_buffer[BLOCK_BUFFER_LEN] = {0};
649	size_t block_buffer_valid = 0;
650
651	template <size_t Bits>
652	LIBC_INLINE static constexpr BlockInt grab_digits(UInt<Bits> &int_num) {
653	auto wide_result = int_num.div_uint_half_times_pow_2(EXP5_9, 9);
654	// the optional only comes into effect when dividing by 0, which will
655	// never happen here. Thus, we just assert that it has value.
656	LIBC_ASSERT(wide_result.has_value());
657	return static_cast<BlockInt>(wide_result.value());
658	}
659
660	LIBC_INLINE static constexpr void zero_leading_digits(wide_int &int_num) {
661	// WORD_SIZE is the width of the numbers used to internally represent the
662	// UInt
663	for (size_t i = 0; i < EXTRA_INT_WIDTH / wide_int::WORD_SIZE; ++i)
664	int_num[i + (FLOAT_AS_INT_WIDTH / wide_int::WORD_SIZE)] = 0;
665	}
666
667	// init_convert initializes float_as_int, cur_block, and block_buffer based on
668	// the mantissa and exponent of the initial number. Calling it will always
669	// return the class to the starting state.
670	LIBC_INLINE constexpr void init_convert() {
671	// No calculation necessary for the 0 case.
672	if (mantissa == 0 && exponent == 0)
673	return;
674
675	if (exponent > 0) {
676	// if the exponent is positive, then the number is fully above the decimal
677	// point. In this case we represent the float as an integer, then divide
678	// by 10^BLOCK_SIZE and take the remainder as our next block. This
679	// generates the digits from right to left, but the digits will be written
680	// from left to right, so it caches the results so they can be read in
681	// reverse order.
682
683	wide_int float_as_int = mantissa;
684
685	float_as_int <<= exponent;
686	int_block_index = 0;
687
688	while (float_as_int > 0) {
689	LIBC_ASSERT(int_block_index < static_cast<int>(BLOCK_BUFFER_LEN));
690	block_buffer[int_block_index] =
691	grab_digits<FLOAT_AS_INT_WIDTH + EXTRA_INT_WIDTH>(float_as_int);
692	++int_block_index;
693	}
694	block_buffer_valid = int_block_index;
695
696	} else {
697	// if the exponent is not positive, then the number is at least partially
698	// below the decimal point. In this case we represent the float as a fixed
699	// point number with the decimal point after the top EXTRA_INT_WIDTH bits.
700	float_as_fixed = mantissa;
701
702	const int SHIFT_AMOUNT = FLOAT_AS_INT_WIDTH + exponent;
703	static_assert(EXTRA_INT_WIDTH >= sizeof(long double) * 8);
704	float_as_fixed <<= SHIFT_AMOUNT;
705
706	// If there are still digits above the decimal point, handle those.
707	if (cpp::countl_zero(float_as_fixed) <
708	static_cast<int>(EXTRA_INT_WIDTH)) {
709	UInt<EXTRA_INT_WIDTH> above_decimal_point =
710	float_as_fixed >> FLOAT_AS_INT_WIDTH;
711
712	size_t positive_int_block_index = 0;
713	while (above_decimal_point > 0) {
714	block_buffer[positive_int_block_index] =
715	grab_digits<EXTRA_INT_WIDTH>(above_decimal_point);
716	++positive_int_block_index;
717	}
718	block_buffer_valid = positive_int_block_index;
719
720	// Zero all digits above the decimal point.
721	zero_leading_digits(float_as_fixed);
722	int_block_index = 0;
723	}
724	}
725	}
726
727	public:
728	LIBC_INLINE constexpr FloatToString(long double init_float)
729	: float_bits(init_float) {
730	is_negative = float_bits.is_neg();
731	exponent = float_bits.get_explicit_exponent();
732	mantissa = float_bits.get_explicit_mantissa();
733
734	// Adjust for the width of the mantissa.
735	exponent -= FRACTION_LEN;
736
737	this->init_convert();
738	}
739
740	LIBC_INLINE constexpr size_t get_positive_blocks() {
741	if (exponent < -FRACTION_LEN)
742	return 0;
743
744	const uint32_t idx =
745	exponent < 0
746	? 0
747	: static_cast<uint32_t>(exponent + (IDX_SIZE - 1)) / IDX_SIZE;
748	return internal::length_for_num(idx * IDX_SIZE, FRACTION_LEN);
749	}
750
751	LIBC_INLINE constexpr size_t zero_blocks_after_point() {
752	#ifdef LIBC_COPT_FLOAT_TO_STR_USE_MEGA_LONG_DOUBLE_TABLE
753	return MIN_BLOCK_2[-exponent / IDX_SIZE];
754	#else
755	if (exponent >= -FRACTION_LEN)
756	return 0;
757
758	const int pos_exp = -exponent - 1;
759	const uint32_t pos_idx =
760	static_cast<uint32_t>(pos_exp + (IDX_SIZE - 1)) / IDX_SIZE;
761	const int32_t pos_len = ((internal::ceil_log10_pow2(pos_idx * IDX_SIZE) -
762	internal::ceil_log10_pow2(FRACTION_LEN + 1)) /
763	BLOCK_SIZE) -
764	1;
765	return static_cast<uint32_t>(pos_len > 0 ? pos_len : 0);
766	#endif
767	}
768
769	LIBC_INLINE constexpr bool is_lowest_block(size_t negative_block_index) {
770	// The decimal representation of 2**(-i) will have exactly i digits after
771	// the decimal point.
772	const int num_requested_digits =
773	static_cast<int>((negative_block_index + 1) * BLOCK_SIZE);
774
775	return num_requested_digits > -exponent;
776	}
777
778	LIBC_INLINE constexpr BlockInt get_positive_block(int block_index) {
779	if (exponent < -FRACTION_LEN)
780	return 0;
781	if (block_index > static_cast<int>(block_buffer_valid) \|\| block_index < 0)
782	return 0;
783
784	LIBC_ASSERT(block_index < static_cast<int>(BLOCK_BUFFER_LEN));
785
786	return block_buffer[block_index];
787	}
788
789	LIBC_INLINE constexpr BlockInt get_negative_block(int negative_block_index) {
790	if (exponent >= 0)
791	return 0;
792
793	// negative_block_index starts at 0 with the first block after the decimal
794	// point, and 1 with the second and so on. This converts to the same
795	// block_index used everywhere else.
796
797	const int block_index = -1 - negative_block_index;
798
799	// If we're currently after the requested block (remember these are
800	// negative indices) we reset the number to the start. This is only
801	// likely to happen in %g calls. This will also reset int_block_index.
802	// if (block_index > int_block_index) {
803	// init_convert();
804	// }
805
806	// Printf is the only existing user of this code and it will only ever move
807	// downwards, except for %g but that currently creates a second
808	// float_to_string object so this assertion still holds. If a new user needs
809	// the ability to step backwards, uncomment the code above.
810	LIBC_ASSERT(block_index <= int_block_index);
811
812	// If we are currently before the requested block. Step until we reach the
813	// requested block. This is likely to only be one step.
814	while (block_index < int_block_index) {
815	zero_leading_digits(float_as_fixed);
816	float_as_fixed.mul(EXP10_9);
817	--int_block_index;
818	}
819
820	// We're now on the requested block, return the current block.
821	return static_cast<BlockInt>(float_as_fixed >> FLOAT_AS_INT_WIDTH);
822	}
823
824	LIBC_INLINE constexpr BlockInt get_block(int block_index) {
825	if (block_index >= 0)
826	return get_positive_block(block_index);
827
828	return get_negative_block(-1 - block_index);
829	}
830	};
831
832	#endif // !LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64 &&
833	// !LIBC_COPT_FLOAT_TO_STR_NO_SPECIALIZE_LD
834
835	} // namespace LIBC_NAMESPACE_DECL
836
837	#endif // LLVM_LIBC_SRC___SUPPORT_FLOAT_TO_STRING_H
838

Warning: This file is not a C or C++ file. It does not have highlighting.

Provided by KDAB

Update your C++ knowledge – Modern C++11/14/17 Training

Find out more

source code of libc/src/__support/float_to_string.h