src/__support/float_to_string.h

07c0a41bSMichael Jones//===-- Utilities to convert floating point values to string ----*- C++ -*-===//
07c0a41bSMichael Jones//
07c0a41bSMichael Jones// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
07c0a41bSMichael Jones// See https://llvm.org/LICENSE.txt for license information.
07c0a41bSMichael Jones// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
07c0a41bSMichael Jones//
07c0a41bSMichael Jones//===----------------------------------------------------------------------===//
07c0a41bSMichael Jones
270547f3SGuillaume Chatelet#ifndef LLVM_LIBC_SRC___SUPPORT_FLOAT_TO_STRING_H
270547f3SGuillaume Chatelet#define LLVM_LIBC_SRC___SUPPORT_FLOAT_TO_STRING_H
07c0a41bSMichael Jones
07c0a41bSMichael Jones#include <stdint.h>
07c0a41bSMichael Jones
a621198aSmichaelrj-google#include "src/__support/CPP/limits.h"
07c0a41bSMichael Jones#include "src/__support/CPP/type_traits.h"
07c0a41bSMichael Jones#include "src/__support/FPUtil/FPBits.h"
688b9730SMichael Jones#include "src/__support/FPUtil/dyadic_float.h"
09efe848SGuillaume Chatelet#include "src/__support/big_int.h"
59c809cdSSiva Chandra Reddy#include "src/__support/common.h"
58a75c6aSSiva Chandra Reddy#include "src/__support/libc_assert.h"
a621198aSmichaelrj-google#include "src/__support/macros/attributes.h"
5ff3ff33SPetr Hosek#include "src/__support/macros/config.h"
e1d64b76SMichael Jones#include "src/__support/sign.h"
688b9730SMichael Jones
688b9730SMichael Jones// This file has 5 compile-time flags to allow the user to configure the float
a621198aSmichaelrj-google// to string behavior. These were used to explore tradeoffs during the design
a621198aSmichaelrj-google// phase, and can still be used to gain specific properties. Unless you
a621198aSmichaelrj-google// specifically know what you're doing, you should leave all these flags off.
a621198aSmichaelrj-google
a621198aSmichaelrj-google// LIBC_COPT_FLOAT_TO_STR_NO_SPECIALIZE_LD
a621198aSmichaelrj-google//  This flag disables the separate long double conversion implementation. It is
a621198aSmichaelrj-google//  not based on the Ryu algorithm, instead generating the digits by
a621198aSmichaelrj-google//  multiplying/dividing the written-out number by 10^9 to get blocks. It's
a621198aSmichaelrj-google//  significantly faster than INT_CALC, only about 10x slower than MEGA_TABLE,
a621198aSmichaelrj-google//  and is small in binary size. Its downside is that it always calculates all
a621198aSmichaelrj-google//  of the digits above the decimal point, making it inefficient for %e calls
//  with large exponents. This specialization overrides other flags, so this
//  flag must be set for other flags to affect the long double behavior.
688b9730SMichael Jones
688b9730SMichael Jones// LIBC_COPT_FLOAT_TO_STR_USE_MEGA_LONG_DOUBLE_TABLE
688b9730SMichael Jones//  The Mega Table is ~5 megabytes when compiled. It lists the constants needed
688b9730SMichael Jones//  to perform the Ryu Printf algorithm (described below) for all long double
688b9730SMichael Jones//  values. This makes it extremely fast for both doubles and long doubles, in
688b9730SMichael Jones//  exchange for large binary size.
688b9730SMichael Jones
688b9730SMichael Jones// LIBC_COPT_FLOAT_TO_STR_USE_DYADIC_FLOAT
688b9730SMichael Jones//  Dyadic floats are software floating point numbers, and their accuracy can be
688b9730SMichael Jones//  as high as necessary. This option uses 256 bit dyadic floats to calculate
688b9730SMichael Jones//  the table values that Ryu Printf needs. This is reasonably fast and very
688b9730SMichael Jones//  small compared to the Mega Table, but the 256 bit floats only give accurate
688b9730SMichael Jones//  results for the first ~50 digits of the output. In practice this shouldn't
688b9730SMichael Jones//  be a problem since long doubles are only accurate for ~35 digits, but the
a621198aSmichaelrj-google//  trailing values all being 0s may cause brittle tests to fail.
688b9730SMichael Jones
688b9730SMichael Jones// LIBC_COPT_FLOAT_TO_STR_USE_INT_CALC
688b9730SMichael Jones//  Integer Calculation uses wide integers to do the calculations for the Ryu
688b9730SMichael Jones//  Printf table, which is just as accurate as the Mega Table without requiring
688b9730SMichael Jones//  as much code size. These integers can be very large (~32KB at max, though
688b9730SMichael Jones//  always on the stack) to handle the edges of the long double range. They are
688b9730SMichael Jones//  also very slow, taking multiple seconds on a powerful CPU to calculate the
688b9730SMichael Jones//  values at the end of the range. If no flag is set, this is used for long
688b9730SMichael Jones//  doubles, the flag only changes the double behavior.
688b9730SMichael Jones
688b9730SMichael Jones// LIBC_COPT_FLOAT_TO_STR_NO_TABLE
688b9730SMichael Jones//  This flag doesn't change the actual calculation method, instead it is used
688b9730SMichael Jones//  to disable the normal Ryu Printf table for configurations that don't use any
688b9730SMichael Jones//  table at all.
688b9730SMichael Jones
688b9730SMichael Jones// Default Config:
688b9730SMichael Jones//  If no flags are set, doubles use the normal (and much more reasonably sized)
a621198aSmichaelrj-google//  Ryu Printf table and long doubles use their specialized implementation. This
a621198aSmichaelrj-google//  provides good performance and binary size.
688b9730SMichael Jones
688b9730SMichael Jones#ifdef LIBC_COPT_FLOAT_TO_STR_USE_MEGA_LONG_DOUBLE_TABLE
688b9730SMichael Jones#include "src/__support/ryu_long_double_constants.h"
688b9730SMichael Jones#elif !defined(LIBC_COPT_FLOAT_TO_STR_NO_TABLE)
07c0a41bSMichael Jones#include "src/__support/ryu_constants.h"
688b9730SMichael Jones#else
// Fallback values for builds that include neither constants table (this is the
// #else branch of the table selection above).
// IDX_SIZE is the exponent step between table indices; with 1 every exponent
// maps to its own index.
constexpr size_t IDX_SIZE{1};
// MID_INT_SIZE is the bit width of the intermediate table values.
constexpr size_t MID_INT_SIZE{192};
688b9730SMichael Jones#endif
07c0a41bSMichael Jones
07c0a41bSMichael Jones// This implementation is based on the Ryu Printf algorithm by Ulf Adams:
07c0a41bSMichael Jones// Ulf Adams. 2019. Ryū revisited: printf floating point conversion.
07c0a41bSMichael Jones// Proc. ACM Program. Lang. 3, OOPSLA, Article 169 (October 2019), 23 pages.
07c0a41bSMichael Jones// https://doi.org/10.1145/3360595
07c0a41bSMichael Jones
07c0a41bSMichael Jones// This version is modified to require significantly less memory (it doesn't use
07c0a41bSMichael Jones// a large buffer to store the result).
07c0a41bSMichael Jones
07c0a41bSMichael Jones// The general concept of this algorithm is as follows:
07c0a41bSMichael Jones// We want to calculate a 9 digit segment of a floating point number using this
07c0a41bSMichael Jones// formula: floor((mantissa * 2^exponent)/10^i) % 10^9.
07c0a41bSMichael Jones// To do so normally would involve large integers (~1000 bits for doubles), so
07c0a41bSMichael Jones// we use a shortcut. We can avoid calculating 2^exponent / 10^i by using a
07c0a41bSMichael Jones// lookup table. The resulting intermediate value needs to be about 192 bits to
07c0a41bSMichael Jones// store the result with enough precision. Since this is all being done with
07c0a41bSMichael Jones// integers for appropriate precision, we would run into a problem if
07c0a41bSMichael Jones// i > exponent since then 2^exponent / 10^i would be less than 1. To correct
07c0a41bSMichael Jones// for this, the actual calculation done is 2^(exponent + c) / 10^i, and then
07c0a41bSMichael Jones// when multiplying by the mantissa we reverse this by dividing by 2^c, like so:
07c0a41bSMichael Jones// floor((mantissa * table[exponent][i])/(2^c)) % 10^9.
07c0a41bSMichael Jones// This gives a 9 digit value, which is small enough to fit in a 32 bit integer,
07c0a41bSMichael Jones// and that integer is converted into a string as normal, and called a block. In
07c0a41bSMichael Jones// this implementation, the most recent block is buffered, so that if rounding
07c0a41bSMichael Jones// is necessary the block can be adjusted before being written to the output.
07c0a41bSMichael Jones// Any block that is all 9s adds one to the max block counter and doesn't clear
07c0a41bSMichael Jones// the buffer because they can cause the block above them to be rounded up.
07c0a41bSMichael Jones
5ff3ff33SPetr Hoseknamespace LIBC_NAMESPACE_DECL {
07c0a41bSMichael Jones
// Integer type that holds one block of decimal digits.
using BlockInt = uint32_t;
// Number of decimal digits carried by one block.
constexpr uint32_t BLOCK_SIZE{9};
// 5^9 and 10^9, i.e. 5 and 10 raised to BLOCK_SIZE.
constexpr uint64_t EXP5_9{1'953'125};
constexpr uint64_t EXP10_9{1'000'000'000};
07c0a41bSMichael Jones
c09e6905SGuillaume Chateletusing FPBits = fputil::FPBits<long double>;
07c0a41bSMichael Jones
688b9730SMichael Jones// Larger numbers prefer a slightly larger constant than is used for the smaller
688b9730SMichael Jones// numbers.
688b9730SMichael Jonesconstexpr size_t CALC_SHIFT_CONST = 128;
07c0a41bSMichael Jones
07c0a41bSMichael Jonesnamespace internal {
07c0a41bSMichael Jones
688b9730SMichael Jones// Returns floor(log_10(2^e)); requires 0 <= e <= 42039.
a621198aSmichaelrj-googleLIBC_INLINE constexpr uint32_t log10_pow2(uint64_t e) {
8fc87f54SMikhail R. Gadelha  LIBC_ASSERT(e <= 42039 &&
58a75c6aSSiva Chandra Reddy              "Incorrect exponent to perform log10_pow2 approximation.");
688b9730SMichael Jones  // This approximation is based on the float value for log_10(2). It first
688b9730SMichael Jones  // gives an incorrect result for our purposes at 42039 (well beyond the 16383
688b9730SMichael Jones  // maximum for long doubles).
688b9730SMichael Jones
688b9730SMichael Jones  // To get these constants I first evaluated log_10(2) to get an approximation
688b9730SMichael Jones  // of 0.301029996. Next I passed that value through a string to double
688b9730SMichael Jones  // conversion to get an explicit mantissa of 0x13441350fbd738 and an exponent
688b9730SMichael Jones  // of -2 (which becomes -54 when we shift the mantissa to be a non-fractional
688b9730SMichael Jones  // number). Next I shifted the mantissa right 12 bits to create more space for
688b9730SMichael Jones  // the multiplication result, adding 12 to the exponent to compensate. To
688b9730SMichael Jones  // check that this approximation works for our purposes I used the following
688b9730SMichael Jones  // python code:
688b9730SMichael Jones  // for i in range(16384):
688b9730SMichael Jones  //   if(len(str(2**i)) != (((i*0x13441350fbd)>>42)+1)):
688b9730SMichael Jones  //     print(i)
688b9730SMichael Jones  // The reason we add 1 is because this evaluation truncates the result, giving
688b9730SMichael Jones  // us the floor, whereas counting the digits of the power of 2 gives us the
688b9730SMichael Jones  // ceiling. With a similar loop I checked the maximum valid value and found
688b9730SMichael Jones  // 42039.
ab65c9c3Smichaelrj-google  return static_cast<uint32_t>((e * 0x13441350fbdll) >> 42);
688b9730SMichael Jones}
688b9730SMichael Jones
688b9730SMichael Jones// Same as above, but with different constants.
a621198aSmichaelrj-googleLIBC_INLINE constexpr uint32_t log2_pow5(uint64_t e) {
ab65c9c3Smichaelrj-google  return static_cast<uint32_t>((e * 0x12934f0979bll) >> 39);
07c0a41bSMichael Jones}
07c0a41bSMichael Jones
07c0a41bSMichael Jones// Returns 1 + floor(log_10(2^e). This could technically be off by 1 if any
07c0a41bSMichael Jones// power of 2 was also a power of 10, but since that doesn't exist this is
07c0a41bSMichael Jones// always accurate. This is used to calculate the maximum number of base-10
07c0a41bSMichael Jones// digits a given e-bit number could have.
a621198aSmichaelrj-googleLIBC_INLINE constexpr uint32_t ceil_log10_pow2(uint32_t e) {
07c0a41bSMichael Jones  return log10_pow2(e) + 1;
07c0a41bSMichael Jones}
07c0a41bSMichael Jones
a621198aSmichaelrj-googleLIBC_INLINE constexpr uint32_t div_ceil(uint32_t num, uint32_t denom) {
a621198aSmichaelrj-google  return (num + (denom - 1)) / denom;
a621198aSmichaelrj-google}
a621198aSmichaelrj-google
07c0a41bSMichael Jones// Returns the maximum number of 9 digit blocks a number described by the given
07c0a41bSMichael Jones// index (which is ceil(exponent/16)) and mantissa width could need.
a621198aSmichaelrj-googleLIBC_INLINE constexpr uint32_t length_for_num(uint32_t idx,
a621198aSmichaelrj-google                                              uint32_t mantissa_width) {
a621198aSmichaelrj-google  return div_ceil(ceil_log10_pow2(idx) + ceil_log10_pow2(mantissa_width + 1),
a621198aSmichaelrj-google                  BLOCK_SIZE);
07c0a41bSMichael Jones}
07c0a41bSMichael Jones
07c0a41bSMichael Jones// The formula for the table when i is positive (or zero) is as follows:
07c0a41bSMichael Jones// floor(10^(-9i) * 2^(e + c_1) + 1) % (10^9 * 2^c_1)
07c0a41bSMichael Jones// Rewritten slightly we get:
07c0a41bSMichael Jones// floor(5^(-9i) * 2^(e + c_1 - 9i) + 1) % (10^9 * 2^c_1)
07c0a41bSMichael Jones
173d5023SMichael Jones// TODO: Fix long doubles (needs bigger table or alternate algorithm.)
173d5023SMichael Jones// Currently the table values are generated, which is very slow.
07c0a41bSMichael Jonestemplate <size_t INT_SIZE>
6a8e6c9aSGuillaume ChateletLIBC_INLINE constexpr UInt<MID_INT_SIZE> get_table_positive(int exponent,
688b9730SMichael Jones                                                            size_t i) {
07c0a41bSMichael Jones  // INT_SIZE is the size of int that is used for the internal calculations of
07c0a41bSMichael Jones  // this function. It should be large enough to hold 2^(exponent+constant), so
07c0a41bSMichael Jones  // ~1000 for double and ~16000 for long double. Be warned that the time
07c0a41bSMichael Jones  // complexity of exponentiation is O(n^2 * log_2(m)) where n is the number of
07c0a41bSMichael Jones  // bits in the number being exponentiated and m is the exponent.
e9bdf4afSMichael Jones  const int shift_amount =
e9bdf4afSMichael Jones      static_cast<int>(exponent + CALC_SHIFT_CONST - (BLOCK_SIZE * i));
07c0a41bSMichael Jones  if (shift_amount < 0) {
07c0a41bSMichael Jones    return 1;
07c0a41bSMichael Jones  }
6a8e6c9aSGuillaume Chatelet  UInt<INT_SIZE> num(0);
07c0a41bSMichael Jones  // MOD_SIZE is one of the limiting factors for how big the constant argument
07c0a41bSMichael Jones  // can get, since it needs to be small enough to fit in the result UInt,
07c0a41bSMichael Jones  // otherwise we'll get truncation on return.
6a8e6c9aSGuillaume Chatelet  constexpr UInt<INT_SIZE> MOD_SIZE =
6a8e6c9aSGuillaume Chatelet      (UInt<INT_SIZE>(EXP10_9)
688b9730SMichael Jones       << (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
688b9730SMichael Jones
6a8e6c9aSGuillaume Chatelet  num = UInt<INT_SIZE>(1) << (shift_amount);
07c0a41bSMichael Jones  if (i > 0) {
6a8e6c9aSGuillaume Chatelet    UInt<INT_SIZE> fives(EXP5_9);
07c0a41bSMichael Jones    fives.pow_n(i);
07c0a41bSMichael Jones    num = num / fives;
07c0a41bSMichael Jones  }
07c0a41bSMichael Jones
07c0a41bSMichael Jones  num = num + 1;
07c0a41bSMichael Jones  if (num > MOD_SIZE) {
4e005515Slntue    auto rem = num.div_uint_half_times_pow_2(
a621198aSmichaelrj-google                      EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
688b9730SMichael Jones                   .value();
688b9730SMichael Jones    num = rem;
07c0a41bSMichael Jones  }
07c0a41bSMichael Jones  return num;
07c0a41bSMichael Jones}
07c0a41bSMichael Jones
688b9730SMichael Jonestemplate <size_t INT_SIZE>
6a8e6c9aSGuillaume ChateletLIBC_INLINE UInt<MID_INT_SIZE> get_table_positive_df(int exponent, size_t i) {
688b9730SMichael Jones  static_assert(INT_SIZE == 256,
688b9730SMichael Jones                "Only 256 is supported as an int size right now.");
688b9730SMichael Jones  // This version uses dyadic floats with 256 bit mantissas to perform the same
688b9730SMichael Jones  // calculation as above. Due to floating point imprecision it is only accurate
688b9730SMichael Jones  // for the first 50 digits, but it's much faster. Since even 128 bit long
688b9730SMichael Jones  // doubles are only accurate to ~35 digits, the 50 digits of accuracy are
688b9730SMichael Jones  // enough for these floats to be converted back and forth safely. This is
688b9730SMichael Jones  // ideal for avoiding the size of the long double table.
e9bdf4afSMichael Jones  const int shift_amount =
e9bdf4afSMichael Jones      static_cast<int>(exponent + CALC_SHIFT_CONST - (9 * i));
688b9730SMichael Jones  if (shift_amount < 0) {
688b9730SMichael Jones    return 1;
688b9730SMichael Jones  }
e1d64b76SMichael Jones  fputil::DyadicFloat<INT_SIZE> num(Sign::POS, 0, 1);
6a8e6c9aSGuillaume Chatelet  constexpr UInt<INT_SIZE> MOD_SIZE =
6a8e6c9aSGuillaume Chatelet      (UInt<INT_SIZE>(EXP10_9)
688b9730SMichael Jones       << (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
688b9730SMichael Jones
6a8e6c9aSGuillaume Chatelet  constexpr UInt<INT_SIZE> FIVE_EXP_MINUS_NINE_MANT{
688b9730SMichael Jones      {0xf387295d242602a7, 0xfdd7645e011abac9, 0x31680a88f8953030,
688b9730SMichael Jones       0x89705f4136b4a597}};
688b9730SMichael Jones
688b9730SMichael Jones  static const fputil::DyadicFloat<INT_SIZE> FIVE_EXP_MINUS_NINE(
e1d64b76SMichael Jones      Sign::POS, -276, FIVE_EXP_MINUS_NINE_MANT);
688b9730SMichael Jones
688b9730SMichael Jones  if (i > 0) {
e1d64b76SMichael Jones    fputil::DyadicFloat<INT_SIZE> fives =
e1d64b76SMichael Jones        fputil::pow_n(FIVE_EXP_MINUS_NINE, static_cast<uint32_t>(i));
688b9730SMichael Jones    num = fives;
688b9730SMichael Jones  }
688b9730SMichael Jones  num = mul_pow_2(num, shift_amount);
688b9730SMichael Jones
688b9730SMichael Jones  // Adding one is part of the formula.
e1d64b76SMichael Jones  UInt<INT_SIZE> int_num = num.as_mantissa_type() + 1;
688b9730SMichael Jones  if (int_num > MOD_SIZE) {
688b9730SMichael Jones    auto rem =
688b9730SMichael Jones        int_num
4e005515Slntue            .div_uint_half_times_pow_2(
4e005515Slntue                EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
688b9730SMichael Jones            .value();
688b9730SMichael Jones    int_num = rem;
688b9730SMichael Jones  }
688b9730SMichael Jones
6a8e6c9aSGuillaume Chatelet  UInt<MID_INT_SIZE> result = int_num;
688b9730SMichael Jones
688b9730SMichael Jones  return result;
688b9730SMichael Jones}
688b9730SMichael Jones
07c0a41bSMichael Jones// The formula for the table when i is negative (or zero) is as follows:
07c0a41bSMichael Jones// floor(10^(-9i) * 2^(c_0 - e)) % (10^9 * 2^c_0)
07c0a41bSMichael Jones// Since we know i is always negative, we just take it as unsigned and treat it
07c0a41bSMichael Jones// as negative. We do the same with exponent, while they're both always negative
07c0a41bSMichael Jones// in theory, in practice they're converted to positive for simpler
07c0a41bSMichael Jones// calculations.
07c0a41bSMichael Jones// The formula being used looks more like this:
07c0a41bSMichael Jones// floor(10^(9*(-i)) * 2^(c_0 + (-e))) % (10^9 * 2^c_0)
688b9730SMichael Jonestemplate <size_t INT_SIZE>
6a8e6c9aSGuillaume ChateletLIBC_INLINE UInt<MID_INT_SIZE> get_table_negative(int exponent, size_t i) {
688b9730SMichael Jones  int shift_amount = CALC_SHIFT_CONST - exponent;
6a8e6c9aSGuillaume Chatelet  UInt<INT_SIZE> num(1);
6a8e6c9aSGuillaume Chatelet  constexpr UInt<INT_SIZE> MOD_SIZE =
6a8e6c9aSGuillaume Chatelet      (UInt<INT_SIZE>(EXP10_9)
688b9730SMichael Jones       << (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
07c0a41bSMichael Jones
07c0a41bSMichael Jones  size_t ten_blocks = i;
07c0a41bSMichael Jones  size_t five_blocks = 0;
07c0a41bSMichael Jones  if (shift_amount < 0) {
688b9730SMichael Jones    int block_shifts = (-shift_amount) / BLOCK_SIZE;
07c0a41bSMichael Jones    if (block_shifts < static_cast<int>(ten_blocks)) {
07c0a41bSMichael Jones      ten_blocks = ten_blocks - block_shifts;
07c0a41bSMichael Jones      five_blocks = block_shifts;
688b9730SMichael Jones      shift_amount = shift_amount + (block_shifts * BLOCK_SIZE);
07c0a41bSMichael Jones    } else {
07c0a41bSMichael Jones      ten_blocks = 0;
07c0a41bSMichael Jones      five_blocks = i;
ab65c9c3Smichaelrj-google      shift_amount = shift_amount + (static_cast<int>(i) * BLOCK_SIZE);
07c0a41bSMichael Jones    }
07c0a41bSMichael Jones  }
07c0a41bSMichael Jones
07c0a41bSMichael Jones  if (five_blocks > 0) {
6a8e6c9aSGuillaume Chatelet    UInt<INT_SIZE> fives(EXP5_9);
07c0a41bSMichael Jones    fives.pow_n(five_blocks);
688b9730SMichael Jones    num = fives;
07c0a41bSMichael Jones  }
07c0a41bSMichael Jones  if (ten_blocks > 0) {
6a8e6c9aSGuillaume Chatelet    UInt<INT_SIZE> tens(EXP10_9);
07c0a41bSMichael Jones    tens.pow_n(ten_blocks);
688b9730SMichael Jones    if (five_blocks <= 0) {
688b9730SMichael Jones      num = tens;
688b9730SMichael Jones    } else {
07c0a41bSMichael Jones      num *= tens;
07c0a41bSMichael Jones    }
688b9730SMichael Jones  }
07c0a41bSMichael Jones
07c0a41bSMichael Jones  if (shift_amount > 0) {
07c0a41bSMichael Jones    num = num << shift_amount;
07c0a41bSMichael Jones  } else {
07c0a41bSMichael Jones    num = num >> (-shift_amount);
07c0a41bSMichael Jones  }
688b9730SMichael Jones  if (num > MOD_SIZE) {
4e005515Slntue    auto rem = num.div_uint_half_times_pow_2(
a621198aSmichaelrj-google                      EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
688b9730SMichael Jones                   .value();
688b9730SMichael Jones    num = rem;
688b9730SMichael Jones  }
07c0a41bSMichael Jones  return num;
07c0a41bSMichael Jones}
07c0a41bSMichael Jones
688b9730SMichael Jonestemplate <size_t INT_SIZE>
6a8e6c9aSGuillaume ChateletLIBC_INLINE UInt<MID_INT_SIZE> get_table_negative_df(int exponent, size_t i) {
688b9730SMichael Jones  static_assert(INT_SIZE == 256,
688b9730SMichael Jones                "Only 256 is supported as an int size right now.");
688b9730SMichael Jones  // This version uses dyadic floats with 256 bit mantissas to perform the same
688b9730SMichael Jones  // calculation as above. Due to floating point imprecision it is only accurate
688b9730SMichael Jones  // for the first 50 digits, but it's much faster. Since even 128 bit long
688b9730SMichael Jones  // doubles are only accurate to ~35 digits, the 50 digits of accuracy are
688b9730SMichael Jones  // enough for these floats to be converted back and forth safely. This is
688b9730SMichael Jones  // ideal for avoiding the size of the long double table.
688b9730SMichael Jones
688b9730SMichael Jones  int shift_amount = CALC_SHIFT_CONST - exponent;
688b9730SMichael Jones
e1d64b76SMichael Jones  fputil::DyadicFloat<INT_SIZE> num(Sign::POS, 0, 1);
6a8e6c9aSGuillaume Chatelet  constexpr UInt<INT_SIZE> MOD_SIZE =
6a8e6c9aSGuillaume Chatelet      (UInt<INT_SIZE>(EXP10_9)
688b9730SMichael Jones       << (CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0)));
688b9730SMichael Jones
6a8e6c9aSGuillaume Chatelet  constexpr UInt<INT_SIZE> TEN_EXP_NINE_MANT(EXP10_9);
688b9730SMichael Jones
e1d64b76SMichael Jones  static const fputil::DyadicFloat<INT_SIZE> TEN_EXP_NINE(Sign::POS, 0,
688b9730SMichael Jones                                                          TEN_EXP_NINE_MANT);
688b9730SMichael Jones
688b9730SMichael Jones  if (i > 0) {
e1d64b76SMichael Jones    fputil::DyadicFloat<INT_SIZE> tens =
e1d64b76SMichael Jones        fputil::pow_n(TEN_EXP_NINE, static_cast<uint32_t>(i));
688b9730SMichael Jones    num = tens;
688b9730SMichael Jones  }
688b9730SMichael Jones  num = mul_pow_2(num, shift_amount);
688b9730SMichael Jones
e1d64b76SMichael Jones  UInt<INT_SIZE> int_num = num.as_mantissa_type();
688b9730SMichael Jones  if (int_num > MOD_SIZE) {
688b9730SMichael Jones    auto rem =
688b9730SMichael Jones        int_num
4e005515Slntue            .div_uint_half_times_pow_2(
4e005515Slntue                EXP10_9, CALC_SHIFT_CONST + (IDX_SIZE > 1 ? IDX_SIZE : 0))
688b9730SMichael Jones            .value();
688b9730SMichael Jones    int_num = rem;
688b9730SMichael Jones  }
688b9730SMichael Jones
6a8e6c9aSGuillaume Chatelet  UInt<MID_INT_SIZE> result = int_num;
688b9730SMichael Jones
688b9730SMichael Jones  return result;
688b9730SMichael Jones}
688b9730SMichael Jones
c09e6905SGuillaume ChateletLIBC_INLINE uint32_t mul_shift_mod_1e9(const FPBits::StorageType mantissa,
6a8e6c9aSGuillaume Chatelet                                       const UInt<MID_INT_SIZE> &large,
07c0a41bSMichael Jones                                       const int32_t shift_amount) {
*7302c8dbSNick Desaulniers  // make sure the number of bits is always divisible by 64
*7302c8dbSNick Desaulniers  UInt<internal::div_ceil(MID_INT_SIZE + FPBits::STORAGE_LEN, 64) * 64> val(
*7302c8dbSNick Desaulniers      large);
44bf4c89SMikhail R. Gadelha  val = (val * mantissa) >> shift_amount;
4e005515Slntue  return static_cast<uint32_t>(
4e005515Slntue      val.div_uint_half_times_pow_2(static_cast<uint32_t>(EXP10_9), 0).value());
07c0a41bSMichael Jones}
07c0a41bSMichael Jones
07c0a41bSMichael Jones} // namespace internal
07c0a41bSMichael Jones
07c0a41bSMichael Jones// Convert floating point values to their string representation.
07c0a41bSMichael Jones// Because the result may not fit in a reasonably sized array, the caller must
// request blocks of digits and convert them from integers to strings
// themselves. Blocks contain the most digits that can be stored in a BlockInt.
// This is 9 digits for a 32 bit int and 18 digits for a 64 bit int.
07c0a41bSMichael Jones// The intended use pattern is to create a FloatToString object of the
07c0a41bSMichael Jones// appropriate type, then call get_positive_blocks to get an approximate number
07c0a41bSMichael Jones// of blocks there are before the decimal point. Now the client code can start
07c0a41bSMichael Jones// calling get_positive_block in a loop from the number of positive blocks to
07c0a41bSMichael Jones// zero. This will give all digits before the decimal point. Then the user can
07c0a41bSMichael Jones// start calling get_negative_block in a loop from 0 until the number of digits
07c0a41bSMichael Jones// they need is reached. As an optimization, the client can use
07c0a41bSMichael Jones// zero_blocks_after_point to find the number of blocks that are guaranteed to
07c0a41bSMichael Jones// be zero after the decimal point and before the non-zero digits. Additionally,
07c0a41bSMichael Jones// is_lowest_block will return if the current block is the lowest non-zero
07c0a41bSMichael Jones// block.
07c0a41bSMichael Jonestemplate <typename T, cpp::enable_if_t<cpp::is_floating_point_v<T>, int> = 0>
07c0a41bSMichael Jonesclass FloatToString {
07c0a41bSMichael Jones  fputil::FPBits<T> float_bits;
07c0a41bSMichael Jones  int exponent;
c09e6905SGuillaume Chatelet  FPBits::StorageType mantissa;
07c0a41bSMichael Jones
3546f4daSGuillaume Chatelet  static constexpr int FRACTION_LEN = fputil::FPBits<T>::FRACTION_LEN;
3546f4daSGuillaume Chatelet  static constexpr int EXP_BIAS = fputil::FPBits<T>::EXP_BIAS;
07c0a41bSMichael Jones
07c0a41bSMichael Jonespublic:
494734b0SSiva Chandra Reddy  LIBC_INLINE constexpr FloatToString(T init_float) : float_bits(init_float) {
455d6780SMichael Jones    exponent = float_bits.get_explicit_exponent();
07c0a41bSMichael Jones    mantissa = float_bits.get_explicit_mantissa();
07c0a41bSMichael Jones
07c0a41bSMichael Jones    // Adjust for the width of the mantissa.
3546f4daSGuillaume Chatelet    exponent -= FRACTION_LEN;
07c0a41bSMichael Jones  }
07c0a41bSMichael Jones
494734b0SSiva Chandra Reddy  LIBC_INLINE constexpr bool is_nan() { return float_bits.is_nan(); }
494734b0SSiva Chandra Reddy  LIBC_INLINE constexpr bool is_inf() { return float_bits.is_inf(); }
494734b0SSiva Chandra Reddy  LIBC_INLINE constexpr bool is_inf_or_nan() {
494734b0SSiva Chandra Reddy    return float_bits.is_inf_or_nan();
494734b0SSiva Chandra Reddy  }
07c0a41bSMichael Jones
07c0a41bSMichael Jones  // get_block returns an integer that represents the digits in the requested
07c0a41bSMichael Jones  // block.
494734b0SSiva Chandra Reddy  LIBC_INLINE constexpr BlockInt get_positive_block(int block_index) {
3546f4daSGuillaume Chatelet    if (exponent >= -FRACTION_LEN) {
07c0a41bSMichael Jones      // idx is ceil(exponent/16) or 0 if exponent is negative. This is used to
07c0a41bSMichael Jones      // find the coarse section of the POW10_SPLIT table that will be used to
07c0a41bSMichael Jones      // calculate the 9 digit window, as well as some other related values.
07c0a41bSMichael Jones      const uint32_t idx =
688b9730SMichael Jones          exponent < 0
688b9730SMichael Jones              ? 0
688b9730SMichael Jones              : static_cast<uint32_t>(exponent + (IDX_SIZE - 1)) / IDX_SIZE;
07c0a41bSMichael Jones
07c0a41bSMichael Jones      // shift_amount = -(c0 - exponent) = c_0 + 16 * ceil(exponent/16) -
07c0a41bSMichael Jones      // exponent
07c0a41bSMichael Jones
a621198aSmichaelrj-google      const uint32_t pos_exp = idx * IDX_SIZE;
a621198aSmichaelrj-google
6a8e6c9aSGuillaume Chatelet      UInt<MID_INT_SIZE> val;
07c0a41bSMichael Jones
688b9730SMichael Jones#if defined(LIBC_COPT_FLOAT_TO_STR_USE_DYADIC_FLOAT)
688b9730SMichael Jones      // ----------------------- DYADIC FLOAT CALC MODE ------------------------
688b9730SMichael Jones      const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
688b9730SMichael Jones      val = internal::get_table_positive_df<256>(IDX_SIZE * idx, block_index);
688b9730SMichael Jones#elif defined(LIBC_COPT_FLOAT_TO_STR_USE_INT_CALC)
688b9730SMichael Jones
688b9730SMichael Jones      // ---------------------------- INT CALC MODE ----------------------------
688b9730SMichael Jones      const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
688b9730SMichael Jones      const uint64_t MAX_POW_2_SIZE =
5bd34e0aSmichaelrj-google          pos_exp + CALC_SHIFT_CONST - (BLOCK_SIZE * block_index);
688b9730SMichael Jones      const uint64_t MAX_POW_5_SIZE =
688b9730SMichael Jones          internal::log2_pow5(BLOCK_SIZE * block_index);
688b9730SMichael Jones      const uint64_t MAX_INT_SIZE =
688b9730SMichael Jones          (MAX_POW_2_SIZE > MAX_POW_5_SIZE) ? MAX_POW_2_SIZE : MAX_POW_5_SIZE;
688b9730SMichael Jones
688b9730SMichael Jones      if (MAX_INT_SIZE < 1024) {
688b9730SMichael Jones        val = internal::get_table_positive<1024>(pos_exp, block_index);
688b9730SMichael Jones      } else if (MAX_INT_SIZE < 2048) {
688b9730SMichael Jones        val = internal::get_table_positive<2048>(pos_exp, block_index);
688b9730SMichael Jones      } else if (MAX_INT_SIZE < 4096) {
688b9730SMichael Jones        val = internal::get_table_positive<4096>(pos_exp, block_index);
688b9730SMichael Jones      } else if (MAX_INT_SIZE < 8192) {
688b9730SMichael Jones        val = internal::get_table_positive<8192>(pos_exp, block_index);
5bd34e0aSmichaelrj-google      } else if (MAX_INT_SIZE < 16384) {
688b9730SMichael Jones        val = internal::get_table_positive<16384>(pos_exp, block_index);
5bd34e0aSmichaelrj-google      } else {
5bd34e0aSmichaelrj-google        val = internal::get_table_positive<16384 + 128>(pos_exp, block_index);
07c0a41bSMichael Jones      }
a621198aSmichaelrj-google#else
a621198aSmichaelrj-google      // ----------------------------- TABLE MODE ------------------------------
a621198aSmichaelrj-google      const int32_t SHIFT_CONST = TABLE_SHIFT_CONST;
a621198aSmichaelrj-google
a621198aSmichaelrj-google      val = POW10_SPLIT[POW10_OFFSET[idx] + block_index];
688b9730SMichael Jones#endif
688b9730SMichael Jones      const uint32_t shift_amount = SHIFT_CONST + pos_exp - exponent;
07c0a41bSMichael Jones
07c0a41bSMichael Jones      const BlockInt digits =
07c0a41bSMichael Jones          internal::mul_shift_mod_1e9(mantissa, val, (int32_t)(shift_amount));
07c0a41bSMichael Jones      return digits;
07c0a41bSMichael Jones    } else {
07c0a41bSMichael Jones      return 0;
07c0a41bSMichael Jones    }
07c0a41bSMichael Jones  }
07c0a41bSMichael Jones
a621198aSmichaelrj-google  LIBC_INLINE constexpr BlockInt get_negative_block(int block_index) {
07c0a41bSMichael Jones    if (exponent < 0) {
688b9730SMichael Jones      const int32_t idx = -exponent / IDX_SIZE;
688b9730SMichael Jones
6a8e6c9aSGuillaume Chatelet      UInt<MID_INT_SIZE> val;
688b9730SMichael Jones
8a0ff194Smichaelrj-google      const uint32_t pos_exp = static_cast<uint32_t>(idx * IDX_SIZE);
a621198aSmichaelrj-google
a621198aSmichaelrj-google#if defined(LIBC_COPT_FLOAT_TO_STR_USE_DYADIC_FLOAT)
a621198aSmichaelrj-google      // ----------------------- DYADIC FLOAT CALC MODE ------------------------
a621198aSmichaelrj-google      const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
a621198aSmichaelrj-google      val = internal::get_table_negative_df<256>(pos_exp, block_index + 1);
a621198aSmichaelrj-google#elif defined(LIBC_COPT_FLOAT_TO_STR_USE_INT_CALC)
a621198aSmichaelrj-google      // ---------------------------- INT CALC MODE ----------------------------
a621198aSmichaelrj-google      const int32_t SHIFT_CONST = CALC_SHIFT_CONST;
a621198aSmichaelrj-google
a621198aSmichaelrj-google      const uint64_t NUM_FIVES = (block_index + 1) * BLOCK_SIZE;
a621198aSmichaelrj-google      // Round MAX_INT_SIZE up to the nearest 64 (adding 1 because log2_pow5
a621198aSmichaelrj-google      // implicitly rounds down).
a621198aSmichaelrj-google      const uint64_t MAX_INT_SIZE =
a621198aSmichaelrj-google          ((internal::log2_pow5(NUM_FIVES) / 64) + 1) * 64;
a621198aSmichaelrj-google
a621198aSmichaelrj-google      if (MAX_INT_SIZE < 1024) {
a621198aSmichaelrj-google        val = internal::get_table_negative<1024>(pos_exp, block_index + 1);
a621198aSmichaelrj-google      } else if (MAX_INT_SIZE < 2048) {
a621198aSmichaelrj-google        val = internal::get_table_negative<2048>(pos_exp, block_index + 1);
a621198aSmichaelrj-google      } else if (MAX_INT_SIZE < 4096) {
a621198aSmichaelrj-google        val = internal::get_table_negative<4096>(pos_exp, block_index + 1);
a621198aSmichaelrj-google      } else if (MAX_INT_SIZE < 8192) {
a621198aSmichaelrj-google        val = internal::get_table_negative<8192>(pos_exp, block_index + 1);
a621198aSmichaelrj-google      } else if (MAX_INT_SIZE < 16384) {
a621198aSmichaelrj-google        val = internal::get_table_negative<16384>(pos_exp, block_index + 1);
a621198aSmichaelrj-google      } else {
a621198aSmichaelrj-google        val = internal::get_table_negative<16384 + 8192>(pos_exp,
a621198aSmichaelrj-google                                                         block_index + 1);
a621198aSmichaelrj-google      }
a621198aSmichaelrj-google#else
a621198aSmichaelrj-google      // ----------------------------- TABLE MODE ------------------------------
07c0a41bSMichael Jones      // if the requested block is zero
a621198aSmichaelrj-google      const int32_t SHIFT_CONST = TABLE_SHIFT_CONST;
bfcfc2a6Smichaelrj-google      if (block_index < MIN_BLOCK_2[idx]) {
07c0a41bSMichael Jones        return 0;
07c0a41bSMichael Jones      }
688b9730SMichael Jones      const uint32_t p = POW10_OFFSET_2[idx] + block_index - MIN_BLOCK_2[idx];
07c0a41bSMichael Jones      // If every digit after the requested block is zero.
07c0a41bSMichael Jones      if (p >= POW10_OFFSET_2[idx + 1]) {
07c0a41bSMichael Jones        return 0;
07c0a41bSMichael Jones      }
a621198aSmichaelrj-google
688b9730SMichael Jones      val = POW10_SPLIT_2[p];
688b9730SMichael Jones#endif
ab65c9c3Smichaelrj-google      const int32_t shift_amount =
a621198aSmichaelrj-google          SHIFT_CONST + (-exponent - static_cast<int32_t>(pos_exp));
a621198aSmichaelrj-google      BlockInt digits =
a621198aSmichaelrj-google          internal::mul_shift_mod_1e9(mantissa, val, shift_amount);
07c0a41bSMichael Jones      return digits;
07c0a41bSMichael Jones    } else {
07c0a41bSMichael Jones      return 0;
07c0a41bSMichael Jones    }
07c0a41bSMichael Jones  }
07c0a41bSMichael Jones
a621198aSmichaelrj-google  LIBC_INLINE constexpr BlockInt get_block(int block_index) {
a621198aSmichaelrj-google    if (block_index >= 0) {
a621198aSmichaelrj-google      return get_positive_block(block_index);
a621198aSmichaelrj-google    } else {
a621198aSmichaelrj-google      return get_negative_block(-1 - block_index);
a621198aSmichaelrj-google    }
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr size_t get_positive_blocks() {
a621198aSmichaelrj-google    if (exponent < -FRACTION_LEN)
a621198aSmichaelrj-google      return 0;
a621198aSmichaelrj-google    const uint32_t idx =
a621198aSmichaelrj-google        exponent < 0
a621198aSmichaelrj-google            ? 0
a621198aSmichaelrj-google            : static_cast<uint32_t>(exponent + (IDX_SIZE - 1)) / IDX_SIZE;
a621198aSmichaelrj-google    return internal::length_for_num(idx * IDX_SIZE, FRACTION_LEN);
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  // This takes the index of a block after the decimal point (a negative block)
a621198aSmichaelrj-google  // and return if it's sure that all of the digits after it are zero.
a621198aSmichaelrj-google  LIBC_INLINE constexpr bool is_lowest_block(size_t negative_block_index) {
a621198aSmichaelrj-google#ifdef LIBC_COPT_FLOAT_TO_STR_NO_TABLE
a621198aSmichaelrj-google    // The decimal representation of 2**(-i) will have exactly i digits after
a621198aSmichaelrj-google    // the decimal point.
a621198aSmichaelrj-google    int num_requested_digits =
a621198aSmichaelrj-google        static_cast<int>((negative_block_index + 1) * BLOCK_SIZE);
a621198aSmichaelrj-google
a621198aSmichaelrj-google    return num_requested_digits > -exponent;
a621198aSmichaelrj-google#else
a621198aSmichaelrj-google    const int32_t idx = -exponent / IDX_SIZE;
a621198aSmichaelrj-google    const size_t p =
a621198aSmichaelrj-google        POW10_OFFSET_2[idx] + negative_block_index - MIN_BLOCK_2[idx];
a621198aSmichaelrj-google    // If the remaining digits are all 0, then this is the lowest block.
a621198aSmichaelrj-google    return p >= POW10_OFFSET_2[idx + 1];
a621198aSmichaelrj-google#endif
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr size_t zero_blocks_after_point() {
a621198aSmichaelrj-google#ifdef LIBC_COPT_FLOAT_TO_STR_NO_TABLE
a621198aSmichaelrj-google    if (exponent < -FRACTION_LEN) {
a621198aSmichaelrj-google      const int pos_exp = -exponent - 1;
a621198aSmichaelrj-google      const uint32_t pos_idx =
a621198aSmichaelrj-google          static_cast<uint32_t>(pos_exp + (IDX_SIZE - 1)) / IDX_SIZE;
a621198aSmichaelrj-google      const int32_t pos_len = ((internal::ceil_log10_pow2(pos_idx * IDX_SIZE) -
a621198aSmichaelrj-google                                internal::ceil_log10_pow2(FRACTION_LEN + 1)) /
a621198aSmichaelrj-google                               BLOCK_SIZE) -
a621198aSmichaelrj-google                              1;
a621198aSmichaelrj-google      return static_cast<uint32_t>(pos_len > 0 ? pos_len : 0);
a621198aSmichaelrj-google    }
a621198aSmichaelrj-google    return 0;
a621198aSmichaelrj-google#else
a621198aSmichaelrj-google    return MIN_BLOCK_2[-exponent / IDX_SIZE];
a621198aSmichaelrj-google#endif
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google};
a621198aSmichaelrj-google
f7d4236aSGuillaume Chatelet#if !defined(LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64) &&                             \
a621198aSmichaelrj-google    !defined(LIBC_COPT_FLOAT_TO_STR_NO_SPECIALIZE_LD)
a621198aSmichaelrj-google// --------------------------- LONG DOUBLE FUNCTIONS ---------------------------
a621198aSmichaelrj-google
a621198aSmichaelrj-google// this algorithm will work exactly the same for 80 bit and 128 bit long
a621198aSmichaelrj-google// doubles. They have the same max exponent, but even if they didn't the
a621198aSmichaelrj-google// constants should be calculated to be correct for any provided floating point
a621198aSmichaelrj-google// type.
a621198aSmichaelrj-google
a621198aSmichaelrj-googletemplate <> class FloatToString<long double> {
a621198aSmichaelrj-google  fputil::FPBits<long double> float_bits;
a621198aSmichaelrj-google  bool is_negative = 0;
a621198aSmichaelrj-google  int exponent = 0;
a621198aSmichaelrj-google  FPBits::StorageType mantissa = 0;
a621198aSmichaelrj-google
a621198aSmichaelrj-google  static constexpr int FRACTION_LEN = fputil::FPBits<long double>::FRACTION_LEN;
a621198aSmichaelrj-google  static constexpr int EXP_BIAS = fputil::FPBits<long double>::EXP_BIAS;
a621198aSmichaelrj-google  static constexpr size_t UINT_WORD_SIZE = 64;
a621198aSmichaelrj-google
a621198aSmichaelrj-google  static constexpr size_t FLOAT_AS_INT_WIDTH =
a621198aSmichaelrj-google      internal::div_ceil(fputil::FPBits<long double>::MAX_BIASED_EXPONENT -
a621198aSmichaelrj-google                             FPBits::EXP_BIAS,
a621198aSmichaelrj-google                         UINT_WORD_SIZE) *
a621198aSmichaelrj-google      UINT_WORD_SIZE;
a621198aSmichaelrj-google  static constexpr size_t EXTRA_INT_WIDTH =
a621198aSmichaelrj-google      internal::div_ceil(sizeof(long double) * CHAR_BIT, UINT_WORD_SIZE) *
a621198aSmichaelrj-google      UINT_WORD_SIZE;
a621198aSmichaelrj-google
6a8e6c9aSGuillaume Chatelet  using wide_int = UInt<FLOAT_AS_INT_WIDTH + EXTRA_INT_WIDTH>;
a621198aSmichaelrj-google
a621198aSmichaelrj-google  // float_as_fixed represents the floating point number as a fixed point number
a621198aSmichaelrj-google  // with the point EXTRA_INT_WIDTH bits from the left of the number. This can
a621198aSmichaelrj-google  // store any number with a negative exponent.
a621198aSmichaelrj-google  wide_int float_as_fixed = 0;
a621198aSmichaelrj-google  int int_block_index = 0;
a621198aSmichaelrj-google
a621198aSmichaelrj-google  static constexpr size_t BLOCK_BUFFER_LEN =
6812bc40Smichaelrj-google      internal::div_ceil(internal::log10_pow2(FLOAT_AS_INT_WIDTH), BLOCK_SIZE) +
6812bc40Smichaelrj-google      1;
a621198aSmichaelrj-google  BlockInt block_buffer[BLOCK_BUFFER_LEN] = {0};
a621198aSmichaelrj-google  size_t block_buffer_valid = 0;
a621198aSmichaelrj-google
a621198aSmichaelrj-google  template <size_t Bits>
6a8e6c9aSGuillaume Chatelet  LIBC_INLINE static constexpr BlockInt grab_digits(UInt<Bits> &int_num) {
4e005515Slntue    auto wide_result = int_num.div_uint_half_times_pow_2(EXP5_9, 9);
a621198aSmichaelrj-google    // the optional only comes into effect when dividing by 0, which will
a621198aSmichaelrj-google    // never happen here. Thus, we just assert that it has value.
a621198aSmichaelrj-google    LIBC_ASSERT(wide_result.has_value());
a621198aSmichaelrj-google    return static_cast<BlockInt>(wide_result.value());
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE static constexpr void zero_leading_digits(wide_int &int_num) {
a621198aSmichaelrj-google    // WORD_SIZE is the width of the numbers used to internally represent the
a621198aSmichaelrj-google    // UInt
a621198aSmichaelrj-google    for (size_t i = 0; i < EXTRA_INT_WIDTH / wide_int::WORD_SIZE; ++i)
a621198aSmichaelrj-google      int_num[i + (FLOAT_AS_INT_WIDTH / wide_int::WORD_SIZE)] = 0;
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  // init_convert initializes float_as_int, cur_block, and block_buffer based on
a621198aSmichaelrj-google  // the mantissa and exponent of the initial number. Calling it will always
a621198aSmichaelrj-google  // return the class to the starting state.
a621198aSmichaelrj-google  LIBC_INLINE constexpr void init_convert() {
a621198aSmichaelrj-google    // No calculation necessary for the 0 case.
a621198aSmichaelrj-google    if (mantissa == 0 && exponent == 0)
a621198aSmichaelrj-google      return;
a621198aSmichaelrj-google
a621198aSmichaelrj-google    if (exponent > 0) {
a621198aSmichaelrj-google      // if the exponent is positive, then the number is fully above the decimal
a621198aSmichaelrj-google      // point. In this case we represent the float as an integer, then divide
a621198aSmichaelrj-google      // by 10^BLOCK_SIZE and take the remainder as our next block. This
a621198aSmichaelrj-google      // generates the digits from right to left, but the digits will be written
a621198aSmichaelrj-google      // from left to right, so it caches the results so they can be read in
a621198aSmichaelrj-google      // reverse order.
a621198aSmichaelrj-google
a621198aSmichaelrj-google      wide_int float_as_int = mantissa;
a621198aSmichaelrj-google
71c3f5d6SGuillaume Chatelet      float_as_int <<= exponent;
a621198aSmichaelrj-google      int_block_index = 0;
a621198aSmichaelrj-google
a621198aSmichaelrj-google      while (float_as_int > 0) {
6812bc40Smichaelrj-google        LIBC_ASSERT(int_block_index < static_cast<int>(BLOCK_BUFFER_LEN));
4e005515Slntue        block_buffer[int_block_index] =
4e005515Slntue            grab_digits<FLOAT_AS_INT_WIDTH + EXTRA_INT_WIDTH>(float_as_int);
a621198aSmichaelrj-google        ++int_block_index;
a621198aSmichaelrj-google      }
a621198aSmichaelrj-google      block_buffer_valid = int_block_index;
a621198aSmichaelrj-google
a621198aSmichaelrj-google    } else {
a621198aSmichaelrj-google      // if the exponent is not positive, then the number is at least partially
a621198aSmichaelrj-google      // below the decimal point. In this case we represent the float as a fixed
a621198aSmichaelrj-google      // point number with the decimal point after the top EXTRA_INT_WIDTH bits.
a621198aSmichaelrj-google      float_as_fixed = mantissa;
a621198aSmichaelrj-google
a621198aSmichaelrj-google      const int SHIFT_AMOUNT = FLOAT_AS_INT_WIDTH + exponent;
a621198aSmichaelrj-google      static_assert(EXTRA_INT_WIDTH >= sizeof(long double) * 8);
71c3f5d6SGuillaume Chatelet      float_as_fixed <<= SHIFT_AMOUNT;
a621198aSmichaelrj-google
a621198aSmichaelrj-google      // If there are still digits above the decimal point, handle those.
71c3f5d6SGuillaume Chatelet      if (cpp::countl_zero(float_as_fixed) <
71c3f5d6SGuillaume Chatelet          static_cast<int>(EXTRA_INT_WIDTH)) {
6a8e6c9aSGuillaume Chatelet        UInt<EXTRA_INT_WIDTH> above_decimal_point =
a621198aSmichaelrj-google            float_as_fixed >> FLOAT_AS_INT_WIDTH;
a621198aSmichaelrj-google
a621198aSmichaelrj-google        size_t positive_int_block_index = 0;
a621198aSmichaelrj-google        while (above_decimal_point > 0) {
a621198aSmichaelrj-google          block_buffer[positive_int_block_index] =
4e005515Slntue              grab_digits<EXTRA_INT_WIDTH>(above_decimal_point);
a621198aSmichaelrj-google          ++positive_int_block_index;
a621198aSmichaelrj-google        }
a621198aSmichaelrj-google        block_buffer_valid = positive_int_block_index;
a621198aSmichaelrj-google
a621198aSmichaelrj-google        // Zero all digits above the decimal point.
a621198aSmichaelrj-google        zero_leading_digits(float_as_fixed);
a621198aSmichaelrj-google        int_block_index = 0;
a621198aSmichaelrj-google      }
a621198aSmichaelrj-google    }
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-googlepublic:
a621198aSmichaelrj-google  LIBC_INLINE constexpr FloatToString(long double init_float)
a621198aSmichaelrj-google      : float_bits(init_float) {
a621198aSmichaelrj-google    is_negative = float_bits.is_neg();
a621198aSmichaelrj-google    exponent = float_bits.get_explicit_exponent();
a621198aSmichaelrj-google    mantissa = float_bits.get_explicit_mantissa();
a621198aSmichaelrj-google
a621198aSmichaelrj-google    // Adjust for the width of the mantissa.
a621198aSmichaelrj-google    exponent -= FRACTION_LEN;
a621198aSmichaelrj-google
a621198aSmichaelrj-google    this->init_convert();
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr size_t get_positive_blocks() {
a621198aSmichaelrj-google    if (exponent < -FRACTION_LEN)
a621198aSmichaelrj-google      return 0;
a621198aSmichaelrj-google
a621198aSmichaelrj-google    const uint32_t idx =
a621198aSmichaelrj-google        exponent < 0
a621198aSmichaelrj-google            ? 0
a621198aSmichaelrj-google            : static_cast<uint32_t>(exponent + (IDX_SIZE - 1)) / IDX_SIZE;
a621198aSmichaelrj-google    return internal::length_for_num(idx * IDX_SIZE, FRACTION_LEN);
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr size_t zero_blocks_after_point() {
a621198aSmichaelrj-google#ifdef LIBC_COPT_FLOAT_TO_STR_USE_MEGA_LONG_DOUBLE_TABLE
a621198aSmichaelrj-google    return MIN_BLOCK_2[-exponent / IDX_SIZE];
a621198aSmichaelrj-google#else
a621198aSmichaelrj-google    if (exponent >= -FRACTION_LEN)
a621198aSmichaelrj-google      return 0;
a621198aSmichaelrj-google
a621198aSmichaelrj-google    const int pos_exp = -exponent - 1;
a621198aSmichaelrj-google    const uint32_t pos_idx =
a621198aSmichaelrj-google        static_cast<uint32_t>(pos_exp + (IDX_SIZE - 1)) / IDX_SIZE;
a621198aSmichaelrj-google    const int32_t pos_len = ((internal::ceil_log10_pow2(pos_idx * IDX_SIZE) -
a621198aSmichaelrj-google                              internal::ceil_log10_pow2(FRACTION_LEN + 1)) /
a621198aSmichaelrj-google                             BLOCK_SIZE) -
a621198aSmichaelrj-google                            1;
a621198aSmichaelrj-google    return static_cast<uint32_t>(pos_len > 0 ? pos_len : 0);
a621198aSmichaelrj-google#endif
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr bool is_lowest_block(size_t negative_block_index) {
a621198aSmichaelrj-google    // The decimal representation of 2**(-i) will have exactly i digits after
a621198aSmichaelrj-google    // the decimal point.
a621198aSmichaelrj-google    const int num_requested_digits =
a621198aSmichaelrj-google        static_cast<int>((negative_block_index + 1) * BLOCK_SIZE);
a621198aSmichaelrj-google
a621198aSmichaelrj-google    return num_requested_digits > -exponent;
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr BlockInt get_positive_block(int block_index) {
a621198aSmichaelrj-google    if (exponent < -FRACTION_LEN)
a621198aSmichaelrj-google      return 0;
a621198aSmichaelrj-google    if (block_index > static_cast<int>(block_buffer_valid) || block_index < 0)
a621198aSmichaelrj-google      return 0;
a621198aSmichaelrj-google
6812bc40Smichaelrj-google    LIBC_ASSERT(block_index < static_cast<int>(BLOCK_BUFFER_LEN));
6812bc40Smichaelrj-google
a621198aSmichaelrj-google    return block_buffer[block_index];
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr BlockInt get_negative_block(int negative_block_index) {
a621198aSmichaelrj-google    if (exponent >= 0)
a621198aSmichaelrj-google      return 0;
a621198aSmichaelrj-google
a621198aSmichaelrj-google    // negative_block_index starts at 0 with the first block after the decimal
a621198aSmichaelrj-google    // point, and 1 with the second and so on. This converts to the same
a621198aSmichaelrj-google    // block_index used everywhere else.
a621198aSmichaelrj-google
a621198aSmichaelrj-google    const int block_index = -1 - negative_block_index;
a621198aSmichaelrj-google
a621198aSmichaelrj-google    // If we're currently after the requested block (remember these are
a621198aSmichaelrj-google    // negative indices) we reset the number to the start. This is only
a621198aSmichaelrj-google    // likely to happen in %g calls. This will also reset int_block_index.
a621198aSmichaelrj-google    // if (block_index > int_block_index) {
a621198aSmichaelrj-google    //   init_convert();
a621198aSmichaelrj-google    // }
a621198aSmichaelrj-google
a621198aSmichaelrj-google    // Printf is the only existing user of this code and it will only ever move
a621198aSmichaelrj-google    // downwards, except for %g but that currently creates a second
a621198aSmichaelrj-google    // float_to_string object so this assertion still holds. If a new user needs
a621198aSmichaelrj-google    // the ability to step backwards, uncomment the code above.
a621198aSmichaelrj-google    LIBC_ASSERT(block_index <= int_block_index);
a621198aSmichaelrj-google
a621198aSmichaelrj-google    // If we are currently before the requested block. Step until we reach the
a621198aSmichaelrj-google    // requested block. This is likely to only be one step.
a621198aSmichaelrj-google    while (block_index < int_block_index) {
a621198aSmichaelrj-google      zero_leading_digits(float_as_fixed);
a621198aSmichaelrj-google      float_as_fixed.mul(EXP10_9);
a621198aSmichaelrj-google      --int_block_index;
a621198aSmichaelrj-google    }
a621198aSmichaelrj-google
a621198aSmichaelrj-google    // We're now on the requested block, return the current block.
a621198aSmichaelrj-google    return static_cast<BlockInt>(float_as_fixed >> FLOAT_AS_INT_WIDTH);
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google
a621198aSmichaelrj-google  LIBC_INLINE constexpr BlockInt get_block(int block_index) {
a621198aSmichaelrj-google    if (block_index >= 0)
a621198aSmichaelrj-google      return get_positive_block(block_index);
a621198aSmichaelrj-google
a621198aSmichaelrj-google    return get_negative_block(-1 - block_index);
a621198aSmichaelrj-google  }
a621198aSmichaelrj-google};
a621198aSmichaelrj-google
f7d4236aSGuillaume Chatelet#endif // !LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64 &&
a621198aSmichaelrj-google       // !LIBC_COPT_FLOAT_TO_STR_NO_SPECIALIZE_LD
688b9730SMichael Jones
5ff3ff33SPetr Hosek} // namespace LIBC_NAMESPACE_DECL
07c0a41bSMichael Jones
270547f3SGuillaume Chatelet#endif // LLVM_LIBC_SRC___SUPPORT_FLOAT_TO_STRING_H