src/__support/str_to_float.h

87c01607SMichael Jones//===-- String to float conversion utils ------------------------*- C++ -*-===//
87c01607SMichael Jones//
87c01607SMichael Jones// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
87c01607SMichael Jones// See https://llvm.org/LICENSE.txt for license information.
87c01607SMichael Jones// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
87c01607SMichael Jones//
87c01607SMichael Jones//===----------------------------------------------------------------------===//
87c01607SMichael Jones
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
6c4267fbSMichael Jones//                               **** WARNING ****
6c4267fbSMichael Jones// This file is shared with libc++. You should also be careful when adding
6c4267fbSMichael Jones// dependencies to this file, since it needs to build for all libc++ targets.
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
6c4267fbSMichael Jones
270547f3SGuillaume Chatelet#ifndef LLVM_LIBC_SRC___SUPPORT_STR_TO_FLOAT_H
270547f3SGuillaume Chatelet#define LLVM_LIBC_SRC___SUPPORT_STR_TO_FLOAT_H
87c01607SMichael Jones
c703e657SGuillaume Chatelet#include "src/__support/CPP/bit.h"
91eb0b65SGuillaume Chatelet#include "src/__support/CPP/limits.h"
cb3c41c2SMichael Jones#include "src/__support/CPP/optional.h"
0504e932SNishant Mittal#include "src/__support/CPP/string_view.h"
87c01607SMichael Jones#include "src/__support/FPUtil/FPBits.h"
a9824312STue Ly#include "src/__support/FPUtil/rounding_mode.h"
59c809cdSSiva Chandra Reddy#include "src/__support/common.h"
87c01607SMichael Jones#include "src/__support/ctype_utils.h"
87c01607SMichael Jones#include "src/__support/detailed_powers_of_ten.h"
87c01607SMichael Jones#include "src/__support/high_precision_decimal.h"
5ff3ff33SPetr Hosek#include "src/__support/macros/config.h"
1896ee38Slntue#include "src/__support/macros/null_check.h"
1896ee38Slntue#include "src/__support/macros/optimization.h"
31d797f4SMichael Jones#include "src/__support/str_to_integer.h"
cb3c41c2SMichael Jones#include "src/__support/str_to_num_result.h"
09efe848SGuillaume Chatelet#include "src/__support/uint128.h"
04a9c625SMichael Jones#include "src/errno/libc_errno.h" // For ERANGE
87c01607SMichael Jones
d851b5c1SMichael Jones#include <stdint.h>
d851b5c1SMichael Jones
5ff3ff33SPetr Hoseknamespace LIBC_NAMESPACE_DECL {
87c01607SMichael Jonesnamespace internal {
87c01607SMichael Jones
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
6c4267fbSMichael Jones//                               **** WARNING ****
6c4267fbSMichael Jones// This interface is shared with libc++, if you change this interface you need
6c4267fbSMichael Jones// to update it in both libc and libc++.
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
cb3c41c2SMichael Jonestemplate <class T> struct ExpandedFloat {
3546f4daSGuillaume Chatelet  typename fputil::FPBits<T>::StorageType mantissa;
cb3c41c2SMichael Jones  int32_t exponent;
cb3c41c2SMichael Jones};
cb3c41c2SMichael Jones
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
6c4267fbSMichael Jones//                               **** WARNING ****
6c4267fbSMichael Jones// This interface is shared with libc++, if you change this interface you need
6c4267fbSMichael Jones// to update it in both libc and libc++.
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
cb3c41c2SMichael Jonestemplate <class T> struct FloatConvertReturn {
cb3c41c2SMichael Jones  ExpandedFloat<T> num = {0, 0};
cb3c41c2SMichael Jones  int error = 0;
cb3c41c2SMichael Jones};
cb3c41c2SMichael Jones
59c809cdSSiva Chandra ReddyLIBC_INLINE uint64_t low64(const UInt128 &num) {
87c01607SMichael Jones  return static_cast<uint64_t>(num & 0xffffffffffffffff);
87c01607SMichael Jones}
87c01607SMichael Jones
59c809cdSSiva Chandra ReddyLIBC_INLINE uint64_t high64(const UInt128 &num) {
87c01607SMichael Jones  return static_cast<uint64_t>(num >> 64);
87c01607SMichael Jones}
87c01607SMichael Jones
59c809cdSSiva Chandra Reddytemplate <class T> LIBC_INLINE void set_implicit_bit(fputil::FPBits<T> &) {
59c809cdSSiva Chandra Reddy  return;
59c809cdSSiva Chandra Reddy}
aa1902f9SMichael Jones
f7d4236aSGuillaume Chatelet#if defined(LIBC_TYPES_LONG_DOUBLE_IS_X86_FLOAT80)
aa1902f9SMichael Jonestemplate <>
494734b0SSiva Chandra ReddyLIBC_INLINE void
494734b0SSiva Chandra Reddyset_implicit_bit<long double>(fputil::FPBits<long double> &result) {
7b387d27SGuillaume Chatelet  result.set_implicit_bit(result.get_biased_exponent() != 0);
aa1902f9SMichael Jones}
f7d4236aSGuillaume Chatelet#endif // LIBC_TYPES_LONG_DOUBLE_IS_X86_FLOAT80
aa1902f9SMichael Jones
87c01607SMichael Jones// This Eisel-Lemire implementation is based on the algorithm described in the
87c01607SMichael Jones// paper Number Parsing at a Gigabyte per Second, Software: Practice and
87c01607SMichael Jones// Experience 51 (8), 2021 (https://arxiv.org/abs/2101.11408), as well as the
87c01607SMichael Jones// description by Nigel Tao
87c01607SMichael Jones// (https://nigeltao.github.io/blog/2020/eisel-lemire.html) and the golang
87c01607SMichael Jones// implementation, also by Nigel Tao
87c01607SMichael Jones// (https://github.com/golang/go/blob/release-branch.go1.16/src/strconv/eisel_lemire.go#L25)
87c01607SMichael Jones// for some optimizations as well as handling 32 bit floats.
87c01607SMichael Jonestemplate <class T>
cb3c41c2SMichael JonesLIBC_INLINE cpp::optional<ExpandedFloat<T>>
cb3c41c2SMichael Joneseisel_lemire(ExpandedFloat<T> init_num,
cb3c41c2SMichael Jones             RoundDirection round = RoundDirection::Nearest) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
87c01607SMichael Jones
3546f4daSGuillaume Chatelet  StorageType mantissa = init_num.mantissa;
cb3c41c2SMichael Jones  int32_t exp10 = init_num.exponent;
cb3c41c2SMichael Jones
87c01607SMichael Jones  if (sizeof(T) > 8) { // This algorithm cannot handle anything longer than a
87c01607SMichael Jones                       // double, so we skip straight to the fallback.
cb3c41c2SMichael Jones    return cpp::nullopt;
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Exp10 Range
87c01607SMichael Jones  if (exp10 < DETAILED_POWERS_OF_TEN_MIN_EXP_10 ||
87c01607SMichael Jones      exp10 > DETAILED_POWERS_OF_TEN_MAX_EXP_10) {
cb3c41c2SMichael Jones    return cpp::nullopt;
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Normalization
3546f4daSGuillaume Chatelet  uint32_t clz = cpp::countl_zero<StorageType>(mantissa);
87c01607SMichael Jones  mantissa <<= clz;
87c01607SMichael Jones
3546f4daSGuillaume Chatelet  int32_t exp2 =
c09e6905SGuillaume Chatelet      exp10_to_exp2(exp10) + FPBits::STORAGE_LEN + FPBits::EXP_BIAS - clz;
87c01607SMichael Jones
87c01607SMichael Jones  // Multiplication
1c92911eSMichael Jones  const uint64_t *power_of_ten =
87c01607SMichael Jones      DETAILED_POWERS_OF_TEN[exp10 - DETAILED_POWERS_OF_TEN_MIN_EXP_10];
87c01607SMichael Jones
300f8da8SSiva Chandra Reddy  UInt128 first_approx =
300f8da8SSiva Chandra Reddy      static_cast<UInt128>(mantissa) * static_cast<UInt128>(power_of_ten[1]);
87c01607SMichael Jones
87c01607SMichael Jones  // Wider Approximation
300f8da8SSiva Chandra Reddy  UInt128 final_approx;
87c01607SMichael Jones  // The halfway constant is used to check if the bits that will be shifted away
87c01607SMichael Jones  // intially are all 1. For doubles this is 64 (bitstype size) - 52 (final
87c01607SMichael Jones  // mantissa size) - 3 (we shift away the last two bits separately for
aa1902f9SMichael Jones  // accuracy, and the most significant bit is ignored.) = 9 bits. Similarly,
aa1902f9SMichael Jones  // it's 6 bits for floats in this case.
aa1902f9SMichael Jones  const uint64_t halfway_constant =
c09e6905SGuillaume Chatelet      (uint64_t(1) << (FPBits::STORAGE_LEN - (FPBits::FRACTION_LEN + 3))) - 1;
1c92911eSMichael Jones  if ((high64(first_approx) & halfway_constant) == halfway_constant &&
1c92911eSMichael Jones      low64(first_approx) + mantissa < mantissa) {
300f8da8SSiva Chandra Reddy    UInt128 low_bits =
300f8da8SSiva Chandra Reddy        static_cast<UInt128>(mantissa) * static_cast<UInt128>(power_of_ten[0]);
300f8da8SSiva Chandra Reddy    UInt128 second_approx =
300f8da8SSiva Chandra Reddy        first_approx + static_cast<UInt128>(high64(low_bits));
87c01607SMichael Jones
1c92911eSMichael Jones    if ((high64(second_approx) & halfway_constant) == halfway_constant &&
1c92911eSMichael Jones        low64(second_approx) + 1 == 0 &&
1c92911eSMichael Jones        low64(low_bits) + mantissa < mantissa) {
cb3c41c2SMichael Jones      return cpp::nullopt;
87c01607SMichael Jones    }
1c92911eSMichael Jones    final_approx = second_approx;
87c01607SMichael Jones  } else {
1c92911eSMichael Jones    final_approx = first_approx;
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Shifting to 54 bits for doubles and 25 bits for floats
3546f4daSGuillaume Chatelet  StorageType msb = static_cast<StorageType>(high64(final_approx) >>
c09e6905SGuillaume Chatelet                                             (FPBits::STORAGE_LEN - 1));
3546f4daSGuillaume Chatelet  StorageType final_mantissa = static_cast<StorageType>(
c703e657SGuillaume Chatelet      high64(final_approx) >>
c09e6905SGuillaume Chatelet      (msb + FPBits::STORAGE_LEN - (FPBits::FRACTION_LEN + 3)));
2e8fa86eSAlex Brachet  exp2 -= static_cast<uint32_t>(1 ^ msb); // same as !msb
87c01607SMichael Jones
cb3c41c2SMichael Jones  if (round == RoundDirection::Nearest) {
87c01607SMichael Jones    // Half-way ambiguity
1c92911eSMichael Jones    if (low64(final_approx) == 0 &&
1c92911eSMichael Jones        (high64(final_approx) & halfway_constant) == 0 &&
1c92911eSMichael Jones        (final_mantissa & 3) == 1) {
cb3c41c2SMichael Jones      return cpp::nullopt;
87c01607SMichael Jones    }
87c01607SMichael Jones
cb3c41c2SMichael Jones    // Round to even.
1c92911eSMichael Jones    final_mantissa += final_mantissa & 1;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  } else if (round == RoundDirection::Up) {
cb3c41c2SMichael Jones    // If any of the bits being rounded away are non-zero, then round up.
cb3c41c2SMichael Jones    if (low64(final_approx) > 0 ||
cb3c41c2SMichael Jones        (high64(final_approx) & halfway_constant) > 0) {
cb3c41c2SMichael Jones      // Add two since the last current lowest bit is about to be shifted away.
cb3c41c2SMichael Jones      final_mantissa += 2;
cb3c41c2SMichael Jones    }
cb3c41c2SMichael Jones  }
cb3c41c2SMichael Jones  // else round down, which has no effect.
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  // From 54 to 53 bits for doubles and 25 to 24 bits for floats
1c92911eSMichael Jones  final_mantissa >>= 1;
c09e6905SGuillaume Chatelet  if ((final_mantissa >> (FPBits::FRACTION_LEN + 1)) > 0) {
1c92911eSMichael Jones    final_mantissa >>= 1;
87c01607SMichael Jones    ++exp2;
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // The if block is equivalent to (but has fewer branches than):
87c01607SMichael Jones  //   if exp2 <= 0 || exp2 >= 0x7FF { etc }
c09e6905SGuillaume Chatelet  if (static_cast<uint32_t>(exp2) - 1 >= (1 << FPBits::EXP_LEN) - 2) {
cb3c41c2SMichael Jones    return cpp::nullopt;
87c01607SMichael Jones  }
87c01607SMichael Jones
cb3c41c2SMichael Jones  ExpandedFloat<T> output;
cb3c41c2SMichael Jones  output.mantissa = final_mantissa;
cb3c41c2SMichael Jones  output.exponent = exp2;
cb3c41c2SMichael Jones  return output;
87c01607SMichael Jones}
87c01607SMichael Jones
// TODO: Re-enable Eisel-Lemire for the case where long double is double double
// once that format is properly supported.
7eb32644SMichael Jones#if !defined(LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64) &&                             \
7eb32644SMichael Jones    !defined(LIBC_TYPES_LONG_DOUBLE_IS_DOUBLE_DOUBLE)
9b397371SMichael Jonestemplate <>
cb3c41c2SMichael JonesLIBC_INLINE cpp::optional<ExpandedFloat<long double>>
cb3c41c2SMichael Joneseisel_lemire<long double>(ExpandedFloat<long double> init_num,
cb3c41c2SMichael Jones                          RoundDirection round) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<long double>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
cb3c41c2SMichael Jones
7302c8dbSNick Desaulniers  UInt128 mantissa = init_num.mantissa;
cb3c41c2SMichael Jones  int32_t exp10 = init_num.exponent;
cb3c41c2SMichael Jones
9b397371SMichael Jones  // Exp10 Range
9b397371SMichael Jones  // This doesn't reach very far into the range for long doubles, since it's
9b397371SMichael Jones  // sized for doubles and their 11 exponent bits, and not for long doubles and
9b397371SMichael Jones  // their 15 exponent bits (max exponent of ~300 for double vs ~5000 for long
9b397371SMichael Jones  // double). This is a known tradeoff, and was made because a proper long
9b397371SMichael Jones  // double table would be approximately 16 times larger. This would have
9b397371SMichael Jones  // significant memory and storage costs all the time to speed up a relatively
9b397371SMichael Jones  // uncommon path. In addition the exp10_to_exp2 function only approximates
9b397371SMichael Jones  // multiplying by log(10)/log(2), and that approximation may not be accurate
9b397371SMichael Jones  // out to the full long double range.
9b397371SMichael Jones  if (exp10 < DETAILED_POWERS_OF_TEN_MIN_EXP_10 ||
9b397371SMichael Jones      exp10 > DETAILED_POWERS_OF_TEN_MAX_EXP_10) {
cb3c41c2SMichael Jones    return cpp::nullopt;
9b397371SMichael Jones  }
9b397371SMichael Jones
9b397371SMichael Jones  // Normalization
7302c8dbSNick Desaulniers  uint32_t clz = cpp::countl_zero(mantissa) -
7302c8dbSNick Desaulniers                 ((sizeof(UInt128) - sizeof(StorageType)) * CHAR_BIT);
9b397371SMichael Jones  mantissa <<= clz;
9b397371SMichael Jones
3546f4daSGuillaume Chatelet  int32_t exp2 =
c09e6905SGuillaume Chatelet      exp10_to_exp2(exp10) + FPBits::STORAGE_LEN + FPBits::EXP_BIAS - clz;
9b397371SMichael Jones
9b397371SMichael Jones  // Multiplication
9b397371SMichael Jones  const uint64_t *power_of_ten =
9b397371SMichael Jones      DETAILED_POWERS_OF_TEN[exp10 - DETAILED_POWERS_OF_TEN_MIN_EXP_10];
9b397371SMichael Jones
9b397371SMichael Jones  // Since the input mantissa is more than 64 bits, we have to multiply with the
9b397371SMichael Jones  // full 128 bits of the power of ten to get an approximation with the same
9b397371SMichael Jones  // number of significant bits. This means that we only get the one
9b397371SMichael Jones  // approximation, and that approximation is 256 bits long.
300f8da8SSiva Chandra Reddy  UInt128 approx_upper = static_cast<UInt128>(high64(mantissa)) *
300f8da8SSiva Chandra Reddy                         static_cast<UInt128>(power_of_ten[1]);
9b397371SMichael Jones
ae3b59e6SMichael Jones  UInt128 approx_middle_a = static_cast<UInt128>(high64(mantissa)) *
ae3b59e6SMichael Jones                            static_cast<UInt128>(power_of_ten[0]);
ae3b59e6SMichael Jones  UInt128 approx_middle_b = static_cast<UInt128>(low64(mantissa)) *
300f8da8SSiva Chandra Reddy                            static_cast<UInt128>(power_of_ten[1]);
9b397371SMichael Jones
ae3b59e6SMichael Jones  UInt128 approx_middle = approx_middle_a + approx_middle_b;
ae3b59e6SMichael Jones
ae3b59e6SMichael Jones  // Handle overflow in the middle
ae3b59e6SMichael Jones  approx_upper += (approx_middle < approx_middle_a) ? UInt128(1) << 64 : 0;
ae3b59e6SMichael Jones
300f8da8SSiva Chandra Reddy  UInt128 approx_lower = static_cast<UInt128>(low64(mantissa)) *
300f8da8SSiva Chandra Reddy                         static_cast<UInt128>(power_of_ten[0]);
9b397371SMichael Jones
300f8da8SSiva Chandra Reddy  UInt128 final_approx_lower =
300f8da8SSiva Chandra Reddy      approx_lower + (static_cast<UInt128>(low64(approx_middle)) << 64);
300f8da8SSiva Chandra Reddy  UInt128 final_approx_upper = approx_upper + high64(approx_middle) +
9b397371SMichael Jones                               (final_approx_lower < approx_lower ? 1 : 0);
9b397371SMichael Jones
9b397371SMichael Jones  // The halfway constant is used to check if the bits that will be shifted away
9b397371SMichael Jones  // intially are all 1. For 80 bit floats this is 128 (bitstype size) - 64
9b397371SMichael Jones  // (final mantissa size) - 3 (we shift away the last two bits separately for
9b397371SMichael Jones  // accuracy, and the most significant bit is ignored.) = 61 bits. Similarly,
9b397371SMichael Jones  // it's 12 bits for 128 bit floats in this case.
300f8da8SSiva Chandra Reddy  constexpr UInt128 HALFWAY_CONSTANT =
c09e6905SGuillaume Chatelet      (UInt128(1) << (FPBits::STORAGE_LEN - (FPBits::FRACTION_LEN + 3))) - 1;
9b397371SMichael Jones
9b397371SMichael Jones  if ((final_approx_upper & HALFWAY_CONSTANT) == HALFWAY_CONSTANT &&
9b397371SMichael Jones      final_approx_lower + mantissa < mantissa) {
cb3c41c2SMichael Jones    return cpp::nullopt;
9b397371SMichael Jones  }
9b397371SMichael Jones
9b397371SMichael Jones  // Shifting to 65 bits for 80 bit floats and 113 bits for 128 bit floats
3546f4daSGuillaume Chatelet  uint32_t msb =
c09e6905SGuillaume Chatelet      static_cast<uint32_t>(final_approx_upper >> (FPBits::STORAGE_LEN - 1));
7302c8dbSNick Desaulniers  UInt128 final_mantissa = final_approx_upper >> (msb + FPBits::STORAGE_LEN -
7302c8dbSNick Desaulniers                                                  (FPBits::FRACTION_LEN + 3));
25a2aeb1SMikhail R. Gadelha  exp2 -= static_cast<uint32_t>(1 ^ msb); // same as !msb
9b397371SMichael Jones
cb3c41c2SMichael Jones  if (round == RoundDirection::Nearest) {
9b397371SMichael Jones    // Half-way ambiguity
cb3c41c2SMichael Jones    if (final_approx_lower == 0 &&
cb3c41c2SMichael Jones        (final_approx_upper & HALFWAY_CONSTANT) == 0 &&
9b397371SMichael Jones        (final_mantissa & 3) == 1) {
cb3c41c2SMichael Jones      return cpp::nullopt;
9b397371SMichael Jones    }
cb3c41c2SMichael Jones    // Round to even.
cb3c41c2SMichael Jones    final_mantissa += final_mantissa & 1;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  } else if (round == RoundDirection::Up) {
cb3c41c2SMichael Jones    // If any of the bits being rounded away are non-zero, then round up.
cb3c41c2SMichael Jones    if (final_approx_lower > 0 || (final_approx_upper & HALFWAY_CONSTANT) > 0) {
cb3c41c2SMichael Jones      // Add two since the last current lowest bit is about to be shifted away.
cb3c41c2SMichael Jones      final_mantissa += 2;
cb3c41c2SMichael Jones    }
cb3c41c2SMichael Jones  }
cb3c41c2SMichael Jones  // else round down, which has no effect.
9b397371SMichael Jones
9b397371SMichael Jones  // From 65 to 64 bits for 80 bit floats and 113  to 112 bits for 128 bit
9b397371SMichael Jones  // floats
9b397371SMichael Jones  final_mantissa >>= 1;
c09e6905SGuillaume Chatelet  if ((final_mantissa >> (FPBits::FRACTION_LEN + 1)) > 0) {
9b397371SMichael Jones    final_mantissa >>= 1;
9b397371SMichael Jones    ++exp2;
9b397371SMichael Jones  }
9b397371SMichael Jones
9b397371SMichael Jones  // The if block is equivalent to (but has fewer branches than):
9b397371SMichael Jones  //   if exp2 <= 0 || exp2 >= MANTISSA_MAX { etc }
c09e6905SGuillaume Chatelet  if (exp2 - 1 >= (1 << FPBits::EXP_LEN) - 2) {
cb3c41c2SMichael Jones    return cpp::nullopt;
9b397371SMichael Jones  }
9b397371SMichael Jones
cb3c41c2SMichael Jones  ExpandedFloat<long double> output;
7302c8dbSNick Desaulniers  output.mantissa = static_cast<StorageType>(final_mantissa);
cb3c41c2SMichael Jones  output.exponent = exp2;
cb3c41c2SMichael Jones  return output;
9b397371SMichael Jones}
7eb32644SMichael Jones#endif // !defined(LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64) &&
7eb32644SMichael Jones       // !defined(LIBC_TYPES_LONG_DOUBLE_IS_DOUBLE_DOUBLE)
9b397371SMichael Jones
// The nth item in POWERS_OF_TWO represents the greatest power of two less than
// 10^n. This tells us how much we can safely shift without overshooting.
constexpr uint8_t POWERS_OF_TWO[19] = {
    0,  3,  6,  9,  13, 16, 19, 23, 26, 29,
    33, 36, 39, 43, 46, 49, 53, 56, 59,
};
// Number of entries in POWERS_OF_TWO.
constexpr int32_t NUM_POWERS_OF_TWO =
    static_cast<int32_t>(sizeof(POWERS_OF_TWO) / sizeof(POWERS_OF_TWO[0]));
87c01607SMichael Jones
87c01607SMichael Jones// Takes a mantissa and base 10 exponent and converts it into its closest
87c01607SMichael Jones// floating point type T equivalent. This is the fallback algorithm used when
87c01607SMichael Jones// the Eisel-Lemire algorithm fails, it's slower but more accurate. It's based
87c01607SMichael Jones// on the Simple Decimal Conversion algorithm by Nigel Tao, described at this
87c01607SMichael Jones// link: https://nigeltao.github.io/blog/2020/parse-number-f64-simple.html
87c01607SMichael Jonestemplate <class T>
d34b3c9cSMichael JonesLIBC_INLINE FloatConvertReturn<T> simple_decimal_conversion(
d34b3c9cSMichael Jones    const char *__restrict numStart,
d34b3c9cSMichael Jones    const size_t num_len = cpp::numeric_limits<size_t>::max(),
cb3c41c2SMichael Jones    RoundDirection round = RoundDirection::Nearest) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
87c01607SMichael Jones
87c01607SMichael Jones  int32_t exp2 = 0;
d34b3c9cSMichael Jones  HighPrecisionDecimal hpd = HighPrecisionDecimal(numStart, num_len);
87c01607SMichael Jones
cb3c41c2SMichael Jones  FloatConvertReturn<T> output;
cb3c41c2SMichael Jones
1c92911eSMichael Jones  if (hpd.get_num_digits() == 0) {
cb3c41c2SMichael Jones    output.num = {0, 0};
cb3c41c2SMichael Jones    return output;
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // If the exponent is too large and can't be represented in this size of
87c01607SMichael Jones  // float, return inf.
1c92911eSMichael Jones  if (hpd.get_decimal_point() > 0 &&
c09e6905SGuillaume Chatelet      exp10_to_exp2(hpd.get_decimal_point() - 1) > FPBits::EXP_BIAS) {
3ae5a9b6SGuillaume Chatelet    output.num = {0, fputil::FPBits<T>::MAX_BIASED_EXPONENT};
cb3c41c2SMichael Jones    output.error = ERANGE;
cb3c41c2SMichael Jones    return output;
87c01607SMichael Jones  }
87c01607SMichael Jones  // If the exponent is too small even for a subnormal, return 0.
1c92911eSMichael Jones  if (hpd.get_decimal_point() < 0 &&
1c92911eSMichael Jones      exp10_to_exp2(-hpd.get_decimal_point()) >
c09e6905SGuillaume Chatelet          (FPBits::EXP_BIAS + static_cast<int32_t>(FPBits::FRACTION_LEN))) {
cb3c41c2SMichael Jones    output.num = {0, 0};
cb3c41c2SMichael Jones    output.error = ERANGE;
cb3c41c2SMichael Jones    return output;
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Right shift until the number is smaller than 1.
1c92911eSMichael Jones  while (hpd.get_decimal_point() > 0) {
1c92911eSMichael Jones    int32_t shift_amount = 0;
1c92911eSMichael Jones    if (hpd.get_decimal_point() >= NUM_POWERS_OF_TWO) {
1c92911eSMichael Jones      shift_amount = 60;
87c01607SMichael Jones    } else {
1c92911eSMichael Jones      shift_amount = POWERS_OF_TWO[hpd.get_decimal_point()];
87c01607SMichael Jones    }
1c92911eSMichael Jones    exp2 += shift_amount;
1c92911eSMichael Jones    hpd.shift(-shift_amount);
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Left shift until the number is between 1/2 and 1
1c92911eSMichael Jones  while (hpd.get_decimal_point() < 0 ||
1c92911eSMichael Jones         (hpd.get_decimal_point() == 0 && hpd.get_digits()[0] < 5)) {
1c92911eSMichael Jones    int32_t shift_amount = 0;
87c01607SMichael Jones
1c92911eSMichael Jones    if (-hpd.get_decimal_point() >= NUM_POWERS_OF_TWO) {
1c92911eSMichael Jones      shift_amount = 60;
1c92911eSMichael Jones    } else if (hpd.get_decimal_point() != 0) {
1c92911eSMichael Jones      shift_amount = POWERS_OF_TWO[-hpd.get_decimal_point()];
87c01607SMichael Jones    } else { // This handles the case of the number being between .1 and .5
1c92911eSMichael Jones      shift_amount = 1;
87c01607SMichael Jones    }
1c92911eSMichael Jones    exp2 -= shift_amount;
1c92911eSMichael Jones    hpd.shift(shift_amount);
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Left shift once so that the number is between 1 and 2
87c01607SMichael Jones  --exp2;
87c01607SMichael Jones  hpd.shift(1);
87c01607SMichael Jones
87c01607SMichael Jones  // Get the biased exponent
c09e6905SGuillaume Chatelet  exp2 += FPBits::EXP_BIAS;
87c01607SMichael Jones
87c01607SMichael Jones  // Handle the exponent being too large (and return inf).
3ae5a9b6SGuillaume Chatelet  if (exp2 >= FPBits::MAX_BIASED_EXPONENT) {
3ae5a9b6SGuillaume Chatelet    output.num = {0, FPBits::MAX_BIASED_EXPONENT};
cb3c41c2SMichael Jones    output.error = ERANGE;
cb3c41c2SMichael Jones    return output;
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Shift left to fill the mantissa
c09e6905SGuillaume Chatelet  hpd.shift(FPBits::FRACTION_LEN);
3546f4daSGuillaume Chatelet  StorageType final_mantissa = hpd.round_to_integer_type<StorageType>();
87c01607SMichael Jones
87c01607SMichael Jones  // Handle subnormals
87c01607SMichael Jones  if (exp2 <= 0) {
87c01607SMichael Jones    // Shift right until there is a valid exponent
87c01607SMichael Jones    while (exp2 < 0) {
87c01607SMichael Jones      hpd.shift(-1);
87c01607SMichael Jones      ++exp2;
87c01607SMichael Jones    }
87c01607SMichael Jones    // Shift right one more time to compensate for the left shift to get it
87c01607SMichael Jones    // between 1 and 2.
87c01607SMichael Jones    hpd.shift(-1);
3546f4daSGuillaume Chatelet    final_mantissa = hpd.round_to_integer_type<StorageType>(round);
87c01607SMichael Jones
87c01607SMichael Jones    // Check if by shifting right we've caused this to round to a normal number.
c09e6905SGuillaume Chatelet    if ((final_mantissa >> FPBits::FRACTION_LEN) != 0) {
87c01607SMichael Jones      ++exp2;
87c01607SMichael Jones    }
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  // Check if rounding added a bit, and shift down if that's the case.
c09e6905SGuillaume Chatelet  if (final_mantissa == StorageType(2) << FPBits::FRACTION_LEN) {
1c92911eSMichael Jones    final_mantissa >>= 1;
87c01607SMichael Jones    ++exp2;
aa1902f9SMichael Jones
aa1902f9SMichael Jones    // Check if this rounding causes exp2 to go out of range and make the result
aa1902f9SMichael Jones    // INF. If this is the case, then finalMantissa and exp2 are already the
aa1902f9SMichael Jones    // correct values for an INF result.
3ae5a9b6SGuillaume Chatelet    if (exp2 >= FPBits::MAX_BIASED_EXPONENT) {
cb3c41c2SMichael Jones      output.error = ERANGE;
aa1902f9SMichael Jones    }
87c01607SMichael Jones  }
87c01607SMichael Jones
4cdf9884SMichael Jones  if (exp2 == 0) {
cb3c41c2SMichael Jones    output.error = ERANGE;
4cdf9884SMichael Jones  }
4cdf9884SMichael Jones
cb3c41c2SMichael Jones  output.num = {final_mantissa, exp2};
cb3c41c2SMichael Jones  return output;
87c01607SMichael Jones}
87c01607SMichael Jones
// This class is used for templating the constants for Clinger's Fast Path,
// described as a method of approximation in
// Clinger WD. How to Read Floating Point Numbers Accurately. SIGPLAN Not 1990
// Jun;25(6):92–101. https://doi.org/10.1145/93548.93557.
// As well as the additions by Gay that extend the useful range by the number of
// exact digits stored by the float type, described in
// Gay DM, Correctly rounded binary-decimal and decimal-binary conversions;
// 1990. AT&T Bell Laboratories Numerical Analysis Manuscript 90-10.
template <class T> class ClingerConsts;

// Constants for float.
template <> class ClingerConsts<float> {
public:
  // Index of the last entry in POWERS_OF_TEN_ARRAY.
  static constexpr int32_t EXACT_POWERS_OF_TEN = 10;
  static constexpr int32_t DIGITS_IN_MANTISSA = 7;
  // 2^24 - 1
  static constexpr float MAX_EXACT_INT = 16777215.0;
  // POWERS_OF_TEN_ARRAY[i] is 10^i.
  static constexpr float POWERS_OF_TEN_ARRAY[] = {
      1e0, 1e1, 1e2, 1e3, 1e4, 1e5, 1e6, 1e7, 1e8, 1e9, 1e10};
};

// Constants for double.
template <> class ClingerConsts<double> {
public:
  // Index of the last entry in POWERS_OF_TEN_ARRAY.
  static constexpr int32_t EXACT_POWERS_OF_TEN = 22;
  static constexpr int32_t DIGITS_IN_MANTISSA = 15;
  // 2^53 - 1
  static constexpr double MAX_EXACT_INT = 9007199254740991.0;
  // POWERS_OF_TEN_ARRAY[i] is 10^i.
  static constexpr double POWERS_OF_TEN_ARRAY[] = {
      1e0,  1e1,  1e2,  1e3,  1e4,  1e5,  1e6,  1e7,
      1e8,  1e9,  1e10, 1e11, 1e12, 1e13, 1e14, 1e15,
      1e16, 1e17, 1e18, 1e19, 1e20, 1e21, 1e22};
};
62c187cbSMichael Jones
f7d4236aSGuillaume Chatelet#if defined(LIBC_TYPES_LONG_DOUBLE_IS_FLOAT64)
aa1902f9SMichael Jonestemplate <> class ClingerConsts<long double> {
aa1902f9SMichael Jonespublic:
0f031daeSTue Ly  static constexpr long double POWERS_OF_TEN_ARRAY[] = {
0f031daeSTue Ly      1e0,  1e1,  1e2,  1e3,  1e4,  1e5,  1e6,  1e7,  1e8,  1e9,  1e10, 1e11,
0f031daeSTue Ly      1e12, 1e13, 1e14, 1e15, 1e16, 1e17, 1e18, 1e19, 1e20, 1e21, 1e22};
aa1902f9SMichael Jones  static constexpr int32_t EXACT_POWERS_OF_TEN =
aa1902f9SMichael Jones      ClingerConsts<double>::EXACT_POWERS_OF_TEN;
aa1902f9SMichael Jones  static constexpr int32_t DIGITS_IN_MANTISSA =
aa1902f9SMichael Jones      ClingerConsts<double>::DIGITS_IN_MANTISSA;
aa1902f9SMichael Jones  static constexpr long double MAX_EXACT_INT =
aa1902f9SMichael Jones      ClingerConsts<double>::MAX_EXACT_INT;
aa1902f9SMichael Jones};
f7d4236aSGuillaume Chatelet#elif defined(LIBC_TYPES_LONG_DOUBLE_IS_X86_FLOAT80)
aa1902f9SMichael Jonestemplate <> class ClingerConsts<long double> {
aa1902f9SMichael Jonespublic:
aa1902f9SMichael Jones  static constexpr long double POWERS_OF_TEN_ARRAY[] = {
aa1902f9SMichael Jones      1e0L,  1e1L,  1e2L,  1e3L,  1e4L,  1e5L,  1e6L,  1e7L,  1e8L,  1e9L,
aa1902f9SMichael Jones      1e10L, 1e11L, 1e12L, 1e13L, 1e14L, 1e15L, 1e16L, 1e17L, 1e18L, 1e19L,
aa1902f9SMichael Jones      1e20L, 1e21L, 1e22L, 1e23L, 1e24L, 1e25L, 1e26L, 1e27L};
aa1902f9SMichael Jones  static constexpr int32_t EXACT_POWERS_OF_TEN = 27;
aa1902f9SMichael Jones  static constexpr int32_t DIGITS_IN_MANTISSA = 21;
aa1902f9SMichael Jones  static constexpr long double MAX_EXACT_INT = 18446744073709551615.0L;
aa1902f9SMichael Jones};
f7d4236aSGuillaume Chatelet#elif defined(LIBC_TYPES_LONG_DOUBLE_IS_FLOAT128)
aa1902f9SMichael Jonestemplate <> class ClingerConsts<long double> {
aa1902f9SMichael Jonespublic:
aa1902f9SMichael Jones  static constexpr long double POWERS_OF_TEN_ARRAY[] = {
aa1902f9SMichael Jones      1e0L,  1e1L,  1e2L,  1e3L,  1e4L,  1e5L,  1e6L,  1e7L,  1e8L,  1e9L,
aa1902f9SMichael Jones      1e10L, 1e11L, 1e12L, 1e13L, 1e14L, 1e15L, 1e16L, 1e17L, 1e18L, 1e19L,
aa1902f9SMichael Jones      1e20L, 1e21L, 1e22L, 1e23L, 1e24L, 1e25L, 1e26L, 1e27L, 1e28L, 1e29L,
aa1902f9SMichael Jones      1e30L, 1e31L, 1e32L, 1e33L, 1e34L, 1e35L, 1e36L, 1e37L, 1e38L, 1e39L,
aa1902f9SMichael Jones      1e40L, 1e41L, 1e42L, 1e43L, 1e44L, 1e45L, 1e46L, 1e47L, 1e48L};
aa1902f9SMichael Jones  static constexpr int32_t EXACT_POWERS_OF_TEN = 48;
aa1902f9SMichael Jones  static constexpr int32_t DIGITS_IN_MANTISSA = 33;
aa1902f9SMichael Jones  static constexpr long double MAX_EXACT_INT =
aa1902f9SMichael Jones      10384593717069655257060992658440191.0L;
aa1902f9SMichael Jones};
7eb32644SMichael Jones#elif defined(LIBC_TYPES_LONG_DOUBLE_IS_DOUBLE_DOUBLE)
7eb32644SMichael Jones// TODO: Add proper double double type support here, currently using constants
7eb32644SMichael Jones// for double since it should be safe.
7eb32644SMichael Jonestemplate <> class ClingerConsts<long double> {
7eb32644SMichael Jonespublic:
7eb32644SMichael Jones  static constexpr double POWERS_OF_TEN_ARRAY[] = {
7eb32644SMichael Jones      1e0,  1e1,  1e2,  1e3,  1e4,  1e5,  1e6,  1e7,  1e8,  1e9,  1e10, 1e11,
7eb32644SMichael Jones      1e12, 1e13, 1e14, 1e15, 1e16, 1e17, 1e18, 1e19, 1e20, 1e21, 1e22};
7eb32644SMichael Jones  static constexpr int32_t EXACT_POWERS_OF_TEN = 22;
7eb32644SMichael Jones  static constexpr int32_t DIGITS_IN_MANTISSA = 15;
7eb32644SMichael Jones  static constexpr double MAX_EXACT_INT = 9007199254740991.0;
7eb32644SMichael Jones};
f7d4236aSGuillaume Chatelet#else
f7d4236aSGuillaume Chatelet#error "Unknown long double type"
aa1902f9SMichael Jones#endif
aa1902f9SMichael Jones
62c187cbSMichael Jones// Take an exact mantissa and exponent and attempt to convert it using only
62c187cbSMichael Jones// exact floating point arithmetic. This only handles numbers with low
62c187cbSMichael Jones// exponents, but handles them quickly. This is an implementation of Clinger's
62c187cbSMichael Jones// Fast Path, as described above.
62c187cbSMichael Jonestemplate <class T>
cb3c41c2SMichael JonesLIBC_INLINE cpp::optional<ExpandedFloat<T>>
cb3c41c2SMichael Jonesclinger_fast_path(ExpandedFloat<T> init_num,
cb3c41c2SMichael Jones                  RoundDirection round = RoundDirection::Nearest) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
cb3c41c2SMichael Jones
3546f4daSGuillaume Chatelet  StorageType mantissa = init_num.mantissa;
cb3c41c2SMichael Jones  int32_t exp10 = init_num.exponent;
cb3c41c2SMichael Jones
c09e6905SGuillaume Chatelet  if ((mantissa >> FPBits::FRACTION_LEN) > 0) {
cb3c41c2SMichael Jones    return cpp::nullopt;
62c187cbSMichael Jones  }
62c187cbSMichael Jones
c703e657SGuillaume Chatelet  FPBits result;
1557256aSTue Ly  T float_mantissa;
7302c8dbSNick Desaulniers  if constexpr (is_big_int_v<StorageType> || sizeof(T) > sizeof(uint64_t)) {
d851b5c1SMichael Jones    float_mantissa =
7299c7f6SMichael Jones        (static_cast<T>(uint64_t(mantissa >> 64)) * static_cast<T>(0x1.0p64)) +
7299c7f6SMichael Jones        static_cast<T>(uint64_t(mantissa));
1557256aSTue Ly  } else {
1557256aSTue Ly    float_mantissa = static_cast<T>(mantissa);
1557256aSTue Ly  }
62c187cbSMichael Jones
62c187cbSMichael Jones  if (exp10 == 0) {
c703e657SGuillaume Chatelet    result = FPBits(float_mantissa);
62c187cbSMichael Jones  }
62c187cbSMichael Jones  if (exp10 > 0) {
1c92911eSMichael Jones    if (exp10 > ClingerConsts<T>::EXACT_POWERS_OF_TEN +
1c92911eSMichael Jones                    ClingerConsts<T>::DIGITS_IN_MANTISSA) {
cb3c41c2SMichael Jones      return cpp::nullopt;
62c187cbSMichael Jones    }
1c92911eSMichael Jones    if (exp10 > ClingerConsts<T>::EXACT_POWERS_OF_TEN) {
1c92911eSMichael Jones      float_mantissa = float_mantissa *
1c92911eSMichael Jones                       ClingerConsts<T>::POWERS_OF_TEN_ARRAY
1c92911eSMichael Jones                           [exp10 - ClingerConsts<T>::EXACT_POWERS_OF_TEN];
1c92911eSMichael Jones      exp10 = ClingerConsts<T>::EXACT_POWERS_OF_TEN;
62c187cbSMichael Jones    }
1c92911eSMichael Jones    if (float_mantissa > ClingerConsts<T>::MAX_EXACT_INT) {
cb3c41c2SMichael Jones      return cpp::nullopt;
62c187cbSMichael Jones    }
c703e657SGuillaume Chatelet    result =
c703e657SGuillaume Chatelet        FPBits(float_mantissa * ClingerConsts<T>::POWERS_OF_TEN_ARRAY[exp10]);
62c187cbSMichael Jones  } else if (exp10 < 0) {
1c92911eSMichael Jones    if (-exp10 > ClingerConsts<T>::EXACT_POWERS_OF_TEN) {
cb3c41c2SMichael Jones      return cpp::nullopt;
62c187cbSMichael Jones    }
c703e657SGuillaume Chatelet    result =
c703e657SGuillaume Chatelet        FPBits(float_mantissa / ClingerConsts<T>::POWERS_OF_TEN_ARRAY[-exp10]);
62c187cbSMichael Jones  }
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  // If the rounding mode is not nearest, then the sign of the number may affect
cb3c41c2SMichael Jones  // the result. To make sure the rounding mode is respected properly, the
cb3c41c2SMichael Jones  // calculation is redone with a negative result, and the rounding mode is used
cb3c41c2SMichael Jones  // to select the correct result.
cb3c41c2SMichael Jones  if (round != RoundDirection::Nearest) {
c703e657SGuillaume Chatelet    FPBits negative_result;
cb3c41c2SMichael Jones    // I'm 99% sure this will break under fast math optimizations.
c703e657SGuillaume Chatelet    negative_result = FPBits((-float_mantissa) *
c703e657SGuillaume Chatelet                             ClingerConsts<T>::POWERS_OF_TEN_ARRAY[exp10]);
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones    // If the results are equal, then we don't need to use the rounding mode.
2856db0dSGuillaume Chatelet    if (result.get_val() != -negative_result.get_val()) {
c703e657SGuillaume Chatelet      FPBits lower_result;
c703e657SGuillaume Chatelet      FPBits higher_result;
cb3c41c2SMichael Jones
2856db0dSGuillaume Chatelet      if (result.get_val() < -negative_result.get_val()) {
cb3c41c2SMichael Jones        lower_result = result;
cb3c41c2SMichael Jones        higher_result = negative_result;
cb3c41c2SMichael Jones      } else {
cb3c41c2SMichael Jones        lower_result = negative_result;
cb3c41c2SMichael Jones        higher_result = result;
cb3c41c2SMichael Jones      }
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones      if (round == RoundDirection::Up) {
cb3c41c2SMichael Jones        result = higher_result;
cb3c41c2SMichael Jones      } else {
cb3c41c2SMichael Jones        result = lower_result;
cb3c41c2SMichael Jones      }
cb3c41c2SMichael Jones    }
cb3c41c2SMichael Jones  }
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  ExpandedFloat<T> output;
7299c7f6SMichael Jones  output.mantissa = result.get_explicit_mantissa();
7b387d27SGuillaume Chatelet  output.exponent = result.get_biased_exponent();
cb3c41c2SMichael Jones  return output;
62c187cbSMichael Jones}
62c187cbSMichael Jones
2cd20ad9SMichael Jones// The upper bound is the highest base-10 exponent that could possibly give a
2cd20ad9SMichael Jones// non-inf result for this size of float. The value is
2cd20ad9SMichael Jones// log10(2^(exponent bias)).
2cd20ad9SMichael Jones// The generic approximation uses the fact that log10(2^x) ~= x/3
d34b3c9cSMichael Jonestemplate <typename T> LIBC_INLINE constexpr int32_t get_upper_bound() {
c09e6905SGuillaume Chatelet  return fputil::FPBits<T>::EXP_BIAS / 3;
2cd20ad9SMichael Jones}
2cd20ad9SMichael Jones
d34b3c9cSMichael Jonestemplate <> LIBC_INLINE constexpr int32_t get_upper_bound<float>() {
d34b3c9cSMichael Jones  return 39;
d34b3c9cSMichael Jones}
2cd20ad9SMichael Jones
d34b3c9cSMichael Jonestemplate <> LIBC_INLINE constexpr int32_t get_upper_bound<double>() {
d34b3c9cSMichael Jones  return 309;
d34b3c9cSMichael Jones}
2cd20ad9SMichael Jones
2cd20ad9SMichael Jones// The lower bound is the largest negative base-10 exponent that could possibly
2cd20ad9SMichael Jones// give a non-zero result for this size of float. The value is
2cd20ad9SMichael Jones// log10(2^(exponent bias + final mantissa width + intermediate mantissa width))
2cd20ad9SMichael Jones// The intermediate mantissa is the integer that's been parsed from the string,
2cd20ad9SMichael Jones// and the final mantissa is the fractional part of the output number. A very
2cd20ad9SMichael Jones// low base 10 exponent with a very high intermediate mantissa can cancel each
2cd20ad9SMichael Jones// other out, and subnormal numbers allow for the result to be at the very low
2cd20ad9SMichael Jones// end of the final mantissa.
d34b3c9cSMichael Jonestemplate <typename T> LIBC_INLINE constexpr int32_t get_lower_bound() {
c09e6905SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
c09e6905SGuillaume Chatelet  return -((FPBits::EXP_BIAS +
c09e6905SGuillaume Chatelet            static_cast<int32_t>(FPBits::FRACTION_LEN + FPBits::STORAGE_LEN)) /
2cd20ad9SMichael Jones           3);
2cd20ad9SMichael Jones}
2cd20ad9SMichael Jones
d34b3c9cSMichael Jonestemplate <> LIBC_INLINE constexpr int32_t get_lower_bound<float>() {
2cd20ad9SMichael Jones  return -(39 + 6 + 10);
2cd20ad9SMichael Jones}
2cd20ad9SMichael Jones
d34b3c9cSMichael Jonestemplate <> LIBC_INLINE constexpr int32_t get_lower_bound<double>() {
2cd20ad9SMichael Jones  return -(309 + 15 + 20);
2cd20ad9SMichael Jones}
2cd20ad9SMichael Jones
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
6c4267fbSMichael Jones//                               **** WARNING ****
6c4267fbSMichael Jones// This interface is shared with libc++, if you change this interface you need
6c4267fbSMichael Jones// to update it in both libc and libc++.
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
87c01607SMichael Jones// Takes a mantissa and base 10 exponent and converts it into its closest
87c01607SMichael Jones// floating point type T equivalient. First we try the Eisel-Lemire algorithm,
87c01607SMichael Jones// then if that fails then we fall back to a more accurate algorithm for
87c01607SMichael Jones// accuracy. The resulting mantissa and exponent are placed in outputMantissa
87c01607SMichael Jones// and outputExp2.
87c01607SMichael Jonestemplate <class T>
d34b3c9cSMichael JonesLIBC_INLINE FloatConvertReturn<T> decimal_exp_to_float(
d34b3c9cSMichael Jones    ExpandedFloat<T> init_num, bool truncated, RoundDirection round,
d34b3c9cSMichael Jones    const char *__restrict numStart,
d34b3c9cSMichael Jones    const size_t num_len = cpp::numeric_limits<size_t>::max()) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
cb3c41c2SMichael Jones
3546f4daSGuillaume Chatelet  StorageType mantissa = init_num.mantissa;
cb3c41c2SMichael Jones  int32_t exp10 = init_num.exponent;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  FloatConvertReturn<T> output;
cb3c41c2SMichael Jones  cpp::optional<ExpandedFloat<T>> opt_output;
cb3c41c2SMichael Jones
62c187cbSMichael Jones  // If the exponent is too large and can't be represented in this size of
2cd20ad9SMichael Jones  // float, return inf. These bounds are relatively loose, but are mostly
2cd20ad9SMichael Jones  // serving as a first pass. Some close numbers getting through is okay.
2cd20ad9SMichael Jones  if (exp10 > get_upper_bound<T>()) {
3ae5a9b6SGuillaume Chatelet    output.num = {0, FPBits::MAX_BIASED_EXPONENT};
cb3c41c2SMichael Jones    output.error = ERANGE;
cb3c41c2SMichael Jones    return output;
62c187cbSMichael Jones  }
62c187cbSMichael Jones  // If the exponent is too small even for a subnormal, return 0.
2cd20ad9SMichael Jones  if (exp10 < get_lower_bound<T>()) {
cb3c41c2SMichael Jones    output.num = {0, 0};
cb3c41c2SMichael Jones    output.error = ERANGE;
cb3c41c2SMichael Jones    return output;
62c187cbSMichael Jones  }
87c01607SMichael Jones
cb3c41c2SMichael Jones  // Clinger's Fast Path and Eisel-Lemire can't set errno, but they can fail.
cb3c41c2SMichael Jones  // For this reason the "error" field in their return values is used to
cb3c41c2SMichael Jones  // represent whether they've failed as opposed to the errno value. Any
cb3c41c2SMichael Jones  // non-zero value represents a failure.
cb3c41c2SMichael Jones
c3228714SGuillaume Chatelet#ifndef LIBC_COPT_STRTOFLOAT_DISABLE_CLINGER_FAST_PATH
62c187cbSMichael Jones  if (!truncated) {
cb3c41c2SMichael Jones    opt_output = clinger_fast_path<T>(init_num, round);
cb3c41c2SMichael Jones    // If the algorithm succeeded the error will be 0, else it will be a
cb3c41c2SMichael Jones    // non-zero number.
cb3c41c2SMichael Jones    if (opt_output.has_value()) {
cb3c41c2SMichael Jones      return {opt_output.value(), 0};
62c187cbSMichael Jones    }
62c187cbSMichael Jones  }
c3228714SGuillaume Chatelet#endif // LIBC_COPT_STRTOFLOAT_DISABLE_CLINGER_FAST_PATH
87c01607SMichael Jones
c3228714SGuillaume Chatelet#ifndef LIBC_COPT_STRTOFLOAT_DISABLE_EISEL_LEMIRE
87c01607SMichael Jones  // Try Eisel-Lemire
cb3c41c2SMichael Jones  opt_output = eisel_lemire<T>(init_num, round);
cb3c41c2SMichael Jones  if (opt_output.has_value()) {
87c01607SMichael Jones    if (!truncated) {
cb3c41c2SMichael Jones      return {opt_output.value(), 0};
87c01607SMichael Jones    }
87c01607SMichael Jones    // If the mantissa is truncated, then the result may be off by the LSB, so
87c01607SMichael Jones    // check if rounding the mantissa up changes the result. If not, then it's
87c01607SMichael Jones    // safe, else use the fallback.
900be901SVictor Toni    auto second_output = eisel_lemire<T>({mantissa + 1, exp10}, round);
900be901SVictor Toni    if (second_output.has_value()) {
900be901SVictor Toni      if (opt_output->mantissa == second_output->mantissa &&
900be901SVictor Toni          opt_output->exponent == second_output->exponent) {
cb3c41c2SMichael Jones        return {opt_output.value(), 0};
87c01607SMichael Jones      }
87c01607SMichael Jones    }
87c01607SMichael Jones  }
c3228714SGuillaume Chatelet#endif // LIBC_COPT_STRTOFLOAT_DISABLE_EISEL_LEMIRE
87c01607SMichael Jones
c3228714SGuillaume Chatelet#ifndef LIBC_COPT_STRTOFLOAT_DISABLE_SIMPLE_DECIMAL_CONVERSION
d34b3c9cSMichael Jones  output = simple_decimal_conversion<T>(numStart, num_len, round);
c3228714SGuillaume Chatelet#else
c3228714SGuillaume Chatelet#warning "Simple decimal conversion is disabled, result may not be correct."
c3228714SGuillaume Chatelet#endif // LIBC_COPT_STRTOFLOAT_DISABLE_SIMPLE_DECIMAL_CONVERSION
87c01607SMichael Jones
cb3c41c2SMichael Jones  return output;
87c01607SMichael Jones}
87c01607SMichael Jones
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
6c4267fbSMichael Jones//                               **** WARNING ****
6c4267fbSMichael Jones// This interface is shared with libc++, if you change this interface you need
6c4267fbSMichael Jones// to update it in both libc and libc++.
6c4267fbSMichael Jones// -----------------------------------------------------------------------------
8298424cSMichael Jones// Takes a mantissa and base 2 exponent and converts it into its closest
8298424cSMichael Jones// floating point type T equivalient. Since the exponent is already in the right
8298424cSMichael Jones// form, this is mostly just shifting and rounding. This is used for hexadecimal
8298424cSMichael Jones// numbers since a base 16 exponent multiplied by 4 is the base 2 exponent.
8298424cSMichael Jonestemplate <class T>
cb3c41c2SMichael JonesLIBC_INLINE FloatConvertReturn<T> binary_exp_to_float(ExpandedFloat<T> init_num,
201cc2d8STue Ly                                                      bool truncated,
cb3c41c2SMichael Jones                                                      RoundDirection round) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
8298424cSMichael Jones
3546f4daSGuillaume Chatelet  StorageType mantissa = init_num.mantissa;
cb3c41c2SMichael Jones  int32_t exp2 = init_num.exponent;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  FloatConvertReturn<T> output;
cb3c41c2SMichael Jones
8298424cSMichael Jones  // This is the number of leading zeroes a properly normalized float of type T
8298424cSMichael Jones  // should have.
c09e6905SGuillaume Chatelet  constexpr int32_t INF_EXP = (1 << FPBits::EXP_LEN) - 1;
8298424cSMichael Jones
3546f4daSGuillaume Chatelet  // Normalization step 1: Bring the leading bit to the highest bit of
3546f4daSGuillaume Chatelet  // StorageType.
3546f4daSGuillaume Chatelet  uint32_t amount_to_shift_left = cpp::countl_zero<StorageType>(mantissa);
1c92911eSMichael Jones  mantissa <<= amount_to_shift_left;
8298424cSMichael Jones
3546f4daSGuillaume Chatelet  // Keep exp2 representing the exponent of the lowest bit of StorageType.
1c92911eSMichael Jones  exp2 -= amount_to_shift_left;
8298424cSMichael Jones
f22a65c1SGuillaume Chatelet  // biased_exponent represents the biased exponent of the most significant bit.
c09e6905SGuillaume Chatelet  int32_t biased_exponent = exp2 + FPBits::STORAGE_LEN + FPBits::EXP_BIAS - 1;
8298424cSMichael Jones
201cc2d8STue Ly  // Handle numbers that're too large and get squashed to inf
1c92911eSMichael Jones  if (biased_exponent >= INF_EXP) {
8298424cSMichael Jones    // This indicates an overflow, so we make the result INF and set errno.
c09e6905SGuillaume Chatelet    output.num = {0, (1 << FPBits::EXP_LEN) - 1};
cb3c41c2SMichael Jones    output.error = ERANGE;
cb3c41c2SMichael Jones    return output;
201cc2d8STue Ly  }
201cc2d8STue Ly
f22a65c1SGuillaume Chatelet  uint32_t amount_to_shift_right =
c09e6905SGuillaume Chatelet      FPBits::STORAGE_LEN - FPBits::FRACTION_LEN - 1;
201cc2d8STue Ly
201cc2d8STue Ly  // Handle subnormals.
1c92911eSMichael Jones  if (biased_exponent <= 0) {
1c92911eSMichael Jones    amount_to_shift_right += 1 - biased_exponent;
1c92911eSMichael Jones    biased_exponent = 0;
201cc2d8STue Ly
c09e6905SGuillaume Chatelet    if (amount_to_shift_right > FPBits::STORAGE_LEN) {
201cc2d8STue Ly      // Return 0 if the exponent is too small.
cb3c41c2SMichael Jones      output.num = {0, 0};
cb3c41c2SMichael Jones      output.error = ERANGE;
cb3c41c2SMichael Jones      return output;
201cc2d8STue Ly    }
201cc2d8STue Ly  }
201cc2d8STue Ly
3546f4daSGuillaume Chatelet  StorageType round_bit_mask = StorageType(1) << (amount_to_shift_right - 1);
3546f4daSGuillaume Chatelet  StorageType sticky_mask = round_bit_mask - 1;
1557256aSTue Ly  bool round_bit = static_cast<bool>(mantissa & round_bit_mask);
1c92911eSMichael Jones  bool sticky_bit = static_cast<bool>(mantissa & sticky_mask) || truncated;
201cc2d8STue Ly
c09e6905SGuillaume Chatelet  if (amount_to_shift_right < FPBits::STORAGE_LEN) {
201cc2d8STue Ly    // Shift the mantissa and clear the implicit bit.
1c92911eSMichael Jones    mantissa >>= amount_to_shift_right;
c09e6905SGuillaume Chatelet    mantissa &= FPBits::FRACTION_MASK;
201cc2d8STue Ly  } else {
8298424cSMichael Jones    mantissa = 0;
201cc2d8STue Ly  }
3546f4daSGuillaume Chatelet  bool least_significant_bit = static_cast<bool>(mantissa & StorageType(1));
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  // TODO: check that this rounding behavior is correct.
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  if (round == RoundDirection::Nearest) {
201cc2d8STue Ly    // Perform rounding-to-nearest, tie-to-even.
1c92911eSMichael Jones    if (round_bit && (least_significant_bit || sticky_bit)) {
201cc2d8STue Ly      ++mantissa;
201cc2d8STue Ly    }
cb3c41c2SMichael Jones  } else if (round == RoundDirection::Up) {
cb3c41c2SMichael Jones    if (round_bit || sticky_bit) {
cb3c41c2SMichael Jones      ++mantissa;
cb3c41c2SMichael Jones    }
cb3c41c2SMichael Jones  } else /* (round == RoundDirection::Down)*/ {
cb3c41c2SMichael Jones    if (round_bit && sticky_bit) {
cb3c41c2SMichael Jones      ++mantissa;
cb3c41c2SMichael Jones    }
cb3c41c2SMichael Jones  }
201cc2d8STue Ly
c09e6905SGuillaume Chatelet  if (mantissa > FPBits::FRACTION_MASK) {
201cc2d8STue Ly    // Rounding causes the exponent to increase.
1c92911eSMichael Jones    ++biased_exponent;
201cc2d8STue Ly
1c92911eSMichael Jones    if (biased_exponent == INF_EXP) {
cb3c41c2SMichael Jones      output.error = ERANGE;
8298424cSMichael Jones    }
201cc2d8STue Ly  }
201cc2d8STue Ly
1c92911eSMichael Jones  if (biased_exponent == 0) {
cb3c41c2SMichael Jones    output.error = ERANGE;
201cc2d8STue Ly  }
201cc2d8STue Ly
c09e6905SGuillaume Chatelet  output.num = {mantissa & FPBits::FRACTION_MASK, biased_exponent};
cb3c41c2SMichael Jones  return output;
8298424cSMichael Jones}
8298424cSMichael Jones
87c01607SMichael Jones// checks if the next 4 characters of the string pointer are the start of a
87c01607SMichael Jones// hexadecimal floating point number. Does not advance the string pointer.
59c809cdSSiva Chandra ReddyLIBC_INLINE bool is_float_hex_start(const char *__restrict src,
87c01607SMichael Jones                                    const char decimalPoint) {
cb3c41c2SMichael Jones  if (!(src[0] == '0' && tolower(src[1]) == 'x')) {
87c01607SMichael Jones    return false;
87c01607SMichael Jones  }
cb3c41c2SMichael Jones  size_t first_digit = 2;
cb3c41c2SMichael Jones  if (src[2] == decimalPoint) {
cb3c41c2SMichael Jones    ++first_digit;
87c01607SMichael Jones  }
cb3c41c2SMichael Jones  return isalnum(src[first_digit]) && b36_char_to_int(src[first_digit]) < 16;
87c01607SMichael Jones}
87c01607SMichael Jones
8298424cSMichael Jones// Takes the start of a string representing a decimal float, as well as the
8298424cSMichael Jones// local decimalPoint. It returns if it suceeded in parsing any digits, and if
8298424cSMichael Jones// the return value is true then the outputs are pointer to the end of the
8298424cSMichael Jones// number, and the mantissa and exponent for the closest float T representation.
8298424cSMichael Jones// If the return value is false, then it is assumed that there is no number
8298424cSMichael Jones// here.
8298424cSMichael Jonestemplate <class T>
cb3c41c2SMichael JonesLIBC_INLINE StrToNumResult<ExpandedFloat<T>>
1c92911eSMichael Jonesdecimal_string_to_float(const char *__restrict src, const char DECIMAL_POINT,
cb3c41c2SMichael Jones                        RoundDirection round) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
c703e657SGuillaume Chatelet
8298424cSMichael Jones  constexpr uint32_t BASE = 10;
8298424cSMichael Jones  constexpr char EXPONENT_MARKER = 'e';
8298424cSMichael Jones
8298424cSMichael Jones  bool truncated = false;
1c92911eSMichael Jones  bool seen_digit = false;
1c92911eSMichael Jones  bool after_decimal = false;
3546f4daSGuillaume Chatelet  StorageType mantissa = 0;
8298424cSMichael Jones  int32_t exponent = 0;
8298424cSMichael Jones
cb3c41c2SMichael Jones  size_t index = 0;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  StrToNumResult<ExpandedFloat<T>> output({0, 0});
cb3c41c2SMichael Jones
8298424cSMichael Jones  // The goal for the first step of parsing is to convert the number in src to
8298424cSMichael Jones  // the format mantissa * (base ^ exponent)
8298424cSMichael Jones
499ca806STue Ly  // The loop fills the mantissa with as many digits as it can hold
3546f4daSGuillaume Chatelet  const StorageType bitstype_max_div_by_base =
3546f4daSGuillaume Chatelet      cpp::numeric_limits<StorageType>::max() / BASE;
499ca806STue Ly  while (true) {
cb3c41c2SMichael Jones    if (isdigit(src[index])) {
*a0c4f854SMichael Jones      uint32_t digit = b36_char_to_int(src[index]);
1c92911eSMichael Jones      seen_digit = true;
499ca806STue Ly
1c92911eSMichael Jones      if (mantissa < bitstype_max_div_by_base) {
499ca806STue Ly        mantissa = (mantissa * BASE) + digit;
1c92911eSMichael Jones        if (after_decimal) {
499ca806STue Ly          --exponent;
499ca806STue Ly        }
499ca806STue Ly      } else {
499ca806STue Ly        if (digit > 0)
499ca806STue Ly          truncated = true;
1c92911eSMichael Jones        if (!after_decimal)
499ca806STue Ly          ++exponent;
499ca806STue Ly      }
499ca806STue Ly
cb3c41c2SMichael Jones      ++index;
499ca806STue Ly      continue;
499ca806STue Ly    }
cb3c41c2SMichael Jones    if (src[index] == DECIMAL_POINT) {
1c92911eSMichael Jones      if (after_decimal) {
cb3c41c2SMichael Jones        break; // this means that src[index] points to a second decimal point,
cb3c41c2SMichael Jones               // ending the number.
499ca806STue Ly      }
1c92911eSMichael Jones      after_decimal = true;
cb3c41c2SMichael Jones      ++index;
8298424cSMichael Jones      continue;
8298424cSMichael Jones    }
499ca806STue Ly    // The character is neither a digit nor a decimal point.
499ca806STue Ly    break;
8298424cSMichael Jones  }
8298424cSMichael Jones
1c92911eSMichael Jones  if (!seen_digit)
cb3c41c2SMichael Jones    return output;
8298424cSMichael Jones
d34b3c9cSMichael Jones  // TODO: When adding max length argument, handle the case of a trailing
d34b3c9cSMichael Jones  // EXPONENT MARKER, see scanf for more details.
cb3c41c2SMichael Jones  if (tolower(src[index]) == EXPONENT_MARKER) {
ae3b59e6SMichael Jones    bool has_sign = false;
ae3b59e6SMichael Jones    if (src[index + 1] == '+' || src[index + 1] == '-') {
ae3b59e6SMichael Jones      has_sign = true;
ae3b59e6SMichael Jones    }
ae3b59e6SMichael Jones    if (isdigit(src[index + 1 + static_cast<size_t>(has_sign)])) {
cb3c41c2SMichael Jones      ++index;
cb3c41c2SMichael Jones      auto result = strtointeger<int32_t>(src + index, 10);
cb3c41c2SMichael Jones      if (result.has_error())
cb3c41c2SMichael Jones        output.error = result.error;
74da5e6cSMichael Jones      int32_t add_to_exponent = result.value;
cb3c41c2SMichael Jones      index += result.parsed_len;
cc65ecfdSMichael Jones
cc65ecfdSMichael Jones      // Here we do this operation as int64 to avoid overflow.
cc65ecfdSMichael Jones      int64_t temp_exponent = static_cast<int64_t>(exponent) +
cc65ecfdSMichael Jones                              static_cast<int64_t>(add_to_exponent);
cc65ecfdSMichael Jones
cc65ecfdSMichael Jones      // If the result is in the valid range, then we use it. The valid range is
cc65ecfdSMichael Jones      // also within the int32 range, so this prevents overflow issues.
3ae5a9b6SGuillaume Chatelet      if (temp_exponent > FPBits::MAX_BIASED_EXPONENT) {
3ae5a9b6SGuillaume Chatelet        exponent = FPBits::MAX_BIASED_EXPONENT;
3ae5a9b6SGuillaume Chatelet      } else if (temp_exponent < -FPBits::MAX_BIASED_EXPONENT) {
3ae5a9b6SGuillaume Chatelet        exponent = -FPBits::MAX_BIASED_EXPONENT;
3d953234SMichael Jones      } else {
3d953234SMichael Jones        exponent = static_cast<int32_t>(temp_exponent);
cc65ecfdSMichael Jones      }
8298424cSMichael Jones    }
8298424cSMichael Jones  }
8298424cSMichael Jones
cb3c41c2SMichael Jones  output.parsed_len = index;
8298424cSMichael Jones  if (mantissa == 0) { // if we have a 0, then also 0 the exponent.
cb3c41c2SMichael Jones    output.value = {0, 0};
8298424cSMichael Jones  } else {
cb3c41c2SMichael Jones    auto temp =
d34b3c9cSMichael Jones        decimal_exp_to_float<T>({mantissa, exponent}, truncated, round, src);
cb3c41c2SMichael Jones    output.value = temp.num;
cb3c41c2SMichael Jones    output.error = temp.error;
8298424cSMichael Jones  }
cb3c41c2SMichael Jones  return output;
8298424cSMichael Jones}
8298424cSMichael Jones
8298424cSMichael Jones// Takes the start of a string representing a hexadecimal float, as well as the
8298424cSMichael Jones// local decimal point. It returns if it suceeded in parsing any digits, and if
8298424cSMichael Jones// the return value is true then the outputs are pointer to the end of the
8298424cSMichael Jones// number, and the mantissa and exponent for the closest float T representation.
8298424cSMichael Jones// If the return value is false, then it is assumed that there is no number
8298424cSMichael Jones// here.
8298424cSMichael Jonestemplate <class T>
cb3c41c2SMichael JonesLIBC_INLINE StrToNumResult<ExpandedFloat<T>>
cb3c41c2SMichael Joneshexadecimal_string_to_float(const char *__restrict src,
cb3c41c2SMichael Jones                            const char DECIMAL_POINT, RoundDirection round) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
c703e657SGuillaume Chatelet
8298424cSMichael Jones  constexpr uint32_t BASE = 16;
8298424cSMichael Jones  constexpr char EXPONENT_MARKER = 'p';
8298424cSMichael Jones
8298424cSMichael Jones  bool truncated = false;
1c92911eSMichael Jones  bool seen_digit = false;
1c92911eSMichael Jones  bool after_decimal = false;
3546f4daSGuillaume Chatelet  StorageType mantissa = 0;
8298424cSMichael Jones  int32_t exponent = 0;
8298424cSMichael Jones
cb3c41c2SMichael Jones  size_t index = 0;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  StrToNumResult<ExpandedFloat<T>> output({0, 0});
cb3c41c2SMichael Jones
8298424cSMichael Jones  // The goal for the first step of parsing is to convert the number in src to
8298424cSMichael Jones  // the format mantissa * (base ^ exponent)
8298424cSMichael Jones
499ca806STue Ly  // The loop fills the mantissa with as many digits as it can hold
3546f4daSGuillaume Chatelet  const StorageType bitstype_max_div_by_base =
3546f4daSGuillaume Chatelet      cpp::numeric_limits<StorageType>::max() / BASE;
499ca806STue Ly  while (true) {
cb3c41c2SMichael Jones    if (isalnum(src[index])) {
cb3c41c2SMichael Jones      uint32_t digit = b36_char_to_int(src[index]);
201cc2d8STue Ly      if (digit < BASE)
1c92911eSMichael Jones        seen_digit = true;
201cc2d8STue Ly      else
201cc2d8STue Ly        break;
499ca806STue Ly
1c92911eSMichael Jones      if (mantissa < bitstype_max_div_by_base) {
499ca806STue Ly        mantissa = (mantissa * BASE) + digit;
1c92911eSMichael Jones        if (after_decimal)
499ca806STue Ly          --exponent;
499ca806STue Ly      } else {
499ca806STue Ly        if (digit > 0)
499ca806STue Ly          truncated = true;
1c92911eSMichael Jones        if (!after_decimal)
499ca806STue Ly          ++exponent;
499ca806STue Ly      }
cb3c41c2SMichael Jones      ++index;
499ca806STue Ly      continue;
499ca806STue Ly    }
cb3c41c2SMichael Jones    if (src[index] == DECIMAL_POINT) {
1c92911eSMichael Jones      if (after_decimal) {
cb3c41c2SMichael Jones        break; // this means that src[index] points to a second decimal point,
cb3c41c2SMichael Jones               // ending the number.
499ca806STue Ly      }
1c92911eSMichael Jones      after_decimal = true;
cb3c41c2SMichael Jones      ++index;
8298424cSMichael Jones      continue;
8298424cSMichael Jones    }
499ca806STue Ly    // The character is neither a hexadecimal digit nor a decimal point.
8298424cSMichael Jones    break;
8298424cSMichael Jones  }
8298424cSMichael Jones
1c92911eSMichael Jones  if (!seen_digit)
cb3c41c2SMichael Jones    return output;
8298424cSMichael Jones
8298424cSMichael Jones  // Convert the exponent from having a base of 16 to having a base of 2.
8298424cSMichael Jones  exponent *= 4;
8298424cSMichael Jones
cb3c41c2SMichael Jones  if (tolower(src[index]) == EXPONENT_MARKER) {
ae3b59e6SMichael Jones    bool has_sign = false;
ae3b59e6SMichael Jones    if (src[index + 1] == '+' || src[index + 1] == '-') {
ae3b59e6SMichael Jones      has_sign = true;
ae3b59e6SMichael Jones    }
ae3b59e6SMichael Jones    if (isdigit(src[index + 1 + static_cast<size_t>(has_sign)])) {
cb3c41c2SMichael Jones      ++index;
cb3c41c2SMichael Jones      auto result = strtointeger<int32_t>(src + index, 10);
cb3c41c2SMichael Jones      if (result.has_error())
cb3c41c2SMichael Jones        output.error = result.error;
cb3c41c2SMichael Jones
74da5e6cSMichael Jones      int32_t add_to_exponent = result.value;
cb3c41c2SMichael Jones      index += result.parsed_len;
cc65ecfdSMichael Jones
cc65ecfdSMichael Jones      // Here we do this operation as int64 to avoid overflow.
cc65ecfdSMichael Jones      int64_t temp_exponent = static_cast<int64_t>(exponent) +
cc65ecfdSMichael Jones                              static_cast<int64_t>(add_to_exponent);
cc65ecfdSMichael Jones
cc65ecfdSMichael Jones      // If the result is in the valid range, then we use it. The valid range is
cc65ecfdSMichael Jones      // also within the int32 range, so this prevents overflow issues.
3ae5a9b6SGuillaume Chatelet      if (temp_exponent > FPBits::MAX_BIASED_EXPONENT) {
3ae5a9b6SGuillaume Chatelet        exponent = FPBits::MAX_BIASED_EXPONENT;
3ae5a9b6SGuillaume Chatelet      } else if (temp_exponent < -FPBits::MAX_BIASED_EXPONENT) {
3ae5a9b6SGuillaume Chatelet        exponent = -FPBits::MAX_BIASED_EXPONENT;
b5f0a876SMichael Jones      } else {
b5f0a876SMichael Jones        exponent = static_cast<int32_t>(temp_exponent);
cc65ecfdSMichael Jones      }
8298424cSMichael Jones    }
8298424cSMichael Jones  }
cb3c41c2SMichael Jones  output.parsed_len = index;
8298424cSMichael Jones  if (mantissa == 0) { // if we have a 0, then also 0 the exponent.
cb3c41c2SMichael Jones    output.value.exponent = 0;
cb3c41c2SMichael Jones    output.value.mantissa = 0;
8298424cSMichael Jones  } else {
cb3c41c2SMichael Jones    auto temp = binary_exp_to_float<T>({mantissa, exponent}, truncated, round);
cb3c41c2SMichael Jones    output.error = temp.error;
cb3c41c2SMichael Jones    output.value = temp.num;
8298424cSMichael Jones  }
cb3c41c2SMichael Jones  return output;
8298424cSMichael Jones}
8298424cSMichael Jones
b43965adSMichael Flanderstemplate <class T>
b43965adSMichael FlandersLIBC_INLINE typename fputil::FPBits<T>::StorageType
0504e932SNishant Mittalnan_mantissa_from_ncharseq(const cpp::string_view ncharseq) {
b43965adSMichael Flanders  using FPBits = typename fputil::FPBits<T>;
b43965adSMichael Flanders  using StorageType = typename FPBits::StorageType;
b43965adSMichael Flanders
b43965adSMichael Flanders  StorageType nan_mantissa = 0;
0504e932SNishant Mittal
0504e932SNishant Mittal  if (ncharseq.data() != nullptr && isdigit(ncharseq[0])) {
b43965adSMichael Flanders    StrToNumResult<StorageType> strtoint_result =
b43965adSMichael Flanders        strtointeger<StorageType>(ncharseq.data(), 0);
0504e932SNishant Mittal    if (!strtoint_result.has_error())
0504e932SNishant Mittal      nan_mantissa = strtoint_result.value;
0504e932SNishant Mittal
0504e932SNishant Mittal    if (strtoint_result.parsed_len != static_cast<ptrdiff_t>(ncharseq.size()))
0504e932SNishant Mittal      nan_mantissa = 0;
0504e932SNishant Mittal  }
0504e932SNishant Mittal
0504e932SNishant Mittal  return nan_mantissa;
0504e932SNishant Mittal}
0504e932SNishant Mittal
87c01607SMichael Jones// Takes a pointer to a string and a pointer to a string pointer. This function
87c01607SMichael Jones// is used as the backend for all of the string to float functions.
d34b3c9cSMichael Jones// TODO: Add src_len member to match strtointeger.
d34b3c9cSMichael Jones// TODO: Next, move from char* and length to string_view
87c01607SMichael Jonestemplate <class T>
cb3c41c2SMichael JonesLIBC_INLINE StrToNumResult<T> strtofloatingpoint(const char *__restrict src) {
c703e657SGuillaume Chatelet  using FPBits = typename fputil::FPBits<T>;
3546f4daSGuillaume Chatelet  using StorageType = typename FPBits::StorageType;
c703e657SGuillaume Chatelet
c703e657SGuillaume Chatelet  FPBits result = FPBits();
1c92911eSMichael Jones  bool seen_digit = false;
cb3c41c2SMichael Jones  char sign = '+';
87c01607SMichael Jones
cb3c41c2SMichael Jones  int error = 0;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  ptrdiff_t index = first_non_whitespace(src) - src;
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  if (src[index] == '+' || src[index] == '-') {
cb3c41c2SMichael Jones    sign = src[index];
cb3c41c2SMichael Jones    ++index;
87c01607SMichael Jones  }
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones  if (sign == '-') {
11ec512fSGuillaume Chatelet    result.set_sign(Sign::NEG);
87c01607SMichael Jones  }
87c01607SMichael Jones
87c01607SMichael Jones  static constexpr char DECIMAL_POINT = '.';
1c92911eSMichael Jones  static const char *inf_string = "infinity";
1c92911eSMichael Jones  static const char *nan_string = "nan";
87c01607SMichael Jones
cb3c41c2SMichael Jones  if (isdigit(src[index]) || src[index] == DECIMAL_POINT) { // regular number
87c01607SMichael Jones    int base = 10;
cb3c41c2SMichael Jones    if (is_float_hex_start(src + index, DECIMAL_POINT)) {
87c01607SMichael Jones      base = 16;
cb3c41c2SMichael Jones      index += 2;
1c92911eSMichael Jones      seen_digit = true;
87c01607SMichael Jones    }
87c01607SMichael Jones
cb3c41c2SMichael Jones    RoundDirection round_direction = RoundDirection::Nearest;
cb3c41c2SMichael Jones
a9824312STue Ly    switch (fputil::quick_get_round()) {
cb3c41c2SMichael Jones    case FE_TONEAREST:
cb3c41c2SMichael Jones      round_direction = RoundDirection::Nearest;
cb3c41c2SMichael Jones      break;
cb3c41c2SMichael Jones    case FE_UPWARD:
cb3c41c2SMichael Jones      if (sign == '+') {
cb3c41c2SMichael Jones        round_direction = RoundDirection::Up;
cb3c41c2SMichael Jones      } else {
cb3c41c2SMichael Jones        round_direction = RoundDirection::Down;
cb3c41c2SMichael Jones      }
cb3c41c2SMichael Jones      break;
cb3c41c2SMichael Jones    case FE_DOWNWARD:
cb3c41c2SMichael Jones      if (sign == '+') {
cb3c41c2SMichael Jones        round_direction = RoundDirection::Down;
cb3c41c2SMichael Jones      } else {
cb3c41c2SMichael Jones        round_direction = RoundDirection::Up;
cb3c41c2SMichael Jones      }
cb3c41c2SMichael Jones      break;
cb3c41c2SMichael Jones    case FE_TOWARDZERO:
cb3c41c2SMichael Jones      round_direction = RoundDirection::Down;
cb3c41c2SMichael Jones      break;
cb3c41c2SMichael Jones    }
cb3c41c2SMichael Jones
cb3c41c2SMichael Jones    StrToNumResult<ExpandedFloat<T>> parse_result({0, 0});
8298424cSMichael Jones    if (base == 16) {
cb3c41c2SMichael Jones      parse_result = hexadecimal_string_to_float<T>(src + index, DECIMAL_POINT,
cb3c41c2SMichael Jones                                                    round_direction);
8298424cSMichael Jones    } else { // base is 10
cb3c41c2SMichael Jones      parse_result = decimal_string_to_float<T>(src + index, DECIMAL_POINT,
cb3c41c2SMichael Jones                                                round_direction);
8298424cSMichael Jones    }
cb3c41c2SMichael Jones    seen_digit = parse_result.parsed_len != 0;
cb3c41c2SMichael Jones    result.set_mantissa(parse_result.value.mantissa);
7b387d27SGuillaume Chatelet    result.set_biased_exponent(parse_result.value.exponent);
cb3c41c2SMichael Jones    index += parse_result.parsed_len;
cb3c41c2SMichael Jones    error = parse_result.error;
cb3c41c2SMichael Jones  } else if (tolower(src[index]) == 'n') { // NaN
cb3c41c2SMichael Jones    if (tolower(src[index + 1]) == nan_string[1] &&
cb3c41c2SMichael Jones        tolower(src[index + 2]) == nan_string[2]) {
1c92911eSMichael Jones      seen_digit = true;
cb3c41c2SMichael Jones      index += 3;
3546f4daSGuillaume Chatelet      StorageType nan_mantissa = 0;
47d0c83eSMichael Jones      // this handles the case of `NaN(n-character-sequence)`, where the
1cbd25f8SMark de Wever      // n-character-sequence is made of 0 or more letters, numbers, or
1cbd25f8SMark de Wever      // underscore characters in any order.
cb3c41c2SMichael Jones      if (src[index] == '(') {
cb3c41c2SMichael Jones        size_t left_paren = index;
cb3c41c2SMichael Jones        ++index;
ad844632SMichael Jones        while (isalnum(src[index]) || src[index] == '_')
cb3c41c2SMichael Jones          ++index;
cb3c41c2SMichael Jones        if (src[index] == ')') {
cb3c41c2SMichael Jones          ++index;
b43965adSMichael Flanders          nan_mantissa = nan_mantissa_from_ncharseq<T>(
0504e932SNishant Mittal              cpp::string_view(src + (left_paren + 1), index - left_paren - 2));
cb3c41c2SMichael Jones        } else {
cb3c41c2SMichael Jones          index = left_paren;
cb3c41c2SMichael Jones        }
87c01607SMichael Jones      }
ace383dfSGuillaume Chatelet      result = FPBits(result.quiet_nan(result.sign(), nan_mantissa));
87c01607SMichael Jones    }
cb3c41c2SMichael Jones  } else if (tolower(src[index]) == 'i') { // INF
cb3c41c2SMichael Jones    if (tolower(src[index + 1]) == inf_string[1] &&
cb3c41c2SMichael Jones        tolower(src[index + 2]) == inf_string[2]) {
1c92911eSMichael Jones      seen_digit = true;
11ec512fSGuillaume Chatelet      result = FPBits(result.inf(result.sign()));
cb3c41c2SMichael Jones      if (tolower(src[index + 3]) == inf_string[3] &&
cb3c41c2SMichael Jones          tolower(src[index + 4]) == inf_string[4] &&
cb3c41c2SMichael Jones          tolower(src[index + 5]) == inf_string[5] &&
cb3c41c2SMichael Jones          tolower(src[index + 6]) == inf_string[6] &&
cb3c41c2SMichael Jones          tolower(src[index + 7]) == inf_string[7]) {
cb3c41c2SMichael Jones        // if the string is "INFINITY" then consume 8 characters.
cb3c41c2SMichael Jones        index += 8;
87c01607SMichael Jones      } else {
cb3c41c2SMichael Jones        index += 3;
87c01607SMichael Jones      }
87c01607SMichael Jones    }
87c01607SMichael Jones  }
1c92911eSMichael Jones  if (!seen_digit) { // If there is nothing to actually parse, then return 0.
cb3c41c2SMichael Jones    return {T(0), 0, error};
87c01607SMichael Jones  }
87c01607SMichael Jones
aa1902f9SMichael Jones  // This function only does something if T is long double and the platform uses
aa1902f9SMichael Jones  // special 80 bit long doubles. Otherwise it should be inlined out.
aa1902f9SMichael Jones  set_implicit_bit<T>(result);
aa1902f9SMichael Jones
2856db0dSGuillaume Chatelet  return {result.get_val(), index, error};
87c01607SMichael Jones}
87c01607SMichael Jones
0504e932SNishant Mittaltemplate <class T> LIBC_INLINE StrToNumResult<T> strtonan(const char *arg) {
0504e932SNishant Mittal  using FPBits = typename fputil::FPBits<T>;
0504e932SNishant Mittal  using StorageType = typename FPBits::StorageType;
0504e932SNishant Mittal
1896ee38Slntue  LIBC_CRASH_ON_NULLPTR(arg);
1896ee38Slntue
0504e932SNishant Mittal  FPBits result;
0504e932SNishant Mittal  int error = 0;
0504e932SNishant Mittal  StorageType nan_mantissa = 0;
0504e932SNishant Mittal
0504e932SNishant Mittal  ptrdiff_t index = 0;
0504e932SNishant Mittal  while (isalnum(arg[index]) || arg[index] == '_')
0504e932SNishant Mittal    ++index;
0504e932SNishant Mittal
b43965adSMichael Flanders  if (arg[index] == '\0')
b43965adSMichael Flanders    nan_mantissa = nan_mantissa_from_ncharseq<T>(cpp::string_view(arg, index));
0504e932SNishant Mittal
2137894aSGuillaume Chatelet  result = FPBits::quiet_nan(Sign::POS, nan_mantissa);
2856db0dSGuillaume Chatelet  return {result.get_val(), 0, error};
0504e932SNishant Mittal}
0504e932SNishant Mittal
87c01607SMichael Jones} // namespace internal
5ff3ff33SPetr Hosek} // namespace LIBC_NAMESPACE_DECL
87c01607SMichael Jones
270547f3SGuillaume Chatelet#endif // LLVM_LIBC_SRC___SUPPORT_STR_TO_FLOAT_H