fuzzing/stdlib/strtofloat_fuzz.cpp

//===-- strtofloat_fuzz.cpp -----------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
///
/// Fuzzing test for the llvm-libc atof, strtof, strtod, and strtold
/// implementations.
///
//===----------------------------------------------------------------------===//
3a66446aSMichael Jones#include "src/stdlib/atof.h"
3a66446aSMichael Jones#include "src/stdlib/strtod.h"
3a66446aSMichael Jones#include "src/stdlib/strtof.h"
3a66446aSMichael Jones#include "src/stdlib/strtold.h"
ae3b59e6SMichael Jones
c2399147SGuillaume Chatelet#include "src/__support/FPUtil/FPBits.h"
cfbcbc8fSMichael Jones
5748ad84Slntue#include "hdr/math_macros.h"
3a66446aSMichael Jones#include <stddef.h>
3a66446aSMichael Jones#include <stdint.h>
3a66446aSMichael Jones
ae3b59e6SMichael Jones#include "utils/MPFRWrapper/mpfr_inc.h"
ae3b59e6SMichael Jones
c09e6905SGuillaume Chateletusing LIBC_NAMESPACE::fputil::FPBits;
cfbcbc8fSMichael Jones
2cb47319SMichael Jones// This function calculates the effective precision for a given float type and
2cb47319SMichael Jones// exponent. Subnormals have a lower effective precision since they don't
2cb47319SMichael Jones// necessarily use all of the bits of the mantissa.
2ff8094eSMichael Jonestemplate <typename F> inline constexpr int effective_precision(int exponent) {
6b02d2f8SGuillaume Chatelet  const int full_precision = FPBits<F>::FRACTION_LEN + 1;
2cb47319SMichael Jones
2cb47319SMichael Jones  // This is intended to be 0 when the exponent is the lowest normal and
2cb47319SMichael Jones  // increase as the exponent's magnitude increases.
c09e6905SGuillaume Chatelet  const int bits_below_normal = (-exponent) - (FPBits<F>::EXP_BIAS - 1);
2cb47319SMichael Jones
2cb47319SMichael Jones  // The precision should be the normal, full precision, minus the bits lost
2cb47319SMichael Jones  // by this being a subnormal, minus one for the implicit leading one.
2ff8094eSMichael Jones  const int bits_if_subnormal = full_precision - bits_below_normal - 1;
2ff8094eSMichael Jones
2ff8094eSMichael Jones  if (bits_below_normal >= 0) {
2ff8094eSMichael Jones    return bits_if_subnormal;
2cb47319SMichael Jones  }
2cb47319SMichael Jones  return full_precision;
2cb47319SMichael Jones}
2cb47319SMichael Jones
3a66446aSMichael Jonesextern "C" int LLVMFuzzerTestOneInput(const uint8_t *data, size_t size) {
2ff8094eSMichael Jones  // const char newstr[] = "123";
2ff8094eSMichael Jones  // data = reinterpret_cast<const uint8_t *>(newstr);
2ff8094eSMichael Jones  // size = sizeof(newstr);
3a66446aSMichael Jones  uint8_t *container = new uint8_t[size + 1];
3a66446aSMichael Jones  if (!container)
3a66446aSMichael Jones    __builtin_trap();
3a66446aSMichael Jones  size_t i;
3a66446aSMichael Jones
ae3b59e6SMichael Jones  for (i = 0; i < size; ++i) {
ae3b59e6SMichael Jones    // MPFR's strtofr uses "@" as a base-independent exponent symbol
ae3b59e6SMichael Jones    if (data[i] != '@')
3a66446aSMichael Jones      container[i] = data[i];
ae3b59e6SMichael Jones    else {
ae3b59e6SMichael Jones      container[i] = '#';
ae3b59e6SMichael Jones    }
ae3b59e6SMichael Jones  }
3a66446aSMichael Jones  container[size] = '\0'; // Add null terminator to container.
3a66446aSMichael Jones
3a66446aSMichael Jones  const char *str_ptr = reinterpret_cast<const char *>(container);
3a66446aSMichael Jones
3a66446aSMichael Jones  char *out_ptr = nullptr;
3a66446aSMichael Jones
cfbcbc8fSMichael Jones  size_t base = 0;
cfbcbc8fSMichael Jones
2cb47319SMichael Jones  // This is just used to determine the base and precision.
ae3b59e6SMichael Jones  mpfr_t result;
ae3b59e6SMichael Jones  mpfr_init2(result, 256);
ae3b59e6SMichael Jones  mpfr_t bin_result;
ae3b59e6SMichael Jones  mpfr_init2(bin_result, 256);
ae3b59e6SMichael Jones  mpfr_strtofr(result, str_ptr, &out_ptr, 0 /* base */, MPFR_RNDN);
ae3b59e6SMichael Jones  ptrdiff_t result_strlen = out_ptr - str_ptr;
ae3b59e6SMichael Jones  mpfr_strtofr(bin_result, str_ptr, &out_ptr, 2 /* base */, MPFR_RNDN);
ae3b59e6SMichael Jones  ptrdiff_t bin_result_strlen = out_ptr - str_ptr;
ae3b59e6SMichael Jones
ae3b59e6SMichael Jones  long double bin_result_ld = mpfr_get_ld(bin_result, MPFR_RNDN);
ae3b59e6SMichael Jones  long double result_ld = mpfr_get_ld(result, MPFR_RNDN);
ae3b59e6SMichael Jones
ae3b59e6SMichael Jones  // This detects if mpfr's strtofr selected a base of 2, which libc does not
ae3b59e6SMichael Jones  // support. If a base 2 decoding is detected, it is replaced by a base 10
ae3b59e6SMichael Jones  // decoding.
ae3b59e6SMichael Jones  if ((bin_result_ld != 0.0 || bin_result_strlen == result_strlen) &&
ae3b59e6SMichael Jones      bin_result_ld == result_ld) {
ae3b59e6SMichael Jones    mpfr_strtofr(result, str_ptr, &out_ptr, 10 /* base */, MPFR_RNDN);
ae3b59e6SMichael Jones    result_strlen = out_ptr - str_ptr;
cfbcbc8fSMichael Jones    base = 10;
ae3b59e6SMichael Jones  }
ae3b59e6SMichael Jones
2cb47319SMichael Jones  auto result_exp = mpfr_get_exp(result);
2cb47319SMichael Jones
cfbcbc8fSMichael Jones  mpfr_clear(result);
cfbcbc8fSMichael Jones  mpfr_clear(bin_result);
cfbcbc8fSMichael Jones
cfbcbc8fSMichael Jones  // These must be calculated with the correct precision, and not any more, to
cfbcbc8fSMichael Jones  // prevent numbers like 66336650.00...01 (many zeroes) from causing an issue.
cfbcbc8fSMichael Jones  // 66336650 is exactly between two float values (66336652 and 66336648) so the
cfbcbc8fSMichael Jones  // correct float result for 66336650.00...01 is rounding up to 66336652. The
cfbcbc8fSMichael Jones  // correct double is instead 66336650, which when converted to float is
cfbcbc8fSMichael Jones  // rounded down to 66336648. This means we have to compare against the correct
cfbcbc8fSMichael Jones  // precision to get the correct result.
2cb47319SMichael Jones
cfbcbc8fSMichael Jones  // TODO: Add support for other rounding modes.
2ff8094eSMichael Jones  int float_precision = effective_precision<float>(result_exp);
2ff8094eSMichael Jones  if (float_precision >= 2) {
2ff8094eSMichael Jones    mpfr_t mpfr_float;
2ff8094eSMichael Jones    mpfr_init2(mpfr_float, float_precision);
cfbcbc8fSMichael Jones    mpfr_strtofr(mpfr_float, str_ptr, &out_ptr, base, MPFR_RNDN);
cfbcbc8fSMichael Jones    float volatile float_result = mpfr_get_flt(mpfr_float, MPFR_RNDN);
b6bc9d72SGuillaume Chatelet    auto volatile strtof_result = LIBC_NAMESPACE::strtof(str_ptr, &out_ptr);
ae3b59e6SMichael Jones    ptrdiff_t strtof_strlen = out_ptr - str_ptr;
ae3b59e6SMichael Jones    if (result_strlen != strtof_strlen)
3a66446aSMichael Jones      __builtin_trap();
2ff8094eSMichael Jones    // If any result is NaN, all of them should be NaN. We can't use the usual
2ff8094eSMichael Jones    // comparisons because NaN != NaN.
*dfdef2cbSlntue    if (FPBits<float>(float_result).is_nan() !=
*dfdef2cbSlntue        FPBits<float>(strtof_result).is_nan())
2ff8094eSMichael Jones      __builtin_trap();
*dfdef2cbSlntue    if (!FPBits<float>(float_result).is_nan() && float_result != strtof_result)
2ff8094eSMichael Jones      __builtin_trap();
2ff8094eSMichael Jones    mpfr_clear(mpfr_float);
2ff8094eSMichael Jones  }
2ff8094eSMichael Jones
2ff8094eSMichael Jones  int double_precision = effective_precision<double>(result_exp);
2ff8094eSMichael Jones  if (double_precision >= 2) {
2ff8094eSMichael Jones    mpfr_t mpfr_double;
2ff8094eSMichael Jones    mpfr_init2(mpfr_double, double_precision);
2ff8094eSMichael Jones    mpfr_strtofr(mpfr_double, str_ptr, &out_ptr, base, MPFR_RNDN);
2ff8094eSMichael Jones    double volatile double_result = mpfr_get_d(mpfr_double, MPFR_RNDN);
b6bc9d72SGuillaume Chatelet    auto volatile strtod_result = LIBC_NAMESPACE::strtod(str_ptr, &out_ptr);
b6bc9d72SGuillaume Chatelet    auto volatile atof_result = LIBC_NAMESPACE::atof(str_ptr);
ae3b59e6SMichael Jones    ptrdiff_t strtod_strlen = out_ptr - str_ptr;
ae3b59e6SMichael Jones    if (result_strlen != strtod_strlen)
3a66446aSMichael Jones      __builtin_trap();
*dfdef2cbSlntue    if (FPBits<double>(double_result).is_nan() !=
*dfdef2cbSlntue            FPBits<double>(strtod_result).is_nan() ||
*dfdef2cbSlntue        FPBits<double>(double_result).is_nan() !=
*dfdef2cbSlntue            FPBits<double>(atof_result).is_nan())
2ff8094eSMichael Jones      __builtin_trap();
*dfdef2cbSlntue    if (!FPBits<double>(double_result).is_nan() &&
2ff8094eSMichael Jones        (double_result != strtod_result || double_result != atof_result))
2ff8094eSMichael Jones      __builtin_trap();
2ff8094eSMichael Jones    mpfr_clear(mpfr_double);
2ff8094eSMichael Jones  }
2ff8094eSMichael Jones
2ff8094eSMichael Jones  int long_double_precision = effective_precision<long double>(result_exp);
2ff8094eSMichael Jones  if (long_double_precision >= 2) {
2ff8094eSMichael Jones    mpfr_t mpfr_long_double;
2ff8094eSMichael Jones    mpfr_init2(mpfr_long_double, long_double_precision);
2ff8094eSMichael Jones    mpfr_strtofr(mpfr_long_double, str_ptr, &out_ptr, base, MPFR_RNDN);
2ff8094eSMichael Jones    long double volatile long_double_result =
2ff8094eSMichael Jones        mpfr_get_ld(mpfr_long_double, MPFR_RNDN);
b6bc9d72SGuillaume Chatelet    auto volatile strtold_result = LIBC_NAMESPACE::strtold(str_ptr, &out_ptr);
ae3b59e6SMichael Jones    ptrdiff_t strtold_strlen = out_ptr - str_ptr;
ae3b59e6SMichael Jones    if (result_strlen != strtold_strlen)
3a66446aSMichael Jones      __builtin_trap();
*dfdef2cbSlntue    if (FPBits<long double>(long_double_result).is_nan() ^
*dfdef2cbSlntue        FPBits<long double>(strtold_result).is_nan())
ae3b59e6SMichael Jones      __builtin_trap();
*dfdef2cbSlntue    if (!FPBits<long double>(long_double_result).is_nan() &&
*dfdef2cbSlntue        long_double_result != strtold_result)
ae3b59e6SMichael Jones      __builtin_trap();
2ff8094eSMichael Jones    mpfr_clear(mpfr_long_double);
62e7bdd2SMichael Jones  }
62e7bdd2SMichael Jones
3a66446aSMichael Jones  delete[] container;
3a66446aSMichael Jones  return 0;
3a66446aSMichael Jones}