//===-- Half-precision 10^x function --------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "src/math/exp10f16.h"
#include "expxf16.h"
#include "hdr/errno_macros.h"
#include "hdr/fenv_macros.h"
#include "src/__support/CPP/array.h"
#include "src/__support/FPUtil/FEnvImpl.h"
#include "src/__support/FPUtil/FPBits.h"
#include "src/__support/FPUtil/PolyEval.h"
#include "src/__support/FPUtil/cast.h"
#include "src/__support/FPUtil/except_value_utils.h"
#include "src/__support/FPUtil/multiply_add.h"
#include "src/__support/FPUtil/nearest_integer.h"
#include "src/__support/FPUtil/rounding_mode.h"
#include "src/__support/common.h"
#include "src/__support/macros/config.h"
#include "src/__support/macros/optimization.h"
#include "src/__support/macros/properties/cpu_features.h"

namespace LIBC_NAMESPACE_DECL {

// Number of entries in the EXP10F16_EXCEPTS table defined below. The table
// always holds 5 entries; targets without LIBC_TARGET_CPU_HAS_FMA add 3 more,
// so this count must stay in sync with the #ifndef section of that table.
#ifdef LIBC_TARGET_CPU_HAS_FMA
static constexpr size_t N_EXP10F16_EXCEPTS = 5;
#else
static constexpr size_t N_EXP10F16_EXCEPTS = 8;
#endif

static constexpr fputil::ExceptValues<float16, N_EXP10F16_EXCEPTS> 3659338ad8SOverMighty EXP10F16_EXCEPTS = {{ 3759338ad8SOverMighty // x = 0x1.8f4p-2, exp10f16(x) = 0x1.3ap+1 (RZ) 3859338ad8SOverMighty {0x363dU, 0x40e8U, 1U, 0U, 1U}, 3959338ad8SOverMighty // x = 0x1.95cp-2, exp10f16(x) = 0x1.3ecp+1 (RZ) 4059338ad8SOverMighty {0x3657U, 0x40fbU, 1U, 0U, 0U}, 4159338ad8SOverMighty // x = -0x1.018p-4, exp10f16(x) = 0x1.bbp-1 (RZ) 4259338ad8SOverMighty {0xac06U, 0x3aecU, 1U, 0U, 0U}, 4359338ad8SOverMighty // x = -0x1.c28p+0, exp10f16(x) = 0x1.1ccp-6 (RZ) 4459338ad8SOverMighty {0xbf0aU, 0x2473U, 1U, 0U, 0U}, 4559338ad8SOverMighty // x = -0x1.e1cp+1, exp10f16(x) = 0x1.694p-13 (RZ) 4659338ad8SOverMighty {0xc387U, 0x09a5U, 1U, 0U, 0U}, 4759338ad8SOverMighty #ifndef LIBC_TARGET_CPU_HAS_FMA 4859338ad8SOverMighty // x = 0x1.0cp+1, exp10f16(x) = 0x1.f04p+6 (RZ) 4959338ad8SOverMighty {0x4030U, 0x57c1U, 1U, 0U, 1U}, 5059338ad8SOverMighty // x = 0x1.1b8p+1, exp10f16(x) = 0x1.47cp+7 (RZ) 5159338ad8SOverMighty {0x406eU, 0x591fU, 1U, 0U, 1U}, 5259338ad8SOverMighty // x = 0x1.1b8p+2, exp10f16(x) = 0x1.a4p+14 (RZ) 5359338ad8SOverMighty {0x446eU, 0x7690U, 1U, 0U, 1U}, 5459338ad8SOverMighty #endif 5559338ad8SOverMighty }}; 5659338ad8SOverMighty 5759338ad8SOverMighty LLVM_LIBC_FUNCTION(float16, exp10f16, (float16 x)) { 5859338ad8SOverMighty using FPBits = fputil::FPBits<float16>; 5959338ad8SOverMighty FPBits x_bits(x); 6059338ad8SOverMighty 6159338ad8SOverMighty uint16_t x_u = x_bits.uintval(); 6259338ad8SOverMighty uint16_t x_abs = x_u & 0x7fffU; 6359338ad8SOverMighty 6459338ad8SOverMighty // When |x| >= 5, or x is NaN. 
6559338ad8SOverMighty if (LIBC_UNLIKELY(x_abs >= 0x4500U)) { 6659338ad8SOverMighty // exp10(NaN) = NaN 6759338ad8SOverMighty if (x_bits.is_nan()) { 6859338ad8SOverMighty if (x_bits.is_signaling_nan()) { 6959338ad8SOverMighty fputil::raise_except_if_required(FE_INVALID); 7059338ad8SOverMighty return FPBits::quiet_nan().get_val(); 7159338ad8SOverMighty } 7259338ad8SOverMighty 7359338ad8SOverMighty return x; 7459338ad8SOverMighty } 7559338ad8SOverMighty 7659338ad8SOverMighty // When x >= 5. 7759338ad8SOverMighty if (x_bits.is_pos()) { 7859338ad8SOverMighty // exp10(+inf) = +inf 7959338ad8SOverMighty if (x_bits.is_inf()) 8059338ad8SOverMighty return FPBits::inf().get_val(); 8159338ad8SOverMighty 8259338ad8SOverMighty switch (fputil::quick_get_round()) { 8359338ad8SOverMighty case FE_TONEAREST: 8459338ad8SOverMighty case FE_UPWARD: 8559338ad8SOverMighty fputil::set_errno_if_required(ERANGE); 8659338ad8SOverMighty fputil::raise_except_if_required(FE_OVERFLOW); 8759338ad8SOverMighty return FPBits::inf().get_val(); 8859338ad8SOverMighty default: 8959338ad8SOverMighty return FPBits::max_normal().get_val(); 9059338ad8SOverMighty } 9159338ad8SOverMighty } 9259338ad8SOverMighty 9359338ad8SOverMighty // When x <= -8. 9459338ad8SOverMighty if (x_u >= 0xc800U) { 9559338ad8SOverMighty // exp10(-inf) = +0 9659338ad8SOverMighty if (x_bits.is_inf()) 9759338ad8SOverMighty return FPBits::zero().get_val(); 9859338ad8SOverMighty 9959338ad8SOverMighty fputil::set_errno_if_required(ERANGE); 10059338ad8SOverMighty fputil::raise_except_if_required(FE_UNDERFLOW | FE_INEXACT); 10159338ad8SOverMighty 10259338ad8SOverMighty if (fputil::fenv_is_round_up()) 10359338ad8SOverMighty return FPBits::min_subnormal().get_val(); 10459338ad8SOverMighty return FPBits::zero().get_val(); 10559338ad8SOverMighty } 10659338ad8SOverMighty } 10759338ad8SOverMighty 10859338ad8SOverMighty // When x is 1, 2, 3, or 4. These are hard-to-round cases with exact results. 
10959338ad8SOverMighty if (LIBC_UNLIKELY((x_u & ~(0x3c00U | 0x4000U | 0x4200U | 0x4400U)) == 0)) { 11059338ad8SOverMighty switch (x_u) { 11159338ad8SOverMighty case 0x3c00U: // x = 1.0f16 112127349fcSOverMighty return fputil::cast<float16>(10.0); 11359338ad8SOverMighty case 0x4000U: // x = 2.0f16 114127349fcSOverMighty return fputil::cast<float16>(100.0); 11559338ad8SOverMighty case 0x4200U: // x = 3.0f16 116127349fcSOverMighty return fputil::cast<float16>(1'000.0); 11759338ad8SOverMighty case 0x4400U: // x = 4.0f16 118127349fcSOverMighty return fputil::cast<float16>(10'000.0); 11959338ad8SOverMighty } 12059338ad8SOverMighty } 12159338ad8SOverMighty 12259338ad8SOverMighty if (auto r = EXP10F16_EXCEPTS.lookup(x_u); LIBC_UNLIKELY(r.has_value())) 12359338ad8SOverMighty return r.value(); 12459338ad8SOverMighty 12595c24cb9SOverMighty // 10^x = 2^((hi + mid) * log2(10)) * 10^lo 12695c24cb9SOverMighty auto [exp2_hi_mid, exp10_lo] = exp10_range_reduction(x); 127*803220dbSwldfngrs return fputil::cast<float16>(exp2_hi_mid * exp10_lo); 12859338ad8SOverMighty } 12959338ad8SOverMighty 13059338ad8SOverMighty } // namespace LIBC_NAMESPACE_DECL 131