xref: /llvm-project/libc/src/math/generic/exp10f_impl.h (revision 9a95c097d0466c594f40a4ba9ced8a155574fdff)
1bc7a3bd8Slntue //===-- Single-precision 10^x function ------------------------------------===//
2bc7a3bd8Slntue //
3bc7a3bd8Slntue // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4bc7a3bd8Slntue // See https://llvm.org/LICENSE.txt for license information.
5bc7a3bd8Slntue // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6bc7a3bd8Slntue //
7bc7a3bd8Slntue //===----------------------------------------------------------------------===//
8bc7a3bd8Slntue 
9bc7a3bd8Slntue #ifndef LLVM_LIBC_SRC_MATH_GENERIC_EXP10F_IMPL_H
10bc7a3bd8Slntue #define LLVM_LIBC_SRC_MATH_GENERIC_EXP10F_IMPL_H
11bc7a3bd8Slntue 
12bc7a3bd8Slntue #include "explogxf.h"
13bc7a3bd8Slntue #include "src/__support/FPUtil/FEnvImpl.h"
14bc7a3bd8Slntue #include "src/__support/FPUtil/FPBits.h"
15bc7a3bd8Slntue #include "src/__support/FPUtil/multiply_add.h"
16bc7a3bd8Slntue #include "src/__support/FPUtil/rounding_mode.h"
17bc7a3bd8Slntue #include "src/__support/common.h"
18*5ff3ff33SPetr Hosek #include "src/__support/macros/config.h"
19bc7a3bd8Slntue #include "src/__support/macros/optimization.h" // LIBC_UNLIKELY
20bc7a3bd8Slntue 
21*5ff3ff33SPetr Hosek namespace LIBC_NAMESPACE_DECL {
22*5ff3ff33SPetr Hosek namespace generic {
23bc7a3bd8Slntue 
24bc7a3bd8Slntue LIBC_INLINE float exp10f(float x) {
25bc7a3bd8Slntue   using FPBits = typename fputil::FPBits<float>;
26bc7a3bd8Slntue   FPBits xbits(x);
27bc7a3bd8Slntue 
28bc7a3bd8Slntue   uint32_t x_u = xbits.uintval();
29bc7a3bd8Slntue   uint32_t x_abs = x_u & 0x7fff'ffffU;
30bc7a3bd8Slntue 
31bc7a3bd8Slntue   // When |x| >= log10(2^128), or x is nan
32bc7a3bd8Slntue   if (LIBC_UNLIKELY(x_abs >= 0x421a'209bU)) {
33bc7a3bd8Slntue     // When x < log10(2^-150) or nan
34bc7a3bd8Slntue     if (x_u > 0xc234'9e35U) {
35bc7a3bd8Slntue       // exp(-Inf) = 0
36bc7a3bd8Slntue       if (xbits.is_inf())
37bc7a3bd8Slntue         return 0.0f;
38bc7a3bd8Slntue       // exp(nan) = nan
39bc7a3bd8Slntue       if (xbits.is_nan())
40bc7a3bd8Slntue         return x;
41bc7a3bd8Slntue       if (fputil::fenv_is_round_up())
426b02d2f8SGuillaume Chatelet         return FPBits::min_subnormal().get_val();
43bc7a3bd8Slntue       fputil::set_errno_if_required(ERANGE);
44bc7a3bd8Slntue       fputil::raise_except_if_required(FE_UNDERFLOW);
45bc7a3bd8Slntue       return 0.0f;
46bc7a3bd8Slntue     }
47bc7a3bd8Slntue     // x >= log10(2^128) or nan
4811ec512fSGuillaume Chatelet     if (xbits.is_pos() && (x_u >= 0x421a'209bU)) {
49bc7a3bd8Slntue       // x is finite
50bc7a3bd8Slntue       if (x_u < 0x7f80'0000U) {
51bc7a3bd8Slntue         int rounding = fputil::quick_get_round();
52bc7a3bd8Slntue         if (rounding == FE_DOWNWARD || rounding == FE_TOWARDZERO)
536b02d2f8SGuillaume Chatelet           return FPBits::max_normal().get_val();
54bc7a3bd8Slntue 
55bc7a3bd8Slntue         fputil::set_errno_if_required(ERANGE);
56bc7a3bd8Slntue         fputil::raise_except_if_required(FE_OVERFLOW);
57bc7a3bd8Slntue       }
58bc7a3bd8Slntue       // x is +inf or nan
596b02d2f8SGuillaume Chatelet       return x + FPBits::inf().get_val();
60bc7a3bd8Slntue     }
61bc7a3bd8Slntue   }
62bc7a3bd8Slntue 
63bc7a3bd8Slntue   // When |x| <= log10(2)*2^-6
64bc7a3bd8Slntue   if (LIBC_UNLIKELY(x_abs <= 0x3b9a'209bU)) {
65bc7a3bd8Slntue     if (LIBC_UNLIKELY(x_u == 0xb25e'5bd9U)) { // x = -0x1.bcb7b2p-27f
66bc7a3bd8Slntue       if (fputil::fenv_is_round_to_nearest())
67bc7a3bd8Slntue         return 0x1.fffffep-1f;
68bc7a3bd8Slntue     }
69bc7a3bd8Slntue     // |x| < 2^-25
70bc7a3bd8Slntue     // 10^x ~ 1 + log(10) * x
71bc7a3bd8Slntue     if (LIBC_UNLIKELY(x_abs <= 0x3280'0000U)) {
72bc7a3bd8Slntue       return fputil::multiply_add(x, 0x1.26bb1cp+1f, 1.0f);
73bc7a3bd8Slntue     }
74bc7a3bd8Slntue 
75bc7a3bd8Slntue     return static_cast<float>(Exp10Base::powb_lo(x));
76bc7a3bd8Slntue   }
77bc7a3bd8Slntue 
78bc7a3bd8Slntue   // Exceptional value.
79bc7a3bd8Slntue   if (LIBC_UNLIKELY(x_u == 0x3d14'd956U)) { // x = 0x1.29b2acp-5f
80bc7a3bd8Slntue     if (fputil::fenv_is_round_up())
81bc7a3bd8Slntue       return 0x1.1657c4p+0f;
82bc7a3bd8Slntue   }
83bc7a3bd8Slntue 
84bc7a3bd8Slntue   // Exact outputs when x = 1, 2, ..., 10.
85bc7a3bd8Slntue   // Quick check mask: 0x800f'ffffU = ~(bits of 1.0f | ... | bits of 10.0f)
86bc7a3bd8Slntue   if (LIBC_UNLIKELY((x_u & 0x800f'ffffU) == 0)) {
87bc7a3bd8Slntue     switch (x_u) {
88bc7a3bd8Slntue     case 0x3f800000U: // x = 1.0f
89bc7a3bd8Slntue       return 10.0f;
90bc7a3bd8Slntue     case 0x40000000U: // x = 2.0f
91bc7a3bd8Slntue       return 100.0f;
92bc7a3bd8Slntue     case 0x40400000U: // x = 3.0f
93bc7a3bd8Slntue       return 1'000.0f;
94bc7a3bd8Slntue     case 0x40800000U: // x = 4.0f
95bc7a3bd8Slntue       return 10'000.0f;
96bc7a3bd8Slntue     case 0x40a00000U: // x = 5.0f
97bc7a3bd8Slntue       return 100'000.0f;
98bc7a3bd8Slntue     case 0x40c00000U: // x = 6.0f
99bc7a3bd8Slntue       return 1'000'000.0f;
100bc7a3bd8Slntue     case 0x40e00000U: // x = 7.0f
101bc7a3bd8Slntue       return 10'000'000.0f;
102bc7a3bd8Slntue     case 0x41000000U: // x = 8.0f
103bc7a3bd8Slntue       return 100'000'000.0f;
104bc7a3bd8Slntue     case 0x41100000U: // x = 9.0f
105bc7a3bd8Slntue       return 1'000'000'000.0f;
106bc7a3bd8Slntue     case 0x41200000U: // x = 10.0f
107bc7a3bd8Slntue       return 10'000'000'000.0f;
108bc7a3bd8Slntue     }
109bc7a3bd8Slntue   }
110bc7a3bd8Slntue 
111bc7a3bd8Slntue   // Range reduction: 10^x = 2^(mid + hi) * 10^lo
112bc7a3bd8Slntue   //   rr = (2^(mid + hi), lo)
113bc7a3bd8Slntue   auto rr = exp_b_range_reduc<Exp10Base>(x);
114bc7a3bd8Slntue 
115bc7a3bd8Slntue   // The low part is approximated by a degree-5 minimax polynomial.
116bc7a3bd8Slntue   // 10^lo ~ 1 + COEFFS[0] * lo + ... + COEFFS[4] * lo^5
117bc7a3bd8Slntue   using fputil::multiply_add;
118bc7a3bd8Slntue   double lo2 = rr.lo * rr.lo;
119bc7a3bd8Slntue   // c0 = 1 + COEFFS[0] * lo
120bc7a3bd8Slntue   double c0 = multiply_add(rr.lo, Exp10Base::COEFFS[0], 1.0);
121bc7a3bd8Slntue   // c1 = COEFFS[1] + COEFFS[2] * lo
122bc7a3bd8Slntue   double c1 = multiply_add(rr.lo, Exp10Base::COEFFS[2], Exp10Base::COEFFS[1]);
123bc7a3bd8Slntue   // c2 = COEFFS[3] + COEFFS[4] * lo
124bc7a3bd8Slntue   double c2 = multiply_add(rr.lo, Exp10Base::COEFFS[4], Exp10Base::COEFFS[3]);
125bc7a3bd8Slntue   // p = c1 + c2 * lo^2
126bc7a3bd8Slntue   //   = COEFFS[1] + COEFFS[2] * lo + COEFFS[3] * lo^2 + COEFFS[4] * lo^3
127bc7a3bd8Slntue   double p = multiply_add(lo2, c2, c1);
128bc7a3bd8Slntue   // 10^lo ~ c0 + p * lo^2
129bc7a3bd8Slntue   // 10^x = 2^(mid + hi) * 10^lo
130bc7a3bd8Slntue   //      ~ mh * (c0 + p * lo^2)
131bc7a3bd8Slntue   //      = (mh * c0) + p * (mh * lo^2)
132bc7a3bd8Slntue   return static_cast<float>(multiply_add(p, lo2 * rr.mh, c0 * rr.mh));
133bc7a3bd8Slntue }
134bc7a3bd8Slntue 
135*5ff3ff33SPetr Hosek } // namespace generic
136*5ff3ff33SPetr Hosek } // namespace LIBC_NAMESPACE_DECL
137bc7a3bd8Slntue 
138bc7a3bd8Slntue #endif // LLVM_LIBC_SRC_MATH_GENERIC_EXP10F_IMPL_H
139