math/generic/tanpif16.cpp

//===-- Half-precision tanpif function ------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
f7bb1290Swldfngrs
f7bb1290Swldfngrs#include "src/math/tanpif16.h"
f7bb1290Swldfngrs#include "hdr/errno_macros.h"
f7bb1290Swldfngrs#include "hdr/fenv_macros.h"
f7bb1290Swldfngrs#include "sincosf16_utils.h"
f7bb1290Swldfngrs#include "src/__support/FPUtil/FEnvImpl.h"
f7bb1290Swldfngrs#include "src/__support/FPUtil/FPBits.h"
f7bb1290Swldfngrs#include "src/__support/FPUtil/cast.h"
f7bb1290Swldfngrs#include "src/__support/FPUtil/except_value_utils.h"
f7bb1290Swldfngrs#include "src/__support/FPUtil/multiply_add.h"
f7bb1290Swldfngrs#include "src/__support/macros/optimization.h"
f7bb1290Swldfngrs
f7bb1290Swldfngrsnamespace LIBC_NAMESPACE_DECL {
f7bb1290Swldfngrs
f7bb1290Swldfngrsconstexpr size_t N_EXCEPTS = 21;
f7bb1290Swldfngrs
cd04653cSwldfngrsconstexpr fputil::ExceptValues<float16, N_EXCEPTS> TANPIF16_EXCEPTS{{
f7bb1290Swldfngrs    // (input, RZ output, RU offset, RD offset, RN offset)
f7bb1290Swldfngrs    {0x07f2, 0x0e3d, 1, 0, 0}, {0x086a, 0x0eee, 1, 0, 1},
f7bb1290Swldfngrs    {0x08db, 0x0fa0, 1, 0, 0}, {0x094c, 0x1029, 1, 0, 0},
f7bb1290Swldfngrs    {0x0b10, 0x118c, 1, 0, 0}, {0x1ce0, 0x23a8, 1, 0, 1},
f7bb1290Swldfngrs    {0x1235, 0x18e0, 1, 0, 0}, {0x2579, 0x2c4e, 1, 0, 0},
f7bb1290Swldfngrs    {0x28b2, 0x2f68, 1, 0, 1}, {0x2a43, 0x30f4, 1, 0, 1},
f7bb1290Swldfngrs    {0x31b7, 0x3907, 1, 0, 0}, {0x329d, 0x3a12, 1, 0, 1},
f7bb1290Swldfngrs    {0x34f1, 0x3dd7, 1, 0, 0}, {0x3658, 0x41ee, 1, 0, 0},
f7bb1290Swldfngrs    {0x38d4, 0xc1ee, 0, 1, 0}, {0x3d96, 0x41ee, 1, 0, 0},
f7bb1290Swldfngrs    {0x3e6a, 0xc1ee, 0, 1, 0}, {0x40cb, 0x41ee, 1, 0, 0},
f7bb1290Swldfngrs    {0x4135, 0xc1ee, 0, 1, 0}, {0x42cb, 0x41ee, 1, 0, 0},
f7bb1290Swldfngrs    {0x4335, 0xc1ee, 0, 1, 0},
f7bb1290Swldfngrs}};
f7bb1290Swldfngrs
// Computes tan(pi * x) for a half-precision argument.
//
// Special cases handled below:
//   - x = +/-0 is returned unchanged.
//   - Inputs listed in TANPIF16_EXCEPTS return their tabulated result.
//   - x = +/-inf sets errno to EDOM, raises FE_INVALID and returns NaN.
//   - NaN inputs return NaN.
//   - Finite |x| >= 2^10 is an integer, so a zero with the sign of x is
//     returned.
//   - Poles (x = n + 0.5) set errno to ERANGE, raise FE_DIVBYZERO and return
//     +inf for even n, -inf for odd n.
LLVM_LIBC_FUNCTION(float16, tanpif16, (float16 x)) {
  using FPBits = typename fputil::FPBits<float16>;
  FPBits xbits(x);

  uint16_t x_u = xbits.uintval();
  // Clear the sign bit to obtain the bit pattern of |x|.
  uint16_t x_abs = x_u & 0x7fff;

  // Handle exceptional values. 0x4335 is the largest input stored in
  // TANPIF16_EXCEPTS, so larger magnitudes can skip the table lookup.
  if (LIBC_UNLIKELY(x_abs <= 0x4335)) {
    // +/-0 maps to itself.
    if (LIBC_UNLIKELY(x_abs == 0U))
      return x;

    bool x_sign = x_u >> 15;
    if (auto r = TANPIF16_EXCEPTS.lookup_odd(x_abs, x_sign);
        LIBC_UNLIKELY(r.has_value()))
      return r.value();
  }

  // Numbers greater or equal to 2^10 are integers, or infinity, or NaN
  if (LIBC_UNLIKELY(x_abs >= 0x6400)) {
    // Check for NaN or infinity values
    if (LIBC_UNLIKELY(x_abs >= 0x7c00)) {
      // Only infinity is a domain error; NaN just propagates.
      if (x_abs == 0x7c00) {
        fputil::set_errno_if_required(EDOM);
        fputil::raise_except_if_required(FE_INVALID);
      }

      return x + FPBits::quiet_nan().get_val();
    }

    // tan(pi * integer) is a zero; keep the sign of the input.
    return FPBits::zero(xbits.sign()).get_val();
  }

  // Range reduction:
  // For |x| > 1/32, we perform range reduction as follows:
  // Find k and y such that:
  //   x = (k + y) * 1/32
  //   k is an integer
  //   |y| < 0.5
  //
  // This is done by performing:
  //   k = round(x * 32)
  //   y = x * 32 - k
  //
  // Once k and y are computed, we then deduce the answer by the formula:
  // tan(pi * x) = sin(pi * x) / cos(pi * x)
  //             = (sin_y * cos_k + cos_y * sin_k) /
  //               (cos_y * cos_k - sin_y * sin_k)
  // where the *_k terms are the sine/cosine of k * pi/32 and the *_y terms
  // are the sine/cosine of y * pi/32.
  float xf = x;
  float sin_k, cos_k, sin_y, cosm1_y;
  sincospif16_eval(xf, sin_k, cos_k, sin_y, cosm1_y);

  // With sin_y == 0 and cos_k == 0 the denominator below is exactly zero:
  // this is a pole of tan(pi * x).
  if (LIBC_UNLIKELY(sin_y == 0 && cos_k == 0)) {
    // A pole error is reported as ERANGE together with FE_DIVBYZERO; EDOM is
    // reserved for domain errors such as the infinity case above.
    fputil::set_errno_if_required(ERANGE);
    fputil::raise_except_if_required(FE_DIVBYZERO);

    // Writing x = n + 0.5, the parity of n selects the sign of the result.
    int16_t n = static_cast<int16_t>(x - 0.5);
    return ((n & 0x1) ? -1 : 1) * FPBits::inf().get_val();
  }

  using fputil::multiply_add;
  // cosm1_y holds cos_y - 1, so multiply_add(cosm1_y, t, t) evaluates
  // cos_y * t.
  return fputil::cast<float16>(
      multiply_add(sin_y, cos_k, multiply_add(cosm1_y, sin_k, sin_k)) /
      multiply_add(sin_y, -sin_k, multiply_add(cosm1_y, cos_k, cos_k)));
}
f7bb1290Swldfngrs
f7bb1290Swldfngrs} // namespace LIBC_NAMESPACE_DECL