/* arm-optimized-routines/math/pow.c */

/*
 * Double-precision x^y function.
 *
 * Copyright (c) 2018-2024, Arm Limited.
 * SPDX-License-Identifier: MIT OR Apache-2.0 WITH LLVM-exception
 */

#include <float.h>
#include <math.h>
#include <stdint.h>
#include "math_config.h"
#include "test_defs.h"

/*
Worst-case error: 0.54 ULP (~= ulperr_exp + 1024*Ln2*relerr_log*2^53)
relerr_log: 1.3 * 2^-68 (Relative error of log, 1.5 * 2^-68 without fma)
ulperr_exp: 0.509 ULP (ULP error of exp, 0.511 ULP without fma)
*/

/* Shorthands for the fields of __pow_log_data used by log_inline.
   T, A and N are redefined or shadowed further down for the exp part, so
   these definitions are only valid up to the matching #undef lines.  */
#define T __pow_log_data.tab
#define A __pow_log_data.poly
#define Ln2hi __pow_log_data.ln2hi
#define Ln2lo __pow_log_data.ln2lo
#define N (1 << POW_LOG_TABLE_BITS)
/* Bit pattern subtracted from the input in log_inline so that the reduced
   argument z falls in [OFF,2*OFF).  */
#define OFF 0x3fe6955500000000

/* Top 12 bits of a double (sign and exponent bits).
   The bit pattern of X is shifted right by 52, so the result holds the sign
   in bit 11 and the biased exponent in bits 0..10.  */
static inline uint32_t
top12 (double x)
{
  return asuint64 (x) >> 52;
}

31914882SAlex Richardson/* Compute y+TAIL = log(x) where the rounded result is y and TAIL has about
31914882SAlex Richardson   additional 15 bits precision.  IX is the bit representation of x, but
31914882SAlex Richardson   normalized in the subnormal range using the sign bit for the exponent.  */
31914882SAlex Richardsonstatic inline double_t
31914882SAlex Richardsonlog_inline (uint64_t ix, double_t *tail)
31914882SAlex Richardson{
31914882SAlex Richardson  /* double_t for better performance on targets with FLT_EVAL_METHOD==2.  */
31914882SAlex Richardson  double_t z, r, y, invc, logc, logctail, kd, hi, t1, t2, lo, lo1, lo2, p;
31914882SAlex Richardson  uint64_t iz, tmp;
31914882SAlex Richardson  int k, i;
31914882SAlex Richardson
31914882SAlex Richardson  /* x = 2^k z; where z is in range [OFF,2*OFF) and exact.
31914882SAlex Richardson     The range is split into N subintervals.
31914882SAlex Richardson     The ith subinterval contains z and c is near its center.  */
31914882SAlex Richardson  tmp = ix - OFF;
31914882SAlex Richardson  i = (tmp >> (52 - POW_LOG_TABLE_BITS)) % N;
31914882SAlex Richardson  k = (int64_t) tmp >> 52; /* arithmetic shift */
31914882SAlex Richardson  iz = ix - (tmp & 0xfffULL << 52);
31914882SAlex Richardson  z = asdouble (iz);
31914882SAlex Richardson  kd = (double_t) k;
31914882SAlex Richardson
31914882SAlex Richardson  /* log(x) = k*Ln2 + log(c) + log1p(z/c-1).  */
31914882SAlex Richardson  invc = T[i].invc;
31914882SAlex Richardson  logc = T[i].logc;
31914882SAlex Richardson  logctail = T[i].logctail;
31914882SAlex Richardson
31914882SAlex Richardson  /* Note: 1/c is j/N or j/N/2 where j is an integer in [N,2N) and
31914882SAlex Richardson     |z/c - 1| < 1/N, so r = z/c - 1 is exactly representible.  */
31914882SAlex Richardson#if HAVE_FAST_FMA
31914882SAlex Richardson  r = fma (z, invc, -1.0);
31914882SAlex Richardson#else
31914882SAlex Richardson  /* Split z such that rhi, rlo and rhi*rhi are exact and |rlo| <= |r|.  */
31914882SAlex Richardson  double_t zhi = asdouble ((iz + (1ULL << 31)) & (-1ULL << 32));
31914882SAlex Richardson  double_t zlo = z - zhi;
31914882SAlex Richardson  double_t rhi = zhi * invc - 1.0;
31914882SAlex Richardson  double_t rlo = zlo * invc;
31914882SAlex Richardson  r = rhi + rlo;
31914882SAlex Richardson#endif
31914882SAlex Richardson
31914882SAlex Richardson  /* k*Ln2 + log(c) + r.  */
31914882SAlex Richardson  t1 = kd * Ln2hi + logc;
31914882SAlex Richardson  t2 = t1 + r;
31914882SAlex Richardson  lo1 = kd * Ln2lo + logctail;
31914882SAlex Richardson  lo2 = t1 - t2 + r;
31914882SAlex Richardson
31914882SAlex Richardson  /* Evaluation is optimized assuming superscalar pipelined execution.  */
31914882SAlex Richardson  double_t ar, ar2, ar3, lo3, lo4;
31914882SAlex Richardson  ar = A[0] * r; /* A[0] = -0.5.  */
31914882SAlex Richardson  ar2 = r * ar;
31914882SAlex Richardson  ar3 = r * ar2;
31914882SAlex Richardson  /* k*Ln2 + log(c) + r + A[0]*r*r.  */
31914882SAlex Richardson#if HAVE_FAST_FMA
31914882SAlex Richardson  hi = t2 + ar2;
31914882SAlex Richardson  lo3 = fma (ar, r, -ar2);
31914882SAlex Richardson  lo4 = t2 - hi + ar2;
31914882SAlex Richardson#else
31914882SAlex Richardson  double_t arhi = A[0] * rhi;
31914882SAlex Richardson  double_t arhi2 = rhi * arhi;
31914882SAlex Richardson  hi = t2 + arhi2;
31914882SAlex Richardson  lo3 = rlo * (ar + arhi);
31914882SAlex Richardson  lo4 = t2 - hi + arhi2;
31914882SAlex Richardson#endif
31914882SAlex Richardson  /* p = log1p(r) - r - A[0]*r*r.  */
31914882SAlex Richardson#if POW_LOG_POLY_ORDER == 8
31914882SAlex Richardson  p = (ar3
31914882SAlex Richardson       * (A[1] + r * A[2] + ar2 * (A[3] + r * A[4] + ar2 * (A[5] + r * A[6]))));
31914882SAlex Richardson#endif
31914882SAlex Richardson  lo = lo1 + lo2 + lo3 + lo4 + p;
31914882SAlex Richardson  y = hi + lo;
31914882SAlex Richardson  *tail = hi - y + lo;
31914882SAlex Richardson  return y;
31914882SAlex Richardson}
31914882SAlex Richardson
/* Switch the N and T shorthands from the log data to the exp data and add
   the remaining shorthands for the fields of __exp_data.  */
#undef N
#undef T
#define N (1 << EXP_TABLE_BITS)
#define InvLn2N __exp_data.invln2N
#define NegLn2hiN __exp_data.negln2hiN
#define NegLn2loN __exp_data.negln2loN
#define Shift __exp_data.shift
#define T __exp_data.tab
/* Polynomial coefficients; the index is offset by EXP_POLY_ORDER.  */
#define C2 __exp_data.poly[5 - EXP_POLY_ORDER]
#define C3 __exp_data.poly[6 - EXP_POLY_ORDER]
#define C4 __exp_data.poly[7 - EXP_POLY_ORDER]
#define C5 __exp_data.poly[8 - EXP_POLY_ORDER]
#define C6 __exp_data.poly[9 - EXP_POLY_ORDER]

/* Handle cases that may overflow or underflow when computing the result that
   is scale*(1+TMP) without intermediate rounding.  The bit representation of
   scale is in SBITS, however it has a computed exponent that may have
   overflown into the sign bit so that needs to be adjusted before using it as
   a double.  (int32_t)KI is the k used in the argument reduction and exponent
   adjustment of scale, positive k here means the result may overflow and
   negative k means the result may underflow.  */
static inline double
specialcase (double_t tmp, uint64_t sbits, uint64_t ki)
{
  double_t scale, y;

  if ((ki & 0x80000000) == 0)
    {
      /* k > 0, the exponent of scale might have overflowed by <= 460.  */
      /* Lower the exponent by 1009 before the multiply-add and restore it
	 with the final multiplication by 2^1009.  */
      sbits -= 1009ull << 52;
      scale = asdouble (sbits);
      y = 0x1p1009 * (scale + scale * tmp);
      return check_oflow (eval_as_double (y));
    }
  /* k < 0, need special care in the subnormal range.  */
  /* Raise the exponent by 1022 here; the final multiplication by 2^-1022
     undoes it.  */
  sbits += 1022ull << 52;
  /* Note: sbits is signed scale.  */
  scale = asdouble (sbits);
  y = scale + scale * tmp;
  if (fabs (y) < 1.0)
    {
      /* Round y to the right precision before scaling it into the subnormal
	 range to avoid double rounding that can cause 0.5+E/2 ulp error where
	 E is the worst-case ulp error outside the subnormal range.  So this
	 is only useful if the goal is better than 1 ulp worst-case error.  */
      double_t hi, lo, one = 1.0;
      if (y < 0.0)
	one = -1.0;
      lo = scale - y + scale * tmp;
      hi = one + y;
      lo = one - hi + y + lo;
      y = eval_as_double (hi + lo) - one;
      /* Fix the sign of 0.  */
      if (y == 0.0)
	y = asdouble (sbits & 0x8000000000000000);
      /* The underflow exception needs to be signaled explicitly.  */
      force_eval_double (opt_barrier_double (0x1p-1022) * 0x1p-1022);
    }
  y = 0x1p-1022 * y;
  return check_uflow (eval_as_double (y));
}

/* Value passed as sign_bias to exp_inline to request a negated result.
   exp_inline adds it to k before shifting left by 52 - EXP_TABLE_BITS, which
   places the 0x800 part at bit 63 (the sign bit) of the scale.  */
#define SIGN_BIAS (0x800 << EXP_TABLE_BITS)

31914882SAlex Richardson/* Computes sign*exp(x+xtail) where |xtail| < 2^-8/N and |xtail| <= |x|.
31914882SAlex Richardson   The sign_bias argument is SIGN_BIAS or 0 and sets the sign to -1 or 1.  */
31914882SAlex Richardsonstatic inline double
31914882SAlex Richardsonexp_inline (double_t x, double_t xtail, uint32_t sign_bias)
31914882SAlex Richardson{
31914882SAlex Richardson  uint32_t abstop;
31914882SAlex Richardson  uint64_t ki, idx, top, sbits;
31914882SAlex Richardson  /* double_t for better performance on targets with FLT_EVAL_METHOD==2.  */
31914882SAlex Richardson  double_t kd, z, r, r2, scale, tail, tmp;
31914882SAlex Richardson
31914882SAlex Richardson  abstop = top12 (x) & 0x7ff;
31914882SAlex Richardson  if (unlikely (abstop - top12 (0x1p-54) >= top12 (512.0) - top12 (0x1p-54)))
31914882SAlex Richardson    {
31914882SAlex Richardson      if (abstop - top12 (0x1p-54) >= 0x80000000)
31914882SAlex Richardson	{
31914882SAlex Richardson	  /* Avoid spurious underflow for tiny x.  */
31914882SAlex Richardson	  /* Note: 0 is common input.  */
31914882SAlex Richardson	  double_t one = WANT_ROUNDING ? 1.0 + x : 1.0;
31914882SAlex Richardson	  return sign_bias ? -one : one;
31914882SAlex Richardson	}
31914882SAlex Richardson      if (abstop >= top12 (1024.0))
31914882SAlex Richardson	{
31914882SAlex Richardson	  /* Note: inf and nan are already handled.  */
31914882SAlex Richardson	  if (asuint64 (x) >> 63)
31914882SAlex Richardson	    return __math_uflow (sign_bias);
31914882SAlex Richardson	  else
31914882SAlex Richardson	    return __math_oflow (sign_bias);
31914882SAlex Richardson	}
31914882SAlex Richardson      /* Large x is special cased below.  */
31914882SAlex Richardson      abstop = 0;
31914882SAlex Richardson    }
31914882SAlex Richardson
31914882SAlex Richardson  /* exp(x) = 2^(k/N) * exp(r), with exp(r) in [2^(-1/2N),2^(1/2N)].  */
31914882SAlex Richardson  /* x = ln2/N*k + r, with int k and r in [-ln2/2N, ln2/2N].  */
31914882SAlex Richardson  z = InvLn2N * x;
31914882SAlex Richardson#if TOINT_INTRINSICS
31914882SAlex Richardson  kd = roundtoint (z);
31914882SAlex Richardson  ki = converttoint (z);
31914882SAlex Richardson#elif EXP_USE_TOINT_NARROW
31914882SAlex Richardson  /* z - kd is in [-0.5-2^-16, 0.5] in all rounding modes.  */
31914882SAlex Richardson  kd = eval_as_double (z + Shift);
31914882SAlex Richardson  ki = asuint64 (kd) >> 16;
31914882SAlex Richardson  kd = (double_t) (int32_t) ki;
31914882SAlex Richardson#else
31914882SAlex Richardson  /* z - kd is in [-1, 1] in non-nearest rounding modes.  */
31914882SAlex Richardson  kd = eval_as_double (z + Shift);
31914882SAlex Richardson  ki = asuint64 (kd);
31914882SAlex Richardson  kd -= Shift;
31914882SAlex Richardson#endif
31914882SAlex Richardson  r = x + kd * NegLn2hiN + kd * NegLn2loN;
31914882SAlex Richardson  /* The code assumes 2^-200 < |xtail| < 2^-8/N.  */
31914882SAlex Richardson  r += xtail;
31914882SAlex Richardson  /* 2^(k/N) ~= scale * (1 + tail).  */
31914882SAlex Richardson  idx = 2 * (ki % N);
31914882SAlex Richardson  top = (ki + sign_bias) << (52 - EXP_TABLE_BITS);
31914882SAlex Richardson  tail = asdouble (T[idx]);
31914882SAlex Richardson  /* This is only a valid scale when -1023*N < k < 1024*N.  */
31914882SAlex Richardson  sbits = T[idx + 1] + top;
31914882SAlex Richardson  /* exp(x) = 2^(k/N) * exp(r) ~= scale + scale * (tail + exp(r) - 1).  */
31914882SAlex Richardson  /* Evaluation is optimized assuming superscalar pipelined execution.  */
31914882SAlex Richardson  r2 = r * r;
31914882SAlex Richardson  /* Without fma the worst case error is 0.25/N ulp larger.  */
31914882SAlex Richardson  /* Worst case error is less than 0.5+1.11/N+(abs poly error * 2^53) ulp.  */
31914882SAlex Richardson#if EXP_POLY_ORDER == 4
31914882SAlex Richardson  tmp = tail + r + r2 * C2 + r * r2 * (C3 + r * C4);
31914882SAlex Richardson#elif EXP_POLY_ORDER == 5
31914882SAlex Richardson  tmp = tail + r + r2 * (C2 + r * C3) + r2 * r2 * (C4 + r * C5);
31914882SAlex Richardson#elif EXP_POLY_ORDER == 6
31914882SAlex Richardson  tmp = tail + r + r2 * (0.5 + r * C3) + r2 * r2 * (C4 + r * C5 + r2 * C6);
31914882SAlex Richardson#endif
31914882SAlex Richardson  if (unlikely (abstop == 0))
31914882SAlex Richardson    return specialcase (tmp, sbits, ki);
31914882SAlex Richardson  scale = asdouble (sbits);
31914882SAlex Richardson  /* Note: tmp == 0 or |tmp| > 2^-200 and scale > 2^-739, so there
31914882SAlex Richardson     is no spurious underflow here even without fma.  */
31914882SAlex Richardson  return eval_as_double (scale + scale * tmp);
31914882SAlex Richardson}
31914882SAlex Richardson
/* Returns 0 if not int, 1 if odd int, 2 if even int.  The argument is
   the bit representation of a non-zero finite floating-point value.
   The sign bit of IY is ignored.  */
static inline int
checkint (uint64_t iy)
{
  /* Biased exponent; 0x3ff corresponds to 2^0.  */
  int e = iy >> 52 & 0x7ff;
  /* |y| < 1 cannot be an integer (zero is excluded by the contract).  */
  if (e < 0x3ff)
    return 0;
  /* |y| >= 2^53: every representable value is an even integer.  */
  if (e > 0x3ff + 52)
    return 2;
  /* Any set bit below the units bit means there is a fractional part.  */
  if (iy & ((1ULL << (0x3ff + 52 - e)) - 1))
    return 0;
  /* The units bit decides odd versus even.  For e == 0x3ff this is bit 52,
     the lowest exponent bit, which is set and stands in for the implicit
     leading 1.  */
  if (iy & (1ULL << (0x3ff + 52 - e)))
    return 1;
  return 2;
}

/* Returns 1 if input is the bit representation of 0, infinity or nan.
   Doubling I discards the sign bit; subtracting 1 then wraps +-0 around to
   the largest unsigned value, so a single unsigned comparison covers zero
   as well as everything at or above infinity.  */
static inline int
zeroinfnan (uint64_t i)
{
  return 2 * i - 1 >= 2 * asuint64 (INFINITY) - 1;
}

31914882SAlex Richardsondouble
31914882SAlex Richardsonpow (double x, double y)
31914882SAlex Richardson{
31914882SAlex Richardson  uint32_t sign_bias = 0;
31914882SAlex Richardson  uint64_t ix, iy;
31914882SAlex Richardson  uint32_t topx, topy;
31914882SAlex Richardson
31914882SAlex Richardson  ix = asuint64 (x);
31914882SAlex Richardson  iy = asuint64 (y);
31914882SAlex Richardson  topx = top12 (x);
31914882SAlex Richardson  topy = top12 (y);
31914882SAlex Richardson  if (unlikely (topx - 0x001 >= 0x7ff - 0x001
31914882SAlex Richardson		|| (topy & 0x7ff) - 0x3be >= 0x43e - 0x3be))
31914882SAlex Richardson    {
31914882SAlex Richardson      /* Note: if |y| > 1075 * ln2 * 2^53 ~= 0x1.749p62 then pow(x,y) = inf/0
31914882SAlex Richardson	 and if |y| < 2^-54 / 1075 ~= 0x1.e7b6p-65 then pow(x,y) = +-1.  */
31914882SAlex Richardson      /* Special cases: (x < 0x1p-126 or inf or nan) or
31914882SAlex Richardson	 (|y| < 0x1p-65 or |y| >= 0x1p63 or nan).  */
31914882SAlex Richardson      if (unlikely (zeroinfnan (iy)))
31914882SAlex Richardson	{
31914882SAlex Richardson	  if (2 * iy == 0)
31914882SAlex Richardson	    return issignaling_inline (x) ? x + y : 1.0;
31914882SAlex Richardson	  if (ix == asuint64 (1.0))
31914882SAlex Richardson	    return issignaling_inline (y) ? x + y : 1.0;
31914882SAlex Richardson	  if (2 * ix > 2 * asuint64 (INFINITY)
31914882SAlex Richardson	      || 2 * iy > 2 * asuint64 (INFINITY))
31914882SAlex Richardson	    return x + y;
31914882SAlex Richardson	  if (2 * ix == 2 * asuint64 (1.0))
31914882SAlex Richardson	    return 1.0;
31914882SAlex Richardson	  if ((2 * ix < 2 * asuint64 (1.0)) == !(iy >> 63))
31914882SAlex Richardson	    return 0.0; /* |x|<1 && y==inf or |x|>1 && y==-inf.  */
31914882SAlex Richardson	  return y * y;
31914882SAlex Richardson	}
31914882SAlex Richardson      if (unlikely (zeroinfnan (ix)))
31914882SAlex Richardson	{
31914882SAlex Richardson	  double_t x2 = x * x;
31914882SAlex Richardson	  if (ix >> 63 && checkint (iy) == 1)
31914882SAlex Richardson	    {
31914882SAlex Richardson	      x2 = -x2;
31914882SAlex Richardson	      sign_bias = 1;
31914882SAlex Richardson	    }
31914882SAlex Richardson	  if (WANT_ERRNO && 2 * ix == 0 && iy >> 63)
31914882SAlex Richardson	    return __math_divzero (sign_bias);
31914882SAlex Richardson	  /* Without the barrier some versions of clang hoist the 1/x2 and
31914882SAlex Richardson	     thus division by zero exception can be signaled spuriously.  */
31914882SAlex Richardson	  return iy >> 63 ? opt_barrier_double (1 / x2) : x2;
31914882SAlex Richardson	}
31914882SAlex Richardson      /* Here x and y are non-zero finite.  */
31914882SAlex Richardson      if (ix >> 63)
31914882SAlex Richardson	{
31914882SAlex Richardson	  /* Finite x < 0.  */
31914882SAlex Richardson	  int yint = checkint (iy);
31914882SAlex Richardson	  if (yint == 0)
31914882SAlex Richardson	    return __math_invalid (x);
31914882SAlex Richardson	  if (yint == 1)
31914882SAlex Richardson	    sign_bias = SIGN_BIAS;
31914882SAlex Richardson	  ix &= 0x7fffffffffffffff;
31914882SAlex Richardson	  topx &= 0x7ff;
31914882SAlex Richardson	}
31914882SAlex Richardson      if ((topy & 0x7ff) - 0x3be >= 0x43e - 0x3be)
31914882SAlex Richardson	{
31914882SAlex Richardson	  /* Note: sign_bias == 0 here because y is not odd.  */
31914882SAlex Richardson	  if (ix == asuint64 (1.0))
31914882SAlex Richardson	    return 1.0;
31914882SAlex Richardson	  if ((topy & 0x7ff) < 0x3be)
31914882SAlex Richardson	    {
31914882SAlex Richardson	      /* |y| < 2^-65, x^y ~= 1 + y*log(x).  */
31914882SAlex Richardson	      if (WANT_ROUNDING)
31914882SAlex Richardson		return ix > asuint64 (1.0) ? 1.0 + y : 1.0 - y;
31914882SAlex Richardson	      else
31914882SAlex Richardson		return 1.0;
31914882SAlex Richardson	    }
31914882SAlex Richardson	  return (ix > asuint64 (1.0)) == (topy < 0x800) ? __math_oflow (0)
31914882SAlex Richardson							 : __math_uflow (0);
31914882SAlex Richardson	}
31914882SAlex Richardson      if (topx == 0)
31914882SAlex Richardson	{
31914882SAlex Richardson	  /* Normalize subnormal x so exponent becomes negative.  */
31914882SAlex Richardson	  /* Without the barrier some versions of clang evalutate the mul
31914882SAlex Richardson	     unconditionally causing spurious overflow exceptions.  */
31914882SAlex Richardson	  ix = asuint64 (opt_barrier_double (x) * 0x1p52);
31914882SAlex Richardson	  ix &= 0x7fffffffffffffff;
31914882SAlex Richardson	  ix -= 52ULL << 52;
31914882SAlex Richardson	}
31914882SAlex Richardson    }
31914882SAlex Richardson
31914882SAlex Richardson  double_t lo;
31914882SAlex Richardson  double_t hi = log_inline (ix, &lo);
31914882SAlex Richardson  double_t ehi, elo;
31914882SAlex Richardson#if HAVE_FAST_FMA
31914882SAlex Richardson  ehi = y * hi;
31914882SAlex Richardson  elo = y * lo + fma (y, hi, -ehi);
31914882SAlex Richardson#else
31914882SAlex Richardson  double_t yhi = asdouble (iy & -1ULL << 27);
31914882SAlex Richardson  double_t ylo = y - yhi;
31914882SAlex Richardson  double_t lhi = asdouble (asuint64 (hi) & -1ULL << 27);
31914882SAlex Richardson  double_t llo = hi - lhi + lo;
31914882SAlex Richardson  ehi = yhi * lhi;
31914882SAlex Richardson  elo = ylo * lhi + y * llo; /* |elo| < |ehi| * 2^-25.  */
31914882SAlex Richardson#endif
31914882SAlex Richardson  return exp_inline (ehi, elo, sign_bias);
31914882SAlex Richardson}
/* Extra entry points that are only emitted when USE_GLIBC_ABI is set.  */
#if USE_GLIBC_ABI
strong_alias (pow, __pow_finite)
hidden_alias (pow, __ieee754_pow)
/* When long double has the same 53-bit mantissa as double, powl simply
   forwards to pow.  */
# if LDBL_MANT_DIG == 53
long double powl (long double x, long double y) { return pow (x, y); }
# endif
#endif

*f3087befSAndrew TurnerTEST_ULP (pow, 0.05)
*f3087befSAndrew TurnerTEST_ULP_NONNEAREST (pow, 0.5)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0.5, 2.0, 0, inf, 20000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, -0.5, -2.0, 0, inf, 20000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0.5, 2.0, -0, -inf, 20000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, -0.5, -2.0, -0, -inf, 20000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0.5, 2.0, 0x1p-10, 0x1p10, 40000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0.5, 2.0, -0x1p-10, -0x1p10, 40000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0, inf, 0.5, 2.0, 80000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0, inf, -0.5, -2.0, 80000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0x1.fp-1, 0x1.08p0, 0x1p8, 0x1p17, 80000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0x1.fp-1, 0x1.08p0, -0x1p8, -0x1p17, 80000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0, 0x1p-1000, 0, 1.0, 50000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0x1p1000, inf, 0, 1.0, 50000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0x1.ffffffffffff0p-1, 0x1.0000000000008p0, 0x1p60, 0x1p68,
*f3087befSAndrew Turner		50000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, 0x1.ffffffffff000p-1, 0x1p0, 0x1p50, 0x1p52, 50000)
*f3087befSAndrew TurnerTEST_INTERVAL2 (pow, -0x1.ffffffffff000p-1, -0x1p0, 0x1p50, 0x1p52, 50000)