msun/ld80/e_powl.c

6813d08fSMatt Macy/*-
6813d08fSMatt Macy * Copyright (c) 2008 Stephen L. Moshier <steve@moshier.net>
6813d08fSMatt Macy *
6813d08fSMatt Macy * Permission to use, copy, modify, and distribute this software for any
6813d08fSMatt Macy * purpose with or without fee is hereby granted, provided that the above
6813d08fSMatt Macy * copyright notice and this permission notice appear in all copies.
6813d08fSMatt Macy *
6813d08fSMatt Macy * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
6813d08fSMatt Macy * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
6813d08fSMatt Macy * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
6813d08fSMatt Macy * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
6813d08fSMatt Macy * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
6813d08fSMatt Macy * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
6813d08fSMatt Macy * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
6813d08fSMatt Macy */
6813d08fSMatt Macy
5a4c3b83SDimitry Andric#include <math.h>
5a4c3b83SDimitry Andric
5a4c3b83SDimitry Andric#include "math_private.h"
5a4c3b83SDimitry Andric
/*
 * Polynomial evaluator (Horner's rule):
 *  PP[0] x^n  +  PP[1] x^(n-1)  +  ...  +  PP[n]
 *
 * PP must hold n + 1 coefficients, highest order first.  For n <= 0 the
 * polynomial is the constant PP[0]; no coefficient past PP[0] is read in
 * that case.
 */
static inline long double
__polevll(long double x, const long double *PP, int n)
{
	const long double *P;
	long double y;

	P = PP;
	y = *P++;
	/* One multiply-add per remaining coefficient. */
	while (n-- > 0)
		y = y * x + *P++;

	return (y);
}
5a4c3b83SDimitry Andric
/*
 * Polynomial evaluator for a monic polynomial (leading coefficient 1 is
 * implied and not stored):
 *  x^n  +  PP[0] x^(n-1)  +  PP[1] x^(n-2)  +  ...  +  PP[n-1]
 *
 * PP must hold n coefficients.  For n <= 0 the polynomial is the constant
 * 1 and PP is not read.
 */
static inline long double
__p1evll(long double x, const long double *PP, int n)
{
	const long double *P;
	long double y;

	if (n <= 0)
		return (1.0L);

	P = PP;
	/* The implied leading 1 turns the first Horner step into x + PP[0]. */
	y = x + *P++;
	while (--n > 0)
		y = y * x + *P++;

	return (y);
}
5a4c3b83SDimitry Andric
6813d08fSMatt Macy/*							powl.c
6813d08fSMatt Macy *
6813d08fSMatt Macy *	Power function, long double precision
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy * SYNOPSIS:
6813d08fSMatt Macy *
6813d08fSMatt Macy * long double x, y, z, powl();
6813d08fSMatt Macy *
6813d08fSMatt Macy * z = powl( x, y );
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy * DESCRIPTION:
6813d08fSMatt Macy *
6813d08fSMatt Macy * Computes x raised to the yth power.  Analytically,
6813d08fSMatt Macy *
6813d08fSMatt Macy *      x**y  =  exp( y log(x) ).
6813d08fSMatt Macy *
6813d08fSMatt Macy * Following Cody and Waite, this program uses a lookup table
 * of 2**(-i/32) and pseudo extended precision arithmetic to
6813d08fSMatt Macy * obtain several extra bits of accuracy in both the logarithm
6813d08fSMatt Macy * and the exponential.
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy * ACCURACY:
6813d08fSMatt Macy *
6813d08fSMatt Macy * The relative error of pow(x,y) can be estimated
6813d08fSMatt Macy * by   y dl ln(2),   where dl is the absolute error of
6813d08fSMatt Macy * the internally computed base 2 logarithm.  At the ends
 * of the approximation interval the logarithm equals 1/32
6813d08fSMatt Macy * and its relative error is about 1 lsb = 1.1e-19.  Hence
6813d08fSMatt Macy * the predicted relative error in the result is 2.3e-21 y .
6813d08fSMatt Macy *
6813d08fSMatt Macy *                      Relative error:
6813d08fSMatt Macy * arithmetic   domain     # trials      peak         rms
6813d08fSMatt Macy *
6813d08fSMatt Macy *    IEEE     +-1000       40000      2.8e-18      3.7e-19
6813d08fSMatt Macy * .001 < x < 1000, with log(x) uniformly distributed.
6813d08fSMatt Macy * -1000 < y < 1000, y uniformly distributed.
6813d08fSMatt Macy *
6813d08fSMatt Macy *    IEEE     0,8700       60000      6.5e-18      1.0e-18
6813d08fSMatt Macy * 0.99 < x < 1.01, 0 < y < 8700, uniformly distributed.
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy * ERROR MESSAGES:
6813d08fSMatt Macy *
6813d08fSMatt Macy *   message         condition      value returned
6813d08fSMatt Macy * pow overflow     x**y > MAXNUM      INFINITY
6813d08fSMatt Macy * pow underflow   x**y < 1/MAXNUM       0.0
 * pow domain      x<0 and y noninteger  NaN
6813d08fSMatt Macy *
6813d08fSMatt Macy */
6813d08fSMatt Macy
6813d08fSMatt Macy#include <float.h>
6813d08fSMatt Macy#include <math.h>
6813d08fSMatt Macy
6813d08fSMatt Macy#include "math_private.h"
6813d08fSMatt Macy
/* Table size: number of steps per octave in the antilog table A[]. */
#define NXT	32
/* log2(Table size); must satisfy NXT == 2^LNXT. */
#define LNXT	5
6813d08fSMatt Macy
/*
 * Rational approximation coefficients:
 *
 *	log(1+x) = x - x^2/2 + x^3 * P(x)/Q(x)
 *
 * on the domain  2^(-1/32) - 1  <=  x  <=  2^(1/32) - 1.
 * P is evaluated with __polevll() and Q with __p1evll(), so both are
 * stored highest order first and Q omits its leading coefficient of 1.
 */
static const long double P[] = {
	8.3319510773868690346226E-4L,
	4.9000050881978028599627E-1L,
	1.7500123722550302671919E0L,
	1.4000100839971580279335E0L,
};

static const long double Q[] = {
	/* implied leading coefficient: 1.0000000000000000000000E0L */
	5.2500282295834889175431E0L,
	8.4000598057587009834666E0L,
	4.2000302519914740834728E0L,
};
/*
 * Antilog table: A[i] = 2^(-i/32), rounded to IEEE long double precision.
 * The trailing comment on each row is the index i.
 */
static const long double A[33] = {
	1.0000000000000000000000E0L,	/*  0 */
	9.7857206208770013448287E-1L,	/*  1 */
	9.5760328069857364691013E-1L,	/*  2 */
	9.3708381705514995065011E-1L,	/*  3 */
	9.1700404320467123175367E-1L,	/*  4 */
	8.9735453750155359320742E-1L,	/*  5 */
	8.7812608018664974155474E-1L,	/*  6 */
	8.5930964906123895780165E-1L,	/*  7 */
	8.4089641525371454301892E-1L,	/*  8 */
	8.2287773907698242225554E-1L,	/*  9 */
	8.0524516597462715409607E-1L,	/* 10 */
	7.8799042255394324325455E-1L,	/* 11 */
	7.7110541270397041179298E-1L,	/* 12 */
	7.5458221379671136985669E-1L,	/* 13 */
	7.3841307296974965571198E-1L,	/* 14 */
	7.2259040348852331001267E-1L,	/* 15 */
	7.0710678118654752438189E-1L,	/* 16 */
	6.9195494098191597746178E-1L,	/* 17 */
	6.7712777346844636413344E-1L,	/* 18 */
	6.6261832157987064729696E-1L,	/* 19 */
	6.4841977732550483296079E-1L,	/* 20 */
	6.3452547859586661129850E-1L,	/* 21 */
	6.2092890603674202431705E-1L,	/* 22 */
	6.0762367999023443907803E-1L,	/* 23 */
	5.9460355750136053334378E-1L,	/* 24 */
	5.8186242938878875689693E-1L,	/* 25 */
	5.6939431737834582684856E-1L,	/* 26 */
	5.5719337129794626814472E-1L,	/* 27 */
	5.4525386633262882960438E-1L,	/* 28 */
	5.3357020033841180906486E-1L,	/* 29 */
	5.2213689121370692017331E-1L,	/* 30 */
	5.1094857432705833910408E-1L,	/* 31 */
	5.0000000000000000000000E-1L,	/* 32 */
};

/*
 * Low-order correction terms for the even entries of A[]:
 * if i is even, A[i] + B[i/2] gives additional accuracy.
 */
static const long double B[17] = {
	 0.0000000000000000000000E0L,	/* pairs with A[0]  */
	 2.6176170809902549338711E-20L,	/* pairs with A[2]  */
	-1.0126791927256478897086E-20L,	/* pairs with A[4]  */
	 1.3438228172316276937655E-21L,	/* pairs with A[6]  */
	 1.2207982955417546912101E-20L,	/* pairs with A[8]  */
	-6.3084814358060867200133E-21L,	/* pairs with A[10] */
	 1.3164426894366316434230E-20L,	/* pairs with A[12] */
	-1.8527916071632873716786E-20L,	/* pairs with A[14] */
	 1.8950325588932570796551E-20L,	/* pairs with A[16] */
	 1.5564775779538780478155E-20L,	/* pairs with A[18] */
	 6.0859793637556860974380E-21L,	/* pairs with A[20] */
	-2.0208749253662532228949E-20L,	/* pairs with A[22] */
	 1.4966292219224761844552E-20L,	/* pairs with A[24] */
	 3.3540909728056476875639E-21L,	/* pairs with A[26] */
	-8.6987564101742849540743E-22L,	/* pairs with A[28] */
	-1.2327176863327626135542E-20L,	/* pairs with A[30] */
	 0.0000000000000000000000E0L,	/* pairs with A[32] */
};
6813d08fSMatt Macy
/*
 * Polynomial coefficients for the base 2 exponential:
 *
 *	2^x = 1 + x R(x)
 *
 * on the interval -1/32 <= x <= 0, stored highest order first for
 * __polevll().
 */
static const long double R[] = {
	1.5089970579127659901157E-5L,
	1.5402715328927013076125E-4L,
	1.3333556028915671091390E-3L,
	9.6181291046036762031786E-3L,
	5.5504108664798463044015E-2L,
	2.4022650695910062854352E-1L,
	6.9314718055994530931447E-1L,
};
6813d08fSMatt Macy
/* Accessors for the antilog table and its low-order corrections. */
#define douba(k)	A[k]
#define doubb(k)	B[k]

/* Overflow limit for the scaled exponent NXT * y * log2(x). */
#define MEXP	(NXT*16384.0L)
/* The following if denormal numbers are supported, else -MEXP: */
#define MNEXP	(-NXT*(16384.0L+64.0L))

/* log2(e) - 1 */
#define LOG2EA	0.44269504088896340735992L

/*
 * Names used by powl() for its extended-precision products.  They alias
 * the scratch variables W, Wa, Wb and u; note that Ha and Hb share Wb.
 */
#define F	W
#define Fa	Wa
#define Fb	Wb
#define G	W
#define Ga	Wa
#define Gb	u
#define H	W
#define Ha	Wb
#define Hb	Wb
6813d08fSMatt Macy
/* Natural-log thresholds powil() compares its estimated log(result) against. */
static const long double MAXLOGL = 1.1356523406294143949492E4L;
static const long double MINLOGL = -1.13994985314888605586758E4L;
/* ln(2) */
static const long double LOGE2L = 6.9314718055994530941723E-1L;

/* Per-thread scratch storage shared by the steps of powl(). */
static _Thread_local volatile long double z;
static _Thread_local long double w, W, Wa, Wb, ya, yb, u;

/*
 * huge * huge and twom10000 * twom10000 are the overflow and underflow
 * return expressions.  twom10000 is volatile rather than const:
 * XXX Prevent gcc from erroneously constant folding this.
 */
static const long double huge = 0x1p10000L;
static _Thread_local volatile long double twom10000 = 0x1p-10000L;

static long double reducl(long double);
static long double powil(long double, int);
6813d08fSMatt Macy
6813d08fSMatt Macylong double
6813d08fSMatt Macypowl(long double x, long double y)
6813d08fSMatt Macy{
6813d08fSMatt Macy/* double F, Fa, Fb, G, Ga, Gb, H, Ha, Hb */
6813d08fSMatt Macyint i, nflg, iyflg, yoddint;
6813d08fSMatt Macylong e;
6813d08fSMatt Macy
6813d08fSMatt Macyif( y == 0.0L )
6813d08fSMatt Macy	return( 1.0L );
6813d08fSMatt Macy
6813d08fSMatt Macyif( x == 1.0L )
6813d08fSMatt Macy	return( 1.0L );
6813d08fSMatt Macy
6813d08fSMatt Macyif( isnan(x) )
6f1b8a07SBruce Evans	return ( nan_mix(x, y) );
6813d08fSMatt Macyif( isnan(y) )
6f1b8a07SBruce Evans	return ( nan_mix(x, y) );
6813d08fSMatt Macy
6813d08fSMatt Macyif( y == 1.0L )
6813d08fSMatt Macy	return( x );
6813d08fSMatt Macy
6813d08fSMatt Macyif( !isfinite(y) && x == -1.0L )
6813d08fSMatt Macy	return( 1.0L );
6813d08fSMatt Macy
6813d08fSMatt Macyif( y >= LDBL_MAX )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	if( x > 1.0L )
6813d08fSMatt Macy		return( INFINITY );
6813d08fSMatt Macy	if( x > 0.0L && x < 1.0L )
6813d08fSMatt Macy		return( 0.0L );
6813d08fSMatt Macy	if( x < -1.0L )
6813d08fSMatt Macy		return( INFINITY );
6813d08fSMatt Macy	if( x > -1.0L && x < 0.0L )
6813d08fSMatt Macy		return( 0.0L );
6813d08fSMatt Macy	}
6813d08fSMatt Macyif( y <= -LDBL_MAX )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	if( x > 1.0L )
6813d08fSMatt Macy		return( 0.0L );
6813d08fSMatt Macy	if( x > 0.0L && x < 1.0L )
6813d08fSMatt Macy		return( INFINITY );
6813d08fSMatt Macy	if( x < -1.0L )
6813d08fSMatt Macy		return( 0.0L );
6813d08fSMatt Macy	if( x > -1.0L && x < 0.0L )
6813d08fSMatt Macy		return( INFINITY );
6813d08fSMatt Macy	}
6813d08fSMatt Macyif( x >= LDBL_MAX )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	if( y > 0.0L )
6813d08fSMatt Macy		return( INFINITY );
6813d08fSMatt Macy	return( 0.0L );
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macyw = floorl(y);
6813d08fSMatt Macy/* Set iyflg to 1 if y is an integer.  */
6813d08fSMatt Macyiyflg = 0;
6813d08fSMatt Macyif( w == y )
6813d08fSMatt Macy	iyflg = 1;
6813d08fSMatt Macy
6813d08fSMatt Macy/* Test for odd integer y.  */
6813d08fSMatt Macyyoddint = 0;
6813d08fSMatt Macyif( iyflg )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	ya = fabsl(y);
6813d08fSMatt Macy	ya = floorl(0.5L * ya);
6813d08fSMatt Macy	yb = 0.5L * fabsl(w);
6813d08fSMatt Macy	if( ya != yb )
6813d08fSMatt Macy		yoddint = 1;
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macyif( x <= -LDBL_MAX )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	if( y > 0.0L )
6813d08fSMatt Macy		{
6813d08fSMatt Macy		if( yoddint )
6813d08fSMatt Macy			return( -INFINITY );
6813d08fSMatt Macy		return( INFINITY );
6813d08fSMatt Macy		}
6813d08fSMatt Macy	if( y < 0.0L )
6813d08fSMatt Macy		{
6813d08fSMatt Macy		if( yoddint )
6813d08fSMatt Macy			return( -0.0L );
6813d08fSMatt Macy		return( 0.0 );
6813d08fSMatt Macy		}
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macy
6813d08fSMatt Macynflg = 0;	/* flag = 1 if x<0 raised to integer power */
6813d08fSMatt Macyif( x <= 0.0L )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	if( x == 0.0L )
6813d08fSMatt Macy		{
6813d08fSMatt Macy		if( y < 0.0 )
6813d08fSMatt Macy			{
6813d08fSMatt Macy			if( signbit(x) && yoddint )
6813d08fSMatt Macy				return( -INFINITY );
6813d08fSMatt Macy			return( INFINITY );
6813d08fSMatt Macy			}
6813d08fSMatt Macy		if( y > 0.0 )
6813d08fSMatt Macy			{
6813d08fSMatt Macy			if( signbit(x) && yoddint )
6813d08fSMatt Macy				return( -0.0L );
6813d08fSMatt Macy			return( 0.0 );
6813d08fSMatt Macy			}
6813d08fSMatt Macy		if( y == 0.0L )
6813d08fSMatt Macy			return( 1.0L );  /*   0**0   */
6813d08fSMatt Macy		else
6813d08fSMatt Macy			return( 0.0L );  /*   0**y   */
6813d08fSMatt Macy		}
6813d08fSMatt Macy	else
6813d08fSMatt Macy		{
6813d08fSMatt Macy		if( iyflg == 0 )
6813d08fSMatt Macy			return (x - x) / (x - x); /* (x<0)**(non-int) is NaN */
6813d08fSMatt Macy		nflg = 1;
6813d08fSMatt Macy		}
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macy/* Integer power of an integer.  */
6813d08fSMatt Macy
6813d08fSMatt Macyif( iyflg )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	i = w;
6813d08fSMatt Macy	w = floorl(x);
6813d08fSMatt Macy	if( (w == x) && (fabsl(y) < 32768.0) )
6813d08fSMatt Macy		{
6813d08fSMatt Macy		w = powil( x, (int) y );
6813d08fSMatt Macy		return( w );
6813d08fSMatt Macy		}
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macy
6813d08fSMatt Macyif( nflg )
6813d08fSMatt Macy	x = fabsl(x);
6813d08fSMatt Macy
6813d08fSMatt Macy/* separate significand from exponent */
6813d08fSMatt Macyx = frexpl( x, &i );
6813d08fSMatt Macye = i;
6813d08fSMatt Macy
6813d08fSMatt Macy/* find significand in antilog table A[] */
6813d08fSMatt Macyi = 1;
6813d08fSMatt Macyif( x <= douba(17) )
6813d08fSMatt Macy	i = 17;
6813d08fSMatt Macyif( x <= douba(i+8) )
6813d08fSMatt Macy	i += 8;
6813d08fSMatt Macyif( x <= douba(i+4) )
6813d08fSMatt Macy	i += 4;
6813d08fSMatt Macyif( x <= douba(i+2) )
6813d08fSMatt Macy	i += 2;
6813d08fSMatt Macyif( x >= douba(1) )
6813d08fSMatt Macy	i = -1;
6813d08fSMatt Macyi += 1;
6813d08fSMatt Macy
6813d08fSMatt Macy
6813d08fSMatt Macy/* Find (x - A[i])/A[i]
6813d08fSMatt Macy * in order to compute log(x/A[i]):
6813d08fSMatt Macy *
6813d08fSMatt Macy * log(x) = log( a x/a ) = log(a) + log(x/a)
6813d08fSMatt Macy *
6813d08fSMatt Macy * log(x/a) = log(1+v),  v = x/a - 1 = (x-a)/a
6813d08fSMatt Macy */
6813d08fSMatt Macyx -= douba(i);
6813d08fSMatt Macyx -= doubb(i/2);
6813d08fSMatt Macyx /= douba(i);
6813d08fSMatt Macy
6813d08fSMatt Macy
6813d08fSMatt Macy/* rational approximation for log(1+v):
6813d08fSMatt Macy *
6813d08fSMatt Macy * log(1+v)  =  v  -  v**2/2  +  v**3 P(v) / Q(v)
6813d08fSMatt Macy */
6813d08fSMatt Macyz = x*x;
6813d08fSMatt Macyw = x * ( z * __polevll( x, P, 3 ) / __p1evll( x, Q, 3 ) );
6813d08fSMatt Macyw = w - ldexpl( z, -1 );   /*  w - 0.5 * z  */
6813d08fSMatt Macy
6813d08fSMatt Macy/* Convert to base 2 logarithm:
6813d08fSMatt Macy * multiply by log2(e) = 1 + LOG2EA
6813d08fSMatt Macy */
6813d08fSMatt Macyz = LOG2EA * w;
6813d08fSMatt Macyz += w;
6813d08fSMatt Macyz += LOG2EA * x;
6813d08fSMatt Macyz += x;
6813d08fSMatt Macy
6813d08fSMatt Macy/* Compute exponent term of the base 2 logarithm. */
6813d08fSMatt Macyw = -i;
6813d08fSMatt Macyw = ldexpl( w, -LNXT );	/* divide by NXT */
6813d08fSMatt Macyw += e;
6813d08fSMatt Macy/* Now base 2 log of x is w + z. */
6813d08fSMatt Macy
6813d08fSMatt Macy/* Multiply base 2 log by y, in extended precision. */
6813d08fSMatt Macy
6813d08fSMatt Macy/* separate y into large part ya
6813d08fSMatt Macy * and small part yb less than 1/NXT
6813d08fSMatt Macy */
6813d08fSMatt Macyya = reducl(y);
6813d08fSMatt Macyyb = y - ya;
6813d08fSMatt Macy
6813d08fSMatt Macy/* (w+z)(ya+yb)
6813d08fSMatt Macy * = w*ya + w*yb + z*y
6813d08fSMatt Macy */
6813d08fSMatt MacyF = z * y  +  w * yb;
6813d08fSMatt MacyFa = reducl(F);
6813d08fSMatt MacyFb = F - Fa;
6813d08fSMatt Macy
6813d08fSMatt MacyG = Fa + w * ya;
6813d08fSMatt MacyGa = reducl(G);
6813d08fSMatt MacyGb = G - Ga;
6813d08fSMatt Macy
6813d08fSMatt MacyH = Fb + Gb;
6813d08fSMatt MacyHa = reducl(H);
6813d08fSMatt Macyw = ldexpl( Ga+Ha, LNXT );
6813d08fSMatt Macy
6813d08fSMatt Macy/* Test the power of 2 for overflow */
6813d08fSMatt Macyif( w > MEXP )
6813d08fSMatt Macy	return (huge * huge);		/* overflow */
6813d08fSMatt Macy
6813d08fSMatt Macyif( w < MNEXP )
6813d08fSMatt Macy	return (twom10000 * twom10000);	/* underflow */
6813d08fSMatt Macy
6813d08fSMatt Macye = w;
6813d08fSMatt MacyHb = H - Ha;
6813d08fSMatt Macy
6813d08fSMatt Macyif( Hb > 0.0L )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	e += 1;
6813d08fSMatt Macy	Hb -= (1.0L/NXT);  /*0.0625L;*/
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macy/* Now the product y * log2(x)  =  Hb + e/NXT.
6813d08fSMatt Macy *
6813d08fSMatt Macy * Compute base 2 exponential of Hb,
6813d08fSMatt Macy * where -0.0625 <= Hb <= 0.
6813d08fSMatt Macy */
6813d08fSMatt Macyz = Hb * __polevll( Hb, R, 6 );  /*    z  =  2**Hb - 1    */
6813d08fSMatt Macy
6813d08fSMatt Macy/* Express e/NXT as an integer plus a negative number of (1/NXT)ths.
6813d08fSMatt Macy * Find lookup table entry for the fractional power of 2.
6813d08fSMatt Macy */
6813d08fSMatt Macyif( e < 0 )
6813d08fSMatt Macy	i = 0;
6813d08fSMatt Macyelse
6813d08fSMatt Macy	i = 1;
6813d08fSMatt Macyi = e/NXT + i;
6813d08fSMatt Macye = NXT*i - e;
6813d08fSMatt Macyw = douba( e );
6813d08fSMatt Macyz = w * z;      /*    2**-e * ( 1 + (2**Hb-1) )    */
6813d08fSMatt Macyz = z + w;
6813d08fSMatt Macyz = ldexpl( z, i );  /* multiply by integer power of 2 */
6813d08fSMatt Macy
6813d08fSMatt Macyif( nflg )
6813d08fSMatt Macy	{
6813d08fSMatt Macy/* For negative x,
6813d08fSMatt Macy * find out if the integer exponent
6813d08fSMatt Macy * is odd or even.
6813d08fSMatt Macy */
6813d08fSMatt Macy	w = ldexpl( y, -1 );
6813d08fSMatt Macy	w = floorl(w);
6813d08fSMatt Macy	w = ldexpl( w, 1 );
6813d08fSMatt Macy	if( w != y )
6813d08fSMatt Macy		z = -z; /* odd exponent */
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macyreturn( z );
6813d08fSMatt Macy}
6813d08fSMatt Macy
6813d08fSMatt Macy
6813d08fSMatt Macy/* Find a multiple of 1/NXT that is within 1/NXT of x. */
5a4c3b83SDimitry Andricstatic inline long double
6813d08fSMatt Macyreducl(long double x)
6813d08fSMatt Macy{
6813d08fSMatt Macylong double t;
6813d08fSMatt Macy
6813d08fSMatt Macyt = ldexpl( x, LNXT );
6813d08fSMatt Macyt = floorl( t );
6813d08fSMatt Macyt = ldexpl( t, -LNXT );
6813d08fSMatt Macyreturn(t);
6813d08fSMatt Macy}
6813d08fSMatt Macy
6813d08fSMatt Macy/*							powil.c
6813d08fSMatt Macy *
6813d08fSMatt Macy *	Real raised to integer power, long double precision
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy * SYNOPSIS:
6813d08fSMatt Macy *
6813d08fSMatt Macy * long double x, y, powil();
6813d08fSMatt Macy * int n;
6813d08fSMatt Macy *
6813d08fSMatt Macy * y = powil( x, n );
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy * DESCRIPTION:
6813d08fSMatt Macy *
6813d08fSMatt Macy * Returns argument x raised to the nth power.
6813d08fSMatt Macy * The routine efficiently decomposes n as a sum of powers of
6813d08fSMatt Macy * two. The desired power is a product of two-to-the-kth
6813d08fSMatt Macy * powers of x.  Thus to compute the 32767 power of x requires
6813d08fSMatt Macy * 28 multiplications instead of 32767 multiplications.
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy * ACCURACY:
6813d08fSMatt Macy *
6813d08fSMatt Macy *
6813d08fSMatt Macy *                      Relative error:
6813d08fSMatt Macy * arithmetic   x domain   n domain  # trials      peak         rms
6813d08fSMatt Macy *    IEEE     .001,1000  -1022,1023  50000       4.3e-17     7.8e-18
6813d08fSMatt Macy *    IEEE        1,2     -1022,1023  20000       3.9e-17     7.6e-18
6813d08fSMatt Macy *    IEEE     .99,1.01     0,8700    10000       3.6e-16     7.2e-17
6813d08fSMatt Macy *
 * Returns infinity on overflow, zero on underflow.
6813d08fSMatt Macy *
6813d08fSMatt Macy */
6813d08fSMatt Macy
6813d08fSMatt Macystatic long double
6813d08fSMatt Macypowil(long double x, int nn)
6813d08fSMatt Macy{
6813d08fSMatt Macylong double ww, y;
6813d08fSMatt Macylong double s;
6813d08fSMatt Macyint n, e, sign, asign, lx;
6813d08fSMatt Macy
6813d08fSMatt Macyif( x == 0.0L )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	if( nn == 0 )
6813d08fSMatt Macy		return( 1.0L );
6813d08fSMatt Macy	else if( nn < 0 )
6813d08fSMatt Macy		return( LDBL_MAX );
6813d08fSMatt Macy	else
6813d08fSMatt Macy		return( 0.0L );
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macyif( nn == 0 )
6813d08fSMatt Macy	return( 1.0L );
6813d08fSMatt Macy
6813d08fSMatt Macy
6813d08fSMatt Macyif( x < 0.0L )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	asign = -1;
6813d08fSMatt Macy	x = -x;
6813d08fSMatt Macy	}
6813d08fSMatt Macyelse
6813d08fSMatt Macy	asign = 0;
6813d08fSMatt Macy
6813d08fSMatt Macy
6813d08fSMatt Macyif( nn < 0 )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	sign = -1;
6813d08fSMatt Macy	n = -nn;
6813d08fSMatt Macy	}
6813d08fSMatt Macyelse
6813d08fSMatt Macy	{
6813d08fSMatt Macy	sign = 1;
6813d08fSMatt Macy	n = nn;
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macy/* Overflow detection */
6813d08fSMatt Macy
6813d08fSMatt Macy/* Calculate approximate logarithm of answer */
6813d08fSMatt Macys = x;
6813d08fSMatt Macys = frexpl( s, &lx );
6813d08fSMatt Macye = (lx - 1)*n;
6813d08fSMatt Macyif( (e == 0) || (e > 64) || (e < -64) )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	s = (s - 7.0710678118654752e-1L) / (s +  7.0710678118654752e-1L);
6813d08fSMatt Macy	s = (2.9142135623730950L * s - 0.5L + lx) * nn * LOGE2L;
6813d08fSMatt Macy	}
6813d08fSMatt Macyelse
6813d08fSMatt Macy	{
6813d08fSMatt Macy	s = LOGE2L * e;
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macyif( s > MAXLOGL )
6813d08fSMatt Macy	return (huge * huge);		/* overflow */
6813d08fSMatt Macy
6813d08fSMatt Macyif( s < MINLOGL )
6813d08fSMatt Macy	return (twom10000 * twom10000);	/* underflow */
6813d08fSMatt Macy/* Handle tiny denormal answer, but with less accuracy
6813d08fSMatt Macy * since roundoff error in 1.0/x will be amplified.
6813d08fSMatt Macy * The precise demarcation should be the gradual underflow threshold.
6813d08fSMatt Macy */
6813d08fSMatt Macyif( s < (-MAXLOGL+2.0L) )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	x = 1.0L/x;
6813d08fSMatt Macy	sign = -sign;
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macy/* First bit of the power */
6813d08fSMatt Macyif( n & 1 )
6813d08fSMatt Macy	y = x;
6813d08fSMatt Macy
6813d08fSMatt Macyelse
6813d08fSMatt Macy	{
6813d08fSMatt Macy	y = 1.0L;
6813d08fSMatt Macy	asign = 0;
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macyww = x;
6813d08fSMatt Macyn >>= 1;
6813d08fSMatt Macywhile( n )
6813d08fSMatt Macy	{
6813d08fSMatt Macy	ww = ww * ww;	/* arg to the 2-to-the-kth power */
6813d08fSMatt Macy	if( n & 1 )	/* if that bit is set, then include in product */
6813d08fSMatt Macy		y *= ww;
6813d08fSMatt Macy	n >>= 1;
6813d08fSMatt Macy	}
6813d08fSMatt Macy
6813d08fSMatt Macyif( asign )
6813d08fSMatt Macy	y = -y; /* odd power of negative number */
6813d08fSMatt Macyif( sign < 0 )
6813d08fSMatt Macy	y = 1.0L/y;
6813d08fSMatt Macyreturn(y);
6813d08fSMatt Macy}