/* libm/common_source/pow.c */

/*
 * Copyright (c) 1985 Regents of the University of California.
 *
 * Use and reproduction of this software are granted  in  accordance  with
 * the terms and conditions specified in  the  Berkeley  Software  License
 * Agreement (in particular, this entails acknowledgement of the programs'
 * source, and inclusion of this notice) with the additional understanding
 * that  all  recipients  should regard themselves as participants  in  an
 * ongoing  research  project and hence should  feel  obligated  to report
 * their  experiences (good or bad) with these elementary function  codes,
 * using "sendbug 4bsd-bugs@BERKELEY", to the authors.
 */

/* SCCS identification string; omitted when the file is processed by lint. */
#ifndef lint
static char sccsid[] = "@(#)pow.c	1.1 (ELEFUNT) 09/06/85";
#endif /* not lint */

/* POW(X,Y)
 * RETURN X**Y
 * DOUBLE PRECISION (VAX D format 56 bits, IEEE DOUBLE 53 BITS)
 * CODED IN C BY K.C. NG, 1/8/85;
 * REVISED BY K.C. NG on 7/10/85.
 *
 * Required system supported functions:
 *      scalb(x,n)
 *      logb(x)
 *	copysign(x,y)
 *	finite(x)
 *	drem(x,y)
 *
 * Required kernel functions:
 *	exp__E(a,c)	...return  exp(a+c) - 1 - a
 *	log__L(x)	...return  (log(1+x) - 2s)/s, s=x/(2+x)
 *	pow_p(x,y)	...return  +(anything)**(finite non zero)
 *
 * Method
 *	1. Compute and return log(x) in three pieces:
 *		log(x) = n*ln2 + hi + lo,
 *	   where n is an integer.
 *	2. Perform y*log(x) by simulating multi-precision arithmetic and
 *	   return the answer in three pieces:
 *		y*log(x) = m*ln2 + hi + lo,
 *	   where m is an integer.
 *	3. Return x**y = exp(y*log(x))
 *		= 2^m * ( exp(hi+lo) ).
 *
 * Special cases:
 *	(anything) ** 0  is 1 ;
 *	(anything) ** 1  is itself;
 *	(anything) ** NaN is NaN;
 *	NaN ** (anything except 0) is NaN;
 *	+-(anything > 1) ** +INF is +INF;
 *	+-(anything > 1) ** -INF is +0;
 *	+-(anything < 1) ** +INF is +0;
 *	+-(anything < 1) ** -INF is +INF;
 *	+-1 ** +-INF is NaN and signal INVALID;
 *	+0 ** +(anything except 0, NaN)  is +0;
 *	-0 ** +(anything except 0, NaN, odd integer)  is +0;
 *	+0 ** -(anything except 0, NaN)  is +INF and signal DIV-BY-ZERO;
 *	-0 ** -(anything except 0, NaN, odd integer)  is +INF with signal;
 *	-0 ** (odd integer) = -( +0 ** (odd integer) );
 *	+INF ** +(anything except 0,NaN) is +INF;
 *	+INF ** -(anything except 0,NaN) is +0;
 *	-INF ** (odd integer) = -( +INF ** (odd integer) );
 *	-INF ** (even integer) = ( +INF ** (even integer) );
 *	-INF ** -(anything except integer,NaN) is NaN with signal;
 *	-(x=anything) ** (k=integer) is (-1)**k * (x ** k);
 *	-(anything except 0) ** (non-integer) is NaN with signal;
 *
 * Accuracy:
 *	pow(x,y) returns x**y nearly rounded. In particular, on a SUN, a VAX,
 *	and a Zilog Z8000,
 *			pow(integer,integer)
 *	always returns the correct integer provided it is representable.
 *	In a test run with 100,000 random arguments with 0 < x, y < 20.0
 *	on a VAX, the maximum observed error was 1.79 ulps (units in the
 *	last place).
 *
 * Constants :
 * The hexadecimal values are the intended ones for the following constants.
 * The decimal values may be used, provided that the compiler will convert
 * from decimal to binary accurately enough to produce the hexadecimal values
 * shown.
 */

/*
 * Working constants.
 *
 *   ln2hi + ln2lo  together represent ln(2); per the hex values shown,
 *                  ln2hi holds the leading bits (its trailing hex digits
 *                  are zero) and ln2lo holds the remainder.
 *   invln2         1/ln(2)
 *   sqrt2          sqrt(2)
 *
 * On the VAX the constants are spelled out as the raw bit patterns of the
 * D-format values and read back through a double pointer; elsewhere the
 * decimal literals are used.
 * NOTE(review): the VAX overlay presumably relies on long being 32 bits so
 * that two longs cover one double -- confirm before reusing on another ABI.
 */
#ifdef VAX	/* VAX D format */
#include <errno.h>
extern double infnan();

/* double static */
/* ln2hi  =  6.9314718055829871446E-1    , Hex  2^  0   *  .B17217F7D00000 */
/* ln2lo  =  1.6465949582897081279E-12   , Hex  2^-39   *  .E7BCD5E4F1D9CC */
/* invln2 =  1.4426950408889634148E0     , Hex  2^  1   *  .B8AA3B295C17F1 */
/* sqrt2  =  1.4142135623730950622E0     ; Hex  2^  1   *  .B504F333F9DE65 */
static long     ln2hix[] = { 0x72174031, 0x0000f7d0};
static long     ln2lox[] = { 0xbcd52ce7, 0xd9cce4f1};
static long    invln2x[] = { 0xaa3b40b8, 0x17f1295c};
static long     sqrt2x[] = { 0x04f340b5, 0xde6533f9};
#define    ln2hi    (*(double*)ln2hix)
#define    ln2lo    (*(double*)ln2lox)
#define   invln2    (*(double*)invln2x)
#define    sqrt2    (*(double*)sqrt2x)
#else	/* IEEE double */
static double
ln2hi  =  6.9314718036912381649E-1    , /*Hex  2^ -1   *  1.62E42FEE00000 */
ln2lo  =  1.9082149292705877000E-10   , /*Hex  2^-33   *  1.A39EF35793C76 */
invln2 =  1.4426950408889633870E0     , /*Hex  2^  0   *  1.71547652B82FE */
sqrt2  =  1.4142135623730951455E0     ; /*Hex  2^  0   *  1.6A09E667F3BCD */
#endif

/* Small exact constants shared by pow() and pow_p(). */
static double zero=0.0, half=1.0/2.0, one=1.0, two=2.0, negone= -1.0;

*24605Szliudouble pow(x,y)
*24605Szliudouble x,y;
*24605Szliu{
*24605Szliu	double drem(),pow_p(),copysign(),t;
*24605Szliu	int finite();
*24605Szliu
*24605Szliu	if     (y==zero)      return(one);
*24605Szliu	else if(y==one
*24605Szliu#ifndef VAX
*24605Szliu		||x!=x
*24605Szliu#endif
*24605Szliu		) return( x );      /* if x is NaN or y=1 */
*24605Szliu#ifndef VAX
*24605Szliu	else if(y!=y)         return( y );      /* if y is NaN */
*24605Szliu#endif
*24605Szliu	else if(!finite(y))                     /* if y is INF */
*24605Szliu	     if((t=copysign(x,one))==one) return(zero/zero);
*24605Szliu	     else if(t>one) return((y>zero)?y:zero);
*24605Szliu	     else return((y<zero)?-y:zero);
*24605Szliu	else if(y==two)       return(x*x);
*24605Szliu	else if(y==negone)    return(one/x);
*24605Szliu
*24605Szliu    /* sign(x) = 1 */
*24605Szliu	else if(copysign(one,x)==one) return(pow_p(x,y));
*24605Szliu
*24605Szliu    /* sign(x)= -1 */
*24605Szliu	/* if y is an even integer */
*24605Szliu	else if ( (t=drem(y,two)) == zero)	return( pow_p(-x,y) );
*24605Szliu
*24605Szliu	/* if y is an odd integer */
*24605Szliu	else if (copysign(t,one) == one) return( -pow_p(-x,y) );
*24605Szliu
*24605Szliu	/* Henceforth y is not an integer */
*24605Szliu	else if(x==zero)	/* x is -0 */
*24605Szliu	    return((y>zero)?-x:one/(-x));
*24605Szliu	else {			/* return NaN */
*24605Szliu#ifdef VAX
*24605Szliu	    return (infnan(EDOM));	/* NaN */
*24605Szliu#else	/* IEEE double */
*24605Szliu	    return(zero/zero);
*24605Szliu#endif
*24605Szliu	}
*24605Szliu}
*24605Szliu
*24605Szliu/* pow_p(x,y) return x**y for x with sign=1 and finite y */
*24605Szliustatic double pow_p(x,y)
*24605Szliudouble x,y;
*24605Szliu{
*24605Szliu        double logb(),scalb(),copysign(),log__L(),exp__E();
*24605Szliu        double c,s,t,z,tx,ty;
*24605Szliu        float sx,sy;
*24605Szliu	long k=0;
*24605Szliu        int n,m;
*24605Szliu
*24605Szliu	if(x==zero||!finite(x)) {           /* if x is +INF or +0 */
*24605Szliu#ifdef VAX
*24605Szliu	     return((y>zero)?x:infnan(ERANGE));	/* if y<zero, return +INF */
*24605Szliu#else
*24605Szliu	     return((y>zero)?x:one/x);
*24605Szliu#endif
*24605Szliu	}
*24605Szliu	if(x==1.0) return(x);	/* if x=1.0, return 1 since y is finite */
*24605Szliu
*24605Szliu    /* reduce x to z in [sqrt(1/2)-1, sqrt(2)-1] */
*24605Szliu        z=scalb(x,-(n=logb(x)));
*24605Szliu#ifndef VAX	/* IEEE double */	/* subnormal number */
*24605Szliu        if(n <= -1022) {n += (m=logb(z)); z=scalb(z,-m);}
*24605Szliu#endif
*24605Szliu        if(z >= sqrt2 ) {n += 1; z *= half;}  z -= one ;
*24605Szliu
*24605Szliu    /* log(x) = nlog2+log(1+z) ~ nlog2 + t + tx */
*24605Szliu	s=z/(two+z); c=z*z*half; tx=s*(c+log__L(s*s));
*24605Szliu	t= z-(c-tx); tx += (z-t)-c;
*24605Szliu
*24605Szliu   /* if y*log(x) is neither too big nor too small */
*24605Szliu	if((s=logb(y)+logb(n+t)) < 12.0)
*24605Szliu	    if(s>-60.0) {
*24605Szliu
*24605Szliu	/* compute y*log(x) ~ mlog2 + t + c */
*24605Szliu        	s=y*(n+invln2*t);
*24605Szliu                m=s+copysign(half,s);   /* m := nint(y*log(x)) */
*24605Szliu		k=y;
*24605Szliu		if((double)k==y) {	/* if y is an integer */
*24605Szliu		    k = m-k*n;
*24605Szliu		    sx=t; tx+=(t-sx); }
*24605Szliu		else	{		/* if y is not an integer */
*24605Szliu		    k =m;
*24605Szliu	 	    tx+=n*ln2lo;
*24605Szliu		    sx=(c=n*ln2hi)+t; tx+=(c-sx)+t; }
*24605Szliu	   /* end of checking whether k==y */
*24605Szliu
*24605Szliu                sy=y; ty=y-sy;          /* y ~ sy + ty */
*24605Szliu		s=(double)sx*sy-k*ln2hi;        /* (sy+ty)*(sx+tx)-kln2 */
*24605Szliu		z=(tx*ty-k*ln2lo);
*24605Szliu		tx=tx*sy; ty=sx*ty;
*24605Szliu		t=ty+z; t+=tx; t+=s;
*24605Szliu		c= -((((t-s)-tx)-ty)-z);
*24605Szliu
*24605Szliu	    /* return exp(y*log(x)) */
*24605Szliu		t += exp__E(t,c); return(scalb(one+t,m));
*24605Szliu	     }
*24605Szliu	/* end of if log(y*log(x)) > -60.0 */
*24605Szliu
*24605Szliu	    else
*24605Szliu		/* exp(+- tiny) = 1 with inexact flag */
*24605Szliu			{ln2hi+ln2lo; return(one);}
*24605Szliu	    else if(copysign(one,y)*(n+invln2*t) <zero)
*24605Szliu		/* exp(-(big#)) underflows to zero */
*24605Szliu	        	return(scalb(one,-5000));
*24605Szliu	    else
*24605Szliu	        /* exp(+(big#)) overflows to INF */
*24605Szliu	    		return(scalb(one, 5000));
*24605Szliu
*24605Szliu}