/* xref: /csrg-svn/lib/libm/common_source/exp.c (revision 31812) */
/*
 * Copyright (c) 1985 Regents of the University of California.
 *
 * Use and reproduction of this software are granted  in  accordance  with
 * the terms and conditions specified in  the  Berkeley  Software  License
 * Agreement (in particular, this entails acknowledgement of the programs'
 * source, and inclusion of this notice) with the additional understanding
 * that  all  recipients  should regard themselves as participants  in  an
 * ongoing  research  project and hence should  feel  obligated  to report
 * their  experiences (good or bad) with these elementary function  codes,
 * using "sendbug 4bsd-bugs@BERKELEY", to the authors.
 */

#ifndef lint
/* SCCS version identification string (note the "@(#)" marker); omitted under lint. */
static char sccsid[] =
"@(#)exp.c	4.3 (Berkeley) 8/21/85; 1.7 (ucb.elefunt) 07/10/87";
#endif /* not lint */

/* EXP(X)
 * RETURN THE EXPONENTIAL OF X
 * DOUBLE PRECISION (IEEE 53 bits, VAX D FORMAT 56 BITS)
 * CODED IN C BY K.C. NG, 1/19/85;
 * REVISED BY K.C. NG on 2/6/85, 2/15/85, 3/7/85, 3/24/85, 4/16/85, 6/14/86.
 *
 * Required system supported functions:
 *	scalb(x,n)
 *	copysign(x,y)
 *	finite(x)
 *
 * Method:
 *	1. Argument Reduction: given the input x, find r and integer k such
 *	   that
 *	                   x = k*ln2 + r,  |r| <= 0.5*ln2 .
 *	   r will be represented as r := hi-lo for better accuracy.
 *
 *	2. Compute exp(r) by
 *
 *		exp(r) = 1 + r + r*R1/(2-R1),
 *	   where
 *		R1 = r - r^2*(p1+r^2*(p2+r^2*(p3+r^2*(p4+p5*r^2)))).
 *
 *	3. exp(x) = 2^k * exp(r) .
 *
 * Special cases:
 *	exp(INF) is INF, exp(NaN) is NaN;
 *	exp(-INF)=  0;
 *	for finite argument, only exp(0)=1 is exact.
 *
 * Accuracy:
 *	exp(x) returns the exponential of x nearly rounded. In a test run
 *	with 1,156,000 random arguments on a VAX, the maximum observed
 *	error was 0.869 ulps (units in the last place).
 *
 * Constants:
 * The hexadecimal values are the intended ones for the following constants.
 * The decimal values may be used, provided that the compiler will convert
 * from decimal to binary accurately enough to produce the hexadecimal values
 * shown.
 */

#if (defined(VAX)||defined(TAHOE))	/* VAX D format */
/*
 * _0x(A,B) glues two 4-hex-digit halves into one 8-hex-digit literal.
 * The halves are pasted in the order A,B when VAX is defined and in the
 * order B,A otherwise (TAHOE).
 *
 * Pre-ANSI preprocessors paste tokens by deleting an empty comment placed
 * between them.  ANSI/ISO preprocessors replace a comment with white
 * space, which would split the literal, so the ## operator is used
 * whenever __STDC__ is defined.
 */
#if defined(__STDC__)
#ifdef VAX
#define _0x(A,B)	0x##A##B
#else	/* VAX */
#define _0x(A,B)	0x##B##A
#endif	/* VAX */
#else	/* __STDC__ */
#ifdef VAX
#define _0x(A,B)	0x/**/A/**/B
#else	/* VAX */
#define _0x(A,B)	0x/**/B/**/A
#endif	/* VAX */
#endif	/* __STDC__ */

/*
 * Intended values of the constants encoded in the word pairs below:
 *
 * ln2hi  =  6.9314718055829871446E-1    , Hex  2^  0   *  .B17217F7D00000
 * ln2lo  =  1.6465949582897081279E-12   , Hex  2^-39   *  .E7BCD5E4F1D9CC
 * lnhuge =  9.4961163736712506989E1     , Hex  2^  7   *  .BDEC1DA73E9010
 * lntiny = -9.5654310917272452386E1     , Hex  2^  7   * -.BF4F01D72E33AF
 * invln2 =  1.4426950408889634148E0     ; Hex  2^  1   *  .B8AA3B295C17F1
 * p1     =  1.6666666666666602251E-1    , Hex  2^-2    *  .AAAAAAAAAAA9F1
 * p2     = -2.7777777777015591216E-3    , Hex  2^-8    * -.B60B60B5F5EC94
 * p3     =  6.6137563214379341918E-5    , Hex  2^-13   *  .8AB355792EF15F
 * p4     = -1.6533902205465250480E-6    , Hex  2^-19   * -.DDEA0E2E935F84
 * p5     =  4.1381367970572387085E-8    , Hex  2^-24   *  .B1BB4B95F52683
 */
static long     ln2hix[] = { _0x(7217,4031), _0x(0000,f7d0)};
static long     ln2lox[] = { _0x(bcd5,2ce7), _0x(d9cc,e4f1)};
static long    lnhugex[] = { _0x(ec1d,43bd), _0x(9010,a73e)};
static long    lntinyx[] = { _0x(4f01,c3bf), _0x(33af,d72e)};
static long    invln2x[] = { _0x(aa3b,40b8), _0x(17f1,295c)};
static long        p1x[] = { _0x(aaaa,3f2a), _0x(a9f1,aaaa)};
static long        p2x[] = { _0x(0b60,bc36), _0x(ec94,b5f5)};
static long        p3x[] = { _0x(b355,398a), _0x(f15f,792e)};
static long        p4x[] = { _0x(ea0e,b6dd), _0x(5f84,2e93)};
static long        p5x[] = { _0x(bb4b,3431), _0x(2683,95f5)};

/* Each constant is read by viewing its pair of long words as one double. */
#define    ln2hi    (*(double*)ln2hix)
#define    ln2lo    (*(double*)ln2lox)
#define   lnhuge    (*(double*)lnhugex)
#define   lntiny    (*(double*)lntinyx)
#define   invln2    (*(double*)invln2x)
#define       p1    (*(double*)p1x)
#define       p2    (*(double*)p2x)
#define       p3    (*(double*)p3x)
#define       p4    (*(double*)p4x)
#define       p5    (*(double*)p5x)

#else	/* IEEE double */
/*
 * The decimal literals are expected to convert to the hexadecimal values
 * given alongside them.
 */
static double
p1     =  1.6666666666666601904E-1    , /*Hex  2^-3    *  1.555555555553E */
p2     = -2.7777777777015593384E-3    , /*Hex  2^-9    * -1.6C16C16BEBD93 */
p3     =  6.6137563214379343612E-5    , /*Hex  2^-14   *  1.1566AAF25DE2C */
p4     = -1.6533902205465251539E-6    , /*Hex  2^-20   * -1.BBD41C5D26BF1 */
p5     =  4.1381367970572384604E-8    , /*Hex  2^-25   *  1.6376972BEA4D0 */
ln2hi  =  6.9314718036912381649E-1    , /*Hex  2^ -1   *  1.62E42FEE00000 */
ln2lo  =  1.9082149292705877000E-10   , /*Hex  2^-33   *  1.A39EF35793C76 */
lnhuge =  7.1602103751842355450E2     , /*Hex  2^  9   *  1.6602B15B7ECF2 */
lntiny = -7.5137154372698068983E2     , /*Hex  2^  9   * -1.77AF8EBEAE354 */
invln2 =  1.4426950408889633870E0     ; /*Hex  2^  0   *  1.71547652B82FE */
#endif	/* VAX || TAHOE */

11324593Szliu double exp(x)
11424593Szliu double x;
11524593Szliu {
11629410Selefunt 	double scalb(), copysign(), z,hi,lo,c;
11724593Szliu 	int k,finite();
11824593Szliu 
11931790Szliu #if (!defined(VAX)&&!defined(TAHOE))
12024593Szliu 	if(x!=x) return(x);	/* x is NaN */
12124593Szliu #endif
12224593Szliu 	if( x <= lnhuge ) {
12324593Szliu 		if( x >= lntiny ) {
12424593Szliu 
12524593Szliu 		    /* argument reduction : x --> x - k*ln2 */
12624593Szliu 
12724593Szliu 			k=invln2*x+copysign(0.5,x);	/* k=NINT(x/ln2) */
12824593Szliu 
12929410Selefunt 		    /* express x-k*ln2 as hi-lo and let x=hi-lo rounded */
13029410Selefunt 
13124593Szliu 			hi=x-k*ln2hi;
13229410Selefunt 			x=hi-(lo=k*ln2lo);
13324593Szliu 
13429410Selefunt 		    /* return 2^k*[1+x+x*c/(2+c)]  */
13529410Selefunt 			z=x*x;
13629410Selefunt 			c= x - z*(p1+z*(p2+z*(p3+z*(p4+z*p5))));
13729890Selefunt 			return  scalb(1.0+(hi-(lo-(x*c)/(2.0-c))),k);
13829410Selefunt 
13924593Szliu 		}
14024593Szliu 		/* end of x > lntiny */
14124593Szliu 
14224593Szliu 		else
14324593Szliu 		     /* exp(-big#) underflows to zero */
14424593Szliu 		     if(finite(x))  return(scalb(1.0,-5000));
14524593Szliu 
14624593Szliu 		     /* exp(-INF) is zero */
14724593Szliu 		     else return(0.0);
14824593Szliu 	}
14924593Szliu 	/* end of x < lnhuge */
15024593Szliu 
15124593Szliu 	else
15224593Szliu 	/* exp(INF) is INF, exp(+big#) overflows to INF */
15324593Szliu 	    return( finite(x) ?  scalb(1.0,5000)  : x);
15424593Szliu }
155