/* libm/ieee/support.c */

/*
 * Copyright (c) 1985 Regents of the University of California.
 *
 * Use and reproduction of this software are granted  in  accordance  with
 * the terms and conditions specified in  the  Berkeley  Software  License
 * Agreement (in particular, this entails acknowledgement of the programs'
 * source, and inclusion of this notice) with the additional understanding
 * that  all  recipients  should regard themselves as participants  in  an
 * ongoing  research  project and hence should  feel  obligated  to report
 * their  experiences (good or bad) with these elementary function  codes,
 * using "sendbug 4bsd-bugs@BERKELEY", to the authors.
 */

#ifndef lint
/*
 * SCCS identification string for this file.  It is compiled in unless
 * "lint" is defined.
 */
static char sccsid[] =
"@(#)support.c	1.1 (Berkeley) 5/23/85; 1.3 (ucb.elefunt) 04/26/86";
#endif /* not lint */

/*
 * Some IEEE standard p754 recommended functions and remainder and sqrt for
 * supporting the C elementary functions.
 ******************************************************************************
 * WARNING:
 *      These codes are developed (in double) to support the C elementary
 * functions temporarily. They are not universal, and some of them are very
 * slow (in particular, drem and sqrt are extremely inefficient). Each
 * computer system should have its implementation of these functions using
 * its own assembler.
 ******************************************************************************
 *
 * IEEE p754 required operations:
 *     drem(x,p)
 *              returns  x REM p  =  x - [x/p]*p , where [x/p] is the integer
 *              nearest x/p; in half way case, choose the even one.
 *     sqrt(x)
 *              returns the square root of x correctly rounded according to
 *              the rounding mode.
 *
 * IEEE p754 recommended functions:
 * (a) copysign(x,y)
 *              returns x with the sign of y.
 * (b) scalb(x,N)
 *              returns  x * (2**N), for integer values N.
 * (c) logb(x)
 *              returns the unbiased exponent of x, a signed integer in
 *              double precision, except that logb(0) is -INF, logb(INF)
 *              is +INF, and logb(NAN) is that NAN.
 * (d) finite(x)
 *              returns the value TRUE if -INF < x < +INF and returns
 *              FALSE otherwise.
 *
 *
 * CODED IN C BY K.C. NG, 11/25/84;
 * REVISED BY K.C. NG on 1/22/85, 2/13/85, 3/24/85.
 */


/*
 * Format-dependent constants shared by the routines in this file.  The
 * masks apply to the 16-bit word of a double that the routines address
 * through an (unsigned) short pointer, i.e. the word holding the sign and
 * the exponent field.
 *
 *   msign   mask that clears the sign bit (~msign isolates it)
 *   mexp    mask that isolates the exponent field
 *   gap     shift count that right-justifies the exponent field
 *   bias    value subtracted from the exponent field by logb()
 *   prep1   power of two used to scale tiny/subnormal operands up
 *   novf    large value; novf+novf is used to generate overflow
 *   nunf    small value; nunf*nunf is used to generate underflow
 *   zero    0.0 kept in a variable (comparisons, zero/zero, 1.0/zero)
 */
#ifdef VAX      /* VAX D format */
static unsigned short msign = 0x7fff;
static unsigned short mexp  = 0x7f80;
static short prep1 = 57;
static short gap   = 7;
static short bias  = 129;
static double novf = 1.7E38;
static double nunf = 3.0E-39;
static double zero = 0.0;
#else           /* IEEE double format */
static unsigned short msign = 0x7fff;
static unsigned short mexp  = 0x7ff0;
static short prep1 = 54;
static short gap   = 4;
static short bias  = 1023;
static double novf = 1.7E308;
static double nunf = 3.0E-308;
static double zero = 0.0;
#endif

24581Szliudouble scalb(x,N)
24581Szliudouble x; int N;
24581Szliu{
24581Szliu        int k;
24581Szliu        double scalb();
24581Szliu
24581Szliu#ifdef NATIONAL
24581Szliu        unsigned short *px=(unsigned short *) &x + 3;
24581Szliu#else /* VAX, SUN, ZILOG */
24581Szliu        unsigned short *px=(unsigned short *) &x;
24581Szliu#endif
24581Szliu
24581Szliu        if( x == zero )  return(x);
24581Szliu
24581Szliu#ifdef VAX
24581Szliu        if( (k= *px & mexp ) != ~msign ) {
24581Szliu            if( N<-260) return(nunf*nunf); else if(N>260) return(novf+novf);
24581Szliu#else   /* IEEE */
24581Szliu        if( (k= *px & mexp ) != mexp ) {
24581Szliu            if( N<-2100) return(nunf*nunf); else if(N>2100) return(novf+novf);
24581Szliu            if( k == 0 ) {
24581Szliu                 x *= scalb(1.0,(int)prep1);  N -= prep1; return(scalb(x,N));}
24581Szliu#endif
24581Szliu
24581Szliu            if((k = (k>>gap)+ N) > 0 )
24581Szliu                if( k < (mexp>>gap) ) *px = (*px&~mexp) | (k<<gap);
24581Szliu                else x=novf+novf;               /* overflow */
24581Szliu            else
24581Szliu                if( k > -prep1 )
24581Szliu                                        /* gradual underflow */
24581Szliu                    {*px=(*px&~mexp)|(short)(1<<gap); x *= scalb(1.0,k-1);}
24581Szliu                else
24581Szliu                return(nunf*nunf);
24581Szliu            }
24581Szliu        return(x);
24581Szliu}
24581Szliu
24581Szliu
24581Szliudouble copysign(x,y)
24581Szliudouble x,y;
24581Szliu{
24581Szliu#ifdef NATIONAL
24581Szliu        unsigned short  *px=(unsigned short *) &x+3,
24581Szliu                        *py=(unsigned short *) &y+3;
24581Szliu#else /* VAX, SUN, ZILOG */
24581Szliu        unsigned short  *px=(unsigned short *) &x,
24581Szliu                        *py=(unsigned short *) &y;
24581Szliu#endif
24581Szliu
24581Szliu#ifdef VAX
24581Szliu        if ( (*px & mexp) == 0 ) return(x);
24581Szliu#endif
24581Szliu
24581Szliu        *px = ( *px & msign ) | ( *py & ~msign );
24581Szliu        return(x);
24581Szliu}
24581Szliu
24581Szliudouble logb(x)
24581Szliudouble x;
24581Szliu{
24581Szliu
24581Szliu#ifdef NATIONAL
24581Szliu        short *px=(short *) &x+3, k;
24581Szliu#else /* VAX, SUN, ZILOG */
24581Szliu        short *px=(short *) &x, k;
24581Szliu#endif
24581Szliu
24581Szliu#ifdef VAX
*27449Szliu        return (int)(((*px&mexp)>>gap)-bias);
24581Szliu#else /* IEEE */
24581Szliu        if( (k= *px & mexp ) != mexp )
24581Szliu            if ( k != 0 )
24581Szliu                return ( (k>>gap) - bias );
24581Szliu            else if( x != zero)
24581Szliu                return ( -1022.0 );
24581Szliu            else
24581Szliu                return(-(1.0/zero));
24581Szliu        else if(x != x)
24581Szliu            return(x);
24581Szliu        else
24581Szliu            {*px &= msign; return(x);}
24581Szliu#endif
24581Szliu}
24581Szliu
24581Szliufinite(x)
24581Szliudouble x;
24581Szliu{
24581Szliu#ifdef VAX
24581Szliu        return(1.0);
24581Szliu#else  /* IEEE */
24581Szliu#ifdef NATIONAL
24581Szliu        return( (*((short *) &x+3 ) & mexp ) != mexp );
24581Szliu#else /* SUN, ZILOG */
24581Szliu        return( (*((short *) &x ) & mexp ) != mexp );
24581Szliu#endif
24581Szliu#endif
24581Szliu}
24581Szliu
24581Szliudouble drem(x,p)
24581Szliudouble x,p;
24581Szliu{
24581Szliu        short sign;
24581Szliu        double hp,dp,tmp,drem(),scalb();
24581Szliu        unsigned short  k;
24581Szliu#ifdef NATIONAL
24581Szliu        unsigned short
24581Szliu              *px=(unsigned short *) &x  +3,
24581Szliu              *pp=(unsigned short *) &p  +3,
24581Szliu              *pd=(unsigned short *) &dp +3,
24581Szliu              *pt=(unsigned short *) &tmp+3;
24581Szliu#else /* VAX, SUN, ZILOG */
24581Szliu        unsigned short
24581Szliu              *px=(unsigned short *) &x  ,
24581Szliu              *pp=(unsigned short *) &p  ,
24581Szliu              *pd=(unsigned short *) &dp ,
24581Szliu              *pt=(unsigned short *) &tmp;
24581Szliu#endif
24581Szliu
24581Szliu        *pp &= msign ;
24581Szliu
24581Szliu#ifdef VAX
24581Szliu        if( ( *px & mexp ) == ~msign || p == zero )
24581Szliu#else /* IEEE */
24581Szliu        if( ( *px & mexp ) == mexp || p == zero )
24581Szliu#endif
24581Szliu
24581Szliu                return( (x != x)? x:zero/zero );
24581Szliu
24581Szliu        else  if ( ((*pp & mexp)>>gap) <= 1 )
24581Szliu                /* subnormal p, or almost subnormal p */
24581Szliu            { double b; b=scalb(1.0,(int)prep1);
24581Szliu              p *= b; x = drem(x,p); x *= b; return(drem(x,p)/b);}
24581Szliu        else  if ( p >= novf/2)
24581Szliu            { p /= 2 ; x /= 2; return(drem(x,p)*2);}
24581Szliu        else
24581Szliu            {
24581Szliu                dp=p+p; hp=p/2;
24581Szliu                sign= *px & ~msign ;
24581Szliu                *px &= msign       ;
24581Szliu                while ( x > dp )
24581Szliu                    {
24581Szliu                        k=(*px & mexp) - (*pd & mexp) ;
24581Szliu                        tmp = dp ;
24581Szliu                        *pt += k ;
24581Szliu
24581Szliu#ifdef VAX
24581Szliu                        if( x < tmp ) *pt -= 128 ;
24581Szliu#else /* IEEE */
24581Szliu                        if( x < tmp ) *pt -= 16 ;
24581Szliu#endif
24581Szliu
24581Szliu                        x -= tmp ;
24581Szliu                    }
24581Szliu                if ( x > hp )
24581Szliu                    { x -= p ;  if ( x >= hp ) x -= p ; }
24581Szliu
24581Szliu		*px = *px ^ sign;
24581Szliu                return( x);
24581Szliu
24581Szliu            }
24581Szliu}
/*
 * sqrt(x)
 *      Return the square root of x, generated one bit at a time and then
 *      rounded according to the rounding direction detected at run time.
 *
 * Special cases: NaN and +-0 are returned unchanged, a negative x yields
 * zero/zero, and a non-finite x (per finite()) is returned unchanged.
 *
 * The argument is scaled with logb()/scalb() to the range [1,4) with an
 * even exponent m; the root q of the scaled value is accumulated bit by
 * bit and the result is scalb(q, m/2).
 *
 * NOTE(review): the statement "100+r;" has no effect other than the
 * floating-point operation itself; it is there to raise the inexact flag
 * and relies on the compiler not discarding it.
 */
double sqrt(x)
double x;
{
        double q,s,b,r;
        double logb(),scalb();
        double t,zero=0.0;
        int m,n,i,finite();
#ifdef VAX
        int k=54;
#else   /* IEEE */
        int k=51;
#endif

    /* sqrt(NaN) is NaN, sqrt(+-0) = +-0 */
        if(x!=x||x==zero) return(x);

    /* sqrt(negative) is invalid */
        if(x<zero) return(zero/zero);

    /* sqrt(INF) is INF */
        if(!finite(x)) return(x);

    /* scale x to [1,4) */
        n=logb(x);
        x=scalb(x,-n);
        if((m=logb(x))!=0) x=scalb(x,-m);       /* subnormal number */
        m += n;
        n = m/2;
        if((n+n)!=m) {x *= 2; m -=1; n=m/2;}    /* make the exponent even */

    /* generate sqrt(x) bit by bit (accumulating in q) */
            q=1.0; s=4.0; x -= 1.0; r=1;
            for(i=1;i<=k;i++) {
                t=s+1; x *= 4; r /= 2;
                if(t<=x) {
                    s=t+t+2, x -= t; q += r;}
                else
                    s *= 2;
                }

    /* generate the last bit and determine the final rounding */
            r/=2; x *= 4;
            if(x==zero) goto end; 100+r; /* trigger inexact flag */
            if(s<x) {
                q+=r; x -=s; s += 2; s *= 2; x *= 4;
                t = (x-s)-5;
                b=1.0+3*r/4; if(b==1.0) goto end; /* b==1 : Round-to-zero */
                b=1.0+r/4;   if(b>1.0) t=1;	/* b>1 : Round-to-(+INF) */
                if(t>=0) q+=r; }	      /* else: Round-to-nearest */
            else {
                s *= 2; x *= 4;
                t = (x-s)-1;
                b=1.0+3*r/4; if(b==1.0) goto end;
                b=1.0+r/4;   if(b>1.0) t=1;
                if(t>=0) q+=r; }

end:        return(scalb(q,n));
}

#if 0
/* DREM(X,Y)
 * RETURN X REM Y =X-N*Y, N=[X/Y] ROUNDED (ROUNDED TO EVEN IN THE HALF WAY CASE)
 * DOUBLE PRECISION (VAX D format 56 bits, IEEE DOUBLE 53 BITS)
 * INTENDED FOR ASSEMBLY LANGUAGE
 * CODED IN C BY K.C. NG, 3/23/85, 4/8/85.
 *
 * Warning: this code should not get compiled in unless ALL of
 * the following machine-dependent routines are supplied.
 *
 * Required machine dependent functions (not on a VAX):
 *     swapINX(i): save inexact flag and reset it to "i"
 *     swapENI(e): save inexact enable and reset it to "e"
 *
 * Notes on this (disabled) alternative:
 *     - the exponent masks below are the IEEE double ones; m25 and m57 are
 *       25 and 57 expressed in exponent-field units (value << 4).
 *     - n holds the most recent partial quotient and is consulted in the
 *       half-way test of the final adjustment.  It starts at 0 so that the
 *       test is well defined when the reduction loop never executes.
 */

double drem(x,y)
double x,y;
{

#ifdef NATIONAL		/* order of words in floating point number */
	static int n0=3,n1=2,n2=1,n3=0;
#else /* VAX, SUN, ZILOG */
	static int n0=0,n1=1,n2=2,n3=3;
#endif

	static unsigned short mexp =0x7ff0, m25 =0x0190, m57 =0x0390;
	static double zero=0.0;
	double hy,y1,t,t1;
	short k;
	long n=0;
	int i,e;
	unsigned short xexp,yexp, *px  =(unsigned short *) &x  ,
			nx,nf,	  *py  =(unsigned short *) &y  ,
			sign,	  *pt  =(unsigned short *) &t  ,
				  *pt1 =(unsigned short *) &t1 ;

	xexp = px[n0] & mexp ;	/* exponent of x */
	yexp = py[n0] & mexp ;	/* exponent of y */
	sign = px[n0] &0x8000;	/* sign of x     */

/* return NaN if x is NaN, or y is NaN, or x is INF, or y is zero */
	if(x!=x) return(x); if(y!=y) return(y);	     /* x or y is NaN */
	if( xexp == mexp )   return(zero/zero);      /* x is INF */
	if(y==zero) return(y/y);

/* save the inexact flag and inexact enable in i and e respectively
 * and reset them to zero
 */
	i=swapINX(0);	e=swapENI(0);

/* subnormal number */
	nx=0;
	if(yexp==0) {t=1.0,pt[n0]+=m57; y*=t; nx=m57;}

/* if y is tiny (biased exponent <= 57), scale up y to y*2**57 */
	if( yexp <= m57 ) {py[n0]+=m57; nx+=m57; yexp+=m57;}

	nf=nx;
	py[n0] &= 0x7fff;
	px[n0] &= 0x7fff;

/* mask off the least significant 27 bits of y */
	t=y; pt[n3]=0; pt[n2]&=0xf800; y1=t;

/* LOOP: argument reduction on x whenever x > y */
loop:
	while ( x > y )
	{
	    t=y;
	    t1=y1;
	    xexp=px[n0]&mexp;	  /* exponent of x */
	    k=xexp-yexp-m25;
	    if(k>0) 	/* if x/y >= 2**26, scale up y so that x/y < 2**26 */
		{pt[n0]+=k;pt1[n0]+=k;}
	    n=x/t; x=(x-n*t1)-n*(t-t1);
	}
    /* end while (x > y) */

	/* undo the scaling applied for a tiny y, then reduce again */
	if(nx!=0) {t=1.0; pt[n0]+=nx; x*=t; nx=0; goto loop;}

/* final adjustment */

	hy=y/2.0;
	if(x>hy||((x==hy)&&n%2==1)) x-=y;
	px[n0] ^= sign;
	if(nf!=0) { t=1.0; pt[n0]-=nf; x*=t;}

/* restore inexact flag and inexact enable */
	swapINX(i); swapENI(e);

	return(x);
}
#endif

#if 0
/* SQRT
 * RETURN CORRECTLY ROUNDED (ACCORDING TO THE ROUNDING MODE) SQRT
 * FOR IEEE DOUBLE PRECISION ONLY, INTENDED FOR ASSEMBLY LANGUAGE
 * CODED IN C BY K.C. NG, 3/22/85.
 *
 * Warning: this code should not get compiled in unless ALL of
 * the following machine-dependent routines are supplied.
 *
 * Required machine dependent functions:
 *     swapINX(i)  ...return the status of INEXACT flag and reset it to "i"
 *     swapRM(r)   ...return the current Rounding Mode and reset it to "r"
 *     swapENI(e)  ...return the status of inexact enable and reset it to "e"
 *     addc(t)     ...perform t=t+1 regarding t as a 64 bit unsigned integer
 *     subc(t)     ...perform t=t-1 regarding t as a 64 bit unsigned integer
 *
 * NOTE(review): a double is addressed below as two "unsigned long" words
 * (indices n0 and n1), which appears to assume a 32-bit long -- confirm
 * before enabling this code on another machine.
 */

/* corrections subtracted from the initial approximation in newsqrt(),
 * indexed by five bits of that approximation's high word
 */
static unsigned long table[] = {
0, 1204, 3062, 5746, 9193, 13348, 18162, 23592, 29598, 36145, 43202, 50740,
58733, 67158, 75992, 85215, 83599, 71378, 60428, 50647, 41945, 34246, 27478,
21581, 16499, 12183, 8588, 5674, 3403, 1742, 661, 130, };

double newsqrt(x)
double x;
{
        double y,z,t,addc(),subc(),b54=134217728.*134217728.; /* b54=2**54 */
        long mx,scalx,mexp=0x7ff00000;
        int i,j,r,e,swapINX(),swapRM(),swapENI();
        unsigned long *py=(unsigned long *) &y   ,
                      *pt=(unsigned long *) &t   ,
                      *px=(unsigned long *) &x   ;
#ifdef NATIONAL         /* ordering of word in a floating point number */
        int n0=1, n1=0;
#else
        int n0=0, n1=1;
#endif
/* Rounding Mode:  RN ...round-to-nearest
 *                 RZ ...round-towards 0
 *                 RP ...round-towards +INF
 *                 RM ...round-towards -INF
 */
        int RN=0,RZ=1,RP=2,RM=3;/* machine dependent: work on a Zilog Z8070
                                 * and a National 32081 & 16081
                                 */

/* exceptions */
	if(x!=x||x==0.0) return(x);  /* sqrt(NaN) is NaN, sqrt(+-0) = +-0 */
	if(x<0) return((x-x)/(x-x)); /* sqrt(negative) is invalid */
        if((mx=px[n0]&mexp)==mexp) return(x);  /* sqrt(+INF) is +INF */

/* save, reset, initialize */
        e=swapENI(0);   /* ...save and reset the inexact enable */
        i=swapINX(0);   /* ...save INEXACT flag */
        r=swapRM(RN);   /* ...save and reset the Rounding Mode to RN */
        scalx=0;

/* subnormal number, scale up x to x*2**54 */
        if(mx==0) {x *= b54 ; scalx-=0x01b00000;}

/* scale x to avoid intermediate over/underflow:
 * if (x > 2**512) x=x/2**512; if (x < 2**-512) x=x*2**512 */
        if(mx>0x5ff00000) {px[n0] -= 0x20000000; scalx+= 0x10000000;}
        if(mx<0x1ff00000) {px[n0] += 0x20000000; scalx-= 0x10000000;}

/* magic initial approximation to almost 8 sig. bits */
        py[n0]=(px[n0]>>1)+0x1ff80000;
        py[n0]=py[n0]-table[(py[n0]>>15)&31];

/* Heron's rule once with correction to improve y to almost 18 sig. bits */
        t=x/y; y=y+t; py[n0]=py[n0]-0x00100006; py[n1]=0;

/* triple to almost 56 sig. bits; now y approx. sqrt(x) to within 1 ulp */
        t=y*y; z=t;  pt[n0]+=0x00100000; t+=z; z=(x-z)*y;
        t=z/(t+x) ;  pt[n0]+=0x00100000; y+=t;

/* twiddle last bit to force y correctly rounded */
        swapRM(RZ);     /* ...set Rounding Mode to round-toward-zero */
        swapINX(0);     /* ...clear INEXACT flag */
        swapENI(e);     /* ...restore inexact enable status */
        t=x/y;          /* ...chopped quotient, possibly inexact */
        j=swapINX(i);   /* ...read and restore inexact flag */
        if(j==0) { if(t==y) goto end; else t=subc(t); }  /* ...t=t-ulp */
        b54+0.1;        /* ..trigger inexact flag, sqrt(x) is inexact */
        if(r==RN) t=addc(t);            /* ...t=t+ulp */
        else if(r==RP) { t=addc(t);y=addc(y);}/* ...t=t+ulp;y=y+ulp; */
        y=y+t;                          /* ...chopped sum */
        py[n0]=py[n0]-0x00100000;       /* ...correctly rounded sqrt(x) */
end:    py[n0]=py[n0]+scalx;            /* ...scale back y */
        swapRM(r);                      /* ...restore Rounding Mode */
        return(y);
}
#endif