libm/ieee/cbrt.c

/*
 * Copyright (c) 1985 Regents of the University of California.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms are permitted
 * provided that the above copyright notice and this paragraph are
 * duplicated in all such forms and that any documentation,
 * advertising materials, and other materials related to such
 * distribution and use acknowledge that the software was developed
 * by the University of California, Berkeley.  The name of the
 * University may not be used to endorse or promote products derived
 * from this software without specific prior written permission.
 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
 * WARRANTIES OF MERCHANTIBILITY AND FITNESS FOR A PARTICULAR PURPOSE.
 *
 * All recipients should regard themselves as participants in an ongoing
 * research project and hence should feel obligated to report their
 * experiences (good or bad) with these elementary function codes, using
 * the sendbug(8) program, to the authors.
 */
24580Szliu
#ifndef lint
/* Version identification string for this file; omitted when `lint' is defined. */
static char sccsid[] = "@(#)cbrt.c	5.5 (Berkeley) 09/22/88";
#endif /* not lint */
24580Szliu
/*
 * Kahan's cube root (53 bits IEEE double precision)
 * for IEEE machines only
 * coded in C by K.C. Ng, 4/30/85
 *
 * Accuracy:
 *	better than 0.667 ulps according to an error analysis. Maximum
 *	error observed was 0.666 ulps in a 1,000,000 random arguments test.
 *
 * Warning: this code is semi machine dependent; it reads and writes the
 * two 32-bit words of a floating point number directly.  The "leading"
 * word holds the sign, the exponent and the 20 most significant bits of
 * the fraction; the other word holds the remaining 32 fraction bits.
 * Which of the two words comes first in memory differs between machines,
 * so cbrt() determines the ordering itself from the representation of
 * 1.0; no special compilation flag is needed.
 *
 * The code requires a 64-bit double and a 32-bit unsigned int; this is
 * verified at compile time below.
 */
#if !defined(vax)&&!defined(tahoe)

/* Compile-time check: the array size is negative if the layout is wrong. */
typedef char cbrt_requires_32bit_int_and_64bit_double
	[(sizeof(unsigned int) == 4 && sizeof(double) == 8) ? 1 : -1];

/* A double viewed as its two 32-bit words. */
typedef union {
	double		d;
	unsigned int	w[2];
} cbrt_words;

static const unsigned int
	B1 = 715094163,	/* B1 = (682-0.03306235651)*2**20 */
	B2 = 696219795;	/* B2 = (664-0.03306235651)*2**20 */
static const double
	C =   19./35.,
	D = -864./1225.,
	E =   99./70.,
	F =   45./28.,
	G =    5./14.;

/*
 * cbrt(x) -- return the cube root of x.
 *
 * NaN, +-infinity and +-0 are returned unchanged.  For every other
 * argument the result carries the sign of x.
 */
double cbrt(double x)
{
	cbrt_words ux, ut, probe;
	double r, s, t, w;
	unsigned int mexp, sign;
	int n0, n1;		/* index of leading / trailing word */

	/* 1.0 is 0x3ff00000 in the leading word and 0 in the trailing one */
	probe.d = 1.0;
	n0 = (probe.w[0] == 0x3ff00000) ? 0 : 1;
	n1 = 1 - n0;

	ux.d = x;
	mexp = ux.w[n0] & 0x7ff00000;
	if (mexp == 0x7ff00000)
		return (x);		/* cbrt(NaN,INF) is itself */
	if (x == 0.0)
		return (x);		/* cbrt(0) is itself */

	sign = ux.w[n0] & 0x80000000;	/* sign = sign(x) */
	ux.w[n0] ^= sign;		/* x = |x| */
	x = ux.d;

    /* rough cbrt to 5 bits */
	ut.d = 0.0;
	if (mexp == 0) {		/* subnormal number */
		ut.w[n0] = 0x43500000;	/* set t = 2**54 */
		ut.d *= x;		/* scale x into the normal range */
		ut.w[n0] = ut.w[n0] / 3 + B2;
	} else {
		ut.w[n0] = ux.w[n0] / 3 + B1;
	}
	t = ut.d;

    /* new cbrt to 23 bits, may be implemented in single precision */
	r = t * t / x;
	s = C + r * t;
	t *= G + F / (s + E + D / s);

    /* chopped to 20 bits and make it larger than cbrt(x) */
	ut.d = t;
	ut.w[n1] = 0;
	ut.w[n0] += 0x00000001;
	t = ut.d;

    /* one step newton iteration to 53 bits with error less than 0.667 ulps */
	s = t * t;			/* t*t is exact */
	r = x / s;
	w = t + t;
	r = (r - t) / (w + r);		/* r-t is exact */
	t = t + t * r;

    /* restore the sign bit */
	ut.d = t;
	ut.w[n0] |= sign;
	return (ut.d);
}
#endif