libm/ieee/cbrt.c

*24580Szliu/*
*24580Szliu * Copyright (c) 1985 Regents of the University of California.
*24580Szliu *
*24580Szliu * Use and reproduction of this software are granted  in  accordance  with
*24580Szliu * the terms and conditions specified in  the  Berkeley  Software  License
*24580Szliu * Agreement (in particular, this entails acknowledgement of the programs'
*24580Szliu * source, and inclusion of this notice) with the additional understanding
*24580Szliu * that  all  recipients  should regard themselves as participants  in  an
*24580Szliu * ongoing  research  project and hence should  feel  obligated  to report
*24580Szliu * their  experiences (good or bad) with these elementary function  codes,
*24580Szliu * using "sendbug 4bsd-bugs@BERKELEY", to the authors.
*24580Szliu */
*24580Szliu
#ifndef lint
/*
 * SCCS version identification string for this file.  It is compiled out
 * when `lint' is defined.
 */
static char sccsid[] = "@(#)cbrt.c	1.1 (ELEFUNT) 09/06/85";
#endif /* not lint */
*24580Szliu
*24580Szliu/* kahan's cube root (53 bits IEEE double precision)
*24580Szliu * for IEEE machines only
*24580Szliu * coded in C by K.C. Ng, 4/30/85
*24580Szliu *
*24580Szliu * Accuracy:
*24580Szliu *	better than 0.667 ulps according to an error analysis. Maximum
*24580Szliu * error observed was 0.666 ulps in a test of 1,000,000 random arguments.
*24580Szliu *
*24580Szliu * Warning: this code is semi machine dependent; the ordering of words in
*24580Szliu * a floating point number must be known in advance. I assume that the
*24580Szliu * long integer at the address of a floating point number will be the
*24580Szliu * leading 32 bits of that floating point number (i.e., sign, exponent,
*24580Szliu * and the 20 most significant bits).
*24580Szliu * On a National machine, it has different ordering; therefore, this code
*24580Szliu * must be compiled with flag -DNATIONAL.
*24580Szliu */
#ifndef VAX

/*
 * The bit manipulation below views a double as exactly two 32-bit words.
 * Refuse to compile (negative array size) on a platform where that does
 * not hold, instead of silently computing garbage.
 */
typedef char cbrt_word_size_check[(sizeof(unsigned int) * 2 == sizeof(double)) ? 1 : -1];

/* A double overlaid with its two 32-bit halves. */
union cbrt_bits {
	double       d;
	unsigned int w[2];
};

/*
 * Biases added to (leading word)/3 to obtain the leading word of a rough
 * cube root: B1 for normal arguments, B2 for subnormal arguments that
 * have first been scaled by 2**54.
 */
static const unsigned int B1 = 715094163, /* B1 = (682-0.03306235651)*2**20 */
                          B2 = 696219795; /* B2 = (664-0.03306235651)*2**20 */

/* Coefficients of the rational correction used in the 23-bit step. */
static const double
	    C= 19./35.,
	    D= -864./1225.,
	    E= 99./70.,
	    F= 45./28.,
	    G= 5./14.;

/*
 * cbrt(x) -- cube root of x for IEEE double precision.
 *
 * Returns x itself when x is NaN, +-infinity or +-0; otherwise returns a
 * value carrying the sign of x whose magnitude is the cube root of |x|
 * (error below 0.667 ulps according to the original error analysis).
 *
 * The position of the leading word (sign, exponent and the 20 most
 * significant fraction bits) is detected at run time, so the result no
 * longer depends on the NATIONAL compile flag; defining it is harmless.
 */
double cbrt(double x)
{
	union cbrt_bits ux, ut;
	double r, s, t, w;
	unsigned int mexp, sign;
	int n0, n1;	/* indices of the leading and trailing words */

	/*
	 * 1.0 is 0x3FF00000 00000000: its leading word is non-zero and its
	 * trailing word is zero, which tells us the word order in memory.
	 */
	ut.d = 1.0;
	n0 = (ut.w[0] != 0) ? 0 : 1;
	n1 = 1 - n0;

	ux.d = x;
	mexp = ux.w[n0] & 0x7ff00000;
	if (mexp == 0x7ff00000)
		return (x);		/* cbrt(NaN,INF) is itself */
	if (x == 0.0)
		return (x);		/* cbrt(0) is itself */

	sign = ux.w[n0] & 0x80000000;	/* sign = sign(x) */
	ux.w[n0] ^= sign;
	x = ux.d;			/* x = |x| */

    /* rough cbrt to 5 bits */
	ut.d = 0.0;			/* trailing word starts out as zero */
	if (mexp == 0) {		/* subnormal number */
		ut.w[n0] = 0x43500000;	/* set t = 2**54 */
		ut.d *= x;		/* scale x into the normal range */
		ut.w[n0] = ut.w[n0] / 3 + B2;
	} else {
		ut.w[n0] = ux.w[n0] / 3 + B1;
	}
	t = ut.d;

    /* new cbrt to 23 bits, may be implemented in single precision */
	r = t * t / x;
	s = C + r * t;
	t *= G + F / (s + E + D / s);

    /* chopped to 20 bits and make it larger than cbrt(x) */
	ut.d = t;
	ut.w[n1] = 0;
	ut.w[n0] += 0x00000001;
	t = ut.d;

    /* one step newton iteration to 53 bits with error less than 0.667 ulps */
	s = t * t;		/* t*t is exact */
	r = x / s;
	w = t + t;
	r = (r - t) / (w + r);	/* r-t is exact */
	t = t + t * r;

    /* restore the sign bit */
	ut.d = t;
	ut.w[n0] |= sign;
	return (ut.d);
}
#endif