xref: /dflybsd-src/contrib/openbsd_libm/src/s_remquo.c (revision 4382f29d99a100bd77a81697c2f699c11f6a472a)
1*05a0b428SJohn Marino /* @(#)e_fmod.c 1.3 95/01/18 */
2*05a0b428SJohn Marino /*-
3*05a0b428SJohn Marino  * ====================================================
4*05a0b428SJohn Marino  * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
5*05a0b428SJohn Marino  *
6*05a0b428SJohn Marino  * Developed at SunSoft, a Sun Microsystems, Inc. business.
7*05a0b428SJohn Marino  * Permission to use, copy, modify, and distribute this
8*05a0b428SJohn Marino  * software is freely granted, provided that this notice
9*05a0b428SJohn Marino  * is preserved.
10*05a0b428SJohn Marino  * ====================================================
11*05a0b428SJohn Marino  */
12*05a0b428SJohn Marino 
13*05a0b428SJohn Marino #include <float.h>
14*05a0b428SJohn Marino #include <math.h>
15*05a0b428SJohn Marino 
16*05a0b428SJohn Marino #include "math_private.h"
17*05a0b428SJohn Marino 
/* Signed zeros selected by a sign bit: Zero[0] is +0.0, Zero[1] is -0.0. */
static const double Zero[] = { 0.0, -0.0 };
19*05a0b428SJohn Marino 
20*05a0b428SJohn Marino /*
21*05a0b428SJohn Marino  * Return the IEEE remainder and set *quo to the last n bits of the
22*05a0b428SJohn Marino  * quotient, rounded to the nearest integer.  We choose n=31 because
23*05a0b428SJohn Marino  * we wind up computing all the integer bits of the quotient anyway as
24*05a0b428SJohn Marino  * a side-effect of computing the remainder by the shift and subtract
25*05a0b428SJohn Marino  * method.  In practice, this is far more bits than are needed to use
26*05a0b428SJohn Marino  * remquo in reduction algorithms.
27*05a0b428SJohn Marino  */
28*05a0b428SJohn Marino double
remquo(double x,double y,int * quo)29*05a0b428SJohn Marino remquo(double x, double y, int *quo)
30*05a0b428SJohn Marino {
31*05a0b428SJohn Marino 	int32_t n,hx,hy,hz,ix,iy,sx,i;
32*05a0b428SJohn Marino 	u_int32_t lx,ly,lz,q,sxy;
33*05a0b428SJohn Marino 
34*05a0b428SJohn Marino 	EXTRACT_WORDS(hx,lx,x);
35*05a0b428SJohn Marino 	EXTRACT_WORDS(hy,ly,y);
36*05a0b428SJohn Marino 	sxy = (hx ^ hy) & 0x80000000;
37*05a0b428SJohn Marino 	sx = hx&0x80000000;		/* sign of x */
38*05a0b428SJohn Marino 	hx ^=sx;		/* |x| */
39*05a0b428SJohn Marino 	hy &= 0x7fffffff;	/* |y| */
40*05a0b428SJohn Marino 
41*05a0b428SJohn Marino     /* purge off exception values */
42*05a0b428SJohn Marino 	if((hy|ly)==0||(hx>=0x7ff00000)||	/* y=0,or x not finite */
43*05a0b428SJohn Marino 	  ((hy|((ly|-ly)>>31))>0x7ff00000))	/* or y is NaN */
44*05a0b428SJohn Marino 	    return (x*y)/(x*y);
45*05a0b428SJohn Marino 	if(hx<=hy) {
46*05a0b428SJohn Marino 	    if((hx<hy)||(lx<ly)) {
47*05a0b428SJohn Marino 		q = 0;
48*05a0b428SJohn Marino 		goto fixup;	/* |x|<|y| return x or x-y */
49*05a0b428SJohn Marino 	    }
50*05a0b428SJohn Marino 	    if(lx==ly) {
51*05a0b428SJohn Marino 		*quo = 1;
52*05a0b428SJohn Marino 		return Zero[(u_int32_t)sx>>31];	/* |x|=|y| return x*0*/
53*05a0b428SJohn Marino 	    }
54*05a0b428SJohn Marino 	}
55*05a0b428SJohn Marino 
56*05a0b428SJohn Marino     /* determine ix = ilogb(x) */
57*05a0b428SJohn Marino 	if(hx<0x00100000) {	/* subnormal x */
58*05a0b428SJohn Marino 	    if(hx==0) {
59*05a0b428SJohn Marino 		for (ix = -1043, i=lx; i>0; i<<=1) ix -=1;
60*05a0b428SJohn Marino 	    } else {
61*05a0b428SJohn Marino 		for (ix = -1022,i=(hx<<11); i>0; i<<=1) ix -=1;
62*05a0b428SJohn Marino 	    }
63*05a0b428SJohn Marino 	} else ix = (hx>>20)-1023;
64*05a0b428SJohn Marino 
65*05a0b428SJohn Marino     /* determine iy = ilogb(y) */
66*05a0b428SJohn Marino 	if(hy<0x00100000) {	/* subnormal y */
67*05a0b428SJohn Marino 	    if(hy==0) {
68*05a0b428SJohn Marino 		for (iy = -1043, i=ly; i>0; i<<=1) iy -=1;
69*05a0b428SJohn Marino 	    } else {
70*05a0b428SJohn Marino 		for (iy = -1022,i=(hy<<11); i>0; i<<=1) iy -=1;
71*05a0b428SJohn Marino 	    }
72*05a0b428SJohn Marino 	} else iy = (hy>>20)-1023;
73*05a0b428SJohn Marino 
74*05a0b428SJohn Marino     /* set up {hx,lx}, {hy,ly} and align y to x */
75*05a0b428SJohn Marino 	if(ix >= -1022)
76*05a0b428SJohn Marino 	    hx = 0x00100000|(0x000fffff&hx);
77*05a0b428SJohn Marino 	else {		/* subnormal x, shift x to normal */
78*05a0b428SJohn Marino 	    n = -1022-ix;
79*05a0b428SJohn Marino 	    if(n<=31) {
80*05a0b428SJohn Marino 	        hx = (hx<<n)|(lx>>(32-n));
81*05a0b428SJohn Marino 	        lx <<= n;
82*05a0b428SJohn Marino 	    } else {
83*05a0b428SJohn Marino 		hx = lx<<(n-32);
84*05a0b428SJohn Marino 		lx = 0;
85*05a0b428SJohn Marino 	    }
86*05a0b428SJohn Marino 	}
87*05a0b428SJohn Marino 	if(iy >= -1022)
88*05a0b428SJohn Marino 	    hy = 0x00100000|(0x000fffff&hy);
89*05a0b428SJohn Marino 	else {		/* subnormal y, shift y to normal */
90*05a0b428SJohn Marino 	    n = -1022-iy;
91*05a0b428SJohn Marino 	    if(n<=31) {
92*05a0b428SJohn Marino 	        hy = (hy<<n)|(ly>>(32-n));
93*05a0b428SJohn Marino 	        ly <<= n;
94*05a0b428SJohn Marino 	    } else {
95*05a0b428SJohn Marino 		hy = ly<<(n-32);
96*05a0b428SJohn Marino 		ly = 0;
97*05a0b428SJohn Marino 	    }
98*05a0b428SJohn Marino 	}
99*05a0b428SJohn Marino 
100*05a0b428SJohn Marino     /* fix point fmod */
101*05a0b428SJohn Marino 	n = ix - iy;
102*05a0b428SJohn Marino 	q = 0;
103*05a0b428SJohn Marino 	while(n--) {
104*05a0b428SJohn Marino 	    hz=hx-hy;lz=lx-ly; if(lx<ly) hz -= 1;
105*05a0b428SJohn Marino 	    if(hz<0){hx = hx+hx+(lx>>31); lx = lx+lx;}
106*05a0b428SJohn Marino 	    else {hx = hz+hz+(lz>>31); lx = lz+lz; q++;}
107*05a0b428SJohn Marino 	    q <<= 1;
108*05a0b428SJohn Marino 	}
109*05a0b428SJohn Marino 	hz=hx-hy;lz=lx-ly; if(lx<ly) hz -= 1;
110*05a0b428SJohn Marino 	if(hz>=0) {hx=hz;lx=lz;q++;}
111*05a0b428SJohn Marino 
112*05a0b428SJohn Marino     /* convert back to floating value and restore the sign */
113*05a0b428SJohn Marino 	if((hx|lx)==0) {			/* return sign(x)*0 */
114*05a0b428SJohn Marino 	    *quo = (sxy ? -q : q);
115*05a0b428SJohn Marino 	    return Zero[(u_int32_t)sx>>31];
116*05a0b428SJohn Marino 	}
117*05a0b428SJohn Marino 	while(hx<0x00100000) {		/* normalize x */
118*05a0b428SJohn Marino 	    hx = hx+hx+(lx>>31); lx = lx+lx;
119*05a0b428SJohn Marino 	    iy -= 1;
120*05a0b428SJohn Marino 	}
121*05a0b428SJohn Marino 	if(iy>= -1022) {	/* normalize output */
122*05a0b428SJohn Marino 	    hx = ((hx-0x00100000)|((iy+1023)<<20));
123*05a0b428SJohn Marino 	} else {		/* subnormal output */
124*05a0b428SJohn Marino 	    n = -1022 - iy;
125*05a0b428SJohn Marino 	    if(n<=20) {
126*05a0b428SJohn Marino 		lx = (lx>>n)|((u_int32_t)hx<<(32-n));
127*05a0b428SJohn Marino 		hx >>= n;
128*05a0b428SJohn Marino 	    } else if (n<=31) {
129*05a0b428SJohn Marino 		lx = (hx<<(32-n))|(lx>>n); hx = sx;
130*05a0b428SJohn Marino 	    } else {
131*05a0b428SJohn Marino 		lx = hx>>(n-32); hx = sx;
132*05a0b428SJohn Marino 	    }
133*05a0b428SJohn Marino 	}
134*05a0b428SJohn Marino fixup:
135*05a0b428SJohn Marino 	INSERT_WORDS(x,hx,lx);
136*05a0b428SJohn Marino 	y = fabs(y);
137*05a0b428SJohn Marino 	if (y < 0x1p-1021) {
138*05a0b428SJohn Marino 	    if (x+x>y || (x+x==y && (q & 1))) {
139*05a0b428SJohn Marino 		q++;
140*05a0b428SJohn Marino 		x-=y;
141*05a0b428SJohn Marino 	    }
142*05a0b428SJohn Marino 	} else if (x>0.5*y || (x==0.5*y && (q & 1))) {
143*05a0b428SJohn Marino 	    q++;
144*05a0b428SJohn Marino 	    x-=y;
145*05a0b428SJohn Marino 	}
146*05a0b428SJohn Marino 	GET_HIGH_WORD(hx,x);
147*05a0b428SJohn Marino 	SET_HIGH_WORD(x,hx^sx);
148*05a0b428SJohn Marino 	q &= 0x7fffffff;
149*05a0b428SJohn Marino 	*quo = (sxy ? -q : q);
150*05a0b428SJohn Marino 	return x;
151*05a0b428SJohn Marino }
152*05a0b428SJohn Marino 
/*
 * When long double has the same mantissa width as double, remquol is
 * provided as an alias of remquo instead of a separate implementation.
 * NOTE(review): __strong_alias is defined outside this file; it is
 * assumed to emit remquol as a strong symbol alias - confirm.
 */
#if DBL_MANT_DIG == LDBL_MANT_DIG
__strong_alias(remquol, remquo);
#endif	/* DBL_MANT_DIG == LDBL_MANT_DIG */
156