xref: /dflybsd-src/contrib/openbsd_libm/src/s_csqrtf.c (revision 4382f29d99a100bd77a81697c2f699c11f6a472a)
/*	$OpenBSD: s_csqrtf.c,v 1.2 2010/07/18 18:42:26 guenther Exp $	*/
/*
 * Copyright (c) 2008 Stephen L. Moshier <steve@moshier.net>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
17*05a0b428SJohn Marino 
/*							csqrtf()
 *
 *	Complex square root
 *
 *
 *
 * SYNOPSIS:
 *
 * float complex csqrtf();
 * float complex z, w;
 *
 * w = csqrtf( z );
 *
 *
 *
 * DESCRIPTION:
 *
 *
 * If z = x + iy,  r = |z|, then
 *
 *                       1/2
 * Re w  =  [ (r + x)/2 ]   ,
 *
 *                       1/2
 * Im w  =  [ (r - x)/2 ]   .
 *
 * Cancellation error in r-x or r+x is avoided by using the
 * identity  2 Re w Im w  =  y.
 *
 * Note that -w is also a square root of z.  The root chosen
 * is always in the right half plane and Im w has the same sign as y.
 *
 *
 *
 * ACCURACY:
 *
 *
 *                      Relative error:
 * arithmetic   domain     # trials      peak         rms
 *    IEEE      -10,+10    1,000,000    1.8e-7       3.5e-8
 *
 */
60*05a0b428SJohn Marino 
61*05a0b428SJohn Marino #include <complex.h>
62*05a0b428SJohn Marino #include <math.h>
63*05a0b428SJohn Marino 
64*05a0b428SJohn Marino float complex
csqrtf(float complex z)65*05a0b428SJohn Marino csqrtf(float complex z)
66*05a0b428SJohn Marino {
67*05a0b428SJohn Marino 	float complex w;
68*05a0b428SJohn Marino 	float x, y, r, t, scale;
69*05a0b428SJohn Marino 
70*05a0b428SJohn Marino 	x = crealf(z);
71*05a0b428SJohn Marino 	y = cimagf(z);
72*05a0b428SJohn Marino 
73*05a0b428SJohn Marino 	if(y == 0.0f) {
74*05a0b428SJohn Marino 		if (x < 0.0f) {
75*05a0b428SJohn Marino 			w = 0.0f + sqrtf(-x) * I;
76*05a0b428SJohn Marino 			return (w);
77*05a0b428SJohn Marino 		}
78*05a0b428SJohn Marino 		else if (x == 0.0f) {
79*05a0b428SJohn Marino 			return (0.0f + y * I);
80*05a0b428SJohn Marino 		}
81*05a0b428SJohn Marino 		else {
82*05a0b428SJohn Marino 			w = sqrtf(x) + y * I;
83*05a0b428SJohn Marino 			return (w);
84*05a0b428SJohn Marino 		}
85*05a0b428SJohn Marino 	}
86*05a0b428SJohn Marino 
87*05a0b428SJohn Marino 	if (x == 0.0f) {
88*05a0b428SJohn Marino 		r = fabsf(y);
89*05a0b428SJohn Marino 		r = sqrtf(0.5f*r);
90*05a0b428SJohn Marino 		if(y > 0)
91*05a0b428SJohn Marino 			w = r + r * I;
92*05a0b428SJohn Marino 		else
93*05a0b428SJohn Marino 			w = r - r * I;
94*05a0b428SJohn Marino 		return (w);
95*05a0b428SJohn Marino 	}
96*05a0b428SJohn Marino 
97*05a0b428SJohn Marino 	/* Rescale to avoid internal overflow or underflow.  */
98*05a0b428SJohn Marino 	if ((fabsf(x) > 4.0f) || (fabsf(y) > 4.0f)) {
99*05a0b428SJohn Marino 		x *= 0.25f;
100*05a0b428SJohn Marino 		y *= 0.25f;
101*05a0b428SJohn Marino 		scale = 2.0f;
102*05a0b428SJohn Marino 	}
103*05a0b428SJohn Marino 	else {
104*05a0b428SJohn Marino 		x *= 6.7108864e7f; /* 2^26 */
105*05a0b428SJohn Marino 		y *= 6.7108864e7f;
106*05a0b428SJohn Marino 		scale = 1.220703125e-4f; /* 2^-13 */
107*05a0b428SJohn Marino #if 0
108*05a0b428SJohn Marino 		x *= 4.0f;
109*05a0b428SJohn Marino 		y *= 4.0f;
110*05a0b428SJohn Marino 		scale = 0.5f;
111*05a0b428SJohn Marino #endif
112*05a0b428SJohn Marino 	}
113*05a0b428SJohn Marino 	w = x + y * I;
114*05a0b428SJohn Marino 	r = cabsf(w);
115*05a0b428SJohn Marino 	if (x > 0) {
116*05a0b428SJohn Marino 		t = sqrtf( 0.5f * r + 0.5f * x );
117*05a0b428SJohn Marino 		r = scale * fabsf((0.5f * y) / t);
118*05a0b428SJohn Marino 		t *= scale;
119*05a0b428SJohn Marino 	}
120*05a0b428SJohn Marino 	else {
121*05a0b428SJohn Marino 		r = sqrtf(0.5f * r - 0.5f * x);
122*05a0b428SJohn Marino 		t = scale * fabsf((0.5f * y) / r);
123*05a0b428SJohn Marino 		r *= scale;
124*05a0b428SJohn Marino 	}
125*05a0b428SJohn Marino 
126*05a0b428SJohn Marino 	if (y < 0)
127*05a0b428SJohn Marino 		w = t - r * I;
128*05a0b428SJohn Marino 	else
129*05a0b428SJohn Marino 		w = t + r * I;
130*05a0b428SJohn Marino 	return (w);
131*05a0b428SJohn Marino }
132