/*	$OpenBSD: s_csqrtf.c,v 1.2 2010/07/18 18:42:26 guenther Exp $	*/
/*
 * Copyright (c) 2008 Stephen L. Moshier <steve@moshier.net>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
17*05a0b428SJohn Marino
/*							csqrtf()
 *
 *	Complex square root
 *
 *
 *
 * SYNOPSIS:
 *
 * float complex csqrtf();
 * float complex z, w;
 *
 * w = csqrtf( z );
 *
 *
 *
 * DESCRIPTION:
 *
 *
 * If z = x + iy,  r = |z|, then
 *
 *                       1/2
 * Re w  =  [ (r + x)/2 ]   ,
 *
 *                       1/2
 * Im w  =  [ (r - x)/2 ]   .
 *
 * Cancellation error in r-x or r+x is avoided by using the
 * identity  2 Re w Im w  =  y.
 *
 * Note that -w is also a square root of z.  The root chosen
 * is always in the right half plane and Im w has the same sign as y.
 *
 *
 *
 * ACCURACY:
 *
 *
 *                      Relative error:
 * arithmetic   domain     # trials      peak         rms
 *    IEEE      -10,+10    1,000,000    1.8e-7       3.5e-8
 *
 */
60*05a0b428SJohn Marino
61*05a0b428SJohn Marino #include <complex.h>
62*05a0b428SJohn Marino #include <math.h>
63*05a0b428SJohn Marino
64*05a0b428SJohn Marino float complex
csqrtf(float complex z)65*05a0b428SJohn Marino csqrtf(float complex z)
66*05a0b428SJohn Marino {
67*05a0b428SJohn Marino float complex w;
68*05a0b428SJohn Marino float x, y, r, t, scale;
69*05a0b428SJohn Marino
70*05a0b428SJohn Marino x = crealf(z);
71*05a0b428SJohn Marino y = cimagf(z);
72*05a0b428SJohn Marino
73*05a0b428SJohn Marino if(y == 0.0f) {
74*05a0b428SJohn Marino if (x < 0.0f) {
75*05a0b428SJohn Marino w = 0.0f + sqrtf(-x) * I;
76*05a0b428SJohn Marino return (w);
77*05a0b428SJohn Marino }
78*05a0b428SJohn Marino else if (x == 0.0f) {
79*05a0b428SJohn Marino return (0.0f + y * I);
80*05a0b428SJohn Marino }
81*05a0b428SJohn Marino else {
82*05a0b428SJohn Marino w = sqrtf(x) + y * I;
83*05a0b428SJohn Marino return (w);
84*05a0b428SJohn Marino }
85*05a0b428SJohn Marino }
86*05a0b428SJohn Marino
87*05a0b428SJohn Marino if (x == 0.0f) {
88*05a0b428SJohn Marino r = fabsf(y);
89*05a0b428SJohn Marino r = sqrtf(0.5f*r);
90*05a0b428SJohn Marino if(y > 0)
91*05a0b428SJohn Marino w = r + r * I;
92*05a0b428SJohn Marino else
93*05a0b428SJohn Marino w = r - r * I;
94*05a0b428SJohn Marino return (w);
95*05a0b428SJohn Marino }
96*05a0b428SJohn Marino
97*05a0b428SJohn Marino /* Rescale to avoid internal overflow or underflow. */
98*05a0b428SJohn Marino if ((fabsf(x) > 4.0f) || (fabsf(y) > 4.0f)) {
99*05a0b428SJohn Marino x *= 0.25f;
100*05a0b428SJohn Marino y *= 0.25f;
101*05a0b428SJohn Marino scale = 2.0f;
102*05a0b428SJohn Marino }
103*05a0b428SJohn Marino else {
104*05a0b428SJohn Marino x *= 6.7108864e7f; /* 2^26 */
105*05a0b428SJohn Marino y *= 6.7108864e7f;
106*05a0b428SJohn Marino scale = 1.220703125e-4f; /* 2^-13 */
107*05a0b428SJohn Marino #if 0
108*05a0b428SJohn Marino x *= 4.0f;
109*05a0b428SJohn Marino y *= 4.0f;
110*05a0b428SJohn Marino scale = 0.5f;
111*05a0b428SJohn Marino #endif
112*05a0b428SJohn Marino }
113*05a0b428SJohn Marino w = x + y * I;
114*05a0b428SJohn Marino r = cabsf(w);
115*05a0b428SJohn Marino if (x > 0) {
116*05a0b428SJohn Marino t = sqrtf( 0.5f * r + 0.5f * x );
117*05a0b428SJohn Marino r = scale * fabsf((0.5f * y) / t);
118*05a0b428SJohn Marino t *= scale;
119*05a0b428SJohn Marino }
120*05a0b428SJohn Marino else {
121*05a0b428SJohn Marino r = sqrtf(0.5f * r - 0.5f * x);
122*05a0b428SJohn Marino t = scale * fabsf((0.5f * y) / r);
123*05a0b428SJohn Marino r *= scale;
124*05a0b428SJohn Marino }
125*05a0b428SJohn Marino
126*05a0b428SJohn Marino if (y < 0)
127*05a0b428SJohn Marino w = t - r * I;
128*05a0b428SJohn Marino else
129*05a0b428SJohn Marino w = t + r * I;
130*05a0b428SJohn Marino return (w);
131*05a0b428SJohn Marino }
132