/* $NetBSD: s_fmaf.c,v 1.2 2013/02/11 01:29:58 christos Exp $ */

/*-
 * Copyright (c) 2005-2011 David Schultz <das@FreeBSD.ORG>
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

29*84d9c625SLionel Sambuc #include <sys/cdefs.h>
30*84d9c625SLionel Sambuc #if 0
31*84d9c625SLionel Sambuc __FBSDID("$FreeBSD: src/lib/msun/src/s_fmaf.c,v 1.3 2011/10/15 04:16:58 das Exp $");
32*84d9c625SLionel Sambuc #else
33*84d9c625SLionel Sambuc __RCSID("$NetBSD: s_fmaf.c,v 1.2 2013/02/11 01:29:58 christos Exp $");
34*84d9c625SLionel Sambuc #endif
35*84d9c625SLionel Sambuc
36*84d9c625SLionel Sambuc #include <fenv.h>
37*84d9c625SLionel Sambuc
38*84d9c625SLionel Sambuc #include "math.h"
39*84d9c625SLionel Sambuc #include "math_private.h"
40*84d9c625SLionel Sambuc
/*
 * Fused multiply-add: Compute x * y + z with a single rounding error.
 *
 * A double has more than twice as much precision as a float, so
 * direct double-precision arithmetic suffices, except where double
 * rounding occurs.
 *
 * The sum is first evaluated in double.  That value is returned (and
 * thereby narrowed to float) unless all of the following hold: it lies
 * exactly halfway between two adjacent floats, it is finite, the double
 * addition was inexact, and the current rounding mode is round-to-nearest.
 * Only in that case could narrowing round a second time in the wrong
 * direction, so the sum is recomputed under round-toward-zero to find out
 * on which side of the halfway point the true sum lies.
 *
 * The function temporarily changes the floating-point rounding mode and
 * restores it to FE_TONEAREST before returning.
 */
float
fmaf(float x, float y, float z)
{
	double xy, result;
	uint32_t hr, lr;

	xy = (double)x * y;
	result = xy + z;
	EXTRACT_WORDS(hr, lr, result);
	/*
	 * Common case: The double precision result is fine.
	 *
	 * The low 29 bits of the double's significand are the ones dropped
	 * when narrowing to float; a halfway case has the top one of them
	 * set and the remaining 28 clear.
	 */
	if ((lr & 0x1fffffff) != 0x10000000 ||	/* not a halfway case */
	    (hr & 0x7ff00000) == 0x7ff00000 ||	/* Inf or NaN */
	    result - xy == z ||			/* exact */
	    fegetround() != FE_TONEAREST)	/* not round-to-nearest */
		return (result);

	/*
	 * If result is inexact, and exactly halfway between two float values,
	 * we need to adjust the low-order bit in the direction of the error.
	 */
	fesetround(FE_TOWARDZERO);
	/*
	 * XXX work around gcc CSE bug: reading xy through a volatile forces
	 * the addition to be redone under the new rounding mode rather than
	 * reusing the value computed above.
	 */
	volatile double vxy = xy;
	double adjusted_result = vxy + z;
	/* The rounding mode was verified to be FE_TONEAREST above; restore it. */
	fesetround(FE_TONEAREST);
	/*
	 * If truncation gives the same double, the round-to-nearest result
	 * was itself rounded toward zero, so the true sum lies beyond the
	 * halfway point: bump the low word so that narrowing rounds away
	 * from zero.  Otherwise adjusted_result already sits just short of
	 * the halfway point and narrows correctly as is.
	 */
	if (result == adjusted_result)
		SET_LOW_WORD(adjusted_result, lr + 1);
	return (adjusted_result);
}