mpfr/src/erf.c

/* mpfr_erf -- error function of a floating-point number

Copyright 2001, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
4a238c70SJohn Marino#define EXP1 2.71828182845904523536 /* exp(1) */
4a238c70SJohn Marino
4a238c70SJohn Marinostatic int mpfr_erf_0 (mpfr_ptr, mpfr_srcptr, double, mpfr_rnd_t);
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_erf (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd_mode)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_t xf;
4a238c70SJohn Marino  int inex, large;
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd_mode),
4a238c70SJohn Marino     ("y[%Pu]=%.*Rg inexact=%d", mpfr_get_prec (y), mpfr_log_prec, y, inex));
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_IS_INF (x)) /* erf(+inf) = +1, erf(-inf) = -1 */
4a238c70SJohn Marino        return mpfr_set_si (y, MPFR_INT_SIGN (x), MPFR_RNDN);
4a238c70SJohn Marino      else /* erf(+0) = +0, erf(-0) = -0 */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_ASSERTD (MPFR_IS_ZERO (x));
4a238c70SJohn Marino          return mpfr_set (y, x, MPFR_RNDN); /* should keep the sign of x */
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* now x is neither NaN, Inf nor 0 */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* first try expansion at x=0 when x is small, or asymptotic expansion
4a238c70SJohn Marino     where x is large */
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* around x=0, we have erf(x) = 2x/sqrt(Pi) (1 - x^2/3 + ...),
4a238c70SJohn Marino     with 1 - x^2/3 <= sqrt(Pi)*erf(x)/2/x <= 1 for x >= 0. This means that
4a238c70SJohn Marino     if x^2/3 < 2^(-PREC(y)-1) we can decide of the correct rounding,
4a238c70SJohn Marino     unless we have a worst-case for 2x/sqrt(Pi). */
4a238c70SJohn Marino  if (MPFR_EXP(x) < - (mpfr_exp_t) (MPFR_PREC(y) / 2))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* we use 2x/sqrt(Pi) (1 - x^2/3) <= erf(x) <= 2x/sqrt(Pi) for x > 0
4a238c70SJohn Marino         and 2x/sqrt(Pi) <= erf(x) <= 2x/sqrt(Pi) (1 - x^2/3) for x < 0.
4a238c70SJohn Marino         In both cases |2x/sqrt(Pi) (1 - x^2/3)| <= |erf(x)| <= |2x/sqrt(Pi)|.
4a238c70SJohn Marino         We will compute l and h such that l <= |2x/sqrt(Pi) (1 - x^2/3)|
4a238c70SJohn Marino         and |2x/sqrt(Pi)| <= h. If l and h round to the same value to
4a238c70SJohn Marino         precision PREC(y) and rounding rnd_mode, then we are done. */
4a238c70SJohn Marino      mpfr_t l, h; /* lower and upper bounds for erf(x) */
4a238c70SJohn Marino      int ok, inex2;
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_init2 (l, MPFR_PREC(y) + 17);
4a238c70SJohn Marino      mpfr_init2 (h, MPFR_PREC(y) + 17);
4a238c70SJohn Marino      /* first compute l */
4a238c70SJohn Marino      mpfr_mul (l, x, x, MPFR_RNDU);
4a238c70SJohn Marino      mpfr_div_ui (l, l, 3, MPFR_RNDU); /* upper bound on x^2/3 */
4a238c70SJohn Marino      mpfr_ui_sub (l, 1, l, MPFR_RNDZ); /* lower bound on 1 - x^2/3 */
4a238c70SJohn Marino      mpfr_const_pi (h, MPFR_RNDU); /* upper bound of Pi */
4a238c70SJohn Marino      mpfr_sqrt (h, h, MPFR_RNDU); /* upper bound on sqrt(Pi) */
4a238c70SJohn Marino      mpfr_div (l, l, h, MPFR_RNDZ); /* lower bound on 1/sqrt(Pi) (1 - x^2/3) */
4a238c70SJohn Marino      mpfr_mul_2ui (l, l, 1, MPFR_RNDZ); /* 2/sqrt(Pi) (1 - x^2/3) */
4a238c70SJohn Marino      mpfr_mul (l, l, x, MPFR_RNDZ); /* |l| is a lower bound on
4a238c70SJohn Marino                                       |2x/sqrt(Pi) (1 - x^2/3)| */
4a238c70SJohn Marino      /* now compute h */
4a238c70SJohn Marino      mpfr_const_pi (h, MPFR_RNDD); /* lower bound on Pi */
4a238c70SJohn Marino      mpfr_sqrt (h, h, MPFR_RNDD); /* lower bound on sqrt(Pi) */
4a238c70SJohn Marino      mpfr_div_2ui (h, h, 1, MPFR_RNDD); /* lower bound on sqrt(Pi)/2 */
4a238c70SJohn Marino      /* since sqrt(Pi)/2 < 1, the following should not underflow */
4a238c70SJohn Marino      mpfr_div (h, x, h, MPFR_IS_POS(x) ? MPFR_RNDU : MPFR_RNDD);
4a238c70SJohn Marino      /* round l and h to precision PREC(y) */
4a238c70SJohn Marino      inex = mpfr_prec_round (l, MPFR_PREC(y), rnd_mode);
4a238c70SJohn Marino      inex2 = mpfr_prec_round (h, MPFR_PREC(y), rnd_mode);
4a238c70SJohn Marino      /* Caution: we also need inex=inex2 (inex might be 0). */
4a238c70SJohn Marino      ok = SAME_SIGN (inex, inex2) && mpfr_cmp (l, h) == 0;
4a238c70SJohn Marino      if (ok)
4a238c70SJohn Marino        mpfr_set (y, h, rnd_mode);
4a238c70SJohn Marino      mpfr_clear (l);
4a238c70SJohn Marino      mpfr_clear (h);
4a238c70SJohn Marino      if (ok)
4a238c70SJohn Marino        goto end;
4a238c70SJohn Marino      /* this test can still fail for small precision, for example
4a238c70SJohn Marino         for x=-0.100E-2 with a target precision of 3 bits, since
4a238c70SJohn Marino         the error term x^2/3 is not that small. */
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (xf, 53);
4a238c70SJohn Marino  mpfr_const_log2 (xf, MPFR_RNDU);
4a238c70SJohn Marino  mpfr_div (xf, x, xf, MPFR_RNDZ); /* round to zero ensures we get a lower
4a238c70SJohn Marino                                     bound of |x/log(2)| */
4a238c70SJohn Marino  mpfr_mul (xf, xf, x, MPFR_RNDZ);
4a238c70SJohn Marino  large = mpfr_cmp_ui (xf, MPFR_PREC (y) + 1) > 0;
4a238c70SJohn Marino  mpfr_clear (xf);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* when x goes to infinity, we have erf(x) = 1 - 1/sqrt(Pi)/exp(x^2)/x + ...
4a238c70SJohn Marino     and |erf(x) - 1| <= exp(-x^2) is true for any x >= 0, thus if
4a238c70SJohn Marino     exp(-x^2) < 2^(-PREC(y)-1) the result is 1 or 1-epsilon.
4a238c70SJohn Marino     This rewrites as x^2/log(2) > p+1. */
4a238c70SJohn Marino  if (MPFR_UNLIKELY (large))
4a238c70SJohn Marino    /* |erf x| = 1 or 1- */
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_rnd_t rnd2 = MPFR_IS_POS (x) ? rnd_mode : MPFR_INVERT_RND(rnd_mode);
4a238c70SJohn Marino      if (rnd2 == MPFR_RNDN || rnd2 == MPFR_RNDU || rnd2 == MPFR_RNDA)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          inex = MPFR_INT_SIGN (x);
4a238c70SJohn Marino          mpfr_set_si (y, inex, rnd2);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else /* round to zero */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          inex = -MPFR_INT_SIGN (x);
4a238c70SJohn Marino          mpfr_setmax (y, 0); /* warning: setmax keeps the old sign of y */
4a238c70SJohn Marino          MPFR_SET_SAME_SIGN (y, x);
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino  else  /* use Taylor */
4a238c70SJohn Marino    {
4a238c70SJohn Marino      double xf2;
4a238c70SJohn Marino
4a238c70SJohn Marino      /* FIXME: get rid of doubles/mpfr_get_d here */
4a238c70SJohn Marino      xf2 = mpfr_get_d (x, MPFR_RNDN);
4a238c70SJohn Marino      xf2 = xf2 * xf2; /* xf2 ~ x^2 */
4a238c70SJohn Marino      inex = mpfr_erf_0 (y, x, xf2, rnd_mode);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino end:
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino  return mpfr_check_range (y, inex, rnd_mode);
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino/* return x*2^e */
4a238c70SJohn Marinostatic double
4a238c70SJohn Marinomul_2exp (double x, mpfr_exp_t e)
4a238c70SJohn Marino{
4a238c70SJohn Marino  if (e > 0)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      while (e--)
4a238c70SJohn Marino        x *= 2.0;
4a238c70SJohn Marino    }
4a238c70SJohn Marino  else
4a238c70SJohn Marino    {
4a238c70SJohn Marino      while (e++)
4a238c70SJohn Marino        x /= 2.0;
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  return x;
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino/* evaluates erf(x) using the expansion at x=0:
4a238c70SJohn Marino
4a238c70SJohn Marino   erf(x) = 2/sqrt(Pi) * sum((-1)^k*x^(2k+1)/k!/(2k+1), k=0..infinity)
4a238c70SJohn Marino
4a238c70SJohn Marino   Assumes x is neither NaN nor infinite nor zero.
4a238c70SJohn Marino   Assumes also that e*x^2 <= n (target precision).
4a238c70SJohn Marino */
4a238c70SJohn Marinostatic int
4a238c70SJohn Marinompfr_erf_0 (mpfr_ptr res, mpfr_srcptr x, double xf2, mpfr_rnd_t rnd_mode)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_prec_t n, m;
4a238c70SJohn Marino  mpfr_exp_t nuk, sigmak;
4a238c70SJohn Marino  double tauk;
4a238c70SJohn Marino  mpfr_t y, s, t, u;
4a238c70SJohn Marino  unsigned int k;
4a238c70SJohn Marino  int log2tauk;
4a238c70SJohn Marino  int inex;
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  n = MPFR_PREC (res); /* target precision */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* initial working precision */
4a238c70SJohn Marino  m = n + (mpfr_prec_t) (xf2 / LOG2) + 8 + MPFR_INT_CEIL_LOG2 (n);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (y, m);
4a238c70SJohn Marino  mpfr_init2 (s, m);
4a238c70SJohn Marino  mpfr_init2 (t, m);
4a238c70SJohn Marino  mpfr_init2 (u, m);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, m);
4a238c70SJohn Marino  for (;;)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_mul (y, x, x, MPFR_RNDU); /* err <= 1 ulp */
4a238c70SJohn Marino      mpfr_set_ui (s, 1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_set_ui (t, 1, MPFR_RNDN);
4a238c70SJohn Marino      tauk = 0.0;
4a238c70SJohn Marino
4a238c70SJohn Marino      for (k = 1; ; k++)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_mul (t, y, t, MPFR_RNDU);
4a238c70SJohn Marino          mpfr_div_ui (t, t, k, MPFR_RNDU);
4a238c70SJohn Marino          mpfr_div_ui (u, t, 2 * k + 1, MPFR_RNDU);
4a238c70SJohn Marino          sigmak = MPFR_GET_EXP (s);
4a238c70SJohn Marino          if (k % 2)
4a238c70SJohn Marino            mpfr_sub (s, s, u, MPFR_RNDN);
4a238c70SJohn Marino          else
4a238c70SJohn Marino            mpfr_add (s, s, u, MPFR_RNDN);
4a238c70SJohn Marino          sigmak -= MPFR_GET_EXP(s);
4a238c70SJohn Marino          nuk = MPFR_GET_EXP(u) - MPFR_GET_EXP(s);
4a238c70SJohn Marino
4a238c70SJohn Marino          if ((nuk < - (mpfr_exp_t) m) && ((double) k >= xf2))
4a238c70SJohn Marino            break;
4a238c70SJohn Marino
4a238c70SJohn Marino          /* tauk <- 1/2 + tauk * 2^sigmak + (1+8k)*2^nuk */
4a238c70SJohn Marino          tauk = 0.5 + mul_2exp (tauk, sigmak)
4a238c70SJohn Marino            + mul_2exp (1.0 + 8.0 * (double) k, nuk);
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_mul (s, x, s, MPFR_RNDU);
4a238c70SJohn Marino      MPFR_SET_EXP (s, MPFR_GET_EXP (s) + 1);
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_const_pi (t, MPFR_RNDZ);
4a238c70SJohn Marino      mpfr_sqrt (t, t, MPFR_RNDZ);
4a238c70SJohn Marino      mpfr_div (s, s, t, MPFR_RNDN);
4a238c70SJohn Marino      tauk = 4.0 * tauk + 11.0; /* final ulp-error on s */
4a238c70SJohn Marino      log2tauk = __gmpfr_ceil_log2 (tauk);
4a238c70SJohn Marino
4a238c70SJohn Marino      if (MPFR_LIKELY (MPFR_CAN_ROUND (s, m - log2tauk, n, rnd_mode)))
4a238c70SJohn Marino        break;
4a238c70SJohn Marino
4a238c70SJohn Marino      /* Actualisation of the precision */
4a238c70SJohn Marino      MPFR_ZIV_NEXT (loop, m);
4a238c70SJohn Marino      mpfr_set_prec (y, m);
4a238c70SJohn Marino      mpfr_set_prec (s, m);
4a238c70SJohn Marino      mpfr_set_prec (t, m);
4a238c70SJohn Marino      mpfr_set_prec (u, m);
4a238c70SJohn Marino
4a238c70SJohn Marino    }
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  inex = mpfr_set (res, s, rnd_mode);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_clear (y);
4a238c70SJohn Marino  mpfr_clear (t);
4a238c70SJohn Marino  mpfr_clear (u);
4a238c70SJohn Marino  mpfr_clear (s);
4a238c70SJohn Marino
4a238c70SJohn Marino  return inex;
4a238c70SJohn Marino}