mpfr/src/ai.c

4a238c70SJohn Marino/* mpfr_ai -- Airy function Ai
4a238c70SJohn Marino
*ab6d115fSJohn MarinoCopyright 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
*ab6d115fSJohn MarinoContributed by the AriC and Caramel projects, INRIA.
4a238c70SJohn Marino
4a238c70SJohn MarinoThis file is part of the GNU MPFR Library.
4a238c70SJohn Marino
4a238c70SJohn MarinoThe GNU MPFR Library is free software; you can redistribute it and/or modify
4a238c70SJohn Marinoit under the terms of the GNU Lesser General Public License as published by
4a238c70SJohn Marinothe Free Software Foundation; either version 3 of the License, or (at your
4a238c70SJohn Marinooption) any later version.
4a238c70SJohn Marino
4a238c70SJohn MarinoThe GNU MPFR Library is distributed in the hope that it will be useful, but
4a238c70SJohn MarinoWITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
4a238c70SJohn Marinoor FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
4a238c70SJohn MarinoLicense for more details.
4a238c70SJohn Marino
4a238c70SJohn MarinoYou should have received a copy of the GNU Lesser General Public License
4a238c70SJohn Marinoalong with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
4a238c70SJohn Marinohttp://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
4a238c70SJohn Marino51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
/* Reminder and notations:
   -----------------------

   Ai is the solution of:
        / y'' - x*y = 0
       {    Ai(0)   = 1/ ( 9^(1/3)*Gamma(2/3) )
        \  Ai'(0)   = -1/ ( 3^(1/3)*Gamma(1/3) )

   Series expansion at 0:
       Ai(x) = sum (a_i*x^i)
             = sum (t_i)          with t_i = a_i*x^i

   Recurrences:
       a_(i+3) = a_i / ((i+2)*(i+3))
       t_(i+3) = t_i * x^3 / ((i+2)*(i+3))

   Values:
       a_0 = Ai(0)  ~  0.355
       a_1 = Ai'(0) ~ -0.259
       a_2 = 0      (since y''(0) = 0*y(0))
*/
4a238c70SJohn Marino
4a238c70SJohn Marino
4a238c70SJohn Marino/* Airy function Ai evaluated by the most naive algorithm */
4a238c70SJohn Marinostatic int
4a238c70SJohn Marinompfr_ai1 (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino  mpfr_prec_t wprec;             /* working precision */
4a238c70SJohn Marino  mpfr_prec_t prec;              /* target precision */
4a238c70SJohn Marino  mpfr_prec_t err;               /* used to estimate the evaluation error */
4a238c70SJohn Marino  mpfr_prec_t correct_bits;      /* estimates the number of correct bits*/
4a238c70SJohn Marino  unsigned long int k;
4a238c70SJohn Marino  unsigned long int cond;        /* condition number of the series */
4a238c70SJohn Marino  unsigned long int assumed_exponent; /* used as a lowerbound of |EXP(Ai(x))| */
4a238c70SJohn Marino  int r;
4a238c70SJohn Marino  mpfr_t s;                      /* used to store the partial sum */
4a238c70SJohn Marino  mpfr_t ti, tip1;   /* used to store successive values of t_i */
4a238c70SJohn Marino  mpfr_t x3;                     /* used to store x^3 */
4a238c70SJohn Marino  mpfr_t tmp_sp, tmp2_sp;        /* small precision variables */
4a238c70SJohn Marino  unsigned long int x3u;         /* used to store ceil(x^3) */
4a238c70SJohn Marino  mpfr_t temp1, temp2;
4a238c70SJohn Marino  int test1, test2;
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Logging */
4a238c70SJohn Marino  MPFR_LOG_FUNC (
4a238c70SJohn Marino    ("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (x), mpfr_log_prec, x, rnd),
4a238c70SJohn Marino    ("y[%Pu]=%.*Rg", mpfr_get_prec (y), mpfr_log_prec, y) );
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Special cases */
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_IS_INF (x))
4a238c70SJohn Marino        return mpfr_set_ui (y, 0, rnd);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Save current exponents range */
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_ZERO (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_t y1, y2;
4a238c70SJohn Marino      prec = MPFR_PREC (y) + 3;
4a238c70SJohn Marino      mpfr_init2 (y1, prec);
4a238c70SJohn Marino      mpfr_init2 (y2, prec);
4a238c70SJohn Marino      MPFR_ZIV_INIT (loop, prec);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* ZIV loop */
4a238c70SJohn Marino      for (;;)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_gamma_one_and_two_third (y1, y2, prec); /* y2 = Gamma(2/3)(1 + delta1), |delta1| <= 2^{1-prec}. */
4a238c70SJohn Marino
4a238c70SJohn Marino          r = mpfr_set_ui (y1, 9, MPFR_RNDN);
4a238c70SJohn Marino          MPFR_ASSERTD (r == 0);
4a238c70SJohn Marino          mpfr_cbrt (y1, y1, MPFR_RNDN); /* y1 = cbrt(9)(1 + delta2), |delta2| <= 2^{-prec}. */
4a238c70SJohn Marino          mpfr_mul (y1, y1, y2, MPFR_RNDN);
4a238c70SJohn Marino          mpfr_ui_div (y1, 1, y1, MPFR_RNDN);
4a238c70SJohn Marino          if (MPFR_LIKELY (MPFR_CAN_ROUND (y1, prec - 3, MPFR_PREC (y), rnd)))
4a238c70SJohn Marino            break;
4a238c70SJohn Marino          MPFR_ZIV_NEXT (loop, prec);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      r = mpfr_set (y, y1, rnd);
4a238c70SJohn Marino      MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino      MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino      mpfr_clear (y1);
4a238c70SJohn Marino      mpfr_clear (y2);
4a238c70SJohn Marino      return mpfr_check_range (y, r, rnd);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* FIXME: underflow for large values of |x| ? */
4a238c70SJohn Marino
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Set initial precision */
4a238c70SJohn Marino  /* If we compute sum(i=0, N-1, t_i), the relative error is bounded by  */
4a238c70SJohn Marino  /*       2*(4N)*2^(1-wprec)*C(|x|)/Ai(x)                               */
4a238c70SJohn Marino  /* where C(|x|) = 1 if 0<=x<=1                                         */
4a238c70SJohn Marino  /*   and C(|x|) = (1/2)*x^(-1/4)*exp(2/3 x^(3/2))  if x >= 1           */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* A priori, we do not know N, so we estimate it to ~ prec             */
4a238c70SJohn Marino  /* If 0<=x<=1, we estimate Ai(x) ~ 1/8                                 */
4a238c70SJohn Marino  /* if 1<=x,    we estimate Ai(x) ~ (1/4)*x^(-1/4)*exp(-2/3 * x^(3/2))  */
4a238c70SJohn Marino  /* if x<=0,    ?????                                                   */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* We begin with 11 guard bits */
4a238c70SJohn Marino  prec = MPFR_PREC (y)+11;
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, prec);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* The working precision is heuristically chosen in order to obtain  */
4a238c70SJohn Marino  /* approximately prec correct bits in the sum. To sum up: the sum    */
4a238c70SJohn Marino  /* is stopped when the *exact* sum gives ~ prec correct bit. And     */
4a238c70SJohn Marino  /* when it is stopped, the accuracy of the computed sum, with respect*/
4a238c70SJohn Marino  /* to the exact one should be ~prec bits.                            */
4a238c70SJohn Marino  mpfr_init2 (tmp_sp, MPFR_SMALL_PRECISION);
4a238c70SJohn Marino  mpfr_init2 (tmp2_sp, MPFR_SMALL_PRECISION);
4a238c70SJohn Marino  mpfr_abs (tmp_sp, x, MPFR_RNDU);
4a238c70SJohn Marino  mpfr_pow_ui (tmp_sp, tmp_sp, 3, MPFR_RNDU);
4a238c70SJohn Marino  mpfr_sqrt (tmp_sp, tmp_sp, MPFR_RNDU); /* tmp_sp ~ x^3/2 */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* 0.96179669392597567 >~ 2/3 * log2(e). See algorithms.tex */
4a238c70SJohn Marino  mpfr_set_str (tmp2_sp, "0.96179669392597567", 10, MPFR_RNDU);
4a238c70SJohn Marino  mpfr_mul (tmp2_sp, tmp_sp, tmp2_sp, MPFR_RNDU);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* cond represents the number of lost bits in the evaluation of the sum */
4a238c70SJohn Marino  if ( (MPFR_IS_ZERO (x)) || (MPFR_GET_EXP (x) <= 0) )
4a238c70SJohn Marino    cond = 0;
4a238c70SJohn Marino  else
4a238c70SJohn Marino    cond = mpfr_get_ui (tmp2_sp, MPFR_RNDU) - (MPFR_GET_EXP (x)-1)/4 - 1;
4a238c70SJohn Marino
4a238c70SJohn Marino  /* The variable assumed_exponent is used to store the maximal assumed */
4a238c70SJohn Marino  /* exponent of Ai(x). More precisely, we assume that |Ai(x)| will be  */
4a238c70SJohn Marino  /* greater than 2^{-assumed_exponent}.                                */
4a238c70SJohn Marino  if (MPFR_IS_ZERO (x))
4a238c70SJohn Marino    assumed_exponent = 2;
4a238c70SJohn Marino  else
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_POS (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (MPFR_GET_EXP (x) <= 0)
4a238c70SJohn Marino            assumed_exponent = 3;
4a238c70SJohn Marino          else
4a238c70SJohn Marino            assumed_exponent = (2 + (MPFR_GET_EXP (x)/4 + 1)
4a238c70SJohn Marino                                + mpfr_get_ui (tmp2_sp, MPFR_RNDU));
4a238c70SJohn Marino        }
4a238c70SJohn Marino      /* We do not know Ai (x) yet */
4a238c70SJohn Marino      /* We cover the case when EXP (Ai (x))>=-10 */
4a238c70SJohn Marino      else
4a238c70SJohn Marino        assumed_exponent = 10;
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  wprec = prec + MPFR_INT_CEIL_LOG2 (prec) + 5 + cond + assumed_exponent;
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init (ti);
4a238c70SJohn Marino  mpfr_init (tip1);
4a238c70SJohn Marino  mpfr_init (temp1);
4a238c70SJohn Marino  mpfr_init (temp2);
4a238c70SJohn Marino  mpfr_init (x3);
4a238c70SJohn Marino  mpfr_init (s);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* ZIV loop */
4a238c70SJohn Marino  for (;;)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      MPFR_LOG_MSG (("Working precision: %Pu\n", wprec));
4a238c70SJohn Marino      mpfr_set_prec (ti, wprec);
4a238c70SJohn Marino      mpfr_set_prec (tip1, wprec);
4a238c70SJohn Marino      mpfr_set_prec (x3, wprec);
4a238c70SJohn Marino      mpfr_set_prec (s, wprec);
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_sqr (x3, x, MPFR_RNDU);
4a238c70SJohn Marino      mpfr_mul (x3, x3, x, (MPFR_IS_POS (x)?MPFR_RNDU:MPFR_RNDD));  /* x3=x^3 */
4a238c70SJohn Marino      if (MPFR_IS_NEG (x))
4a238c70SJohn Marino        MPFR_CHANGE_SIGN (x3);
4a238c70SJohn Marino      x3u = mpfr_get_ui (x3, MPFR_RNDU);   /* x3u >= ceil(x^3) */
4a238c70SJohn Marino      if (MPFR_IS_NEG (x))
4a238c70SJohn Marino        MPFR_CHANGE_SIGN (x3);
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_gamma_one_and_two_third (temp1, temp2, wprec);
4a238c70SJohn Marino      mpfr_set_ui (ti, 9, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_cbrt (ti, ti, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_mul (ti, ti, temp2, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_ui_div (ti, 1, ti , MPFR_RNDN); /* ti = 1/( Gamma (2/3)*9^(1/3) ) */
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_set_ui (tip1, 3, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_cbrt (tip1, tip1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_mul (tip1, tip1, temp1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_neg (tip1, tip1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_div (tip1, x, tip1, MPFR_RNDN); /* tip1 = -x/(Gamma (1/3)*3^(1/3)) */
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_add (s, ti, tip1, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino
4a238c70SJohn Marino      /* Evaluation of the series */
4a238c70SJohn Marino      k = 2;
4a238c70SJohn Marino      for (;;)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_mul (ti, ti, x3, MPFR_RNDN);
4a238c70SJohn Marino          mpfr_mul (tip1, tip1, x3, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino          mpfr_div_ui2 (ti, ti, k, (k+1), MPFR_RNDN);
4a238c70SJohn Marino          mpfr_div_ui2 (tip1, tip1, (k+1), (k+2), MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino          k += 3;
4a238c70SJohn Marino          mpfr_add (s, s, ti, MPFR_RNDN);
4a238c70SJohn Marino          mpfr_add (s, s, tip1, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino          /* FIXME: if s==0 */
4a238c70SJohn Marino          test1 = MPFR_IS_ZERO (ti)
4a238c70SJohn Marino            || (MPFR_GET_EXP (ti) + (mpfr_exp_t)prec + 3 <= MPFR_GET_EXP (s));
4a238c70SJohn Marino          test2 = MPFR_IS_ZERO (tip1)
4a238c70SJohn Marino            || (MPFR_GET_EXP (tip1) + (mpfr_exp_t)prec + 3 <= MPFR_GET_EXP (s));
4a238c70SJohn Marino
4a238c70SJohn Marino          if ( test1 && test2 && (x3u <= k*(k+1)/2) )
4a238c70SJohn Marino            break; /* FIXME: if k*(k+1) overflows */
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      MPFR_LOG_MSG (("Truncation rank: %lu\n", k));
4a238c70SJohn Marino
4a238c70SJohn Marino      err = 4 + MPFR_INT_CEIL_LOG2 (k) + cond - MPFR_GET_EXP (s);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* err is the number of bits lost due to the evaluation error */
4a238c70SJohn Marino      /* wprec-(prec+1): number of bits lost due to the approximation error */
4a238c70SJohn Marino      MPFR_LOG_MSG (("Roundoff error: %Pu\n", err));
4a238c70SJohn Marino      MPFR_LOG_MSG (("Approxim error: %Pu\n", wprec-prec-1));
4a238c70SJohn Marino
4a238c70SJohn Marino      if (wprec < err+1)
4a238c70SJohn Marino        correct_bits=0;
4a238c70SJohn Marino      else
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (wprec < err+prec+1)
4a238c70SJohn Marino            correct_bits =  wprec - err - 1;
4a238c70SJohn Marino          else
4a238c70SJohn Marino            correct_bits = prec;
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      if (MPFR_LIKELY (MPFR_CAN_ROUND (s, correct_bits, MPFR_PREC (y), rnd)))
4a238c70SJohn Marino        break;
4a238c70SJohn Marino
4a238c70SJohn Marino      if (correct_bits == 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          assumed_exponent *= 2;
4a238c70SJohn Marino          MPFR_LOG_MSG (("Not a single bit correct (assumed_exponent=%lu)\n",
4a238c70SJohn Marino                         assumed_exponent));
4a238c70SJohn Marino          wprec = prec + 5 + MPFR_INT_CEIL_LOG2 (k) + cond + assumed_exponent;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (correct_bits < prec)
4a238c70SJohn Marino            { /* The precision was badly chosen */
4a238c70SJohn Marino              MPFR_LOG_MSG (("Bad assumption on the exponent of Ai(x)", 0));
4a238c70SJohn Marino              MPFR_LOG_MSG ((" (E=%ld)\n", (long) MPFR_GET_EXP (s)));
4a238c70SJohn Marino              wprec = prec + err + 1;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            { /* We are really in a bad case of the TMD */
4a238c70SJohn Marino              MPFR_ZIV_NEXT (loop, prec);
4a238c70SJohn Marino
4a238c70SJohn Marino              /* We update wprec */
4a238c70SJohn Marino              /* We assume that K will not be multiplied by more than 4 */
4a238c70SJohn Marino              wprec = prec + (MPFR_INT_CEIL_LOG2 (k)+2) + 5 + cond
4a238c70SJohn Marino                - MPFR_GET_EXP (s);
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino    } /* End of ZIV loop */
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  r = mpfr_set (y, s, rnd);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_clear (ti);
4a238c70SJohn Marino  mpfr_clear (tip1);
4a238c70SJohn Marino  mpfr_clear (temp1);
4a238c70SJohn Marino  mpfr_clear (temp2);
4a238c70SJohn Marino  mpfr_clear (x3);
4a238c70SJohn Marino  mpfr_clear (s);
4a238c70SJohn Marino  mpfr_clear (tmp_sp);
4a238c70SJohn Marino  mpfr_clear (tmp2_sp);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino  return mpfr_check_range (y, r, rnd);
4a238c70SJohn Marino}
4a238c70SJohn Marino
4a238c70SJohn Marino
4a238c70SJohn Marino/* Airy function Ai evaluated by Smith algorithm */
4a238c70SJohn Marinostatic int
4a238c70SJohn Marinompfr_ai2 (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino  mpfr_prec_t wprec;             /* working precision */
4a238c70SJohn Marino  mpfr_prec_t prec;              /* target precision */
4a238c70SJohn Marino  mpfr_prec_t err;               /* used to estimate the evaluation error */
4a238c70SJohn Marino  mpfr_prec_t correctBits;       /* estimates the number of correct bits*/
4a238c70SJohn Marino  unsigned long int i, j, L, t;
4a238c70SJohn Marino  unsigned long int cond;        /* condition number of the series */
4a238c70SJohn Marino  unsigned long int assumed_exponent; /* used as a lowerbound of |EXP(Ai(x))| */
4a238c70SJohn Marino  int r;                         /* returned ternary value */
4a238c70SJohn Marino  mpfr_t s;                      /* used to store the partial sum */
4a238c70SJohn Marino  mpfr_t u0, u1;
4a238c70SJohn Marino  mpfr_t *z;                     /* used to store the (x^3j) */
4a238c70SJohn Marino  mpfr_t result;
4a238c70SJohn Marino  mpfr_t tmp_sp, tmp2_sp;        /* small precision variables */
4a238c70SJohn Marino  unsigned long int x3u;         /* used to store ceil (x^3) */
4a238c70SJohn Marino  mpfr_t temp1, temp2;
4a238c70SJohn Marino  int test0, test1;
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Logging */
4a238c70SJohn Marino  MPFR_LOG_FUNC (
4a238c70SJohn Marino    ("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (x),  mpfr_log_prec, x, rnd),
4a238c70SJohn Marino    ("y[%Pu]=%.*Rg", mpfr_get_prec (y), mpfr_log_prec, y));
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Special cases */
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_IS_INF (x))
4a238c70SJohn Marino        return mpfr_set_ui (y, 0, rnd);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Save current exponents range */
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* FIXME: underflow for large values of |x| */
4a238c70SJohn Marino
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Set initial precision */
4a238c70SJohn Marino  /* See the analysis for the naive evaluation */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* We begin with 11 guard bits */
4a238c70SJohn Marino  prec = MPFR_PREC (y) + 11;
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, prec);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (tmp_sp, MPFR_SMALL_PRECISION);
4a238c70SJohn Marino  mpfr_init2 (tmp2_sp, MPFR_SMALL_PRECISION);
4a238c70SJohn Marino  mpfr_abs (tmp_sp, x, MPFR_RNDU);
4a238c70SJohn Marino  mpfr_pow_ui (tmp_sp, tmp_sp, 3, MPFR_RNDU);
4a238c70SJohn Marino  mpfr_sqrt (tmp_sp, tmp_sp, MPFR_RNDU); /* tmp_sp ~ x^3/2 */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* 0.96179669392597567 >~ 2/3 * log2(e). See algorithms.tex */
4a238c70SJohn Marino  mpfr_set_str (tmp2_sp, "0.96179669392597567", 10, MPFR_RNDU);
4a238c70SJohn Marino  mpfr_mul (tmp2_sp, tmp_sp, tmp2_sp, MPFR_RNDU);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* cond represents the number of lost bits in the evaluation of the sum */
4a238c70SJohn Marino  if ( (MPFR_IS_ZERO (x)) || (MPFR_GET_EXP (x) <= 0) )
4a238c70SJohn Marino    cond = 0;
4a238c70SJohn Marino  else
4a238c70SJohn Marino    cond = mpfr_get_ui (tmp2_sp, MPFR_RNDU) - (MPFR_GET_EXP (x) - 1)/4 - 1;
4a238c70SJohn Marino
4a238c70SJohn Marino  /* This variable is used to store the maximal assumed exponent of       */
4a238c70SJohn Marino  /* Ai (x). More precisely, we assume that |Ai (x)| will be greater than */
4a238c70SJohn Marino  /* 2^{-assumedExp}.                                                     */
4a238c70SJohn Marino  if (MPFR_IS_ZERO (x))
4a238c70SJohn Marino    assumed_exponent = 2;
4a238c70SJohn Marino  else
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_POS (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (MPFR_GET_EXP (x) <= 0)
4a238c70SJohn Marino            assumed_exponent = 3;
4a238c70SJohn Marino          else
4a238c70SJohn Marino            assumed_exponent = (2 + (MPFR_GET_EXP (x)/4 + 1)
4a238c70SJohn Marino                                + mpfr_get_ui (tmp2_sp, MPFR_RNDU));
4a238c70SJohn Marino        }
4a238c70SJohn Marino      /* We do not know Ai (x) yet */
4a238c70SJohn Marino      /* We cover the case when EXP (Ai (x))>=-10 */
4a238c70SJohn Marino      else
4a238c70SJohn Marino        assumed_exponent = 10;
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  wprec = prec + MPFR_INT_CEIL_LOG2 (prec) + 6 + cond + assumed_exponent;
4a238c70SJohn Marino
4a238c70SJohn Marino  /* We assume that the truncation rank will be ~ prec */
4a238c70SJohn Marino  L = __gmpfr_isqrt (prec);
4a238c70SJohn Marino  MPFR_LOG_MSG (("size of blocks L = %lu\n", L));
4a238c70SJohn Marino
4a238c70SJohn Marino  z = (mpfr_t *) (*__gmp_allocate_func) ( (L + 1) * sizeof (mpfr_t) );
4a238c70SJohn Marino  MPFR_ASSERTN (z != NULL);
4a238c70SJohn Marino  for (j=0; j<=L; j++)
4a238c70SJohn Marino    mpfr_init (z[j]);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init (s);
4a238c70SJohn Marino  mpfr_init (u0); mpfr_init (u1);
4a238c70SJohn Marino  mpfr_init (result);
4a238c70SJohn Marino  mpfr_init (temp1);
4a238c70SJohn Marino  mpfr_init (temp2);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* ZIV loop */
4a238c70SJohn Marino  for (;;)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      MPFR_LOG_MSG (("working precision: %Pu\n", wprec));
4a238c70SJohn Marino
4a238c70SJohn Marino      for (j=0; j<=L; j++)
4a238c70SJohn Marino        mpfr_set_prec (z[j], wprec);
4a238c70SJohn Marino      mpfr_set_prec (s, wprec);
4a238c70SJohn Marino      mpfr_set_prec (u0, wprec); mpfr_set_prec (u1, wprec);
4a238c70SJohn Marino      mpfr_set_prec (result, wprec);
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_set_ui (u0, 1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_set (u1, x, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_set_ui (z[0], 1, MPFR_RNDU);
4a238c70SJohn Marino      mpfr_sqr (z[1], u1, MPFR_RNDU);
4a238c70SJohn Marino      mpfr_mul (z[1], z[1], x, (MPFR_IS_POS (x) ? MPFR_RNDU : MPFR_RNDD) );
4a238c70SJohn Marino
4a238c70SJohn Marino      if (MPFR_IS_NEG (x))
4a238c70SJohn Marino        MPFR_CHANGE_SIGN (z[1]);
4a238c70SJohn Marino      x3u = mpfr_get_ui (z[1], MPFR_RNDU);   /* x3u >= ceil (x^3) */
4a238c70SJohn Marino      if (MPFR_IS_NEG (x))
4a238c70SJohn Marino        MPFR_CHANGE_SIGN (z[1]);
4a238c70SJohn Marino
4a238c70SJohn Marino      for (j=2; j<=L ;j++)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (j%2 == 0)
4a238c70SJohn Marino            mpfr_sqr (z[j], z[j/2], MPFR_RNDN);
4a238c70SJohn Marino          else
4a238c70SJohn Marino            mpfr_mul (z[j], z[j-1], z[1], MPFR_RNDN);
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_gamma_one_and_two_third (temp1, temp2, wprec);
4a238c70SJohn Marino      mpfr_set_ui (u0, 9, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_cbrt (u0, u0, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_mul (u0, u0, temp2, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_ui_div (u0, 1, u0 , MPFR_RNDN); /* u0 = 1/( Gamma (2/3)*9^(1/3) ) */
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_set_ui (u1, 3, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_cbrt (u1, u1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_mul (u1, u1, temp1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_neg (u1, u1, MPFR_RNDN);
4a238c70SJohn Marino      mpfr_div (u1, x, u1, MPFR_RNDN); /* u1 = -x/(Gamma (1/3)*3^(1/3)) */
4a238c70SJohn Marino
4a238c70SJohn Marino      mpfr_set_ui (result, 0, MPFR_RNDN);
4a238c70SJohn Marino      t = 0;
4a238c70SJohn Marino
4a238c70SJohn Marino      /* Evaluation of the series by Smith' method    */
4a238c70SJohn Marino      for (i=0; ; i++)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          t += 3 * L;
4a238c70SJohn Marino
4a238c70SJohn Marino          /* k = 0 */
4a238c70SJohn Marino          t -= 3;
4a238c70SJohn Marino          mpfr_set (s, z[L-1], MPFR_RNDN);
4a238c70SJohn Marino          for (j=L-2; ; j--)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              t -= 3;
4a238c70SJohn Marino              mpfr_div_ui2 (s, s, (t+2), (t+3), MPFR_RNDN);
4a238c70SJohn Marino              mpfr_add (s, s, z[j], MPFR_RNDN);
4a238c70SJohn Marino              if (j==0)
4a238c70SJohn Marino                break;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          mpfr_mul (s, s, u0, MPFR_RNDN);
4a238c70SJohn Marino          mpfr_add (result, result, s, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino          mpfr_mul (u0, u0, z[L], MPFR_RNDN);
4a238c70SJohn Marino          for (j=0; j<=L-1; j++)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_div_ui2 (u0, u0, (t + 2), (t + 3), MPFR_RNDN);
4a238c70SJohn Marino              t += 3;
4a238c70SJohn Marino            }
4a238c70SJohn Marino
4a238c70SJohn Marino          t++;
4a238c70SJohn Marino
4a238c70SJohn Marino          /* k = 1 */
4a238c70SJohn Marino          t -= 3;
4a238c70SJohn Marino          mpfr_set (s, z[L-1], MPFR_RNDN);
4a238c70SJohn Marino          for (j=L-2; ; j--)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              t -= 3;
4a238c70SJohn Marino              mpfr_div_ui2 (s, s, (t + 2), (t + 3), MPFR_RNDN);
4a238c70SJohn Marino              mpfr_add (s, s, z[j], MPFR_RNDN);
4a238c70SJohn Marino              if (j==0)
4a238c70SJohn Marino                break;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          mpfr_mul (s, s, u1, MPFR_RNDN);
4a238c70SJohn Marino          mpfr_add (result, result, s, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino          mpfr_mul (u1, u1, z[L], MPFR_RNDN);
4a238c70SJohn Marino          for (j=0; j<=L-1; j++)
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_div_ui2 (u1, u1, (t + 2), (t + 3), MPFR_RNDN);
4a238c70SJohn Marino              t += 3;
4a238c70SJohn Marino            }
4a238c70SJohn Marino
4a238c70SJohn Marino          t++;
4a238c70SJohn Marino
4a238c70SJohn Marino          /* k = 2 */
4a238c70SJohn Marino          t++;
4a238c70SJohn Marino
4a238c70SJohn Marino          /* End of the loop over k */
4a238c70SJohn Marino          t -= 3;
4a238c70SJohn Marino
4a238c70SJohn Marino          test0 = MPFR_IS_ZERO (u0) ||
4a238c70SJohn Marino            MPFR_GET_EXP (u0) + (mpfr_exp_t)prec + 4 <= MPFR_GET_EXP (result);
4a238c70SJohn Marino          test1 = MPFR_IS_ZERO (u1) ||
4a238c70SJohn Marino            MPFR_GET_EXP (u1) + (mpfr_exp_t)prec + 4 <= MPFR_GET_EXP (result);
4a238c70SJohn Marino
4a238c70SJohn Marino          if ( test0 && test1 && (x3u <= (t + 2) * (t + 3) / 2) )
4a238c70SJohn Marino            break;
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      MPFR_LOG_MSG (("Truncation rank: %lu\n", t));
4a238c70SJohn Marino
4a238c70SJohn Marino      err = (5 + MPFR_INT_CEIL_LOG2 (L+1) + MPFR_INT_CEIL_LOG2 (i+1)
4a238c70SJohn Marino             + cond - MPFR_GET_EXP (result));
4a238c70SJohn Marino
4a238c70SJohn Marino      /* err is the number of bits lost due to the evaluation error */
4a238c70SJohn Marino      /* wprec-(prec+1): number of bits lost due to the approximation error */
4a238c70SJohn Marino      MPFR_LOG_MSG (("Roundoff error: %Pu\n", err));
4a238c70SJohn Marino      MPFR_LOG_MSG (("Approxim error: %Pu\n", wprec - prec - 1));
4a238c70SJohn Marino
4a238c70SJohn Marino      if (wprec < err+1)
4a238c70SJohn Marino        correctBits = 0;
4a238c70SJohn Marino      else
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (wprec < err+prec+1)
4a238c70SJohn Marino            correctBits = wprec - err - 1;
4a238c70SJohn Marino          else
4a238c70SJohn Marino            correctBits = prec;
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      if (MPFR_LIKELY (MPFR_CAN_ROUND (result, correctBits,
4a238c70SJohn Marino                                       MPFR_PREC (y), rnd)))
4a238c70SJohn Marino        break;
4a238c70SJohn Marino
4a238c70SJohn Marino      for (j=0; j<=L; j++)
4a238c70SJohn Marino        mpfr_clear (z[j]);
4a238c70SJohn Marino      (*__gmp_free_func) (z, (L + 1) * sizeof (mpfr_t));
4a238c70SJohn Marino      L = __gmpfr_isqrt (t);
4a238c70SJohn Marino      MPFR_LOG_MSG (("size of blocks L = %lu\n", L));
4a238c70SJohn Marino      z = (mpfr_t *) (*__gmp_allocate_func) ( (L + 1) * sizeof (mpfr_t));
4a238c70SJohn Marino      MPFR_ASSERTN (z != NULL);
4a238c70SJohn Marino      for (j=0; j<=L; j++)
4a238c70SJohn Marino        mpfr_init (z[j]);
4a238c70SJohn Marino
4a238c70SJohn Marino      if (correctBits == 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          assumed_exponent *= 2;
4a238c70SJohn Marino          MPFR_LOG_MSG (("Not a single bit correct (assumed_exponent=%lu)\n",
4a238c70SJohn Marino                         assumed_exponent));
4a238c70SJohn Marino          wprec = prec + 6 + MPFR_INT_CEIL_LOG2 (t) + cond + assumed_exponent;
4a238c70SJohn Marino        }
4a238c70SJohn Marino    else
4a238c70SJohn Marino      {
4a238c70SJohn Marino        if (correctBits < prec)
4a238c70SJohn Marino          { /* The precision was badly chosen */
4a238c70SJohn Marino            MPFR_LOG_MSG (("Bad assumption on the exponent of Ai (x)", 0));
4a238c70SJohn Marino            MPFR_LOG_MSG ((" (E=%ld)\n", (long) (MPFR_GET_EXP (result))));
4a238c70SJohn Marino            wprec = prec + err + 1;
4a238c70SJohn Marino          }
4a238c70SJohn Marino        else
4a238c70SJohn Marino          { /* We are really in a bad case of the TMD */
4a238c70SJohn Marino            MPFR_ZIV_NEXT (loop, prec);
4a238c70SJohn Marino
4a238c70SJohn Marino            /* We update wprec */
4a238c70SJohn Marino            /* We assume that t will not be multiplied by more than 4 */
4a238c70SJohn Marino            wprec = (prec + (MPFR_INT_CEIL_LOG2 (t) + 2) + 6 + cond
4a238c70SJohn Marino                     - MPFR_GET_EXP (result));
4a238c70SJohn Marino          }
4a238c70SJohn Marino      }
4a238c70SJohn Marino    } /* End of ZIV loop */
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  r = mpfr_set (y, result, rnd);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_clear (tmp_sp);
4a238c70SJohn Marino  mpfr_clear (tmp2_sp);
4a238c70SJohn Marino  for (j=0; j<=L; j++)
4a238c70SJohn Marino    mpfr_clear (z[j]);
4a238c70SJohn Marino  (*__gmp_free_func) (z, (L + 1) * sizeof (mpfr_t));
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_clear (s);
4a238c70SJohn Marino  mpfr_clear (u0); mpfr_clear (u1);
4a238c70SJohn Marino  mpfr_clear (result);
4a238c70SJohn Marino  mpfr_clear (temp1);
4a238c70SJohn Marino  mpfr_clear (temp2);
4a238c70SJohn Marino
4a238c70SJohn Marino  return r;
4a238c70SJohn Marino}
4a238c70SJohn Marino
/* We consider that the boundary between the area where the naive method
   should preferably be used and the area where Smith's method should
   preferably be used has the following form:
   it is a triangle defined by two lines (one for the negative values of x,
   and one for the positive values of x) crossing at x=0.

   More precisely,

   * If x<0 and MPFR_AI_THRESHOLD1*x + MPFR_AI_THRESHOLD2*prec > MPFR_AI_SCALE,
   use Smith's algorithm;
   * If x>=0 and MPFR_AI_THRESHOLD3*x + MPFR_AI_THRESHOLD2*prec > MPFR_AI_SCALE,
   use Smith's algorithm;
   * otherwise, use the naive method.
*/
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_AI_SCALE 1048576
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_ai (mpfr_ptr y, mpfr_srcptr x, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mpfr_t temp1, temp2;
4a238c70SJohn Marino  int use_ai2;
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* The exponent range must be large enough for the computation of temp1. */
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (temp1, MPFR_SMALL_PRECISION);
4a238c70SJohn Marino  mpfr_init2 (temp2, MPFR_SMALL_PRECISION);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_set (temp1, x, MPFR_RNDN);
4a238c70SJohn Marino  mpfr_set_si (temp2, MPFR_AI_THRESHOLD2, MPFR_RNDN);
4a238c70SJohn Marino  mpfr_mul_ui (temp2, temp2, MPFR_PREC (y) > ULONG_MAX ?
4a238c70SJohn Marino               ULONG_MAX : (unsigned long) MPFR_PREC (y), MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_IS_NEG (x))
4a238c70SJohn Marino      mpfr_mul_si (temp1, temp1, MPFR_AI_THRESHOLD1, MPFR_RNDN);
4a238c70SJohn Marino  else
4a238c70SJohn Marino      mpfr_mul_si (temp1, temp1, MPFR_AI_THRESHOLD3, MPFR_RNDN);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_add (temp1, temp1, temp2, MPFR_RNDN);
4a238c70SJohn Marino  mpfr_clear (temp2);
4a238c70SJohn Marino
4a238c70SJohn Marino  use_ai2 = mpfr_cmp_si (temp1, MPFR_AI_SCALE) > 0;
4a238c70SJohn Marino  mpfr_clear (temp1);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo); /* Ignore all previous exceptions. */
4a238c70SJohn Marino
4a238c70SJohn Marino  return use_ai2 ? mpfr_ai2 (y, x, rnd) : mpfr_ai1 (y, x, rnd);
4a238c70SJohn Marino}