mpfr/src/mpn_exp.c

/* mpfr_mpn_exp -- auxiliary function for mpfr_get_str and mpfr_set_str

Copyright 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
4a238c70SJohn Marino/* this function computes an approximation of b^e in {a, n}, with exponent
4a238c70SJohn Marino   stored in exp_r. The computed value is rounded toward zero (truncated).
4a238c70SJohn Marino   It returns an integer f such that the final error is bounded by 2^f ulps,
4a238c70SJohn Marino   that is:
4a238c70SJohn Marino   a*2^exp_r <= b^e <= 2^exp_r (a + 2^f),
4a238c70SJohn Marino   where a represents {a, n}, i.e. the integer
4a238c70SJohn Marino   a[0] + a[1]*B + ... + a[n-1]*B^(n-1) where B=2^GMP_NUMB_BITS
4a238c70SJohn Marino
4a238c70SJohn Marino   Return -1 is the result is exact.
4a238c70SJohn Marino   Return -2 if an overflow occurred in the computation of exp_r.
4a238c70SJohn Marino*/
4a238c70SJohn Marino
4a238c70SJohn Marinolong
4a238c70SJohn Marinompfr_mpn_exp (mp_limb_t *a, mpfr_exp_t *exp_r, int b, mpfr_exp_t e, size_t n)
4a238c70SJohn Marino{
4a238c70SJohn Marino  mp_limb_t *c, B;
4a238c70SJohn Marino  mpfr_exp_t f, h;
4a238c70SJohn Marino  int i;
4a238c70SJohn Marino  unsigned long t; /* number of bits in e */
4a238c70SJohn Marino  unsigned long bits;
4a238c70SJohn Marino  size_t n1;
4a238c70SJohn Marino  unsigned int error;           /* (number - 1) of loop a^2b inexact */
4a238c70SJohn Marino                                 /* error == t means no error */
4a238c70SJohn Marino  int err_s_a2 = 0;
4a238c70SJohn Marino  int err_s_ab = 0;              /* number of error when shift A^2, AB */
4a238c70SJohn Marino  MPFR_TMP_DECL(marker);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ASSERTN(e > 0);
4a238c70SJohn Marino  MPFR_ASSERTN((2 <= b) && (b <= 62));
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_TMP_MARK(marker);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* initialization of a, b, f, h */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* normalize the base */
4a238c70SJohn Marino  B = (mp_limb_t) b;
4a238c70SJohn Marino  count_leading_zeros (h, B);
4a238c70SJohn Marino
4a238c70SJohn Marino  bits = GMP_NUMB_BITS - h;
4a238c70SJohn Marino
4a238c70SJohn Marino  B = B << h;
4a238c70SJohn Marino  h = - h;
4a238c70SJohn Marino
4a238c70SJohn Marino  /* allocate space for A and set it to B */
4a238c70SJohn Marino  c = MPFR_TMP_LIMBS_ALLOC (2 * n);
4a238c70SJohn Marino  a [n - 1] = B;
4a238c70SJohn Marino  MPN_ZERO (a, n - 1);
4a238c70SJohn Marino  /* initial exponent for A: invariant is A = {a, n} * 2^f */
4a238c70SJohn Marino  f = h - (n - 1) * GMP_NUMB_BITS;
4a238c70SJohn Marino
4a238c70SJohn Marino  /* determine number of bits in e */
4a238c70SJohn Marino  count_leading_zeros (t, (mp_limb_t) e);
4a238c70SJohn Marino
4a238c70SJohn Marino  t = GMP_NUMB_BITS - t; /* number of bits of exponent e */
4a238c70SJohn Marino
4a238c70SJohn Marino  error = t; /* error <= GMP_NUMB_BITS */
4a238c70SJohn Marino
4a238c70SJohn Marino  MPN_ZERO (c, 2 * n);
4a238c70SJohn Marino
4a238c70SJohn Marino  for (i = t - 2; i >= 0; i--)
4a238c70SJohn Marino    {
4a238c70SJohn Marino
4a238c70SJohn Marino      /* determine precision needed */
4a238c70SJohn Marino      bits = n * GMP_NUMB_BITS - mpn_scan1 (a, 0);
4a238c70SJohn Marino      n1 = (n * GMP_NUMB_BITS - bits) / GMP_NUMB_BITS;
4a238c70SJohn Marino
4a238c70SJohn Marino      /* square of A : {c+2n1, 2(n-n1)} = {a+n1, n-n1}^2 */
4a238c70SJohn Marino      mpn_sqr_n (c + 2 * n1, a + n1, n - n1);
4a238c70SJohn Marino
4a238c70SJohn Marino      /* set {c+n, 2n1-n} to 0 : {c, n} = {a, n}^2*K^n */
4a238c70SJohn Marino
4a238c70SJohn Marino      /* check overflow on f */
4a238c70SJohn Marino      if (MPFR_UNLIKELY(f < MPFR_EXP_MIN/2 || f > MPFR_EXP_MAX/2))
4a238c70SJohn Marino        {
4a238c70SJohn Marino        overflow:
4a238c70SJohn Marino          MPFR_TMP_FREE(marker);
4a238c70SJohn Marino          return -2;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      /* FIXME: Could f = 2*f + n * GMP_NUMB_BITS be used? */
4a238c70SJohn Marino      f = 2*f;
4a238c70SJohn Marino      MPFR_SADD_OVERFLOW (f, f, n * GMP_NUMB_BITS,
4a238c70SJohn Marino                          mpfr_exp_t, mpfr_uexp_t,
4a238c70SJohn Marino                          MPFR_EXP_MIN, MPFR_EXP_MAX,
4a238c70SJohn Marino                          goto overflow, goto overflow);
4a238c70SJohn Marino      if ((c[2*n - 1] & MPFR_LIMB_HIGHBIT) == 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* shift A by one bit to the left */
4a238c70SJohn Marino          mpn_lshift (a, c + n, n, 1);
4a238c70SJohn Marino          a[0] |= mpn_lshift (c + n - 1, c + n - 1, 1, 1);
4a238c70SJohn Marino          f --;
4a238c70SJohn Marino          if (error != t)
4a238c70SJohn Marino            err_s_a2 ++;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else
4a238c70SJohn Marino        MPN_COPY (a, c + n, n);
4a238c70SJohn Marino
4a238c70SJohn Marino      if ((error == t) && (2 * n1 <= n) &&
4a238c70SJohn Marino          (mpn_scan1 (c + 2 * n1, 0) < (n - 2 * n1) * GMP_NUMB_BITS))
4a238c70SJohn Marino        error = i;
4a238c70SJohn Marino
4a238c70SJohn Marino      if (e & ((mpfr_exp_t) 1 << i))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* multiply A by B */
4a238c70SJohn Marino          c[2 * n - 1] = mpn_mul_1 (c + n - 1, a, n, B);
4a238c70SJohn Marino          f += h + GMP_NUMB_BITS;
4a238c70SJohn Marino          if ((c[2 * n - 1] & MPFR_LIMB_HIGHBIT) == 0)
4a238c70SJohn Marino            { /* shift A by one bit to the left */
4a238c70SJohn Marino              mpn_lshift (a, c + n, n, 1);
4a238c70SJohn Marino              a[0] |= mpn_lshift (c + n - 1, c + n - 1, 1, 1);
4a238c70SJohn Marino              f --;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              MPN_COPY (a, c + n, n);
4a238c70SJohn Marino              if (error != t)
4a238c70SJohn Marino                err_s_ab ++;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          if ((error == t) && (c[n - 1] != 0))
4a238c70SJohn Marino            error = i;
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_TMP_FREE(marker);
4a238c70SJohn Marino
4a238c70SJohn Marino  *exp_r = f;
4a238c70SJohn Marino
4a238c70SJohn Marino  if (error == t)
4a238c70SJohn Marino    return -1; /* result is exact */
4a238c70SJohn Marino  else /* error <= t-2 <= GMP_NUMB_BITS-2
4a238c70SJohn Marino          err_s_ab, err_s_a2 <= t-1       */
4a238c70SJohn Marino    {
4a238c70SJohn Marino      /* if there are p loops after the first inexact result, with
4a238c70SJohn Marino         j shifts in a^2 and l shifts in a*b, then the final error is
4a238c70SJohn Marino         at most 2^(p+ceil((j+1)/2)+l+1)*ulp(res).
4a238c70SJohn Marino         This is bounded by 2^(5/2*t-1/2) where t is the number of bits of e.
4a238c70SJohn Marino      */
4a238c70SJohn Marino      error = error + err_s_ab + err_s_a2 / 2 + 3; /* <= 5t/2-1/2 */
4a238c70SJohn Marino#if 0
4a238c70SJohn Marino      if ((error - 1) >= ((n * GMP_NUMB_BITS - 1) / 2))
4a238c70SJohn Marino        error = n * GMP_NUMB_BITS; /* result is completely wrong:
4a238c70SJohn Marino                                         this is very unlikely since error is
4a238c70SJohn Marino                                         at most 5/2*log_2(e), and
4a238c70SJohn Marino                                         n * GMP_NUMB_BITS is at least
4a238c70SJohn Marino                                         3*log_2(e) */
4a238c70SJohn Marino#endif
4a238c70SJohn Marino      return error;
4a238c70SJohn Marino    }
4a238c70SJohn Marino}