mpfr/src/pow_ui.c

/* mpfr_pow_ui -- compute the power of a floating-point number
                  by a machine integer

Copyright 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
4a238c70SJohn Marino/* sets y to x^n, and return 0 if exact, non-zero otherwise */
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_pow_ui (mpfr_ptr y, mpfr_srcptr x, unsigned long int n, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  unsigned long m;
4a238c70SJohn Marino  mpfr_t res;
4a238c70SJohn Marino  mpfr_prec_t prec, err;
4a238c70SJohn Marino  int inexact;
4a238c70SJohn Marino  mpfr_rnd_t rnd1;
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino  MPFR_BLOCK_DECL (flags);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg n=%lu rnd=%d",
4a238c70SJohn Marino      mpfr_get_prec (x), mpfr_log_prec, x, n, rnd),
4a238c70SJohn Marino     ("y[%Pu]=%.*Rg inexact=%d",
4a238c70SJohn Marino      mpfr_get_prec (y), mpfr_log_prec, y, inexact));
4a238c70SJohn Marino
4a238c70SJohn Marino  /* x^0 = 1 for any x, even a NaN */
4a238c70SJohn Marino  if (MPFR_UNLIKELY (n == 0))
4a238c70SJohn Marino    return mpfr_set_ui (y, 1, rnd);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_NAN (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (y);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_IS_INF (x))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* Inf^n = Inf, (-Inf)^n = Inf for n even, -Inf for n odd */
4a238c70SJohn Marino          if (MPFR_IS_NEG (x) && (n & 1) == 1)
4a238c70SJohn Marino            MPFR_SET_NEG (y);
4a238c70SJohn Marino          else
4a238c70SJohn Marino            MPFR_SET_POS (y);
4a238c70SJohn Marino          MPFR_SET_INF (y);
4a238c70SJohn Marino          MPFR_RET (0);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else /* x is zero */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_ASSERTD (MPFR_IS_ZERO (x));
4a238c70SJohn Marino          /* 0^n = 0 for any n */
4a238c70SJohn Marino          MPFR_SET_ZERO (y);
4a238c70SJohn Marino          if (MPFR_IS_POS (x) || (n & 1) == 0)
4a238c70SJohn Marino            MPFR_SET_POS (y);
4a238c70SJohn Marino          else
4a238c70SJohn Marino            MPFR_SET_NEG (y);
4a238c70SJohn Marino          MPFR_RET (0);
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino  else if (MPFR_UNLIKELY (n <= 2))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (n < 2)
4a238c70SJohn Marino        /* x^1 = x */
4a238c70SJohn Marino        return mpfr_set (y, x, rnd);
4a238c70SJohn Marino      else
4a238c70SJohn Marino        /* x^2 = sqr(x) */
4a238c70SJohn Marino        return mpfr_sqr (y, x, rnd);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Augment exponent range */
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* setup initial precision */
4a238c70SJohn Marino  prec = MPFR_PREC (y) + 3 + GMP_NUMB_BITS
4a238c70SJohn Marino    + MPFR_INT_CEIL_LOG2 (MPFR_PREC (y));
4a238c70SJohn Marino  mpfr_init2 (res, prec);
4a238c70SJohn Marino
4a238c70SJohn Marino  rnd1 = MPFR_IS_POS (x) ? MPFR_RNDU : MPFR_RNDD; /* away */
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, prec);
4a238c70SJohn Marino  for (;;)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      int i;
4a238c70SJohn Marino
4a238c70SJohn Marino      for (m = n, i = 0; m; i++, m >>= 1)
4a238c70SJohn Marino        ;
4a238c70SJohn Marino      /* now 2^(i-1) <= n < 2^i */
4a238c70SJohn Marino      MPFR_ASSERTD (prec > (mpfr_prec_t) i);
4a238c70SJohn Marino      err = prec - 1 - (mpfr_prec_t) i;
4a238c70SJohn Marino      /* First step: compute square from x */
4a238c70SJohn Marino      MPFR_BLOCK (flags,
4a238c70SJohn Marino                  inexact = mpfr_mul (res, x, x, MPFR_RNDU);
4a238c70SJohn Marino                  MPFR_ASSERTD (i >= 2);
4a238c70SJohn Marino                  if (n & (1UL << (i-2)))
4a238c70SJohn Marino                    inexact |= mpfr_mul (res, res, x, rnd1);
4a238c70SJohn Marino                  for (i -= 3; i >= 0 && !MPFR_BLOCK_EXCEP; i--)
4a238c70SJohn Marino                    {
4a238c70SJohn Marino                      inexact |= mpfr_mul (res, res, res, MPFR_RNDU);
4a238c70SJohn Marino                      if (n & (1UL << i))
4a238c70SJohn Marino                        inexact |= mpfr_mul (res, res, x, rnd1);
4a238c70SJohn Marino                    });
4a238c70SJohn Marino      /* let r(n) be the number of roundings: we have r(2)=1, r(3)=2,
4a238c70SJohn Marino         and r(2n)=2r(n)+1, r(2n+1)=2r(n)+2, thus r(n)=n-1.
4a238c70SJohn Marino         Using Higham's method, to each rounding corresponds a factor
4a238c70SJohn Marino         (1-theta) with 0 <= theta <= 2^(1-p), thus at the end the
4a238c70SJohn Marino         absolute error is bounded by (n-1)*2^(1-p)*res <= 2*(n-1)*ulp(res)
4a238c70SJohn Marino         since 2^(-p)*x <= ulp(x). Since n < 2^i, this gives a maximal
4a238c70SJohn Marino         error of 2^(1+i)*ulp(res).
4a238c70SJohn Marino      */
4a238c70SJohn Marino      if (MPFR_LIKELY (inexact == 0
4a238c70SJohn Marino                       || MPFR_OVERFLOW (flags) || MPFR_UNDERFLOW (flags)
4a238c70SJohn Marino                       || MPFR_CAN_ROUND (res, err, MPFR_PREC (y), rnd)))
4a238c70SJohn Marino        break;
4a238c70SJohn Marino      /* Actualisation of the precision */
4a238c70SJohn Marino      MPFR_ZIV_NEXT (loop, prec);
4a238c70SJohn Marino      mpfr_set_prec (res, prec);
4a238c70SJohn Marino    }
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_UNLIKELY (MPFR_OVERFLOW (flags) || MPFR_UNDERFLOW (flags)))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpz_t z;
4a238c70SJohn Marino
4a238c70SJohn Marino      /* Internal overflow or underflow. However the approximation error has
4a238c70SJohn Marino       * not been taken into account. So, let's solve this problem by using
4a238c70SJohn Marino       * mpfr_pow_z, which can handle it. This case could be improved in the
4a238c70SJohn Marino       * future, without having to use mpfr_pow_z.
4a238c70SJohn Marino       */
4a238c70SJohn Marino      MPFR_LOG_MSG (("Internal overflow or underflow,"
4a238c70SJohn Marino                     " let's use mpfr_pow_z.\n", 0));
4a238c70SJohn Marino      mpfr_clear (res);
4a238c70SJohn Marino      MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino      mpz_init (z);
4a238c70SJohn Marino      mpz_set_ui (z, n);
4a238c70SJohn Marino      inexact = mpfr_pow_z (y, x, z, rnd);
4a238c70SJohn Marino      mpz_clear (z);
4a238c70SJohn Marino      return inexact;
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  inexact = mpfr_set (y, res, rnd);
4a238c70SJohn Marino  mpfr_clear (res);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino  return mpfr_check_range (y, inexact, rnd);
4a238c70SJohn Marino}