/* mpfr/src/pow_si.c */

/* mpfr_pow_si -- power function x^y with y a signed int

Copyright 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
#define MPFR_NEED_LONGLONG_H
#include "mpfr-impl.h"
4a238c70SJohn Marino
/* The computation of y = pow_si(x,n) is done by
 *    y = pow_ui(x,n)       if n >= 0
 *    y = 1 / pow_ui(x,-n)  if n < 0
 */
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_pow_si (mpfr_ptr y, mpfr_srcptr x, long int n, mpfr_rnd_t rnd)
4a238c70SJohn Marino{
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg n=%ld rnd=%d",
4a238c70SJohn Marino      mpfr_get_prec (x), mpfr_log_prec, x, n, rnd),
4a238c70SJohn Marino     ("y[%Pu]=%.*Rg", mpfr_get_prec (y), mpfr_log_prec, y));
4a238c70SJohn Marino
4a238c70SJohn Marino  if (n >= 0)
4a238c70SJohn Marino    return mpfr_pow_ui (y, x, n, rnd);
4a238c70SJohn Marino  else
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (MPFR_IS_NAN (x))
4a238c70SJohn Marino            {
4a238c70SJohn Marino              MPFR_SET_NAN (y);
4a238c70SJohn Marino              MPFR_RET_NAN;
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              int positive = MPFR_IS_POS (x) || ((unsigned long) n & 1) == 0;
4a238c70SJohn Marino              if (MPFR_IS_INF (x))
4a238c70SJohn Marino                MPFR_SET_ZERO (y);
4a238c70SJohn Marino              else /* x is zero */
4a238c70SJohn Marino                {
4a238c70SJohn Marino                  MPFR_ASSERTD (MPFR_IS_ZERO (x));
4a238c70SJohn Marino                  MPFR_SET_INF (y);
4a238c70SJohn Marino                  mpfr_set_divby0 ();
4a238c70SJohn Marino                }
4a238c70SJohn Marino              if (positive)
4a238c70SJohn Marino                MPFR_SET_POS (y);
4a238c70SJohn Marino              else
4a238c70SJohn Marino                MPFR_SET_NEG (y);
4a238c70SJohn Marino              MPFR_RET (0);
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      /* detect exact powers: x^(-n) is exact iff x is a power of 2 */
4a238c70SJohn Marino      if (mpfr_cmp_si_2exp (x, MPFR_SIGN(x), MPFR_EXP(x) - 1) == 0)
4a238c70SJohn Marino        {
4a238c70SJohn Marino          mpfr_exp_t expx = MPFR_EXP (x) - 1, expy;
4a238c70SJohn Marino          MPFR_ASSERTD (n < 0);
4a238c70SJohn Marino          /* Warning: n * expx may overflow!
4a238c70SJohn Marino           *
4a238c70SJohn Marino           * Some systems (apparently alpha-freebsd) abort with
4a238c70SJohn Marino           * LONG_MIN / 1, and LONG_MIN / -1 is undefined.
4a238c70SJohn Marino           * http://www.freebsd.org/cgi/query-pr.cgi?pr=72024
4a238c70SJohn Marino           *
4a238c70SJohn Marino           * Proof of the overflow checking. The expressions below are
4a238c70SJohn Marino           * assumed to be on the rational numbers, but the word "overflow"
4a238c70SJohn Marino           * still has its own meaning in the C context. / still denotes
4a238c70SJohn Marino           * the integer (truncated) division, and // denotes the exact
4a238c70SJohn Marino           * division.
4a238c70SJohn Marino           * - First, (__gmpfr_emin - 1) / n and (__gmpfr_emax - 1) / n
4a238c70SJohn Marino           *   cannot overflow due to the constraints on the exponents of
4a238c70SJohn Marino           *   MPFR numbers.
4a238c70SJohn Marino           * - If n = -1, then n * expx = - expx, which is representable
4a238c70SJohn Marino           *   because of the constraints on the exponents of MPFR numbers.
4a238c70SJohn Marino           * - If expx = 0, then n * expx = 0, which is representable.
4a238c70SJohn Marino           * - If n < -1 and expx > 0:
4a238c70SJohn Marino           *   + If expx > (__gmpfr_emin - 1) / n, then
4a238c70SJohn Marino           *           expx >= (__gmpfr_emin - 1) / n + 1
4a238c70SJohn Marino           *                > (__gmpfr_emin - 1) // n,
4a238c70SJohn Marino           *     and
4a238c70SJohn Marino           *           n * expx < __gmpfr_emin - 1,
4a238c70SJohn Marino           *     i.e.
4a238c70SJohn Marino           *           n * expx <= __gmpfr_emin - 2.
4a238c70SJohn Marino           *     This corresponds to an underflow, with a null result in
4a238c70SJohn Marino           *     the rounding-to-nearest mode.
4a238c70SJohn Marino           *   + If expx <= (__gmpfr_emin - 1) / n, then n * expx cannot
4a238c70SJohn Marino           *     overflow since 0 < expx <= (__gmpfr_emin - 1) / n and
4a238c70SJohn Marino           *           0 > n * expx >= n * ((__gmpfr_emin - 1) / n)
4a238c70SJohn Marino           *                        >= __gmpfr_emin - 1.
4a238c70SJohn Marino           * - If n < -1 and expx < 0:
4a238c70SJohn Marino           *   + If expx < (__gmpfr_emax - 1) / n, then
4a238c70SJohn Marino           *           expx <= (__gmpfr_emax - 1) / n - 1
4a238c70SJohn Marino           *                < (__gmpfr_emax - 1) // n,
4a238c70SJohn Marino           *     and
4a238c70SJohn Marino           *           n * expx > __gmpfr_emax - 1,
4a238c70SJohn Marino           *     i.e.
4a238c70SJohn Marino           *           n * expx >= __gmpfr_emax.
4a238c70SJohn Marino           *     This corresponds to an overflow (2^(n * expx) has an
4a238c70SJohn Marino           *     exponent > __gmpfr_emax).
4a238c70SJohn Marino           *   + If expx >= (__gmpfr_emax - 1) / n, then n * expx cannot
4a238c70SJohn Marino           *     overflow since 0 > expx >= (__gmpfr_emax - 1) / n and
4a238c70SJohn Marino           *           0 < n * expx <= n * ((__gmpfr_emax - 1) / n)
4a238c70SJohn Marino           *                        <= __gmpfr_emax - 1.
4a238c70SJohn Marino           * Note: one could use expx bounds based on MPFR_EXP_MIN and
4a238c70SJohn Marino           * MPFR_EXP_MAX instead of __gmpfr_emin and __gmpfr_emax. The
4a238c70SJohn Marino           * current bounds do not lead to noticeably slower code and
4a238c70SJohn Marino           * allow us to avoid a bug in Sun's compiler for Solaris/x86
4a238c70SJohn Marino           * (when optimizations are enabled); known affected versions:
4a238c70SJohn Marino           *   cc: Sun C 5.8 2005/10/13
4a238c70SJohn Marino           *   cc: Sun C 5.8 Patch 121016-02 2006/03/31
4a238c70SJohn Marino           *   cc: Sun C 5.8 Patch 121016-04 2006/10/18
4a238c70SJohn Marino           */
4a238c70SJohn Marino          expy =
4a238c70SJohn Marino            n != -1 && expx > 0 && expx > (__gmpfr_emin - 1) / n ?
4a238c70SJohn Marino            MPFR_EMIN_MIN - 2 /* Underflow */ :
4a238c70SJohn Marino            n != -1 && expx < 0 && expx < (__gmpfr_emax - 1) / n ?
4a238c70SJohn Marino            MPFR_EMAX_MAX /* Overflow */ : n * expx;
4a238c70SJohn Marino          return mpfr_set_si_2exp (y, n % 2 ? MPFR_INT_SIGN (x) : 1,
4a238c70SJohn Marino                                   expy, rnd);
4a238c70SJohn Marino        }
4a238c70SJohn Marino
4a238c70SJohn Marino      /* General case */
4a238c70SJohn Marino      {
4a238c70SJohn Marino        /* Declaration of the intermediary variable */
4a238c70SJohn Marino        mpfr_t t;
4a238c70SJohn Marino        /* Declaration of the size variable */
4a238c70SJohn Marino        mpfr_prec_t Ny;                              /* target precision */
4a238c70SJohn Marino        mpfr_prec_t Nt;                              /* working precision */
4a238c70SJohn Marino        mpfr_rnd_t rnd1;
4a238c70SJohn Marino        int size_n;
4a238c70SJohn Marino        int inexact;
4a238c70SJohn Marino        unsigned long abs_n;
4a238c70SJohn Marino        MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino        MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino        abs_n = - (unsigned long) n;
4a238c70SJohn Marino        count_leading_zeros (size_n, (mp_limb_t) abs_n);
4a238c70SJohn Marino        size_n = GMP_NUMB_BITS - size_n;
4a238c70SJohn Marino
4a238c70SJohn Marino        /* initial working precision */
4a238c70SJohn Marino        Ny = MPFR_PREC (y);
4a238c70SJohn Marino        Nt = Ny + size_n + 3 + MPFR_INT_CEIL_LOG2 (Ny);
4a238c70SJohn Marino
4a238c70SJohn Marino        MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino        /* initialise of intermediary   variable */
4a238c70SJohn Marino        mpfr_init2 (t, Nt);
4a238c70SJohn Marino
4a238c70SJohn Marino        /* We will compute rnd(rnd1(1/x) ^ |n|), where rnd1 is the rounding
4a238c70SJohn Marino           toward sign(x), to avoid spurious overflow or underflow, as in
4a238c70SJohn Marino           mpfr_pow_z. */
4a238c70SJohn Marino        rnd1 = MPFR_EXP (x) < 1 ? MPFR_RNDZ :
4a238c70SJohn Marino          (MPFR_SIGN (x) > 0 ? MPFR_RNDU : MPFR_RNDD);
4a238c70SJohn Marino
4a238c70SJohn Marino        MPFR_ZIV_INIT (loop, Nt);
4a238c70SJohn Marino        for (;;)
4a238c70SJohn Marino          {
4a238c70SJohn Marino            MPFR_BLOCK_DECL (flags);
4a238c70SJohn Marino
4a238c70SJohn Marino            /* compute (1/x)^|n| */
4a238c70SJohn Marino            MPFR_BLOCK (flags, mpfr_ui_div (t, 1, x, rnd1));
4a238c70SJohn Marino            MPFR_ASSERTD (! MPFR_UNDERFLOW (flags));
4a238c70SJohn Marino            /* t = (1/x)*(1+theta) where |theta| <= 2^(-Nt) */
4a238c70SJohn Marino            if (MPFR_UNLIKELY (MPFR_OVERFLOW (flags)))
4a238c70SJohn Marino              goto overflow;
4a238c70SJohn Marino            MPFR_BLOCK (flags, mpfr_pow_ui (t, t, abs_n, rnd));
4a238c70SJohn Marino            /* t = (1/x)^|n|*(1+theta')^(|n|+1) where |theta'| <= 2^(-Nt).
4a238c70SJohn Marino               If (|n|+1)*2^(-Nt) <= 1/2, which is satisfied as soon as
4a238c70SJohn Marino               Nt >= bits(n)+2, then we can use Lemma \ref{lemma_graillat}
4a238c70SJohn Marino               from algorithms.tex, which yields x^n*(1+theta) with
4a238c70SJohn Marino               |theta| <= 2(|n|+1)*2^(-Nt), thus the error is bounded by
4a238c70SJohn Marino               2(|n|+1) ulps <= 2^(bits(n)+2) ulps. */
4a238c70SJohn Marino            if (MPFR_UNLIKELY (MPFR_OVERFLOW (flags)))
4a238c70SJohn Marino              {
4a238c70SJohn Marino              overflow:
4a238c70SJohn Marino                MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino                mpfr_clear (t);
4a238c70SJohn Marino                MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino                MPFR_LOG_MSG (("overflow\n", 0));
4a238c70SJohn Marino                return mpfr_overflow (y, rnd, abs_n & 1 ?
4a238c70SJohn Marino                                      MPFR_SIGN (x) : MPFR_SIGN_POS);
4a238c70SJohn Marino              }
4a238c70SJohn Marino            if (MPFR_UNLIKELY (MPFR_UNDERFLOW (flags)))
4a238c70SJohn Marino              {
4a238c70SJohn Marino                MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino                mpfr_clear (t);
4a238c70SJohn Marino                MPFR_LOG_MSG (("underflow\n", 0));
4a238c70SJohn Marino                if (rnd == MPFR_RNDN)
4a238c70SJohn Marino                  {
4a238c70SJohn Marino                    mpfr_t y2, nn;
4a238c70SJohn Marino
4a238c70SJohn Marino                    /* We cannot decide now whether the result should be
4a238c70SJohn Marino                       rounded toward zero or away from zero. So, like
4a238c70SJohn Marino                       in mpfr_pow_pos_z, let's use the general case of
4a238c70SJohn Marino                       mpfr_pow in precision 2. */
4a238c70SJohn Marino                    MPFR_ASSERTD (mpfr_cmp_si_2exp (x, MPFR_SIGN (x),
4a238c70SJohn Marino                                                    MPFR_EXP (x) - 1) != 0);
4a238c70SJohn Marino                    mpfr_init2 (y2, 2);
4a238c70SJohn Marino                    mpfr_init2 (nn, sizeof (long) * CHAR_BIT);
4a238c70SJohn Marino                    inexact = mpfr_set_si (nn, n, MPFR_RNDN);
4a238c70SJohn Marino                    MPFR_ASSERTN (inexact == 0);
4a238c70SJohn Marino                    inexact = mpfr_pow_general (y2, x, nn, rnd, 1,
4a238c70SJohn Marino                                                (mpfr_save_expo_t *) NULL);
4a238c70SJohn Marino                    mpfr_clear (nn);
4a238c70SJohn Marino                    mpfr_set (y, y2, MPFR_RNDN);
4a238c70SJohn Marino                    mpfr_clear (y2);
4a238c70SJohn Marino                    MPFR_SAVE_EXPO_UPDATE_FLAGS (expo, MPFR_FLAGS_UNDERFLOW);
4a238c70SJohn Marino                    goto end;
4a238c70SJohn Marino                  }
4a238c70SJohn Marino                else
4a238c70SJohn Marino                  {
4a238c70SJohn Marino                    MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino                    return mpfr_underflow (y, rnd, abs_n & 1 ?
4a238c70SJohn Marino                                           MPFR_SIGN (x) : MPFR_SIGN_POS);
4a238c70SJohn Marino                  }
4a238c70SJohn Marino              }
4a238c70SJohn Marino            /* error estimate -- see pow function in algorithms.ps */
4a238c70SJohn Marino            if (MPFR_LIKELY (MPFR_CAN_ROUND (t, Nt - size_n - 2, Ny, rnd)))
4a238c70SJohn Marino              break;
4a238c70SJohn Marino
4a238c70SJohn Marino            /* actualisation of the precision */
4a238c70SJohn Marino            MPFR_ZIV_NEXT (loop, Nt);
4a238c70SJohn Marino            mpfr_set_prec (t, Nt);
4a238c70SJohn Marino          }
4a238c70SJohn Marino        MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino        inexact = mpfr_set (y, t, rnd);
4a238c70SJohn Marino        mpfr_clear (t);
4a238c70SJohn Marino
4a238c70SJohn Marino      end:
4a238c70SJohn Marino        MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino        return mpfr_check_range (y, inexact, rnd);
4a238c70SJohn Marino      }
4a238c70SJohn Marino    }
4a238c70SJohn Marino}