mpfr/src/hypot.c

/* mpfr_hypot -- Euclidean distance

Copyright 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
4a238c70SJohn Marino
4a238c70SJohn Marino#define MPFR_NEED_LONGLONG_H
4a238c70SJohn Marino#include "mpfr-impl.h"
4a238c70SJohn Marino
/* The computation of hypot of x and y is done by  *
 *    hypot(x,y)= sqrt(x^2+y^2) = z                */
4a238c70SJohn Marino
4a238c70SJohn Marinoint
4a238c70SJohn Marinompfr_hypot (mpfr_ptr z, mpfr_srcptr x, mpfr_srcptr y, mpfr_rnd_t rnd_mode)
4a238c70SJohn Marino{
4a238c70SJohn Marino  int inexact, exact;
4a238c70SJohn Marino  mpfr_t t, te, ti; /* auxiliary variables */
4a238c70SJohn Marino  mpfr_prec_t N, Nz; /* size variables */
4a238c70SJohn Marino  mpfr_prec_t Nt;   /* precision of the intermediary variable */
4a238c70SJohn Marino  mpfr_prec_t threshold;
4a238c70SJohn Marino  mpfr_exp_t Ex, sh;
4a238c70SJohn Marino  mpfr_uexp_t diff_exp;
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_DECL (expo);
4a238c70SJohn Marino  MPFR_ZIV_DECL (loop);
4a238c70SJohn Marino  MPFR_BLOCK_DECL (flags);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_LOG_FUNC
4a238c70SJohn Marino    (("x[%Pu]=%.*Rg y[%Pu]=%.*Rg rnd=%d",
4a238c70SJohn Marino      mpfr_get_prec (x), mpfr_log_prec, x,
4a238c70SJohn Marino      mpfr_get_prec (y), mpfr_log_prec, y, rnd_mode),
4a238c70SJohn Marino     ("z[%Pu]=%.*Rg inexact=%d",
4a238c70SJohn Marino      mpfr_get_prec (z), mpfr_log_prec, z, inexact));
4a238c70SJohn Marino
4a238c70SJohn Marino  /* particular cases */
4a238c70SJohn Marino  if (MPFR_ARE_SINGULAR (x, y))
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_IS_INF (x) || MPFR_IS_INF (y))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* Return +inf, even when the other number is NaN. */
4a238c70SJohn Marino          MPFR_SET_INF (z);
4a238c70SJohn Marino          MPFR_SET_POS (z);
4a238c70SJohn Marino          MPFR_RET (0);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_IS_NAN (x) || MPFR_IS_NAN (y))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          MPFR_SET_NAN (z);
4a238c70SJohn Marino          MPFR_RET_NAN;
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else if (MPFR_IS_ZERO (x))
4a238c70SJohn Marino        return mpfr_abs (z, y, rnd_mode);
4a238c70SJohn Marino      else /* y is necessarily 0 */
4a238c70SJohn Marino        return mpfr_abs (z, x, rnd_mode);
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  if (mpfr_cmpabs (x, y) < 0)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_srcptr u;
4a238c70SJohn Marino      u = x;
4a238c70SJohn Marino      x = y;
4a238c70SJohn Marino      y = u;
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* now |x| >= |y| */
4a238c70SJohn Marino
4a238c70SJohn Marino  Ex = MPFR_GET_EXP (x);
4a238c70SJohn Marino  diff_exp = (mpfr_uexp_t) Ex - MPFR_GET_EXP (y);
4a238c70SJohn Marino
4a238c70SJohn Marino  N = MPFR_PREC (x);   /* Precision of input variable */
4a238c70SJohn Marino  Nz = MPFR_PREC (z);   /* Precision of output variable */
4a238c70SJohn Marino  threshold = (MAX (N, Nz) + (rnd_mode == MPFR_RNDN ? 1 : 0)) << 1;
4a238c70SJohn Marino  if (rnd_mode == MPFR_RNDA)
4a238c70SJohn Marino    rnd_mode = MPFR_RNDU; /* since the result is positive, RNDA = RNDU */
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Is |x| a suitable approximation to the precision Nz ?
4a238c70SJohn Marino     (see algorithms.tex for explanations) */
4a238c70SJohn Marino  if (diff_exp > threshold)
4a238c70SJohn Marino    /* result is |x| or |x|+ulp(|x|,Nz) */
4a238c70SJohn Marino    {
4a238c70SJohn Marino      if (MPFR_UNLIKELY (rnd_mode == MPFR_RNDU))
4a238c70SJohn Marino        {
4a238c70SJohn Marino          /* If z > abs(x), then it was already rounded up; otherwise
4a238c70SJohn Marino             z = abs(x), and we need to add one ulp due to y. */
4a238c70SJohn Marino          if (mpfr_abs (z, x, rnd_mode) == 0)
4a238c70SJohn Marino            mpfr_nexttoinf (z);
4a238c70SJohn Marino          MPFR_RET (1);
4a238c70SJohn Marino        }
4a238c70SJohn Marino      else /* MPFR_RNDZ, MPFR_RNDD, MPFR_RNDN */
4a238c70SJohn Marino        {
4a238c70SJohn Marino          if (MPFR_LIKELY (Nz >= N))
4a238c70SJohn Marino            {
4a238c70SJohn Marino              mpfr_abs (z, x, rnd_mode);  /* exact */
4a238c70SJohn Marino              MPFR_RET (-1);
4a238c70SJohn Marino            }
4a238c70SJohn Marino          else
4a238c70SJohn Marino            {
4a238c70SJohn Marino              MPFR_SET_EXP (z, Ex);
4a238c70SJohn Marino              MPFR_SET_SIGN (z, 1);
4a238c70SJohn Marino              MPFR_RNDRAW_GEN (inexact, z, MPFR_MANT (x), N, rnd_mode, 1,
4a238c70SJohn Marino                               goto addoneulp,
4a238c70SJohn Marino                               if (MPFR_UNLIKELY (++ MPFR_EXP (z) >
4a238c70SJohn Marino                                                  __gmpfr_emax))
4a238c70SJohn Marino                                 return mpfr_overflow (z, rnd_mode, 1);
4a238c70SJohn Marino                               );
4a238c70SJohn Marino
4a238c70SJohn Marino              if (MPFR_UNLIKELY (inexact == 0))
4a238c70SJohn Marino                inexact = -1;
4a238c70SJohn Marino              MPFR_RET (inexact);
4a238c70SJohn Marino            }
4a238c70SJohn Marino        }
4a238c70SJohn Marino    }
4a238c70SJohn Marino
4a238c70SJohn Marino  /* General case */
4a238c70SJohn Marino
4a238c70SJohn Marino  N = MAX (MPFR_PREC (x), MPFR_PREC (y));
4a238c70SJohn Marino
4a238c70SJohn Marino  /* working precision */
4a238c70SJohn Marino  Nt = Nz + MPFR_INT_CEIL_LOG2 (Nz) + 4;
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_init2 (t, Nt);
4a238c70SJohn Marino  mpfr_init2 (te, Nt);
4a238c70SJohn Marino  mpfr_init2 (ti, Nt);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_MARK (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  /* Scale x and y to avoid overflow/underflow in x^2 and overflow in y^2
4a238c70SJohn Marino     (as |x| >= |y|). The scaling of y can underflow only when the target
4a238c70SJohn Marino     precision is huge, otherwise the case would already have been handled
4a238c70SJohn Marino     by the diff_exp > threshold code. */
4a238c70SJohn Marino  sh = mpfr_get_emax () / 2 - Ex - 1;
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_ZIV_INIT (loop, Nt);
4a238c70SJohn Marino  for (;;)
4a238c70SJohn Marino    {
4a238c70SJohn Marino      mpfr_prec_t err;
4a238c70SJohn Marino
4a238c70SJohn Marino      exact = mpfr_mul_2si (te, x, sh, MPFR_RNDZ);
4a238c70SJohn Marino      exact |= mpfr_mul_2si (ti, y, sh, MPFR_RNDZ);
4a238c70SJohn Marino      exact |= mpfr_sqr (te, te, MPFR_RNDZ);
4a238c70SJohn Marino      /* Use fma in order to avoid underflow when diff_exp<=MPFR_EMAX_MAX-2 */
4a238c70SJohn Marino      exact |= mpfr_fma (t, ti, ti, te, MPFR_RNDZ);
4a238c70SJohn Marino      exact |= mpfr_sqrt (t, t, MPFR_RNDZ);
4a238c70SJohn Marino
4a238c70SJohn Marino      err = Nt < N ? 4 : 2;
4a238c70SJohn Marino      if (MPFR_LIKELY (exact == 0
4a238c70SJohn Marino                       || MPFR_CAN_ROUND (t, Nt-err, Nz, rnd_mode)))
4a238c70SJohn Marino        break;
4a238c70SJohn Marino
4a238c70SJohn Marino      MPFR_ZIV_NEXT (loop, Nt);
4a238c70SJohn Marino      mpfr_set_prec (t, Nt);
4a238c70SJohn Marino      mpfr_set_prec (te, Nt);
4a238c70SJohn Marino      mpfr_set_prec (ti, Nt);
4a238c70SJohn Marino    }
4a238c70SJohn Marino  MPFR_ZIV_FREE (loop);
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_BLOCK (flags, inexact = mpfr_div_2si (z, t, sh, rnd_mode));
4a238c70SJohn Marino  MPFR_ASSERTD (exact == 0 || inexact != 0);
4a238c70SJohn Marino
4a238c70SJohn Marino  mpfr_clear (t);
4a238c70SJohn Marino  mpfr_clear (ti);
4a238c70SJohn Marino  mpfr_clear (te);
4a238c70SJohn Marino
4a238c70SJohn Marino  /*
4a238c70SJohn Marino    exact  inexact
4a238c70SJohn Marino    0         0         result is exact, ternary flag is 0
4a238c70SJohn Marino    0       non zero    t is exact, ternary flag given by inexact
4a238c70SJohn Marino    1         0         impossible (see above)
4a238c70SJohn Marino    1       non zero    ternary flag given by inexact
4a238c70SJohn Marino  */
4a238c70SJohn Marino
4a238c70SJohn Marino  MPFR_SAVE_EXPO_FREE (expo);
4a238c70SJohn Marino
4a238c70SJohn Marino  if (MPFR_OVERFLOW (flags))
4a238c70SJohn Marino    mpfr_set_overflow ();
4a238c70SJohn Marino  /* hypot(x,y) >= |x|, thus underflow is not possible. */
4a238c70SJohn Marino
4a238c70SJohn Marino  return mpfr_check_range (z, inexact, rnd_mode);
4a238c70SJohn Marino}