gmp/mpf/sqrt.c

86d7f5d3SJohn Marino/* mpf_sqrt -- Compute the square root of a float.
86d7f5d3SJohn Marino
86d7f5d3SJohn MarinoCopyright 1993, 1994, 1996, 2000, 2001, 2004, 2005 Free Software Foundation,
86d7f5d3SJohn MarinoInc.
86d7f5d3SJohn Marino
86d7f5d3SJohn MarinoThis file is part of the GNU MP Library.
86d7f5d3SJohn Marino
86d7f5d3SJohn MarinoThe GNU MP Library is free software; you can redistribute it and/or modify
86d7f5d3SJohn Marinoit under the terms of the GNU Lesser General Public License as published by
86d7f5d3SJohn Marinothe Free Software Foundation; either version 3 of the License, or (at your
86d7f5d3SJohn Marinooption) any later version.
86d7f5d3SJohn Marino
86d7f5d3SJohn MarinoThe GNU MP Library is distributed in the hope that it will be useful, but
86d7f5d3SJohn MarinoWITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
86d7f5d3SJohn Marinoor FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
86d7f5d3SJohn MarinoLicense for more details.
86d7f5d3SJohn Marino
86d7f5d3SJohn MarinoYou should have received a copy of the GNU Lesser General Public License
86d7f5d3SJohn Marinoalong with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.  */
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino#include <stdio.h> /* for NULL */
86d7f5d3SJohn Marino#include "gmp.h"
86d7f5d3SJohn Marino#include "gmp-impl.h"
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino/* As usual, the aim is to produce PREC(r) limbs of result, with the high
86d7f5d3SJohn Marino   limb non-zero.  This is accomplished by applying mpn_sqrtrem to either
86d7f5d3SJohn Marino   2*prec or 2*prec-1 limbs, both such sizes resulting in prec limbs.
86d7f5d3SJohn Marino
   The choice between 2*prec or 2*prec-1 limbs is based on the input
   exponent.  With b=2^GMP_NUMB_BITS as the limb base, we can think of
   effectively taking out a factor b^(2k), for suitable k, to get to an
   integer input of the desired size ready for mpn_sqrtrem.  It must be an
   even power taken out, i.e. an even number of limbs, so the square root
   gives factor b^k and the radix point is still on a limb boundary.  So if
   EXP(u) is even we'll get an even number of input limbs 2*prec, or if
   EXP(u) is odd we get an odd number 2*prec-1.
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino   Further limbs below the 2*prec or 2*prec-1 used don't affect the result
86d7f5d3SJohn Marino   and are simply truncated.  This can be seen by considering an integer x,
86d7f5d3SJohn Marino   with s=floor(sqrt(x)).  s is the unique integer satisfying s^2 <= x <
86d7f5d3SJohn Marino   (s+1)^2.  Notice that adding a fraction part to x (ie. some further bits)
86d7f5d3SJohn Marino   doesn't change the inequality, s remains the unique solution.  Working
86d7f5d3SJohn Marino   suitable factors of 2 into this argument lets it apply to an intended
86d7f5d3SJohn Marino   precision at any position for any x, not just the integer binary point.
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino   If the input is smaller than 2*prec or 2*prec-1, then we just pad with
86d7f5d3SJohn Marino   zeros, that of course being our usual interpretation of short inputs.
86d7f5d3SJohn Marino   The effect is to extend the root beyond the size of the input (for
86d7f5d3SJohn Marino   instance into fractional limbs if u is an integer).  */
86d7f5d3SJohn Marino
86d7f5d3SJohn Marinovoid
86d7f5d3SJohn Marinompf_sqrt (mpf_ptr r, mpf_srcptr u)
86d7f5d3SJohn Marino{
86d7f5d3SJohn Marino  mp_size_t usize;
86d7f5d3SJohn Marino  mp_ptr up, tp;
86d7f5d3SJohn Marino  mp_size_t prec, tsize;
86d7f5d3SJohn Marino  mp_exp_t uexp, expodd;
86d7f5d3SJohn Marino  TMP_DECL;
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  usize = u->_mp_size;
86d7f5d3SJohn Marino  if (usize <= 0)
86d7f5d3SJohn Marino    {
86d7f5d3SJohn Marino      if (usize < 0)
86d7f5d3SJohn Marino        SQRT_OF_NEGATIVE;
86d7f5d3SJohn Marino      r->_mp_size = 0;
86d7f5d3SJohn Marino      r->_mp_exp = 0;
86d7f5d3SJohn Marino      return;
86d7f5d3SJohn Marino    }
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  TMP_MARK;
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  uexp = u->_mp_exp;
86d7f5d3SJohn Marino  prec = r->_mp_prec;
86d7f5d3SJohn Marino  up = u->_mp_d;
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  expodd = (uexp & 1);
86d7f5d3SJohn Marino  tsize = 2 * prec - expodd;
86d7f5d3SJohn Marino  r->_mp_size = prec;
86d7f5d3SJohn Marino  r->_mp_exp = (uexp + expodd) / 2;    /* ceil(uexp/2) */
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  /* root size is ceil(tsize/2), this will be our desired "prec" limbs */
86d7f5d3SJohn Marino  ASSERT ((tsize + 1) / 2 == prec);
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  tp = TMP_ALLOC_LIMBS (tsize);
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  if (usize > tsize)
86d7f5d3SJohn Marino    {
86d7f5d3SJohn Marino      up += usize - tsize;
86d7f5d3SJohn Marino      usize = tsize;
86d7f5d3SJohn Marino      MPN_COPY (tp, up, tsize);
86d7f5d3SJohn Marino    }
86d7f5d3SJohn Marino  else
86d7f5d3SJohn Marino    {
86d7f5d3SJohn Marino      MPN_ZERO (tp, tsize - usize);
86d7f5d3SJohn Marino      MPN_COPY (tp + (tsize - usize), up, usize);
86d7f5d3SJohn Marino    }
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  mpn_sqrtrem (r->_mp_d, NULL, tp, tsize);
86d7f5d3SJohn Marino
86d7f5d3SJohn Marino  TMP_FREE;
86d7f5d3SJohn Marino}