dist/src/get_float128.c

/* mpfr_get_float128 -- convert a multiple precision floating-point
                        number to a _Float128 number

Copyright 2012-2023 Free Software Foundation, Inc.
Contributed by the AriC and Caramba projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
https://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */

#include "mpfr-impl.h"

#ifdef MPFR_WANT_FLOAT128

/* Return r * 2^sh, computed with native _Float128 arithmetic by binary
   exponentiation on 2 (sh > 0) or on 1/2 (sh < 0).  The caller asserts
   r > 0 before calling.
   NOTE(review): nothing here handles a product that leaves the _Float128
   range explicitly; it is left to the native multiplications -- confirm
   that this is the intended behaviour for directed rounding modes. */
static _Float128
float128_scale_pow2 (_Float128 r, mpfr_exp_t sh)
{
  _Float128 base;

  if (sh == 0)
    return r;

  /* An overflow may occur (example: 0.5*2^1024), hence r is first doubled
     until it is at least 1, with the shift lowered to compensate. */
  while (r < 1.0)
    {
      r += r;
      sh--;
    }

  if (sh > 0)
    base = 2.0;
  else
    {
      base = 0.5;
      sh = -sh;
    }

  /* sh is non-negative from here on.  The base is squared only while
     some bits of sh remain to be processed, never once more. */
  while (sh != 0)
    {
      if (sh % 2)
        r *= base;
      sh >>= 1;
      if (sh != 0)
        base *= base;
    }

  return r;
}

/* generic code */
/* Convert x to a _Float128 according to rnd_mode. */
_Float128
mpfr_get_float128 (mpfr_srcptr x, mpfr_rnd_t rnd_mode)
{
  const int emin = -16381;
  const int esub = emin - IEEE_FLOAT128_MANT_DIG;
  _Float128 res;    /* significand first, final magnitude at the end */
  mpfr_exp_t ex;    /* exponent of x (before rounding) */
  mpfr_exp_t shift; /* res still has to be multiplied by 2^shift */
  int neg;          /* non-zero iff MPFR_SIGN (x) is negative */

  /* Singular values (anything but a regular non-zero number) simply go
     through the double conversion. */
  if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))
    return (_Float128) mpfr_get_d (x, rnd_mode);

  /* now x is a normal non-zero number */
  neg = MPFR_SIGN (x) < 0;
  ex = MPFR_GET_EXP (x);

  if (MPFR_UNLIKELY (ex <= esub))
    {
      /* Tiny input: the answer is either a signed zero or, failing that,
         +/- 1.0 * 2^esub. */
      if (MPFR_IS_LIKE_RNDZ (rnd_mode, neg) ||
          (rnd_mode == MPFR_RNDN && (ex < esub || mpfr_powerof2_raw (x))))
        {
          if (neg)
            return -0.0;
          return 0.0;
        }
      res = 1.0;
      shift = esub;
    }
  else
    {
      mpfr_t rounded;
      mp_limb_t *limbs;
      /* Note: MPFR_LIMB_MAX is avoided below as it might not
         always work if GMP_NUMB_BITS > IEEE_FLOAT128_MANT_DIG.
         MPFR_LIMB_HIGHBIT has the advantage to fit on 1 bit. */
      const _Float128 limb_scale = 1 / (2 * (_Float128) MPFR_LIMB_HIGHBIT);
      int nbits, k;  /* small enough to fit in an int */
      MPFR_SAVE_EXPO_DECL (expo);

      MPFR_SAVE_EXPO_MARK (expo);

      /* Round x once, directly to the precision the _Float128 result can
         hold (fewer bits when ex < emin, i.e. for subnormals), so that
         every later operation is exact and no double rounding can
         happen. */
      if (ex < emin)
        nbits = ex - esub;
      else
        nbits = IEEE_FLOAT128_MANT_DIG;
      MPFR_ASSERTD (nbits >= MPFR_PREC_MIN);
      mpfr_init2 (rounded, nbits);

      mpfr_set (rounded, x, rnd_mode);
      /* Keep the rounded exponent aside, then reduce the temporary to a
         positive number with exponent 0. */
      shift = MPFR_GET_EXP (rounded);
      MPFR_SET_EXP (rounded, 0);
      MPFR_SET_POS (rounded);
      limbs = MPFR_MANT (rounded);

      /* Fold the limbs in, index 0 first, rescaling after each one. */
      res = 0.0;
      for (k = 0; k < MPFR_LIMB_SIZE (rounded); k++)
        res = (res + limbs[k]) * limb_scale;

      mpfr_clear (rounded);

      MPFR_SAVE_EXPO_FREE (expo);
    }

  /* we now have to multiply res by 2^shift */
  MPFR_ASSERTD (res > 0);
  res = float128_scale_pow2 (res, shift);

  return neg ? -res : res;
}

#endif /* MPFR_WANT_FLOAT128 */