/* mpf_mul_ui -- Multiply a float and an unsigned integer.

Copyright 1993, 1994, 1996, 2001, 2003, 2004 Free Software Foundation, Inc.

This file is part of the GNU MP Library.

The GNU MP Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MP Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.  */

#include "gmp.h"
#include "gmp-impl.h"
#include "longlong.h"


/* The core operation is a multiply of PREC(r) limbs from u by v, producing
   either PREC(r) or PREC(r)+1 result limbs.  If u is shorter than PREC(r),
   then we take only as much as it has.  If u is longer we incorporate a
   carry from the lower limbs.

   If u has just 1 extra limb, then the carry to add is high(up[0]*v).  That
   is of course what mpn_mul_1 would do if it were called with PREC(r)+1
   limbs of input.

   If u has more than 1 extra limb, then there can be a further carry bit
   out of lower uncalculated limbs (the way the low of one product adds to
   the high of the product below it).  This is of course what an mpn_mul_1
   would do if it were called with the full u operand.  But we instead work
   downwards explicitly, until a carry occurs or until a value other than
   GMP_NUMB_MAX occurs (that being the only value a carry bit can propagate
   across).

   The carry determination normally requires two umul_ppmm's; only rarely
   will GMP_NUMB_MAX occur and require further products.

   The carry limb is conveniently added into the mul_1 using mpn_mul_1c when
   that function exists, otherwise a subsequent mpn_add_1 is needed.

   Clearly when mpn_mul_1c is used the carry must be calculated first.  But
   this is also the case when add_1 is used, since if r==u and ABSIZ(r) >
   PREC(r) then the mpn_mul_1 overwrites the low part of the input.

   A reuse r==u with size > prec can occur from a size PREC(r)+1 in the
   usual way, or it can occur from an mpf_set_prec_raw leaving a bigger
   sized value.  In both cases we can end up calling mpn_mul_1 with
   overlapping src and dst regions, but this will be with dst < src and such
   an overlap is permitted.

   Not done:

   No attempt is made to determine in advance whether the result will be
   PREC(r) or PREC(r)+1 limbs.  If it's going to be PREC(r)+1 then we could
   take one less limb from u and generate just PREC(r), which of course
   still satisfies the application's requested precision.  But any test
   counting bits or forming the high product would almost certainly take
   longer than the incremental cost of an extra limb in mpn_mul_1.

   Enhancements:

   Repeated mpf_mul_ui's with an even v will accumulate low zero bits on the
   result, leaving low zero limbs after a while, which it might be nice to
   strip to save work in subsequent operations.  Calculating the low limb
   explicitly would let us direct mpn_mul_1 to put the balance at rp when
   the low is zero (instead of normally rp+1).  But it's not clear whether
   this would be worthwhile.  Explicit code for the low limb will probably
   be slower than having it done in mpn_mul_1, so we need to consider how
   often a zero will be stripped and how much that's likely to save
   later.  */

void
mpf_mul_ui (mpf_ptr r, mpf_srcptr u, unsigned long int v)
{
  mp_srcptr up;
  mp_size_t usize;
  mp_size_t size;
  mp_size_t prec, excess;
  mp_limb_t cy_limb, vl, cbit, cin;
  mp_ptr rp;

  usize = u->_mp_size;
  if (UNLIKELY (v == 0) || UNLIKELY (usize == 0))
    {
      r->_mp_size = 0;
      r->_mp_exp = 0;
      return;
    }

#if BITS_PER_ULONG > GMP_NUMB_BITS  /* avoid warnings about shift amount */
  if (v > GMP_NUMB_MAX)
    {
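      /* v does not fit in a single limb: represent it as a two-limb
         temporary mpf and let the general mpf_mul do the work.  */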
      mpf_t     vf;
      mp_limb_t vp[2];
      vp[0] = v & GMP_NUMB_MASK;
      vp[1] = v >> GMP_NUMB_BITS;
      PTR(vf) = vp;
      SIZ(vf) = 2;
      ASSERT_CODE (PREC(vf) = 2);
      EXP(vf) = 2;
      mpf_mul (r, u, vf);
      return;
    }
#endif

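  /* Work with the absolute size of u.  When u has more limbs than the
     destination precision, the low "excess" limbs contribute only a
     carry into the multiply of the top prec limbs.  */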
  size = ABS (usize);
  prec = r->_mp_prec;
  up = u->_mp_d;
  vl = v;
  excess = size - prec;
  cin = 0;

  if (excess > 0)
    {
      /* up is bigger than desired rp, shorten it to prec limbs and
         determine a carry-in */

      mp_limb_t  vl_shifted = vl << GMP_NAIL_BITS;
      mp_limb_t  hi, lo, next_lo, sum;
      mp_size_t  i;

      /* high limb of top product */
      i = excess - 1;
      umul_ppmm (cin, lo, up[i], vl_shifted);

      /* and carry bit out of products below that, if any */
      for (;;)
        {
          i--;
          if (i < 0)
            break;

          umul_ppmm (hi, next_lo, up[i], vl_shifted);
          lo >>= GMP_NAIL_BITS;
          ADDC_LIMB (cbit, sum, hi, lo);
          cin += cbit;
          lo = next_lo;

          /* Continue only if the sum is GMP_NUMB_MAX.  GMP_NUMB_MAX is the
             only value a carry from below can propagate across.  If we've
             just seen the carry out (ie. cbit!=0) then sum!=GMP_NUMB_MAX,
             so this test stops us for that case too.  */
          if (LIKELY (sum != GMP_NUMB_MAX))
            break;
        }

      up += excess;
      size = prec;
    }

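  /* Multiply the (possibly shortened) operand by v, folding in the
     carry-in from the discarded low limbs.  A native mpn_mul_1c takes the
     carry directly, otherwise it is added to the product afterwards.  */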
  rp = r->_mp_d;
#if HAVE_NATIVE_mpn_mul_1c
  cy_limb = mpn_mul_1c (rp, up, size, vl, cin);
#else
  cy_limb = mpn_mul_1 (rp, up, size, vl);
  __GMPN_ADD_1 (cbit, rp, rp, size, cin);
  cy_limb += cbit;
#endif
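  /* A non-zero carry out becomes a new high limb, in which case the
     exponent and limb count each grow by one.  */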
  rp[size] = cy_limb;
  cy_limb = cy_limb != 0;
  r->_mp_exp = u->_mp_exp + cy_limb;
  size += cy_limb;
  r->_mp_size = usize >= 0 ? size : -size;
}