gmp/mpz/cong.c

*86d7f5d3SJohn Marino/* mpz_congruent_p -- test congruence of two mpz's.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoCopyright 2001, 2002, 2005 Free Software Foundation, Inc.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoThis file is part of the GNU MP Library.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoThe GNU MP Library is free software; you can redistribute it and/or modify
*86d7f5d3SJohn Marinoit under the terms of the GNU Lesser General Public License as published by
*86d7f5d3SJohn Marinothe Free Software Foundation; either version 3 of the License, or (at your
*86d7f5d3SJohn Marinooption) any later version.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoThe GNU MP Library is distributed in the hope that it will be useful, but
*86d7f5d3SJohn MarinoWITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
*86d7f5d3SJohn Marinoor FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
*86d7f5d3SJohn MarinoLicense for more details.
*86d7f5d3SJohn Marino
*86d7f5d3SJohn MarinoYou should have received a copy of the GNU Lesser General Public License
*86d7f5d3SJohn Marinoalong with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.  */
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino#include "gmp.h"
*86d7f5d3SJohn Marino#include "gmp-impl.h"
*86d7f5d3SJohn Marino#include "longlong.h"
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino
/* For big divisors this code is only very slightly better than the user
   doing a combination of mpz_sub and mpz_tdiv_r, but it's quite convenient,
   and in the future it could perhaps be improved in ways similar to
   mpn_divisible_p.

   The csize==1 / dsize==1 special case makes mpz_congruent_p as good as
   mpz_congruent_ui_p on relevant operands, though such a combination
   probably doesn't occur often.

   Alternatives:

   If c<d then it'd work to just form a%d and compare a and c (either as
   a==c or a+c==d depending on the signs), but the saving from avoiding the
   abs(a-c) calculation would be small compared to the division.

   Similarly if both a<d and c<d then it would work to just compare a and c
   (a==c or a+c==d), but this isn't considered a particularly important case
   and so isn't done for the moment.

   Low zero limbs on d could be stripped and the corresponding limbs of a
   and c tested and skipped, but doing so would introduce a borrow when a
   and c differ in sign and have non-zero skipped limbs.  It doesn't seem
   worth the complications to do this, since low zero limbs on d should
   occur only rarely.  */
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marinoint
*86d7f5d3SJohn Marinompz_congruent_p (mpz_srcptr a, mpz_srcptr c, mpz_srcptr d)
*86d7f5d3SJohn Marino{
*86d7f5d3SJohn Marino  mp_size_t  asize, csize, dsize, sign;
*86d7f5d3SJohn Marino  mp_srcptr  ap, cp, dp;
*86d7f5d3SJohn Marino  mp_ptr     xp;
*86d7f5d3SJohn Marino  mp_limb_t  alow, clow, dlow, dmask, r;
*86d7f5d3SJohn Marino  int        result;
*86d7f5d3SJohn Marino  TMP_DECL;
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  dsize = SIZ(d);
*86d7f5d3SJohn Marino  if (UNLIKELY (dsize == 0))
*86d7f5d3SJohn Marino    return (mpz_cmp (a, c) == 0);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  dsize = ABS(dsize);
*86d7f5d3SJohn Marino  dp = PTR(d);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  if (ABSIZ(a) < ABSIZ(c))
*86d7f5d3SJohn Marino    MPZ_SRCPTR_SWAP (a, c);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  asize = SIZ(a);
*86d7f5d3SJohn Marino  csize = SIZ(c);
*86d7f5d3SJohn Marino  sign = (asize ^ csize);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  asize = ABS(asize);
*86d7f5d3SJohn Marino  ap = PTR(a);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  if (csize == 0)
*86d7f5d3SJohn Marino    return mpn_divisible_p (ap, asize, dp, dsize);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  csize = ABS(csize);
*86d7f5d3SJohn Marino  cp = PTR(c);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  alow = ap[0];
*86d7f5d3SJohn Marino  clow = cp[0];
*86d7f5d3SJohn Marino  dlow = dp[0];
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  /* Check a==c mod low zero bits of dlow.  This might catch a few cases of
*86d7f5d3SJohn Marino     a!=c quickly, and it helps the csize==1 special cases below.  */
*86d7f5d3SJohn Marino  dmask = LOW_ZEROS_MASK (dlow) & GMP_NUMB_MASK;
*86d7f5d3SJohn Marino  alow = (sign >= 0 ? alow : -alow);
*86d7f5d3SJohn Marino  if (((alow-clow) & dmask) != 0)
*86d7f5d3SJohn Marino    return 0;
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  if (csize == 1)
*86d7f5d3SJohn Marino    {
*86d7f5d3SJohn Marino      if (dsize == 1)
*86d7f5d3SJohn Marino        {
*86d7f5d3SJohn Marino        cong_1:
*86d7f5d3SJohn Marino          if (sign < 0)
*86d7f5d3SJohn Marino            NEG_MOD (clow, clow, dlow);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino          if (ABOVE_THRESHOLD (asize, BMOD_1_TO_MOD_1_THRESHOLD))
*86d7f5d3SJohn Marino            {
*86d7f5d3SJohn Marino              r = mpn_mod_1 (ap, asize, dlow);
*86d7f5d3SJohn Marino              if (clow < dlow)
*86d7f5d3SJohn Marino                return r == clow;
*86d7f5d3SJohn Marino              else
*86d7f5d3SJohn Marino                return r == (clow % dlow);
*86d7f5d3SJohn Marino            }
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino          if ((dlow & 1) == 0)
*86d7f5d3SJohn Marino            {
*86d7f5d3SJohn Marino              /* Strip low zero bits to get odd d required by modexact.  If
*86d7f5d3SJohn Marino                 d==e*2^n then a==c mod d if and only if both a==c mod e and
*86d7f5d3SJohn Marino                 a==c mod 2^n, the latter having been done above.  */
*86d7f5d3SJohn Marino              unsigned  twos;
*86d7f5d3SJohn Marino              count_trailing_zeros (twos, dlow);
*86d7f5d3SJohn Marino              dlow >>= twos;
*86d7f5d3SJohn Marino            }
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino          r = mpn_modexact_1c_odd (ap, asize, dlow, clow);
*86d7f5d3SJohn Marino          return r == 0 || r == dlow;
*86d7f5d3SJohn Marino        }
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino      /* dlow==0 is avoided since we don't want to bother handling extra low
*86d7f5d3SJohn Marino         zero bits if dsecond is even (would involve borrow if a,c differ in
*86d7f5d3SJohn Marino         sign and alow,clow!=0).  */
*86d7f5d3SJohn Marino      if (dsize == 2 && dlow != 0)
*86d7f5d3SJohn Marino        {
*86d7f5d3SJohn Marino          mp_limb_t  dsecond = dp[1];
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino          if (dsecond <= dmask)
*86d7f5d3SJohn Marino            {
*86d7f5d3SJohn Marino              unsigned   twos;
*86d7f5d3SJohn Marino              count_trailing_zeros (twos, dlow);
*86d7f5d3SJohn Marino              dlow = (dlow >> twos) | (dsecond << (GMP_NUMB_BITS-twos));
*86d7f5d3SJohn Marino              ASSERT_LIMB (dlow);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino              /* dlow will be odd here, so the test for it even under cong_1
*86d7f5d3SJohn Marino                 is unnecessary, but the rest of that code is wanted. */
*86d7f5d3SJohn Marino              goto cong_1;
*86d7f5d3SJohn Marino            }
*86d7f5d3SJohn Marino        }
*86d7f5d3SJohn Marino    }
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  TMP_MARK;
*86d7f5d3SJohn Marino  xp = TMP_ALLOC_LIMBS (asize+1);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  /* calculate abs(a-c) */
*86d7f5d3SJohn Marino  if (sign >= 0)
*86d7f5d3SJohn Marino    {
*86d7f5d3SJohn Marino      /* same signs, subtract */
*86d7f5d3SJohn Marino      if (asize > csize || mpn_cmp (ap, cp, asize) >= 0)
*86d7f5d3SJohn Marino        ASSERT_NOCARRY (mpn_sub (xp, ap, asize, cp, csize));
*86d7f5d3SJohn Marino      else
*86d7f5d3SJohn Marino        ASSERT_NOCARRY (mpn_sub_n (xp, cp, ap, asize));
*86d7f5d3SJohn Marino      MPN_NORMALIZE (xp, asize);
*86d7f5d3SJohn Marino    }
*86d7f5d3SJohn Marino  else
*86d7f5d3SJohn Marino    {
*86d7f5d3SJohn Marino      /* different signs, add */
*86d7f5d3SJohn Marino      mp_limb_t  carry;
*86d7f5d3SJohn Marino      carry = mpn_add (xp, ap, asize, cp, csize);
*86d7f5d3SJohn Marino      xp[asize] = carry;
*86d7f5d3SJohn Marino      asize += (carry != 0);
*86d7f5d3SJohn Marino    }
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  result = mpn_divisible_p (xp, asize, dp, dsize);
*86d7f5d3SJohn Marino
*86d7f5d3SJohn Marino  TMP_FREE;
*86d7f5d3SJohn Marino  return result;
*86d7f5d3SJohn Marino}