/* xref: /dflybsd-src/contrib/gmp/mpn/generic/gcd_lehmer.c (revision 86d7f5d305c6adaa56ff4582ece9859d73106103) */
/* gcd_lehmer.c.

   THE FUNCTIONS IN THIS FILE ARE INTERNAL WITH MUTABLE INTERFACES.  IT IS ONLY
   SAFE TO REACH THEM THROUGH DOCUMENTED INTERFACES.  IN FACT, IT IS ALMOST
   GUARANTEED THAT THEY'LL CHANGE OR DISAPPEAR IN A FUTURE GNU MP RELEASE.

Copyright 2003, 2004, 2005, 2008 Free Software Foundation, Inc.

This file is part of the GNU MP Library.

The GNU MP Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MP Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.  */

#include "gmp.h"
#include "gmp-impl.h"
#include "longlong.h"

2886d7f5d3SJohn Marino /* Use binary algorithm to compute G <-- GCD (U, V) for usize, vsize == 2.
2986d7f5d3SJohn Marino    Both U and V must be odd. */
3086d7f5d3SJohn Marino static inline mp_size_t
gcd_2(mp_ptr gp,mp_srcptr up,mp_srcptr vp)3186d7f5d3SJohn Marino gcd_2 (mp_ptr gp, mp_srcptr up, mp_srcptr vp)
3286d7f5d3SJohn Marino {
3386d7f5d3SJohn Marino   mp_limb_t u0, u1, v0, v1;
3486d7f5d3SJohn Marino   mp_size_t gn;
3586d7f5d3SJohn Marino 
3686d7f5d3SJohn Marino   u0 = up[0];
3786d7f5d3SJohn Marino   u1 = up[1];
3886d7f5d3SJohn Marino   v0 = vp[0];
3986d7f5d3SJohn Marino   v1 = vp[1];
4086d7f5d3SJohn Marino 
4186d7f5d3SJohn Marino   ASSERT (u0 & 1);
4286d7f5d3SJohn Marino   ASSERT (v0 & 1);
4386d7f5d3SJohn Marino 
4486d7f5d3SJohn Marino   /* Check for u0 != v0 needed to ensure that argument to
4586d7f5d3SJohn Marino    * count_trailing_zeros is non-zero. */
4686d7f5d3SJohn Marino   while (u1 != v1 && u0 != v0)
4786d7f5d3SJohn Marino     {
4886d7f5d3SJohn Marino       unsigned long int r;
4986d7f5d3SJohn Marino       if (u1 > v1)
5086d7f5d3SJohn Marino 	{
5186d7f5d3SJohn Marino 	  u1 -= v1 + (u0 < v0);
5286d7f5d3SJohn Marino 	  u0 = (u0 - v0) & GMP_NUMB_MASK;
5386d7f5d3SJohn Marino 	  count_trailing_zeros (r, u0);
5486d7f5d3SJohn Marino 	  u0 = ((u1 << (GMP_NUMB_BITS - r)) & GMP_NUMB_MASK) | (u0 >> r);
5586d7f5d3SJohn Marino 	  u1 >>= r;
5686d7f5d3SJohn Marino 	}
5786d7f5d3SJohn Marino       else  /* u1 < v1.  */
5886d7f5d3SJohn Marino 	{
5986d7f5d3SJohn Marino 	  v1 -= u1 + (v0 < u0);
6086d7f5d3SJohn Marino 	  v0 = (v0 - u0) & GMP_NUMB_MASK;
6186d7f5d3SJohn Marino 	  count_trailing_zeros (r, v0);
6286d7f5d3SJohn Marino 	  v0 = ((v1 << (GMP_NUMB_BITS - r)) & GMP_NUMB_MASK) | (v0 >> r);
6386d7f5d3SJohn Marino 	  v1 >>= r;
6486d7f5d3SJohn Marino 	}
6586d7f5d3SJohn Marino     }
6686d7f5d3SJohn Marino 
6786d7f5d3SJohn Marino   gp[0] = u0, gp[1] = u1, gn = 1 + (u1 != 0);
6886d7f5d3SJohn Marino 
6986d7f5d3SJohn Marino   /* If U == V == GCD, done.  Otherwise, compute GCD (V, |U - V|).  */
7086d7f5d3SJohn Marino   if (u1 == v1 && u0 == v0)
7186d7f5d3SJohn Marino     return gn;
7286d7f5d3SJohn Marino 
7386d7f5d3SJohn Marino   v0 = (u0 == v0) ? ((u1 > v1) ? u1-v1 : v1-u1) : ((u0 > v0) ? u0-v0 : v0-u0);
7486d7f5d3SJohn Marino   gp[0] = mpn_gcd_1 (gp, gn, v0);
7586d7f5d3SJohn Marino 
7686d7f5d3SJohn Marino   return 1;
7786d7f5d3SJohn Marino }
7886d7f5d3SJohn Marino 
7986d7f5d3SJohn Marino /* Temporary storage: n */
8086d7f5d3SJohn Marino mp_size_t
mpn_gcd_lehmer_n(mp_ptr gp,mp_ptr ap,mp_ptr bp,mp_size_t n,mp_ptr tp)8186d7f5d3SJohn Marino mpn_gcd_lehmer_n (mp_ptr gp, mp_ptr ap, mp_ptr bp, mp_size_t n, mp_ptr tp)
8286d7f5d3SJohn Marino {
8386d7f5d3SJohn Marino   /* Relax this requirement, and normalize at the start? Must disallow
8486d7f5d3SJohn Marino      A = B = 0, though. */
8586d7f5d3SJohn Marino   ASSERT(ap[n-1] > 0 || bp[n-1] > 0);
8686d7f5d3SJohn Marino 
8786d7f5d3SJohn Marino   while (n > 2)
8886d7f5d3SJohn Marino     {
8986d7f5d3SJohn Marino       struct hgcd_matrix1 M;
9086d7f5d3SJohn Marino       mp_limb_t ah, al, bh, bl;
9186d7f5d3SJohn Marino       mp_limb_t mask;
9286d7f5d3SJohn Marino 
9386d7f5d3SJohn Marino       mask = ap[n-1] | bp[n-1];
9486d7f5d3SJohn Marino       ASSERT (mask > 0);
9586d7f5d3SJohn Marino 
9686d7f5d3SJohn Marino       if (mask & GMP_NUMB_HIGHBIT)
9786d7f5d3SJohn Marino 	{
9886d7f5d3SJohn Marino 	  ah = ap[n-1]; al = ap[n-2];
9986d7f5d3SJohn Marino 	  bh = bp[n-1]; bl = bp[n-2];
10086d7f5d3SJohn Marino 	}
10186d7f5d3SJohn Marino       else
10286d7f5d3SJohn Marino 	{
10386d7f5d3SJohn Marino 	  int shift;
10486d7f5d3SJohn Marino 
10586d7f5d3SJohn Marino 	  count_leading_zeros (shift, mask);
10686d7f5d3SJohn Marino 	  ah = MPN_EXTRACT_NUMB (shift, ap[n-1], ap[n-2]);
10786d7f5d3SJohn Marino 	  al = MPN_EXTRACT_NUMB (shift, ap[n-2], ap[n-3]);
10886d7f5d3SJohn Marino 	  bh = MPN_EXTRACT_NUMB (shift, bp[n-1], bp[n-2]);
10986d7f5d3SJohn Marino 	  bl = MPN_EXTRACT_NUMB (shift, bp[n-2], bp[n-3]);
11086d7f5d3SJohn Marino 	}
11186d7f5d3SJohn Marino 
11286d7f5d3SJohn Marino       /* Try an mpn_nhgcd2 step */
11386d7f5d3SJohn Marino       if (mpn_hgcd2 (ah, al, bh, bl, &M))
11486d7f5d3SJohn Marino 	{
11586d7f5d3SJohn Marino 	  n = mpn_hgcd_mul_matrix1_inverse_vector (&M, tp, ap, bp, n);
11686d7f5d3SJohn Marino 	  MP_PTR_SWAP (ap, tp);
11786d7f5d3SJohn Marino 	}
11886d7f5d3SJohn Marino       else
11986d7f5d3SJohn Marino 	{
12086d7f5d3SJohn Marino 	  /* mpn_hgcd2 has failed. Then either one of a or b is very
12186d7f5d3SJohn Marino 	     small, or the difference is very small. Perform one
12286d7f5d3SJohn Marino 	     subtraction followed by one division. */
12386d7f5d3SJohn Marino 	  mp_size_t gn;
12486d7f5d3SJohn Marino 
12586d7f5d3SJohn Marino 	  /* Temporary storage n */
12686d7f5d3SJohn Marino 	  n = mpn_gcd_subdiv_step (gp, &gn, ap, bp, n, tp);
12786d7f5d3SJohn Marino 	  if (n == 0)
12886d7f5d3SJohn Marino 	    return gn;
12986d7f5d3SJohn Marino 	}
13086d7f5d3SJohn Marino     }
13186d7f5d3SJohn Marino 
13286d7f5d3SJohn Marino   if (n == 1)
13386d7f5d3SJohn Marino     {
13486d7f5d3SJohn Marino       *gp = mpn_gcd_1(ap, 1, bp[0]);
13586d7f5d3SJohn Marino       return 1;
13686d7f5d3SJohn Marino     }
13786d7f5d3SJohn Marino 
13886d7f5d3SJohn Marino   /* Due to the calling convention for mpn_gcd, at most one can be
13986d7f5d3SJohn Marino      even. */
14086d7f5d3SJohn Marino 
14186d7f5d3SJohn Marino   if (! (ap[0] & 1))
14286d7f5d3SJohn Marino     MP_PTR_SWAP (ap, bp);
14386d7f5d3SJohn Marino 
14486d7f5d3SJohn Marino   ASSERT (ap[0] & 1);
14586d7f5d3SJohn Marino 
14686d7f5d3SJohn Marino   if (bp[0] == 0)
14786d7f5d3SJohn Marino     {
14886d7f5d3SJohn Marino       *gp = mpn_gcd_1 (ap, 2, bp[1]);
14986d7f5d3SJohn Marino       return 1;
15086d7f5d3SJohn Marino     }
15186d7f5d3SJohn Marino   else if (! (bp[0] & 1))
15286d7f5d3SJohn Marino     {
15386d7f5d3SJohn Marino       int r;
15486d7f5d3SJohn Marino       count_trailing_zeros (r, bp[0]);
15586d7f5d3SJohn Marino       bp[0] = ((bp[1] << (GMP_NUMB_BITS - r)) & GMP_NUMB_MASK) | (bp[0] >> r);
15686d7f5d3SJohn Marino       bp[1] >>= r;
15786d7f5d3SJohn Marino     }
15886d7f5d3SJohn Marino 
15986d7f5d3SJohn Marino   return gcd_2(gp, ap, bp);
16086d7f5d3SJohn Marino }
161