/* gcd_lehmer.c.

   THE FUNCTIONS IN THIS FILE ARE INTERNAL WITH MUTABLE INTERFACES.  IT IS ONLY
   SAFE TO REACH THEM THROUGH DOCUMENTED INTERFACES.  IN FACT, IT IS ALMOST
   GUARANTEED THAT THEY'LL CHANGE OR DISAPPEAR IN A FUTURE GNU MP RELEASE.

Copyright 2003, 2004, 2005, 2008 Free Software Foundation, Inc.

This file is part of the GNU MP Library.

The GNU MP Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MP Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MP Library.  If not, see http://www.gnu.org/licenses/.  */
2386d7f5d3SJohn Marino
2486d7f5d3SJohn Marino #include "gmp.h"
2586d7f5d3SJohn Marino #include "gmp-impl.h"
2686d7f5d3SJohn Marino #include "longlong.h"
2786d7f5d3SJohn Marino
2886d7f5d3SJohn Marino /* Use binary algorithm to compute G <-- GCD (U, V) for usize, vsize == 2.
2986d7f5d3SJohn Marino Both U and V must be odd. */
3086d7f5d3SJohn Marino static inline mp_size_t
gcd_2(mp_ptr gp,mp_srcptr up,mp_srcptr vp)3186d7f5d3SJohn Marino gcd_2 (mp_ptr gp, mp_srcptr up, mp_srcptr vp)
3286d7f5d3SJohn Marino {
3386d7f5d3SJohn Marino mp_limb_t u0, u1, v0, v1;
3486d7f5d3SJohn Marino mp_size_t gn;
3586d7f5d3SJohn Marino
3686d7f5d3SJohn Marino u0 = up[0];
3786d7f5d3SJohn Marino u1 = up[1];
3886d7f5d3SJohn Marino v0 = vp[0];
3986d7f5d3SJohn Marino v1 = vp[1];
4086d7f5d3SJohn Marino
4186d7f5d3SJohn Marino ASSERT (u0 & 1);
4286d7f5d3SJohn Marino ASSERT (v0 & 1);
4386d7f5d3SJohn Marino
4486d7f5d3SJohn Marino /* Check for u0 != v0 needed to ensure that argument to
4586d7f5d3SJohn Marino * count_trailing_zeros is non-zero. */
4686d7f5d3SJohn Marino while (u1 != v1 && u0 != v0)
4786d7f5d3SJohn Marino {
4886d7f5d3SJohn Marino unsigned long int r;
4986d7f5d3SJohn Marino if (u1 > v1)
5086d7f5d3SJohn Marino {
5186d7f5d3SJohn Marino u1 -= v1 + (u0 < v0);
5286d7f5d3SJohn Marino u0 = (u0 - v0) & GMP_NUMB_MASK;
5386d7f5d3SJohn Marino count_trailing_zeros (r, u0);
5486d7f5d3SJohn Marino u0 = ((u1 << (GMP_NUMB_BITS - r)) & GMP_NUMB_MASK) | (u0 >> r);
5586d7f5d3SJohn Marino u1 >>= r;
5686d7f5d3SJohn Marino }
5786d7f5d3SJohn Marino else /* u1 < v1. */
5886d7f5d3SJohn Marino {
5986d7f5d3SJohn Marino v1 -= u1 + (v0 < u0);
6086d7f5d3SJohn Marino v0 = (v0 - u0) & GMP_NUMB_MASK;
6186d7f5d3SJohn Marino count_trailing_zeros (r, v0);
6286d7f5d3SJohn Marino v0 = ((v1 << (GMP_NUMB_BITS - r)) & GMP_NUMB_MASK) | (v0 >> r);
6386d7f5d3SJohn Marino v1 >>= r;
6486d7f5d3SJohn Marino }
6586d7f5d3SJohn Marino }
6686d7f5d3SJohn Marino
6786d7f5d3SJohn Marino gp[0] = u0, gp[1] = u1, gn = 1 + (u1 != 0);
6886d7f5d3SJohn Marino
6986d7f5d3SJohn Marino /* If U == V == GCD, done. Otherwise, compute GCD (V, |U - V|). */
7086d7f5d3SJohn Marino if (u1 == v1 && u0 == v0)
7186d7f5d3SJohn Marino return gn;
7286d7f5d3SJohn Marino
7386d7f5d3SJohn Marino v0 = (u0 == v0) ? ((u1 > v1) ? u1-v1 : v1-u1) : ((u0 > v0) ? u0-v0 : v0-u0);
7486d7f5d3SJohn Marino gp[0] = mpn_gcd_1 (gp, gn, v0);
7586d7f5d3SJohn Marino
7686d7f5d3SJohn Marino return 1;
7786d7f5d3SJohn Marino }
7886d7f5d3SJohn Marino
7986d7f5d3SJohn Marino /* Temporary storage: n */
8086d7f5d3SJohn Marino mp_size_t
mpn_gcd_lehmer_n(mp_ptr gp,mp_ptr ap,mp_ptr bp,mp_size_t n,mp_ptr tp)8186d7f5d3SJohn Marino mpn_gcd_lehmer_n (mp_ptr gp, mp_ptr ap, mp_ptr bp, mp_size_t n, mp_ptr tp)
8286d7f5d3SJohn Marino {
8386d7f5d3SJohn Marino /* Relax this requirement, and normalize at the start? Must disallow
8486d7f5d3SJohn Marino A = B = 0, though. */
8586d7f5d3SJohn Marino ASSERT(ap[n-1] > 0 || bp[n-1] > 0);
8686d7f5d3SJohn Marino
8786d7f5d3SJohn Marino while (n > 2)
8886d7f5d3SJohn Marino {
8986d7f5d3SJohn Marino struct hgcd_matrix1 M;
9086d7f5d3SJohn Marino mp_limb_t ah, al, bh, bl;
9186d7f5d3SJohn Marino mp_limb_t mask;
9286d7f5d3SJohn Marino
9386d7f5d3SJohn Marino mask = ap[n-1] | bp[n-1];
9486d7f5d3SJohn Marino ASSERT (mask > 0);
9586d7f5d3SJohn Marino
9686d7f5d3SJohn Marino if (mask & GMP_NUMB_HIGHBIT)
9786d7f5d3SJohn Marino {
9886d7f5d3SJohn Marino ah = ap[n-1]; al = ap[n-2];
9986d7f5d3SJohn Marino bh = bp[n-1]; bl = bp[n-2];
10086d7f5d3SJohn Marino }
10186d7f5d3SJohn Marino else
10286d7f5d3SJohn Marino {
10386d7f5d3SJohn Marino int shift;
10486d7f5d3SJohn Marino
10586d7f5d3SJohn Marino count_leading_zeros (shift, mask);
10686d7f5d3SJohn Marino ah = MPN_EXTRACT_NUMB (shift, ap[n-1], ap[n-2]);
10786d7f5d3SJohn Marino al = MPN_EXTRACT_NUMB (shift, ap[n-2], ap[n-3]);
10886d7f5d3SJohn Marino bh = MPN_EXTRACT_NUMB (shift, bp[n-1], bp[n-2]);
10986d7f5d3SJohn Marino bl = MPN_EXTRACT_NUMB (shift, bp[n-2], bp[n-3]);
11086d7f5d3SJohn Marino }
11186d7f5d3SJohn Marino
11286d7f5d3SJohn Marino /* Try an mpn_nhgcd2 step */
11386d7f5d3SJohn Marino if (mpn_hgcd2 (ah, al, bh, bl, &M))
11486d7f5d3SJohn Marino {
11586d7f5d3SJohn Marino n = mpn_hgcd_mul_matrix1_inverse_vector (&M, tp, ap, bp, n);
11686d7f5d3SJohn Marino MP_PTR_SWAP (ap, tp);
11786d7f5d3SJohn Marino }
11886d7f5d3SJohn Marino else
11986d7f5d3SJohn Marino {
12086d7f5d3SJohn Marino /* mpn_hgcd2 has failed. Then either one of a or b is very
12186d7f5d3SJohn Marino small, or the difference is very small. Perform one
12286d7f5d3SJohn Marino subtraction followed by one division. */
12386d7f5d3SJohn Marino mp_size_t gn;
12486d7f5d3SJohn Marino
12586d7f5d3SJohn Marino /* Temporary storage n */
12686d7f5d3SJohn Marino n = mpn_gcd_subdiv_step (gp, &gn, ap, bp, n, tp);
12786d7f5d3SJohn Marino if (n == 0)
12886d7f5d3SJohn Marino return gn;
12986d7f5d3SJohn Marino }
13086d7f5d3SJohn Marino }
13186d7f5d3SJohn Marino
13286d7f5d3SJohn Marino if (n == 1)
13386d7f5d3SJohn Marino {
13486d7f5d3SJohn Marino *gp = mpn_gcd_1(ap, 1, bp[0]);
13586d7f5d3SJohn Marino return 1;
13686d7f5d3SJohn Marino }
13786d7f5d3SJohn Marino
13886d7f5d3SJohn Marino /* Due to the calling convention for mpn_gcd, at most one can be
13986d7f5d3SJohn Marino even. */
14086d7f5d3SJohn Marino
14186d7f5d3SJohn Marino if (! (ap[0] & 1))
14286d7f5d3SJohn Marino MP_PTR_SWAP (ap, bp);
14386d7f5d3SJohn Marino
14486d7f5d3SJohn Marino ASSERT (ap[0] & 1);
14586d7f5d3SJohn Marino
14686d7f5d3SJohn Marino if (bp[0] == 0)
14786d7f5d3SJohn Marino {
14886d7f5d3SJohn Marino *gp = mpn_gcd_1 (ap, 2, bp[1]);
14986d7f5d3SJohn Marino return 1;
15086d7f5d3SJohn Marino }
15186d7f5d3SJohn Marino else if (! (bp[0] & 1))
15286d7f5d3SJohn Marino {
15386d7f5d3SJohn Marino int r;
15486d7f5d3SJohn Marino count_trailing_zeros (r, bp[0]);
15586d7f5d3SJohn Marino bp[0] = ((bp[1] << (GMP_NUMB_BITS - r)) & GMP_NUMB_MASK) | (bp[0] >> r);
15686d7f5d3SJohn Marino bp[1] >>= r;
15786d7f5d3SJohn Marino }
15886d7f5d3SJohn Marino
15986d7f5d3SJohn Marino return gcd_2(gp, ap, bp);
16086d7f5d3SJohn Marino }
161