1*627f7eb2Smrg /* mpn_divrem -- Divide natural numbers, producing both remainder and
2*627f7eb2Smrg quotient.
3*627f7eb2Smrg
4*627f7eb2Smrg Copyright (C) 1993, 1994, 1995, 1996 Free Software Foundation, Inc.
5*627f7eb2Smrg
6*627f7eb2Smrg This file is part of the GNU MP Library.
7*627f7eb2Smrg
8*627f7eb2Smrg The GNU MP Library is free software; you can redistribute it and/or modify
9*627f7eb2Smrg it under the terms of the GNU Lesser General Public License as published by
10*627f7eb2Smrg the Free Software Foundation; either version 2.1 of the License, or (at your
11*627f7eb2Smrg option) any later version.
12*627f7eb2Smrg
13*627f7eb2Smrg The GNU MP Library is distributed in the hope that it will be useful, but
14*627f7eb2Smrg WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
15*627f7eb2Smrg or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
16*627f7eb2Smrg License for more details.
17*627f7eb2Smrg
18*627f7eb2Smrg You should have received a copy of the GNU Lesser General Public License
19*627f7eb2Smrg along with the GNU MP Library; see the file COPYING.LIB. If not, write to
20*627f7eb2Smrg the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
21*627f7eb2Smrg MA 02111-1307, USA. */
22*627f7eb2Smrg
23*627f7eb2Smrg #include <config.h>
24*627f7eb2Smrg #include "gmp-impl.h"
25*627f7eb2Smrg
26*627f7eb2Smrg /* Divide num (NP/NSIZE) by den (DP/DSIZE) and write
27*627f7eb2Smrg the NSIZE-DSIZE least significant quotient limbs at QP
28*627f7eb2Smrg and the DSIZE long remainder at NP. If QEXTRA_LIMBS is
29*627f7eb2Smrg non-zero, generate that many fraction bits and append them after the
30*627f7eb2Smrg other quotient limbs.
31*627f7eb2Smrg Return the most significant limb of the quotient, this is always 0 or 1.
32*627f7eb2Smrg
33*627f7eb2Smrg Preconditions:
34*627f7eb2Smrg 0. NSIZE >= DSIZE.
35*627f7eb2Smrg 1. The most significant bit of the divisor must be set.
36*627f7eb2Smrg 2. QP must either not overlap with the input operands at all, or
37*627f7eb2Smrg QP + DSIZE >= NP must hold true. (This means that it's
38*627f7eb2Smrg possible to put the quotient in the high part of NUM, right after the
39*627f7eb2Smrg remainder in NUM.
40*627f7eb2Smrg 3. NSIZE >= DSIZE, even if QEXTRA_LIMBS is non-zero. */
41*627f7eb2Smrg
42*627f7eb2Smrg mp_limb_t
43*627f7eb2Smrg #if __STDC__
mpn_divrem(mp_ptr qp,mp_size_t qextra_limbs,mp_ptr np,mp_size_t nsize,mp_srcptr dp,mp_size_t dsize)44*627f7eb2Smrg mpn_divrem (mp_ptr qp, mp_size_t qextra_limbs,
45*627f7eb2Smrg mp_ptr np, mp_size_t nsize,
46*627f7eb2Smrg mp_srcptr dp, mp_size_t dsize)
47*627f7eb2Smrg #else
48*627f7eb2Smrg mpn_divrem (qp, qextra_limbs, np, nsize, dp, dsize)
49*627f7eb2Smrg mp_ptr qp;
50*627f7eb2Smrg mp_size_t qextra_limbs;
51*627f7eb2Smrg mp_ptr np;
52*627f7eb2Smrg mp_size_t nsize;
53*627f7eb2Smrg mp_srcptr dp;
54*627f7eb2Smrg mp_size_t dsize;
55*627f7eb2Smrg #endif
56*627f7eb2Smrg {
57*627f7eb2Smrg mp_limb_t most_significant_q_limb = 0;
58*627f7eb2Smrg
59*627f7eb2Smrg switch (dsize)
60*627f7eb2Smrg {
61*627f7eb2Smrg case 0:
62*627f7eb2Smrg /* We are asked to divide by zero, so go ahead and do it! (To make
63*627f7eb2Smrg the compiler not remove this statement, return the value.) */
64*627f7eb2Smrg return 1 / dsize;
65*627f7eb2Smrg
66*627f7eb2Smrg case 1:
67*627f7eb2Smrg {
68*627f7eb2Smrg mp_size_t i;
69*627f7eb2Smrg mp_limb_t n1;
70*627f7eb2Smrg mp_limb_t d;
71*627f7eb2Smrg
72*627f7eb2Smrg d = dp[0];
73*627f7eb2Smrg n1 = np[nsize - 1];
74*627f7eb2Smrg
75*627f7eb2Smrg if (n1 >= d)
76*627f7eb2Smrg {
77*627f7eb2Smrg n1 -= d;
78*627f7eb2Smrg most_significant_q_limb = 1;
79*627f7eb2Smrg }
80*627f7eb2Smrg
81*627f7eb2Smrg qp += qextra_limbs;
82*627f7eb2Smrg for (i = nsize - 2; i >= 0; i--)
83*627f7eb2Smrg udiv_qrnnd (qp[i], n1, n1, np[i], d);
84*627f7eb2Smrg qp -= qextra_limbs;
85*627f7eb2Smrg
86*627f7eb2Smrg for (i = qextra_limbs - 1; i >= 0; i--)
87*627f7eb2Smrg udiv_qrnnd (qp[i], n1, n1, 0, d);
88*627f7eb2Smrg
89*627f7eb2Smrg np[0] = n1;
90*627f7eb2Smrg }
91*627f7eb2Smrg break;
92*627f7eb2Smrg
93*627f7eb2Smrg case 2:
94*627f7eb2Smrg {
95*627f7eb2Smrg mp_size_t i;
96*627f7eb2Smrg mp_limb_t n1, n0, n2;
97*627f7eb2Smrg mp_limb_t d1, d0;
98*627f7eb2Smrg
99*627f7eb2Smrg np += nsize - 2;
100*627f7eb2Smrg d1 = dp[1];
101*627f7eb2Smrg d0 = dp[0];
102*627f7eb2Smrg n1 = np[1];
103*627f7eb2Smrg n0 = np[0];
104*627f7eb2Smrg
105*627f7eb2Smrg if (n1 >= d1 && (n1 > d1 || n0 >= d0))
106*627f7eb2Smrg {
107*627f7eb2Smrg sub_ddmmss (n1, n0, n1, n0, d1, d0);
108*627f7eb2Smrg most_significant_q_limb = 1;
109*627f7eb2Smrg }
110*627f7eb2Smrg
111*627f7eb2Smrg for (i = qextra_limbs + nsize - 2 - 1; i >= 0; i--)
112*627f7eb2Smrg {
113*627f7eb2Smrg mp_limb_t q;
114*627f7eb2Smrg mp_limb_t r;
115*627f7eb2Smrg
116*627f7eb2Smrg if (i >= qextra_limbs)
117*627f7eb2Smrg np--;
118*627f7eb2Smrg else
119*627f7eb2Smrg np[0] = 0;
120*627f7eb2Smrg
121*627f7eb2Smrg if (n1 == d1)
122*627f7eb2Smrg {
123*627f7eb2Smrg /* Q should be either 111..111 or 111..110. Need special
124*627f7eb2Smrg treatment of this rare case as normal division would
125*627f7eb2Smrg give overflow. */
126*627f7eb2Smrg q = ~(mp_limb_t) 0;
127*627f7eb2Smrg
128*627f7eb2Smrg r = n0 + d1;
129*627f7eb2Smrg if (r < d1) /* Carry in the addition? */
130*627f7eb2Smrg {
131*627f7eb2Smrg add_ssaaaa (n1, n0, r - d0, np[0], 0, d0);
132*627f7eb2Smrg qp[i] = q;
133*627f7eb2Smrg continue;
134*627f7eb2Smrg }
135*627f7eb2Smrg n1 = d0 - (d0 != 0);
136*627f7eb2Smrg n0 = -d0;
137*627f7eb2Smrg }
138*627f7eb2Smrg else
139*627f7eb2Smrg {
140*627f7eb2Smrg udiv_qrnnd (q, r, n1, n0, d1);
141*627f7eb2Smrg umul_ppmm (n1, n0, d0, q);
142*627f7eb2Smrg }
143*627f7eb2Smrg
144*627f7eb2Smrg n2 = np[0];
145*627f7eb2Smrg q_test:
146*627f7eb2Smrg if (n1 > r || (n1 == r && n0 > n2))
147*627f7eb2Smrg {
148*627f7eb2Smrg /* The estimated Q was too large. */
149*627f7eb2Smrg q--;
150*627f7eb2Smrg
151*627f7eb2Smrg sub_ddmmss (n1, n0, n1, n0, 0, d0);
152*627f7eb2Smrg r += d1;
153*627f7eb2Smrg if (r >= d1) /* If not carry, test Q again. */
154*627f7eb2Smrg goto q_test;
155*627f7eb2Smrg }
156*627f7eb2Smrg
157*627f7eb2Smrg qp[i] = q;
158*627f7eb2Smrg sub_ddmmss (n1, n0, r, n2, n1, n0);
159*627f7eb2Smrg }
160*627f7eb2Smrg np[1] = n1;
161*627f7eb2Smrg np[0] = n0;
162*627f7eb2Smrg }
163*627f7eb2Smrg break;
164*627f7eb2Smrg
165*627f7eb2Smrg default:
166*627f7eb2Smrg {
167*627f7eb2Smrg mp_size_t i;
168*627f7eb2Smrg mp_limb_t dX, d1, n0;
169*627f7eb2Smrg
170*627f7eb2Smrg np += nsize - dsize;
171*627f7eb2Smrg dX = dp[dsize - 1];
172*627f7eb2Smrg d1 = dp[dsize - 2];
173*627f7eb2Smrg n0 = np[dsize - 1];
174*627f7eb2Smrg
175*627f7eb2Smrg if (n0 >= dX)
176*627f7eb2Smrg {
177*627f7eb2Smrg if (n0 > dX || mpn_cmp (np, dp, dsize - 1) >= 0)
178*627f7eb2Smrg {
179*627f7eb2Smrg mpn_sub_n (np, np, dp, dsize);
180*627f7eb2Smrg n0 = np[dsize - 1];
181*627f7eb2Smrg most_significant_q_limb = 1;
182*627f7eb2Smrg }
183*627f7eb2Smrg }
184*627f7eb2Smrg
185*627f7eb2Smrg for (i = qextra_limbs + nsize - dsize - 1; i >= 0; i--)
186*627f7eb2Smrg {
187*627f7eb2Smrg mp_limb_t q;
188*627f7eb2Smrg mp_limb_t n1, n2;
189*627f7eb2Smrg mp_limb_t cy_limb;
190*627f7eb2Smrg
191*627f7eb2Smrg if (i >= qextra_limbs)
192*627f7eb2Smrg {
193*627f7eb2Smrg np--;
194*627f7eb2Smrg n2 = np[dsize];
195*627f7eb2Smrg }
196*627f7eb2Smrg else
197*627f7eb2Smrg {
198*627f7eb2Smrg n2 = np[dsize - 1];
199*627f7eb2Smrg MPN_COPY_DECR (np + 1, np, dsize);
200*627f7eb2Smrg np[0] = 0;
201*627f7eb2Smrg }
202*627f7eb2Smrg
203*627f7eb2Smrg if (n0 == dX)
204*627f7eb2Smrg /* This might over-estimate q, but it's probably not worth
205*627f7eb2Smrg the extra code here to find out. */
206*627f7eb2Smrg q = ~(mp_limb_t) 0;
207*627f7eb2Smrg else
208*627f7eb2Smrg {
209*627f7eb2Smrg mp_limb_t r;
210*627f7eb2Smrg
211*627f7eb2Smrg udiv_qrnnd (q, r, n0, np[dsize - 1], dX);
212*627f7eb2Smrg umul_ppmm (n1, n0, d1, q);
213*627f7eb2Smrg
214*627f7eb2Smrg while (n1 > r || (n1 == r && n0 > np[dsize - 2]))
215*627f7eb2Smrg {
216*627f7eb2Smrg q--;
217*627f7eb2Smrg r += dX;
218*627f7eb2Smrg if (r < dX) /* I.e. "carry in previous addition?" */
219*627f7eb2Smrg break;
220*627f7eb2Smrg n1 -= n0 < d1;
221*627f7eb2Smrg n0 -= d1;
222*627f7eb2Smrg }
223*627f7eb2Smrg }
224*627f7eb2Smrg
225*627f7eb2Smrg /* Possible optimization: We already have (q * n0) and (1 * n1)
226*627f7eb2Smrg after the calculation of q. Taking advantage of that, we
227*627f7eb2Smrg could make this loop make two iterations less. */
228*627f7eb2Smrg
229*627f7eb2Smrg cy_limb = mpn_submul_1 (np, dp, dsize, q);
230*627f7eb2Smrg
231*627f7eb2Smrg if (n2 != cy_limb)
232*627f7eb2Smrg {
233*627f7eb2Smrg mpn_add_n (np, np, dp, dsize);
234*627f7eb2Smrg q--;
235*627f7eb2Smrg }
236*627f7eb2Smrg
237*627f7eb2Smrg qp[i] = q;
238*627f7eb2Smrg n0 = np[dsize - 1];
239*627f7eb2Smrg }
240*627f7eb2Smrg }
241*627f7eb2Smrg }
242*627f7eb2Smrg
243*627f7eb2Smrg return most_significant_q_limb;
244*627f7eb2Smrg }
245