#include "os.h"
#include <mp.h>
#include "dat.h"

5*37da2899SCharles.Forsyth #define LO(x) ((x) & ((1<<(Dbits/2))-1))
6*37da2899SCharles.Forsyth #define HI(x) ((x) >> (Dbits/2))
7*37da2899SCharles.Forsyth
8*37da2899SCharles.Forsyth static void
mpdigmul(mpdigit a,mpdigit b,mpdigit * p)9*37da2899SCharles.Forsyth mpdigmul(mpdigit a, mpdigit b, mpdigit *p)
10*37da2899SCharles.Forsyth {
11*37da2899SCharles.Forsyth mpdigit x, ah, al, bh, bl, p1, p2, p3, p4;
12*37da2899SCharles.Forsyth int carry;
13*37da2899SCharles.Forsyth
14*37da2899SCharles.Forsyth // half digits
15*37da2899SCharles.Forsyth ah = HI(a);
16*37da2899SCharles.Forsyth al = LO(a);
17*37da2899SCharles.Forsyth bh = HI(b);
18*37da2899SCharles.Forsyth bl = LO(b);
19*37da2899SCharles.Forsyth
20*37da2899SCharles.Forsyth // partial products
21*37da2899SCharles.Forsyth p1 = ah*bl;
22*37da2899SCharles.Forsyth p2 = bh*al;
23*37da2899SCharles.Forsyth p3 = bl*al;
24*37da2899SCharles.Forsyth p4 = ah*bh;
25*37da2899SCharles.Forsyth
26*37da2899SCharles.Forsyth // p = ((p1+p2)<<(Dbits/2)) + (p4<<Dbits) + p3
27*37da2899SCharles.Forsyth carry = 0;
28*37da2899SCharles.Forsyth x = p1<<(Dbits/2);
29*37da2899SCharles.Forsyth p3 += x;
30*37da2899SCharles.Forsyth if(p3 < x)
31*37da2899SCharles.Forsyth carry++;
32*37da2899SCharles.Forsyth x = p2<<(Dbits/2);
33*37da2899SCharles.Forsyth p3 += x;
34*37da2899SCharles.Forsyth if(p3 < x)
35*37da2899SCharles.Forsyth carry++;
36*37da2899SCharles.Forsyth p4 += carry + HI(p1) + HI(p2); // can't carry out of the high digit
37*37da2899SCharles.Forsyth p[0] = p3;
38*37da2899SCharles.Forsyth p[1] = p4;
39*37da2899SCharles.Forsyth }
40*37da2899SCharles.Forsyth
41*37da2899SCharles.Forsyth // prereq: p must have room for n+1 digits
42*37da2899SCharles.Forsyth void
mpvecdigmuladd(mpdigit * b,int n,mpdigit m,mpdigit * p)43*37da2899SCharles.Forsyth mpvecdigmuladd(mpdigit *b, int n, mpdigit m, mpdigit *p)
44*37da2899SCharles.Forsyth {
45*37da2899SCharles.Forsyth int i;
46*37da2899SCharles.Forsyth mpdigit carry, x, y, part[2];
47*37da2899SCharles.Forsyth
48*37da2899SCharles.Forsyth carry = 0;
49*37da2899SCharles.Forsyth part[1] = 0;
50*37da2899SCharles.Forsyth for(i = 0; i < n; i++){
51*37da2899SCharles.Forsyth x = part[1] + carry;
52*37da2899SCharles.Forsyth if(x < carry)
53*37da2899SCharles.Forsyth carry = 1;
54*37da2899SCharles.Forsyth else
55*37da2899SCharles.Forsyth carry = 0;
56*37da2899SCharles.Forsyth y = *p;
57*37da2899SCharles.Forsyth mpdigmul(*b++, m, part);
58*37da2899SCharles.Forsyth x += part[0];
59*37da2899SCharles.Forsyth if(x < part[0])
60*37da2899SCharles.Forsyth carry++;
61*37da2899SCharles.Forsyth x += y;
62*37da2899SCharles.Forsyth if(x < y)
63*37da2899SCharles.Forsyth carry++;
64*37da2899SCharles.Forsyth *p++ = x;
65*37da2899SCharles.Forsyth }
66*37da2899SCharles.Forsyth *p = part[1] + carry;
67*37da2899SCharles.Forsyth }
68*37da2899SCharles.Forsyth
69*37da2899SCharles.Forsyth // prereq: p must have room for n+1 digits
70*37da2899SCharles.Forsyth int
mpvecdigmulsub(mpdigit * b,int n,mpdigit m,mpdigit * p)71*37da2899SCharles.Forsyth mpvecdigmulsub(mpdigit *b, int n, mpdigit m, mpdigit *p)
72*37da2899SCharles.Forsyth {
73*37da2899SCharles.Forsyth int i;
74*37da2899SCharles.Forsyth mpdigit x, y, part[2], borrow;
75*37da2899SCharles.Forsyth
76*37da2899SCharles.Forsyth borrow = 0;
77*37da2899SCharles.Forsyth part[1] = 0;
78*37da2899SCharles.Forsyth for(i = 0; i < n; i++){
79*37da2899SCharles.Forsyth x = *p;
80*37da2899SCharles.Forsyth y = x - borrow;
81*37da2899SCharles.Forsyth if(y > x)
82*37da2899SCharles.Forsyth borrow = 1;
83*37da2899SCharles.Forsyth else
84*37da2899SCharles.Forsyth borrow = 0;
85*37da2899SCharles.Forsyth x = part[1];
86*37da2899SCharles.Forsyth mpdigmul(*b++, m, part);
87*37da2899SCharles.Forsyth x += part[0];
88*37da2899SCharles.Forsyth if(x < part[0])
89*37da2899SCharles.Forsyth borrow++;
90*37da2899SCharles.Forsyth x = y - x;
91*37da2899SCharles.Forsyth if(x > y)
92*37da2899SCharles.Forsyth borrow++;
93*37da2899SCharles.Forsyth *p++ = x;
94*37da2899SCharles.Forsyth }
95*37da2899SCharles.Forsyth
96*37da2899SCharles.Forsyth x = *p;
97*37da2899SCharles.Forsyth y = x - borrow - part[1];
98*37da2899SCharles.Forsyth *p = y;
99*37da2899SCharles.Forsyth if(y > x)
100*37da2899SCharles.Forsyth return -1;
101*37da2899SCharles.Forsyth else
102*37da2899SCharles.Forsyth return 1;
103*37da2899SCharles.Forsyth }
104