xref: /inferno-os/libmp/port/mpvecdigmuladd.c (revision 37da2899f40661e3e9631e497da8dc59b971cbd0)
1*37da2899SCharles.Forsyth #include "os.h"
2*37da2899SCharles.Forsyth #include <mp.h>
3*37da2899SCharles.Forsyth #include "dat.h"
4*37da2899SCharles.Forsyth 
// Half-digit accessors: LO(x) keeps the low Dbits/2 bits of x,
// HI(x) shifts the remaining high bits down into the low half.
// The mask is built from an mpdigit-typed 1 so the shift is carried
// out at digit width; shifting a plain int 1 by Dbits/2 would be
// undefined once Dbits/2 reaches the width of int.
#define LO(x) ((x) & (((mpdigit)1<<(Dbits/2))-1))
#define HI(x) ((x) >> (Dbits/2))
7*37da2899SCharles.Forsyth 
8*37da2899SCharles.Forsyth static void
mpdigmul(mpdigit a,mpdigit b,mpdigit * p)9*37da2899SCharles.Forsyth mpdigmul(mpdigit a, mpdigit b, mpdigit *p)
10*37da2899SCharles.Forsyth {
11*37da2899SCharles.Forsyth 	mpdigit x, ah, al, bh, bl, p1, p2, p3, p4;
12*37da2899SCharles.Forsyth 	int carry;
13*37da2899SCharles.Forsyth 
14*37da2899SCharles.Forsyth 	// half digits
15*37da2899SCharles.Forsyth 	ah = HI(a);
16*37da2899SCharles.Forsyth 	al = LO(a);
17*37da2899SCharles.Forsyth 	bh = HI(b);
18*37da2899SCharles.Forsyth 	bl = LO(b);
19*37da2899SCharles.Forsyth 
20*37da2899SCharles.Forsyth 	// partial products
21*37da2899SCharles.Forsyth 	p1 = ah*bl;
22*37da2899SCharles.Forsyth 	p2 = bh*al;
23*37da2899SCharles.Forsyth 	p3 = bl*al;
24*37da2899SCharles.Forsyth 	p4 = ah*bh;
25*37da2899SCharles.Forsyth 
26*37da2899SCharles.Forsyth 	// p = ((p1+p2)<<(Dbits/2)) + (p4<<Dbits) + p3
27*37da2899SCharles.Forsyth 	carry = 0;
28*37da2899SCharles.Forsyth 	x = p1<<(Dbits/2);
29*37da2899SCharles.Forsyth 	p3 += x;
30*37da2899SCharles.Forsyth 	if(p3 < x)
31*37da2899SCharles.Forsyth 		carry++;
32*37da2899SCharles.Forsyth 	x = p2<<(Dbits/2);
33*37da2899SCharles.Forsyth 	p3 += x;
34*37da2899SCharles.Forsyth 	if(p3 < x)
35*37da2899SCharles.Forsyth 		carry++;
36*37da2899SCharles.Forsyth 	p4 += carry + HI(p1) + HI(p2);	// can't carry out of the high digit
37*37da2899SCharles.Forsyth 	p[0] = p3;
38*37da2899SCharles.Forsyth 	p[1] = p4;
39*37da2899SCharles.Forsyth }
40*37da2899SCharles.Forsyth 
41*37da2899SCharles.Forsyth // prereq: p must have room for n+1 digits
42*37da2899SCharles.Forsyth void
mpvecdigmuladd(mpdigit * b,int n,mpdigit m,mpdigit * p)43*37da2899SCharles.Forsyth mpvecdigmuladd(mpdigit *b, int n, mpdigit m, mpdigit *p)
44*37da2899SCharles.Forsyth {
45*37da2899SCharles.Forsyth 	int i;
46*37da2899SCharles.Forsyth 	mpdigit carry, x, y, part[2];
47*37da2899SCharles.Forsyth 
48*37da2899SCharles.Forsyth 	carry = 0;
49*37da2899SCharles.Forsyth 	part[1] = 0;
50*37da2899SCharles.Forsyth 	for(i = 0; i < n; i++){
51*37da2899SCharles.Forsyth 		x = part[1] + carry;
52*37da2899SCharles.Forsyth 		if(x < carry)
53*37da2899SCharles.Forsyth 			carry = 1;
54*37da2899SCharles.Forsyth 		else
55*37da2899SCharles.Forsyth 			carry = 0;
56*37da2899SCharles.Forsyth 		y = *p;
57*37da2899SCharles.Forsyth 		mpdigmul(*b++, m, part);
58*37da2899SCharles.Forsyth 		x += part[0];
59*37da2899SCharles.Forsyth 		if(x < part[0])
60*37da2899SCharles.Forsyth 			carry++;
61*37da2899SCharles.Forsyth 		x += y;
62*37da2899SCharles.Forsyth 		if(x < y)
63*37da2899SCharles.Forsyth 			carry++;
64*37da2899SCharles.Forsyth 		*p++ = x;
65*37da2899SCharles.Forsyth 	}
66*37da2899SCharles.Forsyth 	*p = part[1] + carry;
67*37da2899SCharles.Forsyth }
68*37da2899SCharles.Forsyth 
69*37da2899SCharles.Forsyth // prereq: p must have room for n+1 digits
70*37da2899SCharles.Forsyth int
mpvecdigmulsub(mpdigit * b,int n,mpdigit m,mpdigit * p)71*37da2899SCharles.Forsyth mpvecdigmulsub(mpdigit *b, int n, mpdigit m, mpdigit *p)
72*37da2899SCharles.Forsyth {
73*37da2899SCharles.Forsyth 	int i;
74*37da2899SCharles.Forsyth 	mpdigit x, y, part[2], borrow;
75*37da2899SCharles.Forsyth 
76*37da2899SCharles.Forsyth 	borrow = 0;
77*37da2899SCharles.Forsyth 	part[1] = 0;
78*37da2899SCharles.Forsyth 	for(i = 0; i < n; i++){
79*37da2899SCharles.Forsyth 		x = *p;
80*37da2899SCharles.Forsyth 		y = x - borrow;
81*37da2899SCharles.Forsyth 		if(y > x)
82*37da2899SCharles.Forsyth 			borrow = 1;
83*37da2899SCharles.Forsyth 		else
84*37da2899SCharles.Forsyth 			borrow = 0;
85*37da2899SCharles.Forsyth 		x = part[1];
86*37da2899SCharles.Forsyth 		mpdigmul(*b++, m, part);
87*37da2899SCharles.Forsyth 		x += part[0];
88*37da2899SCharles.Forsyth 		if(x < part[0])
89*37da2899SCharles.Forsyth 			borrow++;
90*37da2899SCharles.Forsyth 		x = y - x;
91*37da2899SCharles.Forsyth 		if(x > y)
92*37da2899SCharles.Forsyth 			borrow++;
93*37da2899SCharles.Forsyth 		*p++ = x;
94*37da2899SCharles.Forsyth 	}
95*37da2899SCharles.Forsyth 
96*37da2899SCharles.Forsyth 	x = *p;
97*37da2899SCharles.Forsyth 	y = x - borrow - part[1];
98*37da2899SCharles.Forsyth 	*p = y;
99*37da2899SCharles.Forsyth 	if(y > x)
100*37da2899SCharles.Forsyth 		return -1;
101*37da2899SCharles.Forsyth 	else
102*37da2899SCharles.Forsyth 		return 1;
103*37da2899SCharles.Forsyth }
104