xref: /inferno-os/libmemdraw/draw.c (revision adad243147f6102c6e975f48951c05745d56b92d)
137da2899SCharles.Forsyth #include "lib9.h"
237da2899SCharles.Forsyth #include "draw.h"
337da2899SCharles.Forsyth #include "memdraw.h"
437da2899SCharles.Forsyth #include "pool.h"
537da2899SCharles.Forsyth 
/* image memory pool; memimageinit reads its name and may pass memimagemove to poolsetcompact for it */
637da2899SCharles.Forsyth extern Pool* imagmem;
/* debug switch; in the code visible here it is referenced only from commented-out iprint calls */
737da2899SCharles.Forsyth int drawdebug;
/* set to 1 by mktables so that the conversion tables are built only once */
837da2899SCharles.Forsyth static int	tablesbuilt;
937da2899SCharles.Forsyth 
1037da2899SCharles.Forsyth /* perfect approximation to NTSC = .299r+.587g+.114b when 0 ≤ r,g,b < 256 */
1137da2899SCharles.Forsyth #define RGB2K(r,g,b)	((156763*(r)+307758*(g)+59769*(b))>>19)
1237da2899SCharles.Forsyth 
1337da2899SCharles.Forsyth /*
 * for 0 ≤ x ≤ 255*255, (x*0x0101+0x100)>>16 is a perfect approximation.
 * for 0 ≤ x < (1<<16), x/255 = ((x+1)*0x0101)>>16 is a perfect approximation.
 * the last one is perfect for all up to 1<<16, avoids a multiply, but requires a rathole.
 * (Three candidate definitions of DIV255 follow; only the middle one is enabled.)
 */
1837da2899SCharles.Forsyth /* #define DIV255(x) (((x)*257+256)>>16)  */
1937da2899SCharles.Forsyth #define DIV255(x) ((((x)+1)*257)>>16)
2037da2899SCharles.Forsyth /* #define DIV255(x) (tmp=(x)+1, (tmp+(tmp>>8))>>8) */
2137da2899SCharles.Forsyth 
/*
 * MUL(x, y, t): stores x*y+128 in the caller-supplied scratch lvalue t and
 * yields (t+(t>>8))>>8.
 * NOTE(review): this looks like x*y/255 rounded to nearest for 8-bit operands — confirm.
 */
2237da2899SCharles.Forsyth #define MUL(x, y, t)	(t = (x)*(y)+128, (t+(t>>8))>>8)
/* byte-lane masks for a 32-bit word: MASK13 keeps bytes 1 and 3, MASK02 keeps bytes 0 and 2 */
2337da2899SCharles.Forsyth #define MASK13	0xFF00FF00
2437da2899SCharles.Forsyth #define MASK02	0x00FF00FF
/*
 * MUL13 and MUL02 apply the same multiply-and-scale step as MUL to two byte
 * lanes of x at once (lanes 1,3 shifted down, or lanes 0,2), multiplying both
 * by a; the result occupies the MASK02 lanes.  MUL0123 shifts the MUL13 result
 * back up by 8 and ORs in the MUL02 result; s and t are separate scratch lvalues.
 */
2537da2899SCharles.Forsyth #define MUL13(a, x, t)		(t = (a)*(((x)&MASK13)>>8)+0x800080, ((t+((t>>8)&MASK02))>>8)&MASK02)
2637da2899SCharles.Forsyth #define MUL02(a, x, t)		(t = (a)*(((x)&MASK02)>>0)+0x800080, ((t+((t>>8)&MASK02))>>8)&MASK02)
2737da2899SCharles.Forsyth #define MUL0123(a, x, s, t)	((MUL13(a, x, s)<<8)|MUL02(a, x, t))
2837da2899SCharles.Forsyth 
/*
 * MUL2(u, v, x, y): u*v + x*y + 256, then the same (t+(t>>8))>>8 reduction.
 * Note that t is not a macro parameter: the expansion assigns to whatever
 * variable named t is in scope at the point of use.
 */
2937da2899SCharles.Forsyth #define MUL2(u, v, x, y)	(t = (u)*(v)+(x)*(y)+256, (t+(t>>8))>>8)
3037da2899SCharles.Forsyth 
/*
 * BWADD(x, y): adds the MASK13 lanes and the MASK02 lanes of x and y
 * separately and masks each sum, so a carry out of one byte lane is
 * discarded rather than spilling into the neighbouring lane.
 */
3137da2899SCharles.Forsyth #define BWADD(x, y)	((((x)&MASK13)+((y)&MASK13))&MASK13|(((x)&MASK02)+((y)&MASK02))&MASK02)
3237da2899SCharles.Forsyth 
3337da2899SCharles.Forsyth static void mktables(void);
/*
 * A Subdraw is one drawing strategy tried by memimagedraw.  It returns
 * non-zero when it handled the request and zero when it could not.
 */
3437da2899SCharles.Forsyth typedef int Subdraw(Memdrawparam*);
3537da2899SCharles.Forsyth static Subdraw chardraw, alphadraw, memoptdraw;
3637da2899SCharles.Forsyth 
/*
 * Constant images created by memimageinit: memones and memzeros are 1x1
 * replicated GREY1 images whose first byte is set to ~0 and 0 respectively.
 * memwhite and memopaque are aliases for memones; memblack and
 * memtransparent are aliases for memzeros.
 */
3737da2899SCharles.Forsyth static Memimage*	memones;
3837da2899SCharles.Forsyth static Memimage*	memzeros;
3937da2899SCharles.Forsyth Memimage *memwhite;
4037da2899SCharles.Forsyth Memimage *memblack;
4137da2899SCharles.Forsyth Memimage *memtransparent;
4237da2899SCharles.Forsyth Memimage *memopaque;
4337da2899SCharles.Forsyth 
/* installed by memimageinit as the handler for the 'b' print verb */
4437da2899SCharles.Forsyth int	_ifmt(Fmt*);
4537da2899SCharles.Forsyth 
4637da2899SCharles.Forsyth void
memimageinit(void)4737da2899SCharles.Forsyth memimageinit(void)
4837da2899SCharles.Forsyth {
4937da2899SCharles.Forsyth 	static int didinit = 0;
5037da2899SCharles.Forsyth 	char *n;
5137da2899SCharles.Forsyth 
5237da2899SCharles.Forsyth 	if(didinit)
5337da2899SCharles.Forsyth 		return;
5437da2899SCharles.Forsyth 
5537da2899SCharles.Forsyth 	didinit = 1;
5637da2899SCharles.Forsyth 
5737da2899SCharles.Forsyth 	n = poolname(imagmem);
5837da2899SCharles.Forsyth 	if(strcmp(n, "Image") == 0 || strcmp(n, "image") == 0)
5937da2899SCharles.Forsyth 		poolsetcompact(imagmem, memimagemove);
6037da2899SCharles.Forsyth 	mktables();
6137da2899SCharles.Forsyth 	_memmkcmap();
6237da2899SCharles.Forsyth 
6337da2899SCharles.Forsyth 	fmtinstall('R', Rfmt);
6437da2899SCharles.Forsyth 	fmtinstall('P', Pfmt);
6537da2899SCharles.Forsyth 	fmtinstall('b', _ifmt);
6637da2899SCharles.Forsyth 
6737da2899SCharles.Forsyth 	memones = allocmemimage(Rect(0,0,1,1), GREY1);
6837da2899SCharles.Forsyth 	memones->flags |= Frepl;
6937da2899SCharles.Forsyth 	memones->clipr = Rect(-0x3FFFFFF, -0x3FFFFFF, 0x3FFFFFF, 0x3FFFFFF);
7037da2899SCharles.Forsyth 	*byteaddr(memones, ZP) = ~0;
7137da2899SCharles.Forsyth 
7237da2899SCharles.Forsyth 	memzeros = allocmemimage(Rect(0,0,1,1), GREY1);
7337da2899SCharles.Forsyth 	memzeros->flags |= Frepl;
7437da2899SCharles.Forsyth 	memzeros->clipr = Rect(-0x3FFFFFF, -0x3FFFFFF, 0x3FFFFFF, 0x3FFFFFF);
7537da2899SCharles.Forsyth 	*byteaddr(memzeros, ZP) = 0;
7637da2899SCharles.Forsyth 
7737da2899SCharles.Forsyth 	if(memones == nil || memzeros == nil)
7837da2899SCharles.Forsyth 		assert(0 /*cannot initialize memimage library */);	/* RSC BUG */
7937da2899SCharles.Forsyth 
8037da2899SCharles.Forsyth 	memwhite = memones;
8137da2899SCharles.Forsyth 	memblack = memzeros;
8237da2899SCharles.Forsyth 	memopaque = memones;
8337da2899SCharles.Forsyth 	memtransparent = memzeros;
8437da2899SCharles.Forsyth }
8537da2899SCharles.Forsyth 
8637da2899SCharles.Forsyth static ulong imgtorgba(Memimage*, ulong);
8737da2899SCharles.Forsyth static ulong rgbatoimg(Memimage*, ulong);
8837da2899SCharles.Forsyth static ulong pixelbits(Memimage*, Point);
8937da2899SCharles.Forsyth 
9037da2899SCharles.Forsyth #define DBG if(0)
9137da2899SCharles.Forsyth void
memimagedraw(Memimage * dst,Rectangle r,Memimage * src,Point p0,Memimage * mask,Point p1,int op)9237da2899SCharles.Forsyth memimagedraw(Memimage *dst, Rectangle r, Memimage *src, Point p0, Memimage *mask, Point p1, int op)
9337da2899SCharles.Forsyth {
9437da2899SCharles.Forsyth 	Memdrawparam par;
9537da2899SCharles.Forsyth 
9637da2899SCharles.Forsyth 	if(mask == nil)
9737da2899SCharles.Forsyth 		mask = memopaque;
9837da2899SCharles.Forsyth 
9937da2899SCharles.Forsyth DBG	print("memimagedraw %p/%luX %R @ %p %p/%luX %P %p/%luX %P... ", dst, dst->chan, r, dst->data->bdata, src, src->chan, p0, mask, mask->chan, p1);
10037da2899SCharles.Forsyth 
10137da2899SCharles.Forsyth 	if(drawclip(dst, &r, src, &p0, mask, &p1, &par.sr, &par.mr) == 0){
10237da2899SCharles.Forsyth //		if(drawdebug)
10337da2899SCharles.Forsyth //			iprint("empty clipped rectangle\n");
10437da2899SCharles.Forsyth 		return;
10537da2899SCharles.Forsyth 	}
10637da2899SCharles.Forsyth 
10737da2899SCharles.Forsyth 	if(op < Clear || op > SoverD){
10837da2899SCharles.Forsyth //		if(drawdebug)
10937da2899SCharles.Forsyth //			iprint("op out of range: %d\n", op);
11037da2899SCharles.Forsyth 		return;
11137da2899SCharles.Forsyth 	}
11237da2899SCharles.Forsyth 
11337da2899SCharles.Forsyth 	par.op = op;
11437da2899SCharles.Forsyth 	par.dst = dst;
11537da2899SCharles.Forsyth 	par.r = r;
11637da2899SCharles.Forsyth 	par.src = src;
11737da2899SCharles.Forsyth 	/* par.sr set by drawclip */
11837da2899SCharles.Forsyth 	par.mask = mask;
11937da2899SCharles.Forsyth 	/* par.mr set by drawclip */
12037da2899SCharles.Forsyth 
12137da2899SCharles.Forsyth 	par.state = 0;
12237da2899SCharles.Forsyth 	if(src->flags&Frepl){
12337da2899SCharles.Forsyth 		par.state |= Replsrc;
12437da2899SCharles.Forsyth 		if(Dx(src->r)==1 && Dy(src->r)==1){
12537da2899SCharles.Forsyth 			par.sval = pixelbits(src, src->r.min);
12637da2899SCharles.Forsyth 			par.state |= Simplesrc;
12737da2899SCharles.Forsyth 			par.srgba = imgtorgba(src, par.sval);
12837da2899SCharles.Forsyth 			par.sdval = rgbatoimg(dst, par.srgba);
12937da2899SCharles.Forsyth 			if((par.srgba&0xFF) == 0 && (op&DoutS)){
13037da2899SCharles.Forsyth //				if (drawdebug) iprint("fill with transparent source\n");
13137da2899SCharles.Forsyth 				return;	/* no-op successfully handled */
13237da2899SCharles.Forsyth 			}
13337da2899SCharles.Forsyth 		}
13437da2899SCharles.Forsyth 	}
13537da2899SCharles.Forsyth 
13637da2899SCharles.Forsyth 	if(mask->flags & Frepl){
13737da2899SCharles.Forsyth 		par.state |= Replmask;
13837da2899SCharles.Forsyth 		if(Dx(mask->r)==1 && Dy(mask->r)==1){
13937da2899SCharles.Forsyth 			par.mval = pixelbits(mask, mask->r.min);
14037da2899SCharles.Forsyth 			if(par.mval == 0 && (op&DoutS)){
14137da2899SCharles.Forsyth //				if(drawdebug) iprint("fill with zero mask\n");
14237da2899SCharles.Forsyth 				return;	/* no-op successfully handled */
14337da2899SCharles.Forsyth 			}
14437da2899SCharles.Forsyth 			par.state |= Simplemask;
14537da2899SCharles.Forsyth 			if(par.mval == ~0)
14637da2899SCharles.Forsyth 				par.state |= Fullmask;
14737da2899SCharles.Forsyth 			par.mrgba = imgtorgba(mask, par.mval);
14837da2899SCharles.Forsyth 		}
14937da2899SCharles.Forsyth 	}
15037da2899SCharles.Forsyth 
15137da2899SCharles.Forsyth //	if(drawdebug)
15237da2899SCharles.Forsyth //		iprint("dr %R sr %R mr %R...", r, par.sr, par.mr);
15337da2899SCharles.Forsyth DBG print("draw dr %R sr %R mr %R %lux\n", r, par.sr, par.mr, par.state);
15437da2899SCharles.Forsyth 
15537da2899SCharles.Forsyth 	/*
15637da2899SCharles.Forsyth 	 * Now that we've clipped the parameters down to be consistent, we
15737da2899SCharles.Forsyth 	 * simply try sub-drawing routines in order until we find one that was able
15837da2899SCharles.Forsyth 	 * to handle us.  If the sub-drawing routine returns zero, it means it was
15937da2899SCharles.Forsyth 	 * unable to satisfy the request, so we do not return.
16037da2899SCharles.Forsyth 	 */
16137da2899SCharles.Forsyth 
16237da2899SCharles.Forsyth 	/*
16337da2899SCharles.Forsyth 	 * Hardware support.  Each video driver provides this function,
16437da2899SCharles.Forsyth 	 * which checks to see if there is anything it can help with.
16537da2899SCharles.Forsyth 	 * There could be an if around this checking to see if dst is in video memory.
16637da2899SCharles.Forsyth 	 */
16737da2899SCharles.Forsyth DBG print("test hwdraw\n");
16837da2899SCharles.Forsyth 	if(hwdraw(&par)){
16937da2899SCharles.Forsyth //if(drawdebug) iprint("hw handled\n");
17037da2899SCharles.Forsyth DBG print("hwdraw handled\n");
17137da2899SCharles.Forsyth 		return;
17237da2899SCharles.Forsyth 	}
17337da2899SCharles.Forsyth 	/*
17437da2899SCharles.Forsyth 	 * Optimizations using memmove and memset.
17537da2899SCharles.Forsyth 	 */
17637da2899SCharles.Forsyth DBG print("test memoptdraw\n");
17737da2899SCharles.Forsyth 	if(memoptdraw(&par)){
17837da2899SCharles.Forsyth //if(drawdebug) iprint("memopt handled\n");
17937da2899SCharles.Forsyth DBG print("memopt handled\n");
18037da2899SCharles.Forsyth 		return;
18137da2899SCharles.Forsyth 	}
18237da2899SCharles.Forsyth 
18337da2899SCharles.Forsyth 	/*
18437da2899SCharles.Forsyth 	 * Character drawing.
18537da2899SCharles.Forsyth 	 * Solid source color being painted through a boolean mask onto a high res image.
18637da2899SCharles.Forsyth 	 */
18737da2899SCharles.Forsyth DBG print("test chardraw\n");
18837da2899SCharles.Forsyth 	if(chardraw(&par)){
18937da2899SCharles.Forsyth //if(drawdebug) iprint("chardraw handled\n");
19037da2899SCharles.Forsyth DBG print("chardraw handled\n");
19137da2899SCharles.Forsyth 		return;
19237da2899SCharles.Forsyth 	}
19337da2899SCharles.Forsyth 
19437da2899SCharles.Forsyth 	/*
19537da2899SCharles.Forsyth 	 * General calculation-laden case that does alpha for each pixel.
19637da2899SCharles.Forsyth 	 */
19737da2899SCharles.Forsyth DBG print("do alphadraw\n");
19837da2899SCharles.Forsyth 	alphadraw(&par);
19937da2899SCharles.Forsyth //if(drawdebug) iprint("alphadraw handled\n");
20037da2899SCharles.Forsyth DBG print("alphadraw handled\n");
20137da2899SCharles.Forsyth }
20237da2899SCharles.Forsyth #undef DBG
20337da2899SCharles.Forsyth 
20437da2899SCharles.Forsyth /*
20537da2899SCharles.Forsyth  * Clip the destination rectangle further based on the properties of the
20637da2899SCharles.Forsyth  * source and mask rectangles.  Once the destination rectangle is properly
20737da2899SCharles.Forsyth  * clipped, adjust the source and mask rectangles to be the same size.
20837da2899SCharles.Forsyth  * Then if source or mask is replicated, move its clipped rectangle
20937da2899SCharles.Forsyth  * so that its minimum point falls within the repl rectangle.
21037da2899SCharles.Forsyth  *
21137da2899SCharles.Forsyth  * Return zero if the final rectangle is null.
21237da2899SCharles.Forsyth  */
21337da2899SCharles.Forsyth int
drawclip(Memimage * dst,Rectangle * r,Memimage * src,Point * p0,Memimage * mask,Point * p1,Rectangle * sr,Rectangle * mr)21437da2899SCharles.Forsyth drawclip(Memimage *dst, Rectangle *r, Memimage *src, Point *p0, Memimage *mask, Point *p1, Rectangle *sr, Rectangle *mr)
21537da2899SCharles.Forsyth {
21637da2899SCharles.Forsyth 	Point rmin, delta;
21737da2899SCharles.Forsyth 	int splitcoords;
21837da2899SCharles.Forsyth 	Rectangle omr;
21937da2899SCharles.Forsyth 
22037da2899SCharles.Forsyth 	if(r->min.x>=r->max.x || r->min.y>=r->max.y)
22137da2899SCharles.Forsyth 		return 0;
22237da2899SCharles.Forsyth 	splitcoords = (p0->x!=p1->x) || (p0->y!=p1->y);
22337da2899SCharles.Forsyth 	/* clip to destination */
22437da2899SCharles.Forsyth 	rmin = r->min;
22537da2899SCharles.Forsyth 	if(!rectclip(r, dst->r) || !rectclip(r, dst->clipr))
22637da2899SCharles.Forsyth 		return 0;
22737da2899SCharles.Forsyth 	/* move mask point */
22837da2899SCharles.Forsyth 	p1->x += r->min.x-rmin.x;
22937da2899SCharles.Forsyth 	p1->y += r->min.y-rmin.y;
23037da2899SCharles.Forsyth 	/* move source point */
23137da2899SCharles.Forsyth 	p0->x += r->min.x-rmin.x;
23237da2899SCharles.Forsyth 	p0->y += r->min.y-rmin.y;
23337da2899SCharles.Forsyth 	/* map destination rectangle into source */
23437da2899SCharles.Forsyth 	sr->min = *p0;
23537da2899SCharles.Forsyth 	sr->max.x = p0->x+Dx(*r);
23637da2899SCharles.Forsyth 	sr->max.y = p0->y+Dy(*r);
23737da2899SCharles.Forsyth 	/* sr is r in source coordinates; clip to source */
23837da2899SCharles.Forsyth 	if(!(src->flags&Frepl) && !rectclip(sr, src->r))
23937da2899SCharles.Forsyth 		return 0;
24037da2899SCharles.Forsyth 	if(!rectclip(sr, src->clipr))
24137da2899SCharles.Forsyth 		return 0;
24237da2899SCharles.Forsyth 	/* compute and clip rectangle in mask */
24337da2899SCharles.Forsyth 	if(splitcoords){
24437da2899SCharles.Forsyth 		/* move mask point with source */
24537da2899SCharles.Forsyth 		p1->x += sr->min.x-p0->x;
24637da2899SCharles.Forsyth 		p1->y += sr->min.y-p0->y;
24737da2899SCharles.Forsyth 		mr->min = *p1;
24837da2899SCharles.Forsyth 		mr->max.x = p1->x+Dx(*sr);
24937da2899SCharles.Forsyth 		mr->max.y = p1->y+Dy(*sr);
25037da2899SCharles.Forsyth 		omr = *mr;
25137da2899SCharles.Forsyth 		/* mr is now rectangle in mask; clip it */
25237da2899SCharles.Forsyth 		if(!(mask->flags&Frepl) && !rectclip(mr, mask->r))
25337da2899SCharles.Forsyth 			return 0;
25437da2899SCharles.Forsyth 		if(!rectclip(mr, mask->clipr))
25537da2899SCharles.Forsyth 			return 0;
25637da2899SCharles.Forsyth 		/* reflect any clips back to source */
25737da2899SCharles.Forsyth 		sr->min.x += mr->min.x-omr.min.x;
25837da2899SCharles.Forsyth 		sr->min.y += mr->min.y-omr.min.y;
25937da2899SCharles.Forsyth 		sr->max.x += mr->max.x-omr.max.x;
26037da2899SCharles.Forsyth 		sr->max.y += mr->max.y-omr.max.y;
26137da2899SCharles.Forsyth 		*p1 = mr->min;
26237da2899SCharles.Forsyth 	}else{
26337da2899SCharles.Forsyth 		if(!(mask->flags&Frepl) && !rectclip(sr, mask->r))
26437da2899SCharles.Forsyth 			return 0;
26537da2899SCharles.Forsyth 		if(!rectclip(sr, mask->clipr))
26637da2899SCharles.Forsyth 			return 0;
26737da2899SCharles.Forsyth 		*p1 = sr->min;
26837da2899SCharles.Forsyth 	}
26937da2899SCharles.Forsyth 
27037da2899SCharles.Forsyth 	/* move source clipping back to destination */
27137da2899SCharles.Forsyth 	delta.x = r->min.x - p0->x;
27237da2899SCharles.Forsyth 	delta.y = r->min.y - p0->y;
27337da2899SCharles.Forsyth 	r->min.x = sr->min.x + delta.x;
27437da2899SCharles.Forsyth 	r->min.y = sr->min.y + delta.y;
27537da2899SCharles.Forsyth 	r->max.x = sr->max.x + delta.x;
27637da2899SCharles.Forsyth 	r->max.y = sr->max.y + delta.y;
27737da2899SCharles.Forsyth 
27837da2899SCharles.Forsyth 	/* move source rectangle so sr->min is in src->r */
27937da2899SCharles.Forsyth 	if(src->flags&Frepl) {
28037da2899SCharles.Forsyth 		delta.x = drawreplxy(src->r.min.x, src->r.max.x, sr->min.x) - sr->min.x;
28137da2899SCharles.Forsyth 		delta.y = drawreplxy(src->r.min.y, src->r.max.y, sr->min.y) - sr->min.y;
28237da2899SCharles.Forsyth 		sr->min.x += delta.x;
28337da2899SCharles.Forsyth 		sr->min.y += delta.y;
28437da2899SCharles.Forsyth 		sr->max.x += delta.x;
28537da2899SCharles.Forsyth 		sr->max.y += delta.y;
28637da2899SCharles.Forsyth 	}
28737da2899SCharles.Forsyth 	*p0 = sr->min;
28837da2899SCharles.Forsyth 
28937da2899SCharles.Forsyth 	/* move mask point so it is in mask->r */
29037da2899SCharles.Forsyth 	*p1 = drawrepl(mask->r, *p1);
29137da2899SCharles.Forsyth 	mr->min = *p1;
29237da2899SCharles.Forsyth 	mr->max.x = p1->x+Dx(*sr);
29337da2899SCharles.Forsyth 	mr->max.y = p1->y+Dy(*sr);
29437da2899SCharles.Forsyth 
29537da2899SCharles.Forsyth 	assert(Dx(*sr) == Dx(*mr) && Dx(*mr) == Dx(*r));
29637da2899SCharles.Forsyth 	assert(Dy(*sr) == Dy(*mr) && Dy(*mr) == Dy(*r));
29737da2899SCharles.Forsyth 	assert(ptinrect(*p0, src->r));
29837da2899SCharles.Forsyth 	assert(ptinrect(*p1, mask->r));
29937da2899SCharles.Forsyth 	assert(ptinrect(r->min, dst->r));
30037da2899SCharles.Forsyth 
30137da2899SCharles.Forsyth 	return 1;
30237da2899SCharles.Forsyth }
30337da2899SCharles.Forsyth 
30437da2899SCharles.Forsyth /*
30537da2899SCharles.Forsyth  * Conversion tables.
30637da2899SCharles.Forsyth  */
/* filled in once by mktables: entry [j][i] is ((i & ((1<<j)-1)) * replmul[j]) >> 8 */
30737da2899SCharles.Forsyth static uchar replbit[1+8][256];		/* replbit[x][y] is the replication of the x-bit quantity y to 8-bit depth */
30837da2899SCharles.Forsyth 
/*
 * Multipliers that replicate an n-bit value to fill 8 bits, for 1 ≤ n ≤ 8.
 * replmul[n] is a 16-bit constant with a one bit at every position where
 * a copy of the bottom (ones) bit of the n-bit pattern has to land; the
 * binary form is shown beside each entry.  Only the top 8 bits of the
 * 16-bit product are actually used; the lower 8 bits are needed to get
 * bits in the right place when n is not a divisor of 8.
 *
 * Should check to see if it is easier to just refer to replmul than
 * use the precomputed values in replbit.  On PCs it may well
 * be; on machines with slow multiply instructions it probably isn't.
 */
static int replmul[1+8] = {
	0,
	0xFFFF,		/* n=1: 1111111111111111 */
	0x5555,		/* n=2: 0101010101010101 */
	0x2492,		/* n=3: 0010010010010010 */
	0x1111,		/* n=4: 0001000100010001 */
	0x0842,		/* n=5: 0000100001000010 */
	0x0410,		/* n=6: 0000010000010000 */
	0x0204,		/* n=7: 0000001000000100 */
	0x0101,		/* n=8: 0000000100000001 */
};
33737da2899SCharles.Forsyth 
33837da2899SCharles.Forsyth static void
mktables(void)33937da2899SCharles.Forsyth mktables(void)
34037da2899SCharles.Forsyth {
341d0e1d143Sforsyth 	int i, j, small;
34237da2899SCharles.Forsyth 
34337da2899SCharles.Forsyth 	if(tablesbuilt)
34437da2899SCharles.Forsyth 		return;
34537da2899SCharles.Forsyth 
34637da2899SCharles.Forsyth 	fmtinstall('R', Rfmt);
34737da2899SCharles.Forsyth 	fmtinstall('P', Pfmt);
34837da2899SCharles.Forsyth 	tablesbuilt = 1;
34937da2899SCharles.Forsyth 
35037da2899SCharles.Forsyth 	/* bit replication up to 8 bits */
35137da2899SCharles.Forsyth 	for(i=0; i<256; i++){
35237da2899SCharles.Forsyth 		for(j=0; j<=8; j++){	/* j <= 8 [sic] */
35337da2899SCharles.Forsyth 			small = i & ((1<<j)-1);
35437da2899SCharles.Forsyth 			replbit[j][i] = (small*replmul[j])>>8;
35537da2899SCharles.Forsyth 		}
35637da2899SCharles.Forsyth 	}
35737da2899SCharles.Forsyth }
35837da2899SCharles.Forsyth 
/* shared 0xff byte; dumpbuf skips the alpha channel of a Buffer whose alpha pointer is &ones */
35937da2899SCharles.Forsyth static uchar ones = 0xff;
36037da2899SCharles.Forsyth 
36137da2899SCharles.Forsyth /*
36237da2899SCharles.Forsyth  * General alpha drawing case.  Can handle anything.
36337da2899SCharles.Forsyth  */
/*
 * A Buffer describes one scan line of pixels as a set of per-channel byte
 * pointers.  dumpbuf walks it by adding delta to each non-nil channel
 * pointer once per pixel, treats grey as an alternative to red/grn/blu,
 * and treats alpha == &ones as "no alpha data to show".
 */
36437da2899SCharles.Forsyth typedef struct	Buffer	Buffer;
36537da2899SCharles.Forsyth struct Buffer {
36637da2899SCharles.Forsyth 	/* used by most routines */
36737da2899SCharles.Forsyth 	uchar	*red;
36837da2899SCharles.Forsyth 	uchar	*grn;
36937da2899SCharles.Forsyth 	uchar	*blu;
37037da2899SCharles.Forsyth 	uchar	*alpha;
37137da2899SCharles.Forsyth 	uchar	*grey;
37237da2899SCharles.Forsyth 	ulong	*rgba;
37337da2899SCharles.Forsyth 	int	delta;	/* number of bytes to add to pointer to get next pixel to the right */
37437da2899SCharles.Forsyth 
37537da2899SCharles.Forsyth 	/* used by boolcalc* for mask data */
37637da2899SCharles.Forsyth 	uchar	*m;		/* ptr to mask data r.min byte; like p->bytermin */
37737da2899SCharles.Forsyth 	int		mskip;	/* no. of left bits to skip in *m */
37837da2899SCharles.Forsyth 	uchar	*bm;		/* ptr to mask data img->r.min byte; like p->bytey0s */
37937da2899SCharles.Forsyth 	int		bmskip;	/* no. of left bits to skip in *bm */
38037da2899SCharles.Forsyth 	uchar	*em;		/* ptr to mask data img->r.max.x byte; like p->bytey0e */
38137da2899SCharles.Forsyth 	int		emskip;	/* no. of right bits to skip in *em */
38237da2899SCharles.Forsyth };
38337da2899SCharles.Forsyth 
38437da2899SCharles.Forsyth typedef struct	Param	Param;
/*
 * Function shapes used by the general drawing path.
 *	Readfn	produces a Buffer for a Param
 *	Writefn	consumes a Buffer for a Param
 *	Calcfn	combines three Buffers into one
 * NOTE(review): the meaning of the uchar* and int arguments is defined by
 * callers that are not visible in this part of the file — confirm there.
 */
38537da2899SCharles.Forsyth typedef Buffer	Readfn(Param*, uchar*, int);
38637da2899SCharles.Forsyth typedef void	Writefn(Param*, uchar*, Buffer);
38737da2899SCharles.Forsyth typedef Buffer	Calcfn(Buffer, Buffer, Buffer, int, int, int);
38837da2899SCharles.Forsyth 
/*
 * MAXBCACHE sizes Param.bcache; getparam enables replcache only for a
 * replicated image whose height Dy(img->r) does not exceed it.
 */
38937da2899SCharles.Forsyth enum {
39037da2899SCharles.Forsyth 	MAXBCACHE = 16
39137da2899SCharles.Forsyth };
39237da2899SCharles.Forsyth 
39337da2899SCharles.Forsyth /* giant rathole to customize functions with */
/*
 * getparam zeroes the whole structure and then fills in img, r, dx,
 * needbuf, convgrey, the three byte* addresses, bwidth, replcache,
 * bufoff and bufdelta; every other field starts out as zero.
 */
39437da2899SCharles.Forsyth struct Param {
39537da2899SCharles.Forsyth 	Readfn	*replcall;
39637da2899SCharles.Forsyth 	Readfn	*greymaskcall;
39737da2899SCharles.Forsyth 	Readfn	*convreadcall;
39837da2899SCharles.Forsyth 	Writefn	*convwritecall;
39937da2899SCharles.Forsyth 
40037da2899SCharles.Forsyth 	Memimage *img;
40137da2899SCharles.Forsyth 	Rectangle	r;
40237da2899SCharles.Forsyth 	int	dx;	/* of r */
40337da2899SCharles.Forsyth 	int	needbuf;
40437da2899SCharles.Forsyth 	int	convgrey;
40537da2899SCharles.Forsyth 	int	alphaonly;
40637da2899SCharles.Forsyth 
40737da2899SCharles.Forsyth 	uchar	*bytey0s;		/* byteaddr(Pt(img->r.min.x, img->r.min.y)) */
40837da2899SCharles.Forsyth 	uchar	*bytermin;	/* byteaddr(Pt(r.min.x, img->r.min.y)) */
40937da2899SCharles.Forsyth 	uchar	*bytey0e;		/* byteaddr(Pt(img->r.max.x, img->r.min.y)) */
41037da2899SCharles.Forsyth 	int		bwidth;	/* sizeof(ulong)*img->width */
41137da2899SCharles.Forsyth 
41237da2899SCharles.Forsyth 	int	replcache;	/* if set, cache buffers */
41337da2899SCharles.Forsyth 	Buffer	bcache[MAXBCACHE];
41437da2899SCharles.Forsyth 	ulong	bfilled;
41537da2899SCharles.Forsyth 	uchar	*bufbase;
41637da2899SCharles.Forsyth 	int	bufoff;	/* value of *ndrawbuf when getparam was called */
41737da2899SCharles.Forsyth 	int	bufdelta;	/* 4*dx */
41837da2899SCharles.Forsyth 
41937da2899SCharles.Forsyth 	int	dir;
42037da2899SCharles.Forsyth 
42137da2899SCharles.Forsyth 	int	convbufoff;
42237da2899SCharles.Forsyth 	uchar	*convbuf;
42337da2899SCharles.Forsyth 	Param	*convdpar;
42437da2899SCharles.Forsyth 	int	convdx;
42537da2899SCharles.Forsyth };
42637da2899SCharles.Forsyth 
42737da2899SCharles.Forsyth static Readfn	greymaskread, replread, readptr;
42837da2899SCharles.Forsyth static Writefn	nullwrite;
42937da2899SCharles.Forsyth static Calcfn	alphacalc0, alphacalc14, alphacalc2810, alphacalc3679, alphacalc5, alphacalc11, alphacalcS;
43037da2899SCharles.Forsyth static Calcfn	boolcalc14, boolcalc236789, boolcalc1011;
43137da2899SCharles.Forsyth 
43237da2899SCharles.Forsyth static Readfn*	readfn(Memimage*);
43337da2899SCharles.Forsyth static Readfn*	readalphafn(Memimage*);
43437da2899SCharles.Forsyth static Writefn*	writefn(Memimage*);
43537da2899SCharles.Forsyth 
43637da2899SCharles.Forsyth static Calcfn*	boolcopyfn(Memimage*, Memimage*);
43737da2899SCharles.Forsyth static Readfn*	convfn(Memimage*, Param*, Memimage*, Param*, int*);
43837da2899SCharles.Forsyth static Readfn*	ptrfn(Memimage*);
43937da2899SCharles.Forsyth 
/*
 * Calculation routine for each compositing operator; there are Ncomp
 * entries and each is labelled with the operator it serves.
 * NOTE(review): presumably indexed directly by op (memimagedraw only lets
 * Clear..SoverD through) — the indexing code is not visible here, confirm.
 */
44037da2899SCharles.Forsyth static Calcfn *alphacalc[Ncomp] =
44137da2899SCharles.Forsyth {
44237da2899SCharles.Forsyth 	alphacalc0,		/* Clear */
44337da2899SCharles.Forsyth 	alphacalc14,		/* DoutS */
44437da2899SCharles.Forsyth 	alphacalc2810,		/* SoutD */
44537da2899SCharles.Forsyth 	alphacalc3679,		/* DxorS */
44637da2899SCharles.Forsyth 	alphacalc14,		/* DinS */
44737da2899SCharles.Forsyth 	alphacalc5,		/* D */
44837da2899SCharles.Forsyth 	alphacalc3679,		/* DatopS */
44937da2899SCharles.Forsyth 	alphacalc3679,		/* DoverS */
45037da2899SCharles.Forsyth 	alphacalc2810,		/* SinD */
45137da2899SCharles.Forsyth 	alphacalc3679,		/* SatopD */
45237da2899SCharles.Forsyth 	alphacalc2810,		/* S */
45337da2899SCharles.Forsyth 	alphacalc11,		/* SoverD */
45437da2899SCharles.Forsyth };
45537da2899SCharles.Forsyth 
/*
 * Counterpart of alphacalc with the same layout (Ncomp entries, one per
 * labelled operator).  The Clear and D slots reuse alphacalc0 and
 * alphacalc5; the rest are the boolcalc* routines.
 * NOTE(review): the rule that selects this table over alphacalc is not
 * visible in this part of the file — confirm at the point of use.
 */
45637da2899SCharles.Forsyth static Calcfn *boolcalc[Ncomp] =
45737da2899SCharles.Forsyth {
45837da2899SCharles.Forsyth 	alphacalc0,		/* Clear */
45937da2899SCharles.Forsyth 	boolcalc14,		/* DoutS */
46037da2899SCharles.Forsyth 	boolcalc236789,		/* SoutD */
46137da2899SCharles.Forsyth 	boolcalc236789,		/* DxorS */
46237da2899SCharles.Forsyth 	boolcalc14,		/* DinS */
46337da2899SCharles.Forsyth 	alphacalc5,		/* D */
46437da2899SCharles.Forsyth 	boolcalc236789,		/* DatopS */
46537da2899SCharles.Forsyth 	boolcalc236789,		/* DoverS */
46637da2899SCharles.Forsyth 	boolcalc236789,		/* SinD */
46737da2899SCharles.Forsyth 	boolcalc236789,		/* SatopD */
46837da2899SCharles.Forsyth 	boolcalc1011,		/* S */
46937da2899SCharles.Forsyth 	boolcalc1011,		/* SoverD */
47037da2899SCharles.Forsyth };
47137da2899SCharles.Forsyth 
47237da2899SCharles.Forsyth /*
47337da2899SCharles.Forsyth  * Avoid standard Lock, QLock so that can be used in kernel.
47437da2899SCharles.Forsyth  */
/*
 * Per-draw working state handed out by allocdbuf from the fixed pool dbuf.
 * A slot is claimed by test-and-set on inuse; alphadraw gives up (returns
 * 0) when no slot is free.
 */
47537da2899SCharles.Forsyth typedef struct Dbuf Dbuf;
47637da2899SCharles.Forsyth struct Dbuf
47737da2899SCharles.Forsyth {
47837da2899SCharles.Forsyth 	uchar *p;	/* NOTE(review): presumably the scratch buffer — its use is not visible here */
47937da2899SCharles.Forsyth 	int n;	/* NOTE(review): presumably the size of p — confirm */
48037da2899SCharles.Forsyth 	Param spar, mpar, dpar;	/* three Param records; by their names, source, mask and destination */
4817e004309SCharles.Forsyth 	int inuse;	/* non-zero while the slot is claimed; tested and set by allocdbuf */
48237da2899SCharles.Forsyth };
/* the whole pool: ten slots */
48337da2899SCharles.Forsyth static Dbuf dbuf[10];
48437da2899SCharles.Forsyth 
48537da2899SCharles.Forsyth static Dbuf*
allocdbuf(void)48637da2899SCharles.Forsyth allocdbuf(void)
48737da2899SCharles.Forsyth {
48837da2899SCharles.Forsyth 	int i;
48937da2899SCharles.Forsyth 
49037da2899SCharles.Forsyth 	for(i=0; i<nelem(dbuf); i++){
49137da2899SCharles.Forsyth 		if(dbuf[i].inuse)
49237da2899SCharles.Forsyth 			continue;
49337da2899SCharles.Forsyth 		if(!_tas(&dbuf[i].inuse))
49437da2899SCharles.Forsyth 			return &dbuf[i];
49537da2899SCharles.Forsyth 	}
49637da2899SCharles.Forsyth 	return nil;
49737da2899SCharles.Forsyth }
49837da2899SCharles.Forsyth 
49937da2899SCharles.Forsyth static void
getparam(Param * p,Memimage * img,Rectangle r,int convgrey,int needbuf,int * ndrawbuf)50037da2899SCharles.Forsyth getparam(Param *p, Memimage *img, Rectangle r, int convgrey, int needbuf, int *ndrawbuf)
50137da2899SCharles.Forsyth {
50237da2899SCharles.Forsyth 	int nbuf;
50337da2899SCharles.Forsyth 
50437da2899SCharles.Forsyth 	memset(p, 0, sizeof *p);
50537da2899SCharles.Forsyth 
50637da2899SCharles.Forsyth 	p->img = img;
50737da2899SCharles.Forsyth 	p->r = r;
50837da2899SCharles.Forsyth 	p->dx = Dx(r);
50937da2899SCharles.Forsyth 	p->needbuf = needbuf;
51037da2899SCharles.Forsyth 	p->convgrey = convgrey;
51137da2899SCharles.Forsyth 
51237da2899SCharles.Forsyth 	assert(img->r.min.x <= r.min.x && r.min.x < img->r.max.x);
51337da2899SCharles.Forsyth 
51437da2899SCharles.Forsyth 	p->bytey0s = byteaddr(img, Pt(img->r.min.x, img->r.min.y));
51537da2899SCharles.Forsyth 	p->bytermin = byteaddr(img, Pt(r.min.x, img->r.min.y));
51637da2899SCharles.Forsyth 	p->bytey0e = byteaddr(img, Pt(img->r.max.x, img->r.min.y));
51737da2899SCharles.Forsyth 	p->bwidth = sizeof(ulong)*img->width;
51837da2899SCharles.Forsyth 
51937da2899SCharles.Forsyth 	assert(p->bytey0s <= p->bytermin && p->bytermin <= p->bytey0e);
52037da2899SCharles.Forsyth 
52137da2899SCharles.Forsyth 	if(p->r.min.x == p->img->r.min.x)
52237da2899SCharles.Forsyth 		assert(p->bytermin == p->bytey0s);
52337da2899SCharles.Forsyth 
52437da2899SCharles.Forsyth 	nbuf = 1;
52537da2899SCharles.Forsyth 	if((img->flags&Frepl) && Dy(img->r) <= MAXBCACHE && Dy(img->r) < Dy(r)){
52637da2899SCharles.Forsyth 		p->replcache = 1;
52737da2899SCharles.Forsyth 		nbuf = Dy(img->r);
52837da2899SCharles.Forsyth 	}
52937da2899SCharles.Forsyth 	p->bufdelta = 4*p->dx;
53037da2899SCharles.Forsyth 	p->bufoff = *ndrawbuf;
53137da2899SCharles.Forsyth 	*ndrawbuf += p->bufdelta*nbuf;
53237da2899SCharles.Forsyth }
53337da2899SCharles.Forsyth 
53437da2899SCharles.Forsyth static void
clipy(Memimage * img,int * y)53537da2899SCharles.Forsyth clipy(Memimage *img, int *y)
53637da2899SCharles.Forsyth {
53737da2899SCharles.Forsyth 	int dy;
53837da2899SCharles.Forsyth 
53937da2899SCharles.Forsyth 	dy = Dy(img->r);
54037da2899SCharles.Forsyth 	if(*y == dy)
54137da2899SCharles.Forsyth 		*y = 0;
54237da2899SCharles.Forsyth 	else if(*y == -1)
54337da2899SCharles.Forsyth 		*y = dy-1;
54437da2899SCharles.Forsyth 	assert(0 <= *y && *y < dy);
54537da2899SCharles.Forsyth }
54637da2899SCharles.Forsyth 
54737da2899SCharles.Forsyth static void
dumpbuf(char * s,Buffer b,int n)54837da2899SCharles.Forsyth dumpbuf(char *s, Buffer b, int n)
54937da2899SCharles.Forsyth {
55037da2899SCharles.Forsyth 	int i;
55137da2899SCharles.Forsyth 	uchar *p;
55237da2899SCharles.Forsyth 
55337da2899SCharles.Forsyth 	print("%s", s);
55437da2899SCharles.Forsyth 	for(i=0; i<n; i++){
55537da2899SCharles.Forsyth 		print(" ");
55637da2899SCharles.Forsyth 		if(p=b.grey){
55737da2899SCharles.Forsyth 			print(" k%.2uX", *p);
55837da2899SCharles.Forsyth 			b.grey += b.delta;
55937da2899SCharles.Forsyth 		}else{
56037da2899SCharles.Forsyth 			if(p=b.red){
56137da2899SCharles.Forsyth 				print(" r%.2uX", *p);
56237da2899SCharles.Forsyth 				b.red += b.delta;
56337da2899SCharles.Forsyth 			}
56437da2899SCharles.Forsyth 			if(p=b.grn){
56537da2899SCharles.Forsyth 				print(" g%.2uX", *p);
56637da2899SCharles.Forsyth 				b.grn += b.delta;
56737da2899SCharles.Forsyth 			}
56837da2899SCharles.Forsyth 			if(p=b.blu){
56937da2899SCharles.Forsyth 				print(" b%.2uX", *p);
57037da2899SCharles.Forsyth 				b.blu += b.delta;
57137da2899SCharles.Forsyth 			}
57237da2899SCharles.Forsyth 		}
57337da2899SCharles.Forsyth 		if((p=b.alpha) != &ones){
57437da2899SCharles.Forsyth 			print(" α%.2uX", *p);
57537da2899SCharles.Forsyth 			b.alpha += b.delta;
57637da2899SCharles.Forsyth 		}
57737da2899SCharles.Forsyth 	}
57837da2899SCharles.Forsyth 	print("\n");
57937da2899SCharles.Forsyth }
58037da2899SCharles.Forsyth 
58137da2899SCharles.Forsyth /*
58237da2899SCharles.Forsyth  * For each scan line, we expand the pixels from source, mask, and destination
58337da2899SCharles.Forsyth  * into byte-aligned red, green, blue, alpha, and grey channels.  If buffering is not
58437da2899SCharles.Forsyth  * needed and the channels were already byte-aligned (grey8, rgb24, rgba32, rgb32),
58537da2899SCharles.Forsyth  * the readers need not copy the data: they can simply return pointers to the data.
58637da2899SCharles.Forsyth  * If the destination image is grey and the source is not, it is converted using the NTSC
58737da2899SCharles.Forsyth  * formula.
58837da2899SCharles.Forsyth  *
58937da2899SCharles.Forsyth  * Once we have all the channels, we call either rgbcalc or greycalc, depending on
59037da2899SCharles.Forsyth  * whether the destination image is color.  This is allowed to overwrite the dst buffer (perhaps
59137da2899SCharles.Forsyth  * the actual data, perhaps a copy) with its result.  It should only overwrite the dst buffer
59237da2899SCharles.Forsyth  * with the same format (i.e. red bytes with red bytes, etc.)  A new buffer is returned from
59337da2899SCharles.Forsyth  * the calculator, and that buffer is passed to a function to write it to the destination.
59437da2899SCharles.Forsyth  * If the buffer is already pointing at the destination, the writing function is a no-op.
59537da2899SCharles.Forsyth  */
59637da2899SCharles.Forsyth #define DBG if(0)
59737da2899SCharles.Forsyth static int
alphadraw(Memdrawparam * par)59837da2899SCharles.Forsyth alphadraw(Memdrawparam *par)
59937da2899SCharles.Forsyth {
60037da2899SCharles.Forsyth 	int isgrey, starty, endy, op;
60137da2899SCharles.Forsyth 	int needbuf, dsty, srcy, masky;
60237da2899SCharles.Forsyth 	int y, dir, dx, dy, ndrawbuf;
60337da2899SCharles.Forsyth 	uchar *drawbuf;
60437da2899SCharles.Forsyth 	Buffer bsrc, bdst, bmask;
60537da2899SCharles.Forsyth 	Readfn *rdsrc, *rdmask, *rddst;
60637da2899SCharles.Forsyth 	Calcfn *calc;
60737da2899SCharles.Forsyth 	Writefn *wrdst;
60837da2899SCharles.Forsyth 	Memimage *src, *mask, *dst;
60937da2899SCharles.Forsyth 	Rectangle r, sr, mr;
61037da2899SCharles.Forsyth 	Dbuf *z;
61137da2899SCharles.Forsyth 
61237da2899SCharles.Forsyth 	z = allocdbuf();
61337da2899SCharles.Forsyth 	if(z == nil)
61437da2899SCharles.Forsyth 		return 0;
61537da2899SCharles.Forsyth 
61637da2899SCharles.Forsyth 	r = par->r;
61737da2899SCharles.Forsyth 	dx = Dx(r);
61837da2899SCharles.Forsyth 	dy = Dy(r);
61937da2899SCharles.Forsyth 
62037da2899SCharles.Forsyth 	src = par->src;
62137da2899SCharles.Forsyth 	mask = par->mask;
62237da2899SCharles.Forsyth 	dst = par->dst;
62337da2899SCharles.Forsyth 	sr = par->sr;
62437da2899SCharles.Forsyth 	mr = par->mr;
62537da2899SCharles.Forsyth 	op = par->op;
62637da2899SCharles.Forsyth 
62737da2899SCharles.Forsyth 	isgrey = dst->flags&Fgrey;
62837da2899SCharles.Forsyth 
62937da2899SCharles.Forsyth 	/*
63037da2899SCharles.Forsyth 	 * Buffering when src and dst are the same bitmap is sufficient but not
63137da2899SCharles.Forsyth 	 * necessary.  There are stronger conditions we could use.  We could
63237da2899SCharles.Forsyth 	 * check to see if the rectangles intersect, and if simply moving in the
63337da2899SCharles.Forsyth 	 * correct y direction can avoid the need to buffer.
63437da2899SCharles.Forsyth 	 */
63537da2899SCharles.Forsyth 	needbuf = (src->data == dst->data);
63637da2899SCharles.Forsyth 
63737da2899SCharles.Forsyth 	ndrawbuf = 0;
63837da2899SCharles.Forsyth 	getparam(&z->spar, src, sr, isgrey, needbuf, &ndrawbuf);
63937da2899SCharles.Forsyth 	getparam(&z->dpar, dst, r, isgrey, needbuf, &ndrawbuf);
64037da2899SCharles.Forsyth 	getparam(&z->mpar, mask, mr, 0, needbuf, &ndrawbuf);
64137da2899SCharles.Forsyth 
64237da2899SCharles.Forsyth 	dir = (needbuf && byteaddr(dst, r.min) > byteaddr(src, sr.min)) ? -1 : 1;
64337da2899SCharles.Forsyth 	z->spar.dir = z->mpar.dir = z->dpar.dir = dir;
64437da2899SCharles.Forsyth 
64537da2899SCharles.Forsyth 	/*
64637da2899SCharles.Forsyth 	 * If the mask is purely boolean, we can convert from src to dst format
64737da2899SCharles.Forsyth 	 * when we read src, and then just copy it to dst where the mask tells us to.
64837da2899SCharles.Forsyth 	 * This requires a boolean (1-bit grey) mask and lack of a source alpha channel.
64937da2899SCharles.Forsyth 	 *
65037da2899SCharles.Forsyth 	 * The computation is accomplished by assigning the function pointers as follows:
65137da2899SCharles.Forsyth 	 *	rdsrc - read and convert source into dst format in a buffer
65237da2899SCharles.Forsyth 	 * 	rdmask - convert mask to bytes, set pointer to it
65337da2899SCharles.Forsyth 	 * 	rddst - fill with pointer to real dst data, but do no reads
65437da2899SCharles.Forsyth 	 *	calc - copy src onto dst when mask says to.
65537da2899SCharles.Forsyth 	 *	wrdst - do nothing
65637da2899SCharles.Forsyth 	 * This is slightly sleazy, since things aren't doing exactly what their names say,
65737da2899SCharles.Forsyth 	 * but it avoids a fair amount of code duplication to make this a case here
65837da2899SCharles.Forsyth 	 * rather than have a separate booldraw.
65937da2899SCharles.Forsyth 	 */
66037da2899SCharles.Forsyth //if(drawdebug) iprint("flag %lud mchan %lux=?%x dd %d\n", src->flags&Falpha, mask->chan, GREY1, dst->depth);
66137da2899SCharles.Forsyth 	if(!(src->flags&Falpha) && mask->chan == GREY1 && dst->depth >= 8 && op == SoverD){
66237da2899SCharles.Forsyth //if(drawdebug) iprint("boolcopy...");
66337da2899SCharles.Forsyth 		rdsrc = convfn(dst, &z->dpar, src, &z->spar, &ndrawbuf);
66437da2899SCharles.Forsyth 		rddst = readptr;
66537da2899SCharles.Forsyth 		rdmask = readfn(mask);
66637da2899SCharles.Forsyth 		calc = boolcopyfn(dst, mask);
66737da2899SCharles.Forsyth 		wrdst = nullwrite;
66837da2899SCharles.Forsyth 	}else{
66937da2899SCharles.Forsyth 		/* usual alphadraw parameter fetching */
67037da2899SCharles.Forsyth 		rdsrc = readfn(src);
67137da2899SCharles.Forsyth 		rddst = readfn(dst);
67237da2899SCharles.Forsyth 		wrdst = writefn(dst);
67337da2899SCharles.Forsyth 		calc = alphacalc[op];
67437da2899SCharles.Forsyth 
67537da2899SCharles.Forsyth 		/*
67637da2899SCharles.Forsyth 		 * If there is no alpha channel, we'll ask for a grey channel
67737da2899SCharles.Forsyth 		 * and pretend it is the alpha.
67837da2899SCharles.Forsyth 		 */
67937da2899SCharles.Forsyth 		if(mask->flags&Falpha){
68037da2899SCharles.Forsyth 			rdmask = readalphafn(mask);
68137da2899SCharles.Forsyth 			z->mpar.alphaonly = 1;
68237da2899SCharles.Forsyth 		}else{
68337da2899SCharles.Forsyth 			z->mpar.greymaskcall = readfn(mask);
68437da2899SCharles.Forsyth 			z->mpar.convgrey = 1;
68537da2899SCharles.Forsyth 			rdmask = greymaskread;
68637da2899SCharles.Forsyth 
68737da2899SCharles.Forsyth 			/*
68837da2899SCharles.Forsyth 			 * Should really be above, but then boolcopyfns would have
68937da2899SCharles.Forsyth 			 * to deal with bit alignment, and I haven't written that.
69037da2899SCharles.Forsyth 			 *
69137da2899SCharles.Forsyth 			 * This is a common case for things like ellipse drawing.
69237da2899SCharles.Forsyth 			 * When there's no alpha involved and the mask is boolean,
69337da2899SCharles.Forsyth 			 * we can avoid all the division and multiplication.
69437da2899SCharles.Forsyth 			 */
69537da2899SCharles.Forsyth 			if(mask->chan == GREY1 && !(src->flags&Falpha))
69637da2899SCharles.Forsyth 				calc = boolcalc[op];
69737da2899SCharles.Forsyth 			else if(op == SoverD && !(src->flags&Falpha))
69837da2899SCharles.Forsyth 				calc = alphacalcS;
69937da2899SCharles.Forsyth 		}
70037da2899SCharles.Forsyth 	}
70137da2899SCharles.Forsyth 
70237da2899SCharles.Forsyth 	/*
70337da2899SCharles.Forsyth 	 * If the image has a small enough repl rectangle,
70437da2899SCharles.Forsyth 	 * we can just read each line once and cache them.
70537da2899SCharles.Forsyth 	 */
70637da2899SCharles.Forsyth 	if(z->spar.replcache){
70737da2899SCharles.Forsyth 		z->spar.replcall = rdsrc;
70837da2899SCharles.Forsyth 		rdsrc = replread;
70937da2899SCharles.Forsyth 	}
71037da2899SCharles.Forsyth 	if(z->mpar.replcache){
71137da2899SCharles.Forsyth 		z->mpar.replcall = rdmask;
71237da2899SCharles.Forsyth 		rdmask = replread;
71337da2899SCharles.Forsyth 	}
71437da2899SCharles.Forsyth 
71537da2899SCharles.Forsyth 	if(z->n < ndrawbuf){
71637da2899SCharles.Forsyth 		free(z->p);
71737da2899SCharles.Forsyth 		if((z->p = mallocz(ndrawbuf, 0)) == nil){
71837da2899SCharles.Forsyth 			z->inuse = 0;
71937da2899SCharles.Forsyth 			return 0;
72037da2899SCharles.Forsyth 		}
72137da2899SCharles.Forsyth 		z->n = ndrawbuf;
72237da2899SCharles.Forsyth 	}
72337da2899SCharles.Forsyth 	drawbuf = z->p;
72437da2899SCharles.Forsyth 
72537da2899SCharles.Forsyth 	/*
72637da2899SCharles.Forsyth 	 * Before we were saving only offsets from drawbuf in the parameter
72737da2899SCharles.Forsyth 	 * structures; now that drawbuf has been grown to accomodate us,
72837da2899SCharles.Forsyth 	 * we can fill in the pointers.
72937da2899SCharles.Forsyth 	 */
73037da2899SCharles.Forsyth 	z->spar.bufbase = drawbuf+z->spar.bufoff;
73137da2899SCharles.Forsyth 	z->mpar.bufbase = drawbuf+z->mpar.bufoff;
73237da2899SCharles.Forsyth 	z->dpar.bufbase = drawbuf+z->dpar.bufoff;
73337da2899SCharles.Forsyth 	z->spar.convbuf = drawbuf+z->spar.convbufoff;
73437da2899SCharles.Forsyth 
73537da2899SCharles.Forsyth 	if(dir == 1){
73637da2899SCharles.Forsyth 		starty = 0;
73737da2899SCharles.Forsyth 		endy = dy;
73837da2899SCharles.Forsyth 	}else{
73937da2899SCharles.Forsyth 		starty = dy-1;
74037da2899SCharles.Forsyth 		endy = -1;
74137da2899SCharles.Forsyth 	}
74237da2899SCharles.Forsyth 
74337da2899SCharles.Forsyth 	/*
74437da2899SCharles.Forsyth 	 * srcy, masky, and dsty are offsets from the top of their
74537da2899SCharles.Forsyth 	 * respective Rectangles.  they need to be contained within
74637da2899SCharles.Forsyth 	 * the rectangles, so clipy can keep them there without division.
74737da2899SCharles.Forsyth  	 */
74837da2899SCharles.Forsyth 	srcy = (starty + sr.min.y - src->r.min.y)%Dy(src->r);
74937da2899SCharles.Forsyth 	masky = (starty + mr.min.y - mask->r.min.y)%Dy(mask->r);
75037da2899SCharles.Forsyth 	dsty = starty + r.min.y - dst->r.min.y;
75137da2899SCharles.Forsyth 
75237da2899SCharles.Forsyth 	assert(0 <= srcy && srcy < Dy(src->r));
75337da2899SCharles.Forsyth 	assert(0 <= masky && masky < Dy(mask->r));
75437da2899SCharles.Forsyth 	assert(0 <= dsty && dsty < Dy(dst->r));
75537da2899SCharles.Forsyth 
75637da2899SCharles.Forsyth 	for(y=starty; y!=endy; y+=dir, srcy+=dir, masky+=dir, dsty+=dir){
75737da2899SCharles.Forsyth 		clipy(src, &srcy);
75837da2899SCharles.Forsyth 		clipy(dst, &dsty);
75937da2899SCharles.Forsyth 		clipy(mask, &masky);
76037da2899SCharles.Forsyth 
76137da2899SCharles.Forsyth 		bsrc = rdsrc(&z->spar, z->spar.bufbase, srcy);
76237da2899SCharles.Forsyth DBG print("[");
76337da2899SCharles.Forsyth 		bmask = rdmask(&z->mpar, z->mpar.bufbase, masky);
76437da2899SCharles.Forsyth DBG print("]\n");
76537da2899SCharles.Forsyth 		bdst = rddst(&z->dpar, z->dpar.bufbase, dsty);
76637da2899SCharles.Forsyth 		if(op != Clear && (bsrc.delta != 4 || bdst.delta != 4 || src->chan != dst->chan))
76737da2899SCharles.Forsyth 			bdst.rgba = nil;
76837da2899SCharles.Forsyth DBG		dumpbuf("src", bsrc, dx);
76937da2899SCharles.Forsyth DBG		dumpbuf("mask", bmask, dx);
77037da2899SCharles.Forsyth DBG		dumpbuf("dst", bdst, dx);
77137da2899SCharles.Forsyth 		bdst = calc(bdst, bsrc, bmask, dx, isgrey, op);
77237da2899SCharles.Forsyth 		wrdst(&z->dpar, z->dpar.bytermin+dsty*z->dpar.bwidth, bdst);
77337da2899SCharles.Forsyth 	}
77437da2899SCharles.Forsyth 
77537da2899SCharles.Forsyth 	z->inuse = 0;
77637da2899SCharles.Forsyth 	return 1;
77737da2899SCharles.Forsyth }
77837da2899SCharles.Forsyth #undef DBG
77937da2899SCharles.Forsyth 
78037da2899SCharles.Forsyth static Buffer
alphacalc0(Buffer bdst,Buffer b1,Buffer b2,int dx,int grey,int op)78137da2899SCharles.Forsyth alphacalc0(Buffer bdst, Buffer b1, Buffer b2, int dx, int grey, int op)
78237da2899SCharles.Forsyth {
78337da2899SCharles.Forsyth 	USED(b1.grey);
78437da2899SCharles.Forsyth 	USED(b2.grey);
78537da2899SCharles.Forsyth 	USED(grey);
78637da2899SCharles.Forsyth 	USED(op);
78737da2899SCharles.Forsyth 	memset(bdst.rgba, 0, dx*bdst.delta);
78837da2899SCharles.Forsyth 	return bdst;
78937da2899SCharles.Forsyth }
79037da2899SCharles.Forsyth 
79137da2899SCharles.Forsyth static Buffer
alphacalc14(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int grey,int op)79237da2899SCharles.Forsyth alphacalc14(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
79337da2899SCharles.Forsyth {
79437da2899SCharles.Forsyth 	Buffer obdst;
79537da2899SCharles.Forsyth 	int fd, sadelta;
79637da2899SCharles.Forsyth 	int i, sa, ma;
79737da2899SCharles.Forsyth 	ulong s, t;
79837da2899SCharles.Forsyth 
79937da2899SCharles.Forsyth 	obdst = bdst;
80037da2899SCharles.Forsyth 	sadelta = bsrc.alpha == &ones ? 0 : bsrc.delta;
80137da2899SCharles.Forsyth 
80237da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
80337da2899SCharles.Forsyth 		sa = *bsrc.alpha;
80437da2899SCharles.Forsyth 		ma = *bmask.alpha;
80537da2899SCharles.Forsyth 		fd = MUL(sa, ma, t);
80637da2899SCharles.Forsyth 		if(op == DoutS)
80737da2899SCharles.Forsyth 			fd = 255-fd;
80837da2899SCharles.Forsyth 
80937da2899SCharles.Forsyth 		if(grey){
81037da2899SCharles.Forsyth 			*bdst.grey = MUL(fd, *bdst.grey, t);
81137da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
81237da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
81337da2899SCharles.Forsyth 		}else{
81437da2899SCharles.Forsyth 			if(bdst.rgba){
81537da2899SCharles.Forsyth 				*bdst.rgba = MUL0123(fd, *bdst.rgba, s, t);
81637da2899SCharles.Forsyth 				bsrc.rgba++;
81737da2899SCharles.Forsyth 				bdst.rgba++;
81837da2899SCharles.Forsyth 				bsrc.alpha += sadelta;
81937da2899SCharles.Forsyth 				bmask.alpha += bmask.delta;
82037da2899SCharles.Forsyth 				continue;
82137da2899SCharles.Forsyth 			}
82237da2899SCharles.Forsyth 			*bdst.red = MUL(fd, *bdst.red, t);
82337da2899SCharles.Forsyth 			*bdst.grn = MUL(fd, *bdst.grn, t);
82437da2899SCharles.Forsyth 			*bdst.blu = MUL(fd, *bdst.blu, t);
82537da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
82637da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
82737da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
82837da2899SCharles.Forsyth 			bdst.red += bdst.delta;
82937da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
83037da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
83137da2899SCharles.Forsyth 		}
83237da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
83337da2899SCharles.Forsyth 			*bdst.alpha = MUL(fd, *bdst.alpha, t);
83437da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
83537da2899SCharles.Forsyth 		}
83637da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
83737da2899SCharles.Forsyth 		bsrc.alpha += sadelta;
83837da2899SCharles.Forsyth 	}
83937da2899SCharles.Forsyth 	return obdst;
84037da2899SCharles.Forsyth }
84137da2899SCharles.Forsyth 
84237da2899SCharles.Forsyth static Buffer
alphacalc2810(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int grey,int op)84337da2899SCharles.Forsyth alphacalc2810(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
84437da2899SCharles.Forsyth {
84537da2899SCharles.Forsyth 	Buffer obdst;
84637da2899SCharles.Forsyth 	int fs, sadelta;
84737da2899SCharles.Forsyth 	int i, ma, da;
84837da2899SCharles.Forsyth 	ulong s, t;
84937da2899SCharles.Forsyth 
85037da2899SCharles.Forsyth 	obdst = bdst;
85137da2899SCharles.Forsyth 	sadelta = bsrc.alpha == &ones ? 0 : bsrc.delta;
85237da2899SCharles.Forsyth 
85337da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
85437da2899SCharles.Forsyth 		ma = *bmask.alpha;
85537da2899SCharles.Forsyth 		da = *bdst.alpha;
85637da2899SCharles.Forsyth 		if(op == SoutD)
85737da2899SCharles.Forsyth 			da = 255-da;
85837da2899SCharles.Forsyth 		fs = ma;
85937da2899SCharles.Forsyth 		if(op != S)
86037da2899SCharles.Forsyth 			fs = MUL(fs, da, t);
86137da2899SCharles.Forsyth 
86237da2899SCharles.Forsyth 		if(grey){
86337da2899SCharles.Forsyth 			*bdst.grey = MUL(fs, *bsrc.grey, t);
86437da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
86537da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
86637da2899SCharles.Forsyth 		}else{
86737da2899SCharles.Forsyth 			if(bdst.rgba){
86837da2899SCharles.Forsyth 				*bdst.rgba = MUL0123(fs, *bsrc.rgba, s, t);
86937da2899SCharles.Forsyth 				bsrc.rgba++;
87037da2899SCharles.Forsyth 				bdst.rgba++;
87137da2899SCharles.Forsyth 				bmask.alpha += bmask.delta;
87237da2899SCharles.Forsyth 				bdst.alpha += bdst.delta;
87337da2899SCharles.Forsyth 				continue;
87437da2899SCharles.Forsyth 			}
87537da2899SCharles.Forsyth 			*bdst.red = MUL(fs, *bsrc.red, t);
87637da2899SCharles.Forsyth 			*bdst.grn = MUL(fs, *bsrc.grn, t);
87737da2899SCharles.Forsyth 			*bdst.blu = MUL(fs, *bsrc.blu, t);
87837da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
87937da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
88037da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
88137da2899SCharles.Forsyth 			bdst.red += bdst.delta;
88237da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
88337da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
88437da2899SCharles.Forsyth 		}
88537da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
88637da2899SCharles.Forsyth 			*bdst.alpha = MUL(fs, *bsrc.alpha, t);
88737da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
88837da2899SCharles.Forsyth 		}
88937da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
89037da2899SCharles.Forsyth 		bsrc.alpha += sadelta;
89137da2899SCharles.Forsyth 	}
89237da2899SCharles.Forsyth 	return obdst;
89337da2899SCharles.Forsyth }
89437da2899SCharles.Forsyth 
89537da2899SCharles.Forsyth static Buffer
alphacalc3679(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int grey,int op)89637da2899SCharles.Forsyth alphacalc3679(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
89737da2899SCharles.Forsyth {
89837da2899SCharles.Forsyth 	Buffer obdst;
89937da2899SCharles.Forsyth 	int fs, fd, sadelta;
90037da2899SCharles.Forsyth 	int i, sa, ma, da;
90137da2899SCharles.Forsyth 	ulong s, t, q1, q2;
90237da2899SCharles.Forsyth 
90337da2899SCharles.Forsyth 	obdst = bdst;
90437da2899SCharles.Forsyth 	sadelta = bsrc.alpha == &ones ? 0 : bsrc.delta;
90537da2899SCharles.Forsyth 
90637da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
90737da2899SCharles.Forsyth 		sa = *bsrc.alpha;
90837da2899SCharles.Forsyth 		ma = *bmask.alpha;
90937da2899SCharles.Forsyth 		da = *bdst.alpha;
91037da2899SCharles.Forsyth 		if(op == SatopD)
91137da2899SCharles.Forsyth 			fs = MUL(ma, da, t);
91237da2899SCharles.Forsyth 		else
91337da2899SCharles.Forsyth 			fs = MUL(ma, 255-da, t);
91437da2899SCharles.Forsyth 		if(op == DoverS)
91537da2899SCharles.Forsyth 			fd = 255;
91637da2899SCharles.Forsyth 		else{
91737da2899SCharles.Forsyth 			fd = MUL(sa, ma, t);
91837da2899SCharles.Forsyth 			if(op != DatopS)
91937da2899SCharles.Forsyth 				fd = 255-fd;
92037da2899SCharles.Forsyth 		}
92137da2899SCharles.Forsyth 
92237da2899SCharles.Forsyth 		if(grey){
92337da2899SCharles.Forsyth 			*bdst.grey = MUL(fs, *bsrc.grey, s)+MUL(fd, *bdst.grey, t);
92437da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
92537da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
92637da2899SCharles.Forsyth 		}else{
92737da2899SCharles.Forsyth 			if(bdst.rgba){
92837da2899SCharles.Forsyth 				q1 = MUL0123(fs, *bsrc.rgba, s, t);
92937da2899SCharles.Forsyth 				q2 = MUL0123(fd, *bdst.rgba, s, t);
93037da2899SCharles.Forsyth 				*bdst.rgba = BWADD(q1, q2);
93137da2899SCharles.Forsyth 				bsrc.rgba++;
93237da2899SCharles.Forsyth 				bdst.rgba++;
93337da2899SCharles.Forsyth 				bsrc.alpha += sadelta;
93437da2899SCharles.Forsyth 				bmask.alpha += bmask.delta;
93537da2899SCharles.Forsyth 				bdst.alpha += bdst.delta;
93637da2899SCharles.Forsyth 				continue;
93737da2899SCharles.Forsyth 			}
93837da2899SCharles.Forsyth 			*bdst.red = MUL(fs, *bsrc.red, s)+MUL(fd, *bdst.red, t);
93937da2899SCharles.Forsyth 			*bdst.grn = MUL(fs, *bsrc.grn, s)+MUL(fd, *bdst.grn, t);
94037da2899SCharles.Forsyth 			*bdst.blu = MUL(fs, *bsrc.blu, s)+MUL(fd, *bdst.blu, t);
94137da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
94237da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
94337da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
94437da2899SCharles.Forsyth 			bdst.red += bdst.delta;
94537da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
94637da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
94737da2899SCharles.Forsyth 		}
94837da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
94937da2899SCharles.Forsyth 			*bdst.alpha = MUL(fs, sa, s)+MUL(fd, da, t);
95037da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
95137da2899SCharles.Forsyth 		}
95237da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
95337da2899SCharles.Forsyth 		bsrc.alpha += sadelta;
95437da2899SCharles.Forsyth 	}
95537da2899SCharles.Forsyth 	return obdst;
95637da2899SCharles.Forsyth }
95737da2899SCharles.Forsyth 
95837da2899SCharles.Forsyth static Buffer
alphacalc5(Buffer bdst,Buffer b1,Buffer b2,int dx,int grey,int op)95937da2899SCharles.Forsyth alphacalc5(Buffer bdst, Buffer b1, Buffer b2, int dx, int grey, int op)
96037da2899SCharles.Forsyth {
96137da2899SCharles.Forsyth 	USED(b1.grey);
96237da2899SCharles.Forsyth 	USED(b2.grey);
96337da2899SCharles.Forsyth 	USED(dx);
96437da2899SCharles.Forsyth 	USED(grey);
96537da2899SCharles.Forsyth 	USED(op);
96637da2899SCharles.Forsyth 	return bdst;
96737da2899SCharles.Forsyth }
96837da2899SCharles.Forsyth 
96937da2899SCharles.Forsyth static Buffer
alphacalc11(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int grey,int op)97037da2899SCharles.Forsyth alphacalc11(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
97137da2899SCharles.Forsyth {
97237da2899SCharles.Forsyth 	Buffer obdst;
97337da2899SCharles.Forsyth 	int fd, sadelta;
97437da2899SCharles.Forsyth 	int i, sa, ma;
97537da2899SCharles.Forsyth 	ulong s, t, q1, q2;
97637da2899SCharles.Forsyth 
97737da2899SCharles.Forsyth 	USED(op);
97837da2899SCharles.Forsyth 	obdst = bdst;
97937da2899SCharles.Forsyth 	sadelta = bsrc.alpha == &ones ? 0 : bsrc.delta;
98037da2899SCharles.Forsyth 
98137da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
98237da2899SCharles.Forsyth 		sa = *bsrc.alpha;
98337da2899SCharles.Forsyth 		ma = *bmask.alpha;
98437da2899SCharles.Forsyth 		fd = 255-MUL(sa, ma, t);
98537da2899SCharles.Forsyth 
98637da2899SCharles.Forsyth 		if(grey){
98737da2899SCharles.Forsyth 			*bdst.grey = MUL(ma, *bsrc.grey, s)+MUL(fd, *bdst.grey, t);
98837da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
98937da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
99037da2899SCharles.Forsyth 		}else{
99137da2899SCharles.Forsyth 			if(bdst.rgba){
99237da2899SCharles.Forsyth 				q1 = MUL0123(ma, *bsrc.rgba, s, t);
99337da2899SCharles.Forsyth 				q2 = MUL0123(fd, *bdst.rgba, s, t);
99437da2899SCharles.Forsyth 				*bdst.rgba = BWADD(q1, q2);
99537da2899SCharles.Forsyth 				bsrc.rgba++;
99637da2899SCharles.Forsyth 				bdst.rgba++;
99737da2899SCharles.Forsyth 				bsrc.alpha += sadelta;
99837da2899SCharles.Forsyth 				bmask.alpha += bmask.delta;
99937da2899SCharles.Forsyth 				continue;
100037da2899SCharles.Forsyth 			}
100137da2899SCharles.Forsyth 			*bdst.red = MUL(ma, *bsrc.red, s)+MUL(fd, *bdst.red, t);
100237da2899SCharles.Forsyth 			*bdst.grn = MUL(ma, *bsrc.grn, s)+MUL(fd, *bdst.grn, t);
100337da2899SCharles.Forsyth 			*bdst.blu = MUL(ma, *bsrc.blu, s)+MUL(fd, *bdst.blu, t);
100437da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
100537da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
100637da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
100737da2899SCharles.Forsyth 			bdst.red += bdst.delta;
100837da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
100937da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
101037da2899SCharles.Forsyth 		}
101137da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
101237da2899SCharles.Forsyth 			*bdst.alpha = MUL(ma, sa, s)+MUL(fd, *bdst.alpha, t);
101337da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
101437da2899SCharles.Forsyth 		}
101537da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
101637da2899SCharles.Forsyth 		bsrc.alpha += sadelta;
101737da2899SCharles.Forsyth 	}
101837da2899SCharles.Forsyth 	return obdst;
101937da2899SCharles.Forsyth }
102037da2899SCharles.Forsyth 
102137da2899SCharles.Forsyth /*
102237da2899SCharles.Forsyth not used yet
102337da2899SCharles.Forsyth source and mask alpha 1
102437da2899SCharles.Forsyth static Buffer
102537da2899SCharles.Forsyth alphacalcS0(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
102637da2899SCharles.Forsyth {
102737da2899SCharles.Forsyth 	Buffer obdst;
102837da2899SCharles.Forsyth 	int i;
102937da2899SCharles.Forsyth 
103037da2899SCharles.Forsyth 	USED(op);
103137da2899SCharles.Forsyth 	obdst = bdst;
103237da2899SCharles.Forsyth 	if(bsrc.delta == bdst.delta){
103337da2899SCharles.Forsyth 		memmove(bdst.rgba, bsrc.rgba, dx*bdst.delta);
103437da2899SCharles.Forsyth 		return obdst;
103537da2899SCharles.Forsyth 	}
103637da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
103737da2899SCharles.Forsyth 		if(grey){
103837da2899SCharles.Forsyth 			*bdst.grey = *bsrc.grey;
103937da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
104037da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
104137da2899SCharles.Forsyth 		}else{
104237da2899SCharles.Forsyth 			*bdst.red = *bsrc.red;
104337da2899SCharles.Forsyth 			*bdst.grn = *bsrc.grn;
104437da2899SCharles.Forsyth 			*bdst.blu = *bsrc.blu;
104537da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
104637da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
104737da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
104837da2899SCharles.Forsyth 			bdst.red += bdst.delta;
104937da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
105037da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
105137da2899SCharles.Forsyth 		}
105237da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
105337da2899SCharles.Forsyth 			*bdst.alpha = 255;
105437da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
105537da2899SCharles.Forsyth 		}
105637da2899SCharles.Forsyth 	}
105737da2899SCharles.Forsyth 	return obdst;
105837da2899SCharles.Forsyth }
105937da2899SCharles.Forsyth */
106037da2899SCharles.Forsyth 
106137da2899SCharles.Forsyth /* source alpha 1 */
106237da2899SCharles.Forsyth static Buffer
alphacalcS(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int grey,int op)106337da2899SCharles.Forsyth alphacalcS(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
106437da2899SCharles.Forsyth {
106537da2899SCharles.Forsyth 	Buffer obdst;
106637da2899SCharles.Forsyth 	int fd;
106737da2899SCharles.Forsyth 	int i, ma;
106837da2899SCharles.Forsyth 	ulong s, t;
106937da2899SCharles.Forsyth 
107037da2899SCharles.Forsyth 	USED(op);
107137da2899SCharles.Forsyth 	obdst = bdst;
107237da2899SCharles.Forsyth 
107337da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
107437da2899SCharles.Forsyth 		ma = *bmask.alpha;
107537da2899SCharles.Forsyth 		fd = 255-ma;
107637da2899SCharles.Forsyth 
107737da2899SCharles.Forsyth 		if(grey){
107837da2899SCharles.Forsyth 			*bdst.grey = MUL(ma, *bsrc.grey, s)+MUL(fd, *bdst.grey, t);
107937da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
108037da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
108137da2899SCharles.Forsyth 		}else{
108237da2899SCharles.Forsyth 			*bdst.red = MUL(ma, *bsrc.red, s)+MUL(fd, *bdst.red, t);
108337da2899SCharles.Forsyth 			*bdst.grn = MUL(ma, *bsrc.grn, s)+MUL(fd, *bdst.grn, t);
108437da2899SCharles.Forsyth 			*bdst.blu = MUL(ma, *bsrc.blu, s)+MUL(fd, *bdst.blu, t);
108537da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
108637da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
108737da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
108837da2899SCharles.Forsyth 			bdst.red += bdst.delta;
108937da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
109037da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
109137da2899SCharles.Forsyth 		}
109237da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
109337da2899SCharles.Forsyth 			*bdst.alpha = ma+MUL(fd, *bdst.alpha, t);
109437da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
109537da2899SCharles.Forsyth 		}
109637da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
109737da2899SCharles.Forsyth 	}
109837da2899SCharles.Forsyth 	return obdst;
109937da2899SCharles.Forsyth }
110037da2899SCharles.Forsyth 
110137da2899SCharles.Forsyth static Buffer
boolcalc14(Buffer bdst,Buffer b1,Buffer bmask,int dx,int grey,int op)110237da2899SCharles.Forsyth boolcalc14(Buffer bdst, Buffer b1, Buffer bmask, int dx, int grey, int op)
110337da2899SCharles.Forsyth {
110437da2899SCharles.Forsyth 	Buffer obdst;
110537da2899SCharles.Forsyth 	int i, ma, zero;
110637da2899SCharles.Forsyth 
110737da2899SCharles.Forsyth 	USED(b1.grey);
110837da2899SCharles.Forsyth 	obdst = bdst;
110937da2899SCharles.Forsyth 
111037da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
111137da2899SCharles.Forsyth 		ma = *bmask.alpha;
111237da2899SCharles.Forsyth 		zero = ma ? op == DoutS : op == DinS;
111337da2899SCharles.Forsyth 
111437da2899SCharles.Forsyth 		if(grey){
111537da2899SCharles.Forsyth 			if(zero)
111637da2899SCharles.Forsyth 				*bdst.grey = 0;
111737da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
111837da2899SCharles.Forsyth 		}else{
111937da2899SCharles.Forsyth 			if(zero)
112037da2899SCharles.Forsyth 				*bdst.red = *bdst.grn = *bdst.blu = 0;
112137da2899SCharles.Forsyth 			bdst.red += bdst.delta;
112237da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
112337da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
112437da2899SCharles.Forsyth 		}
112537da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
112637da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
112737da2899SCharles.Forsyth 			if(zero)
112837da2899SCharles.Forsyth 				*bdst.alpha = 0;
112937da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
113037da2899SCharles.Forsyth 		}
113137da2899SCharles.Forsyth 	}
113237da2899SCharles.Forsyth 	return obdst;
113337da2899SCharles.Forsyth }
113437da2899SCharles.Forsyth 
113537da2899SCharles.Forsyth static Buffer
boolcalc236789(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int grey,int op)113637da2899SCharles.Forsyth boolcalc236789(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
113737da2899SCharles.Forsyth {
113837da2899SCharles.Forsyth 	Buffer obdst;
113937da2899SCharles.Forsyth 	int fs, fd;
114037da2899SCharles.Forsyth 	int i, ma, da, zero;
114137da2899SCharles.Forsyth 	ulong s, t;
114237da2899SCharles.Forsyth 
114337da2899SCharles.Forsyth 	obdst = bdst;
114437da2899SCharles.Forsyth 	zero = !(op&1);
114537da2899SCharles.Forsyth 
114637da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
114737da2899SCharles.Forsyth 		ma = *bmask.alpha;
114837da2899SCharles.Forsyth 		da = *bdst.alpha;
114937da2899SCharles.Forsyth 		fs = da;
115037da2899SCharles.Forsyth 		if(op&2)
115137da2899SCharles.Forsyth 			fs = 255-da;
115237da2899SCharles.Forsyth 		fd = 0;
115337da2899SCharles.Forsyth 		if(op&4)
115437da2899SCharles.Forsyth 			fd = 255;
115537da2899SCharles.Forsyth 
115637da2899SCharles.Forsyth 		if(grey){
115737da2899SCharles.Forsyth 			if(ma)
115837da2899SCharles.Forsyth 				*bdst.grey = MUL(fs, *bsrc.grey, s)+MUL(fd, *bdst.grey, t);
115937da2899SCharles.Forsyth 			else if(zero)
116037da2899SCharles.Forsyth 				*bdst.grey = 0;
116137da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
116237da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
116337da2899SCharles.Forsyth 		}else{
116437da2899SCharles.Forsyth 			if(ma){
116537da2899SCharles.Forsyth 				*bdst.red = MUL(fs, *bsrc.red, s)+MUL(fd, *bdst.red, t);
116637da2899SCharles.Forsyth 				*bdst.grn = MUL(fs, *bsrc.grn, s)+MUL(fd, *bdst.grn, t);
116737da2899SCharles.Forsyth 				*bdst.blu = MUL(fs, *bsrc.blu, s)+MUL(fd, *bdst.blu, t);
116837da2899SCharles.Forsyth 			}
116937da2899SCharles.Forsyth 			else if(zero)
117037da2899SCharles.Forsyth 				*bdst.red = *bdst.grn = *bdst.blu = 0;
117137da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
117237da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
117337da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
117437da2899SCharles.Forsyth 			bdst.red += bdst.delta;
117537da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
117637da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
117737da2899SCharles.Forsyth 		}
117837da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
117937da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
118037da2899SCharles.Forsyth 			if(ma)
118137da2899SCharles.Forsyth 				*bdst.alpha = fs+MUL(fd, da, t);
118237da2899SCharles.Forsyth 			else if(zero)
118337da2899SCharles.Forsyth 				*bdst.alpha = 0;
118437da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
118537da2899SCharles.Forsyth 		}
118637da2899SCharles.Forsyth 	}
118737da2899SCharles.Forsyth 	return obdst;
118837da2899SCharles.Forsyth }
118937da2899SCharles.Forsyth 
119037da2899SCharles.Forsyth static Buffer
boolcalc1011(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int grey,int op)119137da2899SCharles.Forsyth boolcalc1011(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int grey, int op)
119237da2899SCharles.Forsyth {
119337da2899SCharles.Forsyth 	Buffer obdst;
119437da2899SCharles.Forsyth 	int i, ma, zero;
119537da2899SCharles.Forsyth 
119637da2899SCharles.Forsyth 	obdst = bdst;
119737da2899SCharles.Forsyth 	zero = !(op&1);
119837da2899SCharles.Forsyth 
119937da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
120037da2899SCharles.Forsyth 		ma = *bmask.alpha;
120137da2899SCharles.Forsyth 
120237da2899SCharles.Forsyth 		if(grey){
120337da2899SCharles.Forsyth 			if(ma)
120437da2899SCharles.Forsyth 				*bdst.grey = *bsrc.grey;
120537da2899SCharles.Forsyth 			else if(zero)
120637da2899SCharles.Forsyth 				*bdst.grey = 0;
120737da2899SCharles.Forsyth 			bsrc.grey += bsrc.delta;
120837da2899SCharles.Forsyth 			bdst.grey += bdst.delta;
120937da2899SCharles.Forsyth 		}else{
121037da2899SCharles.Forsyth 			if(ma){
121137da2899SCharles.Forsyth 				*bdst.red = *bsrc.red;
121237da2899SCharles.Forsyth 				*bdst.grn = *bsrc.grn;
121337da2899SCharles.Forsyth 				*bdst.blu = *bsrc.blu;
121437da2899SCharles.Forsyth 			}
121537da2899SCharles.Forsyth 			else if(zero)
121637da2899SCharles.Forsyth 				*bdst.red = *bdst.grn = *bdst.blu = 0;
121737da2899SCharles.Forsyth 			bsrc.red += bsrc.delta;
121837da2899SCharles.Forsyth 			bsrc.blu += bsrc.delta;
121937da2899SCharles.Forsyth 			bsrc.grn += bsrc.delta;
122037da2899SCharles.Forsyth 			bdst.red += bdst.delta;
122137da2899SCharles.Forsyth 			bdst.blu += bdst.delta;
122237da2899SCharles.Forsyth 			bdst.grn += bdst.delta;
122337da2899SCharles.Forsyth 		}
122437da2899SCharles.Forsyth 		bmask.alpha += bmask.delta;
122537da2899SCharles.Forsyth 		if(bdst.alpha != &ones){
122637da2899SCharles.Forsyth 			if(ma)
122737da2899SCharles.Forsyth 				*bdst.alpha = 255;
122837da2899SCharles.Forsyth 			else if(zero)
122937da2899SCharles.Forsyth 				*bdst.alpha = 0;
123037da2899SCharles.Forsyth 			bdst.alpha += bdst.delta;
123137da2899SCharles.Forsyth 		}
123237da2899SCharles.Forsyth 	}
123337da2899SCharles.Forsyth 	return obdst;
123437da2899SCharles.Forsyth }
123537da2899SCharles.Forsyth /*
123637da2899SCharles.Forsyth  * Replicated cached scan line read.  Call the function listed in the Param,
123737da2899SCharles.Forsyth  * but cache the result so that for replicated images we only do the work once.
123837da2899SCharles.Forsyth  */
123937da2899SCharles.Forsyth static Buffer
replread(Param * p,uchar * s,int y)124037da2899SCharles.Forsyth replread(Param *p, uchar *s, int y)
124137da2899SCharles.Forsyth {
124237da2899SCharles.Forsyth 	Buffer *b;
124337da2899SCharles.Forsyth 
124437da2899SCharles.Forsyth 	USED(s);
124537da2899SCharles.Forsyth 	b = &p->bcache[y];
124637da2899SCharles.Forsyth 	if((p->bfilled & (1<<y)) == 0){
124737da2899SCharles.Forsyth 		p->bfilled |= 1<<y;
124837da2899SCharles.Forsyth 		*b = p->replcall(p, p->bufbase+y*p->bufdelta, y);
124937da2899SCharles.Forsyth 	}
125037da2899SCharles.Forsyth 	return *b;
125137da2899SCharles.Forsyth }
125237da2899SCharles.Forsyth 
125337da2899SCharles.Forsyth /*
125437da2899SCharles.Forsyth  * Alpha reading function that simply relabels the grey pointer.
125537da2899SCharles.Forsyth  */
125637da2899SCharles.Forsyth static Buffer
greymaskread(Param * p,uchar * buf,int y)125737da2899SCharles.Forsyth greymaskread(Param *p, uchar *buf, int y)
125837da2899SCharles.Forsyth {
125937da2899SCharles.Forsyth 	Buffer b;
126037da2899SCharles.Forsyth 
126137da2899SCharles.Forsyth 	b = p->greymaskcall(p, buf, y);
126237da2899SCharles.Forsyth 	b.alpha = b.grey;
126337da2899SCharles.Forsyth 	return b;
126437da2899SCharles.Forsyth }
126537da2899SCharles.Forsyth 
126637da2899SCharles.Forsyth #define DBG if(0)
126737da2899SCharles.Forsyth static Buffer
readnbit(Param * p,uchar * buf,int y)126837da2899SCharles.Forsyth readnbit(Param *p, uchar *buf, int y)
126937da2899SCharles.Forsyth {
127037da2899SCharles.Forsyth 	Buffer b;
127137da2899SCharles.Forsyth 	Memimage *img;
127237da2899SCharles.Forsyth 	uchar *repl, *r, *w, *ow, bits;
127337da2899SCharles.Forsyth 	int i, n, sh, depth, x, dx, npack, nbits;
127437da2899SCharles.Forsyth 
127537da2899SCharles.Forsyth 	b.rgba = (ulong*)buf;
127637da2899SCharles.Forsyth 	b.grey = w = buf;
127737da2899SCharles.Forsyth 	b.red = b.blu = b.grn = w;
127837da2899SCharles.Forsyth 	b.alpha = &ones;
127937da2899SCharles.Forsyth 	b.delta = 1;
128037da2899SCharles.Forsyth 
128137da2899SCharles.Forsyth 	dx = p->dx;
128237da2899SCharles.Forsyth 	img = p->img;
128337da2899SCharles.Forsyth 	depth = img->depth;
128437da2899SCharles.Forsyth 	repl = &replbit[depth][0];
128537da2899SCharles.Forsyth 	npack = 8/depth;
128637da2899SCharles.Forsyth 	sh = 8-depth;
128737da2899SCharles.Forsyth 
128837da2899SCharles.Forsyth 	/* copy from p->r.min.x until end of repl rectangle */
128937da2899SCharles.Forsyth 	x = p->r.min.x;
129037da2899SCharles.Forsyth 	n = dx;
129137da2899SCharles.Forsyth 	if(n > p->img->r.max.x - x)
129237da2899SCharles.Forsyth 		n = p->img->r.max.x - x;
129337da2899SCharles.Forsyth 
129437da2899SCharles.Forsyth 	r = p->bytermin + y*p->bwidth;
129537da2899SCharles.Forsyth DBG print("readnbit dx %d %p=%p+%d*%d, *r=%d fetch %d ", dx, r, p->bytermin, y, p->bwidth, *r, n);
129637da2899SCharles.Forsyth 	bits = *r++;
129737da2899SCharles.Forsyth 	nbits = 8;
129837da2899SCharles.Forsyth 	if(i=x&(npack-1)){
129937da2899SCharles.Forsyth DBG print("throwaway %d...", i);
130037da2899SCharles.Forsyth 		bits <<= depth*i;
130137da2899SCharles.Forsyth 		nbits -= depth*i;
130237da2899SCharles.Forsyth 	}
130337da2899SCharles.Forsyth 	for(i=0; i<n; i++){
130437da2899SCharles.Forsyth 		if(nbits == 0){
130537da2899SCharles.Forsyth DBG print("(%.2ux)...", *r);
130637da2899SCharles.Forsyth 			bits = *r++;
130737da2899SCharles.Forsyth 			nbits = 8;
130837da2899SCharles.Forsyth 		}
130937da2899SCharles.Forsyth 		*w++ = repl[bits>>sh];
131037da2899SCharles.Forsyth DBG print("bit %x...", repl[bits>>sh]);
131137da2899SCharles.Forsyth 		bits <<= depth;
131237da2899SCharles.Forsyth 		nbits -= depth;
131337da2899SCharles.Forsyth 	}
131437da2899SCharles.Forsyth 	dx -= n;
131537da2899SCharles.Forsyth 	if(dx == 0)
131637da2899SCharles.Forsyth 		return b;
131737da2899SCharles.Forsyth 
131837da2899SCharles.Forsyth 	assert(x+i == p->img->r.max.x);
131937da2899SCharles.Forsyth 
132037da2899SCharles.Forsyth 	/* copy from beginning of repl rectangle until where we were before. */
132137da2899SCharles.Forsyth 	x = p->img->r.min.x;
132237da2899SCharles.Forsyth 	n = dx;
132337da2899SCharles.Forsyth 	if(n > p->r.min.x - x)
132437da2899SCharles.Forsyth 		n = p->r.min.x - x;
132537da2899SCharles.Forsyth 
132637da2899SCharles.Forsyth 	r = p->bytey0s + y*p->bwidth;
132737da2899SCharles.Forsyth DBG print("x=%d r=%p...", x, r);
132837da2899SCharles.Forsyth 	bits = *r++;
132937da2899SCharles.Forsyth 	nbits = 8;
133037da2899SCharles.Forsyth 	if(i=x&(npack-1)){
133137da2899SCharles.Forsyth 		bits <<= depth*i;
133237da2899SCharles.Forsyth 		nbits -= depth*i;
133337da2899SCharles.Forsyth 	}
133437da2899SCharles.Forsyth DBG print("nbits=%d...", nbits);
133537da2899SCharles.Forsyth 	for(i=0; i<n; i++){
133637da2899SCharles.Forsyth 		if(nbits == 0){
133737da2899SCharles.Forsyth 			bits = *r++;
133837da2899SCharles.Forsyth 			nbits = 8;
133937da2899SCharles.Forsyth 		}
134037da2899SCharles.Forsyth 		*w++ = repl[bits>>sh];
134137da2899SCharles.Forsyth DBG print("bit %x...", repl[bits>>sh]);
134237da2899SCharles.Forsyth 		bits <<= depth;
134337da2899SCharles.Forsyth 		nbits -= depth;
134437da2899SCharles.Forsyth DBG print("bits %x nbits %d...", bits, nbits);
134537da2899SCharles.Forsyth 	}
134637da2899SCharles.Forsyth 	dx -= n;
134737da2899SCharles.Forsyth 	if(dx == 0)
134837da2899SCharles.Forsyth 		return b;
134937da2899SCharles.Forsyth 
135037da2899SCharles.Forsyth 	assert(dx > 0);
135137da2899SCharles.Forsyth 	/* now we have exactly one full scan line: just replicate the buffer itself until we are done */
135237da2899SCharles.Forsyth 	ow = buf;
135337da2899SCharles.Forsyth 	while(dx--)
135437da2899SCharles.Forsyth 		*w++ = *ow++;
135537da2899SCharles.Forsyth 
135637da2899SCharles.Forsyth 	return b;
135737da2899SCharles.Forsyth }
135837da2899SCharles.Forsyth #undef DBG
135937da2899SCharles.Forsyth 
136037da2899SCharles.Forsyth #define DBG if(0)
136137da2899SCharles.Forsyth static void
writenbit(Param * p,uchar * w,Buffer src)136237da2899SCharles.Forsyth writenbit(Param *p, uchar *w, Buffer src)
136337da2899SCharles.Forsyth {
136437da2899SCharles.Forsyth 	uchar *r;
136537da2899SCharles.Forsyth 	ulong bits;
136637da2899SCharles.Forsyth 	int i, sh, depth, npack, nbits, x, ex;
136737da2899SCharles.Forsyth 
136837da2899SCharles.Forsyth 	assert(src.grey != nil && src.delta == 1);
136937da2899SCharles.Forsyth 
137037da2899SCharles.Forsyth 	x = p->r.min.x;
137137da2899SCharles.Forsyth 	ex = x+p->dx;
137237da2899SCharles.Forsyth 	depth = p->img->depth;
137337da2899SCharles.Forsyth 	npack = 8/depth;
137437da2899SCharles.Forsyth 
137537da2899SCharles.Forsyth 	i=x&(npack-1);
137637da2899SCharles.Forsyth 	bits = i ? (*w >> (8-depth*i)) : 0;
137737da2899SCharles.Forsyth 	nbits = depth*i;
137837da2899SCharles.Forsyth 	sh = 8-depth;
137937da2899SCharles.Forsyth 	r = src.grey;
138037da2899SCharles.Forsyth 
138137da2899SCharles.Forsyth 	for(; x<ex; x++){
138237da2899SCharles.Forsyth 		bits <<= depth;
138337da2899SCharles.Forsyth DBG print(" %x", *r);
138437da2899SCharles.Forsyth 		bits |= (*r++ >> sh);
138537da2899SCharles.Forsyth 		nbits += depth;
138637da2899SCharles.Forsyth 		if(nbits == 8){
138737da2899SCharles.Forsyth 			*w++ = bits;
138837da2899SCharles.Forsyth 			nbits = 0;
138937da2899SCharles.Forsyth 		}
139037da2899SCharles.Forsyth 	}
139137da2899SCharles.Forsyth 
139237da2899SCharles.Forsyth 	if(nbits){
139337da2899SCharles.Forsyth 		sh = 8-nbits;
139437da2899SCharles.Forsyth 		bits <<= sh;
139537da2899SCharles.Forsyth 		bits |= *w & ((1<<sh)-1);
139637da2899SCharles.Forsyth 		*w = bits;
139737da2899SCharles.Forsyth 	}
139837da2899SCharles.Forsyth DBG print("\n");
139937da2899SCharles.Forsyth 	return;
140037da2899SCharles.Forsyth }
140137da2899SCharles.Forsyth #undef DBG
140237da2899SCharles.Forsyth 
140337da2899SCharles.Forsyth static Buffer
readcmap(Param * p,uchar * buf,int y)140437da2899SCharles.Forsyth readcmap(Param *p, uchar *buf, int y)
140537da2899SCharles.Forsyth {
140637da2899SCharles.Forsyth 	Buffer b;
140737da2899SCharles.Forsyth 	int a, convgrey, copyalpha, dx, i, m;
140837da2899SCharles.Forsyth 	uchar *q, *cmap, *begin, *end, *r, *w;
140937da2899SCharles.Forsyth 
141037da2899SCharles.Forsyth 	begin = p->bytey0s + y*p->bwidth;
141137da2899SCharles.Forsyth 	r = p->bytermin + y*p->bwidth;
141237da2899SCharles.Forsyth 	end = p->bytey0e + y*p->bwidth;
141337da2899SCharles.Forsyth 	cmap = p->img->cmap->cmap2rgb;
141437da2899SCharles.Forsyth 	convgrey = p->convgrey;
141537da2899SCharles.Forsyth 	copyalpha = (p->img->flags&Falpha) ? 1 : 0;
141637da2899SCharles.Forsyth 
141737da2899SCharles.Forsyth 	w = buf;
141837da2899SCharles.Forsyth 	dx = p->dx;
141937da2899SCharles.Forsyth 	if(copyalpha){
142037da2899SCharles.Forsyth 		b.alpha = buf++;
142137da2899SCharles.Forsyth 		a = p->img->shift[CAlpha]/8;
142237da2899SCharles.Forsyth 		m = p->img->shift[CMap]/8;
142337da2899SCharles.Forsyth 		for(i=0; i<dx; i++){
142437da2899SCharles.Forsyth 			*w++ = r[a];
142537da2899SCharles.Forsyth 			q = cmap+r[m]*3;
142637da2899SCharles.Forsyth 			r += 2;
142737da2899SCharles.Forsyth 			if(r == end)
142837da2899SCharles.Forsyth 				r = begin;
142937da2899SCharles.Forsyth 			if(convgrey){
143037da2899SCharles.Forsyth 				*w++ = RGB2K(q[0], q[1], q[2]);
143137da2899SCharles.Forsyth 			}else{
143237da2899SCharles.Forsyth 				*w++ = q[2];	/* blue */
143337da2899SCharles.Forsyth 				*w++ = q[1];	/* green */
143437da2899SCharles.Forsyth 				*w++ = q[0];	/* red */
143537da2899SCharles.Forsyth 			}
143637da2899SCharles.Forsyth 		}
143737da2899SCharles.Forsyth 	}else{
143837da2899SCharles.Forsyth 		b.alpha = &ones;
143937da2899SCharles.Forsyth 		for(i=0; i<dx; i++){
144037da2899SCharles.Forsyth 			q = cmap+*r++*3;
144137da2899SCharles.Forsyth 			if(r == end)
144237da2899SCharles.Forsyth 				r = begin;
144337da2899SCharles.Forsyth 			if(convgrey){
144437da2899SCharles.Forsyth 				*w++ = RGB2K(q[0], q[1], q[2]);
144537da2899SCharles.Forsyth 			}else{
144637da2899SCharles.Forsyth 				*w++ = q[2];	/* blue */
144737da2899SCharles.Forsyth 				*w++ = q[1];	/* green */
144837da2899SCharles.Forsyth 				*w++ = q[0];	/* red */
144937da2899SCharles.Forsyth 			}
145037da2899SCharles.Forsyth 		}
145137da2899SCharles.Forsyth 	}
145237da2899SCharles.Forsyth 
145337da2899SCharles.Forsyth 	b.rgba = (ulong*)(buf-copyalpha);
145437da2899SCharles.Forsyth 
145537da2899SCharles.Forsyth 	if(convgrey){
145637da2899SCharles.Forsyth 		b.grey = buf;
145737da2899SCharles.Forsyth 		b.red = b.blu = b.grn = buf;
145837da2899SCharles.Forsyth 		b.delta = 1+copyalpha;
145937da2899SCharles.Forsyth 	}else{
146037da2899SCharles.Forsyth 		b.blu = buf;
146137da2899SCharles.Forsyth 		b.grn = buf+1;
146237da2899SCharles.Forsyth 		b.red = buf+2;
146337da2899SCharles.Forsyth 		b.grey = nil;
146437da2899SCharles.Forsyth 		b.delta = 3+copyalpha;
146537da2899SCharles.Forsyth 	}
146637da2899SCharles.Forsyth 	return b;
146737da2899SCharles.Forsyth }
146837da2899SCharles.Forsyth 
146937da2899SCharles.Forsyth static void
writecmap(Param * p,uchar * w,Buffer src)147037da2899SCharles.Forsyth writecmap(Param *p, uchar *w, Buffer src)
147137da2899SCharles.Forsyth {
147237da2899SCharles.Forsyth 	uchar *cmap, *red, *grn, *blu;
147337da2899SCharles.Forsyth 	int i, dx, delta;
147437da2899SCharles.Forsyth 
147537da2899SCharles.Forsyth 	cmap = p->img->cmap->rgb2cmap;
147637da2899SCharles.Forsyth 
147737da2899SCharles.Forsyth 	delta = src.delta;
147837da2899SCharles.Forsyth 	red= src.red;
147937da2899SCharles.Forsyth 	grn = src.grn;
148037da2899SCharles.Forsyth 	blu = src.blu;
148137da2899SCharles.Forsyth 
148237da2899SCharles.Forsyth 	dx = p->dx;
148337da2899SCharles.Forsyth 	for(i=0; i<dx; i++, red+=delta, grn+=delta, blu+=delta)
148437da2899SCharles.Forsyth 		*w++ = cmap[(*red>>4)*256+(*grn>>4)*16+(*blu>>4)];
148537da2899SCharles.Forsyth }
148637da2899SCharles.Forsyth 
148737da2899SCharles.Forsyth #define DBG if(0)
148837da2899SCharles.Forsyth static Buffer
readbyte(Param * p,uchar * buf,int y)148937da2899SCharles.Forsyth readbyte(Param *p, uchar *buf, int y)
149037da2899SCharles.Forsyth {
149137da2899SCharles.Forsyth 	Buffer b;
149237da2899SCharles.Forsyth 	Memimage *img;
149337da2899SCharles.Forsyth 	int dx, isgrey, convgrey, alphaonly, copyalpha, i, nb;
149437da2899SCharles.Forsyth 	uchar *begin, *end, *r, *w, *rrepl, *grepl, *brepl, *arepl, *krepl;
149537da2899SCharles.Forsyth 	uchar ured, ugrn, ublu;
149637da2899SCharles.Forsyth 	ulong u;
149737da2899SCharles.Forsyth 
149837da2899SCharles.Forsyth 	img = p->img;
149937da2899SCharles.Forsyth 	begin = p->bytey0s + y*p->bwidth;
150037da2899SCharles.Forsyth 	r = p->bytermin + y*p->bwidth;
150137da2899SCharles.Forsyth 	end = p->bytey0e + y*p->bwidth;
150237da2899SCharles.Forsyth 
150337da2899SCharles.Forsyth 	w = buf;
150437da2899SCharles.Forsyth 	dx = p->dx;
150537da2899SCharles.Forsyth 	nb = img->depth/8;
150637da2899SCharles.Forsyth 
150737da2899SCharles.Forsyth 	convgrey = p->convgrey;	/* convert rgb to grey */
150837da2899SCharles.Forsyth 	isgrey = img->flags&Fgrey;
150937da2899SCharles.Forsyth 	alphaonly = p->alphaonly;
151037da2899SCharles.Forsyth 	copyalpha = (img->flags&Falpha) ? 1 : 0;
151137da2899SCharles.Forsyth 
151237da2899SCharles.Forsyth DBG print("copyalpha %d alphaonly %d convgrey %d isgrey %d\n", copyalpha, alphaonly, convgrey, isgrey);
151337da2899SCharles.Forsyth 	/* if we can, avoid processing everything */
151437da2899SCharles.Forsyth 	if(!(img->flags&Frepl) && !convgrey && (img->flags&Fbytes)){
151537da2899SCharles.Forsyth 		memset(&b, 0, sizeof b);
151637da2899SCharles.Forsyth 		if(p->needbuf){
151737da2899SCharles.Forsyth 			memmove(buf, r, dx*nb);
151837da2899SCharles.Forsyth 			r = buf;
151937da2899SCharles.Forsyth 		}
152037da2899SCharles.Forsyth 		b.rgba = (ulong*)r;
152137da2899SCharles.Forsyth 		if(copyalpha)
152237da2899SCharles.Forsyth 			b.alpha = r+img->shift[CAlpha]/8;
152337da2899SCharles.Forsyth 		else
152437da2899SCharles.Forsyth 			b.alpha = &ones;
152537da2899SCharles.Forsyth 		if(isgrey){
152637da2899SCharles.Forsyth 			b.grey = r+img->shift[CGrey]/8;
152737da2899SCharles.Forsyth 			b.red = b.grn = b.blu = b.grey;
152837da2899SCharles.Forsyth 		}else{
152937da2899SCharles.Forsyth 			b.red = r+img->shift[CRed]/8;
153037da2899SCharles.Forsyth 			b.grn = r+img->shift[CGreen]/8;
153137da2899SCharles.Forsyth 			b.blu = r+img->shift[CBlue]/8;
153237da2899SCharles.Forsyth 		}
153337da2899SCharles.Forsyth 		b.delta = nb;
153437da2899SCharles.Forsyth 		return b;
153537da2899SCharles.Forsyth 	}
153637da2899SCharles.Forsyth 
153737da2899SCharles.Forsyth DBG print("2\n");
153837da2899SCharles.Forsyth 	rrepl = replbit[img->nbits[CRed]];
153937da2899SCharles.Forsyth 	grepl = replbit[img->nbits[CGreen]];
154037da2899SCharles.Forsyth 	brepl = replbit[img->nbits[CBlue]];
154137da2899SCharles.Forsyth 	arepl = replbit[img->nbits[CAlpha]];
154237da2899SCharles.Forsyth 	krepl = replbit[img->nbits[CGrey]];
154337da2899SCharles.Forsyth 
154437da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
154537da2899SCharles.Forsyth 		u = r[0] | (r[1]<<8) | (r[2]<<16) | (r[3]<<24);
154637da2899SCharles.Forsyth 		if(copyalpha) {
154737da2899SCharles.Forsyth 			*w++ = arepl[(u>>img->shift[CAlpha]) & img->mask[CAlpha]];
154837da2899SCharles.Forsyth DBG print("a %x\n", w[-1]);
154937da2899SCharles.Forsyth 		}
155037da2899SCharles.Forsyth 
155137da2899SCharles.Forsyth 		if(isgrey)
155237da2899SCharles.Forsyth 			*w++ = krepl[(u >> img->shift[CGrey]) & img->mask[CGrey]];
155337da2899SCharles.Forsyth 		else if(!alphaonly){
155437da2899SCharles.Forsyth 			ured = rrepl[(u >> img->shift[CRed]) & img->mask[CRed]];
155537da2899SCharles.Forsyth 			ugrn = grepl[(u >> img->shift[CGreen]) & img->mask[CGreen]];
155637da2899SCharles.Forsyth 			ublu = brepl[(u >> img->shift[CBlue]) & img->mask[CBlue]];
155737da2899SCharles.Forsyth 			if(convgrey){
155837da2899SCharles.Forsyth DBG print("g %x %x %x\n", ured, ugrn, ublu);
155937da2899SCharles.Forsyth 				*w++ = RGB2K(ured, ugrn, ublu);
156037da2899SCharles.Forsyth DBG print("%x\n", w[-1]);
156137da2899SCharles.Forsyth 			}else{
156237da2899SCharles.Forsyth 				*w++ = ublu;
156337da2899SCharles.Forsyth 				*w++ = ugrn;
156437da2899SCharles.Forsyth 				*w++ = ured;
156537da2899SCharles.Forsyth 			}
156637da2899SCharles.Forsyth 		}
156737da2899SCharles.Forsyth 		r += nb;
156837da2899SCharles.Forsyth 		if(r == end)
156937da2899SCharles.Forsyth 			r = begin;
157037da2899SCharles.Forsyth 	}
157137da2899SCharles.Forsyth 
157237da2899SCharles.Forsyth 	b.alpha = copyalpha ? buf : &ones;
157337da2899SCharles.Forsyth 	b.rgba = (ulong*)buf;
157437da2899SCharles.Forsyth 	if(alphaonly){
157537da2899SCharles.Forsyth 		b.red = b.grn = b.blu = b.grey = nil;
157637da2899SCharles.Forsyth 		if(!copyalpha)
157737da2899SCharles.Forsyth 			b.rgba = nil;
157837da2899SCharles.Forsyth 		b.delta = 1;
157937da2899SCharles.Forsyth 	}else if(isgrey || convgrey){
158037da2899SCharles.Forsyth 		b.grey = buf+copyalpha;
158137da2899SCharles.Forsyth 		b.red = b.grn = b.blu = buf+copyalpha;
158237da2899SCharles.Forsyth 		b.delta = copyalpha+1;
158337da2899SCharles.Forsyth DBG print("alpha %x grey %x\n", b.alpha ? *b.alpha : 0xFF, *b.grey);
158437da2899SCharles.Forsyth 	}else{
158537da2899SCharles.Forsyth 		b.blu = buf+copyalpha;
158637da2899SCharles.Forsyth 		b.grn = buf+copyalpha+1;
158737da2899SCharles.Forsyth 		b.grey = nil;
158837da2899SCharles.Forsyth 		b.red = buf+copyalpha+2;
158937da2899SCharles.Forsyth 		b.delta = copyalpha+3;
159037da2899SCharles.Forsyth 	}
159137da2899SCharles.Forsyth 	return b;
159237da2899SCharles.Forsyth }
159337da2899SCharles.Forsyth #undef DBG
159437da2899SCharles.Forsyth 
159537da2899SCharles.Forsyth #define DBG if(0)
159637da2899SCharles.Forsyth static void
writebyte(Param * p,uchar * w,Buffer src)159737da2899SCharles.Forsyth writebyte(Param *p, uchar *w, Buffer src)
159837da2899SCharles.Forsyth {
159937da2899SCharles.Forsyth 	Memimage *img;
160037da2899SCharles.Forsyth 	int i, isalpha, isgrey, nb, delta, dx, adelta;
160137da2899SCharles.Forsyth 	uchar ff, *red, *grn, *blu, *grey, *alpha;
160237da2899SCharles.Forsyth 	ulong u, mask;
160337da2899SCharles.Forsyth 
160437da2899SCharles.Forsyth 	img = p->img;
160537da2899SCharles.Forsyth 
160637da2899SCharles.Forsyth 	red = src.red;
160737da2899SCharles.Forsyth 	grn = src.grn;
160837da2899SCharles.Forsyth 	blu = src.blu;
160937da2899SCharles.Forsyth 	alpha = src.alpha;
161037da2899SCharles.Forsyth 	delta = src.delta;
161137da2899SCharles.Forsyth 	grey = src.grey;
161237da2899SCharles.Forsyth 	dx = p->dx;
161337da2899SCharles.Forsyth 
161437da2899SCharles.Forsyth 	nb = img->depth/8;
161537da2899SCharles.Forsyth 	mask = (nb==4) ? 0 : ~((1<<img->depth)-1);
161637da2899SCharles.Forsyth 
161737da2899SCharles.Forsyth 	isalpha = img->flags&Falpha;
161837da2899SCharles.Forsyth 	isgrey = img->flags&Fgrey;
161937da2899SCharles.Forsyth 	adelta = src.delta;
162037da2899SCharles.Forsyth 
162137da2899SCharles.Forsyth 	if(isalpha && (alpha == nil || alpha == &ones)){
162237da2899SCharles.Forsyth 		ff = 0xFF;
162337da2899SCharles.Forsyth 		alpha = &ff;
162437da2899SCharles.Forsyth 		adelta = 0;
162537da2899SCharles.Forsyth 	}
162637da2899SCharles.Forsyth 
162737da2899SCharles.Forsyth 	for(i=0; i<dx; i++){
162837da2899SCharles.Forsyth 		u = w[0] | (w[1]<<8) | (w[2]<<16) | (w[3]<<24);
162937da2899SCharles.Forsyth DBG print("u %.8lux...", u);
163037da2899SCharles.Forsyth 		u &= mask;
163137da2899SCharles.Forsyth DBG print("&mask %.8lux...", u);
163237da2899SCharles.Forsyth 		if(isgrey){
163337da2899SCharles.Forsyth 			u |= ((*grey >> (8-img->nbits[CGrey])) & img->mask[CGrey]) << img->shift[CGrey];
163437da2899SCharles.Forsyth DBG print("|grey %.8lux...", u);
163537da2899SCharles.Forsyth 			grey += delta;
163637da2899SCharles.Forsyth 		}else{
163737da2899SCharles.Forsyth 			u |= ((*red >> (8-img->nbits[CRed])) & img->mask[CRed]) << img->shift[CRed];
163837da2899SCharles.Forsyth 			u |= ((*grn >> (8-img->nbits[CGreen])) & img->mask[CGreen]) << img->shift[CGreen];
163937da2899SCharles.Forsyth 			u |= ((*blu >> (8-img->nbits[CBlue])) & img->mask[CBlue]) << img->shift[CBlue];
164037da2899SCharles.Forsyth 			red += delta;
164137da2899SCharles.Forsyth 			grn += delta;
164237da2899SCharles.Forsyth 			blu += delta;
164337da2899SCharles.Forsyth DBG print("|rgb %.8lux...", u);
164437da2899SCharles.Forsyth 		}
164537da2899SCharles.Forsyth 
164637da2899SCharles.Forsyth 		if(isalpha){
164737da2899SCharles.Forsyth 			u |= ((*alpha >> (8-img->nbits[CAlpha])) & img->mask[CAlpha]) << img->shift[CAlpha];
164837da2899SCharles.Forsyth 			alpha += adelta;
164937da2899SCharles.Forsyth DBG print("|alpha %.8lux...", u);
165037da2899SCharles.Forsyth 		}
165137da2899SCharles.Forsyth 
165237da2899SCharles.Forsyth 		w[0] = u;
165337da2899SCharles.Forsyth 		w[1] = u>>8;
165437da2899SCharles.Forsyth 		w[2] = u>>16;
165537da2899SCharles.Forsyth 		w[3] = u>>24;
165637da2899SCharles.Forsyth 		w += nb;
165737da2899SCharles.Forsyth 	}
165837da2899SCharles.Forsyth }
165937da2899SCharles.Forsyth #undef DBG
166037da2899SCharles.Forsyth 
166137da2899SCharles.Forsyth static Readfn*
readfn(Memimage * img)166237da2899SCharles.Forsyth readfn(Memimage *img)
166337da2899SCharles.Forsyth {
166437da2899SCharles.Forsyth 	if(img->depth < 8)
166537da2899SCharles.Forsyth 		return readnbit;
166637da2899SCharles.Forsyth 	if(img->nbits[CMap] == 8)
166737da2899SCharles.Forsyth 		return readcmap;
166837da2899SCharles.Forsyth 	return readbyte;
166937da2899SCharles.Forsyth }
167037da2899SCharles.Forsyth 
167137da2899SCharles.Forsyth static Readfn*
readalphafn(Memimage * m)167237da2899SCharles.Forsyth readalphafn(Memimage *m)
167337da2899SCharles.Forsyth {
167437da2899SCharles.Forsyth 	USED(m);
167537da2899SCharles.Forsyth 	return readbyte;
167637da2899SCharles.Forsyth }
167737da2899SCharles.Forsyth 
167837da2899SCharles.Forsyth static Writefn*
writefn(Memimage * img)167937da2899SCharles.Forsyth writefn(Memimage *img)
168037da2899SCharles.Forsyth {
168137da2899SCharles.Forsyth 	if(img->depth < 8)
168237da2899SCharles.Forsyth 		return writenbit;
168337da2899SCharles.Forsyth 	if(img->chan == CMAP8)
168437da2899SCharles.Forsyth 		return writecmap;
168537da2899SCharles.Forsyth 	return writebyte;
168637da2899SCharles.Forsyth }
168737da2899SCharles.Forsyth 
168837da2899SCharles.Forsyth static void
nullwrite(Param * p,uchar * s,Buffer b)168937da2899SCharles.Forsyth nullwrite(Param *p, uchar *s, Buffer b)
169037da2899SCharles.Forsyth {
169137da2899SCharles.Forsyth 	USED(p);
169237da2899SCharles.Forsyth 	USED(s);
169337da2899SCharles.Forsyth 	USED(b.grey);
169437da2899SCharles.Forsyth }
169537da2899SCharles.Forsyth 
169637da2899SCharles.Forsyth static Buffer
readptr(Param * p,uchar * s,int y)169737da2899SCharles.Forsyth readptr(Param *p, uchar *s, int y)
169837da2899SCharles.Forsyth {
169937da2899SCharles.Forsyth 	Buffer b;
170037da2899SCharles.Forsyth 	uchar *q;
170137da2899SCharles.Forsyth 
170237da2899SCharles.Forsyth 	USED(s);
170337da2899SCharles.Forsyth 	q = p->bytermin + y*p->bwidth;
170437da2899SCharles.Forsyth 	b.red = q;	/* ptr to data */
170537da2899SCharles.Forsyth 	b.grn = b.blu = b.grey = b.alpha = nil;
170637da2899SCharles.Forsyth 	b.rgba = (ulong*)q;
170737da2899SCharles.Forsyth 	b.delta = p->img->depth/8;
170837da2899SCharles.Forsyth 	return b;
170937da2899SCharles.Forsyth }
171037da2899SCharles.Forsyth 
171137da2899SCharles.Forsyth static Buffer
boolmemmove(Buffer bdst,Buffer bsrc,Buffer b1,int dx,int i,int o)171237da2899SCharles.Forsyth boolmemmove(Buffer bdst, Buffer bsrc, Buffer b1, int dx, int i, int o)
171337da2899SCharles.Forsyth {
171437da2899SCharles.Forsyth 	USED(i);
171537da2899SCharles.Forsyth 	USED(o);
171637da2899SCharles.Forsyth 	USED(b1.grey);
171737da2899SCharles.Forsyth 	memmove(bdst.red, bsrc.red, dx*bdst.delta);
171837da2899SCharles.Forsyth 	return bdst;
171937da2899SCharles.Forsyth }
172037da2899SCharles.Forsyth 
172137da2899SCharles.Forsyth static Buffer
boolcopy8(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int i,int o)172237da2899SCharles.Forsyth boolcopy8(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int i, int o)
172337da2899SCharles.Forsyth {
172437da2899SCharles.Forsyth 	uchar *m, *r, *w, *ew;
172537da2899SCharles.Forsyth 
172637da2899SCharles.Forsyth 	USED(i);
172737da2899SCharles.Forsyth 	USED(o);
172837da2899SCharles.Forsyth 	m = bmask.grey;
172937da2899SCharles.Forsyth 	w = bdst.red;
173037da2899SCharles.Forsyth 	r = bsrc.red;
173137da2899SCharles.Forsyth 	ew = w+dx;
173237da2899SCharles.Forsyth 	for(; w < ew; w++,r++)
173337da2899SCharles.Forsyth 		if(*m++)
173437da2899SCharles.Forsyth 			*w = *r;
173537da2899SCharles.Forsyth 	return bdst;	/* not used */
173637da2899SCharles.Forsyth }
173737da2899SCharles.Forsyth 
173837da2899SCharles.Forsyth static Buffer
boolcopy16(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int i,int o)173937da2899SCharles.Forsyth boolcopy16(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int i, int o)
174037da2899SCharles.Forsyth {
174137da2899SCharles.Forsyth 	uchar *m;
174237da2899SCharles.Forsyth 	ushort *r, *w, *ew;
174337da2899SCharles.Forsyth 
174437da2899SCharles.Forsyth 	USED(i);
174537da2899SCharles.Forsyth 	USED(o);
174637da2899SCharles.Forsyth 	m = bmask.grey;
174737da2899SCharles.Forsyth 	w = (ushort*)bdst.red;
174837da2899SCharles.Forsyth 	r = (ushort*)bsrc.red;
174937da2899SCharles.Forsyth 	ew = w+dx;
175037da2899SCharles.Forsyth 	for(; w < ew; w++,r++)
175137da2899SCharles.Forsyth 		if(*m++)
175237da2899SCharles.Forsyth 			*w = *r;
175337da2899SCharles.Forsyth 	return bdst;	/* not used */
175437da2899SCharles.Forsyth }
175537da2899SCharles.Forsyth 
175637da2899SCharles.Forsyth static Buffer
boolcopy24(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int i,int o)175737da2899SCharles.Forsyth boolcopy24(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int i, int o)
175837da2899SCharles.Forsyth {
175937da2899SCharles.Forsyth 	uchar *m;
176037da2899SCharles.Forsyth 	uchar *r, *w, *ew;
176137da2899SCharles.Forsyth 
176237da2899SCharles.Forsyth 	USED(i);
176337da2899SCharles.Forsyth 	USED(o);
176437da2899SCharles.Forsyth 	m = bmask.grey;
176537da2899SCharles.Forsyth 	w = bdst.red;
176637da2899SCharles.Forsyth 	r = bsrc.red;
176737da2899SCharles.Forsyth 	ew = w+dx*3;
176837da2899SCharles.Forsyth 	while(w < ew){
176937da2899SCharles.Forsyth 		if(*m++){
177037da2899SCharles.Forsyth 			*w++ = *r++;
177137da2899SCharles.Forsyth 			*w++ = *r++;
177237da2899SCharles.Forsyth 			*w++ = *r++;
177337da2899SCharles.Forsyth 		}else{
177437da2899SCharles.Forsyth 			w += 3;
177537da2899SCharles.Forsyth 			r += 3;
177637da2899SCharles.Forsyth 		}
177737da2899SCharles.Forsyth 	}
177837da2899SCharles.Forsyth 	return bdst;	/* not used */
177937da2899SCharles.Forsyth }
178037da2899SCharles.Forsyth 
178137da2899SCharles.Forsyth static Buffer
boolcopy32(Buffer bdst,Buffer bsrc,Buffer bmask,int dx,int i,int o)178237da2899SCharles.Forsyth boolcopy32(Buffer bdst, Buffer bsrc, Buffer bmask, int dx, int i, int o)
178337da2899SCharles.Forsyth {
178437da2899SCharles.Forsyth 	uchar *m;
178537da2899SCharles.Forsyth 	ulong *r, *w, *ew;
178637da2899SCharles.Forsyth 
178737da2899SCharles.Forsyth 	USED(i);
178837da2899SCharles.Forsyth 	USED(o);
178937da2899SCharles.Forsyth 	m = bmask.grey;
179037da2899SCharles.Forsyth 	w = (ulong*)bdst.red;
179137da2899SCharles.Forsyth 	r = (ulong*)bsrc.red;
179237da2899SCharles.Forsyth 	ew = w+dx;
179337da2899SCharles.Forsyth 	for(; w < ew; w++,r++)
179437da2899SCharles.Forsyth 		if(*m++)
179537da2899SCharles.Forsyth 			*w = *r;
179637da2899SCharles.Forsyth 	return bdst;	/* not used */
179737da2899SCharles.Forsyth }
179837da2899SCharles.Forsyth 
179937da2899SCharles.Forsyth static Buffer
genconv(Param * p,uchar * buf,int y)180037da2899SCharles.Forsyth genconv(Param *p, uchar *buf, int y)
180137da2899SCharles.Forsyth {
180237da2899SCharles.Forsyth 	Buffer b;
180337da2899SCharles.Forsyth 	int nb;
180437da2899SCharles.Forsyth 	uchar *r, *w, *ew;
180537da2899SCharles.Forsyth 
180637da2899SCharles.Forsyth 	/* read from source into RGB format in convbuf */
180737da2899SCharles.Forsyth 	b = p->convreadcall(p, p->convbuf, y);
180837da2899SCharles.Forsyth 
180937da2899SCharles.Forsyth 	/* write RGB format into dst format in buf */
181037da2899SCharles.Forsyth 	p->convwritecall(p->convdpar, buf, b);
181137da2899SCharles.Forsyth 
181237da2899SCharles.Forsyth 	if(p->convdx){
181337da2899SCharles.Forsyth 		nb = p->convdpar->img->depth/8;
181437da2899SCharles.Forsyth 		r = buf;
181537da2899SCharles.Forsyth 		w = buf+nb*p->dx;
181637da2899SCharles.Forsyth 		ew = buf+nb*p->convdx;
181737da2899SCharles.Forsyth 		while(w<ew)
181837da2899SCharles.Forsyth 			*w++ = *r++;
181937da2899SCharles.Forsyth 	}
182037da2899SCharles.Forsyth 
182137da2899SCharles.Forsyth 	b.red = buf;
182237da2899SCharles.Forsyth 	b.blu = b.grn = b.grey = b.alpha = nil;
182337da2899SCharles.Forsyth 	b.rgba = (ulong*)buf;
182437da2899SCharles.Forsyth 	b.delta = 0;
182537da2899SCharles.Forsyth 
182637da2899SCharles.Forsyth 	return b;
182737da2899SCharles.Forsyth }
182837da2899SCharles.Forsyth 
182937da2899SCharles.Forsyth static Readfn*
convfn(Memimage * dst,Param * dpar,Memimage * src,Param * spar,int * ndrawbuf)183037da2899SCharles.Forsyth convfn(Memimage *dst, Param *dpar, Memimage *src, Param *spar, int *ndrawbuf)
183137da2899SCharles.Forsyth {
183237da2899SCharles.Forsyth 	if(dst->chan == src->chan && !(src->flags&Frepl)){
183337da2899SCharles.Forsyth //if(drawdebug) iprint("readptr...");
183437da2899SCharles.Forsyth 		return readptr;
183537da2899SCharles.Forsyth 	}
183637da2899SCharles.Forsyth 
183737da2899SCharles.Forsyth 	if(dst->chan==CMAP8 && (src->chan==GREY1||src->chan==GREY2||src->chan==GREY4)){
183837da2899SCharles.Forsyth 		/* cheat because we know the replicated value is exactly the color map entry. */
183937da2899SCharles.Forsyth //if(drawdebug) iprint("Readnbit...");
184037da2899SCharles.Forsyth 		return readnbit;
184137da2899SCharles.Forsyth 	}
184237da2899SCharles.Forsyth 
184337da2899SCharles.Forsyth 	spar->convreadcall = readfn(src);
184437da2899SCharles.Forsyth 	spar->convwritecall = writefn(dst);
184537da2899SCharles.Forsyth 	spar->convdpar = dpar;
184637da2899SCharles.Forsyth 
184737da2899SCharles.Forsyth 	/* allocate a conversion buffer */
184837da2899SCharles.Forsyth 	spar->convbufoff = *ndrawbuf;
184937da2899SCharles.Forsyth 	*ndrawbuf += spar->dx*4;
185037da2899SCharles.Forsyth 
185137da2899SCharles.Forsyth 	if(spar->dx > Dx(spar->img->r)){
185237da2899SCharles.Forsyth 		spar->convdx = spar->dx;
185337da2899SCharles.Forsyth 		spar->dx = Dx(spar->img->r);
185437da2899SCharles.Forsyth 	}
185537da2899SCharles.Forsyth 
185637da2899SCharles.Forsyth //if(drawdebug) iprint("genconv...");
185737da2899SCharles.Forsyth 	return genconv;
185837da2899SCharles.Forsyth }
185937da2899SCharles.Forsyth 
186037da2899SCharles.Forsyth static ulong
pixelbits(Memimage * i,Point pt)186137da2899SCharles.Forsyth pixelbits(Memimage *i, Point pt)
186237da2899SCharles.Forsyth {
186337da2899SCharles.Forsyth 	uchar *p;
186437da2899SCharles.Forsyth 	ulong val;
186537da2899SCharles.Forsyth 	int off, bpp, npack;
186637da2899SCharles.Forsyth 
186737da2899SCharles.Forsyth 	val = 0;
186837da2899SCharles.Forsyth 	p = byteaddr(i, pt);
186937da2899SCharles.Forsyth 	switch(bpp=i->depth){
187037da2899SCharles.Forsyth 	case 1:
187137da2899SCharles.Forsyth 	case 2:
187237da2899SCharles.Forsyth 	case 4:
187337da2899SCharles.Forsyth 		npack = 8/bpp;
187437da2899SCharles.Forsyth 		off = pt.x%npack;
187537da2899SCharles.Forsyth 		val = p[0] >> bpp*(npack-1-off);
187637da2899SCharles.Forsyth 		val &= (1<<bpp)-1;
187737da2899SCharles.Forsyth 		break;
187837da2899SCharles.Forsyth 	case 8:
187937da2899SCharles.Forsyth 		val = p[0];
188037da2899SCharles.Forsyth 		break;
188137da2899SCharles.Forsyth 	case 16:
188237da2899SCharles.Forsyth 		val = p[0]|(p[1]<<8);
188337da2899SCharles.Forsyth 		break;
188437da2899SCharles.Forsyth 	case 24:
188537da2899SCharles.Forsyth 		val = p[0]|(p[1]<<8)|(p[2]<<16);
188637da2899SCharles.Forsyth 		break;
188737da2899SCharles.Forsyth 	case 32:
188837da2899SCharles.Forsyth 		val = p[0]|(p[1]<<8)|(p[2]<<16)|(p[3]<<24);
188937da2899SCharles.Forsyth 		break;
189037da2899SCharles.Forsyth 	}
189137da2899SCharles.Forsyth 	while(bpp<32){
189237da2899SCharles.Forsyth 		val |= val<<bpp;
189337da2899SCharles.Forsyth 		bpp *= 2;
189437da2899SCharles.Forsyth 	}
189537da2899SCharles.Forsyth 	return val;
189637da2899SCharles.Forsyth }
189737da2899SCharles.Forsyth 
189837da2899SCharles.Forsyth static Calcfn*
boolcopyfn(Memimage * img,Memimage * mask)189937da2899SCharles.Forsyth boolcopyfn(Memimage *img, Memimage *mask)
190037da2899SCharles.Forsyth {
190137da2899SCharles.Forsyth 	if(mask->flags&Frepl && Dx(mask->r)==1 && Dy(mask->r)==1 && pixelbits(mask, mask->r.min)==~0)
190237da2899SCharles.Forsyth 		return boolmemmove;
190337da2899SCharles.Forsyth 
190437da2899SCharles.Forsyth 	switch(img->depth){
190537da2899SCharles.Forsyth 	case 8:
190637da2899SCharles.Forsyth 		return boolcopy8;
190737da2899SCharles.Forsyth 	case 16:
190837da2899SCharles.Forsyth 		return boolcopy16;
190937da2899SCharles.Forsyth 	case 24:
191037da2899SCharles.Forsyth 		return boolcopy24;
191137da2899SCharles.Forsyth 	case 32:
191237da2899SCharles.Forsyth 		return boolcopy32;
191337da2899SCharles.Forsyth 	default:
191437da2899SCharles.Forsyth 		assert(0 /* boolcopyfn */);
191537da2899SCharles.Forsyth 	}
191637da2899SCharles.Forsyth 	return nil;
191737da2899SCharles.Forsyth }
191837da2899SCharles.Forsyth 
191937da2899SCharles.Forsyth /*
192037da2899SCharles.Forsyth  * Optimized draw for filling and scrolling; uses memset and memmove.
192137da2899SCharles.Forsyth  */
192237da2899SCharles.Forsyth static void
memsetb(void * vp,uchar val,int n)192337da2899SCharles.Forsyth memsetb(void *vp, uchar val, int n)
192437da2899SCharles.Forsyth {
192537da2899SCharles.Forsyth 	uchar *p, *ep;
192637da2899SCharles.Forsyth 
192737da2899SCharles.Forsyth 	p = vp;
192837da2899SCharles.Forsyth 	ep = p+n;
192937da2899SCharles.Forsyth 	while(p<ep)
193037da2899SCharles.Forsyth 		*p++ = val;
193137da2899SCharles.Forsyth }
193237da2899SCharles.Forsyth 
193337da2899SCharles.Forsyth static void
memsets(void * vp,ushort val,int n)193437da2899SCharles.Forsyth memsets(void *vp, ushort val, int n)
193537da2899SCharles.Forsyth {
193637da2899SCharles.Forsyth 	ushort *p, *ep;
193737da2899SCharles.Forsyth 
193837da2899SCharles.Forsyth 	p = vp;
193937da2899SCharles.Forsyth 	ep = p+n;
194037da2899SCharles.Forsyth 	while(p<ep)
194137da2899SCharles.Forsyth 		*p++ = val;
194237da2899SCharles.Forsyth }
194337da2899SCharles.Forsyth 
194437da2899SCharles.Forsyth static void
memsetl(void * vp,ulong val,int n)194537da2899SCharles.Forsyth memsetl(void *vp, ulong val, int n)
194637da2899SCharles.Forsyth {
194737da2899SCharles.Forsyth 	ulong *p, *ep;
194837da2899SCharles.Forsyth 
194937da2899SCharles.Forsyth 	p = vp;
195037da2899SCharles.Forsyth 	ep = p+n;
195137da2899SCharles.Forsyth 	while(p<ep)
195237da2899SCharles.Forsyth 		*p++ = val;
195337da2899SCharles.Forsyth }
195437da2899SCharles.Forsyth 
195537da2899SCharles.Forsyth static void
memset24(void * vp,ulong val,int n)195637da2899SCharles.Forsyth memset24(void *vp, ulong val, int n)
195737da2899SCharles.Forsyth {
195837da2899SCharles.Forsyth 	uchar *p, *ep;
195937da2899SCharles.Forsyth 	uchar a,b,c;
196037da2899SCharles.Forsyth 
196137da2899SCharles.Forsyth 	p = vp;
196237da2899SCharles.Forsyth 	ep = p+3*n;
196337da2899SCharles.Forsyth 	a = val;
196437da2899SCharles.Forsyth 	b = val>>8;
196537da2899SCharles.Forsyth 	c = val>>16;
196637da2899SCharles.Forsyth 	while(p<ep){
196737da2899SCharles.Forsyth 		*p++ = a;
196837da2899SCharles.Forsyth 		*p++ = b;
196937da2899SCharles.Forsyth 		*p++ = c;
197037da2899SCharles.Forsyth 	}
197137da2899SCharles.Forsyth }
197237da2899SCharles.Forsyth 
197337da2899SCharles.Forsyth static ulong
imgtorgba(Memimage * img,ulong val)197437da2899SCharles.Forsyth imgtorgba(Memimage *img, ulong val)
197537da2899SCharles.Forsyth {
197637da2899SCharles.Forsyth 	uchar r, g, b, a;
197737da2899SCharles.Forsyth 	int nb, ov, v;
197837da2899SCharles.Forsyth 	ulong chan;
197937da2899SCharles.Forsyth 	uchar *p;
198037da2899SCharles.Forsyth 
198137da2899SCharles.Forsyth 	a = 0xFF;
198237da2899SCharles.Forsyth 	r = g = b = 0xAA;	/* garbage */
198337da2899SCharles.Forsyth 	for(chan=img->chan; chan; chan>>=8){
198437da2899SCharles.Forsyth 		nb = NBITS(chan);
198537da2899SCharles.Forsyth 		ov = v = val&((1<<nb)-1);
198637da2899SCharles.Forsyth 		val >>= nb;
198737da2899SCharles.Forsyth 
198837da2899SCharles.Forsyth 		while(nb < 8){
198937da2899SCharles.Forsyth 			v |= v<<nb;
199037da2899SCharles.Forsyth 			nb *= 2;
199137da2899SCharles.Forsyth 		}
199237da2899SCharles.Forsyth 		v >>= (nb-8);
199337da2899SCharles.Forsyth 
199437da2899SCharles.Forsyth 		switch(TYPE(chan)){
199537da2899SCharles.Forsyth 		case CRed:
199637da2899SCharles.Forsyth 			r = v;
199737da2899SCharles.Forsyth 			break;
199837da2899SCharles.Forsyth 		case CGreen:
199937da2899SCharles.Forsyth 			g = v;
200037da2899SCharles.Forsyth 			break;
200137da2899SCharles.Forsyth 		case CBlue:
200237da2899SCharles.Forsyth 			b = v;
200337da2899SCharles.Forsyth 			break;
200437da2899SCharles.Forsyth 		case CAlpha:
200537da2899SCharles.Forsyth 			a = v;
200637da2899SCharles.Forsyth 			break;
200737da2899SCharles.Forsyth 		case CGrey:
200837da2899SCharles.Forsyth 			r = g = b = v;
200937da2899SCharles.Forsyth 			break;
201037da2899SCharles.Forsyth 		case CMap:
201137da2899SCharles.Forsyth 			p = img->cmap->cmap2rgb+3*ov;
201237da2899SCharles.Forsyth 			r = *p++;
201337da2899SCharles.Forsyth 			g = *p++;
201437da2899SCharles.Forsyth 			b = *p;
201537da2899SCharles.Forsyth 			break;
201637da2899SCharles.Forsyth 		}
201737da2899SCharles.Forsyth 	}
201837da2899SCharles.Forsyth 	return (r<<24)|(g<<16)|(b<<8)|a;
201937da2899SCharles.Forsyth }
202037da2899SCharles.Forsyth 
202137da2899SCharles.Forsyth static ulong
rgbatoimg(Memimage * img,ulong rgba)202237da2899SCharles.Forsyth rgbatoimg(Memimage *img, ulong rgba)
202337da2899SCharles.Forsyth {
202437da2899SCharles.Forsyth 	ulong chan;
202537da2899SCharles.Forsyth 	int d, nb;
202637da2899SCharles.Forsyth 	ulong v;
202737da2899SCharles.Forsyth 	uchar *p, r, g, b, a, m;
202837da2899SCharles.Forsyth 
202937da2899SCharles.Forsyth 	v = 0;
203037da2899SCharles.Forsyth 	r = rgba>>24;
203137da2899SCharles.Forsyth 	g = rgba>>16;
203237da2899SCharles.Forsyth 	b = rgba>>8;
203337da2899SCharles.Forsyth 	a = rgba;
203437da2899SCharles.Forsyth 	d = 0;
203537da2899SCharles.Forsyth 	for(chan=img->chan; chan; chan>>=8){
203637da2899SCharles.Forsyth 		nb = NBITS(chan);
203737da2899SCharles.Forsyth 		switch(TYPE(chan)){
203837da2899SCharles.Forsyth 		case CRed:
203937da2899SCharles.Forsyth 			v |= (r>>(8-nb))<<d;
204037da2899SCharles.Forsyth 			break;
204137da2899SCharles.Forsyth 		case CGreen:
204237da2899SCharles.Forsyth 			v |= (g>>(8-nb))<<d;
204337da2899SCharles.Forsyth 			break;
204437da2899SCharles.Forsyth 		case CBlue:
204537da2899SCharles.Forsyth 			v |= (b>>(8-nb))<<d;
204637da2899SCharles.Forsyth 			break;
204737da2899SCharles.Forsyth 		case CAlpha:
204837da2899SCharles.Forsyth 			v |= (a>>(8-nb))<<d;
204937da2899SCharles.Forsyth 			break;
205037da2899SCharles.Forsyth 		case CMap:
205137da2899SCharles.Forsyth 			p = img->cmap->rgb2cmap;
205237da2899SCharles.Forsyth 			m = p[(r>>4)*256+(g>>4)*16+(b>>4)];
205337da2899SCharles.Forsyth 			v |= (m>>(8-nb))<<d;
205437da2899SCharles.Forsyth 			break;
205537da2899SCharles.Forsyth 		case CGrey:
205637da2899SCharles.Forsyth 			m = RGB2K(r,g,b);
205737da2899SCharles.Forsyth 			v |= (m>>(8-nb))<<d;
205837da2899SCharles.Forsyth 			break;
205937da2899SCharles.Forsyth 		}
206037da2899SCharles.Forsyth 		d += nb;
206137da2899SCharles.Forsyth 	}
206237da2899SCharles.Forsyth //	print("rgba2img %.8lux = %.*lux\n", rgba, 2*d/8, v);
206337da2899SCharles.Forsyth 	return v;
206437da2899SCharles.Forsyth }
206537da2899SCharles.Forsyth 
206637da2899SCharles.Forsyth #define DBG if(0)
206737da2899SCharles.Forsyth static int
memoptdraw(Memdrawparam * par)206837da2899SCharles.Forsyth memoptdraw(Memdrawparam *par)
206937da2899SCharles.Forsyth {
207037da2899SCharles.Forsyth 	int m, y, dy, dx, op;
207137da2899SCharles.Forsyth 	ulong v;
207237da2899SCharles.Forsyth 	Memimage *src;
207337da2899SCharles.Forsyth 	Memimage *dst;
207437da2899SCharles.Forsyth 
207537da2899SCharles.Forsyth 	dx = Dx(par->r);
207637da2899SCharles.Forsyth 	dy = Dy(par->r);
207737da2899SCharles.Forsyth 	src = par->src;
207837da2899SCharles.Forsyth 	dst = par->dst;
207937da2899SCharles.Forsyth 	op = par->op;
208037da2899SCharles.Forsyth 
208137da2899SCharles.Forsyth DBG print("state %lux mval %lux dd %d\n", par->state, par->mval, dst->depth);
208237da2899SCharles.Forsyth 	/*
208337da2899SCharles.Forsyth 	 * If we have an opaque mask and source is one opaque pixel we can convert to the
208437da2899SCharles.Forsyth 	 * destination format and just replicate with memset.
208537da2899SCharles.Forsyth 	 */
208637da2899SCharles.Forsyth 	m = Simplesrc|Simplemask|Fullmask;
208737da2899SCharles.Forsyth 	if((par->state&m)==m && (par->srgba&0xFF) == 0xFF && (op ==S || op == SoverD)){
208837da2899SCharles.Forsyth 		uchar *dp, p[4];
208937da2899SCharles.Forsyth 		int d, dwid, ppb, np, nb;
209037da2899SCharles.Forsyth 		uchar lm, rm;
209137da2899SCharles.Forsyth 
209237da2899SCharles.Forsyth DBG print("memopt, dst %p, dst->data->bdata %p\n", dst, dst->data->bdata);
209337da2899SCharles.Forsyth 		dwid = dst->width*sizeof(ulong);
209437da2899SCharles.Forsyth 		dp = byteaddr(dst, par->r.min);
209537da2899SCharles.Forsyth 		v = par->sdval;
209637da2899SCharles.Forsyth DBG print("sdval %lud, depth %d\n", v, dst->depth);
209737da2899SCharles.Forsyth 		switch(dst->depth){
209837da2899SCharles.Forsyth 		case 1:
209937da2899SCharles.Forsyth 		case 2:
210037da2899SCharles.Forsyth 		case 4:
210137da2899SCharles.Forsyth 			for(d=dst->depth; d<8; d*=2)
210237da2899SCharles.Forsyth 				v |= (v<<d);
210337da2899SCharles.Forsyth 			ppb = 8/dst->depth;	/* pixels per byte */
210437da2899SCharles.Forsyth 			m = ppb-1;
210537da2899SCharles.Forsyth 			/* left edge */
210637da2899SCharles.Forsyth 			np = par->r.min.x&m;		/* no. pixels unused on left side of word */
210737da2899SCharles.Forsyth 			dx -= (ppb-np);
210837da2899SCharles.Forsyth 			nb = 8 - np * dst->depth;		/* no. bits used on right side of word */
210937da2899SCharles.Forsyth 			lm = (1<<nb)-1;
211037da2899SCharles.Forsyth DBG print("np %d x %d nb %d lm %ux ppb %d m %ux\n", np, par->r.min.x, nb, lm, ppb, m);
211137da2899SCharles.Forsyth 
211237da2899SCharles.Forsyth 			/* right edge */
211337da2899SCharles.Forsyth 			np = par->r.max.x&m;	/* no. pixels used on left side of word */
211437da2899SCharles.Forsyth 			dx -= np;
211537da2899SCharles.Forsyth 			nb = 8 - np * dst->depth;		/* no. bits unused on right side of word */
211637da2899SCharles.Forsyth 			rm = ~((1<<nb)-1);
211737da2899SCharles.Forsyth DBG print("np %d x %d nb %d rm %ux ppb %d m %ux\n", np, par->r.max.x, nb, rm, ppb, m);
211837da2899SCharles.Forsyth 
211937da2899SCharles.Forsyth DBG print("dx %d Dx %d\n", dx, Dx(par->r));
212037da2899SCharles.Forsyth 			/* lm, rm are masks that are 1 where we should touch the bits */
212137da2899SCharles.Forsyth 			if(dx < 0){	/* just one byte */
212237da2899SCharles.Forsyth 				lm &= rm;
212337da2899SCharles.Forsyth 				for(y=0; y<dy; y++, dp+=dwid)
212437da2899SCharles.Forsyth 					*dp ^= (v ^ *dp) & lm;
212537da2899SCharles.Forsyth 			}else if(dx == 0){	/* no full bytes */
212637da2899SCharles.Forsyth 				if(lm)
212737da2899SCharles.Forsyth 					dwid--;
212837da2899SCharles.Forsyth 
212937da2899SCharles.Forsyth 				for(y=0; y<dy; y++, dp+=dwid){
213037da2899SCharles.Forsyth 					if(lm){
213137da2899SCharles.Forsyth DBG print("dp %p v %lux lm %ux (v ^ *dp) & lm %lux\n", dp, v, lm, (v^*dp)&lm);
213237da2899SCharles.Forsyth 						*dp ^= (v ^ *dp) & lm;
213337da2899SCharles.Forsyth 						dp++;
213437da2899SCharles.Forsyth 					}
213537da2899SCharles.Forsyth 					*dp ^= (v ^ *dp) & rm;
213637da2899SCharles.Forsyth 				}
213737da2899SCharles.Forsyth 			}else{		/* full bytes in middle */
213837da2899SCharles.Forsyth 				dx /= ppb;
213937da2899SCharles.Forsyth 				if(lm)
214037da2899SCharles.Forsyth 					dwid--;
214137da2899SCharles.Forsyth 				dwid -= dx;
214237da2899SCharles.Forsyth 
214337da2899SCharles.Forsyth 				for(y=0; y<dy; y++, dp+=dwid){
214437da2899SCharles.Forsyth 					if(lm){
214537da2899SCharles.Forsyth 						*dp ^= (v ^ *dp) & lm;
214637da2899SCharles.Forsyth 						dp++;
214737da2899SCharles.Forsyth 					}
214837da2899SCharles.Forsyth 					memset(dp, v, dx);
214937da2899SCharles.Forsyth 					dp += dx;
215037da2899SCharles.Forsyth 					*dp ^= (v ^ *dp) & rm;
215137da2899SCharles.Forsyth 				}
215237da2899SCharles.Forsyth 			}
215337da2899SCharles.Forsyth 			return 1;
215437da2899SCharles.Forsyth 		case 8:
215537da2899SCharles.Forsyth 			for(y=0; y<dy; y++, dp+=dwid)
215637da2899SCharles.Forsyth 				memset(dp, v, dx);
215737da2899SCharles.Forsyth 			return 1;
215837da2899SCharles.Forsyth 		case 16:
215937da2899SCharles.Forsyth 			p[0] = v;		/* make little endian */
216037da2899SCharles.Forsyth 			p[1] = v>>8;
216137da2899SCharles.Forsyth 			v = *(ushort*)p;
216237da2899SCharles.Forsyth DBG print("dp=%p; dx=%d; for(y=0; y<%d; y++, dp+=%d)\nmemsets(dp, v, dx);\n",
216337da2899SCharles.Forsyth 	dp, dx, dy, dwid);
216437da2899SCharles.Forsyth 			for(y=0; y<dy; y++, dp+=dwid)
216537da2899SCharles.Forsyth 				memsets(dp, v, dx);
216637da2899SCharles.Forsyth 			return 1;
216737da2899SCharles.Forsyth 		case 24:
216837da2899SCharles.Forsyth 			for(y=0; y<dy; y++, dp+=dwid)
216937da2899SCharles.Forsyth 				memset24(dp, v, dx);
217037da2899SCharles.Forsyth 			return 1;
217137da2899SCharles.Forsyth 		case 32:
217237da2899SCharles.Forsyth 			p[0] = v;		/* make little endian */
217337da2899SCharles.Forsyth 			p[1] = v>>8;
217437da2899SCharles.Forsyth 			p[2] = v>>16;
217537da2899SCharles.Forsyth 			p[3] = v>>24;
217637da2899SCharles.Forsyth 			v = *(ulong*)p;
217737da2899SCharles.Forsyth 			for(y=0; y<dy; y++, dp+=dwid)
217837da2899SCharles.Forsyth 				memsetl(dp, v, dx);
217937da2899SCharles.Forsyth 			return 1;
218037da2899SCharles.Forsyth 		default:
218137da2899SCharles.Forsyth 			assert(0 /* bad dest depth in memoptdraw */);
218237da2899SCharles.Forsyth 		}
218337da2899SCharles.Forsyth 	}
218437da2899SCharles.Forsyth 
218537da2899SCharles.Forsyth 	/*
218637da2899SCharles.Forsyth 	 * If no source alpha, an opaque mask, we can just copy the
218737da2899SCharles.Forsyth 	 * source onto the destination.  If the channels are the same and
218837da2899SCharles.Forsyth 	 * the source is not replicated, memmove suffices.
218937da2899SCharles.Forsyth 	 */
219037da2899SCharles.Forsyth 	m = Simplemask|Fullmask;
219137da2899SCharles.Forsyth 	if((par->state&(m|Replsrc))==m && src->depth >= 8
219237da2899SCharles.Forsyth 	&& src->chan == dst->chan && (op == S || (op == SoverD && !(src->flags&Falpha)))){
219337da2899SCharles.Forsyth 		uchar *sp, *dp;
219437da2899SCharles.Forsyth 		long swid, dwid, nb;
219537da2899SCharles.Forsyth 		int dir;
219637da2899SCharles.Forsyth 
219737da2899SCharles.Forsyth 		if(src->data == dst->data && byteaddr(dst, par->r.min) > byteaddr(src, par->sr.min))
219837da2899SCharles.Forsyth 			dir = -1;
219937da2899SCharles.Forsyth 		else
220037da2899SCharles.Forsyth 			dir = 1;
220137da2899SCharles.Forsyth 
220237da2899SCharles.Forsyth 		swid = src->width*sizeof(ulong);
220337da2899SCharles.Forsyth 		dwid = dst->width*sizeof(ulong);
220437da2899SCharles.Forsyth 		sp = byteaddr(src, par->sr.min);
220537da2899SCharles.Forsyth 		dp = byteaddr(dst, par->r.min);
220637da2899SCharles.Forsyth 		if(dir == -1){
220737da2899SCharles.Forsyth 			sp += (dy-1)*swid;
220837da2899SCharles.Forsyth 			dp += (dy-1)*dwid;
220937da2899SCharles.Forsyth 			swid = -swid;
221037da2899SCharles.Forsyth 			dwid = -dwid;
221137da2899SCharles.Forsyth 		}
221237da2899SCharles.Forsyth 		nb = (dx*src->depth)/8;
221337da2899SCharles.Forsyth 		for(y=0; y<dy; y++, sp+=swid, dp+=dwid)
221437da2899SCharles.Forsyth 			memmove(dp, sp, nb);
221537da2899SCharles.Forsyth 		return 1;
221637da2899SCharles.Forsyth 	}
221737da2899SCharles.Forsyth 
221837da2899SCharles.Forsyth 	/*
221937da2899SCharles.Forsyth 	 * If we have a 1-bit mask, 1-bit source, and 1-bit destination, and
222037da2899SCharles.Forsyth 	 * they're all bit aligned, we can just use bit operators.  This happens
222137da2899SCharles.Forsyth 	 * when we're manipulating boolean masks, e.g. in the arc code.
222237da2899SCharles.Forsyth 	 */
222337da2899SCharles.Forsyth 	if((par->state&(Simplemask|Simplesrc|Replmask|Replsrc))==0
222437da2899SCharles.Forsyth 	&& dst->chan==GREY1 && src->chan==GREY1 && par->mask->chan==GREY1
222537da2899SCharles.Forsyth 	&& (par->r.min.x&7)==(par->sr.min.x&7) && (par->r.min.x&7)==(par->mr.min.x&7)){
222637da2899SCharles.Forsyth 		uchar *sp, *dp, *mp;
222737da2899SCharles.Forsyth 		uchar lm, rm;
222837da2899SCharles.Forsyth 		long swid, dwid, mwid;
222937da2899SCharles.Forsyth 		int i, x, dir;
223037da2899SCharles.Forsyth 
223137da2899SCharles.Forsyth 		sp = byteaddr(src, par->sr.min);
223237da2899SCharles.Forsyth 		dp = byteaddr(dst, par->r.min);
223337da2899SCharles.Forsyth 		mp = byteaddr(par->mask, par->mr.min);
223437da2899SCharles.Forsyth 		swid = src->width*sizeof(ulong);
223537da2899SCharles.Forsyth 		dwid = dst->width*sizeof(ulong);
223637da2899SCharles.Forsyth 		mwid = par->mask->width*sizeof(ulong);
223737da2899SCharles.Forsyth 
223837da2899SCharles.Forsyth 		if(src->data == dst->data && byteaddr(dst, par->r.min) > byteaddr(src, par->sr.min)){
223937da2899SCharles.Forsyth 			dir = -1;
224037da2899SCharles.Forsyth 		}else
224137da2899SCharles.Forsyth 			dir = 1;
224237da2899SCharles.Forsyth 
224337da2899SCharles.Forsyth 		lm = 0xFF>>(par->r.min.x&7);
224437da2899SCharles.Forsyth 		rm = 0xFF<<(8-(par->r.max.x&7));
224537da2899SCharles.Forsyth 		dx -= (8-(par->r.min.x&7)) + (par->r.max.x&7);
224637da2899SCharles.Forsyth 
224737da2899SCharles.Forsyth 		if(dx < 0){	/* one byte wide */
224837da2899SCharles.Forsyth 			lm &= rm;
224937da2899SCharles.Forsyth 			if(dir == -1){
225037da2899SCharles.Forsyth 				dp += dwid*(dy-1);
225137da2899SCharles.Forsyth 				sp += swid*(dy-1);
225237da2899SCharles.Forsyth 				mp += mwid*(dy-1);
225337da2899SCharles.Forsyth 				dwid = -dwid;
225437da2899SCharles.Forsyth 				swid = -swid;
225537da2899SCharles.Forsyth 				mwid = -mwid;
225637da2899SCharles.Forsyth 			}
225737da2899SCharles.Forsyth 			for(y=0; y<dy; y++){
225837da2899SCharles.Forsyth 				*dp ^= (*dp ^ *sp) & *mp & lm;
225937da2899SCharles.Forsyth 				dp += dwid;
226037da2899SCharles.Forsyth 				sp += swid;
226137da2899SCharles.Forsyth 				mp += mwid;
226237da2899SCharles.Forsyth 			}
226337da2899SCharles.Forsyth 			return 1;
226437da2899SCharles.Forsyth 		}
226537da2899SCharles.Forsyth 
226637da2899SCharles.Forsyth 		dx /= 8;
226737da2899SCharles.Forsyth 		if(dir == 1){
226837da2899SCharles.Forsyth 			i = (lm!=0)+dx+(rm!=0);
226937da2899SCharles.Forsyth 			mwid -= i;
227037da2899SCharles.Forsyth 			swid -= i;
227137da2899SCharles.Forsyth 			dwid -= i;
227237da2899SCharles.Forsyth 			for(y=0; y<dy; y++, dp+=dwid, sp+=swid, mp+=mwid){
227337da2899SCharles.Forsyth 				if(lm){
227437da2899SCharles.Forsyth 					*dp ^= (*dp ^ *sp++) & *mp++ & lm;
227537da2899SCharles.Forsyth 					dp++;
227637da2899SCharles.Forsyth 				}
227737da2899SCharles.Forsyth 				for(x=0; x<dx; x++){
227837da2899SCharles.Forsyth 					*dp ^= (*dp ^ *sp++) & *mp++;
227937da2899SCharles.Forsyth 					dp++;
228037da2899SCharles.Forsyth 				}
228137da2899SCharles.Forsyth 				if(rm){
228237da2899SCharles.Forsyth 					*dp ^= (*dp ^ *sp++) & *mp++ & rm;
228337da2899SCharles.Forsyth 					dp++;
228437da2899SCharles.Forsyth 				}
228537da2899SCharles.Forsyth 			}
228637da2899SCharles.Forsyth 			return 1;
228737da2899SCharles.Forsyth 		}else{
228837da2899SCharles.Forsyth 		/* dir == -1 */
228937da2899SCharles.Forsyth 			i = (lm!=0)+dx+(rm!=0);
229037da2899SCharles.Forsyth 			dp += dwid*(dy-1)+i-1;
229137da2899SCharles.Forsyth 			sp += swid*(dy-1)+i-1;
229237da2899SCharles.Forsyth 			mp += mwid*(dy-1)+i-1;
229337da2899SCharles.Forsyth 			dwid = -dwid+i;
229437da2899SCharles.Forsyth 			swid = -swid+i;
229537da2899SCharles.Forsyth 			mwid = -mwid+i;
229637da2899SCharles.Forsyth 			for(y=0; y<dy; y++, dp+=dwid, sp+=swid, mp+=mwid){
229737da2899SCharles.Forsyth 				if(rm){
229837da2899SCharles.Forsyth 					*dp ^= (*dp ^ *sp--) & *mp-- & rm;
229937da2899SCharles.Forsyth 					dp--;
230037da2899SCharles.Forsyth 				}
230137da2899SCharles.Forsyth 				for(x=0; x<dx; x++){
230237da2899SCharles.Forsyth 					*dp ^= (*dp ^ *sp--) & *mp--;
230337da2899SCharles.Forsyth 					dp--;
230437da2899SCharles.Forsyth 				}
230537da2899SCharles.Forsyth 				if(lm){
230637da2899SCharles.Forsyth 					*dp ^= (*dp ^ *sp--) & *mp-- & lm;
230737da2899SCharles.Forsyth 					dp--;
230837da2899SCharles.Forsyth 				}
230937da2899SCharles.Forsyth 			}
231037da2899SCharles.Forsyth 		}
231137da2899SCharles.Forsyth 		return 1;
231237da2899SCharles.Forsyth 	}
231337da2899SCharles.Forsyth 	return 0;
231437da2899SCharles.Forsyth }
231537da2899SCharles.Forsyth #undef DBG
231637da2899SCharles.Forsyth 
231737da2899SCharles.Forsyth /*
231837da2899SCharles.Forsyth  * Boolean character drawing.
231937da2899SCharles.Forsyth  * Solid opaque color through a 1-bit greyscale mask.
232037da2899SCharles.Forsyth  */
232137da2899SCharles.Forsyth #define DBG if(0)
232237da2899SCharles.Forsyth static int
chardraw(Memdrawparam * par)232337da2899SCharles.Forsyth chardraw(Memdrawparam *par)
232437da2899SCharles.Forsyth {
232537da2899SCharles.Forsyth 	ulong bits;
232637da2899SCharles.Forsyth 	int i, ddepth, dy, dx, x, bx, ex, y, npack, bsh, depth, op;
232737da2899SCharles.Forsyth 	ulong v, maskwid, dstwid;
232837da2899SCharles.Forsyth 	uchar *wp, *rp, *q, *wc;
232937da2899SCharles.Forsyth 	ushort *ws;
233037da2899SCharles.Forsyth 	ulong *wl;
233137da2899SCharles.Forsyth 	uchar sp[4];
233237da2899SCharles.Forsyth 	Rectangle r, mr;
233337da2899SCharles.Forsyth 	Memimage *mask, *src, *dst;
233437da2899SCharles.Forsyth 
233537da2899SCharles.Forsyth if(0) if(drawdebug) iprint("chardraw? mf %lux md %d sf %lux dxs %d dys %d dd %d ddat %p sdat %p\n",
233637da2899SCharles.Forsyth 		par->mask->flags, par->mask->depth, par->src->flags,
233737da2899SCharles.Forsyth 		Dx(par->src->r), Dy(par->src->r), par->dst->depth, par->dst->data, par->src->data);
233837da2899SCharles.Forsyth 
233937da2899SCharles.Forsyth 	mask = par->mask;
234037da2899SCharles.Forsyth 	src = par->src;
234137da2899SCharles.Forsyth 	dst = par->dst;
234237da2899SCharles.Forsyth 	r = par->r;
234337da2899SCharles.Forsyth 	mr = par->mr;
234437da2899SCharles.Forsyth 	op = par->op;
234537da2899SCharles.Forsyth 
234637da2899SCharles.Forsyth 	if((par->state&(Replsrc|Simplesrc|Replmask)) != (Replsrc|Simplesrc)
234737da2899SCharles.Forsyth 	|| mask->depth != 1 || src->flags&Falpha || dst->depth<8 || dst->data==src->data
234837da2899SCharles.Forsyth 	|| op != SoverD)
234937da2899SCharles.Forsyth 		return 0;
235037da2899SCharles.Forsyth 
235137da2899SCharles.Forsyth //if(drawdebug) iprint("chardraw...");
235237da2899SCharles.Forsyth 
235337da2899SCharles.Forsyth 	depth = mask->depth;
235437da2899SCharles.Forsyth 	maskwid = mask->width*sizeof(ulong);
235537da2899SCharles.Forsyth 	rp = byteaddr(mask, mr.min);
235637da2899SCharles.Forsyth 	npack = 8/depth;
235737da2899SCharles.Forsyth 	bsh = (mr.min.x % npack) * depth;
235837da2899SCharles.Forsyth 
235937da2899SCharles.Forsyth 	wp = byteaddr(dst, r.min);
236037da2899SCharles.Forsyth 	dstwid = dst->width*sizeof(ulong);
236137da2899SCharles.Forsyth DBG print("bsh %d\n", bsh);
236237da2899SCharles.Forsyth 	dy = Dy(r);
236337da2899SCharles.Forsyth 	dx = Dx(r);
236437da2899SCharles.Forsyth 
236537da2899SCharles.Forsyth 	ddepth = dst->depth;
236637da2899SCharles.Forsyth 
236737da2899SCharles.Forsyth 	/*
236837da2899SCharles.Forsyth 	 * for loop counts from bsh to bsh+dx
236937da2899SCharles.Forsyth 	 *
237037da2899SCharles.Forsyth 	 * we want the bottom bits to be the amount
237137da2899SCharles.Forsyth 	 * to shift the pixels down, so for n≡0 (mod 8) we want
237237da2899SCharles.Forsyth 	 * bottom bits 7.  for n≡1, 6, etc.
237337da2899SCharles.Forsyth 	 * the bits come from -n-1.
237437da2899SCharles.Forsyth 	 */
237537da2899SCharles.Forsyth 
237637da2899SCharles.Forsyth 	bx = -bsh-1;
237737da2899SCharles.Forsyth 	ex = -bsh-1-dx;
23786e425a9dSCharles.Forsyth 	bits = 0;
237937da2899SCharles.Forsyth 	v = par->sdval;
238037da2899SCharles.Forsyth 
238137da2899SCharles.Forsyth 	/* make little endian */
238237da2899SCharles.Forsyth 	sp[0] = v;
238337da2899SCharles.Forsyth 	sp[1] = v>>8;
238437da2899SCharles.Forsyth 	sp[2] = v>>16;
238537da2899SCharles.Forsyth 	sp[3] = v>>24;
238637da2899SCharles.Forsyth 
238737da2899SCharles.Forsyth //print("sp %x %x %x %x\n", sp[0], sp[1], sp[2], sp[3]);
238837da2899SCharles.Forsyth 	for(y=0; y<dy; y++, rp+=maskwid, wp+=dstwid){
238937da2899SCharles.Forsyth 		q = rp;
239037da2899SCharles.Forsyth 		if(bsh)
239137da2899SCharles.Forsyth 			bits = *q++;
239237da2899SCharles.Forsyth 		switch(ddepth){
239337da2899SCharles.Forsyth 		case 8:
239437da2899SCharles.Forsyth //if(drawdebug) iprint("8loop...");
239537da2899SCharles.Forsyth 			wc = wp;
239637da2899SCharles.Forsyth 			for(x=bx; x>ex; x--, wc++){
239737da2899SCharles.Forsyth 				i = x&7;
239837da2899SCharles.Forsyth 				if(i == 8-1)
239937da2899SCharles.Forsyth 					bits = *q++;
240037da2899SCharles.Forsyth DBG print("bits %lux sh %d...", bits, i);
240137da2899SCharles.Forsyth 				if((bits>>i)&1)
240237da2899SCharles.Forsyth 					*wc = v;
240337da2899SCharles.Forsyth 			}
240437da2899SCharles.Forsyth 			break;
240537da2899SCharles.Forsyth 		case 16:
240637da2899SCharles.Forsyth 			ws = (ushort*)wp;
240737da2899SCharles.Forsyth 			v = *(ushort*)sp;
240837da2899SCharles.Forsyth 			for(x=bx; x>ex; x--, ws++){
240937da2899SCharles.Forsyth 				i = x&7;
241037da2899SCharles.Forsyth 				if(i == 8-1)
241137da2899SCharles.Forsyth 					bits = *q++;
241237da2899SCharles.Forsyth DBG print("bits %lux sh %d...", bits, i);
241337da2899SCharles.Forsyth 				if((bits>>i)&1)
241437da2899SCharles.Forsyth 					*ws = v;
241537da2899SCharles.Forsyth 			}
241637da2899SCharles.Forsyth 			break;
241737da2899SCharles.Forsyth 		case 24:
241837da2899SCharles.Forsyth 			wc = wp;
241937da2899SCharles.Forsyth 			for(x=bx; x>ex; x--, wc+=3){
242037da2899SCharles.Forsyth 				i = x&7;
242137da2899SCharles.Forsyth 				if(i == 8-1)
242237da2899SCharles.Forsyth 					bits = *q++;
242337da2899SCharles.Forsyth DBG print("bits %lux sh %d...", bits, i);
242437da2899SCharles.Forsyth 				if((bits>>i)&1){
242537da2899SCharles.Forsyth 					wc[0] = sp[0];
242637da2899SCharles.Forsyth 					wc[1] = sp[1];
242737da2899SCharles.Forsyth 					wc[2] = sp[2];
242837da2899SCharles.Forsyth 				}
242937da2899SCharles.Forsyth 			}
243037da2899SCharles.Forsyth 			break;
243137da2899SCharles.Forsyth 		case 32:
243237da2899SCharles.Forsyth 			wl = (ulong*)wp;
243337da2899SCharles.Forsyth 			v = *(ulong*)sp;
243437da2899SCharles.Forsyth 			for(x=bx; x>ex; x--, wl++){
243537da2899SCharles.Forsyth 				i = x&7;
243637da2899SCharles.Forsyth 				if(i == 8-1)
243737da2899SCharles.Forsyth 					bits = *q++;
243837da2899SCharles.Forsyth DBG iprint("bits %lux sh %d...", bits, i);
243937da2899SCharles.Forsyth 				if((bits>>i)&1)
244037da2899SCharles.Forsyth 					*wl = v;
244137da2899SCharles.Forsyth 			}
244237da2899SCharles.Forsyth 			break;
244337da2899SCharles.Forsyth 		}
244437da2899SCharles.Forsyth 	}
244537da2899SCharles.Forsyth 
244637da2899SCharles.Forsyth DBG print("\n");
244737da2899SCharles.Forsyth 	return 1;
244837da2899SCharles.Forsyth }
244937da2899SCharles.Forsyth #undef DBG
245037da2899SCharles.Forsyth 
245137da2899SCharles.Forsyth 
245237da2899SCharles.Forsyth /*
245337da2899SCharles.Forsyth  * Fill entire byte with replicated (if necessary) copy of source pixel,
245437da2899SCharles.Forsyth  * assuming destination ldepth is >= source ldepth.
245537da2899SCharles.Forsyth  *
245637da2899SCharles.Forsyth  * This code is just plain wrong for >8bpp.
245737da2899SCharles.Forsyth  *
245837da2899SCharles.Forsyth ulong
245937da2899SCharles.Forsyth membyteval(Memimage *src)
246037da2899SCharles.Forsyth {
246137da2899SCharles.Forsyth 	int i, val, bpp;
246237da2899SCharles.Forsyth 	uchar uc;
246337da2899SCharles.Forsyth 
246437da2899SCharles.Forsyth 	unloadmemimage(src, src->r, &uc, 1);
246537da2899SCharles.Forsyth 	bpp = src->depth;
246637da2899SCharles.Forsyth 	uc <<= (src->r.min.x&(7/src->depth))*src->depth;
246737da2899SCharles.Forsyth 	uc &= ~(0xFF>>bpp);
2468*adad2431Sforsyth 	// pixel value is now in high part of byte. repeat throughout byte
246937da2899SCharles.Forsyth 	val = uc;
247037da2899SCharles.Forsyth 	for(i=bpp; i<8; i<<=1)
247137da2899SCharles.Forsyth 		val |= val>>i;
247237da2899SCharles.Forsyth 	return val;
247337da2899SCharles.Forsyth }
247437da2899SCharles.Forsyth  *
247537da2899SCharles.Forsyth  */
247637da2899SCharles.Forsyth 
247737da2899SCharles.Forsyth void
memfillcolor(Memimage * i,ulong val)247837da2899SCharles.Forsyth memfillcolor(Memimage *i, ulong val)
247937da2899SCharles.Forsyth {
248037da2899SCharles.Forsyth 	ulong bits;
248137da2899SCharles.Forsyth 	int d, y;
2482f8b3fca7SCharles.Forsyth 	uchar p[4];
248337da2899SCharles.Forsyth 
248437da2899SCharles.Forsyth 	if(val == DNofill)
248537da2899SCharles.Forsyth 		return;
248637da2899SCharles.Forsyth 
248737da2899SCharles.Forsyth 	bits = rgbatoimg(i, val);
248837da2899SCharles.Forsyth 	switch(i->depth){
248937da2899SCharles.Forsyth 	case 24:	/* 24-bit images suck */
249037da2899SCharles.Forsyth 		for(y=i->r.min.y; y<i->r.max.y; y++)
249137da2899SCharles.Forsyth 			memset24(byteaddr(i, Pt(i->r.min.x, y)), bits, Dx(i->r));
249237da2899SCharles.Forsyth 		break;
249337da2899SCharles.Forsyth 	default:	/* 1, 2, 4, 8, 16, 32 */
249437da2899SCharles.Forsyth 		for(d=i->depth; d<32; d*=2)
249537da2899SCharles.Forsyth 			bits = (bits << d) | bits;
2496f8b3fca7SCharles.Forsyth 		p[0] = bits;		/* make little endian */
2497f8b3fca7SCharles.Forsyth 		p[1] = bits>>8;
2498f8b3fca7SCharles.Forsyth 		p[2] = bits>>16;
2499f8b3fca7SCharles.Forsyth 		p[3] = bits>>24;
2500f8b3fca7SCharles.Forsyth 		bits = *(u32int*)p;
250137da2899SCharles.Forsyth 		memsetl(wordaddr(i, i->r.min), bits, i->width*Dy(i->r));
250237da2899SCharles.Forsyth 		break;
250337da2899SCharles.Forsyth 	}
250437da2899SCharles.Forsyth }
250537da2899SCharles.Forsyth 
2506