libm/national/support.s

*34129Sbostic;
*34129Sbostic; Copyright (c) 1985 Regents of the University of California.
*34129Sbostic; All rights reserved.
*34129Sbostic;
*34129Sbostic; Redistribution and use in source and binary forms are permitted
*34129Sbostic; provided that this notice is preserved and that due credit is given
*34129Sbostic; to the University of California at Berkeley. The name of the University
*34129Sbostic; may not be used to endorse or promote products derived from this
*34129Sbostic; software without specific prior written permission. This software
*34129Sbostic; is provided ``as is'' without express or implied warranty.
*34129Sbostic;
*34129Sbostic; All recipients should regard themselves as participants in an ongoing
*34129Sbostic; research project and hence should feel obligated to report their
*34129Sbostic; experiences (good or bad) with these elementary function codes, using
*34129Sbostic; the sendbug(8) program, to the authors.
*34129Sbostic;
*34129Sbostic;	@(#)support.s	5.2 (Berkeley) 04/29/88
*34129Sbostic;
*34129Sbostic
26460Selefunt; IEEE recommended functions
26460Selefunt;
26460Selefunt; double copysign(x,y)
26460Selefunt; double x,y;
26460Selefunt; IEEE 754 recommended function, return x*sign(y)
26460Selefunt; Coded by K.C. Ng in National 32k assembler, 11/9/85.
26460Selefunt;
26460Selefunt; On entry: 4(sp) = x (high word at 8(sp)), 16(sp) = high word of y.
26460Selefunt; The result is returned in f0; r0 and r1 are used as scratch.
26460Selefunt; The exit label is function-specific because other routines in this
26460Selefunt; file also define a label called "end".
26460Selefunt;
26460Selefunt	.vers	2
26460Selefunt	.text
26460Selefunt	.align	2
26460Selefunt	.globl	_copysign
26460Selefunt_copysign:
26460Selefunt	movl	4(sp),f0	; f0 = x
26460Selefunt	movd	8(sp),r0	; r0 = high word of x
26460Selefunt	movd	16(sp),r1	; r1 = high word of y
26460Selefunt	xord	r0,r1		; bit 31 of r1 = sign(x) xor sign(y)
26907Selefunt	andd	0x80000000,r1	; keep only that bit
26460Selefunt	cmpqd	0,r1
26460Selefunt	beq	cpsret		; signs agree, return x unchanged
26460Selefunt	negl	f0,f0		; signs differ, return -x
26460Selefuntcpsret:	ret	0
26460Selefunt
26460Selefunt;
26460Selefunt; double logb(x)
26460Selefunt; double x;
26460Selefunt; IEEE p854 recommended function, return the exponent of x (return float(N)
26460Selefunt; such that 1 <= x*2**-N < 2, even for subnormal number.
26460Selefunt; Coded by K.C. Ng in National 32k assembler, 11/9/85.
26460Selefunt; Note: subnormal number (if implemented) will be taken care of.
26460Selefunt;
26460Selefunt; On entry: 4(sp) = x (high word at 8(sp)).  Result is returned in f0;
26460Selefunt; r0, r1 and r2 are used as scratch.  The constant L64 (2**64) is the
26460Selefunt; one defined after the drem routine in this file.
26460Selefunt; Labels are function-specific because L1, L2, L3 and L5 are also
26460Selefunt; defined by other routines in this file.
26460Selefunt;
26460Selefunt	.vers	2
26460Selefunt	.text
26460Selefunt	.align	2
26460Selefunt	.globl	_logb
26460Selefunt_logb:
26460Selefunt;
26460Selefunt; extract the exponent of x
26460Selefunt; glossaries:	r0 = high part of x
26460Selefunt;		r1 = unbias exponent of x
26460Selefunt;		r2 = 20 (first exponent bit position)
26460Selefunt;
26460Selefunt	movd	8(sp),r0
26460Selefunt	movd	20,r2
26460Selefunt	extd	r2,r0,r1,11	; extract the exponent of x
26460Selefunt	cmpqd	0,r1		; if exponent bits = 0, goto logbsub
26460Selefunt	beq	logbsub
26460Selefunt	cmpd	0x7ff,r1
26460Selefunt	beq	logbinf		; if exponent bits = 0x7ff, goto logbinf
26460Selefuntlogbnrm:	subd	1023,r1		; unbias the exponent
26460Selefunt	movdl	r1,f0		; convert the exponent to floating value
26460Selefunt	ret	0
26460Selefunt;
26460Selefunt; x is INF or NaN, simply return x
26460Selefunt; NOTE(review): -INF is returned unchanged (as -INF) by this path;
26460Selefunt; confirm whether +INF is the intended result for that input.
26460Selefunt;
26460Selefuntlogbinf:
26460Selefunt	movl	4(sp),f0	; logb(+inf)=+inf, logb(NaN)=NaN
26460Selefunt	ret	0
26460Selefunt;
26460Selefunt; x is 0 or subnormal
26460Selefunt;
26460Selefuntlogbsub:
26460Selefunt	movl	4(sp),f0
26460Selefunt	cmpl	0f0,f0
26460Selefunt	beq	logbzer		; x is 0 , goto logbzer (return -inf)
26460Selefunt;
26460Selefunt; Now x is subnormal
26460Selefunt;
26460Selefunt	mull	L64,f0		; scale up f0 with 2**64
26460Selefunt	movl	f0,tos
26460Selefunt	movd	tos,r0		; first pop is the low part (discarded)
26460Selefunt	movd	tos,r0		; now r0 = new high part of x
26460Selefunt	extd	r2,r0,r1,11	; extract the exponent of x to r1
26460Selefunt	subd	1087,r1		; unbias the exponent with correction (1023+64)
26460Selefunt	movdl	r1,f0		; convert the exponent to floating value
26460Selefunt	ret	0
26460Selefunt;
26460Selefunt; x is 0, return logb(0)= -INF
26460Selefunt;
26460Selefuntlogbzer:
26460Selefunt	movl	0f1.0e300,f0
26460Selefunt	mull	0f-1.0e300,f0	; multiply two big numbers to get -INF
26460Selefunt	ret	0
26460Selefunt;
26460Selefunt; double rint(x)
26460Selefunt; double x;
26460Selefunt; ... delivers integer nearest x in direction of prevailing rounding
26460Selefunt; ... mode
26460Selefunt; Coded by K.C. Ng in National 32k assembler, 11/9/85.
26460Selefunt; Note: subnormal number (if implemented) will be taken care of.
26460Selefunt;
26460Selefunt; Method: if the biased exponent of x is >= 0x433 (|x| >= 2**52, INF or
26460Selefunt; NaN) x is returned as is; otherwise the result is (x + s) - s with
26460Selefunt; s = copysign(2**52,x).
26460Selefunt; On entry: 4(sp) = x (high word at 8(sp)).  Result is returned in f0;
26460Selefunt; r0, r1, r2 and f2 are used as scratch.
26460Selefunt;
26460Selefunt	.vers	2
26460Selefunt	.text
26460Selefunt	.align	2
26460Selefunt	.globl	_rint
26460Selefunt_rint:
26460Selefunt;
26460Selefunt	movl	4(sp),f0	; f0 = x, needed by both return paths
26460Selefunt	movd	8(sp),r0	; r0 = high part of x
26460Selefunt	movd	20,r2
26460Selefunt	extd	r2,r0,r1,11	; extract the exponent of x
26460Selefunt	cmpd	0x433,r1
26460Selefunt	ble	itself		; exponent >= 0x433: return x itself
26460Selefunt	movl	L52,f2		; f2 = L = 2**52
26460Selefunt	cmpqd	0,r0
26460Selefunt	ble	rintadd		; sign bit of x is clear, keep s = +L
26460Selefunt	negl	f2,f2		; f2 = s = copysign(L,x)
26460Selefuntrintadd:	addl	f2,f0		; f0 = x + s
26460Selefunt	subl	f2,f0		; f0 = f0 - s
26460Selefunt	ret	0
26460Selefuntitself:	ret	0		; f0 already holds x
26460SelefuntL52:	.double	0x0,0x43300000	; L52=2**52
26460Selefunt;
26460Selefunt; int finite(x)
26460Selefunt; double x;
26460Selefunt; IEEE 754 recommended function, return 0 if x is NaN or INF, else 1
26460Selefunt; Coded by K.C. Ng in National 32k assembler, 11/9/85.
26460Selefunt;
26460Selefunt; On entry: 4(sp) = x (high word, holding sign and exponent, at 8(sp)).
26460Selefunt; Result is returned in r0; r1 is used as scratch.
26460Selefunt;
26460Selefunt	.vers	2
26460Selefunt	.text
26460Selefunt	.align	2
26460Selefunt	.globl	_finite
26460Selefunt_finite:
26460Selefunt	movd	8(sp),r1	; r1 = high part of x
26460Selefunt	andd	0x7ff00000,r1	; keep only the 11 exponent bits
26460Selefunt	cmpd	0x7ff00000,r1
26460Selefunt	sned	r0		; r0=0 if exponent(x) = 0x7ff, else r0=1
26460Selefunt	ret	0
26460Selefunt;
26460Selefunt; double scalb(x,N)
26460Selefunt; double x; int N;
26460Selefunt; IEEE 754 recommended function, return x*2**N by adjusting
26460Selefunt; exponent of x.
26460Selefunt; Coded by K.C. Ng in National 32k assembler, 11/9/85.
26460Selefunt; Note: subnormal number (if implemented) will be taken care of
26460Selefunt;
26460Selefunt; On entry: 4(sp) = x (high word at 8(sp)), 12(sp) = N.
26460Selefunt; Result is returned in f0; r0, r1 and r2 are used as scratch.
26460Selefunt; For subnormal x the argument slot at 4(sp) is overwritten with
26460Selefunt; x*2**64 so that the later "movd 8(sp),tos" picks up the low word
26460Selefunt; that matches the high word held in r0.
26460Selefunt;
26460Selefunt	.vers	2
26460Selefunt	.text
26460Selefunt	.align	2
26460Selefunt	.globl	_scalb
26460Selefunt_scalb:
26460Selefunt;
26460Selefunt; if x=0 return 0
26460Selefunt;
26460Selefunt	movl	4(sp),f0
26460Selefunt	cmpl	0f0,f0
26460Selefunt	beq	scbret		; scalb(0,N) is x itself
26460Selefunt;
26460Selefunt; extract the exponent of x
26460Selefunt; glossaries:	r0 = high part of x,
26460Selefunt;		r1 = unbias exponent of x,
26460Selefunt;		r2 = 20 (first exponent bit position).
26460Selefunt;
26460Selefunt	movd	8(sp),r0	; r0 = high part of x
26460Selefunt	movd	20,r2		; r2 = 20
26460Selefunt	extd	r2,r0,r1,11	; extract the exponent of x in r1
26460Selefunt	cmpd	0x7ff,r1
26460Selefunt;
26460Selefunt; if exponent of x is 0x7ff, then x is NaN or INF; simply return x
26460Selefunt;
26460Selefunt	beq	scbret
26460Selefunt	cmpqd	0,r1
26460Selefunt;
26460Selefunt; if exponent of x is zero, then x is subnormal; goto L19
26460Selefunt;
26460Selefunt	beq	L19
26460Selefunt	addd	12(sp),r1	; r1 = (exponent of x) + N
26460Selefunt	bfs	inof		; if integer overflows, goto inof
26460Selefunt	cmpqd	0,r1		; if new exponent <= 0, goto underflow
26460Selefunt	bge	underflow
26460Selefunt	cmpd	2047,r1		; if new exponent >= 2047 goto overflow
26460Selefunt	ble	overflow
26460Selefunt	insd	r2,r1,r0,11	; insert the new exponent
26460Selefunt	movd	r0,tos		; push the new high part
26460Selefunt	movd	8(sp),tos	; push the low part (old 4(sp) after the push)
26460Selefunt	movl	tos,f0		; return x*2**N
26460Selefuntscbret:	ret	0
26460Selefuntinof:	bcs	underflow	; negative int overflow if Carry bit is set
26460Selefuntoverflow:
26460Selefunt	andd	0x80000000,r0	; keep the sign of x
26460Selefunt	ord	0x7fe00000,r0	; set x to a huge number
26460Selefunt	movd	r0,tos
26460Selefunt	movqd	0,tos
26460Selefunt	movl	tos,f0
26460Selefunt	mull	0f1.0e300,f0	; multiply two huge number to get overflow
26460Selefunt	ret	0
26460Selefuntunderflow:
26460Selefunt	addd	64,r1		; add 64 to exponent to see if it is subnormal
26460Selefunt	cmpqd	0,r1
26460Selefunt	bge	zero		; underflow to zero
26460Selefunt	insd	r2,r1,r0,11	; insert the new exponent
26460Selefunt	movd	r0,tos
26460Selefunt	movd	8(sp),tos
26460Selefunt	movl	tos,f0
26460Selefunt	mull	L30,f0		; readjust x by multiply it with 2**-64
26460Selefunt	ret	0
26460Selefuntzero:	andd	0x80000000,r0	; keep the sign of x
26460Selefunt	ord	0x00100000,r0	; set x to a tiny number
26460Selefunt	movd	r0,tos
26460Selefunt	movqd	0,tos
26460Selefunt	movl	tos,f0
26460Selefunt	mull	0f1.0e-300,f0	; underflow to 0 by multiplying two tiny nos.
26460Selefunt	ret	0
26460SelefuntL19:		; subnormal number
26460Selefunt	mull	L32,f0		; scale up x by 2**64
26460Selefunt	movl	f0,4(sp)	; keep the scaled x (both words) in the arg slot
26460Selefunt	movd	8(sp),r0	; get the high part of new x
26460Selefunt	extd	r2,r0,r1,11	; extract the exponent of x in r1
26460Selefunt	subd	64,r1		; adjust it by subtracting 64 (cannot overflow)
26460Selefunt	addd	12(sp),r1	; exponent of x + N
26460Selefunt	bfs	scbovf		; if integer overflows, goto scbovf
26460Selefunt	cmpqd	0,r1
26460Selefunt	bge	underflow
26460Selefunt	cmpd	2047,r1
26460Selefunt	ble	overflow
26460Selefunt	insd	r2,r1,r0,11	; insert back the incremented exponent
26460Selefunt	movd	r0,tos
26460Selefunt	movd	8(sp),tos	; low part of the scaled x
26460Selefunt	movl	tos,f0
26460Selefunt	ret	0
26460Selefuntscbovf:	bcs	zero		; Carry set: sum wrapped below INT_MIN, result is 0
26460Selefunt	jump	overflow	; otherwise the sum wrapped above INT_MAX
26460SelefuntL30:	.double	0x0,0x3bf00000	; floating point 2**-64
26460SelefuntL32:	.double	0x0,0x43f00000	; floating point 2**64
31848Szliu;
31848Szliu; double drem(x,y)
31848Szliu; double x,y;
31848Szliu; IEEE double remainder function, return x-n*y, where n=x/y rounded to
31848Szliu; nearest integer (half way case goes to even). Result exact.
31848Szliu; Coded by K.C. Ng in National 32k assembly, 11/19/85.
31848Szliu;
31848Szliu; Result is returned in f0.  r3-r7 are saved/restored by enter/exit and
31848Szliu; f4/f6 are saved on the stack, so every exit must go through dremend.
31848Szliu; Labels that clash with other routines in this file (end, L1, L2, L3,
31848Szliu; L5) carry function-specific names here.  L64 is also used by logb.
31848Szliu;
31848Szliu	.vers	2
31848Szliu	.text
31848Szliu	.align	2
31848Szliu	.globl	_drem
31848Szliu_drem:
31848Szliu;
31848Szliu; glossaries:
31848Szliu;		r2 = high part of x
31848Szliu;		r3 = exponent of x
31848Szliu;		r4 = high part of y
31848Szliu;		r5 = exponent of y
31848Szliu;		r6 = sign of x
31848Szliu;		r7 = constant 0x7ff00000
31848Szliu;
31848Szliu;  16(fp) : y
31848Szliu;   8(fp) : x
31848Szliu; -12(fp) : adjustment on y when y is subnormal
31848Szliu; -16(fp) : fsr
31848Szliu; -20(fp) : nx
31848Szliu; -28(fp) : t
31848Szliu; -36(fp) : t1
31848Szliu; -40(fp) : nf
31848Szliu;
31848Szliu;
31848Szliu	enter	[r3,r4,r5,r6,r7],40
31848Szliu	movl	f6,tos		; save f6 and f4, restored at dremend
31848Szliu	movl	f4,tos
31848Szliu	movl	0f0,-12(fp)
31848Szliu	movd	0,-20(fp)
31848Szliu	movd	0,-40(fp)
31848Szliu	movd	0x7ff00000,r7	; initialize r7=0x7ff00000
31848Szliu	movd	12(fp),r2	; r2 = high(x)
31848Szliu	movd	r2,r3
31848Szliu	andd	r7,r3		; r3 = xexp
31848Szliu	cmpd	r7,r3
31848Szliu; if x is NaN or INF goto dremxnf
31848Szliu	beq	dremxnf
31848Szliu	movd	20(fp),r4
31848Szliu	bicd	[31],r4		; r4 = high part of |y|
31848Szliu	movd	r4,20(fp)	; y = |y|
31848Szliu	movd	r4,r5
31848Szliu	andd	r7,r5		; r5 = yexp
31848Szliu	cmpd	r7,r5
31848Szliu	beq	dremynf		; if y is NaN or INF goto dremynf
31848Szliu	cmpd	0x04000000,r5	;
31848Szliu	bgt	dremysm		; if y is tiny goto dremysm
31848Szliu;
31848Szliu; now y != 0 , x is finite
31848Szliu;
31848SzliuL10:
31848Szliu	movd	r2,r6
31848Szliu	andd	0x80000000,r6	; r6 = sign(x)
31848Szliu	bicd	[31],r2		; x <- |x|
31848Szliu	sfsr	r1
31848Szliu	movd	r1,-16(fp)	; save fsr in -16(fp)
31848Szliu	bicd	[5],r1
31848Szliu	lfsr	r1		; disable inexact interrupt
31848Szliu	movd	16(fp),r0	; r0 = low part of y
31848Szliu	movd	r0,r1		; r1 = r0 = low part of y
31848Szliu	andd	0xf8000000,r1	; mask off the lsb 27 bits of y
31848Szliu
31848Szliu	movd	r2,12(fp)	; update x to |x|
31848Szliu	movd	r0,-28(fp)	;
31848Szliu	movd	r4,-24(fp)	; t  = y
31848Szliu	movd	r4,-32(fp)	;
31848Szliu	movd	r1,-36(fp)	; t1 = y with trailing 27 zeros
31848Szliu	movd	0x01900000,r1	; r1 = 25 in exponent field
31848Szliu	movqd	0,r0		; n = 0 until a quotient has been computed
31848SzliuLOOP:
31848Szliu	movl	8(fp),f0	; f0 = x
31848Szliu	movl	16(fp),f2	; f2 = y
31848Szliu	cmpl	f0,f2
31848Szliu	ble	fnad		; goto fnad (final adjustment) if x <= y
31848Szliu	movd	r4,-32(fp)
31848Szliu	movd	r3,r0
31848Szliu	subd	r5,r0		; xexp - yexp
31848Szliu	subd	r1,r0		; r0 = xexp - yexp - m25
31848Szliu	cmpqd	0,r0		; r0 > 0 ?
31848Szliu	bge	1f
31848Szliu	addd	r4,r0		; scale up (high) y
31848Szliu	movd	r0,-24(fp)	; scale up t
31848Szliu	movl	-28(fp),f2	; t
31848Szliu	movd	r0,-32(fp)	; scale up t1
31848Szliu1:
31848Szliu	movl	-36(fp),f4	; t1
31848Szliu	movl	f0,f6
31848Szliu	divl	f2,f6		; f6 = x/t
31848Szliu	floorld	f6,r0		; r0 = [x/t]
31848Szliu	movdl	r0,f6		; f6 = n
31848Szliu	subl	f4,f2		; t = t - t1 (tail of t1)
31848Szliu	mull	f6,f4		; f4 = n*t1	...exact
31848Szliu	subl	f4,f0		; x = x - n*t1
31848Szliu	mull	f6,f2		; n*(t-t1)	...exact
31848Szliu	subl	f2,f0		; x = x - n*(t-t1)
31848Szliu; update xexp
31848Szliu	movl	f0,8(fp)
31848Szliu	movd	12(fp),r3
31848Szliu	andd	r7,r3
31848Szliu	jump	LOOP
31848Szliufnad:
31848Szliu	cmpqd	0,-20(fp)	; 0 = nx?
31848Szliu	beq	final
31848Szliu	mull	-12(fp),8(fp)	; scale up x the same amount as y
31848Szliu	movd	0,-20(fp)
31848Szliu	movd	12(fp),r2
31848Szliu	movd	r2,r3
31848Szliu	andd	r7,r3		; update exponent of x
31848Szliu	movqd	0,r0		; quotient so far is scaled by a power of 2: even
31848Szliu	jump	LOOP
31848Szliu
31848Szliufinal:
31848Szliu	movl	16(fp),f2	; f2 = y (f0=x, r0=n)
31848Szliu	subd	0x100000,r4	; high y /2
31848Szliu	movd	r4,-24(fp)
31848Szliu	movl	-28(fp),f4	; f4 = y/2
31848Szliu	cmpl	f0,f4		; x > y/2 ?
31848Szliu	bgt	1f
31848Szliu	bne	2f
31848Szliu	andd	1,r0		; n is odd or even
31848Szliu	cmpqd	0,r0
31848Szliu	beq	2f
31848Szliu1:
31848Szliu	subl	f2,f0		; x = x - y
31848Szliu2:
31848Szliu	cmpqd	0,-40(fp)
31848Szliu	beq	3f
31848Szliu	divl	-12(fp),f0	; scale down the answer
31848Szliu3:
31848Szliu	movl	f0,tos		; low word at 0(sp), high word at 4(sp)
31848Szliu	xord	r6,4(sp)	; apply sign(x) to the high word of the result
31848Szliu	movl	tos,f0
31848Szliu	movd	-16(fp),r0
31848Szliu	lfsr	r0		; restore the fsr
31848Szliu
31848Szliudremend:	movl	tos,f4		; common exit: restore f4, f6 and the frame
31848Szliu	movl	tos,f6
31848Szliu	exit	[r3,r4,r5,r6,r7]
31848Szliu	ret	0
31848Szliu;
31848Szliu; y is NaN or INF
31848Szliu;
31848Szliudremynf:
31848Szliu	movd	16(fp),r0	; r0 = low part of y
31848Szliu	andd	0xfffff,r4	; r4 = high part of y & 0x000fffff
31848Szliu	ord	r4,r0
31848Szliu	cmpqd	0,r0
31848Szliu	beq	L4
31848Szliu	movl	16(fp),f0	; y is NaN, return y
31848Szliu	jump	dremend
31848SzliuL4:	movl	8(fp),f0	; y is inf, return x
31848Szliu	jump	dremend
31848Szliu;
31848Szliu; exponent of y is less than 64, y may be zero or subnormal
31848Szliu;
31848Szliudremysm:
31848Szliu	movl	16(fp),f0
31848Szliu	cmpl	0f0,f0
31848Szliu	bne	dremysb
31848Szliu	divl	f0,f0		; y is 0, return NaN by doing 0/0
31848Szliu	jump	dremend
31848Szliu;
31848Szliu; subnormal y or tiny y
31848Szliu;
31848Szliudremysb:
31848Szliu	movd	0x04000000,-20(fp)	; nx = 64 in exponent field
31848Szliu	movl	L64,f2
31848Szliu	movl	f2,-12(fp)
31848Szliu	mull	f2,f0
31848Szliu	cmpl	f0,LTINY
31848Szliu	bgt	L6
31848Szliu	mull	f2,f0
31848Szliu	addd	0x04000000,-20(fp)	; nx = nx + 64 in exponent field
31848Szliu	mull	f2,-12(fp)
31848SzliuL6:
31848Szliu	movd	-20(fp),-40(fp)
31848Szliu	movl	f0,16(fp)
31848Szliu	movd	20(fp),r4
31848Szliu	movd	r4,r5
31848Szliu	andd	r7,r5		; exponent of new y
31848Szliu	jump	L10
31848Szliu;
31848Szliu; x is NaN or INF, return x-x
31848Szliu;
31848Szliudremxnf:
31848Szliu	movl	8(fp),f0
31848Szliu	subl	f0,f0		; if x is INF, then INF-INF is NaN
31848Szliu	jump	dremend		; must unwind f4/f6 and the enter frame
31848SzliuL64:	.double 0x0,0x43f00000	; L64 = 2**64
31848SzliuLTINY:	.double 0x0,0x04000000	; LTINY = 2**-959