sparc/gen/modf.s

*54388Storek/*
*54388Storek * Copyright (c) 1992 The Regents of the University of California.
*54388Storek * All rights reserved.
*54388Storek *
*54388Storek * This software was developed by the Computer Systems Engineering group
*54388Storek * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
*54388Storek * contributed to Berkeley.
*54388Storek *
*54388Storek * %sccs.include.redist.c%
*54388Storek *
*54388Storek * from: $Header: modf.s,v 1.3 92/06/20 00:00:54 torek Exp $
*54388Storek */
*54388Storek
*54388Storek#if defined(LIBC_SCCS) && !defined(lint)
*54388Storek	.asciz "@(#)modf.s	5.1 (Berkeley) 06/25/92"
*54388Storek#endif /* LIBC_SCCS and not lint */
*54388Storek
*54388Storek#include "DEFS.h"
*54388Storek#include <machine/fsr.h>
*54388Storek
/*
 * double modf(double val, double *iptr)
 *
 * Returns the fractional part of `val', storing the integer part of
 * `val' in *iptr.  Both *iptr and the return value have the same sign
 * as `val'.
 *
 * Method:
 *
 * We use the fpu's normalization hardware to compute the integer portion
 * of the double precision argument.  Sun IEEE double precision numbers
 * have 52 bits of mantissa, 11 bits of exponent, and one bit of sign,
 * with the sign occupying bit 31 of word 0, and the exponent bits 30:20
 * of word 0.  Thus, values >= 2^52 are by definition integers.
 *
 * If we take a value that is in the range [+0..2^52) and add 2^52, all
 * of the fractional bits fall out and all of the integer bits are summed
 * with 2^52.  If we then subtract 2^52, we get those integer bits back.
 * This must be done with rounding set to `towards 0' or `towards -inf'.
 * `Toward -inf' fails when the value is 0 (we get -0 back)....
 *
 * Note that this method will work anywhere, but is machine dependent in
 * various aspects.
 *
 * Stack usage:
 *	4@[%fp - 4]	saved %fsr
 *	4@[%fp - 8]	new %fsr with rounding set to `towards 0'
 *	8@[%fp - 16]	space for moving between %i and %f registers
 * Register usage:
 *	%i0:%i1		double val;
 *	%i2		double *iptr;
 *	%l0		scratch
 *	%l1		sign bit (0x80000000)
 *	%l3		FSR_RD, the rounding direction field mask
 *	%l4		`towards 0' value for the rounding direction field
 *	%l5		current %fsr, then only its original rounding bits
 *	%l6		scratch for building %fsr values
 *	%g1		scratch for re-inserting the sign
 *	%f0:f1		return value
 *	%f2:f3		`magic number' 2^52, in fpu registers
 *	%f4:f5		double v, in fpu registers
 */
*54388Storek
*54388Storek	.align	8
*54388StorekLmagic:
*54388Storek	.word	0x43300000	! sign = 0, exponent = 52 + 1023, mantissa = 0
*54388Storek	.word	0		! (i.e., .double 0r4503599627370496e+00)
*54388Storek
*54388StorekL0:
*54388Storek	.word	0		! 0.0
*54388Storek	.word	0
*54388Storek
/*
 * double modf(double val, double *iptr)
 *
 * In:	%i0:%i1 = val, %i2 = iptr (after the save below)
 * Out:	%f0:f1 = fractional part of val, *iptr = integer part of val
 * Uses: %l0, %l1, %l3-%l6, %g1, %f0-%f5, and 16 bytes at [%fp - 16]
 */
ENTRY(modf)
	save	%sp, -64-16, %sp	! new window; 16 bytes of locals below %fp

	/*
	 * First, compute v = abs(val) by clearing sign bit,
	 * and then set up the fpu registers.  This would be
	 * much easier if we could do alu operations on fpu registers!
	 */
	sethi	%hi(0x80000000), %l1	! sign bit (sethi wants the high 22 bits)
	andn	%i0, %l1, %l0		! %l0 = word 0 of val with the sign cleared
	st	%l0, [%fp - 16]
	sethi	%hi(Lmagic), %l0
	ldd	[%l0 + %lo(Lmagic)], %f2	! %f2:f3 = 2^52
	st	%i1, [%fp - 12]
	ldd	[%fp - 16], %f4		! %f4:f5 = v

	/*
	 * Is %f4:f5 >= %f2:f3 ?  If so, it is all integer bits.
	 * It is probably less, though.
	 */
	fcmped	%f4, %f2
	nop				! fpop2 delay
	fbuge	Lbig			! if >= (or unordered), go out
	nop

	/*
	 * v < 2^52, so add 2^52, then subtract 2^52, but do it all
	 * with rounding set towards zero.  We leave any enabled
	 * traps enabled, but change the rounding mode.  This might
	 * not be so good.  Oh well....
	 *
	 * %fsr can only be moved to and from memory, hence the
	 * store/load pairs through the stack.
	 */
	st	%fsr, [%fp - 4]
	set	FSR_RD, %l3		! %l3 = rounding direction mask
	ld	[%fp - 4], %l5		! %l5 = current %fsr
	set	FSR_RD_RZ << FSR_RD_SHIFT, %l4
	andn	%l5, %l3, %l6		! %l6 = %fsr with the rounding field cleared
	or	%l6, %l4, %l6		! round towards zero, please
	and	%l5, %l3, %l5		! save original rounding mode
	st	%l6, [%fp - 8]
	ld	[%fp - 8], %fsr

	faddd	%f4, %f2, %f4		! %f4:f5 += 2^52
	fsubd	%f4, %f2, %f4		! %f4:f5 -= 2^52

	/*
	 * Restore %fsr, but leave exceptions accrued.
	 */
	st	%fsr, [%fp - 4]
	ld	[%fp - 4], %l6
	andn	%l6, %l3, %l6		! %l6 = %fsr & ~FSR_RD;
	or	%l5, %l6, %l5		! %l5 |= %l6;
	st	%l5, [%fp - 4]
	ld	[%fp - 4], %fsr		! restore %fsr, leaving accrued stuff

	/*
	 * Now insert the original sign in %f4:f5.
	 * This is a lot of work, so it is conditional here.
	 * Only word 0 (%f4) holds the sign, so only it is touched.
	 */
	btst	%l1, %i0		! was val negative?
	be	1f			! no: %f4:f5 already has the right sign
	nop
	st	%f4, [%fp - 16]
	ld	[%fp - 16], %g1
	or	%l1, %g1, %g1		! set the sign bit
	st	%g1, [%fp - 16]
	ld	[%fp - 16], %f4
1:

	/*
	 * The value in %f4:f5 is now the integer portion of the original
	 * argument.  We need to store this in *iptr (%i2), subtract it
	 * from the original value argument (%i0:i1), and return the result.
	 */
	std	%f4, [%i2]		! *iptr = %f4:f5;
	std	%i0, [%fp - 16]
	ldd	[%fp - 16], %f0		! %f0:f1 = val;
	fsubd	%f0, %f4, %f0		! %f0:f1 -= %f4:f5;
	ret
	restore

Lbig:
	/*
	 * We get here if the original comparison of %f4:f5 (v) to
	 * %f2:f3 (2^52) came out `greater, equal, or unordered'.  In
	 * this case the integer part is the original value, and the
	 * fractional part is 0.
	 *
	 * val is still only in %i0:%i1 on this path; %f0:f1 has not
	 * been loaded yet, so the store must come from the integer
	 * registers.
	 */
	sethi	%hi(L0), %l0
	std	%i0, [%i2]		! *iptr = val;
	ldd	[%l0 + %lo(L0)], %f0	! return 0.0;
	ret
	restore