17e76048aSMarcel Moolenaar /* $NetBSD: fpu_subr.c,v 1.4 2005/12/11 12:18:42 christos Exp $ */
27e76048aSMarcel Moolenaar
37e76048aSMarcel Moolenaar /*
4*51369649SPedro F. Giffuni * SPDX-License-Identifier: BSD-3-Clause
5*51369649SPedro F. Giffuni *
67e76048aSMarcel Moolenaar * Copyright (c) 1992, 1993
77e76048aSMarcel Moolenaar * The Regents of the University of California. All rights reserved.
87e76048aSMarcel Moolenaar *
97e76048aSMarcel Moolenaar * This software was developed by the Computer Systems Engineering group
107e76048aSMarcel Moolenaar * at Lawrence Berkeley Laboratory under DARPA contract BG 91-66 and
117e76048aSMarcel Moolenaar * contributed to Berkeley.
127e76048aSMarcel Moolenaar *
137e76048aSMarcel Moolenaar * All advertising materials mentioning features or use of this software
147e76048aSMarcel Moolenaar * must display the following acknowledgement:
157e76048aSMarcel Moolenaar * This product includes software developed by the University of
167e76048aSMarcel Moolenaar * California, Lawrence Berkeley Laboratory.
177e76048aSMarcel Moolenaar *
187e76048aSMarcel Moolenaar * Redistribution and use in source and binary forms, with or without
197e76048aSMarcel Moolenaar * modification, are permitted provided that the following conditions
207e76048aSMarcel Moolenaar * are met:
217e76048aSMarcel Moolenaar * 1. Redistributions of source code must retain the above copyright
227e76048aSMarcel Moolenaar * notice, this list of conditions and the following disclaimer.
237e76048aSMarcel Moolenaar * 2. Redistributions in binary form must reproduce the above copyright
247e76048aSMarcel Moolenaar * notice, this list of conditions and the following disclaimer in the
257e76048aSMarcel Moolenaar * documentation and/or other materials provided with the distribution.
267e76048aSMarcel Moolenaar * 3. Neither the name of the University nor the names of its contributors
277e76048aSMarcel Moolenaar * may be used to endorse or promote products derived from this software
287e76048aSMarcel Moolenaar * without specific prior written permission.
297e76048aSMarcel Moolenaar *
307e76048aSMarcel Moolenaar * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
317e76048aSMarcel Moolenaar * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
327e76048aSMarcel Moolenaar * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
337e76048aSMarcel Moolenaar * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
347e76048aSMarcel Moolenaar * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
357e76048aSMarcel Moolenaar * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
367e76048aSMarcel Moolenaar * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
377e76048aSMarcel Moolenaar * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
387e76048aSMarcel Moolenaar * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
397e76048aSMarcel Moolenaar * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
407e76048aSMarcel Moolenaar * SUCH DAMAGE.
417e76048aSMarcel Moolenaar */
427e76048aSMarcel Moolenaar
437e76048aSMarcel Moolenaar /*
447e76048aSMarcel Moolenaar * FPU subroutines.
457e76048aSMarcel Moolenaar */
467e76048aSMarcel Moolenaar
477e76048aSMarcel Moolenaar #include <sys/types.h>
482aa95aceSPeter Grehan #include <sys/systm.h>
497e76048aSMarcel Moolenaar
507e76048aSMarcel Moolenaar #include <machine/fpu.h>
517e76048aSMarcel Moolenaar
527e76048aSMarcel Moolenaar #include <powerpc/fpu/fpu_arith.h>
537e76048aSMarcel Moolenaar #include <powerpc/fpu/fpu_emu.h>
547e76048aSMarcel Moolenaar
557e76048aSMarcel Moolenaar /*
567e76048aSMarcel Moolenaar * Shift the given number right rsh bits. Any bits that `fall off' will get
577e76048aSMarcel Moolenaar * shoved into the sticky field; we return the resulting sticky. Note that
587e76048aSMarcel Moolenaar * shifting NaNs is legal (this will never shift all bits out); a NaN's
597e76048aSMarcel Moolenaar * sticky field is ignored anyway.
607e76048aSMarcel Moolenaar */
617e76048aSMarcel Moolenaar int
fpu_shr(struct fpn * fp,int rsh)627e76048aSMarcel Moolenaar fpu_shr(struct fpn *fp, int rsh)
637e76048aSMarcel Moolenaar {
647e76048aSMarcel Moolenaar u_int m0, m1, m2, m3, s;
657e76048aSMarcel Moolenaar int lsh;
667e76048aSMarcel Moolenaar
677e76048aSMarcel Moolenaar #ifdef DIAGNOSTIC
687e76048aSMarcel Moolenaar if (rsh <= 0 || (fp->fp_class != FPC_NUM && !ISNAN(fp)))
697e76048aSMarcel Moolenaar panic("fpu_rightshift 1");
707e76048aSMarcel Moolenaar #endif
717e76048aSMarcel Moolenaar
727e76048aSMarcel Moolenaar m0 = fp->fp_mant[0];
737e76048aSMarcel Moolenaar m1 = fp->fp_mant[1];
747e76048aSMarcel Moolenaar m2 = fp->fp_mant[2];
757e76048aSMarcel Moolenaar m3 = fp->fp_mant[3];
767e76048aSMarcel Moolenaar
777e76048aSMarcel Moolenaar /* If shifting all the bits out, take a shortcut. */
787e76048aSMarcel Moolenaar if (rsh >= FP_NMANT) {
797e76048aSMarcel Moolenaar #ifdef DIAGNOSTIC
807e76048aSMarcel Moolenaar if ((m0 | m1 | m2 | m3) == 0)
817e76048aSMarcel Moolenaar panic("fpu_rightshift 2");
827e76048aSMarcel Moolenaar #endif
837e76048aSMarcel Moolenaar fp->fp_mant[0] = 0;
847e76048aSMarcel Moolenaar fp->fp_mant[1] = 0;
857e76048aSMarcel Moolenaar fp->fp_mant[2] = 0;
867e76048aSMarcel Moolenaar fp->fp_mant[3] = 0;
877e76048aSMarcel Moolenaar #ifdef notdef
887e76048aSMarcel Moolenaar if ((m0 | m1 | m2 | m3) == 0)
897e76048aSMarcel Moolenaar fp->fp_class = FPC_ZERO;
907e76048aSMarcel Moolenaar else
917e76048aSMarcel Moolenaar #endif
927e76048aSMarcel Moolenaar fp->fp_sticky = 1;
937e76048aSMarcel Moolenaar return (1);
947e76048aSMarcel Moolenaar }
957e76048aSMarcel Moolenaar
967e76048aSMarcel Moolenaar /* Squish out full words. */
977e76048aSMarcel Moolenaar s = fp->fp_sticky;
987e76048aSMarcel Moolenaar if (rsh >= 32 * 3) {
997e76048aSMarcel Moolenaar s |= m3 | m2 | m1;
1007e76048aSMarcel Moolenaar m3 = m0, m2 = 0, m1 = 0, m0 = 0;
1017e76048aSMarcel Moolenaar } else if (rsh >= 32 * 2) {
1027e76048aSMarcel Moolenaar s |= m3 | m2;
1037e76048aSMarcel Moolenaar m3 = m1, m2 = m0, m1 = 0, m0 = 0;
1047e76048aSMarcel Moolenaar } else if (rsh >= 32) {
1057e76048aSMarcel Moolenaar s |= m3;
1067e76048aSMarcel Moolenaar m3 = m2, m2 = m1, m1 = m0, m0 = 0;
1077e76048aSMarcel Moolenaar }
1087e76048aSMarcel Moolenaar
1097e76048aSMarcel Moolenaar /* Handle any remaining partial word. */
1107e76048aSMarcel Moolenaar if ((rsh &= 31) != 0) {
1117e76048aSMarcel Moolenaar lsh = 32 - rsh;
1127e76048aSMarcel Moolenaar s |= m3 << lsh;
1137e76048aSMarcel Moolenaar m3 = (m3 >> rsh) | (m2 << lsh);
1147e76048aSMarcel Moolenaar m2 = (m2 >> rsh) | (m1 << lsh);
1157e76048aSMarcel Moolenaar m1 = (m1 >> rsh) | (m0 << lsh);
1167e76048aSMarcel Moolenaar m0 >>= rsh;
1177e76048aSMarcel Moolenaar }
1187e76048aSMarcel Moolenaar fp->fp_mant[0] = m0;
1197e76048aSMarcel Moolenaar fp->fp_mant[1] = m1;
1207e76048aSMarcel Moolenaar fp->fp_mant[2] = m2;
1217e76048aSMarcel Moolenaar fp->fp_mant[3] = m3;
1227e76048aSMarcel Moolenaar fp->fp_sticky = s;
1237e76048aSMarcel Moolenaar return (s);
1247e76048aSMarcel Moolenaar }
1257e76048aSMarcel Moolenaar
1267e76048aSMarcel Moolenaar /*
1277e76048aSMarcel Moolenaar * Force a number to be normal, i.e., make its fraction have all zero
1287e76048aSMarcel Moolenaar * bits before FP_1, then FP_1, then all 1 bits. This is used for denorms
1297e76048aSMarcel Moolenaar * and (sometimes) for intermediate results.
1307e76048aSMarcel Moolenaar *
1317e76048aSMarcel Moolenaar * Internally, this may use a `supernormal' -- a number whose fp_mant
1327e76048aSMarcel Moolenaar * is greater than or equal to 2.0 -- so as a side effect you can hand it
1337e76048aSMarcel Moolenaar * a supernormal and it will fix it (provided fp->fp_mant[3] == 0).
1347e76048aSMarcel Moolenaar */
1357e76048aSMarcel Moolenaar void
fpu_norm(struct fpn * fp)1367e76048aSMarcel Moolenaar fpu_norm(struct fpn *fp)
1377e76048aSMarcel Moolenaar {
1387e76048aSMarcel Moolenaar u_int m0, m1, m2, m3, top, sup, nrm;
1397e76048aSMarcel Moolenaar int lsh, rsh, exp;
1407e76048aSMarcel Moolenaar
1417e76048aSMarcel Moolenaar exp = fp->fp_exp;
1427e76048aSMarcel Moolenaar m0 = fp->fp_mant[0];
1437e76048aSMarcel Moolenaar m1 = fp->fp_mant[1];
1447e76048aSMarcel Moolenaar m2 = fp->fp_mant[2];
1457e76048aSMarcel Moolenaar m3 = fp->fp_mant[3];
1467e76048aSMarcel Moolenaar
1477e76048aSMarcel Moolenaar /* Handle severe subnormals with 32-bit moves. */
1487e76048aSMarcel Moolenaar if (m0 == 0) {
1497e76048aSMarcel Moolenaar if (m1)
1507e76048aSMarcel Moolenaar m0 = m1, m1 = m2, m2 = m3, m3 = 0, exp -= 32;
1517e76048aSMarcel Moolenaar else if (m2)
1527e76048aSMarcel Moolenaar m0 = m2, m1 = m3, m2 = 0, m3 = 0, exp -= 2 * 32;
1537e76048aSMarcel Moolenaar else if (m3)
1547e76048aSMarcel Moolenaar m0 = m3, m1 = 0, m2 = 0, m3 = 0, exp -= 3 * 32;
1557e76048aSMarcel Moolenaar else {
1567e76048aSMarcel Moolenaar fp->fp_class = FPC_ZERO;
1577e76048aSMarcel Moolenaar return;
1587e76048aSMarcel Moolenaar }
1597e76048aSMarcel Moolenaar }
1607e76048aSMarcel Moolenaar
1617e76048aSMarcel Moolenaar /* Now fix any supernormal or remaining subnormal. */
1627e76048aSMarcel Moolenaar nrm = FP_1;
1637e76048aSMarcel Moolenaar sup = nrm << 1;
1647e76048aSMarcel Moolenaar if (m0 >= sup) {
1657e76048aSMarcel Moolenaar /*
1667e76048aSMarcel Moolenaar * We have a supernormal number. We need to shift it right.
1677e76048aSMarcel Moolenaar * We may assume m3==0.
1687e76048aSMarcel Moolenaar */
1697e76048aSMarcel Moolenaar for (rsh = 1, top = m0 >> 1; top >= sup; rsh++) /* XXX slow */
1707e76048aSMarcel Moolenaar top >>= 1;
1717e76048aSMarcel Moolenaar exp += rsh;
1727e76048aSMarcel Moolenaar lsh = 32 - rsh;
1737e76048aSMarcel Moolenaar m3 = m2 << lsh;
1747e76048aSMarcel Moolenaar m2 = (m2 >> rsh) | (m1 << lsh);
1757e76048aSMarcel Moolenaar m1 = (m1 >> rsh) | (m0 << lsh);
1767e76048aSMarcel Moolenaar m0 = top;
1777e76048aSMarcel Moolenaar } else if (m0 < nrm) {
1787e76048aSMarcel Moolenaar /*
1797e76048aSMarcel Moolenaar * We have a regular denorm (a subnormal number), and need
1807e76048aSMarcel Moolenaar * to shift it left.
1817e76048aSMarcel Moolenaar */
1827e76048aSMarcel Moolenaar for (lsh = 1, top = m0 << 1; top < nrm; lsh++) /* XXX slow */
1837e76048aSMarcel Moolenaar top <<= 1;
1847e76048aSMarcel Moolenaar exp -= lsh;
1857e76048aSMarcel Moolenaar rsh = 32 - lsh;
1867e76048aSMarcel Moolenaar m0 = top | (m1 >> rsh);
1877e76048aSMarcel Moolenaar m1 = (m1 << lsh) | (m2 >> rsh);
1887e76048aSMarcel Moolenaar m2 = (m2 << lsh) | (m3 >> rsh);
1897e76048aSMarcel Moolenaar m3 <<= lsh;
1907e76048aSMarcel Moolenaar }
1917e76048aSMarcel Moolenaar
1927e76048aSMarcel Moolenaar fp->fp_exp = exp;
1937e76048aSMarcel Moolenaar fp->fp_mant[0] = m0;
1947e76048aSMarcel Moolenaar fp->fp_mant[1] = m1;
1957e76048aSMarcel Moolenaar fp->fp_mant[2] = m2;
1967e76048aSMarcel Moolenaar fp->fp_mant[3] = m3;
1977e76048aSMarcel Moolenaar }
1987e76048aSMarcel Moolenaar
1997e76048aSMarcel Moolenaar /*
2007e76048aSMarcel Moolenaar * Concoct a `fresh' Quiet NaN per Appendix N.
2017e76048aSMarcel Moolenaar * As a side effect, we set NV (invalid) for the current exceptions.
2027e76048aSMarcel Moolenaar */
2037e76048aSMarcel Moolenaar struct fpn *
fpu_newnan(struct fpemu * fe)2047e76048aSMarcel Moolenaar fpu_newnan(struct fpemu *fe)
2057e76048aSMarcel Moolenaar {
2067e76048aSMarcel Moolenaar struct fpn *fp;
2077e76048aSMarcel Moolenaar
2087e76048aSMarcel Moolenaar fe->fe_cx |= FPSCR_VXSNAN;
2097e76048aSMarcel Moolenaar fp = &fe->fe_f3;
2107e76048aSMarcel Moolenaar fp->fp_class = FPC_QNAN;
2117e76048aSMarcel Moolenaar fp->fp_sign = 0;
2127e76048aSMarcel Moolenaar fp->fp_mant[0] = FP_1 - 1;
2137e76048aSMarcel Moolenaar fp->fp_mant[1] = fp->fp_mant[2] = fp->fp_mant[3] = ~0;
2147e76048aSMarcel Moolenaar DUMPFPN(FPE_REG, fp);
2157e76048aSMarcel Moolenaar return (fp);
2167e76048aSMarcel Moolenaar }
217