Replace the unmaintainable assembler code responsible for 88100 precise FPU

fault handling with a C wrapper around the softfloat code, as already done for 88110 kernels. As a bonus, attempting to read or write any FPU control register other than fcr62 and fcr63 in userland will now correctly signal an illegal instruction, instead of leaving the destination register unchanged and pretending nothing bad happened. Be sure to rm m88100_fp.d in your kernel compile directory after updating your tree.
author: miod <miod@openbsd.org> 2014-06-09 16:26:32 +0000
committer: miod <miod@openbsd.org> 2014-06-09 16:26:32 +0000
commit: af421d72ce5387c9dfb0050c65afb3f1be689da3 (patch)
tree: a19a10d528e1311fadec189e654f76237dc71077
parent: Remove redundant regdump() output. (diff)
download: wireguard-openbsd-af421d72ce5387c9dfb0050c65afb3f1be689da3.tar.xz
wireguard-openbsd-af421d72ce5387c9dfb0050c65afb3f1be689da3.zip
10 files changed, 732 insertions, 2137 deletions
diff --git a/sys/arch/aviion/conf/Makefile.aviion b/sys/arch/aviion/conf/Makefile.aviion
index 749079ca0b7..bde4c65043a 100644
--- a/sys/arch/aviion/conf/Makefile.aviion
+++ b/sys/arch/aviion/conf/Makefile.aviion
@@ -1,4 +1,4 @@
-#	$OpenBSD: Makefile.aviion,v 1.45 2014/05/08 22:17:33 miod Exp $
+#	$OpenBSD: Makefile.aviion,v 1.46 2014/06/09 16:26:32 miod Exp $
 
 # For instructions on building kernels consult the config(8) and options(4)
 # manual pages.
@@ -143,7 +143,7 @@ db_structinfo.h: $S/ddb/db_structinfo.c $S/ddb/parse_structinfo.pl
 	rm -f db_structinfo.o
 
 locore.o: ${_machdir}/${_mach}/locore.S assym.h
-eh.o m88100_fp.o mutex.o process.o subr.o: assym.h
+eh.o m88100_fp_imp.o mutex.o process.o subr.o: assym.h
 
 # The install target can be redefined by putting a
 # install-kernel-${MACHINE_NAME} target into /etc/mk.conf
diff --git a/sys/arch/luna88k/conf/Makefile.luna88k b/sys/arch/luna88k/conf/Makefile.luna88k
index abe39b556e1..22d551e682f 100644
--- a/sys/arch/luna88k/conf/Makefile.luna88k
+++ b/sys/arch/luna88k/conf/Makefile.luna88k
@@ -1,4 +1,4 @@
-#	$OpenBSD: Makefile.luna88k,v 1.53 2014/05/08 22:17:33 miod Exp $
+#	$OpenBSD: Makefile.luna88k,v 1.54 2014/06/09 16:26:32 miod Exp $
 
 # For instructions on building kernels consult the config(8) and options(4)
 # manual pages.
@@ -143,7 +143,7 @@ db_structinfo.h: $S/ddb/db_structinfo.c $S/ddb/parse_structinfo.pl
 	rm -f db_structinfo.o
 
 locore.o: ${_machdir}/${_mach}/locore.S assym.h
-eh.o m88100_fp.o mutex.o process.o subr.o: assym.h
+eh.o m88100_fp_imp.o mutex.o process.o subr.o: assym.h
 
 # The install target can be redefined by putting a
 # install-kernel-${MACHINE_NAME} target into /etc/mk.conf
diff --git a/sys/arch/m88k/conf/files.m88k b/sys/arch/m88k/conf/files.m88k
index 44679231cc2..ee78c974160 100644
--- a/sys/arch/m88k/conf/files.m88k
+++ b/sys/arch/m88k/conf/files.m88k
@@ -1,14 +1,16 @@
-#	$OpenBSD: files.m88k,v 1.26 2014/06/09 10:26:10 miod Exp $
+#	$OpenBSD: files.m88k,v 1.27 2014/06/09 16:26:32 miod Exp $
 
 file	arch/m88k/m88k/atomic.S				multiprocessor
 file	arch/m88k/m88k/db_disasm.c			ddb
 file	arch/m88k/m88k/db_interface.c			ddb
 file	arch/m88k/m88k/db_sstep.c			ddb
 file	arch/m88k/m88k/db_trace.c			ddb
+file	arch/m88k/m88k/fpu.c
 file	arch/m88k/m88k/in_cksum.c			inet
-file	arch/m88k/m88k/m88100_fp.S			m88100
+file	arch/m88k/m88k/m88100_fp.c			m88100
 file	arch/m88k/m88k/m88100_fp_imp.S			m88100
 file	arch/m88k/m88k/m88100_machdep.c			m88100
+file	arch/m88k/m88k/m88110_fp.c			m88110
 file	arch/m88k/m88k/m88110_mmu.S			m88110
 file	arch/m88k/m88k/m8820x_machdep.c			m88100
 file	arch/m88k/m88k/m88k_machdep.c
@@ -26,9 +28,7 @@ file	arch/m88k/m88k/vectors_88100.S			m88100
 file	arch/m88k/m88k/vectors_88110.S			m88110
 file	arch/m88k/m88k/vm_machdep.c
 
-# floating-point support code for 88110
-file	arch/m88k/m88k/m88110_fp.c			m88110
-file	lib/libkern/softfloat.c				m88110
+file	lib/libkern/softfloat.c
 
 file	lib/libkern/arch/m88k/divsi3.S
 file	lib/libkern/arch/m88k/modsi3.S
diff --git a/sys/arch/m88k/include/ieeefp.h b/sys/arch/m88k/include/ieeefp.h
index 1af791fc06e..540f3099dc8 100644
--- a/sys/arch/m88k/include/ieeefp.h
+++ b/sys/arch/m88k/include/ieeefp.h
@@ -1,4 +1,4 @@
-/*	$OpenBSD: ieeefp.h,v 1.4 2010/04/21 15:37:32 miod Exp $ */
+/*	$OpenBSD: ieeefp.h,v 1.5 2014/06/09 16:26:32 miod Exp $ */
 /*
  * Copyright (c) 1996 Nivas Madhur
  * All rights reserved.
@@ -56,7 +56,7 @@ typedef enum {
 #ifdef _KERNEL
 
 /*
- * Defines for the 88110 floating-point completion code.
+ * Defines for the floating-point completion code.
  */
 
 #include <sys/param.h>
@@ -83,6 +83,6 @@ countLeadingZeros32(u_int32_t a)
 	return (a != 0 ? 31 - rc : rc);
 }
 
-#endif
+#endif /* _KERNEL */
 
 #endif /* _M88K_IEEEFP_H_ */
diff --git a/sys/arch/m88k/m88k/fpu.c b/sys/arch/m88k/m88k/fpu.c
new file mode 100644
index 00000000000..69885828861
--- /dev/null
+++ b/sys/arch/m88k/m88k/fpu.c
@@ -0,0 +1,308 @@
+/*	$OpenBSD: fpu.c,v 1.1 2014/06/09 16:26:32 miod Exp $	*/
+
+/*
+ * Copyright (c) 2007, 2014, Miodrag Vallat.
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice, this permission notice, and the disclaimer below
+ * appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+/*
+ * Common bits between the 88100 and the 88110 floating point completion
+ * code.
+ */
+
+#include <sys/types.h>
+#include <sys/param.h>
+#include <sys/proc.h>
+
+#include <machine/fpu.h>
+#include <machine/frame.h>
+#include <machine/ieeefp.h>
+
+#include <lib/libkern/softfloat.h>
+
+#include <m88k/m88k/fpu.h>
+
+/*
+ * Values for individual bits in fcmp results.
+ *
+ * Every CC_* value below is a single-bit mask.  fpu_compare() ORs the
+ * masks which apply to the comparison into one word, and stores that word
+ * in the destination register image of the trapframe.
+ */
+#define	CC_UN	0x00000001	/* unordered */
+#define	CC_LEG	0x00000002	/* less than, equal or greater than */
+#define	CC_EQ	0x00000004	/* equal */
+#define	CC_NE	0x00000008	/* not equal */
+#define	CC_GT	0x00000010	/* greater than */
+#define	CC_LE	0x00000020	/* less than or equal */
+#define	CC_LT	0x00000040	/* less than */
+#define	CC_GE	0x00000080	/* greater than or equal */
+#define	CC_OU	0x00000100	/* out of range */
+#define	CC_IB	0x00000200	/* in range or on boundary */
+#define	CC_IN	0x00000400	/* in range */
+#define	CC_OB	0x00000800	/* out of range or on boundary */
+/* the following only on 88110 */
+#define	CC_UE	0x00001000	/* unordered or equal */
+#define	CC_LG	0x00002000	/* less than or greater than */
+#define	CC_UG	0x00004000	/* unordered or greater than */
+#define	CC_ULE	0x00008000	/* unordered or less than or equal */
+#define	CC_UL	0x00010000	/* unordered or less than */
+#define	CC_UGE	0x00020000	/* unordered or greater than or equal */
+
+/*
+ * Inlines from softfloat-specialize.h which are not made public, needed
+ * for fpu_compare.
+ *
+ * Both operate on the bit pattern of a float32 value and yield nonzero
+ * when the test is true.  The argument is parenthesized in the expansion
+ * so that any expression may be passed; note that
+ * float32_is_signaling_nan() evaluates its argument twice, so it must be
+ * free of side effects.
+ */
+#define	float32_is_nan(a) \
+	(0xff000000 < ((a) << 1))
+#define	float32_is_signaling_nan(a) \
+	(((((a) >> 22) & 0x1ff) == 0x1fe) && ((a) & 0x003fffff))
+
+/*
+ * Store a floating-point result, converting it to the required format if it
+ * is of smaller precision.
+ *
+ * frame	trapframe whose general register image receives the result
+ * regno	destination register number; register 0 is never written
+ * orig_width	FTYPE_* format of the value found in *src
+ * width	FTYPE_* format to store the value as
+ * src		the value to store
+ *
+ * When width is FTYPE_INT, the value is converted to a 32-bit integer; the
+ * round-to-zero conversion is used if the rounding mode read from tf_fpcr
+ * is FP_RZ, the regular softfloat conversion otherwise.
+ *
+ * When width is FTYPE_DBL, the high word goes to regno and the low word to
+ * regno + 1; the low word is dropped if regno is 31.
+ *
+ * This assumes the original format (orig_width) is not FTYPE_INT, and the
+ * final format (width) <= orig_width.  Should a caller break this contract,
+ * no conversion is performed and any register which still gets written
+ * receives zero instead of indeterminate stack contents.
+ */
+void
+fpu_store(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
+    fparg *src)
+{
+	u_int32_t tmp = 0;	/* defined value for unhandled formats */
+	u_int rd;
+
+	switch (width) {
+	case FTYPE_INT:
+		rd = float_get_round(frame->tf_fpcr);
+		switch (orig_width) {
+		case FTYPE_SNG:
+			if (rd == FP_RZ)
+				tmp = float32_to_int32_round_to_zero(src->sng);
+			else
+				tmp = float32_to_int32(src->sng);
+			break;
+		case FTYPE_DBL:
+			if (rd == FP_RZ)
+				tmp = float64_to_int32_round_to_zero(src->dbl);
+			else
+				tmp = float64_to_int32(src->dbl);
+			break;
+		}
+		if (regno != 0)
+			frame->tf_r[regno] = tmp;
+		break;
+	case FTYPE_SNG:
+		switch (orig_width) {
+		case FTYPE_SNG:
+			tmp = src->sng;
+			break;
+		case FTYPE_DBL:
+			tmp = float64_to_float32(src->dbl);
+			break;
+		}
+		if (regno != 0)
+			frame->tf_r[regno] = tmp;
+		break;
+	case FTYPE_DBL:
+		switch (orig_width) {
+		case FTYPE_DBL:
+			/* high word first, then low word in the next register */
+			tmp = (u_int32_t)(src->dbl >> 32);
+			if (regno != 0)
+				frame->tf_r[regno] = tmp;
+			tmp = (u_int32_t)src->dbl;
+			if (regno != 31)
+				frame->tf_r[regno + 1] = tmp;
+			break;
+		}
+		break;
+	}
+}
+
+/*
+ * Pick the widest of the three precisions handed in.
+ *
+ * The result is the numerically largest of ts1, ts2 and td.  None of them
+ * may be FTYPE_INT, which does not denote a floating-point precision.
+ */
+u_int
+fpu_precision(u_int ts1, u_int ts2, u_int td)
+{
+	u_int widest = ts1;
+
+	if (ts2 > widest)
+		widest = ts2;
+	if (td > widest)
+		widest = td;
+	return widest;
+}
+
+/*
+ * Perform a compare instruction (fcmp, fcmpu).
+ *
+ * frame	trapframe whose general register image receives the result
+ * s1, s2	the operands, both in the format given by width
+ * width	FTYPE_SNG or FTYPE_DBL; no other format is handled here
+ * rd		destination register number; register 0 is never written
+ * fcmpu	nonzero for fcmpu, zero for fcmp
+ *
+ * If either operand is NaN, the result is unordered.  This causes a
+ * reserved operand exception (except for nonsignalling NaNs for fcmpu).
+ *
+ * The result is a mask of CC_* bits.  The bits which only exist on 88110
+ * are removed from every result when running on an 88100.
+ */
+void
+fpu_compare(struct trapframe *frame, fparg *s1, fparg *s2, u_int width,
+    u_int rd, u_int fcmpu)
+{
+	u_int32_t cc;
+	int zero, s1positive, s2positive;
+
+	/*
+	 * Handle NaNs first, and raise invalid if fcmp or signaling NaN.
+	 */
+	switch (width) {
+	case FTYPE_SNG:
+		if (float32_is_nan(s1->sng)) {
+			if (!fcmpu || float32_is_signaling_nan(s1->sng))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		if (float32_is_nan(s2->sng)) {
+			if (!fcmpu || float32_is_signaling_nan(s2->sng))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		break;
+	case FTYPE_DBL:
+		if (float64_is_nan(s1->dbl)) {
+			if (!fcmpu || float64_is_signaling_nan(s1->dbl))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		if (float64_is_nan(s2->dbl)) {
+			if (!fcmpu || float64_is_signaling_nan(s2->dbl))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		break;
+	}
+
+	/*
+	 * Now order the two numbers.
+	 */
+	switch (width) {
+	case FTYPE_SNG:
+		if (float32_eq(s1->sng, s2->sng))
+			cc = CC_EQ;
+		else if (float32_lt(s1->sng, s2->sng))
+			cc = CC_LT | CC_NE;
+		else
+			cc = CC_GT | CC_NE;
+		break;
+	case FTYPE_DBL:
+		if (float64_eq(s1->dbl, s2->dbl))
+			cc = CC_EQ;
+		else if (float64_lt(s1->dbl, s2->dbl))
+			cc = CC_LT | CC_NE;
+		else
+			cc = CC_GT | CC_NE;
+		break;
+	}
+
+done:
+
+	/*
+	 * Complete condition code mask.
+	 */
+
+	if (cc & CC_UN)
+		cc |= CC_UE | CC_UG | CC_ULE | CC_UL | CC_UGE;
+	if (cc & CC_EQ)
+		cc |= CC_LE | CC_GE | CC_UE;
+	if (cc & CC_GT)
+		cc |= CC_GE;
+	if (cc & CC_LT)
+		cc |= CC_LE;
+	if (cc & (CC_LT | CC_GT))
+		cc |= CC_LG;
+	if (cc & (CC_LT | CC_GT | CC_EQ))
+		cc |= CC_LEG;
+	if (cc & CC_GT)
+		cc |= CC_UG;
+	if (cc & CC_LE)
+		cc |= CC_ULE;
+	if (cc & CC_LT)
+		cc |= CC_UL;
+	if (cc & CC_GE)
+		cc |= CC_UGE;
+
+	/*
+	 * Fill the interval bits.
+	 * s1 is compared to the interval [0, s2].
+	 */
+	if (!(cc & CC_UN)) {
+		if (cc & CC_EQ) {
+			/* if s1 and s2 are equal, s1 is on boundary */
+			cc |= CC_IB | CC_OB;
+			goto completed;
+		}
+
+		/* s1 and s2 are either Zero, numbers or Inf */
+		switch (width) {
+		case FTYPE_SNG:
+			zero = float32_eq(s1->sng, 0);
+			break;
+		case FTYPE_DBL:
+			zero = float64_eq(s1->dbl, 0LL);
+			break;
+		}
+		if (zero) {
+			/* if s1 is zero, it is on boundary */
+			cc |= CC_IB | CC_OB;
+			goto completed;
+		}
+
+		switch (width) {
+		case FTYPE_SNG:
+			s1positive = s1->sng >> 31 == 0;
+			s2positive = s2->sng >> 31 == 0;
+			break;
+		case FTYPE_DBL:
+			s1positive = s1->dbl >> 63 == 0;
+			s2positive = s2->dbl >> 63 == 0;
+			break;
+		}
+		if (s2positive) {
+			/* s2 is positive, the interval is [0, s2] */
+			if (cc & CC_GT) {
+				/* 0 <= s2 < s1 -> out of interval */
+				cc |= CC_OU | CC_OB;
+			} else if (s1positive) {
+				/* 0 < s1 < s2 -> in interval */
+				cc |= CC_IB | CC_IN;
+			} else {
+				/* s1 < 0 <= s2 */
+				cc |= CC_OU | CC_OB;
+			}
+		} else {
+			/* s2 is negative, the interval is [s2, 0] */
+			if (cc & CC_LT) {
+				/* s1 < s2 <= 0 */
+				cc |= CC_OU | CC_OB;
+			} else if (!s1positive) {
+				/* s2 < s1 < 0 */
+				cc |= CC_IB | CC_IN;
+			} else {
+				/* s2 < 0 < s1 */
+				cc |= CC_OU | CC_OB;
+			}
+		}
+	}
+
+	/*
+	 * Every path, including the on-boundary shortcuts above, must go
+	 * through the 88100 mask below, hence the position of the label.
+	 */
+completed:
+#ifdef M88100
+	if (CPU_IS88100)
+		cc &= ~(CC_UE | CC_LG | CC_UG | CC_ULE | CC_UL | CC_UGE);
+#endif
+
+	if (rd != 0)
+		frame->tf_r[rd] = cc;
+}
diff --git a/sys/arch/m88k/m88k/fpu.h b/sys/arch/m88k/m88k/fpu.h
new file mode 100644
index 00000000000..0e62030f789
--- /dev/null
+++ b/sys/arch/m88k/m88k/fpu.h
@@ -0,0 +1,42 @@
+/*	$OpenBSD: fpu.h,v 1.1 2014/06/09 16:26:32 miod Exp $	*/
+
+/*
+ * Copyright (c) 2014 Miodrag Vallat.
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+/*
+ * Internal defines for the floating-point completion code.
+ *
+ * float32 and float64 are not declared here; they have to be known before
+ * this file is included (fpu.c includes <lib/libkern/softfloat.h> first).
+ */
+
+#ifndef _M88K_M88K_FPU_H_
+#define _M88K_M88K_FPU_H_
+
+/* only pointers to the trapframe are needed by the prototypes below */
+struct trapframe;
+
+/*
+ * Data width (matching the TD field of the instructions)
+ */
+#define	FTYPE_SNG	0
+#define	FTYPE_DBL	1
+#define	FTYPE_EXT	2
+#define	FTYPE_INT	3	/* not a real T value */
+
+/* NOTE(review): presumably for operands whose width is irrelevant - confirm */
+#define	IGNORE_PRECISION	FTYPE_SNG
+
+/* floating point value */
+typedef union {
+	float32		sng;	/* used with FTYPE_SNG */
+	float64		dbl;	/* used with FTYPE_DBL */
+} fparg;
+
+void	fpu_compare(struct trapframe *, fparg *, fparg *, u_int, u_int, u_int);
+int	fpu_emulate(struct trapframe *, u_int32_t);
+u_int	fpu_precision(u_int, u_int, u_int);
+void	fpu_store(struct trapframe *, u_int, u_int, u_int, fparg *);
+
+#endif /* _M88K_M88K_FPU_H_ */
diff --git a/sys/arch/m88k/m88k/m88100_fp.S b/sys/arch/m88k/m88k/m88100_fp.S
deleted file mode 100644
index 6e4cbd40c62..00000000000
--- a/sys/arch/m88k/m88k/m88100_fp.S
+++ /dev/null
@@ -1,1816 +0,0 @@
-/* $OpenBSD: m88100_fp.S,v 1.10 2014/06/09 10:26:10 miod Exp $	*/
-/*
- * Mach Operating System
- * Copyright (c) 1991 Carnegie Mellon University
- * Copyright (c) 1991 OMRON Corporation
- * All Rights Reserved.
- *
- * Permission to use, copy, modify and distribute this software and its
- * documentation is hereby granted, provided that both the copyright
- * notice and this permission notice appear in all copies of the
- * software, derivative works or modified versions, and any portions
- * thereof, and that both notices appear in supporting documentation.
- *
- * CARNEGIE MELLON AND OMRON ALLOW FREE USE OF THIS SOFTWARE IN ITS "AS IS"
- * CONDITION.  CARNEGIE MELLON AND OMRON DISCLAIM ANY LIABILITY OF ANY KIND
- * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
- *
- * Carnegie Mellon requests users of this software to return to
- *
- *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
- *  School of Computer Science
- *  Carnegie Mellon University
- *  Pittsburgh PA 15213-3890
- *
- * any improvements or extensions that they make and grant Carnegie the
- * rights to redistribute these changes.
- */
-
-/* Floating point trouble routines */
-#include "assym.h"
-#include <machine/trap.h>
-#include <machine/asm.h>
-
-#define destsize 10
-
-/* Floating-Point Status Register bits */
-#define inexact		0
-#define overflow	1
-#define underflow	2
-#define divzero		3
-#define oper		4
-
-#define sign		31
-#define s1size		9
-#define s2size		7
-#define dsize		5
-
-#define FADDop		0x05
-#define FSUBop		0x06
-#define FCMPop		0x07
-#define FMULop		0x00
-#define FDIVop		0x0e
-#define FSQRTop		0x0f
-#define INTop		0x09
-#define NINTop		0x0a
-#define TRNCop		0x0b
-
-#define s1nan		7
-#define s2nan		6
-#define s1inf		5
-#define s2inf		4
-#define s1zero		3
-#define s2zero		2
-#define sigbit		19
-
-#define rndhi		15
-#define rndlo		14
-
-ENTRY(m88100_fpu_precise_exception)
-	or	%r29, %r2,  %r0		/* r29 is now the E.F. */
-	subu	%r31, %r31, 16
-	st	%r1,  %r31, 8
-	st	%r29, %r31, 12
-
-	ld	%r2,  %r29, EF_FPSR
-	ld	%r3,  %r29, EF_FPCR
-	ld	%r4,  %r29, EF_FPECR
-	ld	%r5,  %r29, EF_FPHS1
-	ld	%r6,  %r29, EF_FPLS1
-	ld	%r7,  %r29, EF_FPHS2
-	ld	%r8,  %r29, EF_FPLS2
-	ld	%r9,  %r29, EF_FPPT
-
-	/*
-	 * Load into %r1 the return address for the zero handlers. Looking at
-	 * FPECR, branch to the appropriate zero handler. However, if none of
-	 * the zero bits are enabled, then a floating point instruction was
-	 * issued with the floating point unit disabled. This will cause an
-	 * unimplemented opcode 0.
-	 */
-
-	or.u	%r1, %r0, %hi16(wrapup)	/* load return address of function */
-	or	%r1, %r1, %lo16(wrapup)
-
-	bb0	6, %r4, 3f		/* branch to FPunimp if bit set */
-	br	FPuimp
-3:
-	bb0	7, %r4, 4f		/* branch to FPintover if bit set */
-	br	FPintover
-4:
-#if 0
-	bb0	5, %r4, 5f		/* branch to FPpriviol if bit set */
-	br	FPpriviol
-#endif
-5:
-	bb0	4, %r4, 6f		/* branch to FPresoper if bit set */
-	br	FPresoper
-6:
-	bb0	3, %r4, 7f		/* branch to FPdivzero if bit set */
-	br	FPdivzero
-7:
-	or.u	%r4, %r4, 0xffff
-
-ASLOCAL(FPuimp)
-	subu	%r31, %r31, 16		/* allocate stack */
-	st	%r1,  %r31, 0		/* save return address */
-	or	%r2,  %r0,  T_FPEPFLT	/* load trap type */
-	bsr.n	_C_LABEL(m88100_trap)
-	 or	%r3,  %r29, %r0
-	ld	%r1,  %r31, 0		/* recover return address */
-	addu	%r31, %r31, 16		/* deallocate stack */
-	jmp	%r1
-
-	/*
-	 * To write back the results to the user registers, disable exceptions
-	 * and the floating point unit. Write FPSR and FPCR and load the SNIP
-	 * and SFIP.
-	 * r5 will contain the upper word of the result
-	 * r6 will contain the lower word of the result
-	 */
-
-ASLOCAL(wrapup)
-	FLUSH_PIPELINE		/* make sure all floating point operations */
-				/* have finished */
-	ldcr	%r10, %cr1	/* load the PSR */
-#if 0
-	set	%r10, %r10, 1<PSR_FPU_DISABLE_BIT>
-#endif
-	set	%r10, %r10, 1<PSR_INTERRUPT_DISABLE_BIT>
-	stcr	%r10, %cr1
-
-	ld	%r1,  %r31, 8
-	ld	%r29, %r31, 12
-	addu	%r31, %r31, 16
-
-	fstcr	%r2, FPSR		/* write revised value of FPSR... */
-	fstcr	%r3, FPCR		/* ...and FPCR... */
-	st	%r2, %r29, EF_FPSR	/* ...into the trapframe as well */
-	st	%r3, %r29, EF_FPCR
-
-	/* result writeback routine */
-	addu	%r3, %r29, EF_R0
-	extu	%r2, %r9,  5<0>		/* get 5 bits of destination register */
-	bb0	5,   %r9,  writesingle	/* branch if destination is single */
-
-/* writedouble here */
-	st	%r5, %r3[%r2]		/* write high word */
-	add	%r2, %r2, 1		/* for double, the low word is the */
-					/* unspecified register */
-	clr	%r2, %r2, 27<5>		/* perform equivalent of mod 32 */
-ASLOCAL(writesingle)
-	jmp.n	%r1
-	 st	%r6, %r3[%r2]		/* write low word into memory */
-
-/*
- * Check if the numerator is zero. If the numerator is zero, then handle
- * this instruction as you would a 0/0 invalid operation.
- */
-
-ASLOCAL(FPdivzero)
-	bb1.n	s1size, %r9, 1f		/* branch if numerator double */
-	 st	%r1,  %r31, 0		/* save return address */
-/* single number */
-	clr	%r10, %r5,  1<sign>	/* clear sign bit */
-	extu	%r11, %r6,  3<29>	/* grab upper bits of lower word */
-	or	%r10, %r10, %r11	/* combine ones of mantissa */
-	bcnd	eq0,  %r10, resoper	/* numerator is zero, handle */
-					/* reserved operand */
-	br	setbit			/* set divzero bit */
-1:
-/* double number */
-	clr	%r10, %r5,  1<sign>	/* clear sign bit */
-	or	%r10, %r10, %r6		/* or high and low words */
-	bcnd	ne0,  %r10, setbit	/* set divzero bit */
-
-/*
- * The numerator is zero, so handle the invalid operation by setting the
- * invalid operation bit and writing a quiet NaN to the destination.
- */
-
-ASLOCAL(resoper)
-	set	%r2, %r2, 1<oper>
-	set	%r5, %r0, 0<0>	/* put a NaN in high word */
-	set	%r6, %r0, 0<0>	/* put a NaN in low word */
-	br	FP_div_return	/* writing to a word which may be ignored */
-				/* is just as quick as checking the precision */
-				/* of the destination */
-
-/*
- * The operation is divide by zero, so set the divide by zero bit in the
- * FPSR.
- * Considering the sign of the numerator and zero, write a correctly
- * signed infinity of the proper precision into the destination.
- */
-
-setbit:
-	set	%r2, %r2, 1<divzero>
-	bb1	dsize, %r9, FPzero_double	/* branch to handle double result */
-FPzero_single:
-	clr	%r10, %r5, 31<0>	/* clear all of S1HI except sign bit */
-	xor	%r10, %r7, %r10		/* xor the sign bits of the operands */
-	or.u	%r6,  %r0, 0x7f80	/* load single precision infinity */
-	br.n	FP_div_return
-	 or	%r6,  %r6, %r10		/* load correctly signed infinity */
-
-FPzero_double:
-	clr	%r10, %r5, 31<0>	/* clear all of S1HI except sign bit */
-	xor	%r10, %r7, %r10		/* xor the sign bits of the operands */
-	or.u	%r5,  %r0, 0x7ff0	/* load double precision infinity */
-	or	%r5,  %r5, %r10		/* load correctly signed infinity */
-	or	%r6,  %r0, %r0		/* clear lower word of double */
-
-FP_div_return:
-	ld	%r1,  %r31, 0		/* load return address */
-	jmp	%r1
-
-/*
- * Both NINT and TRNC require a certain rounding mode, so check which
- * instruction caused the integer conversion overflow. Use a substitute
- * FPCR in %r1, and modify the rounding mode if the instruction is NINT
- * or TRNC.
- */
-ASLOCAL(FPintover)
-	extu	%r10, %r9,  5<11>	/* extract opcode */
-	cmp	%r11, %r10, INTop	/* see if instruction is INT */
-	st	%r1,  %r31, 0		/* save return address */
-	bb1.n	eq,   %r11, checksize	/* instruction is INT, do not modify */
-					/* rounding mode */
-	 or	%r1,  %r0,  %r3		/* load FPCR into r1 */
-	cmp	%r11, %r10, NINTop	/* see if instruction is NINT */
-	bb1	eq,   %r11, NINT	/* instruction is NINT */
-TRNC:
-	clr	%r1,  %r1,  2<rndlo>	/* clear rounding mode bits, */
-					/* instruction is TRNC */
-	br.n	checksize		/* branch to check size */
-	 set	%r1,  %r1,  1<rndlo>	/* make rounding mode round towards */
-					/* zero */
-NINT:
-	clr	%r1,  %r1,  2<rndlo>	/* make rounding mode round to */
-					/* nearest */
-
-/* See whether the source is single or double precision. */
-
-checksize:
-	bb1	s2size, %r9, checkdoub	/* S2 is double, branch to see if */
-					/* there is a false alarm */
-
-/*
- * An integer has more bits than the mantissa of a single precision floating
- * point number, so to check for false alarms (i.e. valid conversion), simply
- * check the exponents. False alarms are detected for 2**30 to (2**30) - 1
- * and -2**30 to -2**31. Only seven bits need to be looked at since an
- * exception will not occur for the other half of the numbering system.
- * To speed up the processing, first check to see if the exponent is 32 or
- * greater.
- *
- * This code was originally written for the exponent in the control
- * register to have the most significant bit (8 - single, 11 - double)
- * flipped and sign extended. For precise exceptions, however, the most
- * significant bit is only sign extended. Therefore, the code was chopped
- * up so that it would work for positive values of real exponent which were
- * only sign extended.
- */
-
-checksing:
-	extu	%r10, %r7, 7<20>/* internal representation for single */
-				/* precision is IEEE 8 bits sign extended */
-				/* to 11 bits; for real exp. = 30, the */
-				/* above instruction gives a result exp. */
-				/* that has the MSB flipped and sign */
-				/* extended like in the IMPCR */
-	cmp	%r11, %r10, 31	/* compare to 32, but exp. off by 1 */
-				/* these 2 instructions to speed up valid */
-				/* execution of valid cases */
-	bb1	ge,   %r11, overflw /* valid case, perform overflow routine */
-	bb1	sign, %r7, checksingn /* source operand is negative */
-
-/*
- * If the number is positve and the exponent is greater than 30, than it is
- * overflow.
- */
-checksingp:
-	cmp	%r10, %r10, 29		/* compare to 30, but exp. off by 1 */
-	bb1	gt,   %r10, overflw	/* no false alarm, its overflow */
-	br	conversionsp		/* finish single precision conversion */
-
-/*
- * If the number is negative, and the exponent is 30, or 31 with a mantissa
- * of 0, then it is a false alarm.
- */
-checksingn:
-	cmp	%r11, %r10, 30		/* compare to 31, but exp. off by 1 */
-	bb1	lt,   %r11, conversionsn/* exp. less than 31, so convert */
-	extu	%r10, %r8,  3<29>	/* get upper three bits of lower */
-					/* mantissa */
-	mak	%r12, %r7,  20<3>	/* get upper 20 bits of mantissa */
-	or	%r10, %r10, %r12	/* form complete mantissa */
-	bcnd	eq0,  %r10, conversionsn/* complete conversion if mantissa */
-					/* is 0 */
-	br	overflw			/* no false alarm, its overflow */
-
-/*
- * False alarms are detected for 2**30 to (2**30) - 1 and -2**30 to -2**31.
- * Only seven bits need to be looked at since an exception will not occur
- * for the other half of the numbering system.
- * To speed up the processing, first check to see if the exponent is 32 or
- * greater. Since there are more mantissa bits than integer bits, rounding
- * could cause overflow. (2**31) - 1 needs to be checked so that it does
- * not round to 2**31, and -2**31 needs to be checked in case it rounds to
- * -((2**31) + 1).
- */
-checkdoub:
-	extu	%r10, %r7, 10<20>/* internal representation for double */
-				/* precision is the same IEEE 11 bits */
-				/* for real exp. = 30, the */
-				/* above instruction gives a result exp. */
-				/* that has the MSB flipped and sign */
-				/* extended like in the IMPCR */
-	cmp	%r11, %r10, 31	/* compare to 32, but exp. off by 1 */
-				/* these 2 instructions to speed up valid */
-				/* execution of valid cases */
-	bb1	ge,   %r11, overflw /* valid case, perform overflow routine */
-	bb1	sign, %r7,  checkdoubn /* source operand is negative */
-
-/*
- * If the exponent is not 31, then the floating point number will be rounded
- * before the conversion is done. A branch table is set up with bits 4 and 3
- * being the rounding mode, and bits 2, 1, and 0 are the guard, round, and
- * sticky bits.
- */
-checkdoubp:
-	cmp	%r11, %r10, 30		/* compare to 31, but exponent is */
-					/* off by 1 */
-	bb1	eq,   %r11, overflw	/* no false alarm, it's overflow */
-	extu	%r12, %r8,  1<22>	/* get LSB for integer with exp. = 30 */
-	mak	%r12, %r12, 1<2>	/* start to set up field for branch */
-					/* table */
-	extu	%r11, %r8,  1<21>	/* get guard bit */
-	mak	%r11, %r11, 1<1>	/* set up field for branch table */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	extu	%r11, %r8,  21<0>	/* get bits for sticky bit */
-	bcnd	eq0,  %r11, nostickyp	/* do not set sticky */
-	set	%r12, %r12, 1<0>	/* set sticky bit */
-nostickyp:
-	rot	%r11, %r1,  0<rndlo>	/* shift rounding mode to 2 LSB''s */
-	mak	%r11, %r11, 2<3>	/* set up field, clear other bits */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	lda	%r12, %r0[%r12]		/* scale r12 */
-	or.u	%r12, %r12, %hi16(ptable)/* load pointer into table */
-	addu	%r12, %r12, %lo16(ptable)
-	jmp	%r12
-
-ptable:
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	paddone
-	br	conversiondp
-	br	conversiondp
-	br	paddone
-	br	paddone
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	paddone
-	br	paddone
-	br	paddone
-	br	conversiondp
-	br	paddone
-	br	paddone
-	br	paddone
-
-/*
- * Add one to the bit of the mantissa which corresponds to the LSB of an
- * integer. If the mantissa overflows, then there is a valid integer
- * overflow conversion; otherwise, the mantissa can be converted to the
- * integer.
- */
-paddone:
-	or	%r10, %r0,  %r0		/* clear r10 */
-	set	%r10, %r10, 1<22>	/* set LSB bit to 1 for adding */
-	addu.co	%r8,  %r8,  %r10	/* add the 1 obtained from rounding */
-	clr	%r11, %r7,  12<20>	/* clear exponent and sign */
-	addu.ci	%r11, %r0,  %r11	/* add carry */
-	bb1	20,   %r11, overflw	/* overflow to 2**31, abort the rest */
-	br.n	conversiondp		/* since the exp. was 30, and the exp.*/
-					/* did not round up to 31, the */
-					/* largest number that S2 could */
-					/* become is 2**31-1 */
-	 or	%r7,  %r0,  %r11	/* store r11 into r7 for conversion */
-
-/*
- * Now check for negative double precision sources. If the exponent is 30,
- * then convert the false alarm. If the exponent is 31, then check the
- * mantissa bits which correspond to integer bits. If any of them are a one,
- * then there is overflow. If they are zero, then check the guard, round,
- * and sticky bits.
- * Round toward zero and positive will not cause a roundup, but round toward
- * nearest and negative may, so perform those roundings. If there is no
- * overflow, then convert and return.
- */
-checkdoubn:
-	cmp	%r11, %r10, 29		/* compare to 30, but exp. off by 1 */
-	bb1	eq,   %r11, conversiondn/* false alarm if exp. = 30 */
-	extu	%r10, %r8,  11<21>	/* check upper bits of lower mantissa */
-	bcnd	ne0,  %r10, overflw	/* one of the bits is a 1, so oflow */
-	extu	%r10, %r7,  20<0>	/* check upper bits of upper mantissa */
-	bcnd	ne0,  %r10, overflw	/* one of the bits is a 1, so oflow */
-	bb0	rndlo, %r1, possround	/* rounding mode is either round near */
-					/* or round negative, which may cause */
-					/* a round */
-	br.n	FPintov_return		/* round positive, which will not */
-					/* cause a round */
-	 set	%r6,  %r0,  1<sign>
-possround:
-	extu	%r12, %r8,  1<20>	/* get guard bit */
-	extu	%r11, %r8,  20<0>	/* get bits for sticky bit */
-	bcnd.n	eq0,  %r11, nostickyn	/* do not set sticky */
-	 mak	%r12, %r12, 1<1>	/* set up field for branch table */
-	set	%r12, %r12, 1<0>	/* set sticky bit */
-nostickyn:
-	bb1	rndhi, %r1, negative	/* rounding mode is negative */
-nearest:
-	cmp	%r12, %r12, 3		/* are both guard and sticky set */
-	bb1	eq,  %r12, overflw	/* both guard and sticky are set, */
-					/* so signal overflow */
-	or	%r6,  %r0,  %r0		/* clear destination register r6 */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<sign>	/* set the sign bit and take care of */
-					/* this special case */
-negative:
-	bcnd	ne0,  %r12, overflw	/* -2**31 will be rounded to */
-					/* -(2**31+1), so signal overflow */
-	or	%r6,  %r0,  %r0		/* clear destination register r6 */
-	br.n	FPintov_return
-	 set	%r6, %r6, 1<sign>	/* set the sign bit and take care of */
-					/* this special case */
-
-	/*
-	 * Since the exp. was 30, and there was no round-up, the largest
-	 * number that S2 could have been was 2**31 - 1
-	 */
-
-	/* Convert the single precision positive floating point number. */
-
-conversionsp:
-	extu	%r6,  %r8,  3<29>	/* extract lower bits of integer */
-	mak	%r6,  %r6,  3<7>	/* shift left to correct place in int */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<30>	/* set hidden one */
-
-	/* Convert the single precision negative floating point number. */
-
-conversionsn:
-	bb1	eq,   %r11, exp31s	/* use old r11 to see if exp. is 31 */
-	extu	%r6,  %r8,  3<29>	/* extract lower bits of mantissa */
-	mak	%r6,  %r6,  3<7>	/* shift left to correct place in int */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	set	%r6,  %r6,  1<30>	/* set hidden one */
-	or.c	%r6,  %r0,  %r6		/* negate result */
-	br.n	FPintov_return
-	 addu	%r6,  %r6,  1		/* add 1 to get 2''s complement */
-exp31s:
-	or	%r6,  %r0,  %r0		/* clear r6 */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<sign>	/* set sign bit */
-
-	/* Convert the double precision positive floating point number. */
-
-conversiondp:
-	extu	%r6,  %r8,  10<22>	/* extract lower bits of integer */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<30>	/* set hidden one */
-
-	/*
-	 * Convert the double precision negative floating point number.
-	 * The number, whose exponent is 30, must be rounded before converting.
-	 * Bits 4 and 3 are the rounding mode, and bits 2, 1, and 0 are the
-	 * guard, round, and sticky bits for the branch table.
-	 */
-
-conversiondn:
-	extu	%r12, %r8,  1<22>	/* get LSB for integer with exp. = 30 */
-	mak	%r12, %r12, 1<2>	/* start to set up field for branch */
-					/* table */
-	extu	%r11, %r8,  1<21>	/* get guard bit */
-	mak	%r11, %r11, 1<1>	/* set up field for branch table */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	extu	%r11, %r8,  21<0>	/* get bits for sticky bit */
-	bcnd	eq0,  %r11, nostkyn	/* do not set sticky */
-	set	%r12, %r12, 1<0>	/* set sticky bit */
-nostkyn:
-	rot	%r11, %r1,  0<rndlo>	/* shift rounding mode to 2 LSB''s */
-	mak	%r11, %r11, 2<3>	/* set up field, clear other bits */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	lda	%r12, %r0[%r12]		/* scale r12 */
-	or.u	%r12, %r12, %hi16(ntable)/* load pointer into table */
-	addu	%r12, %r12, %lo16(ntable)
-	jmp	%r12
-
-ntable:
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	naddone
-	br	nnoaddone
-	br	nnoaddone
-	br	naddone
-	br	naddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	naddone
-	br	naddone
-	br	naddone
-	br	nnoaddone
-	br	naddone
-	br	naddone
-	br	naddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-
-/*
- * Add one to the mantissa, and check to see if it overflows to -2**31.
- * The conversion is done in nnoaddone.
- */
-
-naddone:
-	or	%r10, %r0,  %r0		/* clear r10 */
-	set	%r10, %r10, 1<22>	/* set LSB bit to 1 for adding */
-	add.co	%r8,  %r8,  %r10	/* add the 1 obtained from rounding */
-	clr	%r7,  %r7,  12<20>	/* clear exponent and sign */
-	add.ci	%r7,  %r0,  %r7		/* add carry */
-	bb1	20,   %r7,  maxneg	/* rounded to -2**31, handle separately */
-					/* the exponent was originally 30 */
-nnoaddone:
-	extu	%r6,  %r8,  11<22>	/* extract lower bits of integer */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	set	%r6,  %r6,  1<30>	/* set hidden one */
-	or.c	%r6,  %r0,  %r6		/* negate integer */
-	br.n	FPintov_return
-	 addu	%r6,  %r6,  1		/* add 1 to get 2''s complement */
-
-maxneg:
-	or	%r6,  %r0,  %r0		/* clear integer */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<sign>	/* set sign bit */
-
-	/* For valid overflows, write the correctly signed largest integer. */
-overflw:
-	set	%r2,  %r2,  1<oper>
-	bb0.n	sign, %r7,  FPintov_return /* if positive then return */
-	 set	%r6,  %r6,  31<0>	/* set result to largest positive int */
-	or.c	%r6,  %r0,  %r6		/* negate r6, giving largest negative */
-					/* integer */
-
-FPintov_return:
-	ld	%r1,  %r31, 0		/* load return address from memory */
-	jmp	%r1
-
-/*
- * Some instructions only have the S2 operations, so clear S1HI and S1LO
- * for those instructions so that the previous contents of S1HI and S1LO
- * do not influence this instruction.
- */
-
-ASLOCAL(FPresoper)
-	st	%r1,  %r31, 0
-	extu	%r10, %r9,  5<11>	/* extract opcode */
-#if 0
-	cmp	%r11, %r10, FSQRTop	/* compare to FSQRT */
-	bb1	eq,   %r11, S1clear	/* clear S1 if instruction only had S2 operand */
-#endif
-	cmp	%r11, %r10, INTop	/* compare to INT */
-	bb1	eq,   %r11, S1clear	/* clear S1 if instruction only had S2 operand */
-	cmp	%r11, %r10, NINTop	/* compare to NINT */
-	bb1	eq,   %r11, S1clear	/* clear S1 if instruction only had S2 operand */
-	cmp	%r11, %r10, TRNCop	/* compare to TRNC */
-	bb0	eq,   %r11, opercheck	/* check for reserved operands */
-
-ASLOCAL(S1clear)
-	or	%r5,  %r0,  %r0	/* clear any NaN''s, denorms, or infinities */
-	or	%r6,  %r0,  %r0	/* that may be left in S1HI, S1LO from a */
-				/* previous instruction */
-
-/*
- * r12 contains the following flags:
- *   bit 9 -- s1sign
- *   bit 8 -- s2sign
- *   bit 7 -- s1nan
- *   bit 6 -- s2nan
- *   bit 5 -- s1inf
- *   bit 4 -- s2inf
- *   bit 3 -- s1zero
- *   bit 2 -- s2zero
- *   bit 1 -- s1denorm
- *   bit 0 -- s2denorm
- */
-
-/*
- * Using code for both single and double precision, check if S1 is either
- * a NaN or infinity and set the appropriate flags in %r12. Then check if
- * S2 is a NaN or infinity. If it is a NaN, then branch to the NaN routine.
- */
-
-ASLOCAL(opercheck)
-	extu	%r10, %r5,  11<20>	/* internal representation for double */
-	bb1.n	s1size, %r9, S1NaNdoub	/* S1 is double precision */
-	 or	%r12, %r0,  %r0		/* clear operand flag register */
-ASLOCAL(S1NaNsing)
-	xor	%r10, %r10, 0x0080	/* internal representation for single */
-	ext	%r10, %r10, 8<0>	/* precision is IEEE 8 bits sign extended */
-					/* to 11 bits; for real exp. > 0, the */
-					/* above instructions gives a result */
-					/* exp. that has the MSB flipped and */
-					/* sign extended like in the IMPCR */
-	cmp	%r11, %r10, 127		/* Is exponent equal to IEEE 255 */
-					/* (here 127) */
-	bb1	ne,   %r11, S2NaN	/* source 1 is not a NaN or infinity */
-	mak	%r10, %r5,  20<0>	/* load r10 with upper bits of S1 */
-					/* mantissa */
-	extu	%r11, %r6,  3<29>	/* get 3 upper bits of lower word */
-	or	%r11, %r10, %r11	/* combine any existing 1 */
-	bcnd	eq0,  %r11, noS1NaNs	/* since r11 can only hold 0 or a */
-					/* > 0 number, branch to noS1NaN */
-					/* when eq0 */
-	br.n	S2NaN			/* see if S2 has a NaN */
-	 set	%r12, %r12, 1<s1nan>	/* indicate that S1 has a NaN */
-ASLOCAL(noS1NaNs)
-	br.n	S2NaN			/* check contents of S2 */
-	 set	%r12, %r0, 1<s1inf>	/* indicate that S1 has an infinity */
-
-ASLOCAL(S1NaNdoub)
-	xor	%r10, %r10, 0x0400	/* precision is the same IEEE 11 bits */
-					/* The above instructions gives a */
-					/* result exp. that has the MSB */
-					/* flipped and sign extended like in */
-					/* the IMPCR */
-	cmp	%r11, %r10, 1023	/* Is exp. equal to IEEE 2047 */
-					/* (internal 1023) */
-	bb1	ne,   %r11, S2NaN	/* source 1 is not a NaN or infinity */
-	mak	%r10, %r5,  20<0>	/* load r10 with upper bits of S1 */
-					/* mantissa */
-	or	%r11, %r6,  %r10	/* combine existing 1''s of mantissa */
-	bcnd	eq0,  %r11, noS1NaNd	/* since r11 can only hold 0 or a */
-					/* > 0 number, branch to noS1NaN */
-					/* when eq0 */
-	br.n	S2NaN			/* see if S2 has a NaN */
-	 set	%r12, %r12, 1<s1nan>	/* indicate that S1 has a NaN */
-ASLOCAL(noS1NaNd)
-	set	%r12, %r0,  1<s1inf>	/* indicate that S1 has an infinity */
-
-ASLOCAL(S2NaN)
-	bb1.n	s2size, %r9, S2NaNdoub	/* S1 is double precision */
-	 extu	%r10, %r7,  11<20>	/* internal representation for double */
-ASLOCAL(S2NaNsing)
-	xor	%r10, %r10, 0x0080	/* internal representation for single */
-	ext	%r10, %r10, 8<0>	/* precision is IEEE 8 bits sign */
-					/* extended to 11 bits; for real exp. */
-					/* > 0, the above instruction gives a */
-					/* result exp. that has the MSB */
-					/* flipped and sign extended like in */
-					/* the IMPCR */
-	cmp	%r11, %r10, 127		/* Is exponent equal to IEEE 255 */
-					/* (here 127) */
-	bb1	ne,   %r11, inf		/* source 2 is not a NaN or infinity */
-	mak	%r10, %r7,  20<0>	/* load r10 with upper bits of S1 */
-					/* mantissa */
-	extu	%r11, %r8,  3<29>	/* get 3 upper bits of lower word */
-	or	%r11, %r10, %r11	/* combine any existing 1''s */
-	bcnd	eq0,  %r11, noS2NaNs	/* since r11 can only hold 0 or a > 0 */
-					/* number, branch to noS2NaNs */
-					/* when eq0 */
-	br.n	_ASM_LABEL(NaN)		/* branch to NaN routine */
-	 set	%r12, %r12, 1<s2nan>	/* indicate that s2 has a NaN */
-ASLOCAL(noS2NaNs)
-	bb0	s1nan, %r12, 1f		/* branch to NaN if S1 is a NaN */
-	br	_ASM_LABEL(NaN)
-1:
-	br.n	_ASM_LABEL(infinity)	/* If S1 had a NaN we would have */
-					/* already branched, and S2 does not */
-					/* have a NaN, but it does have an */
-					/* infinity, so branch to handle the */
-					/* finity */
-	 set	%r12, %r12, 1<s2inf>	/* indicate that S2 has an infinity */
-
-ASLOCAL(S2NaNdoub)
-	xor	%r10, %r10, 0x0400	/* precision is the same IEEE 11 bits */
-					/* The above instruction gives a */
-					/* result exp. that has the MSB */
-					/* flipped and sign extended like in */
-					/* the IMPCR */
-	cmp	%r11, %r10, 1023	/* Is exp. equal to IEEE 2047 */
-					/* (internal 1023) */
-	bb1	ne,   %r11, inf		/* source 2 is not a NaN or infinity */
-	mak	%r10, %r7, 20<0>	/* load r10 with upper bits of S2 */
-					/* mantissa */
-	or	%r11, %r8,  %r10	/* combine existing 1''s of mantissa */
-	bcnd	eq0,  %r11, noS2NaNd	/* since r11 can only hold 0 or a > 0 */
-					/* number, branch to noS2NaNd */
-					/* when eq0 */
-	br.n	_ASM_LABEL(NaN)		/* branch to NaN routine */
-	 set	%r12, %r12, 1<s2nan>	/* indicate that s2 has a NaN */
-ASLOCAL(noS2NaNd)
-	bb0	s1nan, %r12, 1f		/* branch to NaN if S1 is a NaN */
-	br	_ASM_LABEL(NaN)
-1:
-	br.n	_ASM_LABEL(infinity)	/* If S1 had a NaN we would have */
-					/* already branched, and S2 does not */
-					/* have a NaN, but it does have an */
-					/* infinity, so branch to handle the */
-					/* finity */
-	 set	%r12, %r12, 1<s2inf>	/* indicate that S2 has an infinity */
-
-/*
- * If S2 was a NaN, the routine would have already branched to NaN. If S1
- * is a NaN, then branch to NaN. If S1 is not a NaN and S2 is infinity, then
- * we would have already branched to infinity. If S1 is infinity, then branch.
- * If the routine still has not branched, then branch to denorm, the only
- * reserved operand left.
- */
-
-ASLOCAL(inf)
-	bb0	s1nan, %r12, 1f		/* branch if S1 has a NaN and S2 does */
-					/* not */
-	br	_ASM_LABEL(NaN)
-1:
-	bb0	s1inf, %r12, 2f		/* Neither S1 or S2 has a NaN, and we */
-					/* would have branched already if S2 */
-					/* had an infinity, so branch if S1 */
-					/* is infinity */
-	br	_ASM_LABEL(infinity)
-2:
-	br	_ASM_LABEL(denorm)	/* branch to denorm, the only */
-					/* remaining alternative */
-
-/*
- * If either S1 or S2 is a signalling NaN, then set the invalid operation
- * bit of the FPSR.
- * If S1 is the only NaN or one of two NaN''s, then write
- * a quiet S1 to the result. A signalling NaN must be made quiet before
- * it can be written, but a signalling S2 is not modified in this routine
- * if S1 is a NaN.
- */
-ASLOCAL(NaN)
-	bb0.n	s1nan, %r12, S2sigcheck		/* S1 is not a NaN */
-	 st	%r1,  %r31,  0			/* save return address */
-	bb1	sigbit, %r5, S2sigcheck		/* S1 is not a signaling NaN */
-	set	%r2,  %r2,  1<oper>
-	br.n	S1write				/* FPSR bit already set, S1 is */
-						/* made quiet, and since we */
-						/* always write S1 if it is */
-						/* a NaN, write S1 and skip */
-						/* rest of routine */
-	 set	%r5,  %r5,  1<sigbit>		/* make S1 a quiet NaN */
-
-ASLOCAL(S2sigcheck)
-	bb0	s2nan, %r12, S1write		/* S2 is not a NaN */
-	bb1	sigbit, %r7, S1write		/* S2 is not a signaling NaN */
-	set	%r2,  %r2,  1<oper>
-	set	%r7,  %r7,  1<sigbit>		/* make S2 a quiet NaN */
-
-/*
- * Write a single or double precision quiet NaN unless the opeation is FCMP.
- * If the operation is FCMP, then set the not comparable bit in the result.
- */
-ASLOCAL(S1write)
-	bb0	s1nan, %r12, S2write		/* do not write S1 */
-						/* if it is not a NaN */
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, FCMPop		/* compare to FCMP */
-	bb1	ne,   %r11, S1noFCMP		/* operation is not FCMP */
-	set	%r6,  %r0,  1<nc>		/* set the not comparable bit */
-	br.n	FPnan_return
-	 set	%r6,  %r6,  1<ne>		/* set the not equal bit */
-ASLOCAL(S1noFCMP)
-	bb1.n	dsize, %r9, wrdoubS1		/* double destination */
-	 set	%r5,  %r5,  11<20>		/* set all exponent bits to 1 */
-/*
- * The single result will be formed the same way whether S1 is a single or
- * double.
- */
-ASLOCAL(wrsingS1)
-	mak	%r10, %r5,  28<3>		/* wipe out extra exponent */
-						/* bits */
-	extu	%r11, %r6,  3<29>		/* get lower three bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* combine all of result */
-						/* except sign */
-	clr	%r6,  %r5,  31<0>		/* clear all but sign */
-	br.n	FPnan_return
-	 or	%r6,  %r6,  %r10		/* form result */
-
-ASLOCAL(wrdoubS1)
-	set	%r6,  %r6,  29<0>		/* set extra bits of lower */
-						/* word */
-	br	FPnan_return			/* no modification necessary */
-						/* for writing double to */
-						/* double, so return */
-
-ASLOCAL(S2write)
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, FCMPop		/* compare to FCMP */
-	bb1.n	ne,   %r11, S2noFCMP		/* operation is not FCMP */
-	 set	%r7,  %r7,  11<20>		/* set all exponent bits to 1 */
-	set	%r6,  %r0,  1<nc>		/* set the not comparable bit */
-	br.n	FPnan_return
-	 set	%r6,  %r6,  1<ne>		/* set the not equal bit */
-ASLOCAL(S2noFCMP)
-	bb1.n	dsize, %r9, wrdoubS2		/* double destination */
-	 set	%r5,  %r5,  11<20>		/* set all exponent bits to 1 */
-/*
- * The single result will be formed the same way whether S1 is a single or
- * double.
- */
-ASLOCAL(wrsingS2)
-	mak	%r10, %r7,  28<3>		/* wipe out extra exponent */
-						/* bits */
-	extu	%r11, %r8,  3<29>		/* get lower three bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* combine all of result */
-						/* except sign */
-	clr	%r6,  %r7,  31<0>		/* clear all but sign */
-	br.n	FPnan_return
-	 or	%r6,  %r6,  %r10		/* form result */
-
-ASLOCAL(wrdoubS2)
-	set	%r6,  %r8,  29<0>		/* set extra bits of lower */
-						/* word */
-
-/* Return from this subroutine with the result. */
-
-ASLOCAL(FPnan_return)
-						/* no modification necessary */
-						/* for writing double to */
-						/* double, so return */
-	ld	%r1,  %r31,  0			/* retrieve return address */
-	jmp	%r1
-
-/*
- * infinity
- */
-
-/*
- * Extract the opcode, compare to a constant, and branch to the code
- * for the instruction.
- */
-
-ASLOCAL(infinity)
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, FADDop		/* compare to FADD */
-	bb1.n	eq,   %r11, FADD		/* operation is FADD */
-	 st	%r1,  %r31, 0			/* save return address */
-	cmp	%r11, %r10, FSUBop		/* compare to FSUB */
-	bb1	eq,   %r11, FSUB		/* operation is FSUB */
-	cmp	%r11, %r10, FCMPop		/* compare to FCMP */
-	bb1	eq,   %r11, FCMP		/* operation is FCMP */
-	cmp	%r11, %r10, FMULop		/* compare to FMUL */
-	bb1	eq,   %r11, FMUL		/* operation is FMUL */
-	cmp	%r11, %r10, FDIVop		/* compare to FDIV */
-	bb1	eq,   %r11, FDIV		/* operation is FDIV */
-#if 0
-	cmp	%r11, %r10, FSQRTop		/* compare to FSQRT */
-	bb1	eq,   %r11, FSQRT		/* operation is FSQRT */
-#endif
-	cmp	%r11, %r10, INTop		/* compare to INT */
-	bb1	eq,   %r11, FP_inf_overflw	/* operation is INT */
-	cmp	%r11, %r10, NINTop		/* compare to NINT */
-	bb1	eq,   %r11, FP_inf_overflw	/* operation is NINT */
-	cmp	%r11, %r10, TRNCop		/* compare to TRNC */
-	bb1	eq,   %r11, FP_inf_overflw	/* operation is TRNC */
-
-/*
- * Adding infinities of opposite signs will cause an exception,
- * but all other operands will result in a correctly signed infinity.
- */
-
-FADD:
-	bb0	s1inf, %r12, addS2write		/* branch if S1 not infinity */
-	bb0	s2inf, %r12, addS1write		/* S2 is not inf., so branch */
-						/* to write S1 */
-	bb1	sign, %r5, addS1neg		/* handle case of S1 negative */
-addS1pos:
-	bb1	sign, %r7, excpt		/* adding infinities of */
-						/* different signs causes an */
-						/* exception */
-	br	poswrinf			/* branch to write positive */
-						/* infinity */
-addS1neg:
-	bb0	sign, %r7, excpt		/* adding infinities of */
-						/* different signs causes an */
-						/* exception */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-addS1write:
-	bb0	sign, %r5, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-addS2write:
-	bb0	sign, %r7, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-
-/*
- * Subtracting infinities of the same sign will cause an exception,
- * but all other operands will result in a correctly signed infinity.
- */
-
-FSUB:
-	bb0	s1inf, %r12, subS2write		/* branch if S1 not infinity */
-	bb0	s2inf, %r12, subS1write		/* S2 is not inf., so branch */
-						/* to write S1 */
-	bb1	sign, %r5, subS1neg		/* handle case of S1 negative */
-subS1pos:
-	bb0	sign, %r7, excpt		/* subtracting infinities of */
-						/* the same sign causes an */
-						/* exception */
-	br	poswrinf			/* branch to write positive */
-						/* infinity */
-subS1neg:
-	bb1	sign, %r7, excpt		/* subtracting infinities of */
-						/* the same sign causes an */
-						/* exception */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-subS1write:
-	bb0	sign, %r5, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-subS2write:
-	bb1	sign, %r7, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-
-/*
- * Compare the operands, at least one of which is infinity, and set the
- * correct bits in the destination register.
- */
-
-FCMP:
-	bb0.n	s1inf, %r12, FCMPS1f		/* branch for finite S1 */
-	 set	%r4,  %r0,  1<cp>		/* since neither S1 or S2 is */
-						/* a NaN, set cp */
-FCMPS1i:
-	bb1	sign, %r5, FCMPS1ni		/* branch to negative S1i */
-FCMPS1pi:
-	bb0	s2inf, %r12, FCMPS1piS2f	/* branch to finite S2 */
-						/* with S1pi */
-FCMPS1piS2i:
-	bb1	sign, %r7, FCMPS1piS2ni		/* branch to negative S2i */
-						/* with S1pi */
-FCMPS1piS2pi:
-	set	%r4,  %r4, 1<eq>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	set	%r4,  %r4, 1<ge>		/* set ge bit */
-	set	%r4,  %r4, 1<ib>		/* set ib bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1piS2ni:
-	set	%r4,  %r4, 1<ne>		/* set ne bit */
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-FCMPS1piS2f:
-	set	%r4,  %r4, 1<ne>		/* set ne bit */
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	bsr.n	_ASM_LABEL(zero)		/* see if any of the operands */
-						/* are zero */
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-	bb0	s2zero, %r12, FCMPS1piS2nz	/* check for negative if s2 */
-						/* not zero */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1piS2nz:
-	bb1	sign, %r7, move			/* return if s2 is negative */
-FCMPS1piS2pf:
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1ni:
-	bb0	s2inf, %r12, FCMPS1niS2f	/* branch to finite S2 */
-						/* with S1ni */
-FCMPS1niS2i:
-	bb1	sign, %r7, FCMPS1niS2ni		/* branch to negative S2i */
-						/* with S1ni */
-FCMPS1niS2pi:
-	set	%r4,  %r4, 1<ne>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	set	%r4,  %r4, 1<lt>		/* set lt bit */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1niS2ni:
-	set	%r4,  %r4, 1<eq>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-FCMPS1niS2f:
-	set	%r4,  %r4, 1<ne>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	bsr.n	_ASM_LABEL(zero)		/* see if any of the operands */
-						/* are zero */
-	 set	%r4,  %r4, 1<lt>		/* set lt bit */
-	bb0	s2zero, %r12, FCMPS1niS2nz	/* branch if s2 is not zero */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1niS2nz:
-	bb1	sign, %r7, move			/* return if s2 is negative */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1f:
-	bb1	sign, %r5, FCMPS1nf		/* branch to negative S1f */
-FCMPS1pf:
-	bb1.n	sign, %r7, FCMPS1pfS2ni		/* branch to negative S2i */
-						/* with S1pf */
-	 set	%r4,  %r4, 1<ne>		/* set ne bit */
-FCMPS1pfS2pi:
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	set	%r4,  %r4, 1<lt>		/* set lt bit */
-	bsr.n	_ASM_LABEL(zero)
-	 set	%r4,  %r4, 1<ib>		/* set ib bit */
-	bb0	s1zero, %r12, FCMPS1pfS2pinozero
-FCMPS1pfS2pizero:
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1pfS2pinozero:
-	br.n	move
-	 set	%r4,  %r4, 1<in>		/* set in bit */
-FCMPS1pfS2ni:
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-FCMPS1nf:
-	bb1.n	sign, %r7, FCMPS1nfS2ni		/* branch to negative S2i */
-						/* with S1nf */
-	 set	%r4,  %r4, 1<ne>		/* set ne bit */
-	set	%r4,  %r4, 1<le>		/* set gt bit */
-	set	%r4,  %r4, 1<lt>		/* set ge bit */
-	bsr.n	_ASM_LABEL(zero)		/* see which of the operands */
-						/* are zero */
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-	bb0	s1zero, %r12, FCMPS1nfS2pinozero /* no ls and lo */
-FCMPS1nfS2pizero:
-	br.n	move
-	 set	%r4,  %r4, 1<ib>		/* set ib bit */
-FCMPS1nfS2pinozero:
-	br.n	move
-	 set	%r4,  %r4, 1<ou>		/* set ou bit */
-FCMPS1nfS2ni:
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	set	%r4,  %r4, 1<ge>		/* set ge bit */
-
-move:
-	br.n	inf_return
-	 or	%r6,  %r0, %r4			/* transfer answer to r6 */
-/*
- * Multiplying infinity and zero causes an exception, but all other
- * operations produce a correctly signed infinity.
- */
-
-FMUL:
-	bsr	_ASM_LABEL(zero)		/* see if any of the operands */
-						/* are zero */
-	bb1	s1zero, %r12, excpt		/* infinity X 0 causes an */
-						/* exception */
-	bb1	s2zero, %r12, excpt		/* infinity X 0 causes an */
-						/* exception */
-	bb1	sign, %r5, FMULS1neg		/* handle negative cases */
-						/* of S1 */
-	bb0	sign, %r7, poswrinf		/* + X + = + */
-	br	negwrinf			/* + X - = - */
-FMULS1neg:
-	bb1	sign, %r7, poswrinf		/* - X - = + */
-	br	negwrinf			/* - X + = - */
-
-/*
- * Dividing infinity by infinity causes an exception, but dividing
- * infinity by a finite yields a correctly signed infinity, and
- * dividing a finite by an infinity produces a correctly signed zero.
- */
-
-FDIV:
-	bb1	s1inf, %r12, FDIVS1inf		/* handle case of S1 being */
-						/* infinity */
-	bb1	sign, %r5, FDIVS1nf		/* handle cases of S1 being */
-						/* neg. non-inf. */
-	bb1	sign, %r7, FDIVS1pfS2mi		/* handle case of negative S2 */
-FDIVS1pfS2pi:
-	br	poswrzero			/* +f / +inf = +0 */
-FDIVS1pfS2mi:
-	br	negwrzero			/* +f / -inf = -0 */
-FDIVS1nf:
-	bb1	sign, %r7, FDIVS1nfS2mi		/* handle case of negative S2 */
-FDIVS1nfS2pi:
-	br	negwrzero			/* -f / +inf = -0 */
-FDIVS1nfS2mi:
-	br	poswrzero			/* -f / -inf = +0 */
-FDIVS1inf:
-	bb1	s2inf, %r12, excpt		/* inf / inf = exception */
-	bb1	sign, %r5, FDIVS1mi		/* handle cases of S1 being */
-						/* neg. inf. */
-	bb1	sign, %r7, FDIVS1piS2nf		/* handle case of negative S2 */
-FDIVS1piS2pf:
-	br	poswrinf			/* +inf / +f = +inf */
-FDIVS1piS2nf:
-	br	negwrinf			/* +inf / -f = -inf */
-FDIVS1mi:
-	bb1	sign, %r7, FDIVS1miS2nf		/* handle case of negative S2 */
-FDIVS1miS2pf:
-	br	negwrinf			/* -inf / +f = -inf */
-FDIVS1miS2nf:
-	br	poswrinf			/* -inf / -f = +inf */
-
-/*
- * The square root of positive infinity is positive infinity,
- * but the square root of negative infinity is a NaN.
- */
-
-#if 0
-FSQRT:
-	bb0	sign, %r7, poswrinf		/* write sqrt(inf) = inf */
-	br	excpt				/* write sqrt(-inf) = NaN */
-#endif
-
-excpt:
-	set	%r2,  %r2, 1<oper>
-	set	%r5,  %r0, 0<0>			/* write NaN into r5 */
-	br.n	inf_return
-	 set	%r6,  %r0, 0<0>			/* write NaN into r6, writing */
-						/* NaN''s into both of these */
-						/* registers is quicker than */
-						/* checking for single or */
-						/* double precision */
-
-/* Write positive infinity of the correct precision */
-
-poswrinf:
-	bb1	dsize, %r9, poswrinfd		/* branch to write double */
-						/* precision inf. */
-	br.n	inf_return
-	 or.u	%r6,  %r0, 0x7f80		/* load r6 with single */
-						/* precision pos inf. */
-poswrinfd:
-	or.u	%r5,  %r0, 0x7ff0		/* load double precision */
-						/* pos inf. */
-	br.n	inf_return
-	 or	%r6,  %r0, %r0
-
-/* Write negative infinity of the correct precision */
-
-negwrinf:
-	bb1	dsize, %r9, negwrinfd		/* branch to write double */
-						/* precision inf. */
-	br.n	inf_return
-	 or.u	%r6,  %r0, 0xff80		/* load r6 with single */
-						/* precision neg inf. */
-negwrinfd:
-	or.u	%r5,  %r0, 0xfff0		/* load double precision */
-						/* neg inf. */
-	br.n	inf_return
-	 or	%r6,  %r0, %r0
-
-/* Write a positive zero disregarding precision. */
-
-poswrzero:
-	or	%r5,  %r0, %r0			/* write to both high word */
-						/* and low word now */
-	br.n	inf_return			/* it does not matter that */
-						/* both are written */
-	 or	%r6,  %r0, %r0
-
-/* Write a negative zero of the correct precision. */
-
-negwrzero:
-	or	%r6,  %r0, %r0			/* clear low word */
-	bb1	dsize, %r9, negwrzerod		/* branch to write double */
-						/* precision zero */
-	br.n	inf_return
-	 set	%r6,  %r6, 1<31>		/* set sign bit */
-negwrzerod:
-	or	%r5,  %r0, %r0			/* clear high word */
-	br.n	inf_return
-	 set	%r5,  %r5, 1<31>		/* set sign bit */
-
-FP_inf_overflw:
-	set	%r2,  %r2, 1<oper>
-	set	%r2,  %r2, 1<overflow>
-	set	%r2,  %r2, 1<inexact>
-
-	bb0.n	sign, %r7, inf_return		/* if positive then return */
-
-	 set	%r6,  %r6, 31<0>		/* set result to largest */
-						/* positive integer */
-	or.c	%r6,  %r0, %r6			/* negate r6, giving largest */
-						/* negative int. */
-
-inf_return:
-	ld	%r1,  %r31, 0			/* load return address */
-	jmp	%r1
-
-/*
- * denorm
- */
-
-/*
- * Check to see if either S1 or S2 is a denormalized number. First
- * extract the exponent to see if it is zero, and then check to see if
- * the mantissa is not zero. If the number is denormalized, then set the
- * 1 or 0 bit 10 %r12.
- */
-
-ASLOCAL(denorm)
-	st	%r1,  %r31, 0			/* save return address */
-dnmcheckS1:
-	extu	%r10, %r5,  11<20>		/* extract exponent */
-	bcnd	ne0,  %r10, dnmsetS2		/* S1 is not a denorm, so S2 */
-						/* must be */
-	bb1.n	9,    %r9,  dnmcheckS1d		/* S1 is double precision */
-	 mak	%r10, %r5,  20<3>		/* mak field with only */
-						/* mantissa bits */
-dnmcheckS1s:
-	extu	%r11, %r6,  3<29>		/* get three low bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* assemble all of the */
-						/* mantissa bits */
-	bcnd	eq0,  %r10, dnmsetS2		/* S1 is not a denorm, so S2 */
-						/* must be */
-	br	dnmsetS1			/* S1 is a denorm */
-
-dnmcheckS1d:
-	or	%r10, %r6,  %r10		/* or all of mantissa bits */
-	bcnd	eq0,  %r10, dnmsetS2		/* S1 is not a denorm, so S2 */
-						/* must be */
-dnmsetS1:
-	set	%r12, %r12, 1<1>		/* S1 is a denorm */
-
-dnmcheckS2:
-	extu	%r10, %r7,  11<20>		/* extract exponent */
-	bcnd	ne0,  %r10, S1form		/* S2 is not a denorm */
-	bb1.n	7,    %r9,  dnmcheckS2d		/* S2 is double precision */
-	 mak	%r10, %r7,  20<3>		/* mak field with only */
-						/* mantissa bits */
-dnmcheckS2s:
-	extu	%r11, %r8,  3<29>		/* get three low bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* assemble all of the */
-						/* mantissa bits */
-	bcnd	eq0,  %r10, S1form		/* S2 is not a denorm */
-	br	dnmsetS2			/* S1 is a denorm */
-dnmcheckS2d:
-	or	%r10, %r8,  %r10		/* or all or mantissa bits */
-	bcnd	eq0,  %r10, S1form		/* S2 is not a denorm */
-dnmsetS2:
-	set	%r12, %r12, 1<0>		/* S2 is a denorm */
-
-/*
- * Since the operations are going to be reperformed with modified denorms,
- * the operands which were initially single precision need to be modified
- * back to single precision.
- */
-
-S1form:
-	bb1	9,    %r9,  S2form		/* S1 is double precision, so */
-						/* do not modify S1 into */
-						/* single format */
-	mak	%r11, %r5,  28<3>		/* over final exponent and */
-						/* mantissa, eliminating */
-						/* extra 3 bits of exponent */
-	extu	%r6,  %r6,  3<29>		/* get low 3 bits of mantissa */
-	or	%r11, %r6,  %r11		/* form complete mantissa and */
-						/* exponent */
-	extu	%r10, %r5,  1<31>		/* get the 31 bit */
-	mak	%r10, %r10, 1<31>		/* place 31 bit into correct */
-						/* position */
-	or	%r6,  %r10, %r11		/* or 31, exponent, and all */
-						/* of mantissa */
-
-S2form:
-	bb1	7,    %r9,  checkop		/* S2 is double precision, so */
-						/* do not modify S2 into */
-						/* single format */
-	mak	%r11, %r7,  28<3>		/* over final exponent and */
-						/* mantissa, eliminating */
-						/* extra 3 bits of exponent */
-	extu	%r8,  %r8,  3<29>		/* get low 3 bits of mantissa */
-	or	%r11, %r8,  %r11		/* form complete mantissa and */
-						/* exponent */
-	extu	%r10, %r7,  1<31>		/* get the 31 bit */
-	mak	%r10, %r10, 1<31>		/* place 31 bit into correct */
-						/* position */
-	or	%r8,  %r10, %r11		/* or 31, exponent, and all */
-						/* of mantissa */
-
-/*
- * Extract the opcode, compare to a constant, and branch to the code that
- * deals with that opcode.
- */
-
-checkop:
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, 0x05		/* compare to FADD */
-	bb1	2,    %r11, denorm_FADD		/* operation is FADD */
-	cmp	%r11, %r10, 0x06		/* compare to FSUB */
-	bb1	2,    %r11, denorm_FSUB		/* operation is FSUB */
-	cmp	%r11, %r10, 0x07		/* compare to FCMP */
-	bb1	2,    %r11, denorm_FCMP		/* operation is FCMP */
-	cmp	%r11, %r10, 0x00		/* compare to FMUL */
-	bb1	2,    %r11, denorm_FMUL		/* operation is FMUL */
-	cmp	%r11, %r10, 0x0e		/* compare to FDIV */
-	bb1	2,    %r11, denorm_FDIV		/* operation is FDIV */
-#if 0
-	cmp	%r11, %r10, 0x0f		/* compare to FSQRT */
-	bb1	2,    %r11, denorm_FSQRT	/* operation is FSQRT */
-#endif
-	cmp	%r11, %r10, 0x09		/* compare to INT */
-	bb1	2,    %r11, denorm_INT		/* operation is INT */
-	cmp	%r11, %r10, 0x0a		/* compare to NINT */
-	bb1	2,    %r11, denorm_NINT		/* operation is NINT */
-	cmp	%r11, %r10, 0x0b		/* compare to TRNC */
-	bb1	2,    %r11, denorm_TRNC		/* operation is TRNC */
-
-/*
- * For all the following operations, the denormalized number is set to
- * zero and the operation is reperformed the correct destination and source
- * sizes.
- */
-
-denorm_FADD:
-	bb0	1,   %r12, FADDS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FADDS2chk:
-	bb0	0,   %r12, FADDcalc		/* S2 is not a denorm */
-FADDS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FADDcalc:
-	bb1	5,   %r9,  FADDdD		/* branch for double */
-						/* precision destination */
-FADDsD:
-	bb1	9,   %r9,  FADDsDdS1		/* branch for double */
-						/* precision S1 */
-FADDsDsS1:
-	bb1	7,   %r9,  FADDsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FADDsDsS1sS2:
-	br.n	denorm_return
-	 fadd.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDsDsS1dS2:
-	br.n	denorm_return
-	 fadd.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FADDsDdS1:
-	bb1	7,   %r9,  FADDsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FADDsDdS1sS2:
-	br.n	denorm_return
-	 fadd.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDsDdS1dS2:
-	br.n	denorm_return
-	 fadd.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-FADDdD:
-	bb1	9,   %r9,  FADDdDdS1		/* branch for double */
-						/* precision S1 */
-FADDdDsS1:
-	bb1	7,   %r9,  FADDdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FADDdDsS1sS2:
-	br.n	denorm_return
-	 fadd.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDdDsS1dS2:
-	br.n	denorm_return
-	 fadd.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FADDdDdS1:
-	bb1	7,   %r9,  FADDdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FADDdDdS1sS2:
-	br.n	denorm_return
-	 fadd.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDdDdS1dS2:
-	br.n	denorm_return
-	 fadd.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FSUB:
-	bb0	1,   %r12, FSUBS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FSUBS2chk:
-	bb0	0,   %r12, FSUBcalc		/* S2 is not a denorm */
-FSUBS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FSUBcalc:
-	bb1	5,   %r9,  FSUBdD		/* branch for double */
-						/* precision destination */
-FSUBsD:
-	bb1	9,   %r9,  FSUBsDdS1		/* branch for double */
-						/* precision S1 */
-FSUBsDsS1:
-	bb1	7,   %r9,  FSUBsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBsDsS1sS2:
-	br.n	denorm_return
-	 fsub.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBsDsS1dS2:
-	br.n	denorm_return
-	 fsub.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSUBsDdS1:
-	bb1	7,   %r9,  FSUBsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBsDdS1sS2:
-	br.n	denorm_return
-	 fsub.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBsDdS1dS2:
-	br.n	denorm_return
-	 fsub.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSUBdD:
-	bb1	9,   %r9,  FSUBdDdS1		/* branch for double */
-						/* precision S1 */
-FSUBdDsS1:
-	bb1	7,   %r9,  FSUBdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBdDsS1sS2:
-	br.n	denorm_return
-	 fsub.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBdDsS1dS2:
-	br.n	denorm_return
-	 fsub.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSUBdDdS1:
-	bb1	7,   %r9,  FSUBdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBdDdS1sS2:
-	br.n	denorm_return
-	 fsub.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBdDdS1dS2:
-	br.n	denorm_return
-	 fsub.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FCMP:
-	bb0	1,   %r12, FCMPS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FCMPS2chk:
-	bb0	0,   %r12, FCMPcalc		/* S2 is not a denorm */
-FCMPS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FCMPcalc:
-	bb1	9,   %r9,  FCMPdS1		/* branch for double */
-						/* precision S1 */
-FCMPsS1:
-	bb1	7,   %r9,  FCMPsS1dS2		/* branch for double */
-						/* precision S2 */
-FCMPsS1sS2:
-	br.n	denorm_return
-	 fcmp.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FCMPsS1dS2:
-	br.n	denorm_return
-	 fcmp.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FCMPdS1:
-	bb1	7,   %r9,  FCMPdS1dS2		/* branch for double */
-						/* precision S2 */
-FCMPdS1sS2:
-	br.n	denorm_return
-	 fcmp.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FCMPdS1dS2:
-	br.n	denorm_return
-	 fcmp.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FMUL:
-	bb0	1,   %r12, FMULS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FMULS2chk:
-	bb0	0,   %r12, FMULcalc		/* S2 is not a denorm */
-FMULS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FMULcalc:
-	bb1	5,   %r9,  FMULdD		/* branch for double */
-						/* precision destination */
-FMULsD:
-	bb1	9,   %r9,  FMULsDdS1		/* branch for double */
-						/* precision S1 */
-FMULsDsS1:
-	bb1	7,   %r9,  FMULsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FMULsDsS1sS2:
-	br.n	denorm_return
-	 fmul.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULsDsS1dS2:
-	br.n	denorm_return
-	 fmul.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FMULsDdS1:
-	bb1	7,   %r9,  FMULsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FMULsDdS1sS2:
-	br.n	denorm_return
-	 fmul.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULsDdS1dS2:
-	br.n	denorm_return
-	 fmul.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-FMULdD:
-	bb1	9,   %r9,  FMULdDdS1		/* branch for double */
-						/* precision S1 */
-FMULdDsS1:
-	bb1	7,   %r9,  FMULdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FMULdDsS1sS2:
-	br.n	denorm_return
-	 fmul.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULdDsS1dS2:
-	br.n	denorm_return
-	 fmul.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FMULdDdS1:
-	bb1	7,   %r9,  FMULdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FMULdDdS1sS2:
-	br.n	denorm_return
-	 fmul.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULdDdS1dS2:
-	br.n	denorm_return
-	 fmul.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FDIV:
-	bb0	1,   %r12, FDIVS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FDIVS2chk:
-	bb0	0,   %r12, FDIVcalc		/* S2 is not a denorm */
-FDIVS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FDIVcalc:
-	bb1	5,   %r9,  FDIVdD		/* branch for double */
-						/* precision destination */
-FDIVsD:
-	bb1	9,   %r9,  FDIVsDdS1		/* branch for double */
-						/* precision S1 */
-FDIVsDsS1:
-	bb1	7,   %r9,  FDIVsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVsDsS1sS2:
-	fdiv.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVsDsS1dS2:
-	fdiv.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVsDdS1:
-	bb1	7,   %r9,  FDIVsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVsDdS1sS2:
-	fdiv.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVsDdS1dS2:
-	fdiv.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdD:
-	bb1	9,   %r9,  FDIVdDdS1		/* branch for double */
-						/* precision S1 */
-FDIVdDsS1:
-	bb1	7,   %r9,  FDIVdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVdDsS1sS2:
-	fdiv.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdDsS1dS2:
-	fdiv.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdDdS1:
-	bb1	7,   %r9,  FDIVdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVdDdS1sS2:
-	fdiv.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdDdS1dS2:
-	fdiv.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-
-#if 0
-denorm_FSQRT:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FSQRTcalc:
-	bb1	5,   %r9,  FSQRTdD		/* branch for double */
-						/* precision destination */
-FSQRTsD:
-	bb1	7,   %r9,  FSQRTsDdS2		/* branch for double */
-						/* precision S2 */
-FSQRTsDsS2:
-	br.n	denorm_return
-	 fsqrt.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSQRTsDdS2:
-	br.n	denorm_return
-	 fsqrt.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSQRTdD:
-	bb1	7,   %r9,  FSQRTdDdS2		/* branch for double */
-						/* precision S2 */
-FSQRTdDsS2:
-	br.n	denorm_return
-	 fsqrt.ds %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSQRTdDdS2:
-	br.n	denorm_return
-	 fsqrt.dd %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-#endif
-
-denorm_INT:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-INTcalc:
-	bb1	7,   %r9,  INTdS2		/* branch for double */
-						/* precision S2 */
-INTsS2:
-	br.n	denorm_return
-	 int.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-INTdS2:
-	br.n	denorm_return
-	 int.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_NINT:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-NINTcalc:
-	bb1	7,   %r9,  NINTdS2		/* branch for double */
-						/* precision S2 */
-NINTsS2:
-	br.n	denorm_return
-	 nint.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-NINTdS2:
-	br.n	denorm_return
-	 nint.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_TRNC:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-TRNCcalc:
-	bb1	7,   %r9,  TRNCdS2		/* branch for double */
-						/* precision S2 */
-TRNCsS2:
-	br.n	denorm_return
-	 trnc.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-TRNCdS2:
-	trnc.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-/* Return to the routine that detected the reserved operand. */
-
-denorm_return:
-	ld	%r1, %r31, 0			/* load return address */
-	jmp	%r1
-
-/*
- * S1 and/or S2 is an infinity, and the other operand may be a zero.
- * Knowing which operands are infinity, check the remaining operands for zeros.
- */
-
-ASLOCAL(zero)
-	bb0	s1inf, %r12, S1noinf		/* see if S1 is zero */
-	bb0	s2inf, %r12, S2noinf		/* see if S2 is zero */
-	jmp	%r1
-
-/*
- * See if S1 is zero. Whether or not S1 is a zero, being in this routine
- * implies that S2 is infinity, so return to subroutine infinity after
- * completing this code. Set the s1zero flag in %r12 if S1 is zero.
- */
-
-S1noinf:
-	bb1	s1size, %r9, S1noinfd		/* work with double precision */
-						/* operand */
-S1noinfs:
-	or	%r10, %r0,  %r5			/* load high word into r10 */
-	clr	%r10, %r10, 1<sign>		/* clear the sign bit */
-	extu	%r11, %r6,  3<29>		/* extract lower 3 bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* or these 3 bits with high */
-						/* word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	jmp.n	%r1				/* since this operand was not */
-						/* infinity, S2 must have */
-						/* been, so return */
-	 set	%r12, %r12, 1<s1zero>		/* set zeroflag */
-S1noinfd:
-	clr	%r10, %r5,  1<sign>		/* clear the sign bit */
-	or	%r10, %r6,  %r10		/* or high and low word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	jmp.n	%r1				/* since this operand was not */
-						/* infinity, S2 must have */
-						/* been, so return */
-	 set	%r12, %r12, 1<s1zero>		/* set zeroflag */
-
-/* Check S2 for zero. If it is zero, then set the s2zero flag in r12. */
-
-S2noinf:
-	bb1	s2size, %r9, S2noinfd		/* work with double precision */
-						/* operand */
-S2noinfs:
-	or	%r10, %r0,  %r7			/* load high word into r10 */
-	clr	%r10, %r10, 1<sign>		/* clear the sign bit */
-	extu	%r11, %r8,  3<29>		/* extract lower 3 bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* or these 3 bits with high */
-						/* word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	jmp.n	%r1				/* since this operand was not */
-						/* infinity, S1 must have */
-						/* been, so return */
-	 set	%r12, %r12, 1<s2zero>		/* set zeroflag */
-S2noinfd:
-	clr	%r10, %r7,  1<sign>		/* clear the sign bit */
-	or	%r10, %r8,  %r10		/* or high and low word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	set	%r12, %r12, 1<s2zero>		/* set zeroflag */
-						/* since this operand was not */
-						/* infinity, S1 must have */
-						/* been, so return */
-operation:
-	jmp	%r1
diff --git a/sys/arch/m88k/m88k/m88100_fp.c b/sys/arch/m88k/m88k/m88100_fp.c
new file mode 100644
index 00000000000..9a5d79590d2
--- /dev/null
+++ b/sys/arch/m88k/m88k/m88100_fp.c
@@ -0,0 +1,345 @@
+/*	$OpenBSD: m88100_fp.c,v 1.1 2014/06/09 16:26:32 miod Exp $	*/
+
+/*
+ * Copyright (c) 2007, 2014, Miodrag Vallat.
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice, this permission notice, and the disclaimer below
+ * appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#include <sys/types.h>
+#include <sys/param.h>
+#include <sys/proc.h>
+#include <sys/signalvar.h>
+#include <sys/systm.h>
+
+#include <machine/fpu.h>
+#include <machine/frame.h>
+#include <machine/ieeefp.h>
+#include <machine/trap.h>
+#include <machine/m88100.h>
+
+#include <lib/libkern/softfloat.h>
+
+#include <m88k/m88k/fpu.h>
+
+int	m88100_fpu_emulate(struct trapframe *);
+void	m88100_fpu_fetch(struct trapframe *, u_int, u_int, u_int, fparg *);
+
+/*
+ * All 88100 precise floating-point exceptions are handled here.
+ *
+ * Apart from the `privilege violation' bit, the exception cause register
+ * does not drive the decision: the faulting operation is redone in software,
+ * and the cause bits are only used to pick the si_code of a resulting SIGFPE.
+ */
+
+void
+m88100_fpu_precise_exception(struct trapframe *frame)
+{
+	struct proc *p = curproc;
+	int fault_type;
+	vaddr_t fault_addr;
+	union sigval sv;
+	int sig;
+
+	fault_addr = frame->tf_sxip & XIP_ADDR;	/* sent with the signal */
+
+	/* if FPECR_FUNIMP is set, all other bits are undefined, ignore them */
+	if (ISSET(frame->tf_fpecr, FPECR_FUNIMP))
+		frame->tf_fpecr = FPECR_FUNIMP;
+
+	/* Reset the exception cause register */
+	__asm__ volatile ("fstcr %r0, %fcr0");
+
+	if (ISSET(frame->tf_fpecr, FPECR_FPRV)) {
+		sig = SIGILL;
+		fault_type = ILL_PRVREG;
+	} else {
+		sig = m88100_fpu_emulate(frame);
+		fault_type = SI_NOINFO;	/* refined below if sig != 0 */
+	}
+
+	/*
+	 * Update the floating point status register regardless of
+	 * whether we'll deliver a signal or not.
+	 */
+	__asm__ volatile ("fstcr %0, %%fcr62" :: "r"(frame->tf_fpsr));
+
+	if (sig != 0) {
+		if (sig == SIGILL) {
+			if (fault_type == SI_NOINFO)	/* from emulation */
+				fault_type = ILL_ILLOPC;
+		} else {
+			if (frame->tf_fpecr & FPECR_FIOV)
+				fault_type = FPE_FLTSUB;
+			else if (frame->tf_fpecr & FPECR_FROP)
+				fault_type = FPE_FLTINV;
+			else if (frame->tf_fpecr & FPECR_FDVZ)
+				fault_type = FPE_INTDIV; /* XXX FPE_FLTDIV? */
+			else if (frame->tf_fpecr & FPECR_FUNF) {
+				if (frame->tf_fpsr & FPSR_EFUNF)
+					fault_type = FPE_FLTUND;
+				else if (frame->tf_fpsr & FPSR_EFINX)
+					fault_type = FPE_FLTRES;
+			} else if (frame->tf_fpecr & FPECR_FOVF) {
+				if (frame->tf_fpsr & FPSR_EFOVF)
+					fault_type = FPE_FLTOVF;
+				else if (frame->tf_fpsr & FPSR_EFINX)
+					fault_type = FPE_FLTRES;
+			} else if (frame->tf_fpecr & FPECR_FINX)
+				fault_type = FPE_FLTRES;
+		}
+
+		sv.sival_ptr = (void *)fault_addr;
+		KERNEL_LOCK();
+		trapsignal(p, sig, 0, fault_type, sv);
+		KERNEL_UNLOCK();
+	}
+}
+
+/*
+ * Load source operand `operandno' (1 is S1, otherwise S2) from the trapframe
+ * tf_fphs/tf_fpls words into a fparg union, converting it from its original
+ * format (orig_width) to the computation format (width) when they differ.
+ * This assumes the final format (width) is not FTYPE_INT, and the original
+ * format (orig_width) is FTYPE_INT or a precision no larger than width.
+ */
+void
+m88100_fpu_fetch(struct trapframe *frame, u_int operandno, u_int orig_width,
+    u_int width, fparg *dest)
+{
+	u_int32_t tmp;
+
+	switch (orig_width) {
+	case FTYPE_INT:
+		tmp = operandno == 1 ? frame->tf_fpls1 : frame->tf_fpls2;
+		switch (width) {
+		case FTYPE_SNG:
+			dest->sng = int32_to_float32(tmp);
+			break;
+		case FTYPE_DBL:
+			dest->dbl = int32_to_float64(tmp);
+			break;
+		}
+		break;
+	case FTYPE_SNG:
+		tmp = operandno == 1 ? frame->tf_fphs1 : frame->tf_fphs2;
+		switch (width) {
+		case FTYPE_SNG:
+			dest->sng = tmp;	/* XXX raw IEEE single? */
+			break;
+		case FTYPE_DBL:
+			dest->dbl = float32_to_float64(tmp);
+			break;
+		}
+		break;
+	case FTYPE_DBL:
+		tmp = operandno == 1 ? frame->tf_fphs1 : frame->tf_fphs2;
+		dest->dbl = ((float64)tmp) << 32;	/* high word first */
+		tmp = operandno == 1 ? frame->tf_fpls1 : frame->tf_fpls2;
+		dest->dbl |= (float64)tmp;
+		break;
+	}
+}
+
+/*
+ * Emulate the FPU instruction described by tf_fppt, updating the trapframe
+ * as the hardware would have.  Returns 0, or SIGILL/SIGFPE to be delivered.
+ */
+int
+m88100_fpu_emulate(struct trapframe *frame)
+{
+	u_int rd, t1, t2, td, tmax, opcode;
+	u_int32_t old_fpsr, old_fpcr;
+	int rc;
+
+	fparg arg1, arg2, dest;
+
+	/*
+	 * Crack the instruction.
+	 */
+	rd = frame->tf_fppt & 0x1f;		/* destination register */
+	opcode = (frame->tf_fppt >> 11) & 0x1f;	/* operation code */
+	t1 = (frame->tf_fppt >> 9) & 0x03;	/* operand 1 format */
+	t2 = (frame->tf_fppt >> 7) & 0x03;	/* operand 2 format */
+	td = (frame->tf_fppt >> 5) & 0x03;	/* destination format */
+
+	if (rd == 0)	/* r0 not allowed as destination */
+		return (SIGILL);
+
+	switch (opcode) {
+	case 0x00:	/* fmul */
+	case 0x05:	/* fadd */
+	case 0x06:	/* fsub */
+	case 0x0e:	/* fdiv */
+		if ((t1 != FTYPE_SNG && t1 != FTYPE_DBL) ||
+		    (t2 != FTYPE_SNG && t2 != FTYPE_DBL) ||
+		    (td != FTYPE_SNG && td != FTYPE_DBL))
+			return (SIGILL);
+		break;
+	case 0x04:	/* flt */
+		if ((td != FTYPE_SNG && td != FTYPE_DBL) ||
+		    t2 != 0x00 || t1 != 0x00)
+			return (SIGILL);
+		break;
+	case 0x07:	/* fcmp */
+		if ((t1 != FTYPE_SNG && t1 != FTYPE_DBL) ||
+		    (t2 != FTYPE_SNG && t2 != FTYPE_DBL) ||
+		    td != 0x00)
+			return (SIGILL);
+		break;
+	case 0x09:	/* int */
+	case 0x0a:	/* nint */
+	case 0x0b:	/* trnc */
+		if ((t2 != FTYPE_SNG && t2 != FTYPE_DBL) ||
+		    t1 != 0x00 || td != 0x00)
+			return (SIGILL);
+		break;
+	default:
+		return (SIGILL);
+	}
+
+	/*
+	 * Temporarily reset the status register, so that we can tell
+	 * which exceptions are new after processing the opcode.
+	 */
+	old_fpsr = frame->tf_fpsr;
+	frame->tf_fpsr = 0;
+
+	/*
+	 * Save fpcr as well, since we might need to change rounding mode
+	 * temporarily.
+	 */
+	old_fpcr = frame->tf_fpcr;
+
+	/*
+	 * The logic for instruction emulation is:
+	 *
+	 * - the computation precision is the largest one of all the operands.
+	 * - all source operands are converted to this precision if needed.
+	 * - computation is performed.
+	 * - the result is stored into the destination operand, converting it
+	 *   to the destination precision if lower.
+	 */
+
+	switch (opcode) {
+	case 0x00:	/* fmul */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_mul(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_mul(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+
+	case 0x04:	/* flt */
+		m88100_fpu_fetch(frame, 2, FTYPE_INT, td, &dest);
+		fpu_store(frame, rd, td, td, &dest);
+		break;
+
+	case 0x05:	/* fadd */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_add(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_add(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+
+	case 0x06:	/* fsub */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_sub(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_sub(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+
+	case 0x07:	/* fcmp */
+		tmax = fpu_precision(t1, t2, IGNORE_PRECISION);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		fpu_compare(frame, &arg1, &arg2, tmax, rd, 0);
+		break;
+
+	case 0x09:	/* int */
+do_int:
+		m88100_fpu_fetch(frame, 2, t2, t2, &dest);
+		fpu_store(frame, rd, t2, FTYPE_INT, &dest);
+		break;
+
+	case 0x0a:	/* nint */
+		/* round to nearest */
+		frame->tf_fpcr = (old_fpcr & ~(FPCR_RD_MASK << FPCR_RD_SHIFT)) |
+		    (FP_RN << FPCR_RD_SHIFT);
+		goto do_int;
+
+	case 0x0b:	/* trnc */
+		/* round towards zero */
+		frame->tf_fpcr = (old_fpcr & ~(FPCR_RD_MASK << FPCR_RD_SHIFT)) |
+		    (FP_RZ << FPCR_RD_SHIFT);
+		goto do_int;
+
+	case 0x0e:	/* fdiv */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_div(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_div(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+	}
+
+	/*
+	 * Mark new exceptions, if any, in the fpsr, and decide whether
+	 * to send a signal or not.
+	 */
+
+	if (frame->tf_fpsr & old_fpcr)	/* tf_fpsr only holds new bits here */
+		rc = SIGFPE;
+	else
+		rc = 0;
+	frame->tf_fpsr |= old_fpsr;	/* merge back the earlier bits */
+
+	/*
+	 * Restore fpcr as well.
+	 */
+	frame->tf_fpcr = old_fpcr;
+
+	return (rc);
+}
diff --git a/sys/arch/m88k/m88k/m88110_fp.c b/sys/arch/m88k/m88k/m88110_fp.c
index ee04e7a1d9c..7b60277d657 100644
--- a/sys/arch/m88k/m88k/m88110_fp.c
+++ b/sys/arch/m88k/m88k/m88110_fp.c
@@ -1,4 +1,4 @@
-/*	$OpenBSD: m88110_fp.c,v 1.9 2014/03/29 18:09:29 guenther Exp $	*/
+/*	$OpenBSD: m88110_fp.c,v 1.10 2014/06/09 16:26:32 miod Exp $	*/
 
 /*
  * Copyright (c) 2007, Miodrag Vallat.
@@ -31,58 +31,10 @@
 
 #include <lib/libkern/softfloat.h>
 
-/*
- * Values for individual bits in fcmp results.
- */
-#define	CC_UN	0x00000001	/* unordered */
-#define	CC_LEG	0x00000002	/* less than, equal or greater than */
-#define	CC_EQ	0x00000004	/* equal */
-#define	CC_NE	0x00000008	/* not equal */
-#define	CC_GT	0x00000010	/* greater than */
-#define	CC_LE	0x00000020	/* less than or equal */
-#define	CC_LT	0x00000040	/* less than */
-#define	CC_GE	0x00000080	/* greater than or equal */
-#define	CC_OU	0x00000100	/* out of range */
-#define	CC_IB	0x00000200	/* in range or on boundary */
-#define	CC_IN	0x00000400	/* in range */
-#define	CC_OB	0x00000800	/* out of range or on boundary */
-#define	CC_UE	0x00001000	/* unordered or equal */
-#define	CC_LG	0x00002000	/* less than or greater than */
-#define	CC_UG	0x00004000	/* unordered or greater than */
-#define	CC_ULE	0x00008000	/* unordered or less than or equal */
-#define	CC_UL	0x00010000	/* unordered or less than */
-#define	CC_UGE	0x00020000	/* unordered or greater than or equal */
-
-/*
- * Data width (matching the TD field of the instructions)
- */
-#define	FTYPE_SNG	0
-#define	FTYPE_DBL	1
-#define	FTYPE_EXT	2
-#define	FTYPE_INT	3	/* not a real T value */
-
-#define	IGNORE_PRECISION	FTYPE_SNG
-
-/* floating point value */
-typedef union {
-	float32		sng;
-	float64		dbl;
-} fparg;
+#include <m88k/m88k/fpu.h>
 
-void	fpu_compare(struct trapframe *, fparg *, fparg *, u_int, u_int, u_int);
-int	fpu_emulate(struct trapframe *, u_int32_t);
-void	fpu_fetch(struct trapframe *, u_int, u_int, u_int, fparg *);
-u_int	fpu_precision(u_int, u_int, u_int);
-void	fpu_store(struct trapframe *, u_int, u_int, u_int, fparg *);
-
-/*
- * Inlines from softfloat-specialize.h which are not made public, needed
- * for fpu_compare.
- */
-#define	float32_is_nan(a) \
-	(0xff000000 < (a << 1))
-#define	float32_is_signaling_nan(a) \
-	((((a >> 22) & 0x1ff) == 0x1fe) && (a & 0x003fffff))
+int	m88110_fpu_emulate(struct trapframe *, u_int32_t);
+void	m88110_fpu_fetch(struct trapframe *, u_int, u_int, u_int, fparg *);
 
 /*
  * All 88110 floating-point exceptions are handled there.
@@ -171,7 +123,7 @@ m88110_fpu_exception(struct trapframe *frame)
 			fault_type = FPE_FLTINV;
 			goto deliver;
 		}
-		sig = fpu_emulate(frame, insn);
+		sig = m88110_fpu_emulate(frame, insn);
 		fault_type = SI_NOINFO;
 		/*
 		 * Update the floating point status register regardless of
@@ -229,8 +181,8 @@ deliver:
  * format (orig_width) <= width.
  */
 void
-fpu_fetch(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
-    fparg *dest)
+m88110_fpu_fetch(struct trapframe *frame, u_int regno, u_int orig_width,
+    u_int width, fparg *dest)
 {
 	u_int32_t tmp;
 
@@ -267,83 +219,11 @@ fpu_fetch(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
 }
 
 /*
- * Store a floating-point result, converting it to the required format if it
- * is of smaller precision.
- *
- * This assumes the original format (orig_width) is not FTYPE_INT, and the
- * final format (width) <= orig_width.
- */
-void
-fpu_store(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
-    fparg *src)
-{
-	u_int32_t tmp;
-	u_int rd;
-
-	switch (width) {
-	case FTYPE_INT:
-		rd = float_get_round(frame->tf_fpcr);
-		switch (orig_width) {
-		case FTYPE_SNG:
-			if (rd == FP_RZ)
-				tmp = float32_to_int32_round_to_zero(src->sng);
-			else
-				tmp = float32_to_int32(src->sng);
-			break;
-		case FTYPE_DBL:
-			if (rd == FP_RZ)
-				tmp = float64_to_int32_round_to_zero(src->dbl);
-			else
-				tmp = float64_to_int32(src->dbl);
-			break;
-		}
-		if (regno != 0)
-			frame->tf_r[regno] = tmp;
-		break;
-	case FTYPE_SNG:
-		switch (orig_width) {
-		case FTYPE_SNG:
-			tmp = src->sng;
-			break;
-		case FTYPE_DBL:
-			tmp = float64_to_float32(src->dbl);
-			break;
-		}
-		if (regno != 0)
-			frame->tf_r[regno] = tmp;
-		break;
-	case FTYPE_DBL:
-		switch (orig_width) {
-		case FTYPE_DBL:
-			tmp = (u_int32_t)(src->dbl >> 32);
-			if (regno != 0)
-				frame->tf_r[regno] = tmp;
-			tmp = (u_int32_t)src->dbl;
-			if (regno != 31)
-				frame->tf_r[regno + 1] = tmp;
-			break;
-		}
-		break;
-	}
-}
-
-/*
- * Return the largest precision of all precision inputs.
- *
- * This assumes none of the inputs is FTYPE_INT.
- */
-u_int
-fpu_precision(u_int ts1, u_int ts2, u_int td)
-{
-	return max(td, max(ts1, ts2));
-}
-
-/*
  * Emulate an FPU instruction.  On return, the trapframe registers
  * will be modified to reflect the settings the hardware would have left.
  */
 int
-fpu_emulate(struct trapframe *frame, u_int32_t insn)
+m88110_fpu_emulate(struct trapframe *frame, u_int32_t insn)
 {
 	u_int rf, rd, rs1, rs2, t1, t2, td, tmax, opcode;
 	u_int32_t old_fpsr, old_fpcr;
@@ -442,8 +322,8 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 	switch (opcode) {
 	case 0x00:	/* fmul */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_mul(arg1.sng, arg2.sng);
@@ -457,19 +337,19 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 
 	case 0x01:	/* fcvt */
 		tmax = fpu_precision(IGNORE_PRECISION, t2, td);
-		fpu_fetch(frame, rs2, t2, tmax, &dest);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &dest);
 		fpu_store(frame, rd, tmax, td, &dest);
 		break;
 
 	case 0x04:	/* flt */
-		fpu_fetch(frame, rs2, FTYPE_INT, td, &dest);
+		m88110_fpu_fetch(frame, rs2, FTYPE_INT, td, &dest);
 		fpu_store(frame, rd, td, td, &dest);
 		break;
 
 	case 0x05:	/* fadd */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_add(arg1.sng, arg2.sng);
@@ -483,8 +363,8 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 
 	case 0x06:	/* fsub */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_sub(arg1.sng, arg2.sng);
@@ -498,14 +378,14 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 
 	case 0x07:	/* fcmp, fcmpu */
 		tmax = fpu_precision(t1, t2, IGNORE_PRECISION);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		fpu_compare(frame, &arg1, &arg2, tmax, rd, td /* fcmpu */);
 		break;
 
 	case 0x09:	/* int */
 do_int:
-		fpu_fetch(frame, rs2, t2, t2, &dest);
+		m88110_fpu_fetch(frame, rs2, t2, t2, &dest);
 		fpu_store(frame, rd, t2, FTYPE_INT, &dest);
 		break;
 
@@ -523,8 +403,8 @@ do_int:
 
 	case 0x0e:	/* fdiv */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_div(arg1.sng, arg2.sng);
@@ -538,7 +418,7 @@ do_int:
 
 	case 0x0f:	/* sqrt */
 		tmax = fpu_precision(IGNORE_PRECISION, t2, td);
-		fpu_fetch(frame, rs2, t2, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg1);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_sqrt(arg1.sng);
@@ -569,167 +449,3 @@ do_int:
 
 	return (rc);
 }
-
-/*
- * Perform a compare instruction (fcmp, fcmpu).
- *
- * If either operand is NaN, the result is unordered.  This causes an
- * reserved operand exception (except for nonsignalling NaNs for fcmpu).
- */
-void
-fpu_compare(struct trapframe *frame, fparg *s1, fparg *s2, u_int width,
-    u_int rd, u_int fcmpu)
-{
-	u_int32_t cc;
-	int zero, s1positive, s2positive;
-
-	/*
-	 * Handle NaNs first, and raise invalid if fcmp or signaling NaN.
-	 */
-	switch (width) {
-	case FTYPE_SNG:
-		if (float32_is_nan(s1->sng)) {
-			if (!fcmpu || float32_is_signaling_nan(s1->sng))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		if (float32_is_nan(s2->sng)) {
-			if (!fcmpu || float32_is_signaling_nan(s2->sng))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		break;
-	case FTYPE_DBL:
-		if (float64_is_nan(s1->dbl)) {
-			if (!fcmpu || float64_is_signaling_nan(s1->dbl))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		if (float64_is_nan(s2->dbl)) {
-			if (!fcmpu || float64_is_signaling_nan(s2->dbl))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		break;
-	}
-
-	/*
-	 * Now order the two numbers.
-	 */
-	switch (width) {
-	case FTYPE_SNG:
-		if (float32_eq(s1->sng, s2->sng))
-			cc = CC_EQ;
-		else if (float32_lt(s1->sng, s2->sng))
-			cc = CC_LT | CC_NE;
-		else
-			cc = CC_GT | CC_NE;
-		break;
-	case FTYPE_DBL:
-		if (float64_eq(s1->dbl, s2->dbl))
-			cc = CC_EQ;
-		else if (float64_lt(s1->dbl, s2->dbl))
-			cc = CC_LT | CC_NE;
-		else
-			cc = CC_GT | CC_NE;
-		break;
-	}
-
-done:
-
-	/*
-	 * Complete condition code mask.
-	 */
-
-	if (cc & CC_UN)
-		cc |= CC_UE | CC_UG | CC_ULE | CC_UL | CC_UGE;
-	if (cc & CC_EQ)
-		cc |= CC_LE | CC_GE | CC_UE;
-	if (cc & CC_GT)
-		cc |= CC_GE;
-	if (cc & CC_LT)
-		cc |= CC_LE;
-	if (cc & (CC_LT | CC_GT))
-		cc |= CC_LG;
-	if (cc & (CC_LT | CC_GT | CC_EQ))
-		cc |= CC_LEG;
-	if (cc & CC_GT)
-		cc |= CC_UG;
-	if (cc & CC_LE)
-		cc |= CC_ULE;
-	if (cc & CC_LT)
-		cc |= CC_UL;
-	if (cc & CC_GE)
-		cc |= CC_UGE;
-
-	/*
-	 * Fill the interval bits.
-	 * s1 is compared to the interval [0, s2].
-	 */
-	if (!(cc & CC_UN)) {
-		if (cc & CC_EQ) {
-			/* if s1 and s2 are equal, s1 is on boundary */
-			cc |= CC_IB | CC_OB;
-			goto completed;
-		}
-
-		/* s1 and s2 are either Zero, numbers or Inf */
-		switch (width) {
-		case FTYPE_SNG:
-			zero = float32_eq(s1->sng, 0);
-			break;
-		case FTYPE_DBL:
-			zero = float64_eq(s1->dbl, 0LL);
-			break;
-		}
-		if (zero) {
-			/* if s1 is zero, it is on boundary */
-			cc |= CC_IB | CC_OB;
-			goto completed;
-		}
-
-		switch (width) {
-		case FTYPE_SNG:
-			s1positive = s1->sng >> 31 == 0;
-			s2positive = s2->sng >> 31 == 0;
-			break;
-		case FTYPE_DBL:
-			s1positive = s1->dbl >> 63 == 0;
-			s2positive = s2->dbl >> 63 == 0;
-			break;
-		}
-		if (s2positive) {
-			/* s2 is positive, the interval is [0, s2] */
-			if (cc & CC_GT) {
-				/* 0 <= s2 < s1 -> out of interval */
-				cc |= CC_OU | CC_OB;
-			} else if (s1positive) {
-				/* 0 < s1 < s2 -> in interval */
-				cc |= CC_IB | CC_IN;
-			} else {
-				/* s1 < 0 <= s2 */
-				cc |= CC_OU | CC_OB;
-			}
-		} else {
-			/* s2 is negative, the interval is [s2, 0] */
-			if (cc & CC_LT) {
-				/* s1 < s2 <= 0 */
-				cc |= CC_OU | CC_OB;
-			} else if (!s1positive) {
-				/* s2 < s1 < 0 */
-				cc |= CC_IB | CC_IN;
-			} else {
-				/* s2 < 0 < s1 */
-				cc |= CC_OU | CC_OB;
-			}
-		}
-	}
-
-completed:
-	if (rd != 0)
-		frame->tf_r[rd] = cc;
-}
diff --git a/sys/arch/m88k/m88k/trap.c b/sys/arch/m88k/m88k/trap.c
index 302efe39490..0e1dec19918 100644
--- a/sys/arch/m88k/m88k/trap.c
+++ b/sys/arch/m88k/m88k/trap.c
@@ -1,4 +1,4 @@
-/*	$OpenBSD: trap.c,v 1.97 2014/06/09 14:33:20 miod Exp $	*/
+/*	$OpenBSD: trap.c,v 1.98 2014/06/09 16:26:32 miod Exp $	*/
 /*
  * Copyright (c) 2004, Miodrag Vallat.
  * Copyright (c) 1998 Steve Murphree, Jr.
@@ -506,10 +506,9 @@ user_fault:
 		break;
 	case T_FPEPFLT+T_USER:
 		m88100_fpu_precise_exception(frame);
-		goto maysigfpe;
+		goto userexit;
 	case T_FPEIFLT+T_USER:
 		m88100_fpu_imprecise_exception(frame);
-maysigfpe:
 		/* Check for a SIGFPE condition */
 		if (frame->tf_fpsr & frame->tf_fpcr) {
 			sig = SIGFPE;
@@ -616,6 +615,7 @@ maysigfpe:
 		frame->tf_ipfsr = frame->tf_dpfsr = 0;
 	}
 
+userexit:
 	userret(p);
 }
 #endif /* M88100 */
author	miod <miod@openbsd.org>	2014-06-09 16:26:32 +0000
committer	miod <miod@openbsd.org>	2014-06-09 16:26:32 +0000
commit	af421d72ce5387c9dfb0050c65afb3f1be689da3 (patch)
tree	a19a10d528e1311fadec189e654f76237dc71077
parent	Remove redundant regdump() output. (diff)
download	wireguard-openbsd-af421d72ce5387c9dfb0050c65afb3f1be689da3.tar.xz wireguard-openbsd-af421d72ce5387c9dfb0050c65afb3f1be689da3.zip