10 files changed, 732 insertions, 2137 deletions
diff --git a/sys/arch/aviion/conf/Makefile.aviion b/sys/arch/aviion/conf/Makefile.aviion
index 749079ca0b7..bde4c65043a 100644
--- a/sys/arch/aviion/conf/Makefile.aviion
+++ b/sys/arch/aviion/conf/Makefile.aviion
@@ -1,4 +1,4 @@
-#	$OpenBSD: Makefile.aviion,v 1.45 2014/05/08 22:17:33 miod Exp $
+#	$OpenBSD: Makefile.aviion,v 1.46 2014/06/09 16:26:32 miod Exp $
 
 # For instructions on building kernels consult the config(8) and options(4)
 # manual pages.
@@ -143,7 +143,7 @@ db_structinfo.h: $S/ddb/db_structinfo.c $S/ddb/parse_structinfo.pl
 	rm -f db_structinfo.o
 
 locore.o: ${_machdir}/${_mach}/locore.S assym.h
-eh.o m88100_fp.o mutex.o process.o subr.o: assym.h
+eh.o m88100_fp_imp.o mutex.o process.o subr.o: assym.h
 
 # The install target can be redefined by putting a
 # install-kernel-${MACHINE_NAME} target into /etc/mk.conf
diff --git a/sys/arch/luna88k/conf/Makefile.luna88k b/sys/arch/luna88k/conf/Makefile.luna88k
index abe39b556e1..22d551e682f 100644
--- a/sys/arch/luna88k/conf/Makefile.luna88k
+++ b/sys/arch/luna88k/conf/Makefile.luna88k
@@ -1,4 +1,4 @@
-#	$OpenBSD: Makefile.luna88k,v 1.53 2014/05/08 22:17:33 miod Exp $
+#	$OpenBSD: Makefile.luna88k,v 1.54 2014/06/09 16:26:32 miod Exp $
 
 # For instructions on building kernels consult the config(8) and options(4)
 # manual pages.
@@ -143,7 +143,7 @@ db_structinfo.h: $S/ddb/db_structinfo.c $S/ddb/parse_structinfo.pl
 	rm -f db_structinfo.o
 
 locore.o: ${_machdir}/${_mach}/locore.S assym.h
-eh.o m88100_fp.o mutex.o process.o subr.o: assym.h
+eh.o m88100_fp_imp.o mutex.o process.o subr.o: assym.h
 
 # The install target can be redefined by putting a
 # install-kernel-${MACHINE_NAME} target into /etc/mk.conf
diff --git a/sys/arch/m88k/conf/files.m88k b/sys/arch/m88k/conf/files.m88k
index 44679231cc2..ee78c974160 100644
--- a/sys/arch/m88k/conf/files.m88k
+++ b/sys/arch/m88k/conf/files.m88k
@@ -1,14 +1,16 @@
-#	$OpenBSD: files.m88k,v 1.26 2014/06/09 10:26:10 miod Exp $
+#	$OpenBSD: files.m88k,v 1.27 2014/06/09 16:26:32 miod Exp $
 
 file	arch/m88k/m88k/atomic.S				multiprocessor
 file	arch/m88k/m88k/db_disasm.c			ddb
 file	arch/m88k/m88k/db_interface.c			ddb
 file	arch/m88k/m88k/db_sstep.c			ddb
 file	arch/m88k/m88k/db_trace.c			ddb
+file	arch/m88k/m88k/fpu.c
 file	arch/m88k/m88k/in_cksum.c			inet
-file	arch/m88k/m88k/m88100_fp.S			m88100
+file	arch/m88k/m88k/m88100_fp.c			m88100
 file	arch/m88k/m88k/m88100_fp_imp.S			m88100
 file	arch/m88k/m88k/m88100_machdep.c			m88100
+file	arch/m88k/m88k/m88110_fp.c			m88110
 file	arch/m88k/m88k/m88110_mmu.S			m88110
 file	arch/m88k/m88k/m8820x_machdep.c			m88100
 file	arch/m88k/m88k/m88k_machdep.c
@@ -26,9 +28,7 @@ file	arch/m88k/m88k/vectors_88100.S			m88100
 file	arch/m88k/m88k/vectors_88110.S			m88110
 file	arch/m88k/m88k/vm_machdep.c
 
-# floating-point support code for 88110
-file	arch/m88k/m88k/m88110_fp.c			m88110
-file	lib/libkern/softfloat.c				m88110
+file	lib/libkern/softfloat.c
 
 file	lib/libkern/arch/m88k/divsi3.S
 file	lib/libkern/arch/m88k/modsi3.S
diff --git a/sys/arch/m88k/include/ieeefp.h b/sys/arch/m88k/include/ieeefp.h
index 1af791fc06e..540f3099dc8 100644
--- a/sys/arch/m88k/include/ieeefp.h
+++ b/sys/arch/m88k/include/ieeefp.h
@@ -1,4 +1,4 @@
-/*	$OpenBSD: ieeefp.h,v 1.4 2010/04/21 15:37:32 miod Exp $ */
+/*	$OpenBSD: ieeefp.h,v 1.5 2014/06/09 16:26:32 miod Exp $ */
 /*
  * Copyright (c) 1996 Nivas Madhur
  * All rights reserved.
@@ -56,7 +56,7 @@ typedef enum {
 #ifdef _KERNEL
 
 /*
- * Defines for the 88110 floating-point completion code.
+ * Defines for the floating-point completion code.
  */
 
 #include <sys/param.h>
@@ -83,6 +83,6 @@ countLeadingZeros32(u_int32_t a)
 	return (a != 0 ? 31 - rc : rc);
 }
 
-#endif
+#endif /* _KERNEL */
 
 #endif /* _M88K_IEEEFP_H_ */
diff --git a/sys/arch/m88k/m88k/fpu.c b/sys/arch/m88k/m88k/fpu.c
new file mode 100644
index 00000000000..69885828861
--- /dev/null
+++ b/sys/arch/m88k/m88k/fpu.c
@@ -0,0 +1,308 @@
+/*	$OpenBSD: fpu.c,v 1.1 2014/06/09 16:26:32 miod Exp $	*/
+
+/*
+ * Copyright (c) 2007, 2014, Miodrag Vallat.
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice, this permission notice, and the disclaimer below
+ * appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+/*
+ * Common bits between the 88100 and the 88110 floating point completion
+ * code.
+ */
+
+#include <sys/types.h>
+#include <sys/param.h>
+#include <sys/proc.h>
+
+#include <machine/fpu.h>
+#include <machine/frame.h>
+#include <machine/ieeefp.h>
+
+#include <lib/libkern/softfloat.h>
+
+#include <m88k/m88k/fpu.h>
+
+/*
+ * Values for individual bits in fcmp results.
+ */
+#define	CC_UN	0x00000001	/* unordered */
+#define	CC_LEG	0x00000002	/* less than, equal or greater than */
+#define	CC_EQ	0x00000004	/* equal */
+#define	CC_NE	0x00000008	/* not equal */
+#define	CC_GT	0x00000010	/* greater than */
+#define	CC_LE	0x00000020	/* less than or equal */
+#define	CC_LT	0x00000040	/* less than */
+#define	CC_GE	0x00000080	/* greater than or equal */
+#define	CC_OU	0x00000100	/* out of range */
+#define	CC_IB	0x00000200	/* in range or on boundary */
+#define	CC_IN	0x00000400	/* in range */
+#define	CC_OB	0x00000800	/* out of range or on boundary */
+/* the following only on 88110 */
+#define	CC_UE	0x00001000	/* unordered or equal */
+#define	CC_LG	0x00002000	/* less than or greater than */
+#define	CC_UG	0x00004000	/* unordered or greater than */
+#define	CC_ULE	0x00008000	/* unordered or less than or equal */
+#define	CC_UL	0x00010000	/* unordered or less than */
+#define	CC_UGE	0x00020000	/* unordered or greater than or equal */
+
+/*
+ * Inlines from softfloat-specialize.h which are not made public, needed
+ * for fpu_compare.
+ */
+#define	float32_is_nan(a) \
+	(0xff000000 < (a << 1))
+#define	float32_is_signaling_nan(a) \
+	((((a >> 22) & 0x1ff) == 0x1fe) && (a & 0x003fffff))
+
+/*
+ * Store a floating-point result, converting it to the required format if it
+ * is of smaller precision.
+ *
+ * This assumes the original format (orig_width) is not FTYPE_INT, and the
+ * final format (width) <= orig_width.
+ */
+void
+fpu_store(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
+    fparg *src)
+{
+	u_int32_t tmp;
+	u_int rd;
+
+	switch (width) {
+	case FTYPE_INT:
+		rd = float_get_round(frame->tf_fpcr);
+		switch (orig_width) {
+		case FTYPE_SNG:
+			if (rd == FP_RZ)
+				tmp = float32_to_int32_round_to_zero(src->sng);
+			else
+				tmp = float32_to_int32(src->sng);
+			break;
+		case FTYPE_DBL:
+			if (rd == FP_RZ)
+				tmp = float64_to_int32_round_to_zero(src->dbl);
+			else
+				tmp = float64_to_int32(src->dbl);
+			break;
+		}
+		if (regno != 0)
+			frame->tf_r[regno] = tmp;
+		break;
+	case FTYPE_SNG:
+		switch (orig_width) {
+		case FTYPE_SNG:
+			tmp = src->sng;
+			break;
+		case FTYPE_DBL:
+			tmp = float64_to_float32(src->dbl);
+			break;
+		}
+		if (regno != 0)
+			frame->tf_r[regno] = tmp;
+		break;
+	case FTYPE_DBL:
+		switch (orig_width) {
+		case FTYPE_DBL:
+			tmp = (u_int32_t)(src->dbl >> 32);
+			if (regno != 0)
+				frame->tf_r[regno] = tmp;
+			tmp = (u_int32_t)src->dbl;
+			if (regno != 31)
+				frame->tf_r[regno + 1] = tmp;
+			break;
+		}
+		break;
+	}
+}
+
+/*
+ * Return the largest precision of all precision inputs.
+ *
+ * This assumes none of the inputs is FTYPE_INT.
+ */
+u_int
+fpu_precision(u_int ts1, u_int ts2, u_int td)
+{
+	return max(td, max(ts1, ts2));
+}
+
+/*
+ * Perform a compare instruction (fcmp, fcmpu).
+ *
+ * If either operand is NaN, the result is unordered.  This causes an
+ * reserved operand exception (except for nonsignalling NaNs for fcmpu).
+ */
+void
+fpu_compare(struct trapframe *frame, fparg *s1, fparg *s2, u_int width,
+    u_int rd, u_int fcmpu)
+{
+	u_int32_t cc;
+	int zero, s1positive, s2positive;
+
+	/*
+	 * Handle NaNs first, and raise invalid if fcmp or signaling NaN.
+	 */
+	switch (width) {
+	case FTYPE_SNG:
+		if (float32_is_nan(s1->sng)) {
+			if (!fcmpu || float32_is_signaling_nan(s1->sng))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		if (float32_is_nan(s2->sng)) {
+			if (!fcmpu || float32_is_signaling_nan(s2->sng))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		break;
+	case FTYPE_DBL:
+		if (float64_is_nan(s1->dbl)) {
+			if (!fcmpu || float64_is_signaling_nan(s1->dbl))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		if (float64_is_nan(s2->dbl)) {
+			if (!fcmpu || float64_is_signaling_nan(s2->dbl))
+				float_set_invalid();
+			cc = CC_UN;
+			goto done;
+		}
+		break;
+	}
+
+	/*
+	 * Now order the two numbers.
+	 */
+	switch (width) {
+	case FTYPE_SNG:
+		if (float32_eq(s1->sng, s2->sng))
+			cc = CC_EQ;
+		else if (float32_lt(s1->sng, s2->sng))
+			cc = CC_LT | CC_NE;
+		else
+			cc = CC_GT | CC_NE;
+		break;
+	case FTYPE_DBL:
+		if (float64_eq(s1->dbl, s2->dbl))
+			cc = CC_EQ;
+		else if (float64_lt(s1->dbl, s2->dbl))
+			cc = CC_LT | CC_NE;
+		else
+			cc = CC_GT | CC_NE;
+		break;
+	}
+
+done:
+
+	/*
+	 * Complete condition code mask.
+	 */
+
+	if (cc & CC_UN)
+		cc |= CC_UE | CC_UG | CC_ULE | CC_UL | CC_UGE;
+	if (cc & CC_EQ)
+		cc |= CC_LE | CC_GE | CC_UE;
+	if (cc & CC_GT)
+		cc |= CC_GE;
+	if (cc & CC_LT)
+		cc |= CC_LE;
+	if (cc & (CC_LT | CC_GT))
+		cc |= CC_LG;
+	if (cc & (CC_LT | CC_GT | CC_EQ))
+		cc |= CC_LEG;
+	if (cc & CC_GT)
+		cc |= CC_UG;
+	if (cc & CC_LE)
+		cc |= CC_ULE;
+	if (cc & CC_LT)
+		cc |= CC_UL;
+	if (cc & CC_GE)
+		cc |= CC_UGE;
+
+	/*
+	 * Fill the interval bits.
+	 * s1 is compared to the interval [0, s2].
+	 */
+	if (!(cc & CC_UN)) {
+		if (cc & CC_EQ) {
+			/* if s1 and s2 are equal, s1 is on boundary */
+			cc |= CC_IB | CC_OB;
+			goto completed;
+		}
+
+		/* s1 and s2 are either Zero, numbers or Inf */
+		switch (width) {
+		case FTYPE_SNG:
+			zero = float32_eq(s1->sng, 0);
+			break;
+		case FTYPE_DBL:
+			zero = float64_eq(s1->dbl, 0LL);
+			break;
+		}
+		if (zero) {
+			/* if s1 is zero, it is on boundary */
+			cc |= CC_IB | CC_OB;
+			goto completed;
+		}
+
+		switch (width) {
+		case FTYPE_SNG:
+			s1positive = s1->sng >> 31 == 0;
+			s2positive = s2->sng >> 31 == 0;
+			break;
+		case FTYPE_DBL:
+			s1positive = s1->dbl >> 63 == 0;
+			s2positive = s2->dbl >> 63 == 0;
+			break;
+		}
+		if (s2positive) {
+			/* s2 is positive, the interval is [0, s2] */
+			if (cc & CC_GT) {
+				/* 0 <= s2 < s1 -> out of interval */
+				cc |= CC_OU | CC_OB;
+			} else if (s1positive) {
+				/* 0 < s1 < s2 -> in interval */
+				cc |= CC_IB | CC_IN;
+			} else {
+				/* s1 < 0 <= s2 */
+				cc |= CC_OU | CC_OB;
+			}
+		} else {
+			/* s2 is negative, the interval is [s2, 0] */
+			if (cc & CC_LT) {
+				/* s1 < s2 <= 0 */
+				cc |= CC_OU | CC_OB;
+			} else if (!s1positive) {
+				/* s2 < s1 < 0 */
+				cc |= CC_IB | CC_IN;
+			} else {
+				/* s2 < 0 < s1 */
+				cc |= CC_OU | CC_OB;
+			}
+		}
+	}
+
+#ifdef M88100
+	if (CPU_IS88100)
+		cc &= ~(CC_UE | CC_LG | CC_UG | CC_ULE | CC_UL | CC_UGE);
+#endif
+
+completed:
+	if (rd != 0)
+		frame->tf_r[rd] = cc;
+}
diff --git a/sys/arch/m88k/m88k/fpu.h b/sys/arch/m88k/m88k/fpu.h
new file mode 100644
index 00000000000..0e62030f789
--- /dev/null
+++ b/sys/arch/m88k/m88k/fpu.h
@@ -0,0 +1,42 @@
+/*	$OpenBSD: fpu.h,v 1.1 2014/06/09 16:26:32 miod Exp $	*/
+
+/*
+ * Copyright (c) 2014 Miodrag Vallat.
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+/*
+ * Internal defines for the floating-point completion code.
+ */
+
+/*
+ * Data width (matching the TD field of the instructions)
+ */
+#define	FTYPE_SNG	0
+#define	FTYPE_DBL	1
+#define	FTYPE_EXT	2
+#define	FTYPE_INT	3	/* not a real T value */
+
+#define	IGNORE_PRECISION	FTYPE_SNG
+
+/* floating point value */
+typedef union {
+	float32		sng;
+	float64		dbl;
+} fparg;
+
+void	fpu_compare(struct trapframe *, fparg *, fparg *, u_int, u_int, u_int);
+int	fpu_emulate(struct trapframe *, u_int32_t);
+u_int	fpu_precision(u_int, u_int, u_int);
+void	fpu_store(struct trapframe *, u_int, u_int, u_int, fparg *);
diff --git a/sys/arch/m88k/m88k/m88100_fp.S b/sys/arch/m88k/m88k/m88100_fp.S
deleted file mode 100644
index 6e4cbd40c62..00000000000
--- a/sys/arch/m88k/m88k/m88100_fp.S
+++ /dev/null
@@ -1,1816 +0,0 @@
-/* $OpenBSD: m88100_fp.S,v 1.10 2014/06/09 10:26:10 miod Exp $	*/
-/*
- * Mach Operating System
- * Copyright (c) 1991 Carnegie Mellon University
- * Copyright (c) 1991 OMRON Corporation
- * All Rights Reserved.
- *
- * Permission to use, copy, modify and distribute this software and its
- * documentation is hereby granted, provided that both the copyright
- * notice and this permission notice appear in all copies of the
- * software, derivative works or modified versions, and any portions
- * thereof, and that both notices appear in supporting documentation.
- *
- * CARNEGIE MELLON AND OMRON ALLOW FREE USE OF THIS SOFTWARE IN ITS "AS IS"
- * CONDITION.  CARNEGIE MELLON AND OMRON DISCLAIM ANY LIABILITY OF ANY KIND
- * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
- *
- * Carnegie Mellon requests users of this software to return to
- *
- *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
- *  School of Computer Science
- *  Carnegie Mellon University
- *  Pittsburgh PA 15213-3890
- *
- * any improvements or extensions that they make and grant Carnegie the
- * rights to redistribute these changes.
- */
-
-/* Floating point trouble routines */
-#include "assym.h"
-#include <machine/trap.h>
-#include <machine/asm.h>
-
-#define destsize 10
-
-/* Floating-Point Status Register bits */
-#define inexact		0
-#define overflow	1
-#define underflow	2
-#define divzero		3
-#define oper		4
-
-#define sign		31
-#define s1size		9
-#define s2size		7
-#define dsize		5
-
-#define FADDop		0x05
-#define FSUBop		0x06
-#define FCMPop		0x07
-#define FMULop		0x00
-#define FDIVop		0x0e
-#define FSQRTop		0x0f
-#define INTop		0x09
-#define NINTop		0x0a
-#define TRNCop		0x0b
-
-#define s1nan		7
-#define s2nan		6
-#define s1inf		5
-#define s2inf		4
-#define s1zero		3
-#define s2zero		2
-#define sigbit		19
-
-#define rndhi		15
-#define rndlo		14
-
-ENTRY(m88100_fpu_precise_exception)
-	or	%r29, %r2,  %r0		/* r29 is now the E.F. */
-	subu	%r31, %r31, 16
-	st	%r1,  %r31, 8
-	st	%r29, %r31, 12
-
-	ld	%r2,  %r29, EF_FPSR
-	ld	%r3,  %r29, EF_FPCR
-	ld	%r4,  %r29, EF_FPECR
-	ld	%r5,  %r29, EF_FPHS1
-	ld	%r6,  %r29, EF_FPLS1
-	ld	%r7,  %r29, EF_FPHS2
-	ld	%r8,  %r29, EF_FPLS2
-	ld	%r9,  %r29, EF_FPPT
-
-	/*
-	 * Load into %r1 the return address for the zero handlers. Looking at
-	 * FPECR, branch to the appropriate zero handler. However, if none of
-	 * the zero bits are enabled, then a floating point instruction was
-	 * issued with the floating point unit disabled. This will cause an
-	 * unimplemented opcode 0.
-	 */
-
-	or.u	%r1, %r0, %hi16(wrapup)	/* load return address of function */
-	or	%r1, %r1, %lo16(wrapup)
-
-	bb0	6, %r4, 3f		/* branch to FPunimp if bit set */
-	br	FPuimp
-3:
-	bb0	7, %r4, 4f		/* branch to FPintover if bit set */
-	br	FPintover
-4:
-#if 0
-	bb0	5, %r4, 5f		/* branch to FPpriviol if bit set */
-	br	FPpriviol
-#endif
-5:
-	bb0	4, %r4, 6f		/* branch to FPresoper if bit set */
-	br	FPresoper
-6:
-	bb0	3, %r4, 7f		/* branch to FPdivzero if bit set */
-	br	FPdivzero
-7:
-	or.u	%r4, %r4, 0xffff
-
-ASLOCAL(FPuimp)
-	subu	%r31, %r31, 16		/* allocate stack */
-	st	%r1,  %r31, 0		/* save return address */
-	or	%r2,  %r0,  T_FPEPFLT	/* load trap type */
-	bsr.n	_C_LABEL(m88100_trap)
-	 or	%r3,  %r29, %r0
-	ld	%r1,  %r31, 0		/* recover return address */
-	addu	%r31, %r31, 16		/* deallocate stack */
-	jmp	%r1
-
-	/*
-	 * To write back the results to the user registers, disable exceptions
-	 * and the floating point unit. Write FPSR and FPCR and load the SNIP
-	 * and SFIP.
-	 * r5 will contain the upper word of the result
-	 * r6 will contain the lower word of the result
-	 */
-
-ASLOCAL(wrapup)
-	FLUSH_PIPELINE		/* make sure all floating point operations */
-				/* have finished */
-	ldcr	%r10, %cr1	/* load the PSR */
-#if 0
-	set	%r10, %r10, 1<PSR_FPU_DISABLE_BIT>
-#endif
-	set	%r10, %r10, 1<PSR_INTERRUPT_DISABLE_BIT>
-	stcr	%r10, %cr1
-
-	ld	%r1,  %r31, 8
-	ld	%r29, %r31, 12
-	addu	%r31, %r31, 16
-
-	fstcr	%r2, FPSR		/* write revised value of FPSR... */
-	fstcr	%r3, FPCR		/* ...and FPCR... */
-	st	%r2, %r29, EF_FPSR	/* ...into the trapframe as well */
-	st	%r3, %r29, EF_FPCR
-
-	/* result writeback routine */
-	addu	%r3, %r29, EF_R0
-	extu	%r2, %r9,  5<0>		/* get 5 bits of destination register */
-	bb0	5,   %r9,  writesingle	/* branch if destination is single */
-
-/* writedouble here */
-	st	%r5, %r3[%r2]		/* write high word */
-	add	%r2, %r2, 1		/* for double, the low word is the */
-					/* unspecified register */
-	clr	%r2, %r2, 27<5>		/* perform equivalent of mod 32 */
-ASLOCAL(writesingle)
-	jmp.n	%r1
-	 st	%r6, %r3[%r2]		/* write low word into memory */
-
-/*
- * Check if the numerator is zero. If the numerator is zero, then handle
- * this instruction as you would a 0/0 invalid operation.
- */
-
-ASLOCAL(FPdivzero)
-	bb1.n	s1size, %r9, 1f		/* branch if numerator double */
-	 st	%r1,  %r31, 0		/* save return address */
-/* single number */
-	clr	%r10, %r5,  1<sign>	/* clear sign bit */
-	extu	%r11, %r6,  3<29>	/* grab upper bits of lower word */
-	or	%r10, %r10, %r11	/* combine ones of mantissa */
-	bcnd	eq0,  %r10, resoper	/* numerator is zero, handle */
-					/* reserved operand */
-	br	setbit			/* set divzero bit */
-1:
-/* double number */
-	clr	%r10, %r5,  1<sign>	/* clear sign bit */
-	or	%r10, %r10, %r6		/* or high and low words */
-	bcnd	ne0,  %r10, setbit	/* set divzero bit */
-
-/*
- * The numerator is zero, so handle the invalid operation by setting the
- * invalid operation bit and writing a quiet NaN to the destination.
- */
-
-ASLOCAL(resoper)
-	set	%r2, %r2, 1<oper>
-	set	%r5, %r0, 0<0>	/* put a NaN in high word */
-	set	%r6, %r0, 0<0>	/* put a NaN in low word */
-	br	FP_div_return	/* writing to a word which may be ignored */
-				/* is just as quick as checking the precision */
-				/* of the destination */
-
-/*
- * The operation is divide by zero, so set the divide by zero bit in the
- * FPSR.
- * Considering the sign of the numerator and zero, write a correctly
- * signed infinity of the proper precision into the destination.
- */
-
-setbit:
-	set	%r2, %r2, 1<divzero>
-	bb1	dsize, %r9, FPzero_double	/* branch to handle double result */
-FPzero_single:
-	clr	%r10, %r5, 31<0>	/* clear all of S1HI except sign bit */
-	xor	%r10, %r7, %r10		/* xor the sign bits of the operands */
-	or.u	%r6,  %r0, 0x7f80	/* load single precision infinity */
-	br.n	FP_div_return
-	 or	%r6,  %r6, %r10		/* load correctly signed infinity */
-
-FPzero_double:
-	clr	%r10, %r5, 31<0>	/* clear all of S1HI except sign bit */
-	xor	%r10, %r7, %r10		/* xor the sign bits of the operands */
-	or.u	%r5,  %r0, 0x7ff0	/* load double precision infinity */
-	or	%r5,  %r5, %r10		/* load correctly signed infinity */
-	or	%r6,  %r0, %r0		/* clear lower word of double */
-
-FP_div_return:
-	ld	%r1,  %r31, 0		/* load return address */
-	jmp	%r1
-
-/*
- * Both NINT and TRNC require a certain rounding mode, so check which
- * instruction caused the integer conversion overflow. Use a substitute
- * FPCR in %r1, and modify the rounding mode if the instruction is NINT
- * or TRNC.
- */
-ASLOCAL(FPintover)
-	extu	%r10, %r9,  5<11>	/* extract opcode */
-	cmp	%r11, %r10, INTop	/* see if instruction is INT */
-	st	%r1,  %r31, 0		/* save return address */
-	bb1.n	eq,   %r11, checksize	/* instruction is INT, do not modify */
-					/* rounding mode */
-	 or	%r1,  %r0,  %r3		/* load FPCR into r1 */
-	cmp	%r11, %r10, NINTop	/* see if instruction is NINT */
-	bb1	eq,   %r11, NINT	/* instruction is NINT */
-TRNC:
-	clr	%r1,  %r1,  2<rndlo>	/* clear rounding mode bits, */
-					/* instruction is TRNC */
-	br.n	checksize		/* branch to check size */
-	 set	%r1,  %r1,  1<rndlo>	/* make rounding mode round towards */
-					/* zero */
-NINT:
-	clr	%r1,  %r1,  2<rndlo>	/* make rounding mode round to */
-					/* nearest */
-
-/* See whether the source is single or double precision. */
-
-checksize:
-	bb1	s2size, %r9, checkdoub	/* S2 is double, branch to see if */
-					/* there is a false alarm */
-
-/*
- * An integer has more bits than the mantissa of a single precision floating
- * point number, so to check for false alarms (i.e. valid conversion), simply
- * check the exponents. False alarms are detected for 2**30 to (2**30) - 1
- * and -2**30 to -2**31. Only seven bits need to be looked at since an
- * exception will not occur for the other half of the numbering system.
- * To speed up the processing, first check to see if the exponent is 32 or
- * greater.
- *
- * This code was originally written for the exponent in the control
- * register to have the most significant bit (8 - single, 11 - double)
- * flipped and sign extended. For precise exceptions, however, the most
- * significant bit is only sign extended. Therefore, the code was chopped
- * up so that it would work for positive values of real exponent which were
- * only sign extended.
- */
-
-checksing:
-	extu	%r10, %r7, 7<20>/* internal representation for single */
-				/* precision is IEEE 8 bits sign extended */
-				/* to 11 bits; for real exp. = 30, the */
-				/* above instruction gives a result exp. */
-				/* that has the MSB flipped and sign */
-				/* extended like in the IMPCR */
-	cmp	%r11, %r10, 31	/* compare to 32, but exp. off by 1 */
-				/* these 2 instructions to speed up valid */
-				/* execution of valid cases */
-	bb1	ge,   %r11, overflw /* valid case, perform overflow routine */
-	bb1	sign, %r7, checksingn /* source operand is negative */
-
-/*
- * If the number is positve and the exponent is greater than 30, than it is
- * overflow.
- */
-checksingp:
-	cmp	%r10, %r10, 29		/* compare to 30, but exp. off by 1 */
-	bb1	gt,   %r10, overflw	/* no false alarm, its overflow */
-	br	conversionsp		/* finish single precision conversion */
-
-/*
- * If the number is negative, and the exponent is 30, or 31 with a mantissa
- * of 0, then it is a false alarm.
- */
-checksingn:
-	cmp	%r11, %r10, 30		/* compare to 31, but exp. off by 1 */
-	bb1	lt,   %r11, conversionsn/* exp. less than 31, so convert */
-	extu	%r10, %r8,  3<29>	/* get upper three bits of lower */
-					/* mantissa */
-	mak	%r12, %r7,  20<3>	/* get upper 20 bits of mantissa */
-	or	%r10, %r10, %r12	/* form complete mantissa */
-	bcnd	eq0,  %r10, conversionsn/* complete conversion if mantissa */
-					/* is 0 */
-	br	overflw			/* no false alarm, its overflow */
-
-/*
- * False alarms are detected for 2**30 to (2**30) - 1 and -2**30 to -2**31.
- * Only seven bits need to be looked at since an exception will not occur
- * for the other half of the numbering system.
- * To speed up the processing, first check to see if the exponent is 32 or
- * greater. Since there are more mantissa bits than integer bits, rounding
- * could cause overflow. (2**31) - 1 needs to be checked so that it does
- * not round to 2**31, and -2**31 needs to be checked in case it rounds to
- * -((2**31) + 1).
- */
-checkdoub:
-	extu	%r10, %r7, 10<20>/* internal representation for double */
-				/* precision is the same IEEE 11 bits */
-				/* for real exp. = 30, the */
-				/* above instruction gives a result exp. */
-				/* that has the MSB flipped and sign */
-				/* extended like in the IMPCR */
-	cmp	%r11, %r10, 31	/* compare to 32, but exp. off by 1 */
-				/* these 2 instructions to speed up valid */
-				/* execution of valid cases */
-	bb1	ge,   %r11, overflw /* valid case, perform overflow routine */
-	bb1	sign, %r7,  checkdoubn /* source operand is negative */
-
-/*
- * If the exponent is not 31, then the floating point number will be rounded
- * before the conversion is done. A branch table is set up with bits 4 and 3
- * being the rounding mode, and bits 2, 1, and 0 are the guard, round, and
- * sticky bits.
- */
-checkdoubp:
-	cmp	%r11, %r10, 30		/* compare to 31, but exponent is */
-					/* off by 1 */
-	bb1	eq,   %r11, overflw	/* no false alarm, it's overflow */
-	extu	%r12, %r8,  1<22>	/* get LSB for integer with exp. = 30 */
-	mak	%r12, %r12, 1<2>	/* start to set up field for branch */
-					/* table */
-	extu	%r11, %r8,  1<21>	/* get guard bit */
-	mak	%r11, %r11, 1<1>	/* set up field for branch table */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	extu	%r11, %r8,  21<0>	/* get bits for sticky bit */
-	bcnd	eq0,  %r11, nostickyp	/* do not set sticky */
-	set	%r12, %r12, 1<0>	/* set sticky bit */
-nostickyp:
-	rot	%r11, %r1,  0<rndlo>	/* shift rounding mode to 2 LSB''s */
-	mak	%r11, %r11, 2<3>	/* set up field, clear other bits */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	lda	%r12, %r0[%r12]		/* scale r12 */
-	or.u	%r12, %r12, %hi16(ptable)/* load pointer into table */
-	addu	%r12, %r12, %lo16(ptable)
-	jmp	%r12
-
-ptable:
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	paddone
-	br	conversiondp
-	br	conversiondp
-	br	paddone
-	br	paddone
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	conversiondp
-	br	paddone
-	br	paddone
-	br	paddone
-	br	conversiondp
-	br	paddone
-	br	paddone
-	br	paddone
-
-/*
- * Add one to the bit of the mantissa which corresponds to the LSB of an
- * integer. If the mantissa overflows, then there is a valid integer
- * overflow conversion; otherwise, the mantissa can be converted to the
- * integer.
- */
-paddone:
-	or	%r10, %r0,  %r0		/* clear r10 */
-	set	%r10, %r10, 1<22>	/* set LSB bit to 1 for adding */
-	addu.co	%r8,  %r8,  %r10	/* add the 1 obtained from rounding */
-	clr	%r11, %r7,  12<20>	/* clear exponent and sign */
-	addu.ci	%r11, %r0,  %r11	/* add carry */
-	bb1	20,   %r11, overflw	/* overflow to 2**31, abort the rest */
-	br.n	conversiondp		/* since the exp. was 30, and the exp.*/
-					/* did not round up to 31, the */
-					/* largest number that S2 could */
-					/* become is 2**31-1 */
-	 or	%r7,  %r0,  %r11	/* store r11 into r7 for conversion */
-
-/*
- * Now check for negative double precision sources. If the exponent is 30,
- * then convert the false alarm. If the exponent is 31, then check the
- * mantissa bits which correspond to integer bits. If any of them are a one,
- * then there is overflow. If they are zero, then check the guard, round,
- * and sticky bits.
- * Round toward zero and positive will not cause a roundup, but round toward
- * nearest and negative may, so perform those roundings. If there is no
- * overflow, then convert and return.
- */
-checkdoubn:
-	cmp	%r11, %r10, 29		/* compare to 30, but exp. off by 1 */
-	bb1	eq,   %r11, conversiondn/* false alarm if exp. = 30 */
-	extu	%r10, %r8,  11<21>	/* check upper bits of lower mantissa */
-	bcnd	ne0,  %r10, overflw	/* one of the bits is a 1, so oflow */
-	extu	%r10, %r7,  20<0>	/* check upper bits of upper mantissa */
-	bcnd	ne0,  %r10, overflw	/* one of the bits is a 1, so oflow */
-	bb0	rndlo, %r1, possround	/* rounding mode is either round near */
-					/* or round negative, which may cause */
-					/* a round */
-	br.n	FPintov_return		/* round positive, which will not */
-					/* cause a round */
-	 set	%r6,  %r0,  1<sign>
-possround:
-	extu	%r12, %r8,  1<20>	/* get guard bit */
-	extu	%r11, %r8,  20<0>	/* get bits for sticky bit */
-	bcnd.n	eq0,  %r11, nostickyn	/* do not set sticky */
-	 mak	%r12, %r12, 1<1>	/* set up field for branch table */
-	set	%r12, %r12, 1<0>	/* set sticky bit */
-nostickyn:
-	bb1	rndhi, %r1, negative	/* rounding mode is negative */
-nearest:
-	cmp	%r12, %r12, 3		/* are both guard and sticky set */
-	bb1	eq,  %r12, overflw	/* both guard and sticky are set, */
-					/* so signal overflow */
-	or	%r6,  %r0,  %r0		/* clear destination register r6 */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<sign>	/* set the sign bit and take care of */
-					/* this special case */
-negative:
-	bcnd	ne0,  %r12, overflw	/* -2**31 will be rounded to */
-					/* -(2**31+1), so signal overflow */
-	or	%r6,  %r0,  %r0		/* clear destination register r6 */
-	br.n	FPintov_return
-	 set	%r6, %r6, 1<sign>	/* set the sign bit and take care of */
-					/* this special case */
-
-	/*
-	 * Since the exp. was 30, and there was no round-up, the largest
-	 * number that S2 could have been was 2**31 - 1
-	 */
-
-	/* Convert the single precision positive floating point number. */
-
-conversionsp:
-	extu	%r6,  %r8,  3<29>	/* extract lower bits of integer */
-	mak	%r6,  %r6,  3<7>	/* shift left to correct place in int */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<30>	/* set hidden one */
-
-	/* Convert the single precision negative floating point number. */
-
-conversionsn:
-	bb1	eq,   %r11, exp31s	/* use old r11 to see if exp. is 31 */
-	extu	%r6,  %r8,  3<29>	/* extract lower bits of mantissa */
-	mak	%r6,  %r6,  3<7>	/* shift left to correct place in int */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	set	%r6,  %r6,  1<30>	/* set hidden one */
-	or.c	%r6,  %r0,  %r6		/* negate result */
-	br.n	FPintov_return
-	 addu	%r6,  %r6,  1		/* add 1 to get 2''s complement */
-exp31s:
-	or	%r6,  %r0,  %r0		/* clear r6 */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<sign>	/* set sign bit */
-
-	/* Convert the double precision positive floating point number. */
-
-conversiondp:
-	extu	%r6,  %r8,  10<22>	/* extract lower bits of integer */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<30>	/* set hidden one */
-
-	/*
-	 * Convert the double precision negative floating point number.
-	 * The number, whose exponent is 30, must be rounded before converting.
-	 * Bits 4 and 3 are the rounding mode, and bits 2, 1, and 0 are the
-	 * guard, round, and sticky bits for the branch table.
-	 */
-
-conversiondn:
-	extu	%r12, %r8,  1<22>	/* get LSB for integer with exp. = 30 */
-	mak	%r12, %r12, 1<2>	/* start to set up field for branch */
-					/* table */
-	extu	%r11, %r8,  1<21>	/* get guard bit */
-	mak	%r11, %r11, 1<1>	/* set up field for branch table */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	extu	%r11, %r8,  21<0>	/* get bits for sticky bit */
-	bcnd	eq0,  %r11, nostkyn	/* do not set sticky */
-	set	%r12, %r12, 1<0>	/* set sticky bit */
-nostkyn:
-	rot	%r11, %r1,  0<rndlo>	/* shift rounding mode to 2 LSB''s */
-	mak	%r11, %r11, 2<3>	/* set up field, clear other bits */
-	or	%r12, %r11, %r12	/* set up field for branch table */
-	lda	%r12, %r0[%r12]		/* scale r12 */
-	or.u	%r12, %r12, %hi16(ntable)/* load pointer into table */
-	addu	%r12, %r12, %lo16(ntable)
-	jmp	%r12
-
-ntable:
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	naddone
-	br	nnoaddone
-	br	nnoaddone
-	br	naddone
-	br	naddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	naddone
-	br	naddone
-	br	naddone
-	br	nnoaddone
-	br	naddone
-	br	naddone
-	br	naddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-	br	nnoaddone
-
-/*
- * Add one to the mantissa, and check to see if it overflows to -2**31.
- * The conversion is done in nnoaddone.
- */
-
-naddone:
-	or	%r10, %r0,  %r0		/* clear r10 */
-	set	%r10, %r10, 1<22>	/* set LSB bit to 1 for adding */
-	add.co	%r8,  %r8,  %r10	/* add the 1 obtained from rounding */
-	clr	%r7,  %r7,  12<20>	/* clear exponent and sign */
-	add.ci	%r7,  %r0,  %r7		/* add carry */
-	bb1	20,   %r7,  maxneg	/* rounded to -2**31, handle separately */
-					/* the exponent was originally 30 */
-nnoaddone:
-	extu	%r6,  %r8,  11<22>	/* extract lower bits of integer */
-	mak	%r10, %r7,  20<10>	/* shift left upper bits of integer */
-	or	%r6,  %r6,  %r10	/* form most of integer */
-	set	%r6,  %r6,  1<30>	/* set hidden one */
-	or.c	%r6,  %r0,  %r6		/* negate integer */
-	br.n	FPintov_return
-	 addu	%r6,  %r6,  1		/* add 1 to get 2''s complement */
-
-maxneg:
-	or	%r6,  %r0,  %r0		/* clear integer */
-	br.n	FPintov_return
-	 set	%r6,  %r6,  1<sign>	/* set sign bit */
-
-	/* For valid overflows, write the correctly signed largest integer. */
-overflw:
-	set	%r2,  %r2,  1<oper>
-	bb0.n	sign, %r7,  FPintov_return /* if positive then return */
-	 set	%r6,  %r6,  31<0>	/* set result to largest positive int */
-	or.c	%r6,  %r0,  %r6		/* negate r6, giving largest negative */
-					/* integer */
-
-FPintov_return:
-	ld	%r1,  %r31, 0		/* load return address from memory */
-	jmp	%r1
-
-/*
- * Some instructions only have the S2 operations, so clear S1HI and S1LO
- * for those instructions so that the previous contents of S1HI and S1LO
- * do not influence this instruction.
- */
-
-ASLOCAL(FPresoper)
-	st	%r1,  %r31, 0
-	extu	%r10, %r9,  5<11>	/* extract opcode */
-#if 0
-	cmp	%r11, %r10, FSQRTop	/* compare to FSQRT */
-	bb1	eq,   %r11, S1clear	/* clear S1 if instruction only had S2 operand */
-#endif
-	cmp	%r11, %r10, INTop	/* compare to INT */
-	bb1	eq,   %r11, S1clear	/* clear S1 if instruction only had S2 operand */
-	cmp	%r11, %r10, NINTop	/* compare to NINT */
-	bb1	eq,   %r11, S1clear	/* clear S1 if instruction only had S2 operand */
-	cmp	%r11, %r10, TRNCop	/* compare to TRNC */
-	bb0	eq,   %r11, opercheck	/* check for reserved operands */
-
-ASLOCAL(S1clear)
-	or	%r5,  %r0,  %r0	/* clear any NaN''s, denorms, or infinities */
-	or	%r6,  %r0,  %r0	/* that may be left in S1HI, S1LO from a */
-				/* previous instruction */
-
-/*
- * r12 contains the following flags:
- *   bit 9 -- s1sign
- *   bit 8 -- s2sign
- *   bit 7 -- s1nan
- *   bit 6 -- s2nan
- *   bit 5 -- s1inf
- *   bit 4 -- s2inf
- *   bit 3 -- s1zero
- *   bit 2 -- s2zero
- *   bit 1 -- s1denorm
- *   bit 0 -- s2denorm
- */
-
-/*
- * Using code for both single and double precision, check if S1 is either
- * a NaN or infinity and set the appropriate flags in %r12. Then check if
- * S2 is a NaN or infinity. If it is a NaN, then branch to the NaN routine.
- */
-
-ASLOCAL(opercheck)
-	extu	%r10, %r5,  11<20>	/* internal representation for double */
-	bb1.n	s1size, %r9, S1NaNdoub	/* S1 is double precision */
-	 or	%r12, %r0,  %r0		/* clear operand flag register */
-ASLOCAL(S1NaNsing)
-	xor	%r10, %r10, 0x0080	/* internal representation for single */
-	ext	%r10, %r10, 8<0>	/* precision is IEEE 8 bits sign extended */
-					/* to 11 bits; for real exp. > 0, the */
-					/* above instructions gives a result */
-					/* exp. that has the MSB flipped and */
-					/* sign extended like in the IMPCR */
-	cmp	%r11, %r10, 127		/* Is exponent equal to IEEE 255 */
-					/* (here 127) */
-	bb1	ne,   %r11, S2NaN	/* source 1 is not a NaN or infinity */
-	mak	%r10, %r5,  20<0>	/* load r10 with upper bits of S1 */
-					/* mantissa */
-	extu	%r11, %r6,  3<29>	/* get 3 upper bits of lower word */
-	or	%r11, %r10, %r11	/* combine any existing 1 */
-	bcnd	eq0,  %r11, noS1NaNs	/* since r11 can only hold 0 or a */
-					/* > 0 number, branch to noS1NaN */
-					/* when eq0 */
-	br.n	S2NaN			/* see if S2 has a NaN */
-	 set	%r12, %r12, 1<s1nan>	/* indicate that S1 has a NaN */
-ASLOCAL(noS1NaNs)
-	br.n	S2NaN			/* check contents of S2 */
-	 set	%r12, %r0, 1<s1inf>	/* indicate that S1 has an infinity */
-
-ASLOCAL(S1NaNdoub)
-	xor	%r10, %r10, 0x0400	/* precision is the same IEEE 11 bits */
-					/* The above instructions gives a */
-					/* result exp. that has the MSB */
-					/* flipped and sign extended like in */
-					/* the IMPCR */
-	cmp	%r11, %r10, 1023	/* Is exp. equal to IEEE 2047 */
-					/* (internal 1023) */
-	bb1	ne,   %r11, S2NaN	/* source 1 is not a NaN or infinity */
-	mak	%r10, %r5,  20<0>	/* load r10 with upper bits of S1 */
-					/* mantissa */
-	or	%r11, %r6,  %r10	/* combine existing 1''s of mantissa */
-	bcnd	eq0,  %r11, noS1NaNd	/* since r11 can only hold 0 or a */
-					/* > 0 number, branch to noS1NaN */
-					/* when eq0 */
-	br.n	S2NaN			/* see if S2 has a NaN */
-	 set	%r12, %r12, 1<s1nan>	/* indicate that S1 has a NaN */
-ASLOCAL(noS1NaNd)
-	set	%r12, %r0,  1<s1inf>	/* indicate that S1 has an infinity */
-
-ASLOCAL(S2NaN)
-	bb1.n	s2size, %r9, S2NaNdoub	/* S1 is double precision */
-	 extu	%r10, %r7,  11<20>	/* internal representation for double */
-ASLOCAL(S2NaNsing)
-	xor	%r10, %r10, 0x0080	/* internal representation for single */
-	ext	%r10, %r10, 8<0>	/* precision is IEEE 8 bits sign */
-					/* extended to 11 bits; for real exp. */
-					/* > 0, the above instruction gives a */
-					/* result exp. that has the MSB */
-					/* flipped and sign extended like in */
-					/* the IMPCR */
-	cmp	%r11, %r10, 127		/* Is exponent equal to IEEE 255 */
-					/* (here 127) */
-	bb1	ne,   %r11, inf		/* source 2 is not a NaN or infinity */
-	mak	%r10, %r7,  20<0>	/* load r10 with upper bits of S1 */
-					/* mantissa */
-	extu	%r11, %r8,  3<29>	/* get 3 upper bits of lower word */
-	or	%r11, %r10, %r11	/* combine any existing 1''s */
-	bcnd	eq0,  %r11, noS2NaNs	/* since r11 can only hold 0 or a > 0 */
-					/* number, branch to noS2NaNs */
-					/* when eq0 */
-	br.n	_ASM_LABEL(NaN)		/* branch to NaN routine */
-	 set	%r12, %r12, 1<s2nan>	/* indicate that s2 has a NaN */
-ASLOCAL(noS2NaNs)
-	bb0	s1nan, %r12, 1f		/* branch to NaN if S1 is a NaN */
-	br	_ASM_LABEL(NaN)
-1:
-	br.n	_ASM_LABEL(infinity)	/* If S1 had a NaN we would have */
-					/* already branched, and S2 does not */
-					/* have a NaN, but it does have an */
-					/* infinity, so branch to handle the */
-					/* finity */
-	 set	%r12, %r12, 1<s2inf>	/* indicate that S2 has an infinity */
-
-ASLOCAL(S2NaNdoub)
-	xor	%r10, %r10, 0x0400	/* precision is the same IEEE 11 bits */
-					/* The above instruction gives a */
-					/* result exp. that has the MSB */
-					/* flipped and sign extended like in */
-					/* the IMPCR */
-	cmp	%r11, %r10, 1023	/* Is exp. equal to IEEE 2047 */
-					/* (internal 1023) */
-	bb1	ne,   %r11, inf		/* source 2 is not a NaN or infinity */
-	mak	%r10, %r7, 20<0>	/* load r10 with upper bits of S2 */
-					/* mantissa */
-	or	%r11, %r8,  %r10	/* combine existing 1''s of mantissa */
-	bcnd	eq0,  %r11, noS2NaNd	/* since r11 can only hold 0 or a > 0 */
-					/* number, branch to noS2NaNd */
-					/* when eq0 */
-	br.n	_ASM_LABEL(NaN)		/* branch to NaN routine */
-	 set	%r12, %r12, 1<s2nan>	/* indicate that s2 has a NaN */
-ASLOCAL(noS2NaNd)
-	bb0	s1nan, %r12, 1f		/* branch to NaN if S1 is a NaN */
-	br	_ASM_LABEL(NaN)
-1:
-	br.n	_ASM_LABEL(infinity)	/* If S1 had a NaN we would have */
-					/* already branched, and S2 does not */
-					/* have a NaN, but it does have an */
-					/* infinity, so branch to handle the */
-					/* finity */
-	 set	%r12, %r12, 1<s2inf>	/* indicate that S2 has an infinity */
-
-/*
- * If S2 was a NaN, the routine would have already branched to NaN. If S1
- * is a NaN, then branch to NaN. If S1 is not a NaN and S2 is infinity, then
- * we would have already branched to infinity. If S1 is infinity, then branch.
- * If the routine still has not branched, then branch to denorm, the only
- * reserved operand left.
- */
-
-ASLOCAL(inf)
-	bb0	s1nan, %r12, 1f		/* branch if S1 has a NaN and S2 does */
-					/* not */
-	br	_ASM_LABEL(NaN)
-1:
-	bb0	s1inf, %r12, 2f		/* Neither S1 or S2 has a NaN, and we */
-					/* would have branched already if S2 */
-					/* had an infinity, so branch if S1 */
-					/* is infinity */
-	br	_ASM_LABEL(infinity)
-2:
-	br	_ASM_LABEL(denorm)	/* branch to denorm, the only */
-					/* remaining alternative */
-
-/*
- * If either S1 or S2 is a signalling NaN, then set the invalid operation
- * bit of the FPSR.
- * If S1 is the only NaN or one of two NaN''s, then write
- * a quiet S1 to the result. A signalling NaN must be made quiet before
- * it can be written, but a signalling S2 is not modified in this routine
- * if S1 is a NaN.
- */
-ASLOCAL(NaN)
-	bb0.n	s1nan, %r12, S2sigcheck		/* S1 is not a NaN */
-	 st	%r1,  %r31,  0			/* save return address */
-	bb1	sigbit, %r5, S2sigcheck		/* S1 is not a signaling NaN */
-	set	%r2,  %r2,  1<oper>
-	br.n	S1write				/* FPSR bit already set, S1 is */
-						/* made quiet, and since we */
-						/* always write S1 if it is */
-						/* a NaN, write S1 and skip */
-						/* rest of routine */
-	 set	%r5,  %r5,  1<sigbit>		/* make S1 a quiet NaN */
-
-ASLOCAL(S2sigcheck)
-	bb0	s2nan, %r12, S1write		/* S2 is not a NaN */
-	bb1	sigbit, %r7, S1write		/* S2 is not a signaling NaN */
-	set	%r2,  %r2,  1<oper>
-	set	%r7,  %r7,  1<sigbit>		/* make S2 a quiet NaN */
-
-/*
- * Write a single or double precision quiet NaN unless the opeation is FCMP.
- * If the operation is FCMP, then set the not comparable bit in the result.
- */
-ASLOCAL(S1write)
-	bb0	s1nan, %r12, S2write		/* do not write S1 */
-						/* if it is not a NaN */
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, FCMPop		/* compare to FCMP */
-	bb1	ne,   %r11, S1noFCMP		/* operation is not FCMP */
-	set	%r6,  %r0,  1<nc>		/* set the not comparable bit */
-	br.n	FPnan_return
-	 set	%r6,  %r6,  1<ne>		/* set the not equal bit */
-ASLOCAL(S1noFCMP)
-	bb1.n	dsize, %r9, wrdoubS1		/* double destination */
-	 set	%r5,  %r5,  11<20>		/* set all exponent bits to 1 */
-/*
- * The single result will be formed the same way whether S1 is a single or
- * double.
- */
-ASLOCAL(wrsingS1)
-	mak	%r10, %r5,  28<3>		/* wipe out extra exponent */
-						/* bits */
-	extu	%r11, %r6,  3<29>		/* get lower three bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* combine all of result */
-						/* except sign */
-	clr	%r6,  %r5,  31<0>		/* clear all but sign */
-	br.n	FPnan_return
-	 or	%r6,  %r6,  %r10		/* form result */
-
-ASLOCAL(wrdoubS1)
-	set	%r6,  %r6,  29<0>		/* set extra bits of lower */
-						/* word */
-	br	FPnan_return			/* no modification necessary */
-						/* for writing double to */
-						/* double, so return */
-
-ASLOCAL(S2write)
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, FCMPop		/* compare to FCMP */
-	bb1.n	ne,   %r11, S2noFCMP		/* operation is not FCMP */
-	 set	%r7,  %r7,  11<20>		/* set all exponent bits to 1 */
-	set	%r6,  %r0,  1<nc>		/* set the not comparable bit */
-	br.n	FPnan_return
-	 set	%r6,  %r6,  1<ne>		/* set the not equal bit */
-ASLOCAL(S2noFCMP)
-	bb1.n	dsize, %r9, wrdoubS2		/* double destination */
-	 set	%r5,  %r5,  11<20>		/* set all exponent bits to 1 */
-/*
- * The single result will be formed the same way whether S1 is a single or
- * double.
- */
-ASLOCAL(wrsingS2)
-	mak	%r10, %r7,  28<3>		/* wipe out extra exponent */
-						/* bits */
-	extu	%r11, %r8,  3<29>		/* get lower three bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* combine all of result */
-						/* except sign */
-	clr	%r6,  %r7,  31<0>		/* clear all but sign */
-	br.n	FPnan_return
-	 or	%r6,  %r6,  %r10		/* form result */
-
-ASLOCAL(wrdoubS2)
-	set	%r6,  %r8,  29<0>		/* set extra bits of lower */
-						/* word */
-
-/* Return from this subroutine with the result. */
-
-ASLOCAL(FPnan_return)
-						/* no modification necessary */
-						/* for writing double to */
-						/* double, so return */
-	ld	%r1,  %r31,  0			/* retrieve return address */
-	jmp	%r1
-
-/*
- * infinity
- */
-
-/*
- * Extract the opcode, compare to a constant, and branch to the code
- * for the instruction.
- */
-
-ASLOCAL(infinity)
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, FADDop		/* compare to FADD */
-	bb1.n	eq,   %r11, FADD		/* operation is FADD */
-	 st	%r1,  %r31, 0			/* save return address */
-	cmp	%r11, %r10, FSUBop		/* compare to FSUB */
-	bb1	eq,   %r11, FSUB		/* operation is FSUB */
-	cmp	%r11, %r10, FCMPop		/* compare to FCMP */
-	bb1	eq,   %r11, FCMP		/* operation is FCMP */
-	cmp	%r11, %r10, FMULop		/* compare to FMUL */
-	bb1	eq,   %r11, FMUL		/* operation is FMUL */
-	cmp	%r11, %r10, FDIVop		/* compare to FDIV */
-	bb1	eq,   %r11, FDIV		/* operation is FDIV */
-#if 0
-	cmp	%r11, %r10, FSQRTop		/* compare to FSQRT */
-	bb1	eq,   %r11, FSQRT		/* operation is FSQRT */
-#endif
-	cmp	%r11, %r10, INTop		/* compare to INT */
-	bb1	eq,   %r11, FP_inf_overflw	/* operation is INT */
-	cmp	%r11, %r10, NINTop		/* compare to NINT */
-	bb1	eq,   %r11, FP_inf_overflw	/* operation is NINT */
-	cmp	%r11, %r10, TRNCop		/* compare to TRNC */
-	bb1	eq,   %r11, FP_inf_overflw	/* operation is TRNC */
-
-/*
- * Adding infinities of opposite signs will cause an exception,
- * but all other operands will result in a correctly signed infinity.
- */
-
-FADD:
-	bb0	s1inf, %r12, addS2write		/* branch if S1 not infinity */
-	bb0	s2inf, %r12, addS1write		/* S2 is not inf., so branch */
-						/* to write S1 */
-	bb1	sign, %r5, addS1neg		/* handle case of S1 negative */
-addS1pos:
-	bb1	sign, %r7, excpt		/* adding infinities of */
-						/* different signs causes an */
-						/* exception */
-	br	poswrinf			/* branch to write positive */
-						/* infinity */
-addS1neg:
-	bb0	sign, %r7, excpt		/* adding infinities of */
-						/* different signs causes an */
-						/* exception */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-addS1write:
-	bb0	sign, %r5, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-addS2write:
-	bb0	sign, %r7, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-
-/*
- * Subtracting infinities of the same sign will cause an exception,
- * but all other operands will result in a correctly signed infinity.
- */
-
-FSUB:
-	bb0	s1inf, %r12, subS2write		/* branch if S1 not infinity */
-	bb0	s2inf, %r12, subS1write		/* S2 is not inf., so branch */
-						/* to write S1 */
-	bb1	sign, %r5, subS1neg		/* handle case of S1 negative */
-subS1pos:
-	bb0	sign, %r7, excpt		/* subtracting infinities of */
-						/* the same sign causes an */
-						/* exception */
-	br	poswrinf			/* branch to write positive */
-						/* infinity */
-subS1neg:
-	bb1	sign, %r7, excpt		/* subtracting infinities of */
-						/* the same sign causes an */
-						/* exception */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-subS1write:
-	bb0	sign, %r5, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-subS2write:
-	bb1	sign, %r7, poswrinf		/* branch to write positive */
-						/* infinity */
-	br	negwrinf			/* branch to write negative */
-						/* infinity */
-
-/*
- * Compare the operands, at least one of which is infinity, and set the
- * correct bits in the destination register.
- */
-
-FCMP:
-	bb0.n	s1inf, %r12, FCMPS1f		/* branch for finite S1 */
-	 set	%r4,  %r0,  1<cp>		/* since neither S1 or S2 is */
-						/* a NaN, set cp */
-FCMPS1i:
-	bb1	sign, %r5, FCMPS1ni		/* branch to negative S1i */
-FCMPS1pi:
-	bb0	s2inf, %r12, FCMPS1piS2f	/* branch to finite S2 */
-						/* with S1pi */
-FCMPS1piS2i:
-	bb1	sign, %r7, FCMPS1piS2ni		/* branch to negative S2i */
-						/* with S1pi */
-FCMPS1piS2pi:
-	set	%r4,  %r4, 1<eq>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	set	%r4,  %r4, 1<ge>		/* set ge bit */
-	set	%r4,  %r4, 1<ib>		/* set ib bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1piS2ni:
-	set	%r4,  %r4, 1<ne>		/* set ne bit */
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-FCMPS1piS2f:
-	set	%r4,  %r4, 1<ne>		/* set ne bit */
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	bsr.n	_ASM_LABEL(zero)		/* see if any of the operands */
-						/* are zero */
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-	bb0	s2zero, %r12, FCMPS1piS2nz	/* check for negative if s2 */
-						/* not zero */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1piS2nz:
-	bb1	sign, %r7, move			/* return if s2 is negative */
-FCMPS1piS2pf:
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1ni:
-	bb0	s2inf, %r12, FCMPS1niS2f	/* branch to finite S2 */
-						/* with S1ni */
-FCMPS1niS2i:
-	bb1	sign, %r7, FCMPS1niS2ni		/* branch to negative S2i */
-						/* with S1ni */
-FCMPS1niS2pi:
-	set	%r4,  %r4, 1<ne>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	set	%r4,  %r4, 1<lt>		/* set lt bit */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1niS2ni:
-	set	%r4,  %r4, 1<eq>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-FCMPS1niS2f:
-	set	%r4,  %r4, 1<ne>		/* set eq bit */
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	bsr.n	_ASM_LABEL(zero)		/* see if any of the operands */
-						/* are zero */
-	 set	%r4,  %r4, 1<lt>		/* set lt bit */
-	bb0	s2zero, %r12, FCMPS1niS2nz	/* branch if s2 is not zero */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1niS2nz:
-	bb1	sign, %r7, move			/* return if s2 is negative */
-	set	%r4,  %r4, 1<ou>		/* set ou bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1f:
-	bb1	sign, %r5, FCMPS1nf		/* branch to negative S1f */
-FCMPS1pf:
-	bb1.n	sign, %r7, FCMPS1pfS2ni		/* branch to negative S2i */
-						/* with S1pf */
-	 set	%r4,  %r4, 1<ne>		/* set ne bit */
-FCMPS1pfS2pi:
-	set	%r4,  %r4, 1<le>		/* set le bit */
-	set	%r4,  %r4, 1<lt>		/* set lt bit */
-	bsr.n	_ASM_LABEL(zero)
-	 set	%r4,  %r4, 1<ib>		/* set ib bit */
-	bb0	s1zero, %r12, FCMPS1pfS2pinozero
-FCMPS1pfS2pizero:
-	br.n	move
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-FCMPS1pfS2pinozero:
-	br.n	move
-	 set	%r4,  %r4, 1<in>		/* set in bit */
-FCMPS1pfS2ni:
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	br.n	move
-	 set	%r4,  %r4, 1<ge>		/* set ge bit */
-FCMPS1nf:
-	bb1.n	sign, %r7, FCMPS1nfS2ni		/* branch to negative S2i */
-						/* with S1nf */
-	 set	%r4,  %r4, 1<ne>		/* set ne bit */
-	set	%r4,  %r4, 1<le>		/* set gt bit */
-	set	%r4,  %r4, 1<lt>		/* set ge bit */
-	bsr.n	_ASM_LABEL(zero)		/* see which of the operands */
-						/* are zero */
-	 set	%r4,  %r4, 1<ob>		/* set ob bit */
-	bb0	s1zero, %r12, FCMPS1nfS2pinozero /* no ls and lo */
-FCMPS1nfS2pizero:
-	br.n	move
-	 set	%r4,  %r4, 1<ib>		/* set ib bit */
-FCMPS1nfS2pinozero:
-	br.n	move
-	 set	%r4,  %r4, 1<ou>		/* set ou bit */
-FCMPS1nfS2ni:
-	set	%r4,  %r4, 1<gt>		/* set gt bit */
-	set	%r4,  %r4, 1<ge>		/* set ge bit */
-
-move:
-	br.n	inf_return
-	 or	%r6,  %r0, %r4			/* transfer answer to r6 */
-/*
- * Multiplying infinity and zero causes an exception, but all other
- * operations produce a correctly signed infinity.
- */
-
-FMUL:
-	bsr	_ASM_LABEL(zero)		/* see if any of the operands */
-						/* are zero */
-	bb1	s1zero, %r12, excpt		/* infinity X 0 causes an */
-						/* exception */
-	bb1	s2zero, %r12, excpt		/* infinity X 0 causes an */
-						/* exception */
-	bb1	sign, %r5, FMULS1neg		/* handle negative cases */
-						/* of S1 */
-	bb0	sign, %r7, poswrinf		/* + X + = + */
-	br	negwrinf			/* + X - = - */
-FMULS1neg:
-	bb1	sign, %r7, poswrinf		/* - X - = + */
-	br	negwrinf			/* - X + = - */
-
-/*
- * Dividing infinity by infinity causes an exception, but dividing
- * infinity by a finite yields a correctly signed infinity, and
- * dividing a finite by an infinity produces a correctly signed zero.
- */
-
-FDIV:
-	bb1	s1inf, %r12, FDIVS1inf		/* handle case of S1 being */
-						/* infinity */
-	bb1	sign, %r5, FDIVS1nf		/* handle cases of S1 being */
-						/* neg. non-inf. */
-	bb1	sign, %r7, FDIVS1pfS2mi		/* handle case of negative S2 */
-FDIVS1pfS2pi:
-	br	poswrzero			/* +f / +inf = +0 */
-FDIVS1pfS2mi:
-	br	negwrzero			/* +f / -inf = -0 */
-FDIVS1nf:
-	bb1	sign, %r7, FDIVS1nfS2mi		/* handle case of negative S2 */
-FDIVS1nfS2pi:
-	br	negwrzero			/* -f / +inf = -0 */
-FDIVS1nfS2mi:
-	br	poswrzero			/* -f / -inf = +0 */
-FDIVS1inf:
-	bb1	s2inf, %r12, excpt		/* inf / inf = exception */
-	bb1	sign, %r5, FDIVS1mi		/* handle cases of S1 being */
-						/* neg. inf. */
-	bb1	sign, %r7, FDIVS1piS2nf		/* handle case of negative S2 */
-FDIVS1piS2pf:
-	br	poswrinf			/* +inf / +f = +inf */
-FDIVS1piS2nf:
-	br	negwrinf			/* +inf / -f = -inf */
-FDIVS1mi:
-	bb1	sign, %r7, FDIVS1miS2nf		/* handle case of negative S2 */
-FDIVS1miS2pf:
-	br	negwrinf			/* -inf / +f = -inf */
-FDIVS1miS2nf:
-	br	poswrinf			/* -inf / -f = +inf */
-
-/*
- * The square root of positive infinity is positive infinity,
- * but the square root of negative infinity is a NaN.
- */
-
-#if 0
-FSQRT:
-	bb0	sign, %r7, poswrinf		/* write sqrt(inf) = inf */
-	br	excpt				/* write sqrt(-inf) = NaN */
-#endif
-
-excpt:
-	set	%r2,  %r2, 1<oper>
-	set	%r5,  %r0, 0<0>			/* write NaN into r5 */
-	br.n	inf_return
-	 set	%r6,  %r0, 0<0>			/* write NaN into r6, writing */
-						/* NaN''s into both of these */
-						/* registers is quicker than */
-						/* checking for single or */
-						/* double precision */
-
-/* Write positive infinity of the correct precision */
-
-poswrinf:
-	bb1	dsize, %r9, poswrinfd		/* branch to write double */
-						/* precision inf. */
-	br.n	inf_return
-	 or.u	%r6,  %r0, 0x7f80		/* load r6 with single */
-						/* precision pos inf. */
-poswrinfd:
-	or.u	%r5,  %r0, 0x7ff0		/* load double precision */
-						/* pos inf. */
-	br.n	inf_return
-	 or	%r6,  %r0, %r0
-
-/* Write negative infinity of the correct precision */
-
-negwrinf:
-	bb1	dsize, %r9, negwrinfd		/* branch to write double */
-						/* precision inf. */
-	br.n	inf_return
-	 or.u	%r6,  %r0, 0xff80		/* load r6 with single */
-						/* precision neg inf. */
-negwrinfd:
-	or.u	%r5,  %r0, 0xfff0		/* load double precision */
-						/* neg inf. */
-	br.n	inf_return
-	 or	%r6,  %r0, %r0
-
-/* Write a positive zero disregarding precision. */
-
-poswrzero:
-	or	%r5,  %r0, %r0			/* write to both high word */
-						/* and low word now */
-	br.n	inf_return			/* it does not matter that */
-						/* both are written */
-	 or	%r6,  %r0, %r0
-
-/* Write a negative zero of the correct precision. */
-
-negwrzero:
-	or	%r6,  %r0, %r0			/* clear low word */
-	bb1	dsize, %r9, negwrzerod		/* branch to write double */
-						/* precision zero */
-	br.n	inf_return
-	 set	%r6,  %r6, 1<31>		/* set sign bit */
-negwrzerod:
-	or	%r5,  %r0, %r0			/* clear high word */
-	br.n	inf_return
-	 set	%r5,  %r5, 1<31>		/* set sign bit */
-
-FP_inf_overflw:
-	set	%r2,  %r2, 1<oper>
-	set	%r2,  %r2, 1<overflow>
-	set	%r2,  %r2, 1<inexact>
-
-	bb0.n	sign, %r7, inf_return		/* if positive then return */
-
-	 set	%r6,  %r6, 31<0>		/* set result to largest */
-						/* positive integer */
-	or.c	%r6,  %r0, %r6			/* negate r6, giving largest */
-						/* negative int. */
-
-inf_return:
-	ld	%r1,  %r31, 0			/* load return address */
-	jmp	%r1
-
-/*
- * denorm
- */
-
-/*
- * Check to see if either S1 or S2 is a denormalized number. First
- * extract the exponent to see if it is zero, and then check to see if
- * the mantissa is not zero. If the number is denormalized, then set the
- * 1 or 0 bit 10 %r12.
- */
-
-ASLOCAL(denorm)
-	st	%r1,  %r31, 0			/* save return address */
-dnmcheckS1:
-	extu	%r10, %r5,  11<20>		/* extract exponent */
-	bcnd	ne0,  %r10, dnmsetS2		/* S1 is not a denorm, so S2 */
-						/* must be */
-	bb1.n	9,    %r9,  dnmcheckS1d		/* S1 is double precision */
-	 mak	%r10, %r5,  20<3>		/* mak field with only */
-						/* mantissa bits */
-dnmcheckS1s:
-	extu	%r11, %r6,  3<29>		/* get three low bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* assemble all of the */
-						/* mantissa bits */
-	bcnd	eq0,  %r10, dnmsetS2		/* S1 is not a denorm, so S2 */
-						/* must be */
-	br	dnmsetS1			/* S1 is a denorm */
-
-dnmcheckS1d:
-	or	%r10, %r6,  %r10		/* or all of mantissa bits */
-	bcnd	eq0,  %r10, dnmsetS2		/* S1 is not a denorm, so S2 */
-						/* must be */
-dnmsetS1:
-	set	%r12, %r12, 1<1>		/* S1 is a denorm */
-
-dnmcheckS2:
-	extu	%r10, %r7,  11<20>		/* extract exponent */
-	bcnd	ne0,  %r10, S1form		/* S2 is not a denorm */
-	bb1.n	7,    %r9,  dnmcheckS2d		/* S2 is double precision */
-	 mak	%r10, %r7,  20<3>		/* mak field with only */
-						/* mantissa bits */
-dnmcheckS2s:
-	extu	%r11, %r8,  3<29>		/* get three low bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* assemble all of the */
-						/* mantissa bits */
-	bcnd	eq0,  %r10, S1form		/* S2 is not a denorm */
-	br	dnmsetS2			/* S1 is a denorm */
-dnmcheckS2d:
-	or	%r10, %r8,  %r10		/* or all or mantissa bits */
-	bcnd	eq0,  %r10, S1form		/* S2 is not a denorm */
-dnmsetS2:
-	set	%r12, %r12, 1<0>		/* S2 is a denorm */
-
-/*
- * Since the operations are going to be reperformed with modified denorms,
- * the operands which were initially single precision need to be modified
- * back to single precision.
- */
-
-S1form:
-	bb1	9,    %r9,  S2form		/* S1 is double precision, so */
-						/* do not modify S1 into */
-						/* single format */
-	mak	%r11, %r5,  28<3>		/* over final exponent and */
-						/* mantissa, eliminating */
-						/* extra 3 bits of exponent */
-	extu	%r6,  %r6,  3<29>		/* get low 3 bits of mantissa */
-	or	%r11, %r6,  %r11		/* form complete mantissa and */
-						/* exponent */
-	extu	%r10, %r5,  1<31>		/* get the 31 bit */
-	mak	%r10, %r10, 1<31>		/* place 31 bit into correct */
-						/* position */
-	or	%r6,  %r10, %r11		/* or 31, exponent, and all */
-						/* of mantissa */
-
-S2form:
-	bb1	7,    %r9,  checkop		/* S2 is double precision, so */
-						/* do not modify S2 into */
-						/* single format */
-	mak	%r11, %r7,  28<3>		/* over final exponent and */
-						/* mantissa, eliminating */
-						/* extra 3 bits of exponent */
-	extu	%r8,  %r8,  3<29>		/* get low 3 bits of mantissa */
-	or	%r11, %r8,  %r11		/* form complete mantissa and */
-						/* exponent */
-	extu	%r10, %r7,  1<31>		/* get the 31 bit */
-	mak	%r10, %r10, 1<31>		/* place 31 bit into correct */
-						/* position */
-	or	%r8,  %r10, %r11		/* or 31, exponent, and all */
-						/* of mantissa */
-
-/*
- * Extract the opcode, compare to a constant, and branch to the code that
- * deals with that opcode.
- */
-
-checkop:
-	extu	%r10, %r9,  5<11>		/* extract opcode */
-	cmp	%r11, %r10, 0x05		/* compare to FADD */
-	bb1	2,    %r11, denorm_FADD		/* operation is FADD */
-	cmp	%r11, %r10, 0x06		/* compare to FSUB */
-	bb1	2,    %r11, denorm_FSUB		/* operation is FSUB */
-	cmp	%r11, %r10, 0x07		/* compare to FCMP */
-	bb1	2,    %r11, denorm_FCMP		/* operation is FCMP */
-	cmp	%r11, %r10, 0x00		/* compare to FMUL */
-	bb1	2,    %r11, denorm_FMUL		/* operation is FMUL */
-	cmp	%r11, %r10, 0x0e		/* compare to FDIV */
-	bb1	2,    %r11, denorm_FDIV		/* operation is FDIV */
-#if 0
-	cmp	%r11, %r10, 0x0f		/* compare to FSQRT */
-	bb1	2,    %r11, denorm_FSQRT	/* operation is FSQRT */
-#endif
-	cmp	%r11, %r10, 0x09		/* compare to INT */
-	bb1	2,    %r11, denorm_INT		/* operation is INT */
-	cmp	%r11, %r10, 0x0a		/* compare to NINT */
-	bb1	2,    %r11, denorm_NINT		/* operation is NINT */
-	cmp	%r11, %r10, 0x0b		/* compare to TRNC */
-	bb1	2,    %r11, denorm_TRNC		/* operation is TRNC */
-
-/*
- * For all the following operations, the denormalized number is set to
- * zero and the operation is reperformed the correct destination and source
- * sizes.
- */
-
-denorm_FADD:
-	bb0	1,   %r12, FADDS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FADDS2chk:
-	bb0	0,   %r12, FADDcalc		/* S2 is not a denorm */
-FADDS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FADDcalc:
-	bb1	5,   %r9,  FADDdD		/* branch for double */
-						/* precision destination */
-FADDsD:
-	bb1	9,   %r9,  FADDsDdS1		/* branch for double */
-						/* precision S1 */
-FADDsDsS1:
-	bb1	7,   %r9,  FADDsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FADDsDsS1sS2:
-	br.n	denorm_return
-	 fadd.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDsDsS1dS2:
-	br.n	denorm_return
-	 fadd.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FADDsDdS1:
-	bb1	7,   %r9,  FADDsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FADDsDdS1sS2:
-	br.n	denorm_return
-	 fadd.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDsDdS1dS2:
-	br.n	denorm_return
-	 fadd.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-FADDdD:
-	bb1	9,   %r9,  FADDdDdS1		/* branch for double */
-						/* precision S1 */
-FADDdDsS1:
-	bb1	7,   %r9,  FADDdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FADDdDsS1sS2:
-	br.n	denorm_return
-	 fadd.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDdDsS1dS2:
-	br.n	denorm_return
-	 fadd.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FADDdDdS1:
-	bb1	7,   %r9,  FADDdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FADDdDdS1sS2:
-	br.n	denorm_return
-	 fadd.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FADDdDdS1dS2:
-	br.n	denorm_return
-	 fadd.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FSUB:
-	bb0	1,   %r12, FSUBS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FSUBS2chk:
-	bb0	0,   %r12, FSUBcalc		/* S2 is not a denorm */
-FSUBS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FSUBcalc:
-	bb1	5,   %r9,  FSUBdD		/* branch for double */
-						/* precision destination */
-FSUBsD:
-	bb1	9,   %r9,  FSUBsDdS1		/* branch for double */
-						/* precision S1 */
-FSUBsDsS1:
-	bb1	7,   %r9,  FSUBsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBsDsS1sS2:
-	br.n	denorm_return
-	 fsub.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBsDsS1dS2:
-	br.n	denorm_return
-	 fsub.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSUBsDdS1:
-	bb1	7,   %r9,  FSUBsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBsDdS1sS2:
-	br.n	denorm_return
-	 fsub.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBsDdS1dS2:
-	br.n	denorm_return
-	 fsub.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSUBdD:
-	bb1	9,   %r9,  FSUBdDdS1		/* branch for double */
-						/* precision S1 */
-FSUBdDsS1:
-	bb1	7,   %r9,  FSUBdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBdDsS1sS2:
-	br.n	denorm_return
-	 fsub.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBdDsS1dS2:
-	br.n	denorm_return
-	 fsub.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSUBdDdS1:
-	bb1	7,   %r9,  FSUBdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FSUBdDdS1sS2:
-	br.n	denorm_return
-	 fsub.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSUBdDdS1dS2:
-	br.n	denorm_return
-	 fsub.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FCMP:
-	bb0	1,   %r12, FCMPS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FCMPS2chk:
-	bb0	0,   %r12, FCMPcalc		/* S2 is not a denorm */
-FCMPS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FCMPcalc:
-	bb1	9,   %r9,  FCMPdS1		/* branch for double */
-						/* precision S1 */
-FCMPsS1:
-	bb1	7,   %r9,  FCMPsS1dS2		/* branch for double */
-						/* precision S2 */
-FCMPsS1sS2:
-	br.n	denorm_return
-	 fcmp.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FCMPsS1dS2:
-	br.n	denorm_return
-	 fcmp.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FCMPdS1:
-	bb1	7,   %r9,  FCMPdS1dS2		/* branch for double */
-						/* precision S2 */
-FCMPdS1sS2:
-	br.n	denorm_return
-	 fcmp.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FCMPdS1dS2:
-	br.n	denorm_return
-	 fcmp.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FMUL:
-	bb0	1,   %r12, FMULS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FMULS2chk:
-	bb0	0,   %r12, FMULcalc		/* S2 is not a denorm */
-FMULS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FMULcalc:
-	bb1	5,   %r9,  FMULdD		/* branch for double */
-						/* precision destination */
-FMULsD:
-	bb1	9,   %r9,  FMULsDdS1		/* branch for double */
-						/* precision S1 */
-FMULsDsS1:
-	bb1	7,   %r9,  FMULsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FMULsDsS1sS2:
-	br.n	denorm_return
-	 fmul.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULsDsS1dS2:
-	br.n	denorm_return
-	 fmul.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FMULsDdS1:
-	bb1	7,   %r9,  FMULsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FMULsDdS1sS2:
-	br.n	denorm_return
-	 fmul.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULsDdS1dS2:
-	br.n	denorm_return
-	 fmul.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-FMULdD:
-	bb1	9,   %r9,  FMULdDdS1		/* branch for double */
-						/* precision S1 */
-FMULdDsS1:
-	bb1	7,   %r9,  FMULdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FMULdDsS1sS2:
-	br.n	denorm_return
-	 fmul.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULdDsS1dS2:
-	br.n	denorm_return
-	 fmul.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FMULdDdS1:
-	bb1	7,   %r9,  FMULdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FMULdDdS1sS2:
-	br.n	denorm_return
-	 fmul.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FMULdDdS1dS2:
-	br.n	denorm_return
-	 fmul.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_FDIV:
-	bb0	1,   %r12, FDIVS2dnm		/* S1 is not denorm, so S2 */
-						/* must be */
-	or	%r5, %r0,  %r0			/* set S1 to zero */
-	or	%r6, %r0,  %r0
-FDIVS2chk:
-	bb0	0,   %r12, FDIVcalc		/* S2 is not a denorm */
-FDIVS2dnm:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FDIVcalc:
-	bb1	5,   %r9,  FDIVdD		/* branch for double */
-						/* precision destination */
-FDIVsD:
-	bb1	9,   %r9,  FDIVsDdS1		/* branch for double */
-						/* precision S1 */
-FDIVsDsS1:
-	bb1	7,   %r9,  FDIVsDsS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVsDsS1sS2:
-	fdiv.sss %r6, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVsDsS1dS2:
-	fdiv.ssd %r6, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVsDdS1:
-	bb1	7,   %r9,  FDIVsDdS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVsDdS1sS2:
-	fdiv.sds %r6, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVsDdS1dS2:
-	fdiv.sdd %r6, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdD:
-	bb1	9,   %r9,  FDIVdDdS1		/* branch for double */
-						/* precision S1 */
-FDIVdDsS1:
-	bb1	7,   %r9,  FDIVdDsS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVdDsS1sS2:
-	fdiv.dss %r5, %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdDsS1dS2:
-	fdiv.dsd %r5, %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdDdS1:
-	bb1	7,   %r9,  FDIVdDdS1dS2		/* branch for double */
-						/* precision S2 */
-FDIVdDdS1sS2:
-	fdiv.dds %r5, %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-FDIVdDdS1dS2:
-	fdiv.ddd %r5, %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-	br	denorm_return
-
-#if 0
-denorm_FSQRT:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-FSQRTcalc:
-	bb1	5,   %r9,  FSQRTdD		/* branch for double */
-						/* precision destination */
-FSQRTsD:
-	bb1	7,   %r9,  FSQRTsDdS2		/* branch for double */
-						/* precision S2 */
-FSQRTsDsS2:
-	br.n	denorm_return
-	 fsqrt.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSQRTsDdS2:
-	br.n	denorm_return
-	 fsqrt.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-FSQRTdD:
-	bb1	7,   %r9,  FSQRTdDdS2		/* branch for double */
-						/* precision S2 */
-FSQRTdDsS2:
-	br.n	denorm_return
-	 fsqrt.ds %r5, %r8			/* add the two sources and */
-						/* place result into S1 */
-FSQRTdDdS2:
-	br.n	denorm_return
-	 fsqrt.dd %r5, %r7			/* add the two sources and */
-						/* place result into S1 */
-#endif
-
-denorm_INT:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-INTcalc:
-	bb1	7,   %r9,  INTdS2		/* branch for double */
-						/* precision S2 */
-INTsS2:
-	br.n	denorm_return
-	 int.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-INTdS2:
-	br.n	denorm_return
-	 int.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_NINT:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-NINTcalc:
-	bb1	7,   %r9,  NINTdS2		/* branch for double */
-						/* precision S2 */
-NINTsS2:
-	br.n	denorm_return
-	 nint.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-NINTdS2:
-	br.n	denorm_return
-	 nint.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-denorm_TRNC:
-	or	%r7, %r0,  %r0			/* set S2 to zero */
-	or	%r8, %r0,  %r0
-TRNCcalc:
-	bb1	7,   %r9,  TRNCdS2		/* branch for double */
-						/* precision S2 */
-TRNCsS2:
-	br.n	denorm_return
-	 trnc.ss %r6, %r8			/* add the two sources and */
-						/* place result into S1 */
-TRNCdS2:
-	trnc.sd %r6, %r7			/* add the two sources and */
-						/* place result into S1 */
-
-/* Return to the routine that detected the reserved operand. */
-
-denorm_return:
-	ld	%r1, %r31, 0			/* load return address */
-	jmp	%r1
-
-/*
- * S1 and/or S2 is an infinity, and the other operand may be a zero.
- * Knowing which operands are infinity, check the remaining operands for zeros.
- */
-
-ASLOCAL(zero)
-	bb0	s1inf, %r12, S1noinf		/* see if S1 is zero */
-	bb0	s2inf, %r12, S2noinf		/* see if S2 is zero */
-	jmp	%r1
-
-/*
- * See if S1 is zero. Whether or not S1 is a zero, being in this routine
- * implies that S2 is infinity, so return to subroutine infinity after
- * completing this code. Set the s1zero flag in %r12 if S1 is zero.
- */
-
-S1noinf:
-	bb1	s1size, %r9, S1noinfd		/* work with double precision */
-						/* operand */
-S1noinfs:
-	or	%r10, %r0,  %r5			/* load high word into r10 */
-	clr	%r10, %r10, 1<sign>		/* clear the sign bit */
-	extu	%r11, %r6,  3<29>		/* extract lower 3 bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* or these 3 bits with high */
-						/* word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	jmp.n	%r1				/* since this operand was not */
-						/* infinity, S2 must have */
-						/* been, so return */
-	 set	%r12, %r12, 1<s1zero>		/* set zeroflag */
-S1noinfd:
-	clr	%r10, %r5,  1<sign>		/* clear the sign bit */
-	or	%r10, %r6,  %r10		/* or high and low word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	jmp.n	%r1				/* since this operand was not */
-						/* infinity, S2 must have */
-						/* been, so return */
-	 set	%r12, %r12, 1<s1zero>		/* set zeroflag */
-
-/* Check S2 for zero. If it is zero, then set the s2zero flag in r12. */
-
-S2noinf:
-	bb1	s2size, %r9, S2noinfd		/* work with double precision */
-						/* operand */
-S2noinfs:
-	or	%r10, %r0,  %r7			/* load high word into r10 */
-	clr	%r10, %r10, 1<sign>		/* clear the sign bit */
-	extu	%r11, %r8,  3<29>		/* extract lower 3 bits of */
-						/* mantissa */
-	or	%r10, %r10, %r11		/* or these 3 bits with high */
-						/* word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	jmp.n	%r1				/* since this operand was not */
-						/* infinity, S1 must have */
-						/* been, so return */
-	 set	%r12, %r12, 1<s2zero>		/* set zeroflag */
-S2noinfd:
-	clr	%r10, %r7,  1<sign>		/* clear the sign bit */
-	or	%r10, %r8,  %r10		/* or high and low word */
-	bcnd	ne0,  %r10, operation		/* do not set zero flag */
-	set	%r12, %r12, 1<s2zero>		/* set zeroflag */
-						/* since this operand was not */
-						/* infinity, S1 must have */
-						/* been, so return */
-operation:
-	jmp	%r1
diff --git a/sys/arch/m88k/m88k/m88100_fp.c b/sys/arch/m88k/m88k/m88100_fp.c
new file mode 100644
index 00000000000..9a5d79590d2
--- /dev/null
+++ b/sys/arch/m88k/m88k/m88100_fp.c
@@ -0,0 +1,345 @@
+/*	$OpenBSD: m88100_fp.c,v 1.1 2014/06/09 16:26:32 miod Exp $	*/
+
+/*
+ * Copyright (c) 2007, 2014, Miodrag Vallat.
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice, this permission notice, and the disclaimer below
+ * appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#include <sys/types.h>
+#include <sys/param.h>
+#include <sys/proc.h>
+#include <sys/signalvar.h>
+#include <sys/systm.h>
+
+#include <machine/fpu.h>
+#include <machine/frame.h>
+#include <machine/ieeefp.h>
+#include <machine/trap.h>
+#include <machine/m88100.h>
+
+#include <lib/libkern/softfloat.h>
+
+#include <m88k/m88k/fpu.h>
+
+int	m88100_fpu_emulate(struct trapframe *);
+void	m88100_fpu_fetch(struct trapframe *, u_int, u_int, u_int, fparg *);
+
+/*
+ * All 88100 precise floating-point exceptions are handled there.
+ *
+ * We ignore the exception cause register completely, except for the
+ * `privilege violation' bit, and attempt to perform the computation in
+ * software if needed.
+ */
+
+void
+m88100_fpu_precise_exception(struct trapframe *frame)
+{
+	struct proc *p = curproc;
+	int fault_type;
+	vaddr_t fault_addr;
+	union sigval sv;
+	int sig;
+
+	fault_addr = frame->tf_sxip & XIP_ADDR;
+
+	/* if FPECR_FUNIMP is set, all other bits are undefined, ignore them */
+	if (ISSET(frame->tf_fpecr, FPECR_FUNIMP))
+		frame->tf_fpecr = FPECR_FUNIMP;
+
+	/* Reset the exception cause register */
+	__asm__ volatile ("fstcr %r0, %fcr0");
+
+	if (ISSET(frame->tf_fpecr, FPECR_FPRV)) {
+		sig = SIGILL;
+		fault_type = ILL_PRVREG;
+	} else {
+		sig = m88100_fpu_emulate(frame);
+		fault_type = SI_NOINFO;
+	}
+
+	/*
+	 * Update the floating point status register regardless of
+	 * whether we'll deliver a signal or not.
+	 */
+	__asm__ volatile ("fstcr %0, %%fcr62" :: "r"(frame->tf_fpsr));
+
+	if (sig != 0) {
+		if (sig == SIGILL) {
+			if (fault_type == SI_NOINFO)
+				fault_type = ILL_ILLOPC;
+		} else {
+			if (frame->tf_fpecr & FPECR_FIOV)
+				fault_type = FPE_FLTSUB;
+			else if (frame->tf_fpecr & FPECR_FROP)
+				fault_type = FPE_FLTINV;
+			else if (frame->tf_fpecr & FPECR_FDVZ)
+				fault_type = FPE_INTDIV;
+			else if (frame->tf_fpecr & FPECR_FUNF) {
+				if (frame->tf_fpsr & FPSR_EFUNF)
+					fault_type = FPE_FLTUND;
+				else if (frame->tf_fpsr & FPSR_EFINX)
+					fault_type = FPE_FLTRES;
+			} else if (frame->tf_fpecr & FPECR_FOVF) {
+				if (frame->tf_fpsr & FPSR_EFOVF)
+					fault_type = FPE_FLTOVF;
+				else if (frame->tf_fpsr & FPSR_EFINX)
+					fault_type = FPE_FLTRES;
+			} else if (frame->tf_fpecr & FPECR_FINX)
+				fault_type = FPE_FLTRES;
+		}
+
+		sv.sival_ptr = (void *)fault_addr;
+		KERNEL_LOCK();
+		trapsignal(p, sig, 0, fault_type, sv);
+		KERNEL_UNLOCK();
+	}
+}
+
+/*
+ * Load a floating-point argument into a fparg union, then convert it to
+ * the required format if it is of larger precision.
+ *
+ * This assumes the final format (width) is not FTYPE_INT, and the original
+ * format (orig_width) <= width.
+ */
+void
+m88100_fpu_fetch(struct trapframe *frame, u_int operandno, u_int orig_width,
+    u_int width, fparg *dest)
+{
+	u_int32_t tmp;
+
+	switch (orig_width) {
+	case FTYPE_INT:
+		tmp = operandno == 1 ? frame->tf_fpls1 : frame->tf_fpls2;
+		switch (width) {
+		case FTYPE_SNG:
+			dest->sng = int32_to_float32(tmp);
+			break;
+		case FTYPE_DBL:
+			dest->dbl = int32_to_float64(tmp);
+			break;
+		}
+		break;
+	case FTYPE_SNG:
+		tmp = operandno == 1 ? frame->tf_fphs1 : frame->tf_fphs2;
+		switch (width) {
+		case FTYPE_SNG:
+			dest->sng = tmp;
+			break;
+		case FTYPE_DBL:
+			dest->dbl = float32_to_float64(tmp);
+			break;
+		}
+		break;
+	case FTYPE_DBL:
+		tmp = operandno == 1 ? frame->tf_fphs1 : frame->tf_fphs2;
+		dest->dbl = ((float64)tmp) << 32;
+		tmp = operandno == 1 ? frame->tf_fpls1 : frame->tf_fpls2;
+		dest->dbl |= (float64)tmp;
+		break;
+	}
+}
+
+/*
+ * Emulate an FPU instruction.  On return, the trapframe registers
+ * will be modified to reflect the settings the hardware would have left.
+ */
+int
+m88100_fpu_emulate(struct trapframe *frame)
+{
+	u_int rd, t1, t2, td, tmax, opcode;
+	u_int32_t old_fpsr, old_fpcr;
+	int rc;
+
+	fparg arg1, arg2, dest;
+
+	/*
+	 * Crack the instruction.
+	 */
+	rd = frame->tf_fppt & 0x1f;
+	opcode = (frame->tf_fppt >> 11) & 0x1f;
+	t1 = (frame->tf_fppt >> 9) & 0x03;
+	t2 = (frame->tf_fppt >> 7) & 0x03;
+	td = (frame->tf_fppt >> 5) & 0x03;
+
+	if (rd == 0)	/* r0 not allowed as destination */
+		return (SIGILL);
+
+	switch (opcode) {
+	case 0x00:	/* fmul */
+	case 0x05:	/* fadd */
+	case 0x06:	/* fsub */
+	case 0x0e:	/* fdiv */
+		if ((t1 != FTYPE_SNG && t1 != FTYPE_DBL) ||
+		    (t2 != FTYPE_SNG && t2 != FTYPE_DBL) ||
+		    (td != FTYPE_SNG && td != FTYPE_DBL))
+			return (SIGILL);
+		break;
+	case 0x04:	/* flt */
+		if ((td != FTYPE_SNG && td != FTYPE_DBL) ||
+		    t2 != 0x00 || t1 != 0x00)
+			return (SIGILL);
+		break;
+	case 0x07:	/* fcmp */
+		if ((t1 != FTYPE_SNG && t1 != FTYPE_DBL) ||
+		    (t2 != FTYPE_SNG && t2 != FTYPE_DBL) ||
+		    td != 0x00)
+			return (SIGILL);
+		break;
+	case 0x09:	/* int */
+	case 0x0a:	/* nint */
+	case 0x0b:	/* trnc */
+		if ((t2 != FTYPE_SNG && t2 != FTYPE_DBL) ||
+		    t1 != 0x00 || td != 0x00)
+			return (SIGILL);
+		break;
+	default:
+		return (SIGILL);
+	}
+
+	/*
+	 * Temporarily reset the status register, so that we can tell
+	 * which exceptions are new after processing the opcode.
+	 */
+	old_fpsr = frame->tf_fpsr;
+	frame->tf_fpsr = 0;
+
+	/*
+	 * Save fpcr as well, since we might need to change rounding mode
+	 * temporarily.
+	 */
+	old_fpcr = frame->tf_fpcr;
+
+	/*
+	 * The logic for instruction emulation is:
+	 *
+	 * - the computation precision is the largest one of all the operands.
+	 * - all source operands are converted to this precision if needed.
+	 * - computation is performed.
+	 * - the result is stored into the destination operand, converting it
+	 *   to the destination precision if lower.
+	 */
+
+	switch (opcode) {
+	case 0x00:	/* fmul */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_mul(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_mul(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+
+	case 0x04:	/* flt */
+		m88100_fpu_fetch(frame, 2, FTYPE_INT, td, &dest);
+		fpu_store(frame, rd, td, td, &dest);
+		break;
+
+	case 0x05:	/* fadd */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_add(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_add(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+
+	case 0x06:	/* fsub */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_sub(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_sub(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+
+	case 0x07:	/* fcmp */
+		tmax = fpu_precision(t1, t2, IGNORE_PRECISION);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		fpu_compare(frame, &arg1, &arg2, tmax, rd, 0);
+		break;
+
+	case 0x09:	/* int */
+do_int:
+		m88100_fpu_fetch(frame, 2, t2, t2, &dest);
+		fpu_store(frame, rd, t2, FTYPE_INT, &dest);
+		break;
+
+	case 0x0a:	/* nint */
+		/* round to nearest */
+		frame->tf_fpcr = (old_fpcr & ~(FPCR_RD_MASK << FPCR_RD_SHIFT)) |
+		    (FP_RN << FPCR_RD_SHIFT);
+		goto do_int;
+
+	case 0x0b:	/* trnc */
+		/* round towards zero */
+		frame->tf_fpcr = (old_fpcr & ~(FPCR_RD_MASK << FPCR_RD_SHIFT)) |
+		    (FP_RZ << FPCR_RD_SHIFT);
+		goto do_int;
+
+	case 0x0e:	/* fdiv */
+		tmax = fpu_precision(t1, t2, td);
+		m88100_fpu_fetch(frame, 1, t1, tmax, &arg1);
+		m88100_fpu_fetch(frame, 2, t2, tmax, &arg2);
+		switch (tmax) {
+		case FTYPE_SNG:
+			dest.sng = float32_div(arg1.sng, arg2.sng);
+			break;
+		case FTYPE_DBL:
+			dest.dbl = float64_div(arg1.dbl, arg2.dbl);
+			break;
+		}
+		fpu_store(frame, rd, tmax, td, &dest);
+		break;
+	}
+
+	/*
+	 * Mark new exceptions, if any, in the fpsr, and decide whether
+	 * to send a signal or not.
+	 */
+
+	if (frame->tf_fpsr & old_fpcr)
+		rc = SIGFPE;
+	else
+		rc = 0;
+	frame->tf_fpsr |= old_fpsr;
+
+	/*
+	 * Restore fpcr as well.
+	 */
+	frame->tf_fpcr = old_fpcr;
+
+	return (rc);
+}
diff --git a/sys/arch/m88k/m88k/m88110_fp.c b/sys/arch/m88k/m88k/m88110_fp.c
index ee04e7a1d9c..7b60277d657 100644
--- a/sys/arch/m88k/m88k/m88110_fp.c
+++ b/sys/arch/m88k/m88k/m88110_fp.c
@@ -1,4 +1,4 @@
-/*	$OpenBSD: m88110_fp.c,v 1.9 2014/03/29 18:09:29 guenther Exp $	*/
+/*	$OpenBSD: m88110_fp.c,v 1.10 2014/06/09 16:26:32 miod Exp $	*/
 
 /*
  * Copyright (c) 2007, Miodrag Vallat.
@@ -31,58 +31,10 @@
 
 #include <lib/libkern/softfloat.h>
 
-/*
- * Values for individual bits in fcmp results.
- */
-#define	CC_UN	0x00000001	/* unordered */
-#define	CC_LEG	0x00000002	/* less than, equal or greater than */
-#define	CC_EQ	0x00000004	/* equal */
-#define	CC_NE	0x00000008	/* not equal */
-#define	CC_GT	0x00000010	/* greater than */
-#define	CC_LE	0x00000020	/* less than or equal */
-#define	CC_LT	0x00000040	/* less than */
-#define	CC_GE	0x00000080	/* greater than or equal */
-#define	CC_OU	0x00000100	/* out of range */
-#define	CC_IB	0x00000200	/* in range or on boundary */
-#define	CC_IN	0x00000400	/* in range */
-#define	CC_OB	0x00000800	/* out of range or on boundary */
-#define	CC_UE	0x00001000	/* unordered or equal */
-#define	CC_LG	0x00002000	/* less than or greater than */
-#define	CC_UG	0x00004000	/* unordered or greater than */
-#define	CC_ULE	0x00008000	/* unordered or less than or equal */
-#define	CC_UL	0x00010000	/* unordered or less than */
-#define	CC_UGE	0x00020000	/* unordered or greater than or equal */
-
-/*
- * Data width (matching the TD field of the instructions)
- */
-#define	FTYPE_SNG	0
-#define	FTYPE_DBL	1
-#define	FTYPE_EXT	2
-#define	FTYPE_INT	3	/* not a real T value */
-
-#define	IGNORE_PRECISION	FTYPE_SNG
-
-/* floating point value */
-typedef union {
-	float32		sng;
-	float64		dbl;
-} fparg;
+#include <m88k/m88k/fpu.h>
 
-void	fpu_compare(struct trapframe *, fparg *, fparg *, u_int, u_int, u_int);
-int	fpu_emulate(struct trapframe *, u_int32_t);
-void	fpu_fetch(struct trapframe *, u_int, u_int, u_int, fparg *);
-u_int	fpu_precision(u_int, u_int, u_int);
-void	fpu_store(struct trapframe *, u_int, u_int, u_int, fparg *);
-
-/*
- * Inlines from softfloat-specialize.h which are not made public, needed
- * for fpu_compare.
- */
-#define	float32_is_nan(a) \
-	(0xff000000 < (a << 1))
-#define	float32_is_signaling_nan(a) \
-	((((a >> 22) & 0x1ff) == 0x1fe) && (a & 0x003fffff))
+int	m88110_fpu_emulate(struct trapframe *, u_int32_t);
+void	m88110_fpu_fetch(struct trapframe *, u_int, u_int, u_int, fparg *);
 
 /*
  * All 88110 floating-point exceptions are handled there.
@@ -171,7 +123,7 @@ m88110_fpu_exception(struct trapframe *frame)
 			fault_type = FPE_FLTINV;
 			goto deliver;
 		}
-		sig = fpu_emulate(frame, insn);
+		sig = m88110_fpu_emulate(frame, insn);
 		fault_type = SI_NOINFO;
 		/*
 		 * Update the floating point status register regardless of
@@ -229,8 +181,8 @@ deliver:
  * format (orig_width) <= width.
  */
 void
-fpu_fetch(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
-    fparg *dest)
+m88110_fpu_fetch(struct trapframe *frame, u_int regno, u_int orig_width,
+    u_int width, fparg *dest)
 {
 	u_int32_t tmp;
 
@@ -267,83 +219,11 @@ fpu_fetch(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
 }
 
 /*
- * Store a floating-point result, converting it to the required format if it
- * is of smaller precision.
- *
- * This assumes the original format (orig_width) is not FTYPE_INT, and the
- * final format (width) <= orig_width.
- */
-void
-fpu_store(struct trapframe *frame, u_int regno, u_int orig_width, u_int width,
-    fparg *src)
-{
-	u_int32_t tmp;
-	u_int rd;
-
-	switch (width) {
-	case FTYPE_INT:
-		rd = float_get_round(frame->tf_fpcr);
-		switch (orig_width) {
-		case FTYPE_SNG:
-			if (rd == FP_RZ)
-				tmp = float32_to_int32_round_to_zero(src->sng);
-			else
-				tmp = float32_to_int32(src->sng);
-			break;
-		case FTYPE_DBL:
-			if (rd == FP_RZ)
-				tmp = float64_to_int32_round_to_zero(src->dbl);
-			else
-				tmp = float64_to_int32(src->dbl);
-			break;
-		}
-		if (regno != 0)
-			frame->tf_r[regno] = tmp;
-		break;
-	case FTYPE_SNG:
-		switch (orig_width) {
-		case FTYPE_SNG:
-			tmp = src->sng;
-			break;
-		case FTYPE_DBL:
-			tmp = float64_to_float32(src->dbl);
-			break;
-		}
-		if (regno != 0)
-			frame->tf_r[regno] = tmp;
-		break;
-	case FTYPE_DBL:
-		switch (orig_width) {
-		case FTYPE_DBL:
-			tmp = (u_int32_t)(src->dbl >> 32);
-			if (regno != 0)
-				frame->tf_r[regno] = tmp;
-			tmp = (u_int32_t)src->dbl;
-			if (regno != 31)
-				frame->tf_r[regno + 1] = tmp;
-			break;
-		}
-		break;
-	}
-}
-
-/*
- * Return the largest precision of all precision inputs.
- *
- * This assumes none of the inputs is FTYPE_INT.
- */
-u_int
-fpu_precision(u_int ts1, u_int ts2, u_int td)
-{
-	return max(td, max(ts1, ts2));
-}
-
-/*
  * Emulate an FPU instruction.  On return, the trapframe registers
  * will be modified to reflect the settings the hardware would have left.
  */
 int
-fpu_emulate(struct trapframe *frame, u_int32_t insn)
+m88110_fpu_emulate(struct trapframe *frame, u_int32_t insn)
 {
 	u_int rf, rd, rs1, rs2, t1, t2, td, tmax, opcode;
 	u_int32_t old_fpsr, old_fpcr;
@@ -442,8 +322,8 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 	switch (opcode) {
 	case 0x00:	/* fmul */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_mul(arg1.sng, arg2.sng);
@@ -457,19 +337,19 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 
 	case 0x01:	/* fcvt */
 		tmax = fpu_precision(IGNORE_PRECISION, t2, td);
-		fpu_fetch(frame, rs2, t2, tmax, &dest);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &dest);
 		fpu_store(frame, rd, tmax, td, &dest);
 		break;
 
 	case 0x04:	/* flt */
-		fpu_fetch(frame, rs2, FTYPE_INT, td, &dest);
+		m88110_fpu_fetch(frame, rs2, FTYPE_INT, td, &dest);
 		fpu_store(frame, rd, td, td, &dest);
 		break;
 
 	case 0x05:	/* fadd */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_add(arg1.sng, arg2.sng);
@@ -483,8 +363,8 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 
 	case 0x06:	/* fsub */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_sub(arg1.sng, arg2.sng);
@@ -498,14 +378,14 @@ fpu_emulate(struct trapframe *frame, u_int32_t insn)
 
 	case 0x07:	/* fcmp, fcmpu */
 		tmax = fpu_precision(t1, t2, IGNORE_PRECISION);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		fpu_compare(frame, &arg1, &arg2, tmax, rd, td /* fcmpu */);
 		break;
 
 	case 0x09:	/* int */
 do_int:
-		fpu_fetch(frame, rs2, t2, t2, &dest);
+		m88110_fpu_fetch(frame, rs2, t2, t2, &dest);
 		fpu_store(frame, rd, t2, FTYPE_INT, &dest);
 		break;
 
@@ -523,8 +403,8 @@ do_int:
 
 	case 0x0e:	/* fdiv */
 		tmax = fpu_precision(t1, t2, td);
-		fpu_fetch(frame, rs1, t1, tmax, &arg1);
-		fpu_fetch(frame, rs2, t2, tmax, &arg2);
+		m88110_fpu_fetch(frame, rs1, t1, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg2);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_div(arg1.sng, arg2.sng);
@@ -538,7 +418,7 @@ do_int:
 
 	case 0x0f:	/* sqrt */
 		tmax = fpu_precision(IGNORE_PRECISION, t2, td);
-		fpu_fetch(frame, rs2, t2, tmax, &arg1);
+		m88110_fpu_fetch(frame, rs2, t2, tmax, &arg1);
 		switch (tmax) {
 		case FTYPE_SNG:
 			dest.sng = float32_sqrt(arg1.sng);
@@ -569,167 +449,3 @@ do_int:
 
 	return (rc);
 }
-
-/*
- * Perform a compare instruction (fcmp, fcmpu).
- *
- * If either operand is NaN, the result is unordered.  This causes an
- * reserved operand exception (except for nonsignalling NaNs for fcmpu).
- */
-void
-fpu_compare(struct trapframe *frame, fparg *s1, fparg *s2, u_int width,
-    u_int rd, u_int fcmpu)
-{
-	u_int32_t cc;
-	int zero, s1positive, s2positive;
-
-	/*
-	 * Handle NaNs first, and raise invalid if fcmp or signaling NaN.
-	 */
-	switch (width) {
-	case FTYPE_SNG:
-		if (float32_is_nan(s1->sng)) {
-			if (!fcmpu || float32_is_signaling_nan(s1->sng))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		if (float32_is_nan(s2->sng)) {
-			if (!fcmpu || float32_is_signaling_nan(s2->sng))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		break;
-	case FTYPE_DBL:
-		if (float64_is_nan(s1->dbl)) {
-			if (!fcmpu || float64_is_signaling_nan(s1->dbl))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		if (float64_is_nan(s2->dbl)) {
-			if (!fcmpu || float64_is_signaling_nan(s2->dbl))
-				float_set_invalid();
-			cc = CC_UN;
-			goto done;
-		}
-		break;
-	}
-
-	/*
-	 * Now order the two numbers.
-	 */
-	switch (width) {
-	case FTYPE_SNG:
-		if (float32_eq(s1->sng, s2->sng))
-			cc = CC_EQ;
-		else if (float32_lt(s1->sng, s2->sng))
-			cc = CC_LT | CC_NE;
-		else
-			cc = CC_GT | CC_NE;
-		break;
-	case FTYPE_DBL:
-		if (float64_eq(s1->dbl, s2->dbl))
-			cc = CC_EQ;
-		else if (float64_lt(s1->dbl, s2->dbl))
-			cc = CC_LT | CC_NE;
-		else
-			cc = CC_GT | CC_NE;
-		break;
-	}
-
-done:
-
-	/*
-	 * Complete condition code mask.
-	 */
-
-	if (cc & CC_UN)
-		cc |= CC_UE | CC_UG | CC_ULE | CC_UL | CC_UGE;
-	if (cc & CC_EQ)
-		cc |= CC_LE | CC_GE | CC_UE;
-	if (cc & CC_GT)
-		cc |= CC_GE;
-	if (cc & CC_LT)
-		cc |= CC_LE;
-	if (cc & (CC_LT | CC_GT))
-		cc |= CC_LG;
-	if (cc & (CC_LT | CC_GT | CC_EQ))
-		cc |= CC_LEG;
-	if (cc & CC_GT)
-		cc |= CC_UG;
-	if (cc & CC_LE)
-		cc |= CC_ULE;
-	if (cc & CC_LT)
-		cc |= CC_UL;
-	if (cc & CC_GE)
-		cc |= CC_UGE;
-
-	/*
-	 * Fill the interval bits.
-	 * s1 is compared to the interval [0, s2].
-	 */
-	if (!(cc & CC_UN)) {
-		if (cc & CC_EQ) {
-			/* if s1 and s2 are equal, s1 is on boundary */
-			cc |= CC_IB | CC_OB;
-			goto completed;
-		}
-
-		/* s1 and s2 are either Zero, numbers or Inf */
-		switch (width) {
-		case FTYPE_SNG:
-			zero = float32_eq(s1->sng, 0);
-			break;
-		case FTYPE_DBL:
-			zero = float64_eq(s1->dbl, 0LL);
-			break;
-		}
-		if (zero) {
-			/* if s1 is zero, it is on boundary */
-			cc |= CC_IB | CC_OB;
-			goto completed;
-		}
-
-		switch (width) {
-		case FTYPE_SNG:
-			s1positive = s1->sng >> 31 == 0;
-			s2positive = s2->sng >> 31 == 0;
-			break;
-		case FTYPE_DBL:
-			s1positive = s1->dbl >> 63 == 0;
-			s2positive = s2->dbl >> 63 == 0;
-			break;
-		}
-		if (s2positive) {
-			/* s2 is positive, the interval is [0, s2] */
-			if (cc & CC_GT) {
-				/* 0 <= s2 < s1 -> out of interval */
-				cc |= CC_OU | CC_OB;
-			} else if (s1positive) {
-				/* 0 < s1 < s2 -> in interval */
-				cc |= CC_IB | CC_IN;
-			} else {
-				/* s1 < 0 <= s2 */
-				cc |= CC_OU | CC_OB;
-			}
-		} else {
-			/* s2 is negative, the interval is [s2, 0] */
-			if (cc & CC_LT) {
-				/* s1 < s2 <= 0 */
-				cc |= CC_OU | CC_OB;
-			} else if (!s1positive) {
-				/* s2 < s1 < 0 */
-				cc |= CC_IB | CC_IN;
-			} else {
-				/* s2 < 0 < s1 */
-				cc |= CC_OU | CC_OB;
-			}
-		}
-	}
-
-completed:
-	if (rd != 0)
-		frame->tf_r[rd] = cc;
-}
diff --git a/sys/arch/m88k/m88k/trap.c b/sys/arch/m88k/m88k/trap.c
index 302efe39490..0e1dec19918 100644
--- a/sys/arch/m88k/m88k/trap.c
+++ b/sys/arch/m88k/m88k/trap.c
@@ -1,4 +1,4 @@
-/*	$OpenBSD: trap.c,v 1.97 2014/06/09 14:33:20 miod Exp $	*/
+/*	$OpenBSD: trap.c,v 1.98 2014/06/09 16:26:32 miod Exp $	*/
 /*
  * Copyright (c) 2004, Miodrag Vallat.
  * Copyright (c) 1998 Steve Murphree, Jr.
@@ -506,10 +506,9 @@ user_fault:
 		break;
 	case T_FPEPFLT+T_USER:
 		m88100_fpu_precise_exception(frame);
-		goto maysigfpe;
+		goto userexit;
 	case T_FPEIFLT+T_USER:
 		m88100_fpu_imprecise_exception(frame);
-maysigfpe:
 		/* Check for a SIGFPE condition */
 		if (frame->tf_fpsr & frame->tf_fpcr) {
 			sig = SIGFPE;
@@ -616,6 +615,7 @@ maysigfpe:
 		frame->tf_ipfsr = frame->tf_dpfsr = 0;
 	}
 
+userexit:
 	userret(p);
 }
 #endif /* M88100 */