3 files changed, 921 insertions, 882 deletions
diff --git a/sys/arch/m88k/conf/files.m88k b/sys/arch/m88k/conf/files.m88k
index 82a36c01148..44679231cc2 100644
--- a/sys/arch/m88k/conf/files.m88k
+++ b/sys/arch/m88k/conf/files.m88k
@@ -1,4 +1,4 @@
-#	$OpenBSD: files.m88k,v 1.25 2013/06/07 17:31:31 miod Exp $
+#	$OpenBSD: files.m88k,v 1.26 2014/06/09 10:26:10 miod Exp $
 
 file	arch/m88k/m88k/atomic.S				multiprocessor
 file	arch/m88k/m88k/db_disasm.c			ddb
@@ -7,6 +7,7 @@ file	arch/m88k/m88k/db_sstep.c			ddb
 file	arch/m88k/m88k/db_trace.c			ddb
 file	arch/m88k/m88k/in_cksum.c			inet
 file	arch/m88k/m88k/m88100_fp.S			m88100
+file	arch/m88k/m88k/m88100_fp_imp.S			m88100
 file	arch/m88k/m88k/m88100_machdep.c			m88100
 file	arch/m88k/m88k/m88110_mmu.S			m88110
 file	arch/m88k/m88k/m8820x_machdep.c			m88100
diff --git a/sys/arch/m88k/m88k/m88100_fp.S b/sys/arch/m88k/m88k/m88100_fp.S
index e0c39c8041f..6e4cbd40c62 100644
--- a/sys/arch/m88k/m88k/m88100_fp.S
+++ b/sys/arch/m88k/m88k/m88100_fp.S
@@ -1,4 +1,4 @@
-/* $OpenBSD: m88100_fp.S,v 1.9 2013/09/05 20:40:32 miod Exp $	*/
+/* $OpenBSD: m88100_fp.S,v 1.10 2014/06/09 10:26:10 miod Exp $	*/
 /*
  * Mach Operating System
  * Copyright (c) 1991 Carnegie Mellon University
@@ -63,13 +63,8 @@
 #define s2zero		2
 #define sigbit		19
 
-#define modehi		30
-#define modelo		29
 #define rndhi		15
 #define rndlo		14
-#define efunf		7
-#define efovf		6
-#define efinx		5
 
 ENTRY(m88100_fpu_precise_exception)
 	or	%r29, %r2,  %r0		/* r29 is now the E.F. */
@@ -782,822 +777,6 @@ ASLOCAL(inf)
 					/* remaining alternative */
 
 /*
- * Branch to the routine to make a denormalized number.
- */
-ASLOCAL(FPunderflow)
-	st	%r1, %r31, 0	/* save return address */
-	set	%r2, %r2,  1<underflow>
-	set	%r2, %r2,  1<inexact>
-
-/*
- * Now the floating point number, which has an exponent smaller than what
- * IEEE allows, must be denormalized. Denormalization is done by calculating
- * the difference between a denormalized exponent and an underflow exponent
- * and shifting the mantissa by that amount. A one may need to be subtracted
- * from the LSB if a one was added during rounding.
- * %r9 is used to contain the guard, round, sticky, and an inaccuracy bit in
- * case some bits were shifted off the mantissa during denormalization.
- * %r9 will contain:
- *   bit 4 -- new addone if one added during rounding after denormalization
- *   bit 3 -- inaccuracy flag caused by denormalization or pre-denormalization
- *            inexactness
- *   bit 2 -- guard bit of result
- *   bit 1 -- round bit of result
- *   bit 0 -- sticky bit of result
- */
-
-FPU_denorm:
-	bb1.n	destsize, %r12, Udouble	/* denorm for double */
-	 extu	%r9,  %r10, 3<26>	/* load r9 with grs */
-Usingle:
-	mak	%r5,  %r10, 21<3>	/* extract high 21 bits of mantissa */
-	extu	%r6,  %r11, 3<29>	/* extract low 3 bits of mantissa */
-	or	%r11, %r5,  %r6		/* form 24 bits of mantissa */
-
-/* See if the addone bit is set and unround if it is. */
-	bb0.n	25,   %r10, nounrounds	/* do not unround if addone bit clear */
-	 extu	%r6,  %r12, 12<20>	/* extract signed exponent from IMPCR */
-unrounds:
-	subu	%r11, %r11, 1		/* subtract 1 from mantissa */
-
-/*
- * If the hidden bit is cleared after subtracting the one, then the one added
- * during the rounding must have propagated through the mantissa. The exponent
- * will need to be decremented.
- */
-	bb1	23,   %r11, nounrounds	/* if hidden bit is set, the exponent */
-					/* does not need to be decremented */
-decexps:
-	sub	%r6,  %r6,  1		/* decrement exponent */
-	set	%r11, %r11, 1<23>	/* set the hidden bit */
-
-/*
- * For both single and double precision, there are cases where it is easier
- * and quicker to make a special case. Examples of this are if the shift
- * amount is only 1 or 2, or all the mantissa is shifted off, or all the
- * mantissa is shifted off and it is still shifting, or, in the case of
- * doubles, if the shift amount is around the boundary of MANTLO and MANTHI.
- */
-
-nounrounds:
-	or	%r8,  %r0,  %lo16(0x00000f81)
-					/* load r8 with -127 in decimal */
-					/* for lowest 12 bits */
-	sub	%r7,  %r8,  %r6		/* find difference between two */
-					/* exponents, this amount is the */
-					/* shift amount */
-	cmp	%r6,  %r7,  3		/* check to see if r7 contains 3 */
-					/* or more */
-	bb1	ge,   %r6,  threesing	/* br to code that handles shifts of */
-					/* 3 or more */
-	cmp	%r6,  %r7,  2		/* check to see if r7 contains 2 */
-	bb1	eq,   %r6,  twosing	/* br to code that handles shifts of */
-					/* 2 */
-one:
-	rot	%r9,  %r9,  0<1>	/* rotate roundoff register once, */
-					/* this places guard in round and */
-					/* round in sticky */
-	bb0	31,   %r9,  nosticky1s	/* do not or round and sticky if */
-					/* sticky is 0, this lost bit will */
-					/* be cleared later */
-	set	%r9,  %r9,  1<0>	/* or round and sticky */
-nosticky1s:
-	bb0	0,    %r11, guardclr1s	/* do not set guard bit if LSB = 0 */
-	set	%r9,  %r9,  1<2>	/* set guard bit */
-guardclr1s:
-	extu	%r11, %r11, 31<1>	/* shift mantissa right 1 */
-	br.n	round			/* round result */
-	 mak	%r9,  %r9,  3<0>	/* clear bits lost during rotation */
-
-twosing:
-	rot	%r9,  %r9,  0<2>	/* rotate roundoff register twice, */
-					/* this places guard in sticky */
-	bb0	30,   %r9,  nosticky2s	/* old sticky is now bit 30: nothing */
-					/* to or in if it is 0, this lost bit */
-					/* will be cleared later */
-	br.n	noround2s		/* skip or old guard and old round if */
-					/* old sticky set */
-	 set	%r9,  %r9,  1<0>	/* or guard and sticky */
-nosticky2s:
-	bb0	31,   %r9,  noround2s	/* old round is now bit 31: nothing */
-					/* to or in if it is 0, this lost bit */
-					/* will be cleared later */
-	set	%r9,  %r9,  1<0>	/* or guard and round */
-noround2s:
-	bb0	0,    %r11, roundclr2s	/* do not set round bit if LSB = 0 */
-	set	%r9,  %r9,  1<1>	/* set round bit */
-roundclr2s:
-	bb0	1,    %r11, guardclr2s	/* do not set guard bit if LSB+1 = 0 */
-	set	%r9,  %r9,  1<2>	/* set guard bit */
-guardclr2s:
-	extu	%r11, %r11, 30<2>	/* shift mantissa right 2 */
-	br.n	round			/* round result */
-	 mak	%r9,  %r9,  3<0>	/* keep only g, r, s: clear the bits */
-
-/*
- * Shift of 3 or more (single): every one of the old guard, round and
- * sticky bits ends up below the new round position, so all three are
- * folded into the new sticky bit and guard and round are left clear.
- * The new guard and round are taken from the mantissa further down.
- * r9 holds nothing but those three bits (loaded at FPU_denorm), so it
- * is nonzero exactly when one of them is set.
- */
-threesing:
-	bcnd	eq0,  %r9,  noguard3s	/* nothing was lost so far, r9 stays */
-					/* zero */
-	or	%r9,  %r0,  1		/* sticky = old guard|round|sticky; */
-					/* guard and round are cleared on */
-					/* every path, otherwise stale bits */
-					/* would be or-ed into the new guard */
-					/* and round picked from the mantissa */
-	/* FALLTHROUGH to noguard3s */
-noguard3s:
-	cmp	%r6,  %r7,  23		/* check if # of shifts is <=23 */
-	bb1	gt,   %r6,  s24		/* branch to see if shifts = 24 */
-	sub	%r6,  %r7,  2		/* get number of bits to check for */
-					/* sticky */
-	mak	%r6,  %r6,  5<5>	/* shift width into width field */
-	mak	%r8,  %r11, %r6		/* mask off shifted bits -2 */
-	ff1	%r8,  %r8		/* see if r8 has any ones */
-	bb1	5,    %r8,  nostky23	/* do not set sticky if no ones found */
-	set	%r9,  %r9,  1<0>	/* set sticky bit */
-nostky23:
-	or	%r8,  %r0,  0x22	/* start code to get new mantissa */
-					/* plus two extra bits for new round */
-					/* and new guard bits */
-	subu	%r8,  %r8,  %r7
-	mak	%r8,  %r8,  5<5>	/* shift field width into second five */
-					/* bits */
-	extu	%r6,  %r6,  5<5>	/* shift previous shifted -2 into */
-					/* offset field */
-	or	%r6,  %r6,  %r8		/* complete field */
-	extu	%r11, %r11, %r6		/* form new mantissa with two extra */
-					/* bits */
-
-	bb0	0,    %r11, nornd3s	/* do not set new round bit */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-nornd3s:
-	bb0	1,    %r11, nogrd3s	/* do not set new guard bit */
-	set	%r9,  %r9,  1<2>	/* set new guard bit */
-nogrd3s:
-	br.n	round			/* round mantissa */
-	 extu	%r11, %r11, 30<2>	/* shift off remaining two bits */
-
-s24:
-	cmp	%r6,  %r7,  24		/* check to see if # of shifts is 24 */
-	bb1	gt,   %r6,  s25		/* branch to see if shifts = 25 */
-	bb1	0,    %r9,  nostky24	/* skip checking if old sticky set */
-	extu	%r8,  %r11, 22<0>	/* prepare to check bits that will be */
-					/* shifted into the sticky */
-	ff1	%r8,  %r8		/* see if there are any 1''s */
-	bb1	5,    %r8,  nostky24	/* do not set sticky if no ones found */
-	set	%r9,  %r9,  1<0>	/* set sticky bit */
-nostky24:
-	bb0	22,   %r11, nornd24	/* do not set new round bit */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-nornd24:
-	set	%r9,  %r9,  1<2>	/* set new guard bit, this is hidden */
-					/* bit */
-	br.n	round			/* round mantissa */
-	 or	%r11, %r0,  %r0		/* clear r11, all of mantissa */
-					/* shifted off */
-
-s25:
-	cmp	%r6,  %r7,  25		/* check to see if # of shifts is 25 */
-	bb1	gt,   %r6,  s26		/* branch to execute for shifts => 26 */
-	bb1	0,    %r9,  nostky25	/* skip checking if old sticky set */
-	extu	%r8,  %r11, 23<0>	/* prepare to check bits that will be */
-					/* shifted into the sticky */
-	ff1	%r8,  %r8		/* see if there are any 1''s */
-	bb1	5,    %r8,  nostky25	/* do not set sticky if no ones found */
-	set	%r9,  %r9,  1<0>	/* set sticky bit */
-nostky25:
-	set	%r9,  %r9,  1<1>	/* set new round bit, this is hidden */
-					/* bit */
-	clr	%r9,  %r9,  1<2>	/* clear guard bit since nothing */
-					/* shifted in */
-	br.n	round			/* round and assemble result */
-	 or	%r11, %r0,  %r0		/* clear r11, all of mantissa */
-					/* shifted off */
-
-s26:
-	set	%r9,  %r9,  1<0>	/* set sticky bit, this contains */
-					/* hidden bit */
-	clr	%r9,  %r9,  2<1>	/* clear guard and round bits since */
-					/* nothing shifted in */
-	br.n	round			/* round and assemble result */
-	 or	%r11, %r0,  %r0		/* clear mantissa */
-
-Udouble:
-	mak	%r5,  %r10, 21<0>	/* r5 = hidden bit + upper mantissa */
-	bb0.n	25,   %r10, nounroundd	/* do not unround if addone bit clear */
-	 extu	%r6,  %r12, 12<20>	/* extract signed exponent from IMPCR */
-unroundd:
-	or	%r8,  %r0,  1		/* load a 1 so subu.co can be used */
-	subu.co	%r11, %r11, %r8		/* subtract 1 from mantissa */
-	subu.ci	%r5,  %r5,  %r0		/* subtract borrow from upper word */
-	bb1	20,   %r5,  nounroundd	/* if hidden bit is set, then */
-					/* exponent does not need to be */
-					/* decremented */
-decexpd:
-	sub	%r6,  %r6,  1		/* decrement exponent */
-	set	%r5,  %r5,  1<20>	/* set the hidden bit */
-
-nounroundd:
-	or	%r8,  %r0,  %lo16(0x00000c01)
-					/* load r8 with -1023 in decimal */
-					/* for lowest 12 bits */
-	sub	%r7,  %r8,  %r6		/* find difference between two */
-					/* exponents, this amount is the */
-					/* shift amount */
-	cmp	%r6,  %r7,  3		/* check to see if r7 contains */
-					/* 3 or more */
-	bb1	ge,   %r6,  threedoub	/* br to code that handles shifts of */
-					/* 3 or more */
-	cmp	%r6,  %r7,  2		/* check to see if r7 contains 2 */
-	bb1	eq,   %r6,  twodoub	/* br to code that handles shifts */
-					/* of 2 */
-
-onedoub:
-	rot	%r9,  %r9,  0<1>	/* rotate roundoff register once, */
-					/* this places guard in round and */
-					/* round in sticky */
-	bb0	31,   %r9,  nosticky1d	/* do not or round and sticky if */
-					/* sticky is 0, this lost bit */
-					/* will be cleared later */
-	set	%r9,  %r9,  1<0>	/* or old round and old sticky into */
-					/* new sticky */
-nosticky1d:
-	bb0	0,    %r11, guardclr1d	/* do not set new guard bit */
-					/* if old LSB = 0 */
-	set	%r9,  %r9,  1<2>	/* set new guard bit */
-guardclr1d:
-	extu	%r11, %r11, 31<1>	/* shift lower mantissa over 1 */
-	mak	%r6,  %r5,  1<31>	/* shift off low bit of high mantissa */
-	or	%r11, %r6,  %r11	/* load high bit onto lower mantissa */
-	extu	%r5,  %r5,  20<1>	/* shift right once upper 20 bits of */
-					/* mantissa */
-	br.n	round			/* round mantissa and assemble result */
-	 mak	%r9,  %r9,  3<0>	/* clear bits lost during rotation */
-
-twodoub:
-	rot	%r9,  %r9,  0<2>	/* rotate roundoff register twice, */
-					/* this places old guard into sticky */
-	bb0	30,   %r9,  nosticky2d	/* do not or old guard and old sticky */
-					/* if old sticky is 0 */
-	br.n	noround2d		/* skip or of old guard and old round */
-					/* if old sticky set */
-	 set	%r9,  %r9,  1<0>	/* or old guard and old sticky into */
-					/* new sticky */
-nosticky2d:
-	bb0	31,   %r9,  noround2d	/* do not or old guard and old round */
-					/* if old round is 0 */
-	set	%r9,  %r9,  1<0>	/* or old guard and old round into */
-					/* new sticky */
-noround2d:
-	bb0	0,    %r11, roundclr2d	/* do not set round bit */
-					/* if old LSB = 0 */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-roundclr2d:
-	bb0	1,    %r11, guardclr2d	/* do not set guard bit */
-					/* if old LSB + 1 = 0 */
-	set	%r9,  %r9,  1<2>	/* set new guard bit */
-guardclr2d:
-	extu	%r11, %r11, 30<2>	/* shift lower mantissa over 2 */
-	mak	%r6,  %r5,  2<30>	/* shift off low bits of high */
-					/* mantissa */
-	or	%r11, %r6,  %r11	/* load high bit onto lower mantissa */
-	extu	%r5,  %r5,  19<2>	/* shift right twice upper 19 bits of */
-					/* mantissa */
-	br.n	round			/* round mantissa and assemble result */
-	 mak	%r9,  %r9,  3<0>	/* clear bits lost during rotation */
-
-/*
- * Shift of 3 or more (double): all of the old guard, round and sticky
- * bits land below the new round position, so they may only contribute
- * to the new sticky bit. The new guard and round are taken from the
- * mantissa further down. r9 holds nothing but those three bits (loaded
- * at FPU_denorm), so it is nonzero exactly when one of them is set.
- */
-threedoub:
-	bcnd	eq0,  %r9,  noguard3d	/* nothing was lost so far, r9 stays */
-					/* zero */
-	or	%r9,  %r0,  1		/* sticky = old guard|round|sticky; */
-					/* guard and round are cleared here */
-					/* on every path, otherwise stale */
-					/* bits would be or-ed into the new */
-					/* guard and round picked from the */
-					/* mantissa below */
-	/* FALLTHROUGH to noguard3d */
-noguard3d:
-	cmp	%r6,  %r7,  32		/* do I need to work with a 1 or 2 */
-					/* word mantissa when forming sticky, */
-					/* round and guard */
-	bb1	gt,   %r6,  d33		/* jump to code that handles 2 word */
-					/* mantissas */
-	sub	%r6,  %r7,  2		/* get number of bits to check for */
-					/* sticky */
-	mak	%r6,  %r6,  5<5>	/* shift width into width field */
-	mak	%r8,  %r11, %r6		/* mask off shifted bits -2 */
-	ff1	%r8,  %r8		/* see if r8 has any ones */
-	bb1	5,    %r8,  nostky32	/* do not set sticky if no ones found */
-	set	%r9,  %r9,  1<0>	/* set sticky bit */
-nostky32:
-	or	%r8,  %r0,  0x22	/* start code to get new mantissa */
-					/* plus two extra bits for new round */
-					/* and new guard bits, the upper word */
-					/* bits will be shifted after the */
-					/* round and guard bits are handled */
-	subu	%r8,  %r8,  %r7
-	mak	%r8,  %r8,  5<5>	/* shift field width into second five */
-					/* bits */
-	extu	%r6,  %r6,  5<5>	/* shift previous shifted -2 into */
-					/* offset field */
-	or	%r6,  %r6,  %r8		/* complete bit field */
-	extu	%r11, %r11, %r6		/* partially form new low mantissa */
-					/* with 2 more bits */
-	bb0	0,    %r11, nornd32d	/* do not set new round bit */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-nornd32d:
-	bb0	1,    %r11, nogrd32d	/* do not set new guard bit */
-	set	%r9,  %r9,  1<2>	/* set new guard bit */
-nogrd32d:
-	extu	%r11, %r11, 30<2>	/* shift off remaining two bits */
-	mak	%r6,  %r7,  5<5>	/* shift field width into second 5 */
-					/* bits, if the width is 32, then */
-					/* these bits will be 0 */
-	or	%r8,  %r0,  32		/* load word length into r8 */
-	sub	%r8,  %r8,  %r7		/* form offset for high bits moved to */
-					/* low word */
-	or	%r6,  %r6,  %r8		/* form complete bit field */
-	mak	%r6,  %r5,  %r6		/* get shifted bits of high word */
-	or	%r11, %r6,  %r11	/* form new low word of mantissa */
-	bcnd	ne0,  %r8,  regular33	/* do not adjust for special case */
-					/* of r8 containing zeros, which */
-	br.n	round			/* would cause all of the bits to be */
-	 or	%r5,  %r0,  %r0		/* extracted under the regular method */
-regular33:
-	mak	%r6,  %r7,  5<0>	/* place lower 5 bits of shift */
-					/* into r6 */
-	mak	%r8,  %r8,  5<5>	/* shift r8 into width field */
-	or	%r6,  %r6,  %r8		/* form field for shifting of upper */
-					/* bits */
-	br.n	round			/* round and assemble result */
-	 extu	%r5,  %r5,  %r6		/* form new high word mantissa */
-
-d33:
-	cmp	%r6,  %r7,  33		/* is the number of bits to be */
-					/* shifted exactly 33? */
-	bb1	gt,   %r6,  d34		/* more than 33, go check for 34 */
-	bb1	0,    %r9,  nostky33	/* skip checking if old sticky set */
-	mak	%r6,  %r11, 31<0>	/* r6 = low 31 bits of the low word, */
-					/* these are shifted into sticky */
-	ff1	%r8,  %r6		/* check the masked bits in r6 for ones */
-	bb1	5,    %r8,  nostky33	/* do not set sticky if there are no */
-					/* ones (ff1 result has bit 5 set) */
-	set	%r9,  %r9,  1<0>	/* set new sticky bit */
-nostky33:
-	bb0	31,   %r11, nornd33	/* do not set round if bit is not a 1 */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-nornd33:
-	bb0	0,    %r5,  nogrd33	/* do not set guard bit if bit is not */
-					/* a 1 */
-	set	%r9,  %r9,  1<2>	/* set new guard bit */
-nogrd33:
-	extu	%r11, %r5,  31<1>	/* shift high bits into low word */
-	br.n	round			/* round and assemble result */
-	 or	%r5,  %r0,  %r0		/* clear high word */
-
-d34:
-	cmp	%r6,  %r7,  34		/* is the number of bits to be */
-					/* shifted 34? */
-	bb1	gt,   %r6,  d35		/* check to see if # of bits is >= 35 */
-	bb1	0,    %r9,  nostky34	/* skip checking if old sticky set */
-	ff1	%r8,  %r11		/* check bits that will be shifted */
-					/* into sticky */
-	bb1	5,    %r8,  nostky34	/* do not set sticky if there are no */
-					/* ones */
-	set	%r9,  %r9,  1<0>	/* set new sticky bit */
-nostky34:
-	bb0	0,    %r5,  nornd34	/* do not set round if bit is not a 1 */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-nornd34:
-	bb0	1,    %r5,  nogrd34	/* do not set guard bit if bit is not */
-					/* a 1 */
-	set	%r9,  %r9,  1<2>	/* set new guard bit */
-nogrd34:
-	extu	%r11, %r5,  30<2>	/* shift high bits into low word */
-	br.n	round			/* round and assemble result */
-	 or	%r5,  %r0,  %r0		/* clear high word */
-
-d35:
-	cmp	%r6,  %r7,  52		/* see if # of shifts is */
-					/* 35 <= X <= 52 */
-	bb1	gt,   %r6,  d53		/* more than 52 shifts, go check 53 */
-	bb1.n	0,    %r9,  nostky35	/* skip checking if old sticky set */
-	 sub	%r7,  %r7,  34		/* delay slot, always executed: */
-					/* subtract 32 from # of shifts so */
-					/* that operations can be done on the */
-					/* upper word, and two more to keep */
-					/* the new guard and round bits */
-	ff1	%r8,  %r11		/* see if lower word has a bit for */
-					/* sticky */
-	bb1	5,    %r8,  stkycheck35 /* none there, see if upper word has */
-					/* any sticky bits */
-	br.n	nostky35		/* quit checking for sticky */
-	 set	%r9,  %r9,  1<0>	/* set sticky bit */
-stkycheck35:
-	mak	%r6,  %r7,  5<5>	/* place width into width field */
-	mak	%r8,  %r5,  %r6		/* mask off shifted bits - 2 */
-	ff1	%r8,  %r8		/* see if r8 has any ones */
-	bb1	5,    %r8,  nostky35	/* do not set sticky if no ones found */
-	set	%r9,  %r9,  1<0>	/* set sticky bit */
-nostky35:
-	or	%r8,  %r0,  32		/* look at what does not get shifted */
-					/* off plus guard and round, */
-					/* remember that the r7 value was */
-					/* adjusted so that it did not */
-					/* include new guard or new round in */
-					/* shifted off bits */
-	subu	%r8,  %r8,  %r7		/* complement width */
-	mak	%r8,  %r8,  5<5>	/* shift width into width field */
-	or	%r8,  %r7,  %r8		/* add offset field */
-	extu	%r11, %r5,  %r8		/* extract upper bits into low word */
-	bb0	0,    %r11, nornd35	/* do not set new round bit */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-nornd35:
-	bb0	1,    %r11, nogrd35	/* do not set new guard bit */
-	set	%r9,  %r9,  1<2>	/* set new guard bit */
-nogrd35:
-	extu	%r11, %r11, 30<2>	/* shift off remaining guard and round bits */
-	br.n	round			/* round and assemble result */
-	 or	%r5,  %r0,  %r0		/* clear high word */
-
-d53:
-	cmp	%r6,  %r7,  53		/* check to see if # of shifts is 53 */
-	bb1	gt,   %r6,  d54		/* branch to see if shifts = 54 */
-	bb1	0,    %r9,  nostky53	/* skip checking if old sticky set */
-	ff1	%r8,  %r11		/* see if lower word has a bit for */
-					/* sticky */
-	bb1	5,    %r8,  stkycheck53 /* see if upper word has any sticky */
-					/* bits */
-	br.n	nostky53		/* quit checking for sticky */
-	 set	%r9,  %r9,  1<0>	/* set sticky bit */
-stkycheck53:
-	mak	%r6,  %r5,  19<0>	/* check bits that are shifted into */
-					/* sticky */
-	ff1	%r8,  %r6		/* see if r6 has any ones */
-	bb1	5,    %r8,  nostky53	/* do not set sticky if no ones found */
-	set	%r9,  %r9,  1<0>	/* set sticky bit */
-nostky53:
-	bb0	19,   %r5,  nornd53	/* do not set new round bit */
-	set	%r9,  %r9,  1<1>	/* set new round bit */
-nornd53:
-	set	%r9,  %r9,  1<2>	/* set new guard bit, this is hidden */
-					/* bit */
-	or	%r5,  %r0,  %r0		/* clear high word */
-	br.n	round			/* round and assemble result */
-	 or	%r11, %r0,  %r0		/* clear low word */
-
-d54:
-	cmp	%r6,  %r7,  54		/* check to see if # of shifts is 54 */
-	bb1	gt,   %r6,  d55		/* branch to execute for shifts =>55 */
-	bb1	0,    %r9,  nostky54	/* skip checking if old sticky set */
-	ff1	%r8,  %r11		/* see if lower word has a bit for */
-					/* sticky */
-	bb1	5,    %r8,  stkycheck54 /* see if upper word has any sticky */
-					/* bits */
-	br.n	nostky54		/* quit checking for sticky */
-	 set	%r9,  %r9,  1<0>	/* set sticky bit */
-stkycheck54:
-	mak	%r6,  %r5,  20<0>	/* check bits that are shifted into */
-					/* sticky */
-	ff1	%r8,  %r6		/* see if r6 has any ones */
-	bb1	5,    %r8,  nostky54	/* do not set sticky if no ones found */
-	set	%r9,  %r9,  1<0>	/* set sticky bit */
-nostky54:
-	set	%r9,  %r9,  1<1>	/* set new round bit, this is hidden */
-					/* bit */
-	clr	%r9,  %r9,  1<2>	/* clear guard bit since nothing */
-					/* shifted in */
-	or	%r5,  %r0,  %r0		/* clear high word */
-	br.n	round			/* round and assemble result */
-	 or	%r11, %r0,  %r0		/* clear low word */
-
-d55:
-	set	%r9,  %r9,  1<0>	/* set new sticky bit, this contains */
-					/* hidden bit */
-	clr	%r9,  %r9,  2<1>	/* clear guard and round bits since */
-					/* nothing shifted in */
-	or	%r5,  %r0,  %r0		/* clear high word */
-	or	%r11, %r0,  %r0		/* clear low word */
-
-
-/*
- * The first thing the rounding code does is check whether any of guard,
- * round, or sticky is set. If all are clear, there is no denormalization
- * loss and no need to round, so branch straight to assemble the answer.
- * For rounding, a branch table is set up. The two leftmost index bits are
- * the rounding mode. The third bit is either the LSB of the mantissa or the
- * sign bit, depending on the rounding mode. The three LSB''s are the guard,
- * round and sticky bits.
- */
-
-round:
-	ff1	%r8,  %r9		/* see if there is denormalization */
-					/* loss */
-	bb1	5,    %r8,  assemble	/* no denormalization loss or */
-					/* inexactness */
-	extu	%r6,  %r10, 2<modelo>	/* extract rounding mode */
-	bb1.n	modehi, %r10, signext	/* use sign bit instead of LSB */
-	 mak	%r6,  %r6,  2<4>	/* shift over rounding mode */
-	extu	%r7,  %r11, 1<0>	/* extract LSB */
-	br.n	grs			/* skip sign extraction */
-	 mak	%r7,  %r7,  1<3>	/* shift over LSB */
-signext:
-	extu	%r7,  %r10, 1<31>	/* extract sign bit */
-	mak	%r7,  %r7,  1<3>	/* shift sign bit over */
-grs:
-	or	%r6,  %r6,  %r7
-	or	%r6,  %r6,  %r9		/* or in guard, round, and sticky */
-	or.u	%r1,  %r0,  %hi16(roundtable) /* form address of branch table */
-	or	%r1,  %r1,  %lo16(roundtable)
-	lda	%r6,  %r1[%r6]		/* scale offset into branch table */
-	jmp.n	%r6			/* jump to branch table */
-	 set	%r9,  %r9,  1<3>	/* set inexact flag in r9 */
-
-roundtable:
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	addone
-	br	addone
-	br	addone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	noaddone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	addone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-	br	noaddone
-
-/* Round by adding a one to the LSB of the mantissa. */
-addone:
-	or	%r6,  %r0,  1		/* load a 1 into r6 so that add.co */
-					/* can be used */
-	add.co	%r11, %r11, %r6		/* add a one to the lower word of */
-					/* result */
-	bb0.n	destsize, %r12, noaddone/* single result, forget carry */
-	 set	%r9,  %r9,  1<4>	/* indicate that a 1 has been added */
-	add.ci	%r5,  %r5,  %r0		/* propagate carry into high word */
-
-noaddone:
-	set	%r2,  %r2,  1<inexact>
-	set	%r2,  %r2,  1<underflow>
-
-/*
- * Assemble the result of the denormalization routine for writeback to the
- * destination register. The exponent of a denormalized number is zero,
- * so simply assemble the sign and the new mantissa.
- */
-
-assemble:
-	bb1	destsize, %r12, doubassem	/* assemble double result */
-	bb0	sign, %r10, exassems		/* exit assemble if sign is */
-						/* zero */
-	set	%r11, %r11, 1<sign>		/* make result negative */
-exassems:
-	br	Ureturn
-
-doubassem:
-	bb0.n	sign, %r10, signclr		/* do not set sign in r10 */
-	 or	%r10, %r5,  %r0			/* load high word from r5 */
-						/* into r10 */
-	set	%r10, %r10, 1<sign>		/* high word with sign loaded */
-signclr:
-	/* FALLTHROUGH */
-	/* br	Ureturn */
-
-/* Return to fpui. */
-Ureturn:
-	ld	%r1,  %r31, 0			/* load return address */
-	jmp	%r1
-
-/*
- * FPoverflow
- */
-
-ASLOCAL(FPoverflow)
-	st	%r1,  %r31, 0			/* save return address */
-	set	%r2,  %r2,  1<overflow>
-	set	%r2,  %r2,  1<inexact>
-
-/* Determine which rounding mode to use for the default procedure. */
-
-	bb1	modehi, %r10, signed		/* mode is either round */
-						/* toward pos. or neg. */
-	bb0	modelo, %r10, OFnearest		/* rounding mode is round */
-						/* nearest */
-	br	OFzero				/* rounding mode is round */
-						/* zero */
-signed:
-	bb0	modelo, %r10, OFnegative	/* rounding mode is round */
-						/* negative */
-	br	positive			/* rounding mode is round */
-						/* positive */
-
-/*
- * In the round toward nearest mode, positive values are rounded to
- * positive infinity and negative values are rounded to negative infinity.
- * The value for single or double precision is built from immediate constants.
- */
-
-OFnearest:
-	bb1.n	destsize, %r12, neardouble	/* branch to neardouble if */
-						/* double result */
-	 mask.u	%r5,  %r10, 0x8000		/* r5 = only the sign bit of */
-						/* MANTHI (delay slot) */
-	or.u	%r11, %r0,  %hi16(0x7f800000)	/* load single infinity */
-						/* constant */
-	or	%r11, %r11, %lo16(0x7f800000)
-	br.n	FPof_return			/* return with result */
-	 or	%r11, %r5,  %r11		/* adjust sign */
-neardouble:
-	or	%r11, %r0,  %r0			/* load lower word of double */
-						/* infinity */
-	or.u	%r10, %r0,  %hi16(0x7ff00000)	/* load upper word of double */
-						/* infinity */
-	or	%r10, %r10, %lo16(0x7ff00000)
-	br.n	FPof_return			/* return with result */
-	 or	%r10, %r5,  %r10		/* adjust sign */
-
-/*
- * In the round toward zero mode, positive values are rounded to the largest
- * positive finite number and negative values are rounded to the negative
- * finite number of largest magnitude.
- * The value for single or double precision is built from immediate constants.
- */
-
-OFzero:
-	bb1.n	destsize, %r12, zerodouble	/* branch to zerodouble of */
-						/* double result */
-	 mask.u	%r5,  %r10, 0x8000		/* mask off sign bit from */
-						/* MANTHI */
-	or.u	%r11, %r0,  %hi16(0x7f7fffff)	/* load single finite number */
-						/* constant */
-	or	%r11, %r11, %lo16(0x7f7fffff)
-	br.n	FPof_return			/* return with result */
-	 or	%r11, %r5,  %r11		/* adjust sign */
-zerodouble:
-	set	%r11, %r0,  0<0>		/* load lower word of double */
-						/* finite number */
-	or.u	%r10, %r0,  %hi16(0x7fefffff)	/* load upper word of double */
-						/* finite number */
-	or	%r10, %r10, %lo16(0x7fefffff)
-	br.n	FPof_return			/* return with result */
-	 or	%r10, %r5,  %r10		/* adjust sign */
-
-/*
- * In the round toward positive mode, positive values are rounded to
- * positive infinity and negative values are rounded to the negative
- * finite number of largest magnitude.
- * The value for single or double precision is built from immediate constants.
- */
-
-positive:
-	bb1	destsize, %r12, posdouble	/* branch to section for */
-						/* double result */
-possingle:
-	bb1	sign, %r10, possingleneg	/* branch to section for */
-						/* negatives */
-possinglepos:
-	or.u	%r11, %r0,  %hi16(0x7f800000)	/* load single infinity */
-						/* constant */
-	br.n	FPof_return			/* return with result */
-	 or	%r11, %r11, %lo16(0x7f800000)
-possingleneg:
-	or.u	%r11, %r0,  %hi16(0x7f7fffff)	/* load single finite number */
-						/* constant */
-	or	%r11, %r11, %lo16(0x7f7fffff)
-	br.n	FPof_return			/* return with result */
-	 set	%r11, %r11, 1<sign>		/* set sign for negative */
-posdouble:
-	bb1	sign, %r10, posdoubleneg	/* branch to negative double */
-						/* results */
-posdoublepos:
-	or	%r11, %r0,  %r0			/* load lower word of double */
-						/* infinity */
-	or.u	%r10, %r0,  %hi16(0x7ff00000)	/* load upper word of double */
-						/* infinity */
-	br.n	FPof_return			/* return with result */
-	 or	%r10, %r10, %lo16(0x7ff00000)
-posdoubleneg:
-	set	%r11, %r0,  0<0>		/* load lower word of finite */
-						/* number */
-	or.u	%r10, %r0,  %hi16(0x7fefffff)	/* load upper word of finite */
-						/* number */
-	or	%r10, %r10, %lo16(0x7fefffff)
-	br.n	FPof_return			/* return with result */
-	 set	%r10, %r10, 1<sign>		/* set sign for negative */
-
-/*
- * In the round toward negative mode, positive values are rounded to the
- * largest positive finite number and negative values are rounded to negative
- * infinity.
- * The value for single or double precision is built from immediate constants.
- */
-
-OFnegative:
-	bb1	destsize, %r12, negdouble	/* branch to section for */
-						/* double result */
-negsingle:
-	bb1	sign, %r10, negsingleneg	/* branch to section for */
-						/* negatives */
-negsinglepos:
-	or.u	%r11, %r0,  %hi16(0x7f7fffff)	/* load single finite number */
-						/* constant */
-	br.n	FPof_return			/* return with result */
-	 or	%r11, %r11, %lo16(0x7f7fffff)
-negsingleneg:
-	or.u	%r11, %r0,  %hi16(0x7f800000)	/* load single infinity */
-						/* constant */
-	or	%r11, %r11, %lo16(0x7f800000)
-	br.n	FPof_return			/* return with result */
-	 set	%r11, %r11, 1<sign>		/* set sign for negative */
-negdouble:
-	bb1	sign, %r10, negdoubleneg	/* branch to negative double */
-						/* results */
-negdoublepos:
-	set	%r11, %r0,  0<0>		/* load lower word of finite */
-						/* number */
-	or.u	%r10, %r0,  %hi16(0x7fefffff)	/* load upper word of finite */
-						/* number */
-	br.n	FPof_return			/* return with result */
-	 or	%r10, %r10, %lo16(0x7fefffff)
-negdoubleneg:
-	or	%r11, %r0,  %r0			/* load lower word of double */
-						/* infinity */
-	or.u	%r10, %r0,  %hi16(0x7ff00000)	/* load upper word of double */
-						/* infinity */
-	or	%r10, %r10, %lo16(0x7ff00000)
-	set	%r10, %r10, 1<sign>		/* set sign for negative */
-
-FPof_return:
-	ld	%r1,  %r31, 0			/* load return address */
-	jmp	%r1
-
-/*
  * If either S1 or S2 is a signalling NaN, then set the invalid operation
  * bit of the FPSR.
  * If S1 is the only NaN or one of two NaN''s, then write
@@ -2635,62 +1814,3 @@ S2noinfd:
 						/* been, so return */
 operation:
 	jmp	%r1
-
-ENTRY(m88100_fpu_imprecise_exception)
-	or	%r29, %r2,  %r0			/* r29 is now the E.F. */
-	subu	%r31, %r31, 16
-	st	%r1,  %r31, 4
-	st	%r29, %r31, 8
-
-	ld	%r2 , %r29, EF_FPSR
-	ld	%r3 , %r29, EF_FPCR
-	ld	%r4 , %r29, EF_FPECR
-	ld	%r10, %r29, EF_FPRH
-	ld	%r11, %r29, EF_FPRL
-	ld	%r12, %r29, EF_FPIT
-
-/*
- * Load into r1 the return address for the exception handlers. Looking
- * at FPECR, branch to the appropriate exception handler.
- */
-
-	or.u	%r1,  %r0,  %hi16(fpui_wrapup)	/* load return address of */
-	or	%r1,  %r1,  %lo16(fpui_wrapup)	/* functions */
-
-	bb0	2,    %r4,  2f			/* branch to FPunderflow if */
-	br	_ASM_LABEL(FPunderflow)		/* bit set */
-2:
-	bb0	1,    %r4,  3f			/* branch to FPoverflow if */
-	br	_ASM_LABEL(FPoverflow)		/* bit set */
-3:
-	/* XXX handle inexact!!! */
-
-fpui_wrapup:
-	FLUSH_PIPELINE				/* make sure all floating */
-						/* point operations have */
-						/* finished */
-	ldcr	%r4,  %cr1			/* load the PSR */
-#if 0
-	set	%r4,  %r4,  1<PSR_FPU_DISABLE_BIT>
-#endif
-	set	%r4,  %r4,  1<PSR_INTERRUPT_DISABLE_BIT>
-	stcr	%r4,  %cr1
-	ld	%r1,  %r31, 4
-	ld	%r29, %r31, 8
-	addu	%r31, %r31, 16
-
-	fstcr	%r2, FPSR		/* write revised value of FPSR... */
-	fstcr	%r3, FPCR		/* ...and FPCR... */
-	st	%r2, %r29, EF_FPSR	/* ...into the trapframe as well */
-	st	%r3, %r29, EF_FPCR
-
-	/* write back the results */
-	extu	%r2,  %r12, 5<0>
-	bb0.n	destsize, %r12, Iwritesingle
-	 addu	%r3,  %r29, EF_R0
-	st	%r10, %r3[%r2]
-	addu	%r2,  %r2,  1
-	clr	%r2,  %r2,  27<5>
-Iwritesingle:
-	jmp.n	%r1
-	 st	%r11, %r3[%r2]
diff --git a/sys/arch/m88k/m88k/m88100_fp_imp.S b/sys/arch/m88k/m88k/m88100_fp_imp.S
new file mode 100644
index 00000000000..ae5fb770a11
--- /dev/null
+++ b/sys/arch/m88k/m88k/m88100_fp_imp.S
@@ -0,0 +1,918 @@
+/* $OpenBSD: m88100_fp_imp.S,v 1.1 2014/06/09 10:26:10 miod Exp $	*/
+/*
+ * Mach Operating System
+ * Copyright (c) 1991 Carnegie Mellon University
+ * Copyright (c) 1991 OMRON Corporation
+ * All Rights Reserved.
+ *
+ * Permission to use, copy, modify and distribute this software and its
+ * documentation is hereby granted, provided that both the copyright
+ * notice and this permission notice appear in all copies of the
+ * software, derivative works or modified versions, and any portions
+ * thereof, and that both notices appear in supporting documentation.
+ *
+ * CARNEGIE MELLON AND OMRON ALLOW FREE USE OF THIS SOFTWARE IN ITS "AS IS"
+ * CONDITION.  CARNEGIE MELLON AND OMRON DISCLAIM ANY LIABILITY OF ANY KIND
+ * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
+ *
+ * Carnegie Mellon requests users of this software to return to
+ *
+ *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
+ *  School of Computer Science
+ *  Carnegie Mellon University
+ *  Pittsburgh PA 15213-3890
+ *
+ * any improvements or extensions that they make and grant Carnegie the
+ * rights to redistribute these changes.
+ */
+
+/* Floating point trouble routines */
+#include "assym.h"
+#include <machine/asm.h>
+
+#define destsize 10
+
+/* Floating-Point Status Register bits */
+#define inexact		0
+#define overflow	1
+#define underflow	2
+
+#define sign		31
+
+#define modehi		30
+#define modelo		29
+
+/*
+ * Branch to the routine to make a denormalized number.
+ */
+ASLOCAL(FPunderflow)
+	st	%r1, %r31, 0	/* save return address */
+	set	%r2, %r2,  1<underflow>
+	set	%r2, %r2,  1<inexact>
+
+/*
+ * Now the floating point number, which has an exponent smaller than what
+ * IEEE allows, must be denormalized. Denormalization is done by calculating
+ * the difference between a denormalized exponent and an underflow exponent
+ * and shifting the mantissa by that amount. A one may need to be subtracted
+ * from the LSB if a one was added during rounding.
+ * %r9 is used to contain the guard, round, sticky, and an inaccuracy bit in
+ * case some bits were shifted off the mantissa during denormalization.
+ * %r9 will contain:
+ *   bit 4 -- new addone if one added during rounding after denormalization
+ *   bit 3 -- inaccuracy flag caused by denormalization or pre-denormalization
+ *            inexactness
+ *   bit 2 -- guard bit of result
+ *   bit 1 -- round bit of result
+ *   bit 0 -- sticky bit of result
+ */
+
+FPU_denorm:
+	bb1.n	destsize, %r12, Udouble	/* denorm for double */
+	 extu	%r9,  %r10, 3<26>	/* load r9 with grs */
+Usingle:
+	mak	%r5,  %r10, 21<3>	/* extract high 21 bits of mantissa */
+	extu	%r6,  %r11, 3<29>	/* extract low 3 bits of mantissa */
+	or	%r11, %r5,  %r6		/* form 24 bits of mantissa */
+
+/* See if the addone bit is set and unround if it is. */
+	bb0.n	25,   %r10, nounrounds	/* do not unround if addone bit clear */
+	 extu	%r6,  %r12, 12<20>	/* extract signed exponent from IMPCR */
+unrounds:
+	subu	%r11, %r11, 1		/* subtract 1 from mantissa */
+
+/*
+ * If the hidden bit is cleared after subtracting the one, then the one added
+ * during the rounding must have propagated through the mantissa. The exponent
+ * will need to be decremented.
+ */
+	bb1	23,   %r11, nounrounds	/* if hidden bit is set, the exponent */
+					/* does not need to be decremented */
+decexps:
+	sub	%r6,  %r6,  1		/* decrement exponent */
+	set	%r11, %r11, 1<23>	/* set the hidden bit */
+
+/*
+ * For both single and double precision, there are cases where it is easier
+ * and quicker to make a special case. Examples of this are if the shift
+ * amount is only 1 or 2, or all the mantissa is shifted off, or all the
+ * mantissa is shifted off and it is still shifting, or, in the case of
+ * doubles, if the shift amount is around the boundary of MANTLO and MANTHI.
+ */
+
+nounrounds:
+	or	%r8,  %r0,  %lo16(0x00000f81)
+					/* load r8 with -127 in decimal */
+					/* for lowest 12 bits */
+	sub	%r7,  %r8,  %r6		/* find difference between two */
+					/* exponents, this amount is the */
+					/* shift amount */
+	cmp	%r6,  %r7,  3		/* check to see if r7 contains 3 */
+					/* or more */
+	bb1	ge,   %r6,  threesing	/* br to code that handles shifts of */
+					/* 3 or more */
+	cmp	%r6,  %r7,  2		/* check to see if r7 contains 2 */
+	bb1	eq,   %r6,  twosing	/* br to code that handles shifts of */
+					/* 2 */
+one:
+	rot	%r9,  %r9,  0<1>	/* rotate roundoff register once, */
+					/* this places guard in round and */
+					/* round in sticky */
+	bb0	31,   %r9,  nosticky1s	/* do not or round and sticky if */
+					/* sticky is 0, this lost bit will */
+					/* be cleared later */
+	set	%r9,  %r9,  1<0>	/* or round and sticky */
+nosticky1s:
+	bb0	0,    %r11, guardclr1s	/* do not set guard bit if LSB = 0 */
+	set	%r9,  %r9,  1<2>	/* set guard bit */
+guardclr1s:
+	extu	%r11, %r11, 31<1>	/* shift mantissa right 1 */
+	br.n	round			/* round result */
+	 mak	%r9,  %r9,  3<0>	/* clear bits lost during rotation */
+
+twosing:
+	rot	%r9,  %r9,  0<2>	/* rotate roundoff register twice, */
+					/* this places guard in sticky */
+	bb0	30,   %r9,  nosticky2s	/* bit 30 now holds the old sticky; */
+					/* if it is 0 go look at old round, */
+					/* the lost bit is cleared later */
+	br.n	noround2s		/* old sticky set, no need to look */
+					/* at old round */
+	 set	%r9,  %r9,  1<0>	/* or old sticky into new sticky */
+nosticky2s:
+	bb0	31,   %r9,  noround2s	/* bit 31 now holds the old round; */
+					/* if it is 0 leave new sticky as is, */
+					/* the lost bit is cleared later */
+	set	%r9,  %r9,  1<0>	/* or old round into new sticky */
+noround2s:
+	bb0	0,    %r11, roundclr2s	/* do not set round bit if LSB = 0 */
+	set	%r9,  %r9,  1<1>	/* set round bit */
+roundclr2s:
+	bb0	1,    %r11, guardclr2s	/* do not set guard bit if LSB+1 = 0 */
+	set	%r9,  %r9,  1<2>	/* set guard bit */
+guardclr2s:
+	extu	%r11, %r11, 30<2>	/* shift mantissa right 2 */
+	br.n	round			/* round result */
+	 mak	%r9,  %r9,  3<0>	/* keep only g/r/s, clearing the bits */
+
+threesing:
+	bb1	0,    %r9,  noguard3s	/* old sticky already set, nothing */
+					/* more to or in; NOTE(review): old */
+					/* guard/round stay set - confirm */
+nosticky3s:
+	bb0	1,    %r9,  noround3s	/* old round clear, go check the old */
+					/* guard */
+	br.n	noguard3s		/* old round set, skip the guard test */
+	 set	%r9,  %r9,  1<0>	/* delay slot: fold old round into */
+					/* sticky */
+noround3s:
+	bb0.n	2,    %r9,  noguard3s	/* old guard clear, sticky stays */
+					/* clear */
+	 clr	%r9,  %r9,  2<1>	/* delay slot: clear the original */
+					/* guard and round for the round code */
+	set	%r9,  %r9,  1<0>	/* old guard was set, fold it into */
+					/* sticky */
+noguard3s:
+	cmp	%r6,  %r7,  23		/* check if # of shifts is <=23 */
+	bb1	gt,   %r6,  s24		/* branch to see if shifts = 24 */
+	sub	%r6,  %r7,  2		/* get number of bits to check for */
+					/* sticky */
+	mak	%r6,  %r6,  5<5>	/* shift width into width field */
+	mak	%r8,  %r11, %r6		/* keep the low (shift - 2) bits */
+	ff1	%r8,  %r8		/* see if r8 has any ones */
+	bb1	5,    %r8,  nostky23	/* do not set sticky if no ones found */
+	set	%r9,  %r9,  1<0>	/* set sticky bit */
+nostky23:
+	or	%r8,  %r0,  0x22	/* start code to get new mantissa */
+					/* plus two extra bits for new round */
+					/* and new guard bits */
+	subu	%r8,  %r8,  %r7		/* field width = 34 - shift count */
+	mak	%r8,  %r8,  5<5>	/* shift field width into second five */
+					/* bits */
+	extu	%r6,  %r6,  5<5>	/* move (shift - 2) back down into */
+					/* the offset field */
+	or	%r6,  %r6,  %r8		/* complete field */
+	extu	%r11, %r11, %r6		/* form new mantissa with two extra */
+					/* bits */
+
+	bb0	0,    %r11, nornd3s	/* do not set new round bit */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+nornd3s:
+	bb0	1,    %r11, nogrd3s	/* do not set new guard bit */
+	set	%r9,  %r9,  1<2>	/* set new guard bit */
+nogrd3s:
+	br.n	round			/* round mantissa */
+	 extu	%r11, %r11, 30<2>	/* shift off remaining two bits */
+
+s24:
+	cmp	%r6,  %r7,  24		/* check to see if # of shifts is 24 */
+	bb1	gt,   %r6,  s25		/* branch to see if shifts = 25 */
+	bb1	0,    %r9,  nostky24	/* skip checking if old sticky set */
+	extu	%r8,  %r11, 22<0>	/* prepare to check bits that will be */
+					/* shifted into the sticky */
+	ff1	%r8,  %r8		/* see if there are any 1''s */
+	bb1	5,    %r8,  nostky24	/* do not set sticky if no ones found */
+	set	%r9,  %r9,  1<0>	/* set sticky bit */
+nostky24:
+	bb0	22,   %r11, nornd24	/* do not set new round bit */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+nornd24:
+	set	%r9,  %r9,  1<2>	/* set new guard bit, this is hidden */
+					/* bit */
+	br.n	round			/* round mantissa */
+	 or	%r11, %r0,  %r0		/* clear r11, all of mantissa */
+					/* shifted off */
+
+s25:
+	cmp	%r6,  %r7,  25		/* check to see if # of shifts is 25 */
+	bb1	gt,   %r6,  s26		/* branch to execute for shifts >= 26 */
+	bb1	0,    %r9,  nostky25	/* skip checking if old sticky set */
+	extu	%r8,  %r11, 23<0>	/* low 23 bits of the mantissa all */
+					/* shift into the sticky */
+	ff1	%r8,  %r8		/* see if there are any 1''s */
+	bb1	5,    %r8,  nostky25	/* do not set sticky if no ones found */
+	set	%r9,  %r9,  1<0>	/* set sticky bit */
+nostky25:
+	set	%r9,  %r9,  1<1>	/* set new round bit, this is hidden */
+					/* bit */
+	clr	%r9,  %r9,  1<2>	/* clear guard bit since nothing */
+					/* shifted in */
+	br.n	round			/* round and assemble result */
+	 or	%r11, %r0,  %r0		/* clear r11, all of mantissa */
+					/* shifted off */
+
+s26:
+	set	%r9,  %r9,  1<0>	/* set sticky bit, this contains */
+					/* hidden bit */
+	clr	%r9,  %r9,  2<1>	/* clear guard and round bits since */
+					/* nothing shifted in */
+	br.n	round			/* round and assemble result */
+	 or	%r11, %r0,  %r0		/* clear mantissa */
+
+Udouble:
+	mak	%r5,  %r10, 21<0>	/* extract upper bits of mantissa */
+	bb0.n	25,   %r10, nounroundd	/* do not unround if addone bit clear */
+	 extu	%r6,  %r12, 12<20>	/* extract signed exponent from IMPCR */
+unroundd:
+	or	%r8,  %r0,  1		/* r8 = 1 so subu.co can be used */
+	subu.co	%r11, %r11, %r8		/* subtract 1 from mantissa */
+	subu.ci	%r5,  %r5,  %r0		/* subtract borrow from upper word */
+	bb1	20,   %r5,  nounroundd	/* if hidden bit is set, then */
+					/* exponent does not need to be */
+					/* decremented */
+decexpd:
+	sub	%r6,  %r6,  1		/* decrement exponent */
+	set	%r5,  %r5,  1<20>	/* set the hidden bit */
+
+nounroundd:
+	or	%r8,  %r0,  %lo16(0x00000c01)
+					/* load r8 with -1023 in decimal */
+					/* for lowest 12 bits */
+	sub	%r7,  %r8,  %r6		/* find difference between two */
+					/* exponents, this amount is the */
+					/* shift amount */
+	cmp	%r6,  %r7,  3		/* check to see if r7 contains */
+					/* 3 or more */
+	bb1	ge,   %r6,  threedoub	/* br to code that handles shifts of */
+					/* 3 or more */
+	cmp	%r6,  %r7,  2		/* check to see if r7 contains 2 */
+	bb1	eq,   %r6,  twodoub	/* br to code that handles shifts */
+					/* of 2 */
+
+onedoub:
+	rot	%r9,  %r9,  0<1>	/* rotate roundoff register once, */
+					/* this places guard in round and */
+					/* round in sticky */
+	bb0	31,   %r9,  nosticky1d	/* do not or round and sticky if */
+					/* sticky is 0, this lost bit */
+					/* will be cleared later */
+	set	%r9,  %r9,  1<0>	/* or old round and old sticky into */
+					/* new sticky */
+nosticky1d:
+	bb0	0,    %r11, guardclr1d	/* do not set new guard bit */
+					/* if old LSB = 0 */
+	set	%r9,  %r9,  1<2>	/* set new guard bit */
+guardclr1d:
+	extu	%r11, %r11, 31<1>	/* shift lower mantissa over 1 */
+	mak	%r6,  %r5,  1<31>	/* shift off low bit of high mantissa */
+	or	%r11, %r6,  %r11	/* load high bit onto lower mantissa */
+	extu	%r5,  %r5,  20<1>	/* shift right once upper 20 bits of */
+					/* mantissa */
+	br.n	round			/* round mantissa and assemble result */
+	 mak	%r9,  %r9,  3<0>	/* clear bits lost during rotation */
+
+twodoub:
+	rot	%r9,  %r9,  0<2>	/* rotate roundoff register twice, */
+					/* this places old guard into sticky */
+	bb0	30,   %r9,  nosticky2d	/* do not or old guard and old sticky */
+					/* if old sticky is 0 */
+	br.n	noround2d		/* skip or of old guard and old round */
+					/* if old sticky set */
+	 set	%r9,  %r9,  1<0>	/* or old guard and old sticky into */
+					/* new sticky */
+nosticky2d:
+	bb0	31,   %r9,  noround2d	/* do not or old guard and old round */
+					/* if old round is 0 */
+	set	%r9,  %r9,  1<0>	/* or old guard and old round into */
+					/* new sticky */
+noround2d:
+	bb0	0,    %r11, roundclr2d	/* do not set round bit */
+					/* if old LSB = 0 */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+roundclr2d:
+	bb0	1,    %r11, guardclr2d	/* do not set guard bit */
+					/* if old LSB + 1 = 0 */
+	set	%r9,  %r9,  1<2>	/* set new guard bit */
+guardclr2d:
+	extu	%r11, %r11, 30<2>	/* shift lower mantissa over 2 */
+	mak	%r6,  %r5,  2<30>	/* shift off low bits of high */
+					/* mantissa */
+	or	%r11, %r6,  %r11	/* load high bit onto lower mantissa */
+	extu	%r5,  %r5,  19<2>	/* shift right twice upper 19 bits of */
+					/* mantissa */
+	br.n	round			/* round mantissa and assemble result */
+	 mak	%r9,  %r9,  3<0>	/* clear bits lost during rotation */
+
+threedoub:
+	bb1	0,    %r9,  noguard3d	/* check sticky initially */
+					/* sticky is set, forget most of */
+					/* rest of oring */
+nosticky3d:
+	bb0	1,    %r9,  noround3d	/* check old round; if it is clear */
+					/* go check the old guard, otherwise */
+					/* sticky gets set below */
+	br.n	noguard3d		/* sticky is set, forget most of */
+					/* rest of oring */
+	 set	%r9,  %r9,  1<0>	/* set sticky if old round is set */
+noround3d:
+	bb0	2,    %r9,  noguard3d	/* check old guard, do not set sticky */
+					/* if 0 */
+	clr	%r9,  %r9,  2<1>	/* clear the original guard and round */
+					/* for when you get to round section */
+	set	%r9,  %r9,  1<0>	/* set sticky if old guard is set */
+noguard3d:
+	cmp	%r6,  %r7,  32		/* do I need to work with a 1 or 2 */
+					/* word mantissa when forming sticky, */
+					/* round and guard */
+	bb1	gt,   %r6,  d33		/* jump to code that handles 2 word */
+					/* mantissas */
+	sub	%r6,  %r7,  2		/* get number of bits to check for */
+					/* sticky */
+	mak	%r6,  %r6,  5<5>	/* shift width into width field */
+	mak	%r8,  %r11, %r6		/* mask off shifted bits -2 */
+	ff1	%r8,  %r8		/* see if r8 has any ones */
+	bb1	5,    %r8,  nostky32	/* do not set sticky if no ones found */
+	set	%r9,  %r9,  1<0>	/* set sticky bit */
+nostky32:
+	or	%r8,  %r0,  0x22	/* start code to get new mantissa */
+					/* plus two extra bits for new round */
+					/* and new guard bits, the upper word */
+					/* bits will be shifted after the */
+					/* round and guard bits are handled */
+	subu	%r8,  %r8,  %r7
+	mak	%r8,  %r8,  5<5>	/* shift field width into second five */
+					/* bits */
+	extu	%r6,  %r6,  5<5>	/* shift previous shifted -2 into */
+					/* offset field */
+	or	%r6,  %r6,  %r8		/* complete bit field */
+	extu	%r11, %r11, %r6		/* partially form new low mantissa */
+					/* with 2 more bits */
+	bb0	0,    %r11, nornd32d	/* do not set new round bit */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+nornd32d:
+	bb0	1,    %r11, nogrd32d	/* do not set new guard bit */
+	set	%r9,  %r9,  1<2>	/* set new guard bit */
+nogrd32d:
+	extu	%r11, %r11, 30<2>	/* shift off remaining two bits */
+	mak	%r6,  %r7,  5<5>	/* shift field width into second 5 */
+					/* bits, if the width is 32, then */
+					/* these bits will be 0 */
+	or	%r8,  %r0,  32		/* load word length into r8 */
+	sub	%r8,  %r8,  %r7		/* form offset for high bits moved to */
+					/* low word */
+	or	%r6,  %r6,  %r8		/* form complete bit field */
+	mak	%r6,  %r5,  %r6		/* get shifted bits of high word */
+	or	%r11, %r6,  %r11	/* form new low word of mantissa */
+	bcnd	ne0,  %r8,  regular33	/* do not adjust for special case */
+					/* of r8 containing zeros, which */
+	br.n	round			/* would cause all of the bits to be */
+	 or	%r5,  %r0,  %r0		/* extracted under the regular method */
+regular33:
+	mak	%r6,  %r7,  5<0>	/* place lower 5 bits of shift */
+					/* into r6 */
+	mak	%r8,  %r8,  5<5>	/* shift r8 into width field */
+	or	%r6,  %r6,  %r8		/* form field for shifting of upper */
+					/* bits */
+	br.n	round			/* round and assemble result */
+	 extu	%r5,  %r5,  %r6		/* form new high word mantissa */
+
+d33:
+	cmp	%r6,  %r7,  33		/* shift count of exactly 33: the low */
+					/* word is lost, r5 moves down by 1 */
+	bb1	gt,   %r6,  d34		/* more than 33, try 34 and above */
+	bb1	0,    %r9,  nostky33	/* skip checking if old sticky set */
+	mak	%r6,  %r11, 31<0>	/* r6 = low 31 bits of r11, all of */
+					/* which shift into sticky */
+	ff1	%r8,  %r6		/* scan the masked bits in r6 for ones */
+	bb1	5,    %r8,  nostky33	/* do not set sticky if there are no */
+					/* ones */
+	set	%r9,  %r9,  1<0>	/* set new sticky bit */
+nostky33:
+	bb0	31,   %r11, nornd33	/* top bit of r11 is the new round */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+nornd33:
+	bb0	0,    %r5,  nogrd33	/* low bit of r5 is the new guard */
+					/* bit */
+	set	%r9,  %r9,  1<2>	/* set new guard bit */
+nogrd33:
+	extu	%r11, %r5,  31<1>	/* shift high bits into low word */
+	br.n	round			/* round and assemble result */
+	 or	%r5,  %r0,  %r0		/* clear high word */
+
+d34:
+	cmp	%r6,  %r7,  34		/* is the number of bits to be */
+					/* shifted 34? */
+	bb1	gt,   %r6,  d35		/* check to see if # of bits is >= 35 */
+	bb1	0,    %r9,  nostky34	/* skip checking if old sticky set */
+	ff1	%r8,  %r11		/* check bits that will be shifted */
+					/* into sticky */
+	bb1	5,    %r8,  nostky34	/* do not set sticky if there are no */
+					/* ones */
+	set	%r9,  %r9,  1<0>	/* set new sticky bit */
+nostky34:
+	bb0	0,    %r5,  nornd34	/* do not set round if bit is not a 1 */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+nornd34:
+	bb0	1,    %r5,  nogrd34	/* do not set guard bit if bit is not */
+					/* a 1 */
+	set	%r9,  %r9,  1<2>	/* set new guard bit */
+nogrd34:
+	extu	%r11, %r5,  30<2>	/* shift high bits into low word */
+	br.n	round			/* round and assemble result */
+	 or	%r5,  %r0,  %r0		/* clear high word */
+
+d35:
+	cmp	%r6,  %r7,  52		/* see if # of shifts is */
+					/* 35 <= X <= 52 */
+	bb1	gt,   %r6,  d53		/* more than 52, see if it is 53 */
+	bb1.n	0,    %r9,  nostky35	/* skip checking if old sticky set */
+	 sub	%r7,  %r7,  34		/* subtract 32 from # of shifts */
+					/* so that operations can be done on */
+					/* the upper word, and then subtract */
+					/* two more to keep the new round */
+					/* and guard bits */
+	ff1	%r8,  %r11		/* see if lower word has a bit for */
+					/* sticky */
+	bb1	5,    %r8,  stkycheck35 /* no ones in lower word, see if */
+					/* upper word has any sticky bits */
+	br.n	nostky35		/* quit checking for sticky */
+	 set	%r9,  %r9,  1<0>	/* set sticky bit */
+stkycheck35:
+	mak	%r6,  %r7,  5<5>	/* place width into width field */
+	mak	%r8,  %r5,  %r6		/* mask off shifted bits - 2 */
+	ff1	%r8,  %r8		/* see if r8 has any ones */
+	bb1	5,    %r8,  nostky35	/* do not set sticky if no ones found */
+	set	%r9,  %r9,  1<0>	/* set sticky bit */
+nostky35:
+	or	%r8,  %r0,  32		/* look at what does not get shifted */
+					/* off plus new guard and round, */
+					/* remember that the r7 value was */
+					/* adjusted so that it did not */
+					/* include new guard or new round in */
+					/* shifted off bits */
+	subu	%r8,  %r8,  %r7		/* complement width */
+	mak	%r8,  %r8,  5<5>	/* shift width into width field */
+	or	%r8,  %r7,  %r8		/* add offset field */
+	extu	%r11, %r5,  %r8		/* extract upper bits into low word */
+	bb0	0,    %r11, nornd35	/* do not set new round bit */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+nornd35:
+	bb0	1,    %r11, nogrd35	/* do not set new guard bit */
+	set	%r9,  %r9,  1<2>	/* set new guard bit */
+nogrd35:
+	extu	%r11, %r11, 30<2>	/* shift off remaining guard and round bits */
+	br.n	round			/* round and assemble result */
+	 or	%r5,  %r0,  %r0		/* clear high word */
+
+d53:
+	cmp	%r6,  %r7,  53		/* check to see if # of shifts is 53 */
+	bb1	gt,   %r6,  d54		/* branch to see if shifts = 54 */
+	bb1	0,    %r9,  nostky53	/* skip checking if old sticky set */
+	ff1	%r8,  %r11		/* see if lower word has a bit for */
+					/* sticky */
+	bb1	5,    %r8,  stkycheck53 /* see if upper word has any sticky */
+					/* bits */
+	br.n	nostky53		/* quit checking for sticky */
+	 set	%r9,  %r9,  1<0>	/* set sticky bit */
+stkycheck53:
+	mak	%r6,  %r5,  19<0>	/* check bits that are shifted into */
+					/* sticky */
+	ff1	%r8,  %r6		/* see if r6 has any ones */
+	bb1	5,    %r8,  nostky53	/* do not set sticky if no ones found */
+	set	%r9,  %r9,  1<0>	/* set sticky bit */
+nostky53:
+	bb0	19,   %r5,  nornd53	/* do not set new round bit */
+	set	%r9,  %r9,  1<1>	/* set new round bit */
+nornd53:
+	set	%r9,  %r9,  1<2>	/* set new guard bit, this is hidden */
+					/* bit */
+	or	%r5,  %r0,  %r0		/* clear high word */
+	br.n	round			/* round and assemble result */
+	 or	%r11, %r0,  %r0		/* clear low word */
+
+d54:
+	cmp	%r6,  %r7,  54		/* check to see if # of shifts is 54 */
+	bb1	gt,   %r6,  d55		/* branch to execute for shifts >= 55 */
+	bb1	0,    %r9,  nostky54	/* skip checking if old sticky set */
+	ff1	%r8,  %r11		/* see if lower word has a bit for */
+					/* sticky */
+	bb1	5,    %r8,  stkycheck54 /* no ones in lower word, see if */
+					/* upper word has any sticky bits */
+	br.n	nostky54		/* quit checking for sticky */
+	 set	%r9,  %r9,  1<0>	/* set sticky bit */
+stkycheck54:
+	mak	%r6,  %r5,  20<0>	/* low 20 bits of the high word are */
+					/* shifted into sticky */
+	ff1	%r8,  %r6		/* see if r6 has any ones */
+	bb1	5,    %r8,  nostky54	/* do not set sticky if no ones found */
+	set	%r9,  %r9,  1<0>	/* set sticky bit */
+nostky54:
+	set	%r9,  %r9,  1<1>	/* set new round bit, this is hidden */
+					/* bit */
+	clr	%r9,  %r9,  1<2>	/* clear guard bit since nothing */
+					/* shifted in */
+	or	%r5,  %r0,  %r0		/* clear high word */
+	br.n	round			/* round and assemble result */
+	 or	%r11, %r0,  %r0		/* clear low word */
+
+d55:
+	set	%r9,  %r9,  1<0>	/* set new sticky bit, this contains */
+					/* hidden bit */
+	clr	%r9,  %r9,  2<1>	/* clear guard and round bits since */
+					/* nothing shifted in */
+	or	%r5,  %r0,  %r0		/* clear high word */
+	or	%r11, %r0,  %r0		/* clear low word */
+
+
+/*
+ * The first thing the rounding code does is check whether guard, round,
+ * or sticky is set. If all are clear, there is no denormalization loss
+ * and no need to round, so branch straight to assembling the answer.
+ * For rounding, a branch table is used. The two most significant bits of
+ * the table index are the rounding mode. The next bit is either the LSB
+ * of the mantissa or the sign bit, depending on the rounding mode. The
+ * three low bits are the guard, round and sticky bits.
+ */
+
+round:
+	ff1	%r8,  %r9		/* see if there is denormalization */
+					/* loss */
+	bb1	5,    %r8,  assemble	/* no denormalization loss or */
+					/* inexactness */
+	extu	%r6,  %r10, 2<modelo>	/* extract rounding mode */
+	bb1.n	modehi, %r10, signext	/* use sign bit instead of LSB */
+	 mak	%r6,  %r6,  2<4>	/* shift over rounding mode */
+	extu	%r7,  %r11, 1<0>	/* extract LSB */
+	br.n	grs			/* skip sign extraction */
+	 mak	%r7,  %r7,  1<3>	/* shift over LSB */
+signext:
+	extu	%r7,  %r10, 1<31>	/* extract sign bit */
+	mak	%r7,  %r7,  1<3>	/* shift sign bit over */
+grs:
+	or	%r6,  %r6,  %r7
+	or	%r6,  %r6,  %r9		/* or in guard, round, and sticky */
+	or.u	%r1,  %r0,  %hi16(roundtable) /* form address of branch table */
+	or	%r1,  %r1,  %lo16(roundtable)
+	lda	%r6,  %r1[%r6]		/* scale offset into branch table */
+	jmp.n	%r6			/* jump to branch table */
+	 set	%r9,  %r9,  1<3>	/* set inexact flag in r9 */
+
+roundtable:
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	addone
+	br	addone
+	br	addone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	noaddone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	addone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+	br	noaddone
+
+/* Round by adding a one to the LSB of the mantissa. */
+addone:
+	or	%r6,  %r0,  1		/* load a 1 into r6 so that add.co */
+					/* can be used */
+	add.co	%r11, %r11, %r6		/* add a one to the lower word of */
+					/* result */
+	bb0.n	destsize, %r12, noaddone/* single result, forget carry */
+	 set	%r9,  %r9,  1<4>	/* indicate that a 1 has been added */
+	add.ci	%r5,  %r5,  %r0		/* propagate carry into high word */
+
+noaddone:
+	set	%r2,  %r2,  1<inexact>
+	set	%r2,  %r2,  1<underflow>
+
+/*
+ * Assemble the result of the denormalization routine for writeback to the
+ * destination register. The exponent of a denormalized number is zero,
+ * so simply assemble the sign and the new mantissa.
+ */
+
+assemble:
+	bb1	destsize, %r12, doubassem	/* assemble double result */
+	bb0	sign, %r10, exassems		/* exit assemble if sign is */
+						/* zero */
+	set	%r11, %r11, 1<sign>		/* make result negative */
+exassems:
+	br	Ureturn
+
+doubassem:
+	bb0.n	sign, %r10, signclr		/* do not set sign in r10 */
+	 or	%r10, %r5,  %r0			/* load high word from r5 */
+						/* into r10 */
+	set	%r10, %r10, 1<sign>		/* high word with sign loaded */
+signclr:
+	/* FALLTHROUGH */
+	/* br	Ureturn */
+
+/* Return to fpui. */
+Ureturn:
+	ld	%r1,  %r31, 0			/* load return address */
+	jmp	%r1
+
+/*
+ * FPoverflow
+ */
+
+ASLOCAL(FPoverflow)
+	st	%r1,  %r31, 0			/* save return address */
+	set	%r2,  %r2,  1<overflow>
+	set	%r2,  %r2,  1<inexact>
+
+/* Determine which rounding mode to use for the default procedure. */
+
+	bb1	modehi, %r10, signed		/* mode is either round */
+						/* toward pos. or neg. */
+	bb0	modelo, %r10, OFnearest		/* rounding mode is round */
+						/* nearest */
+	br	OFzero				/* rounding mode is round */
+						/* zero */
+signed:
+	bb0	modelo, %r10, OFnegative	/* rounding mode is round */
+						/* negative */
+	br	positive			/* rounding mode is round */
+						/* positive */
+
+/*
+ * In the round to nearest mode, positive values are rounded to
+ * positive infinity and negative values are rounded to negative infinity.
+ * The single or double precision value is built from immediate constants.
+ */
+
+OFnearest:
+	bb1.n	destsize, %r12, neardouble	/* branch to neardouble of */
+						/* double result */
+	 mask.u	%r5,  %r10, 0x8000		/* mask off sign bit from */
+						/* MANTHI */
+	or.u	%r11, %r0,  %hi16(0x7f800000)	/* load single infinity */
+						/* constant */
+	or	%r11, %r11, %lo16(0x7f800000)
+	br.n	FPof_return			/* return with result */
+	 or	%r11, %r5,  %r11		/* adjust sign */
+neardouble:
+	or	%r11, %r0,  %r0			/* load lower word of double */
+						/* infinity */
+	or.u	%r10, %r0,  %hi16(0x7ff00000)	/* load upper word of double */
+						/* infinity */
+	or	%r10, %r10, %lo16(0x7ff00000)
+	br.n	FPof_return			/* return with result */
+	 or	%r10, %r5,  %r10		/* adjust sign */
+
+/*
+ * In the round toward zero mode, positive values are rounded to the largest
+ * positive finite number and negative values are rounded to the
+ * largest-magnitude negative finite number.
+ * The single or double precision value is built from immediate constants.
+ */
+
+OFzero:
+	bb1.n	destsize, %r12, zerodouble	/* branch to zerodouble of */
+						/* double result */
+	 mask.u	%r5,  %r10, 0x8000		/* mask off sign bit from */
+						/* MANTHI */
+	or.u	%r11, %r0,  %hi16(0x7f7fffff)	/* load single finite number */
+						/* constant */
+	or	%r11, %r11, %lo16(0x7f7fffff)
+	br.n	FPof_return			/* return with result */
+	 or	%r11, %r5,  %r11		/* adjust sign */
+zerodouble:
+	set	%r11, %r0,  0<0>		/* load lower word of double */
+						/* finite number */
+	or.u	%r10, %r0,  %hi16(0x7fefffff)	/* load upper word of double */
+						/* finite number */
+	or	%r10, %r10, %lo16(0x7fefffff)
+	br.n	FPof_return			/* return with result */
+	 or	%r10, %r5,  %r10		/* adjust sign */
+
+/*
+ * In the round toward positive mode, positive values are rounded to
+ * positive infinity and negative values are rounded to the
+ * largest-magnitude negative finite number.
+ * The single or double precision value is built from immediate constants.
+ */
+
+positive:
+	bb1	destsize, %r12, posdouble	/* branch to section for */
+						/* double result */
+possingle:
+	bb1	sign, %r10, possingleneg	/* branch to section for */
+						/* negatives */
+possinglepos:
+	or.u	%r11, %r0,  %hi16(0x7f800000)	/* load single infinity */
+						/* constant */
+	br.n	FPof_return			/* return with result */
+	 or	%r11, %r11, %lo16(0x7f800000)
+possingleneg:
+	or.u	%r11, %r0,  %hi16(0x7f7fffff)	/* load single finite number */
+						/* constant */
+	or	%r11, %r11, %lo16(0x7f7fffff)
+	br.n	FPof_return			/* return with result */
+	 set	%r11, %r11, 1<sign>		/* set sign for negative */
+posdouble:
+	bb1	sign, %r10, posdoubleneg	/* branch to negative double */
+						/* results */
+posdoublepos:
+	or	%r11, %r0,  %r0			/* load lower word of double */
+						/* infinity */
+	or.u	%r10, %r0,  %hi16(0x7ff00000)	/* load upper word of double */
+						/* infinity */
+	br.n	FPof_return			/* return with result */
+	 or	%r10, %r10, %lo16(0x7ff00000)
+posdoubleneg:
+	set	%r11, %r0,  0<0>		/* load lower word of finite */
+						/* number */
+	or.u	%r10, %r0,  %hi16(0x7fefffff)	/* load upper word of finite */
+						/* number */
+	or	%r10, %r10, %lo16(0x7fefffff)
+	br.n	FPof_return			/* return with result */
+	 set	%r10, %r10, 1<sign>		/* set sign for negative */
+
+/*
+ * In the round toward negative mode, positive values are rounded to the
+ * largest positive finite number and negative values are rounded to negative
+ * infinity.
+ * The single or double precision value is built from immediate constants.
+ */
+
+/*
+ * OFnegative: build the default overflow result for round-toward-negative.
+ *
+ * Reads:	%r12 (bit `destsize' selects a double result),
+ *		%r10 (bit `sign' selects the negative variant).
+ * Writes:	%r11 for a single result; %r10 (upper word) and %r11
+ *		(lower word) for a double result.
+ * The first three cases branch to FPof_return; the last one
+ * (negdoubleneg) has no branch and runs straight into the code that
+ * follows it.  Instructions indented by one extra space sit in the delay
+ * slot of the preceding `.n' branch.
+ */
+OFnegative:
+	bb1	destsize, %r12, negdouble	/* branch to section for */
+						/* double result */
+negsingle:
+	bb1	sign, %r10, negsingleneg	/* branch to section for */
+						/* negatives */
+negsinglepos:
+	/* positive single overflow: largest finite number (0x7f7fffff) */
+	or.u	%r11, %r0,  %hi16(0x7f7fffff)	/* upper half of single */
+						/* finite number constant */
+	br.n	FPof_return			/* return with result */
+	 or	%r11, %r11, %lo16(0x7f7fffff)	/* delay slot: lower half */
+negsingleneg:
+	/* negative single overflow: infinity with the sign bit set */
+	or.u	%r11, %r0,  %hi16(0x7f800000)	/* upper half of single */
+						/* infinity constant */
+	or	%r11, %r11, %lo16(0x7f800000)	/* lower half */
+	br.n	FPof_return			/* return with result */
+	 set	%r11, %r11, 1<sign>		/* set sign for negative */
+negdouble:
+	bb1	sign, %r10, negdoubleneg	/* branch to negative double */
+						/* results */
+negdoublepos:
+	/* positive double overflow: largest finite number */
+	/*
+	 * NOTE(review): a bit-field width of 0 presumably means all 32
+	 * bits, so this yields 0xffffffff in %r11 -- confirm against the
+	 * MC88100 manual.
+	 */
+	set	%r11, %r0,  0<0>		/* load lower word of finite */
+						/* number */
+	or.u	%r10, %r0,  %hi16(0x7fefffff)	/* load upper word of finite */
+						/* number */
+	br.n	FPof_return			/* return with result */
+	 or	%r10, %r10, %lo16(0x7fefffff)	/* delay slot: lower half */
+negdoubleneg:
+	/* negative double overflow: infinity with the sign bit set */
+	or	%r11, %r0,  %r0			/* lower word of double */
+						/* infinity is zero */
+	or.u	%r10, %r0,  %hi16(0x7ff00000)	/* load upper word of double */
+						/* infinity */
+	or	%r10, %r10, %lo16(0x7ff00000)
+	set	%r10, %r10, 1<sign>		/* set sign for negative */
+	/* no branch here: execution continues with the next instruction */
+
+/*
+ * FPof_return: common exit of the overflow default-result paths.
+ * Reloads the return address from 0(%r31) into %r1 and jumps to it; the
+ * result registers %r10/%r11 are left untouched.
+ * NOTE(review): the store that fills 0(%r31) is not in this part of the
+ * file; presumably the overflow entry code saves %r1 there -- confirm.
+ */
+FPof_return:
+	ld	%r1,  %r31, 0			/* load return address */
+	jmp	%r1				/* back to the saved address */
+
+/*
+ * m88100_fpu_imprecise_exception
+ *
+ * On entry %r2 holds the exception frame (E.F.) pointer and %r1 the
+ * caller's return address.  The FPU state saved in the frame is loaded
+ * into registers, FPECR selects the underflow or overflow handler, and
+ * fpui_wrapup then writes the (possibly revised) FPSR/FPCR and the result
+ * back before returning to the caller.
+ *
+ * Register use once the frame has been read:
+ *	%r2  = FPSR	%r3  = FPCR	%r4  = FPECR
+ *	%r10 = FPRH	%r11 = FPRL	%r12 = FPIT
+ *	%r29 = exception frame pointer
+ *
+ * Stack frame (16 bytes): 4(%r31) holds the caller's %r1, 8(%r31) holds
+ * the frame pointer.  0(%r31) is the slot FPof_return reloads its return
+ * address from.
+ */
+ENTRY(m88100_fpu_imprecise_exception)
+	or	%r29, %r2,  %r0			/* r29 is now the E.F. */
+	subu	%r31, %r31, 16			/* allocate 16 bytes of stack */
+	st	%r1,  %r31, 4			/* save caller's return address */
+	st	%r29, %r31, 8			/* save the E.F. pointer */
+
+	/* fetch the saved FPU state from the exception frame */
+	ld	%r2 , %r29, EF_FPSR
+	ld	%r3 , %r29, EF_FPCR
+	ld	%r4 , %r29, EF_FPECR
+	ld	%r10, %r29, EF_FPRH
+	ld	%r11, %r29, EF_FPRL
+	ld	%r12, %r29, EF_FPIT
+
+/*
+ * Load into r1 the return address for the exception handlers, so that
+ * they come back to fpui_wrapup.  Looking at FPECR, branch to the
+ * appropriate exception handler; underflow is tested before overflow.
+ */
+
+	or.u	%r1,  %r0,  %hi16(fpui_wrapup)	/* load return address of */
+	or	%r1,  %r1,  %lo16(fpui_wrapup)	/* functions */
+
+	bb0	2,    %r4,  2f			/* FPECR bit 2 clear: skip */
+	br	_ASM_LABEL(FPunderflow)		/* bit set: go to FPunderflow */
+2:
+	bb0	1,    %r4,  3f			/* FPECR bit 1 clear: skip */
+	br	_ASM_LABEL(FPoverflow)		/* bit set: go to FPoverflow */
+3:
+	/*
+	 * Neither bit is set: fall through to fpui_wrapup with the values
+	 * loaded above unchanged.
+	 */
+	/* XXX handle inexact!!! */
+
+/*
+ * fpui_wrapup: common tail, also the address the handlers return to.
+ * Expects %r2 = FPSR value, %r3 = FPCR value, %r10/%r11 = result words
+ * and %r12 = FPIT.
+ */
+fpui_wrapup:
+	FLUSH_PIPELINE				/* make sure all floating */
+						/* point operations have */
+						/* finished */
+	ldcr	%r4,  %cr1			/* load the PSR */
+#if 0
+	/* compiled out: would also set the FPU disable bit in the PSR */
+	set	%r4,  %r4,  1<PSR_FPU_DISABLE_BIT>
+#endif
+	set	%r4,  %r4,  1<PSR_INTERRUPT_DISABLE_BIT>
+	stcr	%r4,  %cr1			/* write the PSR back with */
+						/* the interrupt disable */
+						/* bit set */
+	ld	%r1,  %r31, 4			/* restore caller's return */
+						/* address */
+	ld	%r29, %r31, 8			/* restore the E.F. pointer */
+	addu	%r31, %r31, 16			/* release the stack frame */
+
+	fstcr	%r2, FPSR		/* write revised value of FPSR... */
+	fstcr	%r3, FPCR		/* ...and FPCR... */
+	st	%r2, %r29, EF_FPSR	/* ...into the trapframe as well */
+	st	%r3, %r29, EF_FPCR
+
+	/*
+	 * Write back the results into the register save area of the frame.
+	 * %r2 becomes the low five bits of FPIT, used as the word index from
+	 * EF_R0; %r3 becomes the base address of that area.
+	 */
+	extu	%r2,  %r12, 5<0>		/* %r2 = FPIT bits 4..0 */
+	bb0.n	destsize, %r12, Iwritesingle	/* single: one word only */
+	 addu	%r3,  %r29, EF_R0		/* delay slot: %r3 = frame */
+						/* + EF_R0 */
+	st	%r10, %r3[%r2]			/* double: upper word first */
+	addu	%r2,  %r2,  1			/* index of the next slot... */
+	clr	%r2,  %r2,  27<5>		/* ...keeping only bits 4..0 */
+Iwritesingle:
+	jmp.n	%r1				/* return to the caller */
+	 st	%r11, %r3[%r2]			/* delay slot: store %r11 */