sys/arch/m88k/m88k/m88100_fp.S - annotate

Return to m88100_fp.S CVS log
Up to [local] / sys / arch / m88k / m88k
Annotation of sys/arch/m88k/m88k/m88100_fp.S, Revision 1.1.1.1

1.1       nbrk        1: /* $OpenBSD: m88100_fp.S,v 1.4 2004/08/09 20:52:11 miod Exp $  */
                      2: /*
                      3:  * Mach Operating System
                      4:  * Copyright (c) 1991 Carnegie Mellon University
                      5:  * Copyright (c) 1991 OMRON Corporation
                      6:  * All Rights Reserved.
                      7:  *
                      8:  * Permission to use, copy, modify and distribute this software and its
                      9:  * documentation is hereby granted, provided that both the copyright
                     10:  * notice and this permission notice appear in all copies of the
                     11:  * software, derivative works or modified versions, and any portions
                     12:  * thereof, and that both notices appear in supporting documentation.
                     13:  *
                     14:  * CARNEGIE MELLON AND OMRON ALLOW FREE USE OF THIS SOFTWARE IN ITS "AS IS"
                     15:  * CONDITION.  CARNEGIE MELLON AND OMRON DISCLAIM ANY LIABILITY OF ANY KIND
                     16:  * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
                     17:  *
                     18:  * Carnegie Mellon requests users of this software to return to
                     19:  *
                     20:  *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
                     21:  *  School of Computer Science
                     22:  *  Carnegie Mellon University
                     23:  *  Pittsburgh PA 15213-3890
                     24:  *
                     25:  * any improvements or extensions that they make and grant Carnegie the
                     26:  * rights to redistribute these changes.
                     27:  */
                     28:
                     29: /* Floating point trouble routines */
                     30: #include "assym.h"
                     31: #include <machine/trap.h>
                     32: #include <machine/asm.h>
                     33:
                     34: #define destsize 10
                     35:
                     36: /* Floating-Point Status Register (FPSR) bit numbers */
                     37: #define inexact 0
                     38: #define overflow 1
                     39: #define underflow 2
                     40: #define divzero 3       /* set by the divide-by-zero handler */
                     41: #define oper 4          /* set for an invalid operation */
                     42:
                     43: #define sign 31         /* sign bit of an operand word */
                     44: #define s1size 9        /* FPPT bit: source 1 is double precision */
                     45: #define s2size 7        /* FPPT bit: source 2 is double precision */
                     46: #define dsize 5         /* FPPT bit: destination is double precision */
                     47:
                     48: #define FADDop 0x05     /* opcode values, compared with FPPT bits 15..11 */
                     49: #define FSUBop 0x06
                     50: #define FCMPop 0x07
                     51: #define FMULop 0x00
                     52: #define FDIVop 0x0e
                     53: #define FSQRTop 0x0f
                     54: #define INTop 0x09
                     55: #define NINTop 0x0a
                     56: #define TRNCop 0x0b
                     57:
                     58: #define s1nan 7
                     59: #define s2nan 6
                     60: #define s1inf 5
                     61: #define s2inf 4
                     62: #define s1zero 3
                     63: #define s2zero 2
                     64: #define sigbit 19
                     65:
                     66: #define modehi 30
                     67: #define modelo 29
                     68: #define rndhi 15        /* high bit of the FPCR rounding mode field */
                     69: #define rndlo 14        /* low bit of the FPCR rounding mode field */
                     70: #define efunf 7
                     71: #define efovf 6
                     72: #define efinx 5
                     73:
                     74: ASENTRY(m88100_Xfp_precise)     /* in: r3 = exception frame (E.F.) pointer */
                     75:        or      r29, r3,  r0            /* r29 is now the E.F. pointer */
                     76:        subu    r31, r31, 16            /* allocate a 16 byte stack frame */
                     77:        st      r1,  r31, 8             /* save caller return address */
                     78:        st      r29, r31, 12            /* save E.F. pointer */
                     79:
                     80:        ld      r2, r29, EF_FPSR * 4    /* r2 = FPSR from the E.F. */
                     81:        ld      r3, r29, EF_FPCR * 4    /* r3 = FPCR from the E.F. */
                     82:        ld      r4, r29, EF_FPECR * 4   /* r4 = FPECR (exception cause) */
                     83:        ld      r5, r29, EF_FPHS1 * 4   /* r5 = high word of source 1 */
                     84:        ld      r6, r29, EF_FPLS1 * 4   /* r6 = low word of source 1 */
                     85:        ld      r7, r29, EF_FPHS2 * 4   /* r7 = high word of source 2 */
                     86:        ld      r8, r29, EF_FPLS2 * 4   /* r8 = low word of source 2 */
                     87:        ld      r9, r29, EF_FPPT * 4    /* r9 = FPPT (opcode, sizes, dest) */
                     88:
                     89:
                     90:        /*
                     91:         * Load into r1 the return address for the handlers. Looking at
                     92:         * FPECR, branch to the appropriate handler. However, if none of
                     93:         * the bits tested below are set, then a floating point instruction
                     94:         * was issued with the floating point unit disabled. This is treated
                     95:         * as an unimplemented opcode by falling through to FPuimp.
                     96:         */
                     97:
                     98:        or.u    r1,r0,hi16(wrapup)      /* handlers return to wrapup via r1 */
                     99:        or      r1,r1,lo16(wrapup)
                    100:
                    101:        bb0     6,r4, 3f                /* branch to FPuimp if bit 6 is set */
                    102:        br      FPuimp
                    103: 3:
                    104:        bb0     7,r4, 4f                /* branch to FPintover if bit 7 is set */
                    105:        br      FPintover
                    106: 4:
                    107: #if 0
                    108:        bb0     5,r4, 5f                /* (disabled) FPpriviol if bit 5 is set */
                    109:        br      FPpriviol
                    110: #endif
                    111: 5:
                    112:        bb0     4,r4, 6f                /* branch to FPresoper if bit 4 is set */
                    113:        br      FPresoper
                    114: 6:
                    115:        bb0     3,r4, 7f                /* branch to FPdivzero if bit 3 is set */
                    116:        br      FPdivzero
                    117: 7:
                    118:        or.u    r4, r4, 0xffff          /* no cause bit matched: fall into FPuimp */
                    119:
                    120: ASLOCAL(FPuimp)                 /* hand the exception to m88100_trap() */
                    121:        subu    r31,r31,16              /* allocate stack */
                    122:        st      r1,r31,0                /* save return address */
                    123:        or      r2,r0,T_FPEPFLT         /* r2 = trap type T_FPEPFLT */
                    124:        bsr.n   _C_LABEL(m88100_trap)   /* call the C trap handler */
                    125:         or     r3, r29, r0             /* delay slot: r3 = E.F. pointer */
                    126:        ld      r1,r31,0                /* recover return address */
                    127:        addu    r31,r31,16              /* deallocate stack */
                    128:        jmp     r1                      /* return through the saved r1 */
                    129:
                    130:        /*
                    131:         * To write back the results to the user registers, disable exceptions
                    132:         * and the floating point unit. Write FPSR and FPCR and load the SNIP
                    133:         * and SFIP.
                    134:         * r5 will contain the upper word of the result
                    135:         * r6 will contain the lower word of the result
                    136:         */
                    137:
                    138: ASLOCAL(wrapup)                 /* in: r2 = FPSR, r3 = FPCR, r5:r6 = result */
                    139:        tb1     0,r0,0          /* make sure all floating point operations */
                    140:                                /* have finished */
                    141:        ldcr    r10, cr1        /* load the PSR */
                    142: #if 0
                    143:        set     r10, r10, 1<PSR_FPU_DISABLE_BIT>        /* (disabled) */
                    144: #endif
                    145:        set     r10, r10, 1<PSR_INTERRUPT_DISABLE_BIT>  /* mask interrupts */
                    146:        stcr    r10, cr1        /* write the PSR back */
                    147:
                    148:        ld      r1, r31, 8      /* restore return address saved at entry */
                    149:        ld      r29, r31, 12    /* restore E.F. pointer saved at entry */
                    150:        addu    r31, r31, 16    /* release the entry stack frame */
                    151:
                    152:        fstcr   r2, FPSR        /* write revised value of FPSR */
                    153:        fstcr   r3, FPCR        /* write revised value of FPCR */
                    154:
                    155:        /* result writeback routine */
                    156:        addu    r3, r29, EF_R0 * 4      /* r3 = address of the r0 slot in the E.F. */
                    157:        extu    r2, r9, 5<0>            /* get 5 bits of destination register */
                    158:        bb0     5, r9, writesingle      /* branch if destination is single */
                    159:
                    160: /* writedouble here */
                    161:        st      r5, r3 [r2]             /* write high word */
                    162:        add     r2, r2, 1               /* for double, the low word goes into */
                    163:        /* the register following the destination */
                    164:        clr     r2, r2, 27<5>           /* perform equivalent of mod 32 */
                    165: ASLOCAL(writesingle)
                    166:        jmp.n   r1                      /* return to the caller */
                    167:         st     r6, r3 [r2]             /* delay slot: write low word into memory */
                    168:
                    169: /*
                    170:  * Check if the numerator is zero. If the numerator is zero, then handle
                    171:  * this instruction as you would a 0/0 invalid operation.
                    172:  */
                    173:
                    174: ASLOCAL(FPdivzero)              /* in: r5:r6 = numerator, r9 = FPPT */
                    175:        bb1.n   s1size,r9,1f            /* branch if numerator double */
                    176:         st     r1,r31,0                /* delay slot: save return address */
                    177: /* single number */
                    178:        clr     r10,r5,1<sign>  /* clear sign bit */
                    179:        extu    r11,r6,3<29>    /* grab upper bits of lower word */
                    180:        or      r10,r10,r11     /* nonzero if any numerator bit is set */
                    181:        bcnd    eq0,r10,resoper /* numerator is zero, handle reserved operand */
                    182:        br      setbit          /* nonzero numerator: set divzero bit */
                    183: 1:
                    184: /* double number */
                    185:        clr     r10,r5,1<sign>  /* clear sign bit */
                    186:        or      r10,r10,r6      /* or high and low words */
                    187:        bcnd    ne0,r10,setbit  /* nonzero numerator: set divzero bit, */
                                                       /* otherwise fall through to resoper */
                    188:
                    189: /*
                    190:  * The numerator is zero, so handle the invalid operation by setting the
                    191:  * invalid operation bit and writing a quiet NaN to the destination.
                    192:  */
                    193:
                    194: ASLOCAL(resoper)                /* 0/0: flag invalid operation, return NaN */
                    195:        set     r2,r2,1<oper>   /* set invalid operation bit in FPSR copy */
                    196:        set     r5,r0,0<0>      /* put a NaN in high word */
                    197:        set     r6,r0,0<0>      /* put a NaN in low word */
                    198:        br      FP_div_return   /* reload return address and return */
                    199:                                /* writing to a word which may be ignored */
                    200:                                /* is just as quick as checking the precision */
                    201:                                /* of the destination */
                    202:
                    203: /*
                    204:  * The operation is divide by zero, so set the divide by zero bit in the
                    205:  * FPSR.
                    206:  * Considering the sign of the numerator and zero, write a correctly
                    207:  * signed infinity of the proper precision into the destination.
                    208:  */
                    209:
                    210: setbit:                         /* x/0 with x != 0: return a signed infinity */
                    211:        set     r2,r2,1<divzero>        /* set divide by zero bit in FPSR copy */
                    212:        bb1     dsize,r9,FPzero_double  /* branch to handle double result */
                    213: FPzero_single:
                    214:        clr     r10,r5,31<0>    /* clear all of S1HI except sign bit */
                    215:        xor     r10,r7,r10      /* xor the sign bits of the operands */
                    216:        or.u    r6,r0,0x7f80    /* load single precision infinity */
                    217:        br.n    FP_div_return
                    218:         or     r6,r6,r10       /* delay slot: apply the result sign */
                    219:
                    220: FPzero_double:
                    221:        clr     r10,r5,31<0>    /* clear all of S1HI except sign bit */
                    222:        xor     r10,r7,r10      /* xor the sign bits of the operands */
                    223:        or.u    r5,r0,0x7ff0    /* load double precision infinity */
                    224:        or      r5,r5,r10       /* load correctly signed infinity */
                    225:        or      r6,r0,r0        /* clear lower word of double */
                    226:
                    227: FP_div_return:
                    228:        ld      r1,r31,0        /* reload return address saved by FPdivzero */
                    229:        jmp     r1              /* return (r1 was set to wrapup at entry) */
                    230:
                    231: /*
                    232:  * Both NINT and TRNC require a certain rounding mode, so check which
                    233:  * instruction caused the integer conversion overflow. Use a substitute
                    234:  * FPCR in r1, and modify the rounding mode if the instruction is NINT
                    235:  * or TRNC.
                    236:  */
                    237: ASLOCAL(FPintover)              /* in: r3 = FPCR, r7:r8 = S2, r9 = FPPT */
                    238:        extu    r10,r9,5<11>            /* extract 5 bit opcode from FPPT */
                    239:        cmp     r11,r10,INTop           /* see if instruction is INT */
                    240:        st      r1,r31,0                /* save return address */
                    241:        bb1.n   eq,r11,checksize        /* instruction is INT, do not modify */
                    242:                                        /* rounding mode */
                    243:         or     r1,r0,r3                /* delay slot: r1 = working copy of FPCR */
                    244:        cmp     r11,r10,NINTop          /* see if instruction is NINT */
                    245:        bb1     eq,r11,NINT             /* instruction is NINT */
                    246: TRNC:
                    247:        clr     r1,r1,2<rndlo>          /* clear rounding mode bits, */
                    248:                                        /* instruction is TRNC */
                    249:        br.n    checksize               /* branch to check size */
                    250:         set    r1,r1,1<rndlo>          /* make rounding mode round towards */
                    251:                                        /* zero (mode bits 01) */
                    252: NINT:
                    253:        clr     r1,r1,2<rndlo>          /* make rounding mode round to */
                    254:                                        /* nearest (mode bits 00) */
                    255:
                    256: /* See whether the source is single or double precision. */
                    257:
                    258: checksize:
                    259:        bb1     s2size,r9,checkdoub     /* S2 is double, branch to see if */
                    260:                                        /* there is a false alarm; otherwise */
                                                               /* fall through to checksing */
                    261:
                    262: /*
                    263:  * An integer has more bits than the mantissa of a single precision floating
                    264:  * point number, so to check for false alarms (i.e. valid conversion), simply
                    265:  * check the exponents. False alarms are detected for 2**30 to (2**31) - 1
                    266:  * and -2**30 to -2**31. Only seven bits need to be looked at since an
                    267:  * exception will not occur for the other half of the numbering system.
                    268:  * To speed up the processing, first check to see if the exponent is 32 or
                    269:  * greater.
                    270:  *
                    271:  * This code was originally written for the exponent in the control
                    272:  * register to have the most significant bit (8 - single, 11 - double)
                    273:  * flipped and sign extended. For precise exceptions, however, the most
                    274:  * significant bit is only sign extended. Therefore, the code was chopped
                    275:  * up so that it would work for positive values of real exponent which were
                    276:  * only sign extended.
                    277:  */
                    278:
                    279: checksing:
                    280:        extu    r10,r7,7<20>    /* internal representation for single */
                    281:                                /* precision is IEEE 8 bits sign extended */
                    282:                                /* to 11 bits; for real exp. = 30, the */
                    283:                                /* above instruction gives a result exp. */
                    284:                                /* that has the MSB flipped and sign */
                    285:                                /* extended like in the IMPCR */
                    286:        cmp     r11,r10,31      /* compare to 32, but exp. off by 1 */
                    287:                                /* these 2 instructions speed up the */
                    288:                                /* handling of genuine overflows */
                    289:        bb1     ge,r11,overflw  /* not a false alarm, perform overflow routine */
                    290:        bb1     sign,r7,checksingn /* source operand is negative; otherwise */
                                                          /* fall through to checksingp */
                    291:
                    292: /*
                    293:  * If the number is positive and the exponent is greater than 30, then it
                    294:  * is an overflow.
                    295:  */
                    296: checksingp:                     /* positive single precision source */
                    297:        cmp     r10,r10,29      /* compare to 30, but exp. off by 1 */
                    298:        bb1     gt,r10,overflw  /* no false alarm, it is overflow */
                    299:        br      conversionsp    /* false alarm: finish single precision conversion */
                    300:
                    301: /*
                    302:  * If the number is negative, and the exponent is 30, or 31 with a mantissa
                    303:  * of 0, then it is a false alarm.
                    304:  */
                    305: checksingn:                     /* negative single precision source */
                    306:        cmp     r11,r10,30              /* compare to 31, but exp. off by 1 */
                    307:        bb1     lt,r11,conversionsn     /* exp. less than 31, so convert */
                    308:        extu    r10,r8,3<29>            /* get upper three bits of lower */
                    309:                                        /* mantissa */
                    310:        mak     r12,r7,20<3>            /* get upper 20 bits of mantissa */
                    311:        or      r10,r10,r12             /* form complete mantissa */
                    312:        bcnd    eq0,r10,conversionsn    /* complete conversion if mantissa */
                    313:                                        /* is 0; r11 still holds the compare */
                    314:        br      overflw                 /* no false alarm, it is overflow */
                    315:
                    316: /*
                    317:  * False alarms are detected for 2**30 to (2**31) - 1 and -2**30 to -2**31.
                    318:  * Only seven bits need to be looked at since an exception will not occur
                    319:  * for the other half of the numbering system.
                    320:  * To speed up the processing, first check to see if the exponent is 32 or
                    321:  * greater. Since there are more mantissa bits than integer bits, rounding
                    322:  * could cause overflow. (2**31) - 1 needs to be checked so that it does
                    323:  * not round to 2**31, and -2**31 needs to be checked in case it rounds to
                    324:  * -((2**31) + 1).
                    325:  */
                    326: checkdoub:
                    327:        extu    r10,r7,10<20>   /* internal representation for double */
                    328:                                /* precision is the same IEEE 11 bits */
                    329:                                /* for real exp. = 30, the */
                    330:                                /* above instruction gives a result exp. */
                    331:                                /* that has the MSB flipped and sign */
                    332:                                /* extended like in the IMPCR */
                    333:        cmp     r11,r10,31      /* compare to 32, but exp. off by 1 */
                    334:                                /* these 2 instructions speed up the */
                    335:                                /* handling of genuine overflows */
                    336:        bb1     ge,r11,overflw  /* not a false alarm, perform overflow routine */
                    337:        bb1     sign,r7,checkdoubn /* source operand is negative; otherwise */
                                                          /* fall through to checkdoubp */
                    338:
                    339: /*
                    340:  * If the exponent is not 31, then the floating point number will be rounded
                    341:  * before the conversion is done. A branch table is set up with bits 4 and 3
                    342:  * being the rounding mode, and bits 2, 1, and 0 are the guard, round, and
                    343:  * sticky bits.
                    344:  */
                    345: checkdoubp:                     /* positive double source; r1 = working FPCR */
                    346:        cmp     r11,r10,30      /* compare to 31, but exponent off by 1 */
                    347:        bb1     eq,r11,overflw  /* no false alarm, it is overflow */
                    348:        extu    r12,r8,1<22>    /* get LSB for integer with exp. = 30 */
                    349:        mak     r12,r12,1<2>    /* LSB becomes bit 2 of the table index */
                    350:        extu    r11,r8,1<21>    /* get guard bit */
                    351:        mak     r11,r11,1<1>    /* guard becomes bit 1 of the table index */
                    352:        or      r12,r11,r12     /* combine LSB and guard */
                    353:        extu    r11,r8,21<0>    /* get bits for sticky bit */
                    354:        bcnd    eq0,r11,nostickyp /* do not set sticky */
                    355:        set     r12,r12,1<0>    /* sticky is bit 0 of the table index */
                    356: nostickyp:
                    357:        rot     r11,r1,0<rndlo>         /* shift rounding mode to 2 LSB's */
                    358:        mak     r11,r11,2<3>            /* mode becomes bits 4..3, clear other bits */
                    359:        or      r12,r11,r12             /* r12 = 5 bit index into ptable */
                    360:        lda     r12,r0[r12]             /* scale r12 to a table offset */
                    361:        or.u    r12,r12,hi16(ptable)    /* load pointer into table */
                    362:        addu    r12,r12,lo16(ptable)
                    363:        jmp     r12                     /* jump to the selected ptable entry */
                    364:
                    365: ptable:                         /* index = mode<<3 | LSB<<2 | guard<<1 | sticky */
                    366:        br      conversiondp    /* entries 0-7: mode 00, round to nearest */
                    367:        br      conversiondp
                    368:        br      conversiondp
                    369:        br      paddone         /* guard and sticky set: round up */
                    370:        br      conversiondp
                    371:        br      conversiondp
                    372:        br      paddone         /* LSB and guard set: round up */
                    373:        br      paddone
                    374:        br      conversiondp    /* entries 8-15: mode 01, round toward zero */
                    375:        br      conversiondp
                    376:        br      conversiondp
                    377:        br      conversiondp
                    378:        br      conversiondp
                    379:        br      conversiondp
                    380:        br      conversiondp
                    381:        br      conversiondp
                    382:        br      conversiondp    /* entries 16-23: mode 10, round toward negative */
                    383:        br      conversiondp
                    384:        br      conversiondp
                    385:        br      conversiondp
                    386:        br      conversiondp
                    387:        br      conversiondp
                    388:        br      conversiondp
                    389:        br      conversiondp
                    390:        br      conversiondp    /* entries 24-31: mode 11, round toward positive */
                    391:        br      paddone         /* any guard or sticky bit set: round up */
                    392:        br      paddone
                    393:        br      paddone
                    394:        br      conversiondp
                    395:        br      paddone
                    396:        br      paddone
                    397:        br      paddone
                    398:
                    399: /*
                    400:  * Add one to the bit of the mantissa which corresponds to the LSB of an
                    401:  * integer. If the mantissa overflows, then there is a valid integer
                    402:  * overflow conversion; otherwise, the mantissa can be converted to the
                    403:  * integer.
                    404:  */
                    405: paddone:                        /* round the mantissa in r7:r8 up by one */
                    406:        or      r10,r0,r0       /* clear r10 */
                    407:        set     r10,r10,1<22>   /* set LSB bit to 1 for adding */
                    408:        addu.co r8,r8,r10       /* add the 1 obtained from rounding, */
                                                       /* carry out of the low word is kept */
                    409:        clr     r11,r7,12<20>   /* clear exponent and sign */
                    410:        addu.ci r11,r0,r11      /* add carry into the high mantissa */
                    411:        bb1     20,r11,overflw  /* overflow to 2**31, abort the rest */
                    412:        br.n    conversiondp    /* since the exp. was 30, and the exp. */
                    413:                                /* did not round up to 31, the largest */
                    414:                                /* number that S2 could become is 2**31-1 */
                    415:         or     r7,r0,r11       /* delay slot: r7 = rounded high mantissa */
                    416:
                    417: /*
                    418:  * Now check for negative double precision sources. If the exponent is 30,
                    419:  * then convert the false alarm. If the exponent is 31, then check the
                    420:  * mantissa bits which correspond to integer bits. If any of them are a one,
                    421:  * then there is overflow. If they are zero, then check the guard, round,
                    422:  * and sticky bits.
                    423:  * Round toward zero and positive will not cause a roundup, but round toward
                    424:  * nearest and negative may, so perform those roundings. If there is no
                    425:  * overflow, then convert and return.
                    426:  */
                    427: checkdoubn:                     /* negative double source; r1 = working FPCR */
                    428:        cmp     r11,r10,29              /* compare to 30, but exp. off by 1 */
                    429:        bb1     eq,r11,conversiondn     /* false alarm if exp. = 30 */
                    430:        extu    r10,r8,11<21>           /* check upper bits of lower mantissa */
                    431:        bcnd    ne0,r10,overflw         /* one of the bits is a 1, so oflow */
                    432:        extu    r10,r7,20<0>            /* check upper bits of upper mantissa */
                    433:        bcnd    ne0,r10,overflw         /* one of the bits is a 1, so oflow */
                    434:        bb0     rndlo,r1,possround      /* rounding mode is either round near */
                    435:                                        /* or round negative, which may cause */
                    436:                                        /* a round */
                    437:        br.n    FPintov_return          /* round zero or positive, which will */
                    438:                                        /* not cause a round */
                    439:         set    r6,r0,1<sign>           /* delay slot: result is 0x80000000 */
                    440: possround:
                    441:        extu    r12,r8,1<20>            /* get guard bit */
                    442:        extu    r11,r8,20<0>            /* get bits for sticky bit */
                    443:        bcnd.n  eq0,r11,nostickyn       /* do not set sticky */
                    444:         mak    r12,r12,1<1>            /* delay slot: guard becomes bit 1 */
                    445:        set     r12,r12,1<0>            /* set sticky bit */
                    446: nostickyn:
                    447:        bb1     rndhi,r1,negative       /* rounding mode is negative */
                    448: nearest:
                    449:        cmp     r12,r12,3               /* are both guard and sticky set */
                    450:        bb1     eq,r12,overflw          /* both guard and sticky are set, */
                    451:                                        /* so signal overflow */
                    452:        or      r6,r0,r0                /* clear destination register r6 */
                    453:        br.n    FPintov_return
                    454:         set    r6,r6,1<sign>           /* set the sign bit and take care of */
                    455:                                        /* this special case */
                    456: negative:
                    457:        bcnd    ne0,r12,overflw         /* -2**31 will be rounded to */
                    458:                                        /* -(2**31+1), so signal overflow */
                    459:        or      r6,r0,r0                /* clear destination register r6 */
                    460:        br.n    FPintov_return
                    461:         set    r6,r6,1<sign>           /* set the sign bit and take care of */
                    462:                                        /* this special case */
                    463:
                    464:        /*
                    465:         * Since the exp. was 30, and there was no round-up, the largest
                    466:         * number that S2 could have been was 2**31 - 1
                    467:         */
                    468:
                    469:
                    470:        /* Convert the single precision positive floating point number. */
                    471:
                    472: conversionsp:                   /* out: r6 = integer result */
                    473:        extu    r6,r8,3<29>     /* extract lower bits of integer */
                    474:        mak     r6,r6,3<7>      /* shift left to correct place in integer */
                    475:        mak     r10,r7,20<10>   /* shift left upper bits of integer */
                    476:        or      r6,r6,r10       /* form most of integer */
                    477:        br.n    FPintov_return
                    478:         set    r6,r6,1<30>     /* delay slot: set hidden one */
                    479:
                    480:        /* Convert the single precision negative floating point number. */
                    481:
                    482: conversionsn:                   /* in: r11 = compare result from checksingn */
                    483:        bb1     eq,r11,exp31s   /* use old r11 to see if exp. is 31 */
                    484:        extu    r6,r8,3<29>     /* extract lower bits of mantissa */
                    485:        mak     r6,r6,3<7>      /* shift left to correct place in integer */
                    486:        mak     r10,r7,20<10>   /* shift left upper bits of integer */
                    487:        or      r6,r6,r10       /* form most of integer */
                    488:        set     r6,r6,1<30>     /* set hidden one */
                    489:        or.c    r6,r0,r6        /* complement the result */
                    490:        br.n    FPintov_return
                    491:         addu   r6,r6,1         /* delay slot: add 1 to get 2's complement */
                    492: exp31s:
                    493:        or      r6,r0,r0        /* clear r6 */
                    494:        br.n    FPintov_return
                    495:         set    r6,r6,1<sign>   /* delay slot: set sign bit, result is -2**31 */
                    496:
                    497:        /* Convert the double precision positive floating point number. */
                    498:
                    499: conversiondp:                   /* build the integer in r6 from r7 (high) and r8 (low) */
                    500:        extu    r6,r8,10<22>    /* extract lower bits of integer (r8 bits 31..22) */
                    501:        mak     r10,r7,20<10>   /* shift left upper bits of integer (bits 29..10) */
                    502:        or      r6,r6,r10       /* form most of integer */
                    503:        br.n    FPintov_return
                    504:         set    r6,r6,1<30>     /* delay slot: set hidden one at bit 30 */
                    505:
                    506:        /*
                    507:         * Convert the double precision negative floating point number.
                    508:         * The number, whose exponent is 30, must be rounded before converting.
                    509:         * Bits 4 and 3 of the branch table index are the rounding mode, and
                    510:         * bits 2, 1, and 0 are the integer LSB, guard, and sticky bits.
                    511:         */
                    512:
                    513: conversiondn:
                    514:        extu    r12,r8,1<22>    /* get LSB for integer with exp. = 30 */
                    515:        mak     r12,r12,1<2>    /* LSB becomes bit 2 of the table index */
                    516:        extu    r11,r8,1<21>    /* get guard bit */
                    517:        mak     r11,r11,1<1>    /* guard becomes bit 1 of the table index */
                    518:        or      r12,r11,r12     /* set up field for branch table */
                    519:        extu    r11,r8,21<0>    /* get bits for sticky bit (r8 bits 20..0) */
                    520:        bcnd    eq0,r11,nostkyn /* do not set sticky */
                    521:        set     r12,r12,1<0>    /* set sticky bit (bit 0 of the table index) */
                    522: nostkyn:
                    523:        rot     r11,r1,0<rndlo> /* shift rounding mode to 2 LSBs */
                    524:        mak     r11,r11,2<3>    /* set up field, clear other bits */
                    525:        or      r12,r11,r12     /* set up field for branch table */
                    526:        lda     r12,r0[r12]     /* scale r12 by the 4-byte table entry size */
                    527:        or.u    r12,r12,hi16(ntable) /* load pointer into table */
                    528:        addu    r12,r12,lo16(ntable)
                    529:        jmp     r12             /* dispatch to naddone or nnoaddone */
                    530:
                    531: ntable:                         /* 32 entries, index = mode<4:3> | LSB<2> | guard<1> | sticky<0> */
                    532:        br      nnoaddone       /* mode 0: add one only for guard & (sticky | LSB) */
                    533:        br      nnoaddone
                    534:        br      nnoaddone
                    535:        br      naddone
                    536:        br      nnoaddone
                    537:        br      nnoaddone
                    538:        br      naddone
                    539:        br      naddone
                    540:        br      nnoaddone       /* mode 1: never add one */
                    541:        br      nnoaddone
                    542:        br      nnoaddone
                    543:        br      nnoaddone
                    544:        br      nnoaddone
                    545:        br      nnoaddone
                    546:        br      nnoaddone
                    547:        br      nnoaddone
                    548:        br      nnoaddone       /* mode 2: add one whenever guard or sticky is set */
                    549:        br      naddone
                    550:        br      naddone
                    551:        br      naddone
                    552:        br      nnoaddone
                    553:        br      naddone
                    554:        br      naddone
                    555:        br      naddone
                    556:        br      nnoaddone       /* mode 3: never add one */
                    557:        br      nnoaddone
                    558:        br      nnoaddone
                    559:        br      nnoaddone
                    560:        br      nnoaddone
                    561:        br      nnoaddone
                    562:        br      nnoaddone
                    563:        br      nnoaddone
                    564:
                    565: /*
                    566:  * Add one to the mantissa, and check to see if it overflows to -2**31.
                    567:  * The conversion is done in nnoaddone.
                    568:  */
                    569:
                    570: naddone:
                    571:        or      r10,r0,r0       /* clear r10 */
                    572:        set     r10,r10,1<22>   /* set LSB bit to 1 for adding */
                    573:        add.co  r8,r8,r10       /* add the 1 obtained from rounding */
                    574:        clr     r7,r7,12<20>    /* clear exponent and sign */
                    575:        add.ci  r7,r0,r7        /* add carry */
                    576:        bb1     20,r7,maxneg    /* rounded to -2**31,handle separately */
                    577:                                /* the exponent was originally 30 */
                    578: nnoaddone:                      /* assemble the magnitude, then negate it */
                    579:        extu    r6,r8,11<22>    /* extract lower bits of integer */
                    580:        mak     r10,r7,20<10>   /* shift left upper bits of integer */
                    581:        or      r6,r6,r10       /* form most of integer */
                    582:        set     r6,r6,1<30>     /* set hidden one */
                    583:        or.c    r6,r0,r6        /* one's complement of the integer */
                    584:        br.n    FPintov_return
                    585:         addu   r6,r6,1         /* delay slot: add 1 to get 2's complement */
                    586:
                    587: maxneg:                         /* carry reached bit 20 of r7: result is -2**31 */
                    588:        or      r6,r0,r0        /* clear integer */
                    589:        br.n    FPintov_return
                    590:         set    r6,r6,1<sign>   /* delay slot: set sign bit */
                    591:
                    592:        /* For valid overflows, write the correctly signed largest integer. */
                    593: overflw:                        /* out: r6 = saturated integer, r2 gets the oper flag */
                    594:        set     r2,r2,1<oper>
                    595:        bb0.n   sign,r7,FPintov_return  /* if positive then return */
                    596:         set    r6,r0,31<0>             /* delay slot: r6 = 0x7fffffff, built from r0 */
                    597:        or.c    r6,r0,r6                /* complement r6, giving largest negative */
                    598:                                        /* integer (0x80000000) */
                    599:
                    600: FPintov_return:
                    601:        ld      r1,r31,0                /* load return address from memory */
                    602:        jmp     r1
                    603:
                    604: /*
                    605:  * Some instructions only have the S2 operations, so clear S1HI and S1LO
                    606:  * for those instructions so that the previous contents of S1HI and S1LO
                    607:  * do not influence this instruction.
                    608:  */
                    609:
                    610: ASLOCAL(FPresoper)
                    611:        st      r1, r31, 0      /* save return address at 0(r31) */
                    612:        extu    r10,r9,5<11>    /* extract opcode */
                    613: #if 0
                    614:        cmp     r11,r10,FSQRTop /* compare to FSQRT */
                    615:        bb1     eq,r11,S1clear  /* clear S1 if instruction only had S2 operand */
                    616: #endif
                    617:        cmp     r11,r10,INTop   /* compare to INT */
                    618:        bb1     eq,r11,S1clear  /* clear S1 if instruction only had S2 operand */
                    619:        cmp     r11,r10,NINTop  /* compare to NINT */
                    620:        bb1     eq,r11,S1clear  /* clear S1 if instruction only had S2 operand */
                    621:        cmp     r11,r10,TRNCop  /* compare to TRNC */
                    622:        bb0     eq,r11,opercheck /* not TRNC either: keep S1 and go check */
                    623:                                /* for reserved operands; TRNC falls into S1clear */
                    624: ASLOCAL(S1clear)
                    625:        or      r5,r0,r0        /* clear any NaNs, denorms, or infinities */
                    626:        or      r6,r0,r0        /* that may be left in S1HI,S1LO from a */
                    627:                                /* previous instruction */
                    628:
                    629: /*
                    630:  * r12 contains the following flags:
                    631:  *   bit 9 -- s1sign
                    632:  *   bit 8 -- s2sign
                    633:  *   bit 7 -- s1nan
                    634:  *   bit 6 -- s2nan
                    635:  *   bit 5 -- s1inf
                    636:  *   bit 4 -- s2inf
                    637:  *   bit 3 -- s1zero
                    638:  *   bit 2 -- s2zero
                    639:  *   bit 1 -- s1denorm
                    640:  *   bit 0 -- s2denorm
                    641:  */
                    642:
                    643: /*
                    644:  * Using code for both single and double precision, check if S1 is either
                    645:  * a NaN or infinity and set the appropriate flags in r12. Then check if
                    646:  * S2 is a NaN or infinity. If it is a NaN, then branch to the NaN routine.
                    647:  */
                    648:
                    649: ASLOCAL(opercheck)
                    650:        extu    r10,r5,11<20>   /* internal representation for double */
                    651:        bb1.n   s1size,r9,S1NaNdoub /* S1 is double precision */
                    652:         or     r12,r0,r0       /* delay slot: clear operand flag register */
                    653: ASLOCAL(S1NaNsing)
                    654:        xor     r10,r10,0x0080  /* internal representation for single */
                    655:        ext     r10,r10,8<0>    /* precision is IEEE 8 bits sign extended */
                    656:                                /* to 11 bits; for real exp. > 0, the */
                    657:                                /* above instructions give a result exp. */
                    658:                                /* that has the MSB flipped and sign */
                    659:                                /* extended like in the IMPCR */
                    660:        cmp     r11,r10,127     /* Is exponent equal to IEEE 255 (here 127) */
                    661:        bb1     ne,r11,S2NaN    /* source 1 is not a NaN or infinity */
                    662:        mak     r10,r5,20<0>    /* load r10 with upper bits of S1 mantissa */
                    663:        extu    r11,r6,3<29>    /* get 3 upper bits of lower word */
                    664:        or      r11,r10,r11     /* combine any existing 1 */
                    665:        bcnd    eq0,r11,noS1NaNs /* since r11 can only hold 0 or a */
                    666:                                /* > 0 number, branch to noS1NaNs when eq0 */
                    667:        br.n    S2NaN           /* see if S2 has a NaN */
                    668:         set    r12,r12,1<s1nan> /* delay slot: indicate that S1 has a NaN */
                    669: ASLOCAL(noS1NaNs)
                    670:        br.n    S2NaN           /* check contents of S2 */
                    671:         set    r12,r0,1<s1inf> /* delay slot: indicate that S1 has an infinity */
                    672:
                    673: ASLOCAL(S1NaNdoub)
                    674:        xor     r10,r10,0x0400  /* precision is the same IEEE 11 bits */
                    675:                                /* The above instruction gives a result exp. */
                    676:                                /* that has the MSB flipped and sign */
                    677:                                /* extended like in the IMPCR */
                    678:        cmp     r11,r10,1023    /* Is exp. equal to IEEE 2047 (internal 1023) */
                    679:        bb1     ne,r11,S2NaN    /* source 1 is not a NaN or infinity */
                    680:        mak     r10,r5,20<0>    /* load r10 with upper bits of S1 mantissa */
                    681:        or      r11,r6,r10      /* combine existing 1's of mantissa */
                    682:        bcnd    eq0,r11,noS1NaNd /* since r11 can only hold 0 or a > 0 */
                    683:                                /* number, branch to noS1NaNd when eq0 */
                    684:        br.n    S2NaN           /* see if S2 has a NaN */
                    685:         set    r12,r12,1<s1nan> /* delay slot: indicate that S1 has a NaN */
                    686: ASLOCAL(noS1NaNd)
                    687:        set     r12,r0,1<s1inf> /* indicate that S1 has an infinity */
                    688:
                    689: ASLOCAL(S2NaN)
                    690:        bb1.n   s2size,r9,S2NaNdoub /* S2 is double precision */
                    691:         extu   r10,r7,11<20>   /* delay slot: internal representation for double */
                    692: ASLOCAL(S2NaNsing)
                    693:        xor     r10,r10,0x0080  /* internal representation for single */
                    694:        ext     r10,r10,8<0>    /* precision is IEEE 8 bits sign extended */
                    695:                                /* to 11 bits; for real exp. > 0, the */
                    696:                                /* above instruction gives a result exp. */
                    697:                                /* that has the MSB flipped and sign */
                    698:                                /* extended like in the IMPCR */
                    699:        cmp     r11,r10,127     /* Is exponent equal to IEEE 255 (here 127) */
                    700:        bb1     ne,r11,inf      /* source 2 is not a NaN or infinity */
                    701:        mak     r10,r7,20<0>    /* load r10 with upper bits of S2 mantissa */
                    702:        extu    r11,r8,3<29>    /* get 3 upper bits of lower word */
                    703:        or      r11,r10,r11     /* combine any existing 1's */
                    704:        bcnd    eq0,r11,noS2NaNs /* since r11 can only hold 0 or a > 0 */
                    705:                                /* number, branch to noS2NaNs when eq0 */
                    706:        br.n    _ASM_LABEL(NaN) /* branch to NaN routine */
                    707:         set    r12,r12,1<s2nan> /* delay slot: indicate that S2 has a NaN */
                    708: ASLOCAL(noS2NaNs)
                    709:        bb0     s1nan,r12, 1f   /* skip the NaN branch unless S1 is a NaN */
                    710:        br      _ASM_LABEL(NaN)
                    711: 1:
                    712:        br.n    _ASM_LABEL(infinity) /* If S1 had a NaN we would have */
                    713:                                /* already branched, and S2 does not have a */
                    714:                                /* NaN, but it does have an infinity, so */
                    715:                                /* branch to handle the infinity */
                    716:         set    r12,r12,1<s2inf> /* delay slot: indicate that S2 has an infinity */
                    717:
                    718: ASLOCAL(S2NaNdoub)
                    719:        xor     r10,r10,0x0400  /* precision is the same IEEE 11 bits */
                    720:                                /* The above instruction gives a result exp. */
                    721:                                /* that has the MSB flipped and sign */
                    722:                                /* extended like in the IMPCR */
                    723:        cmp     r11,r10,1023    /* Is exp. equal to IEEE 2047 (internal 1023) */
                    724:        bb1     ne,r11,inf      /* source 2 is not a NaN or infinity */
                    725:        mak     r10,r7,20<0>    /* load r10 with upper bits of S2 mantissa */
                    726:        or      r11,r8,r10      /* combine existing 1's of mantissa */
                    727:        bcnd    eq0,r11,noS2NaNd /* since r11 can only hold 0 or a > 0 */
                    728:                                /* number, branch to noS2NaNd when eq0 */
                    729:        br.n    _ASM_LABEL(NaN) /* branch to NaN routine */
                    730:         set    r12,r12,1<s2nan> /* delay slot: indicate that S2 has a NaN */
                    731: ASLOCAL(noS2NaNd)
                    732:        bb0     s1nan,r12,1f    /* skip the NaN branch unless S1 is a NaN */
                    733:        br      _ASM_LABEL(NaN)
                    734: 1:
                    735:        br.n    _ASM_LABEL(infinity) /* If S1 had a NaN we would have */
                    736:                                /* already branched, and S2 does not have a */
                    737:                                /* NaN, but it does have an infinity, so */
                    738:                                /* branch to handle the infinity */
                    739:         set    r12,r12,1<s2inf> /* delay slot: indicate that S2 has an infinity */
                    740:
                    741: /*
                    742:  * If S2 was a NaN, the routine would have already branched to NaN. If S1
                    743:  * is a NaN, then branch to NaN. If S1 is not a NaN and S2 is infinity, then
                    744:  * we would have already branched to infinity. If S1 is infinity, then branch.
                    745:  * If the routine still has not branched, then branch to denorm, the only
                    746:  * reserved operand left.
                    747:  */
                    748:
                    749: ASLOCAL(inf)                    /* S2 is neither NaN nor infinity; dispatch on the S1 flags in r12 */
                    750:        bb0     s1nan,r12,1f    /* skip the NaN branch unless S1 has a NaN */
                    751:        br      _ASM_LABEL(NaN)
                    752: 1:
                    753:        bb0     s1inf,r12,2f    /* Neither S1 or S2 has a NaN, and we would */
                    754:                                /* have branched already if S2 had an */
                    755:                                /* infinity, so go to infinity only if S1 is one */
                    756:        br      _ASM_LABEL(infinity)
                    757: 2:
                    758:        br      _ASM_LABEL(denorm)      /* branch to denorm, the only */
                    759:                                        /* remaining alternative */
                    760:
                    761: /*
                    762:  * Branch to the routine to make a denormalized number.
                    763:  */
                    764: ASLOCAL(FPunderflow)            /* falls through into FPU_denorm below */
                    765:        st      r1,r31,0        /* save return address */
                    766:        set     r2,r2,1<underflow>      /* record underflow in r2 */
                    767:        set     r2,r2,1<inexact>        /* and inexact as well */
                    768:
                    769: /*
                    770:  * Now the floating point number, which has an exponent smaller than what
                    771:  * IEEE allows, must be denormalized. Denormalization is done by calculating
                    772:  * the difference between a denormalized exponent and an underflow exponent
                    773:  * and shifting the mantissa by that amount. A one may need to be subtracted
                    774:  * from the LSB if a one was added during rounding.
                    775:  * r9 is used to contain the guard, round, sticky, and an inaccuracy bit in
                    776:  * case some bits were shifted off the mantissa during denormalization.
                    777:  * r9 will contain:
                    778:  *   bit 4 -- new addone if one added during rounding after denormalization
                    779:  *   bit 3 -- inaccuracy flag caused by denormalization or pre-denormalization
                    780:  *            inexactness
                    781:  *   bit 2 -- guard bit of result
                    782:  *   bit 1 -- round bit of result
                    783:  *   bit 0 -- sticky bit of result
                    784:  */
                    785:
                    786: FPU_denorm:
                    787:        bb1.n   destsize,r12,Udouble    /* denorm for double */
                    788:         extu   r9,r10,3<26>    /* delay slot: load r9 with grs (bits 2..0) */
                    789: Usingle:
                    790:        mak     r5,r10,21<3>    /* extract high 21 bits of mantissa */
                    791:        extu    r6,r11,3<29>    /* extract low 3 bits of mantissa */
                    792:        or      r11,r5,r6       /* form 24 bits of mantissa */
                    793:
                    794: /* See if the addone bit is set and unround if it is. */
                    795:        bb0.n   25,r10,nounrounds /* do not unround if addone bit clear */
                    796:         extu   r6,r12,12<20>   /* delay slot: extract signed exponent from IMPCR */
                    797: unrounds:
                    798:        subu    r11,r11,1       /* subtract 1 from mantissa */
                    799:
                    800: /*
                    801:  * If the hidden bit is cleared after subtracting the one, then the one added
                    802:  * during the rounding must have propagated through the mantissa. The exponent
                    803:  * will need to be decremented.
                    804:  */
                    805:        bb1     23,r11,nounrounds /* if hidden bit is set,then exponent */
                    806:                                /* does not need to be decremented */
                    807: decexps:
                    808:        sub     r6,r6,1         /* decrement exponent 1 */
                    809:        set     r11,r11,1<23>   /* set the hidden bit */
                    810:
                    811: /*
                    812:  * For both single and double precision, there are cases where it is easier
                    813:  * and quicker to make a special case. Examples of this are if the shift
                    814:  * amount is only 1 or 2, or all the mantissa is shifted off, or all the
                    815:  * mantissa is shifted off and it is still shifting, or, in the case of
                    816:  * doubles, if the shift amount is around the boundary of MANTLO and MANTHI.
                    817:  */
                    818:
                    819: nounrounds:
                    820:        or      r8,r0,lo16(0x00000f81)  /* load r8 with -127 in decimal */
                    821:                                        /* for lowest 12 bits */
                    822:        sub     r7,r8,r6        /* find difference between two exponents, */
                    823:                                /* this amount is the shift amount */
                    824:        cmp     r6,r7,3         /* check to see if r7 contains 3 or more */
                    825:        bb1     ge,r6,threesing /* br to code that handles shifts of >=3 */
                    826:        cmp     r6,r7,2         /* check to see if r7 contains 2 */
                    827:        bb1     eq,r6,twosing   /* br to code that handles shifts of 2 */
                    828: one:
                    829:        rot     r9,r9,0<1>      /* rotate roundoff register once, this places */
                    830:                                /* guard in round and round in sticky; the */
                    831:        bb0     31,r9,nosticky1s /* old sticky is now bit 31: if it is 0 do */
                    832:                                /* not or it in, bit 31 is cleared later */
                    833:        set     r9,r9,1<0>      /* or round and sticky */
                    834: nosticky1s:
                    835:        bb0     0,r11,guardclr1s /* do not set guard bit if LSB = 0 */
                    836:        set     r9,r9,1<2>      /* set guard bit */
                    837: guardclr1s:
                    838:        extu    r11,r11,31<1>   /* shift mantissa right 1 */
                    839:        br.n    round           /* round result */
                    840:         mak    r9,r9,3<0>      /* delay slot: clear bits lost during rotation */
                    841:
                    842: twosing:
                    843:        rot     r9,r9,0<2>      /* rotate roundoff register twice, this places */
                    844:                                /* guard in sticky */
                    845:        bb0     30,r9,nosticky2s /* do not or guard and sticky if sticky is 0 */
                    846:                                /* this lost bit will be cleared later */
                    847:        br.n    noround2s       /* skip or old guard and old round if old */
                    848:                                /* sticky set */
                    849:         set    r9,r9,1<0>      /* delay slot: or guard and sticky */
                    850: nosticky2s:
                    851:        bb0     31,r9,noround2s /* do not or guard and round if round is 0 */
                    852:                                /* this lost bit will be cleared later */
                    853:        set     r9,r9,1<0>      /* or guard and round */
                    854: noround2s:
                    855:        bb0     0,r11,roundclr2s /* do not set round bit if LSB = 0 */
                    856:        set     r9,r9,1<1>      /* set round bit */
                    857: roundclr2s:
                    858:        bb0     1,r11,guardclr2s /* do not set guard bit if LSB + 1 = 0 */
                    859:        set     r9,r9,1<2>      /* set guard bit */
                    860: guardclr2s:
                    861:        extu    r11,r11,30<2>   /* shift mantissa right 2 */
                    862:        br.n    round           /* round result */
                    863:         mak    r9,r9,3<0>      /* delay slot: clear bits lost during rotation */
                    864:
                    865: threesing:                      /* shift >= 3: old g, r and s all collapse into sticky */
                    866:        bb1     0,r9,foldgrs3s  /* old sticky set: old guard/round must still go */
                    867:                                /* (setting sticky again below is harmless) */
                    868: nosticky3s:
                    869:        bb1     1,r9,foldgrs3s  /* old round set: fold it into sticky */
                    870:                                /* and drop the old guard as well */
                    871: noround3s:
                    872:        bb0     2,r9,noguard3s  /* old guard clear too: bits 2..0 of r9 are */
                    873:                                /* already 0, nothing to fold or clear */
                    874: foldgrs3s:
                    875:        set     r9,r9,1<0>      /* sticky = old guard | old round | old sticky */
                    876:        clr     r9,r9,2<1>      /* old guard/round must not reach the round section */
                    877: noguard3s:
                    878:        cmp     r6,r7,23        /* check if # of shifts is <=23 */
                    879:        bb1     gt,r6,s24       /* branch to see if shifts = 24 */
                    880:        sub     r6,r7,2         /* get number of bits to check for sticky */
                    881:        mak     r6,r6,5<5>      /* shift width into width field */
                    882:        mak     r8,r11,r6       /* keep only the low (shift - 2) mantissa bits */
                    883:        ff1     r8,r8           /* see if r8 has any ones */
                    884:        bb1     5,r8,nostky23   /* do not set sticky if no ones found */
                    885:        set     r9,r9,1<0>      /* set sticky bit */
                    886: nostky23:
                    887:        or      r8,r0,34        /* start code to get new mantissa plus two */
                    888:                                /* extra bits for new round and new guard */
                    889:                                /* bits */
                    890:        subu    r8,r8,r7
                    891:        mak     r8,r8,5<5>      /* shift field width into second five bits */
                    892:        extu    r6,r6,5<5>      /* shift previous shifted -2 into offset field */
                    893:        or      r6,r6,r8        /* complete field */
                    894:        extu    r11,r11,r6      /* form new mantissa with two extra bits */
                    895:
                    896:        bb0     0,r11,nornd3s   /* do not set new round bit */
                    897:        set     r9,r9,1<1>      /* set new round bit */
                    898: nornd3s:
                    899:        bb0     1,r11,nogrd3s   /* do not set new guard bit */
                    900:        set     r9,r9,1<2>      /* set new guard bit */
                    901: nogrd3s:
                    902:        br.n    round           /* round mantissa */
                    903:         extu   r11,r11,30<2>   /* delay slot: shift off remaining two bits */
                    904:
                    905: s24:
                    906:        cmp     r6,r7,24        /* check to see if # of shifts is 24 */
                    907:        bb1     gt,r6,s25       /* branch to see if shifts = 25 */
                    908:        bb1     0,r9,nostky24   /* skip checking if old sticky set */
                    909:        extu    r8,r11,22<0>    /* prepare to check bits that will be shifted */
                    910:                                /* into the sticky */
                    911:        ff1     r8,r8           /* see if there are any 1''s */
                    912:        bb1     5,r8,nostky24   /* do not set sticky if no ones found */
                    913:        set     r9,r9,1<0>      /* set sticky bit */
                    914: nostky24:
                    915:        bb0     22,r11,nornd24  /* do not set new round bit */
                    916:        set     r9,r9,1<1>      /* set new round bit */
                    917: nornd24:
                    918:        set     r9,r9,1<2>      /* set new guard bit,this is hidden bit */
                    919:        br.n    round           /* round mantissa */
                    920:         or     r11,r0,r0       /* clear r11, all of mantissa shifted off */
                    921:
                    922: s25:
                         /* Denormalizing shift of exactly 25 (count in r7); larger counts go to s26. */
                         /* r11 is the mantissa being shifted away and r9 carries guard, round and */
                         /* sticky in bits 2, 1 and 0.  Presumably the single precision path (the */
                         /* hidden bit sits just above the 23 bits tested here). */
                    923:        cmp     r6,r7,25        /* check to see if # of shifts is 25 */
                    924:        bb1     gt,r6,s26       /* branch to execute for shifts >= 26 */
                    925:        bb1     0,r9,nostky25   /* skip checking if old sticky set */
                    926:        extu    r8,r11,23<0>    /* prepare to check bits that will be shifted */
                    927:                                /* into the sticky (low 23 bits of r11) */
                    928:        ff1     r8,r8           /* see if there are any 1's */
                    929:        bb1     5,r8,nostky25   /* do not set sticky if no ones found */
                    930:        set     r9,r9,1<0>      /* set sticky bit */
                    931: nostky25:
                    932:        set     r9,r9,1<1>      /* set new round bit, this is the hidden bit */
                    933:        clr     r9,r9,1<2>      /* clear guard bit since nothing shifted in */
                    934:        br.n    round           /* round and assemble result */
                    935:         or     r11,r0,r0       /* (delay slot) clear r11, all of mantissa shifted off */
                    936:
                    937: s26:
                         /* Shift of 26 or more: every mantissa bit, hidden bit included, ends up */
                         /* below the round position, so the result is "sticky only". */
                                clr     r9,r9,2<1>      /* nothing lands in guard or round */
                                or      r11,r0,r0       /* the whole mantissa is shifted off */
                                br.n    round           /* round and assemble result */
                                 set    r9,r9,1<0>      /* (delay slot) sticky holds the hidden bit */
                    943:
                    944: Udouble:
                         /* Double precision entry: rebuild the two-word mantissa (high part in r5, */
                         /* low word in r11), undo the hardware's rounding increment if the addone */
                         /* bit is set, then work out the denormalizing shift count in r7 and */
                         /* dispatch on it (1 -> onedoub, 2 -> twodoub, >= 3 -> threedoub). */
                    945:        mak     r5,r10,21<0>    /* extract upper bits of mantissa (low 21 bits of r10) */
                    946:        bb0.n   25,r10,nounroundd /* do not unround if addone bit clear */
                    947:         extu   r6,r12,12<20>   /* (delay slot) extract signed exponent from IMPCR */
                    948: unroundd:
                    949:        or      r8,r0,1         /* constant 1 for the borrow-producing subtract */
                    950:        subu.co r11,r11,r8      /* subtract 1 from mantissa */
                    951:        subu.ci r5,r5,r0        /* subtract borrow from upper word */
                    952:        bb1     20,r5,nounroundd /* if hidden bit is set, then exponent does */
                    953:                                /* not need to be decremented */
                    954: decexpd:
                    955:        sub     r6,r6,1         /* decrement exponent by 1 */
                    956:        set     r5,r5,1<20>     /* set the hidden bit */
                    957:
                    958: nounroundd:
                    959:        or      r8,r0,lo16(0x00000c01) /* load r8 with -1023 in decimal */
                    960:                                /* for lowest 12 bits */
                    961:        sub     r7,r8,r6        /* find difference between two exponents, */
                    962:                                /* this amount is the shift amount */
                    963:        cmp     r6,r7,3         /* check to see if r7 contains 3 or more */
                    964:        bb1     ge,r6,threedoub /* br to code that handles shifts of >=3 */
                    965:        cmp     r6,r7,2         /* check to see if r7 contains 2 */
                    966:        bb1     eq,r6,twodoub   /* br to code that handles shifts of 2 */
                                /* otherwise fall through to onedoub */
                    967:
                    968: onedoub:
                         /* Shift the double mantissa (r5:r11) right by one.  r9 holds guard, round */
                         /* and sticky in bits 2, 1, 0; after the rotate the old sticky sits in */
                         /* bit 31 and is folded back into the new sticky by hand. */
                    969:        rot     r9,r9,0<1>      /* rotate roundoff register once, this places */
                    970:                                /* guard in round and round in sticky */
                    971:        bb0     31,r9,nosticky1d /* old sticky (now bit 31) clear: nothing to or in, */
                    972:                                /* this lost bit will be cleared later */
                    973:        set     r9,r9,1<0>      /* or old round and old sticky into new sticky */
                    974: nosticky1d:
                    975:        bb0     0,r11,guardclr1d /* do not set new guard bit if old LSB = 0 */
                    976:        set     r9,r9,1<2>      /* set new guard bit */
                    977: guardclr1d:
                    978:        extu    r11,r11,31<1>   /* shift lower mantissa over 1 */
                    979:        mak     r6,r5,1<31>     /* move low bit of high mantissa to bit 31 */
                    980:        or      r11,r6,r11      /* load high bit onto lower mantissa */
                    981:        extu    r5,r5,20<1>     /* shift right once upper 20 bits of mantissa */
                    982:        br.n    round           /* round mantissa and assemble result */
                    983:         mak    r9,r9,3<0>      /* (delay slot) keep only bits 2..0, dropping */
                                                        /* what the rotation left in the top of r9 */
                    984:
                    985: twodoub:
                         /* Shift the double mantissa (r5:r11) right by two.  After rotating r9 by */
                         /* two, old guard is in bit 0 (the new sticky position), old round is in */
                         /* bit 31 and old sticky is in bit 30; the new sticky is the OR of all three. */
                    986:        rot     r9,r9,0<2>      /* rotate roundoff register twice, this places */
                    987:                                /* old guard into sticky */
                    988:        bb0     30,r9,nosticky2d /* old sticky (now bit 30) clear: go check */
                    989:                                /* old round instead */
                    990:        br.n    noround2d       /* old sticky was set, no need to look at */
                    991:                                /* old round */
                    992:         set    r9,r9,1<0>      /* (delay slot) or old sticky into new sticky */
                    993: nosticky2d:
                    994:        bb0     31,r9,noround2d /* old round (now bit 31) clear: new sticky is */
                    995:                                /* just the old guard */
                    996:        set     r9,r9,1<0>      /* or old round into new sticky */
                    997: noround2d:
                    998:        bb0     0,r11,roundclr2d /* do not set round bit if old LSB = 0 */
                    999:        set     r9,r9,1<1>      /* set new round bit */
                   1000: roundclr2d:
                   1001:        bb0     1,r11,guardclr2d /* do not set guard bit if old bit 1 = 0 */
                   1002:        set     r9,r9,1<2>      /* set new guard bit */
                   1003: guardclr2d:
                   1004:        extu    r11,r11,30<2>   /* shift lower mantissa over 2 */
                   1005:        mak     r6,r5,2<30>     /* move low two bits of high mantissa to bits 31..30 */
                   1006:        or      r11,r6,r11      /* load high bits onto lower mantissa */
                   1007:        extu    r5,r5,19<2>     /* shift right twice upper 19 bits of mantissa */
                   1008:        br.n    round           /* round mantissa and assemble result */
                   1009:         mak    r9,r9,3<0>      /* (delay slot) keep only bits 2..0, dropping */
                                                        /* what the rotation left in the top of r9 */
                   1010:
                   1011: threedoub:
                         /* Shift of three or more: every old guard/round/sticky bit (r9 bits 2..0) */
                         /* ends up below the new round position, so all three collapse into the */
                         /* new sticky bit. */
                         /* */
                         /* The old guard and round must ALWAYS be cleared here: the code from */
                         /* noguard3d onward (and d33..d53) only ever sets the new guard/round bits, */
                         /* it never clears them.  Previously they were cleared only when old guard */
                         /* was set with round and sticky clear, so a stale guard/round bit could */
                         /* leak into the rounding decision whenever old round or old sticky was set. */
                         /* */
                         /* r6 is free as scratch: it holds a dead compare result and noguard3d */
                         /* reloads it immediately. */
                   1014: nosticky3d:            /* labels kept so any existing reference still resolves */
                   1019: noround3d:
                                mask    r6,r9,0x7       /* r6 = old guard, round and sticky */
                                bcnd.n  eq0,r6,noguard3d /* nothing lost so far, sticky stays clear */
                                 clr    r9,r9,2<1>      /* (delay slot, always executed) drop old */
                                                        /* guard and round before the new ones are formed */
                                set     r9,r9,1<0>      /* some old bit was set: fold it into sticky */
                   1024: noguard3d:
                         /* Shifts of 3..32 of the double mantissa (r5 = high, r11 = low, count in */
                         /* r7); larger counts go to d33.  The bit fields for mak/extu are built at */
                         /* run time: width in bits 9..5, offset in bits 4..0 of the field register. */
                         /* NOTE(review): new round and guard are only ever set below, never */
                         /* cleared, so this relies on r9 bits 1 and 2 being clear on entry. */
                   1025:        cmp     r6,r7,32        /* do I need to work with a 1 or 2 word mant. */
                   1026:                                /* when forming sticky, round and guard */
                   1027:        bb1     gt,r6,d33       /* jump to code that handles 2 word mantissas */
                   1028:        sub     r6,r7,2         /* get number of bits to check for sticky */
                   1029:        mak     r6,r6,5<5>      /* shift width into width field */
                   1030:        mak     r8,r11,r6       /* keep the low (shift - 2) bits of r11 */
                   1031:        ff1     r8,r8           /* see if r8 has any ones */
                   1032:        bb1     5,r8,nostky32   /* do not set sticky if no ones found */
                   1033:        set     r9,r9,1<0>      /* set sticky bit */
                   1034: nostky32:
                   1035:        or      r8,r0,34        /* start code to get new mantissa plus two */
                   1036:                                /* extra bits for new round and new guard bits, */
                   1037:                                /* the upper word bits will be shifted after */
                   1038:                                /* the round and guard bits are handled */
                   1039:        subu    r8,r8,r7        /* r8 = 34 - shift = bits to keep, plus two */
                   1040:        mak     r8,r8,5<5>      /* shift field width into second five bits */
                   1041:        extu    r6,r6,5<5>      /* move (shift - 2) back down into offset field */
                   1042:        or      r6,r6,r8        /* complete bit field */
                   1043:        extu    r11,r11,r6      /* partially form new low mantissa with 2 more */
                   1044:                                /* bits */
                   1045:        bb0     0,r11,nornd32d  /* do not set new round bit */
                   1046:        set     r9,r9,1<1>      /* set new round bit */
                   1047: nornd32d:
                   1048:        bb0     1,r11,nogrd32d  /* do not set new guard bit */
                   1049:        set     r9,r9,1<2>      /* set new guard bit */
                   1050: nogrd32d:
                   1051:        extu    r11,r11,30<2>   /* shift off remaining two bits */
                   1052:        mak     r6,r7,5<5>      /* shift field width into second 5 bits, if the */
                   1053:                                /* width is 32, then these bits will be 0 */
                   1054:        or      r8,r0,32        /* load word length into r8 */
                   1055:        sub     r8,r8,r7        /* form offset for high bits moved to low word */
                   1056:        or      r6,r6,r8        /* form complete bit field */
                   1057:        mak     r6,r5,r6        /* get shifted bits of high word */
                   1058:        or      r11,r6,r11      /* form new low word of mantissa */
                   1059:        bcnd    ne0,r8,regular33 /* do not adjust for special case of r8 */
                   1060:        br.n    round           /* containing zeros, which would cause */
                   1061:         or     r5,r0,r0        /* all of the bits to be extracted under */
                   1062:                                /* the regular method */
                   1063: regular33:
                   1064:        mak     r6,r7,5<0>      /* place lower 5 bits of shift into r6 */
                   1065:        mak     r8,r8,5<5>      /* shift r8 into width field */
                   1066:        or      r6,r6,r8        /* form field for shifting of upper bits */
                   1067:        br.n    round           /* round and assemble result */
                   1068:         extu   r5,r5,r6        /* (delay slot) form new high word mantissa */
                   1069:
                   1070: d33:
                         /* Shift of exactly 33 of the double mantissa (r5 = high, r11 = low, count */
                         /* in r7); larger counts go to d34.  Bits 30..0 of r11 feed sticky, bit 31 */
                         /* of r11 becomes round, bit 0 of r5 becomes guard, and the remaining 31 */
                         /* bits of r5 become the new low word. */
                   1071:        cmp     r6,r7,33        /* is the number of bits to be shifted 33? */
                   1072:        bb1     gt,r6,d34       /* check to see if # of bits is 34 */
                   1073:        bb1     0,r9,nostky33   /* skip checking if old sticky set */
                   1074:        mak     r6,r11,31<0>    /* check bits that will be shifted into sticky */
                                ff1     r8,r6           /* check for ones in the bits just isolated; */
                                                        /* this used to scan the stale r8, which made */
                                                        /* the sticky test independent of the mantissa */
                   1076:        bb1     5,r8,nostky33   /* do not set sticky if there are no ones */
                   1077:        set     r9,r9,1<0>      /* set new sticky bit */
                   1078: nostky33:
                   1079:        bb0     31,r11,nornd33  /* do not set round if bit is not a 1 */
                   1080:        set     r9,r9,1<1>      /* set new round bit */
                   1081: nornd33:
                   1082:        bb0     0,r5,nogrd33    /* do not set guard bit if bit is not a 1 */
                   1083:        set     r9,r9,1<2>      /* set new guard bit */
                   1084: nogrd33:
                   1085:        extu    r11,r5,31<1>    /* shift high bits into low word */
                   1086:        br.n    round           /* round and assemble result */
                   1087:         or     r5,r0,r0        /* (delay slot) clear high word */
                   1088:
                   1089: d34:
                         /* Shift of exactly 34 (count in r7); larger counts go to d35.  The whole */
                         /* low word r11 feeds sticky, bits 0 and 1 of r5 become round and guard, */
                         /* and the remaining 30 bits of r5 become the new low word. */
                   1090:        cmp     r6,r7,34        /* is the number of bits to be shifted 34? */
                   1091:        bb1     gt,r6,d35       /* check to see if # of bits is >= 35 */
                   1092:        bb1     0,r9,nostky34   /* skip checking if old sticky set */
                   1093:        ff1     r8,r11          /* check bits that will be shifted into sticky */
                   1094:        bb1     5,r8,nostky34   /* do not set sticky if there are no ones */
                   1095:        set     r9,r9,1<0>      /* set new sticky bit */
                   1096: nostky34:
                   1097:        bb0     0,r5,nornd34    /* do not set round if bit is not a 1 */
                   1098:        set     r9,r9,1<1>      /* set new round bit */
                   1099: nornd34:
                   1100:        bb0     1,r5,nogrd34    /* do not set guard bit if bit is not a 1 */
                   1101:        set     r9,r9,1<2>      /* set new guard bit */
                   1102: nogrd34:
                   1103:        extu    r11,r5,30<2>    /* shift high bits into low word */
                   1104:        br.n    round           /* round and assemble result */
                   1105:         or     r5,r0,r0        /* (delay slot) clear high word */
                   1106:
                   1107: d35:
                         /* Shifts of 35..52 (count in r7); larger counts go to d53.  The low word */
                         /* r11 is shifted off entirely, so the work is done on the high word r5 */
                         /* with the count reduced by 34 (32 for the low word, 2 for the new round */
                         /* and guard bits). */
                   1108:        cmp     r6,r7,52        /* see if # of shifts is 35 <= X <= 52 */
                   1109:        bb1     gt,r6,d53       /* shifts of 53 or more are handled at d53 */
                   1110:        bb1.n   0,r9,nostky35   /* skip checking if old sticky set */
                   1111:         sub    r7,r7,34        /* (delay slot, runs on both paths) subtract 32 */
                   1112:                                /* from # of shifts so that operations can be */
                   1113:                                /* done on the upper word, and then subtract two */
                   1114:                                /* more for the new round and guard bits */
                   1115:        ff1     r8,r11          /* see if lower word has a bit for sticky */
                   1116:        bb1     5,r8,stkycheck35 /* see if upper word has any sticky bits       */
                   1117:        br.n    nostky35        /* quit checking for sticky */
                   1118:         set    r9,r9,1<0>      /* (delay slot) set sticky bit */
                   1119: stkycheck35:
                   1120:        mak     r6,r7,5<5>      /* place width into width field */
                   1121:        mak     r8,r5,r6        /* keep the low (shift - 34) bits of r5 */
                   1122:        ff1     r8,r8           /* see if r8 has any ones */
                   1123:        bb1     5,r8,nostky35   /* do not set sticky if no ones found */
                   1124:        set     r9,r9,1<0>      /* set sticky bit */
                   1125: nostky35:
                   1126:        or      r8,r0,32        /* look at what does not get shifted off plus */
                   1127:                                /* guard and round, remember that the r7 value */
                   1128:                                /* was adjusted so that it did not include */
                   1129:                                /* new guard or new round in shifted off bits */
                   1130:        subu    r8,r8,r7        /* complement width */
                   1131:        mak     r8,r8,5<5>      /* shift width into width field */
                   1132:        or      r8,r7,r8        /* add offset field */
                   1133:        extu    r11,r5,r8       /* extract upper bits into low word */
                   1134:        bb0     0,r11,nornd35   /* do not set new round bit */
                   1135:        set     r9,r9,1<1>      /* set new round bit */
                   1136: nornd35:
                   1137:        bb0     1,r11,nogrd35   /* do not set new guard bit */
                   1138:        set     r9,r9,1<2>      /* set new guard bit */
                   1139: nogrd35:
                   1140:        extu    r11,r11,30<2>   /* shift off remaining guard and round bits */
                   1141:        br.n    round           /* round and assemble result */
                   1142:         or     r5,r0,r0        /* (delay slot) clear high word */
                   1143:
                   1144: d53:
                         /* Shift of exactly 53 (count in r7); larger counts go to d54.  Nothing of */
                         /* the mantissa survives: r11 and bits 18..0 of r5 feed sticky, bit 19 of */
                         /* r5 becomes round and the hidden bit becomes guard. */
                   1145:        cmp     r6,r7,53        /* check to see if # of shifts is 53 */
                   1146:        bb1     gt,r6,d54       /* branch to see if shifts = 54 */
                   1147:        bb1     0,r9,nostky53   /* skip checking if old sticky set */
                   1148:        ff1     r8,r11          /* see if lower word has a bit for sticky */
                   1149:        bb1     5,r8,stkycheck53 /* see if upper word has any sticky bits       */
                   1150:        br.n    nostky53        /* quit checking for sticky */
                   1151:         set    r9,r9,1<0>      /* (delay slot) set sticky bit */
                   1152: stkycheck53:
                   1153:        mak     r6,r5,19<0>     /* check bits that are shifted into sticky */
                   1154:        ff1     r8,r6           /* see if r6 has any ones */
                   1155:        bb1     5,r8,nostky53   /* do not set sticky if no ones found */
                   1156:        set     r9,r9,1<0>      /* set sticky bit */
                   1157: nostky53:
                   1158:        bb0     19,r5,nornd53   /* do not set new round bit */
                   1159:        set     r9,r9,1<1>      /* set new round bit */
                   1160: nornd53:
                   1161:        set     r9,r9,1<2>      /* set new guard bit, this is the hidden bit */
                   1162:        or      r5,r0,r0        /* clear high word */
                   1163:        br.n    round           /* round and assemble result */
                   1164:         or     r11,r0,r0       /* (delay slot) clear low word */
                   1165:
                   1166: d54:
                         /* Shift of exactly 54 (count in r7); larger counts go to d55.  r11 and */
                         /* bits 19..0 of r5 feed sticky, the hidden bit becomes round and guard */
                         /* is clear. */
                   1167:        cmp     r6,r7,54        /* check to see if # of shifts is 54 */
                   1168:        bb1     gt,r6,d55       /* branch to execute for shifts >= 55 */
                   1169:        bb1     0,r9,nostky54   /* skip checking if old sticky set */
                   1170:        ff1     r8,r11          /* see if lower word has a bit for sticky */
                   1171:        bb1     5,r8,stkycheck54 /* see if upper word has any sticky bits       */
                   1172:        br.n    nostky54        /* quit checking for sticky */
                   1173:         set    r9,r9,1<0>      /* (delay slot) set sticky bit */
                   1174: stkycheck54:
                   1175:        mak     r6,r5,20<0>     /* check bits that are shifted into sticky */
                   1176:        ff1     r8,r6           /* see if r6 has any ones */
                   1177:        bb1     5,r8,nostky54   /* do not set sticky if no ones found */
                   1178:        set     r9,r9,1<0>      /* set sticky bit */
                   1179: nostky54:
                   1180:        set     r9,r9,1<1>      /* set new round bit, this is the hidden bit */
                   1181:        clr     r9,r9,1<2>      /* clear guard bit since nothing shifted in */
                   1182:        or      r5,r0,r0        /* clear high word */
                   1183:        br.n    round           /* round and assemble result */
                   1184:         or     r11,r0,r0       /* (delay slot) clear low word */
                   1185:
                   1186: d55:
                         /* Shift of 55 or more: the whole double mantissa, hidden bit included, */
                         /* lands below the round position.  Falls through into round. */
                                or      r11,r0,r0       /* low word is gone */
                                or      r5,r0,r0        /* high word is gone */
                                clr     r9,r9,2<1>      /* nothing lands in guard or round */
                                set     r9,r9,1<0>      /* sticky holds the hidden bit */
                   1192:
                   1193:
                   1194: /* The first thing the rounding code does is check whether guard, round, */
                   1195: /* or sticky is set. If all are clear, then there is no denormalization loss */
                   1196: /* and no need to round, so it branches straight to assemble the answer. */
                   1197: /* For rounding, a branch table is set up. The two leftmost index bits are the */
                   1198: /* rounding mode. The third bit is either the LSB of the mantissa or the */
                   1199: /* sign bit, depending on the rounding mode. The three LSBs are the guard, */
                   1200: /* round and sticky bits. */
                   1201:
                   1202: round:
                         /* Build a 6-bit index into roundtable and jump through it: */
                         /*   bits 5..4  rounding mode (2-bit field at modelo in r10) */
                         /*   bit  3     mantissa LSB (r11 bit 0), or the sign (r10 bit 31) when the */
                         /*              modehi bit of r10 is set */
                         /*   bits 2..0  guard, round, sticky from r9 */
                         /* r1 is used as scratch for the table address; the return address is */
                         /* reloaded from the stack at Ureturn. */
                   1203:        ff1     r8,r9           /* see if there is denormalization loss */
                   1204:        bb1     5,r8,assemble   /* no denormalization loss or inexactness */
                   1205:        extu    r6,r10,2<modelo> /* extract rounding mode */
                   1206:        bb1.n   modehi,r10,signext /* use sign bit instead of LSB */
                   1207:         mak    r6,r6,2<4>      /* (delay slot) shift over rounding mode */
                   1208:        extu    r7,r11,1<0>     /* extract LSB */
                   1209:        br.n    grs             /* skip sign extraction */
                   1210:         mak    r7,r7,1<3>      /* (delay slot) shift over LSB */
                   1211: signext:
                   1212:        extu    r7,r10,1<31>    /* extract sign bit */
                   1213:        mak     r7,r7,1<3>      /* shift sign bit over */
                   1214: grs:
                   1215:        or      r6,r6,r7        /* combine mode with LSB/sign */
                   1216:        or      r6,r6,r9        /* or in guard, round, and sticky */
                   1217:        or.u    r1,r0,hi16(roundtable) /* form address of branch table */
                   1218:        or      r1,r1,lo16(roundtable)
                   1219:        lda     r6,r1[r6]       /* scale offset into branch table */
                   1220:        jmp.n   r6              /* jump to branch table */
                   1221:         set    r9,r9,1<3>      /* (delay slot) set inexact flag in r9 */
                   1222:
                   1223: roundtable:
                         /* 64 one-instruction entries indexed by (mode << 4) | (LSB or sign) << 3 | */
                         /* guard/round/sticky, as built at round.  The mode names below follow the */
                         /* decoding in FPoverflow and assume modehi is the upper bit of the 2-bit */
                         /* field extracted at modelo. */
                         /* mode 00 (nearest), LSB = 0: add only when above the halfway point */
                   1224:        br      noaddone
                   1225:        br      noaddone
                   1226:        br      noaddone
                   1227:        br      noaddone
                   1228:        br      noaddone
                   1229:        br      addone
                   1230:        br      addone
                   1231:        br      addone
                         /* mode 00 (nearest), LSB = 1: add at or above the halfway point */
                   1232:        br      noaddone
                   1233:        br      noaddone
                   1234:        br      noaddone
                   1235:        br      noaddone
                   1236:        br      addone
                   1237:        br      addone
                   1238:        br      addone
                   1239:        br      addone
                         /* mode 01 (toward zero), LSB = 0: never add */
                   1240:        br      noaddone
                   1241:        br      noaddone
                   1242:        br      noaddone
                   1243:        br      noaddone
                   1244:        br      noaddone
                   1245:        br      noaddone
                   1246:        br      noaddone
                   1247:        br      noaddone
                         /* mode 01 (toward zero), LSB = 1: never add */
                   1248:        br      noaddone
                   1249:        br      noaddone
                   1250:        br      noaddone
                   1251:        br      noaddone
                   1252:        br      noaddone
                   1253:        br      noaddone
                   1254:        br      noaddone
                   1255:        br      noaddone
                         /* mode 10 (toward negative), sign = 0: never add */
                   1256:        br      noaddone
                   1257:        br      noaddone
                   1258:        br      noaddone
                   1259:        br      noaddone
                   1260:        br      noaddone
                   1261:        br      noaddone
                   1262:        br      noaddone
                   1263:        br      noaddone
                         /* mode 10 (toward negative), sign = 1: add whenever any of g/r/s is set */
                   1264:        br      noaddone
                   1265:        br      addone
                   1266:        br      addone
                   1267:        br      addone
                   1268:        br      addone
                   1269:        br      addone
                   1270:        br      addone
                   1271:        br      addone
                         /* mode 11 (toward positive), sign = 0: add whenever any of g/r/s is set */
                   1272:        br      noaddone
                   1273:        br      addone
                   1274:        br      addone
                   1275:        br      addone
                   1276:        br      addone
                   1277:        br      addone
                   1278:        br      addone
                   1279:        br      addone
                         /* mode 11 (toward positive), sign = 1: never add */
                   1280:        br      noaddone
                   1281:        br      noaddone
                   1282:        br      noaddone
                   1283:        br      noaddone
                   1284:        br      noaddone
                   1285:        br      noaddone
                   1286:        br      noaddone
                   1287:        br      noaddone
                   1288:
                   1289: /* Round by adding a one to the LSB of the mantissa. */
                         /* For a double result the carry out of the low word r11 is propagated */
                         /* into the high word r5; for a single result it is dropped.  Both addone */
                         /* and noaddone end by recording inexact and underflow in r2. */
                   1290: addone:
                   1291:        or      r6,r0,1         /* load a 1 into r6 so that add.co can be used */
                   1292:        add.co  r11,r11,r6      /* add a one to the lower word of result */
                   1293:        bb0.n   destsize,r12,noaddone /* single result, forget carry */
                   1294:         set    r9,r9,1<4>      /* (delay slot) indicate that a 1 has been added */
                   1295:        add.ci  r5,r5,r0        /* propagate carry into high word */
                   1296:
                   1297: noaddone:
                   1298:        set     r2,r2,1<inexact>        /* rounding was needed: result is inexact */
                   1299:        set     r2,r2,1<underflow>      /* ...and it underflowed */
                   1300:
                   1301: /* Assemble the result of the denormalization routine for writeback to the */
                   1302: /* destination register. The exponent of a denormalized number is zero, */
                   1303: /* so simply assemble the sign and the new mantissa. */
                         /* A single result is left in r11; the sign is taken from r10. */
                   1304:
                   1305: assemble:
                   1306:        bb1     destsize,r12,doubassem  /* assemble double result */
                   1307:        bb0     sign,r10,exassems       /* exit assemble if sign is zero */
                   1308:        set     r11,r11,1<sign>         /* make result negative */
                   1309: exassems:
                   1310:        br      Ureturn
                   1311:
                   1312: doubassem:
                         /* Double result: the high word moves from r5 to r10 (low word stays in */
                         /* r11).  The sign is tested in the old r10 by the branch itself; the copy */
                         /* in its delay slot then overwrites r10. */
                   1313:        bb0.n   sign,r10,signclr        /* do not set sign in r10 */
                   1314:         or     r10,r5,r0               /* (delay slot) load high word from r5 into r10 */
                   1315:        set     r10,r10,1<sign>         /* high word with sign loaded */
                   1316: signclr:
                   1317:        /* FALLTHROUGH */
                   1318:        /* br   Ureturn */
                   1319:
                   1320: /* Return to fpui. */
                   1321: Ureturn:
                   1322:        ld      r1,r31,0        /* load return address saved at r31+0 */
                   1323:        jmp     r1
                   1324:
                   1325: /*
                   1326:  * FPoverflow
                   1327:  */
                   1328:
                   1329: ASLOCAL(FPoverflow)
                         /* Overflow handler: record overflow and inexact in r2, then pick the */
                         /* default result according to the rounding mode bits (modehi, modelo) of */
                         /* r10: 00 nearest, 01 zero, 10 negative, 11 positive. */
                   1330:        st      r1,r31,0        /* save return address */
                   1331:        set     r2,r2,1<overflow>
                   1332:        set     r2,r2,1<inexact>
                   1333:
                   1334: /* Determine which rounding mode to use for the default procedure. */
                   1335:
                   1336:        bb1     modehi,r10,signed /* mode is either round toward pos. or neg. */
                   1337:        bb0     modelo,r10,OFnearest /* rounding mode is round nearest */
                   1338:        br      OFzero          /* rounding mode is round zero */
                   1339: signed:
                   1340:        bb0     modelo,r10,OFnegative /* rounding mode is round negative */
                   1341:        br      positive        /* rounding mode is round positive */
                   1342:
                   1343:
                   1344: /* Round to nearest: an overflowed result becomes infinity carrying the */
                   1345: /* sign of the original value (+infinity if positive, -infinity if */
                   1346: /* negative).  The single or double constant is built inline. */
                   1347:
                   1348: OFnearest:
                   1349:        bb1.n   destsize,r12,neardouble /* double result is built */
                   1350:                                        /* at neardouble */
                   1351:         mask.u r5,r10,0x8000           /* (delay slot) r5 = sign bit only */
                                or.u    r11,r5,hi16(0x7f800000) /* sign | upper half of single infinity */
                                br.n    FPof_return             /* return with result */
                                 or     r11,r11,lo16(0x7f800000) /* (delay slot) lower half */
                   1356: neardouble:
                                or.u    r10,r5,hi16(0x7ff00000) /* sign | upper half of high word */
                                or      r10,r10,lo16(0x7ff00000) /* lower half of high word */
                                br.n    FPof_return             /* return with result */
                                 or     r11,r0,r0               /* (delay slot) low word of infinity is zero */
                   1362:
                   1363:
                   1364: /* In the round toward zero mode, positive values are rounded to the largest */
                   1365: /* positive finite number and negative values are rounded toward the largest */
                   1366: /* negative finite number. */
                   1367: /* The value for single or double precision is built inline from constants. */
                   1368:
                   1369: OFzero:
                   1370:        bb1.n   destsize,r12,zerodouble /* branch to zerodouble of */
                   1371:                                        /* double result */
                   1372:         mask.u r5,r10,0x8000           /* (delay slot) mask off sign bit from MANTHI */
                   1373:        or.u    r11,r0,hi16(0x7f7fffff) /* load single finite number constant */
                   1374:        or      r11,r11,lo16(0x7f7fffff)
                   1375:        br.n    FPof_return             /* return with result */
                   1376:         or     r11,r5,r11              /* (delay slot) adjust sign */
                   1377: zerodouble:
                   1378:        set     r11,r0,0<0>             /* load lower word of finite number */
                   1379:        or.u    r10,r0,hi16(0x7fefffff) /* load upper word of finite number */
                   1380:        or      r10,r10,lo16(0x7fefffff)
                   1381:        br.n    FPof_return             /* return with result */
                   1382:         or     r10,r5,r10              /* (delay slot) adjust sign */
                   1383:
                   1384:
                   1385: /* In the round toward positive mode, positive values are rounded to */
                   1386: /* positive infinity and negative values are rounded to the largest */
                   1387: /* negative finite number. */
                   1388: /* The value for single or double precision is built from immediate constants. */
                         /* Result: r11 (single) or r10:r11 (double). The sign is tested in r10. */
                   1389:
                   1390: positive:
                   1391:        bb1     destsize,r12,posdouble  /* branch to section for double result */
                   1392: possingle:
                   1393:        bb1     sign,r10,possingleneg   /* branch to section for negatives */
                   1394: possinglepos:
                   1395:        or.u    r11,r0,hi16(0x7f800000) /* load single infinity constant */
                   1396:        br.n    FPof_return             /* return with result */
                   1397:         or     r11,r11,lo16(0x7f800000) /* delay slot: finish the constant */
                   1398: possingleneg:
                   1399:        or.u    r11,r0,hi16(0x7f7fffff) /* load single finite number constant */
                   1400:        or      r11,r11,lo16(0x7f7fffff)
                   1401:        br.n    FPof_return             /* return with result */
                   1402:         set    r11,r11,1<sign>         /* delay slot: set sign for negative */
                   1403: posdouble:
                   1404:        bb1     sign,r10,posdoubleneg   /* branch to negative double results */
                   1405: posdoublepos:
                   1406:        or      r11,r0,r0               /* load lower word of double infinity */
                   1407:        or.u    r10,r0,hi16(0x7ff00000) /* load upper word of infinity */
                   1408:        br.n    FPof_return             /* return with result */
                   1409:         or     r10,r10,lo16(0x7ff00000) /* delay slot: finish the constant */
                   1410: posdoubleneg:
                   1411:        set     r11,r0,0<0>             /* lower word of finite number: a width */
                                                                /* of 0 selects all 32 bits (all ones) */
                   1412:        or.u    r10,r0,hi16(0x7fefffff) /* load upper word of finite number */
                   1413:        or      r10,r10,lo16(0x7fefffff)
                   1414:        br.n    FPof_return             /* return with result */
                   1415:         set    r10,r10,1<sign>         /* delay slot: set sign for negative */
                   1416:
                   1417:
                   1418: /* In the round toward negative mode, positive values are rounded to the largest */
                   1419: /* positive finite number and negative values are rounded to negative infinity. */
                   1420: /* The value for single or double precision is built from immediate constants. */
                         /* Result: r11 (single) or r10:r11 (double). The sign is tested in r10. */
                   1421:
                   1422: OFnegative:
                   1423:        bb1     destsize,r12,negdouble  /* branch to section for double result */
                   1424: negsingle:
                   1425:        bb1     sign,r10,negsingleneg   /* branch to section for negatives */
                   1426: negsinglepos:
                   1427:        or.u    r11,r0,hi16(0x7f7fffff) /* load single finite number constant */
                   1428:        br.n    FPof_return             /* return with result */
                   1429:         or     r11,r11,lo16(0x7f7fffff) /* delay slot: finish the constant */
                   1430: negsingleneg:
                   1431:        or.u    r11,r0,hi16(0x7f800000) /* load single infinity constant */
                   1432:        or      r11,r11,lo16(0x7f800000)
                   1433:        br.n    FPof_return             /* return with result */
                   1434:         set    r11,r11,1<sign>         /* delay slot: set sign for negative */
                   1435: negdouble:
                   1436:        bb1     sign,r10,negdoubleneg   /* branch to negative double results */
                   1437: negdoublepos:
                   1438:        set     r11,r0,0<0>             /* lower word of finite number: a width */
                                                                /* of 0 selects all 32 bits (all ones) */
                   1439:        or.u    r10,r0,hi16(0x7fefffff) /* load upper word of finite number */
                   1440:        br.n    FPof_return             /* return with result */
                   1441:         or     r10,r10,lo16(0x7fefffff) /* delay slot: finish the constant */
                   1442: negdoubleneg:
                   1443:        or      r11,r0,r0               /* load lower word of double infinity */
                   1444:        or.u    r10,r0,hi16(0x7ff00000) /* load upper word of infinity */
                   1445:        or      r10,r10,lo16(0x7ff00000)
                   1446:        set     r10,r10,1<sign>         /* set sign for negative; execution then */
                                                                /* falls through into FPof_return */
                   1447:
                   1448: FPof_return:
                         /* Common exit for the overflow result builders above: reload the */
                         /* return address from the word at r31+0 and jump to it. */
                   1449:        ld      r1,r31,0                /* ld return address */
                   1450:        jmp     r1
                   1451:
                   1452: /* If either S1 or S2 is a signalling NaN, then set the invalid operation */
                   1453: /* bit of the FPSR. */
                   1454: /* If S1 is the only NaN or one of two NaNs, then write */
                   1455: /* a quiet S1 to the result. A signalling NaN must be made quiet before */
                   1456: /* it can be written, but a signalling S2 is not modified in this routine */
                   1457: /* if S1 is a NaN. */
                         /* Registers as used here: r5 = S1 high word, r7 = S2 high word, r12 = */
                         /* operand flags (s1nan, s2nan), r2 = status word that receives the oper */
                         /* bit (presumably the FPSR image; confirm against the caller). */
                   1458: ASLOCAL(NaN)
                   1459:        bb0.n   s1nan,r12,S2sigcheck    /* S1 is not a NaN */
                   1460:         st     r1,r31,0                /* delay slot (always runs): save return address */
                   1461:        bb1     sigbit,r5,S2sigcheck    /* sigbit already set: S1 is not a signaling NaN */
                   1462:        set     r2,r2,1<oper>           /* signaling S1: flag the invalid operation */
                   1463:        br.n    S1write         /* FPSR bit already set, S1 is made quiet, */
                   1464:                                /* and since we always write S1 if it is a */
                   1465:                                /* NaN, write S1 and skip rest of routine */
                   1466:         set    r5,r5,1<sigbit> /* delay slot: make S1 a quiet NaN */
                   1467:
                   1468: ASLOCAL(S2sigcheck)
                   1469:        bb0     s2nan,r12,S1write       /* S2 is not a NaN */
                   1470:        bb1     sigbit,r7,S1write       /* sigbit already set: S2 is not a signaling NaN */
                   1471:        set     r2,r2,1<oper>           /* signaling S2: flag the invalid operation */
                   1472:        set     r7,r7,1<sigbit>         /* make S2 a quiet NaN, then fall through to S1write */
                   1473:
                   1474:
                   1475: /* Write a single or double precision quiet NaN unless the operation is FCMP. */
                   1476: /* If the operation is FCMP, then set the not comparable bit in the result. */
                         /* S1 is in r5:r6 and the opcode is extracted from r9. The result is left */
                         /* in r6 (single or FCMP) or in r5:r6 (double). r10 and r11 are scratch. */
                   1477:
                   1478: ASLOCAL(S1write)
                   1479:        bb0     s1nan,r12,S2write /* do not write S1 if it is not a NaN */
                   1480:        extu    r10,r9,5<11>    /* extract opcode */
                   1481:        cmp     r11,r10,FCMPop  /* compare to FCMP */
                   1482:        bb1     ne,r11,S1noFCMP /* operation is not FCMP */
                   1483:        set     r6,r0,1<nc>     /* set the not comparable bit */
                   1484:        br.n    FPnan_return
                   1485:         set    r6,r6,1<ne>     /* delay slot: set the not equal bit */
                   1486: ASLOCAL(S1noFCMP)
                   1487:        bb1.n   dsize,r9,wrdoubS1 /* double destination */
                   1488:         set    r5,r5,11<20>    /* delay slot (both paths): set all exponent bits to 1 */
                   1489: /* The single result will be formed the same way whether S1 is a single or double */
                   1490: ASLOCAL(wrsingS1)
                   1491:        mak     r10,r5,28<3>    /* low 28 bits of r5 shifted left by 3: */
                                                        /* wipe out extra exponent bits */
                   1492:        extu    r11,r6,3<29>    /* get lower three bits of mantissa (top 3 bits of r6) */
                   1493:        or      r10,r10,r11     /* combine all of result except sign */
                   1494:        clr     r6,r5,31<0>     /* clear all but sign */
                   1495:        br.n    FPnan_return
                   1496:         or     r6,r6,r10       /* delay slot: form result */
                   1497:
                   1498: ASLOCAL(wrdoubS1)
                   1499:        set     r6,r6,29<0>     /* set extra bits of lower word (low 29 bits) */
                   1500:        br      FPnan_return    /* no modification necessary for writing */
                   1501:                                /* double to double, so return */
                   1502:
                   1503: ASLOCAL(S2write)
                         /* Write S2 (r7:r8) as the quiet NaN result; reached from S1write when */
                         /* S1 is not a NaN. For FCMP only the nc and ne bits are returned in r6. */
                         /* Otherwise the result is left in r6 (single) or r5:r6 (double), the */
                         /* same registers the S1 path uses. r10 and r11 are scratch. */
                   1504:        extu    r10,r9,5<11>    /* extract opcode */
                   1505:        cmp     r11,r10,FCMPop  /* compare to FCMP */
                   1506:        bb1.n   ne,r11,S2noFCMP /* operation is not FCMP */
                   1507:         set    r7,r7,11<20>    /* delay slot (both paths): set all S2 exponent bits to 1 */
                   1508:        set     r6,r0,1<nc>     /* set the not comparable bit */
                   1509:        br.n    FPnan_return
                   1510:         set    r6,r6,1<ne>     /* delay slot: set the not equal bit */
                   1511: ASLOCAL(S2noFCMP)
                   1512:        bb1.n   dsize,r9,wrdoubS2 /* double destination */
                   1513:         or     r5,r0,r7        /* delay slot: S2 high word (exponent already */
                                                        /* forced to ones above) becomes the result */
                                                        /* high word. This used to be */
                                                        /* "set r5,r5,11<20>", which left the high */
                                                        /* word of S1 in a double result. The single */
                                                        /* path below does not read r5. */
                   1514: /* The single result will be formed the same way whether S2 is a single or double */
                   1515: ASLOCAL(wrsingS2)
                   1516:        mak     r10,r7,28<3>    /* low 28 bits of r7 shifted left by 3: */
                                                        /* wipe out extra exponent bits */
                   1517:        extu    r11,r8,3<29>    /* get lower three bits of mantissa (top 3 bits of r8) */
                   1518:        or      r10,r10,r11     /* combine all of result except sign */
                   1519:        clr     r6,r7,31<0>     /* clear all but sign */
                   1520:        br.n    FPnan_return
                   1521:         or     r6,r6,r10       /* delay slot: form result */
                   1522:
                   1523: ASLOCAL(wrdoubS2)
                   1524:        set     r6,r8,29<0>     /* result low word = S2 low word with the */
                                                        /* low 29 bits set; falls through to */
                                                        /* FPnan_return */
                   1525:
                   1526: /* Return from this subroutine with the result. */
                   1527:
                   1528: ASLOCAL(FPnan_return)
                   1529:                                /* no modification necessary for writing */
                   1530:                                /* double to double, so return */
                   1531:        ld      r1,r31, 0       /* retrieve return address saved at entry to NaN */
                   1532:        jmp     r1
                   1533:
                   1534: /*
                   1535:  * infinity
                   1536:  */
                   1537:
                   1538: /* Extract the opcode, compare to a constant, and branch to the code */
                   1539: /* for the instruction. */
                         /* The opcode is the 5-bit field at bit 11 of r9. r10 and r11 are scratch. */
                         /* The return address is stored at r31+0 so the handlers can use bsr and */
                         /* still return through inf_return. If no comparison matches, execution */
                         /* falls through into FADD. */
                   1540:
                   1541: ASLOCAL(infinity)
                   1542:        extu    r10,r9,5<11>    /* extract opcode */
                   1543:        cmp     r11,r10,FADDop  /* compare to FADD */
                   1544:        bb1.n   eq,r11,FADD     /* operation is FADD */
                   1545:         st     r1,r31,0        /* delay slot (always runs): save return address */
                   1546:        cmp     r11,r10,FSUBop  /* compare to FSUB */
                   1547:        bb1     eq,r11,FSUB     /* operation is FSUB */
                   1548:        cmp     r11,r10,FCMPop  /* compare to FCMP */
                   1549:        bb1     eq,r11,FCMP     /* operation is FCMP */
                   1550:        cmp     r11,r10,FMULop  /* compare to FMUL */
                   1551:        bb1     eq,r11,FMUL     /* operation is FMUL */
                   1552:        cmp     r11,r10,FDIVop  /* compare to FDIV */
                   1553:        bb1     eq,r11,FDIV     /* operation is FDIV */
                   1554: #if 0
                   1555:        cmp     r11,r10,FSQRTop /* compare to FSQRT */
                   1556:        bb1     eq,r11,FSQRT    /* operation is FSQRT */
                   1557: #endif
                   1558:        cmp     r11,r10,INTop   /* compare to INT */
                   1559:        bb1     eq,r11,FP_inf_overflw /* operation is INT */
                   1560:        cmp     r11,r10,NINTop  /* compare to NINT */
                   1561:        bb1     eq,r11,FP_inf_overflw /* operation is NINT */
                   1562:        cmp     r11,r10,TRNCop  /* compare to TRNC */
                   1563:        bb1     eq,r11,FP_inf_overflw /* operation is TRNC */
                   1564:
                   1565:
                   1566: /* Adding infinities of opposite signs will cause an exception, */
                   1567: /* but all other operands will result in a correctly signed infinity. */
                         /* r12 holds the s1inf and s2inf flags. The signs are read from the high */
                         /* words r5 (S1) and r7 (S2). */
                   1568:
                   1569: FADD:
                   1570:        bb0     s1inf,r12,addS2write    /* branch if S1 not infinity */
                   1571:        bb0     s2inf,r12,addS1write    /* S2 is not inf., so branch to write S1 */
                   1572:        bb1     sign,r5,addS1neg        /* handle case of S1 negative */
                   1573: addS1pos:
                   1574:        bb1     sign,r7,excpt           /* adding infinities of different */
                   1575:                                        /* signs causes an exception */
                   1576:        br      poswrinf                /* branch to write positive infinity */
                   1577: addS1neg:
                   1578:        bb0     sign,r7,excpt           /* adding infinities of different */
                   1579:                                        /* signs causes an exception */
                   1580:        br      negwrinf                /* branch to write negative infinity */
                   1581: addS1write:
                   1582:        bb0     sign,r5,poswrinf        /* only S1 is infinite: result takes the sign of S1 */
                   1583:        br      negwrinf                /* branch to write negative infinity */
                   1584: addS2write:
                   1585:        bb0     sign,r7,poswrinf        /* only S2 is infinite: result takes the sign of S2 */
                   1586:        br      negwrinf                /* branch to write negative infinity */
                   1587:
                   1588:
                   1589: /* Subtracting infinities of the same sign will cause an exception, */
                   1590: /* but all other operands will result in a correctly signed infinity. */
                         /* r12 holds the s1inf and s2inf flags. The signs are read from the high */
                         /* words r5 (S1) and r7 (S2). */
                   1591:
                   1592: FSUB:
                   1593:        bb0     s1inf,r12,subS2write    /* branch if S1 not infinity */
                   1594:        bb0     s2inf,r12,subS1write    /* S2 is not inf., so branch to write S1 */
                   1595:        bb1     sign,r5,subS1neg        /* handle case of S1 negative */
                   1596: subS1pos:
                   1597:        bb0     sign,r7,excpt           /* subtracting infinities of the same */
                   1598:                                        /* sign causes an exception */
                   1599:        br      poswrinf                /* branch to write positive infinity */
                   1600: subS1neg:
                   1601:        bb1     sign,r7,excpt           /* subtracting infinities of the same */
                   1602:                                        /* sign causes an exception */
                   1603:        br      negwrinf                /* branch to write negative infinity */
                   1604: subS1write:
                   1605:        bb0     sign,r5,poswrinf        /* only S1 is infinite: result takes the sign of S1 */
                   1606:        br      negwrinf                /* branch to write negative infinity */
                   1607: subS2write:
                   1608:        bb1     sign,r7,poswrinf        /* only S2 is infinite: result takes the */
                                                                /* opposite sign, so negative S2 gives +inf */
                   1609:        br      negwrinf                /* branch to write negative infinity */
                   1610:
                   1611:
                   1612: /* Compare the operands, at least one of which is infinity, and set the */
                   1613: /* correct bits in the destination register. */
                         /* The answer is accumulated in r4 and copied to r6 at "move". The signs */
                         /* are read from r5 (S1) and r7 (S2). The s1zero and s2zero flags in r12 */
                         /* are tested after each call to zero (presumably set by that routine, */
                         /* which is outside this excerpt). bsr overwrites r1; the return address */
                         /* was already saved at r31+0 by the infinity dispatcher. */
                         /* Label suffixes: pi/ni = +/- infinity, pf/nf = +/- finite. */
                   1614:
                   1615: FCMP:
                   1616:        bb0.n   s1inf,r12,FCMPS1f       /* branch for finite S1 */
                   1617:         set    r4,r0,1<cp>             /* since neither S1 or S2 is a NaN, */
                   1618:                                        /* set cp (delay slot, runs on both paths) */
                   1619: FCMPS1i:
                   1620:        bb1     sign,r5,FCMPS1ni        /* branch to negative S1i */
                   1621: FCMPS1pi:
                   1622:        bb0     s2inf,r12,FCMPS1piS2f   /* branch to finite S2 with S1pi */
                   1623: FCMPS1piS2i:
                   1624:        bb1     sign,r7,FCMPS1piS2ni    /* branch to negative S2i with S1pi */
                   1625: FCMPS1piS2pi:
                   1626:        set     r4,r4,1<eq>             /* set eq bit */
                   1627:        set     r4,r4,1<le>             /* set le bit */
                   1628:        set     r4,r4,1<ge>             /* set ge bit */
                   1629:        set     r4,r4,1<ib>             /* set ib bit */
                   1630:        br.n    move
                   1631:         set    r4,r4,1<ob>             /* set ob bit */
                   1632: FCMPS1piS2ni:
                   1633:        set     r4,r4,1<ne>             /* set ne bit */
                   1634:        set     r4,r4,1<gt>             /* set gt bit */
                   1635:        br.n    move
                   1636:         set    r4,r4,1<ge>             /* set ge bit */
                   1637: FCMPS1piS2f:
                   1638:        set     r4,r4,1<ne>             /* set ne bit */
                   1639:        set     r4,r4,1<gt>             /* set gt bit */
                   1640:        bsr.n   _ASM_LABEL(zero)        /* see if any of the operands are zero */
                   1641:         set    r4,r4,1<ge>             /* set ge bit */
                   1642:        bb0     s2zero,r12,FCMPS1piS2nz /* check for negative if s2 not zero */
                   1643:        set     r4,r4,1<ou>             /* set ou bit */
                   1644:        br.n    move
                   1645:         set    r4,r4,1<ob>             /* set ob bit */
                   1646: FCMPS1piS2nz:
                   1647:        bb1     sign,r7,move            /* return if s2 is negative */
                   1648: FCMPS1piS2pf:
                   1649:        set     r4,r4,1<ou>             /* set ou bit */
                   1650:        br.n    move
                   1651:         set    r4,r4,1<ob>             /* set ob bit */
                   1652: FCMPS1ni:
                   1653:        bb0     s2inf,r12,FCMPS1niS2f   /* branch to finite S2 with S1ni */
                   1654: FCMPS1niS2i:
                   1655:        bb1     sign,r7,FCMPS1niS2ni    /* branch to negative S2i with S1ni */
                   1656: FCMPS1niS2pi:
                   1657:        set     r4,r4,1<ne>             /* set ne bit */
                   1658:        set     r4,r4,1<le>             /* set le bit */
                   1659:        set     r4,r4,1<lt>             /* set lt bit */
                   1660:        set     r4,r4,1<ou>             /* set ou bit */
                   1661:        br.n    move
                   1662:         set    r4,r4,1<ob>             /* set ob bit */
                   1663: FCMPS1niS2ni:
                   1664:        set     r4,r4,1<eq>             /* set eq bit */
                   1665:        set     r4,r4,1<le>             /* set le bit */
                   1666:        br.n    move
                   1667:         set    r4,r4,1<ge>             /* set ge bit */
                   1668: FCMPS1niS2f:
                   1669:        set     r4,r4,1<ne>             /* set ne bit */
                   1670:        set     r4,r4,1<le>             /* set le bit */
                   1671:        bsr.n   _ASM_LABEL(zero)        /* see if any of the operands are zero */
                   1672:         set    r4,r4,1<lt>             /* set lt bit */
                   1673:        bb0     s2zero,r12,FCMPS1niS2nz /* branch if s2 is not zero */
                   1674:        set     r4,r4,1<ou>             /* set ou bit */
                   1675:        br.n    move
                   1676:         set    r4,r4,1<ob>             /* set ob bit */
                   1677: FCMPS1niS2nz:
                   1678:        bb1     sign,r7,move            /* return if s2 is negative */
                   1679:        set     r4,r4,1<ou>             /* set ou bit */
                   1680:        br.n    move
                   1681:         set    r4,r4,1<ob>             /* set ob bit */
                   1682: FCMPS1f:
                   1683:        bb1     sign,r5,FCMPS1nf        /* branch to negative S1f */
                   1684: FCMPS1pf:
                   1685:        bb1.n   sign,r7,FCMPS1pfS2ni    /* branch to negative S2i with S1pf */
                   1686:         set    r4,r4,1<ne>             /* set ne bit (delay slot, both paths) */
                   1687: FCMPS1pfS2pi:
                   1688:        set     r4,r4,1<le>             /* set le bit */
                   1689:        set     r4,r4,1<lt>             /* set lt bit */
                   1690:        bsr.n   _ASM_LABEL(zero)        /* see which of the operands are zero */
                   1691:         set    r4,r4,1<ib>             /* set ib bit */
                   1692:        bb0     s1zero,r12,FCMPS1pfS2pinozero /* branch if s1 is not zero */
                   1693: FCMPS1pfS2pizero:
                   1694:        br.n    move
                   1695:         set    r4,r4,1<ob>             /* set ob bit */
                   1696: FCMPS1pfS2pinozero:
                   1697:        br.n    move
                   1698:         set    r4,r4,1<in>             /* set in bit */
                   1699: FCMPS1pfS2ni:
                   1700:        set     r4,r4,1<gt>             /* set gt bit */
                   1701:        br.n    move
                   1702:         set    r4,r4,1<ge>             /* set ge bit */
                   1703: FCMPS1nf:
                   1704:        bb1.n   sign,r7,FCMPS1nfS2ni    /* branch to negative S2i with S1nf */
                   1705:         set    r4,r4,1<ne>             /* set ne bit (delay slot, both paths) */
                   1706:        set     r4,r4,1<le>             /* set le bit */
                   1707:        set     r4,r4,1<lt>             /* set lt bit */
                   1708:        bsr.n   _ASM_LABEL(zero)        /* see which of the operands are zero */
                   1709:         set    r4,r4,1<ob>             /* set ob bit */
                   1710:        bb0     s1zero,r12,FCMPS1nfS2pinozero /* no ls and lo */
                   1711: FCMPS1nfS2pizero:
                   1712:        br.n    move
                   1713:         set    r4,r4,1<ib>             /* set ib bit */
                   1714: FCMPS1nfS2pinozero:
                   1715:        br.n    move
                   1716:         set    r4,r4,1<ou>             /* set ou bit */
                   1717: FCMPS1nfS2ni:
                   1718:        set     r4,r4,1<gt>             /* set gt bit */
                   1719:        set     r4,r4,1<ge>             /* set ge bit, then fall through to move */
                   1720:
                   1721: move:
                   1722:        br.n    inf_return
                   1723:         or     r6,r0,r4                /* delay slot: transfer answer to r6 */
                   1724:
                   1725:
                   1726: /* Multiplying infinity and zero causes an exception, but all other */
                   1727: /* operations produce a correctly signed infinity. */
                         /* The s1zero and s2zero flags in r12 are tested after the call to zero. */
                         /* The result sign is the exclusive-or of the signs in r5 (S1) and r7 (S2). */
                   1728:
                   1729: FMUL:
                   1730:        bsr     _ASM_LABEL(zero)        /* see if any of the operands are zero */
                   1731:        bb1     s1zero,r12,excpt        /* infinity X 0 causes an exception */
                   1732:        bb1     s2zero,r12,excpt        /* infinity X 0 causes an exception */
                   1733:        bb1     sign,r5,FMULS1neg       /* handle negative cases of S1 */
                   1734:        bb0     sign,r7,poswrinf        /* + X + = + */
                   1735:        br      negwrinf                /* + X - = - */
                   1736: FMULS1neg:
                   1737:        bb1     sign,r7,poswrinf        /* - X - = + */
                   1738:        br      negwrinf                /* - X + = - */
                   1739:
                   1740:
                   1741: /* Dividing infinity by infinity causes an exception, but dividing */
                   1742: /* infinity by a finite yields a correctly signed infinity, and */
                   1743: /* dividing a finite by an infinity produces a correctly signed zero. */
                         /* r12 holds the s1inf and s2inf flags. The signs are read from r5 (S1) */
                         /* and r7 (S2). Label suffixes: pi/mi = +/- infinity, pf/nf = +/- finite. */
                   1744:
                   1745: FDIV:
                   1746:        bb1     s1inf,r12,FDIVS1inf     /* handle case of S1 being infinity */
                   1747:        bb1     sign,r5,FDIVS1nf        /* handle cases of S1 being neg. non-inf. */
                   1748:        bb1     sign,r7,FDIVS1pfS2mi    /* handle case of negative S2 */
                   1749: FDIVS1pfS2pi:
                   1750:        br      poswrzero               /* +f / +inf = +0 */
                   1751: FDIVS1pfS2mi:
                   1752:        br      negwrzero               /* +f / -inf = -0 */
                   1753: FDIVS1nf:
                   1754:        bb1     sign,r7,FDIVS1nfS2mi    /* handle case of negative S2 */
                   1755: FDIVS1nfS2pi:
                   1756:        br      negwrzero               /* -f / +inf = -0 */
                   1757: FDIVS1nfS2mi:
                   1758:        br      poswrzero               /* -f / -inf = +0 */
                   1759: FDIVS1inf:
                   1760:        bb1     s2inf,r12,excpt         /* inf / inf = exception */
                   1761:        bb1     sign,r5,FDIVS1mi        /* handle cases of S1 being neg. inf. */
                   1762:        bb1     sign,r7,FDIVS1piS2nf    /* handle case of negative S2 */
                   1763: FDIVS1piS2pf:
                   1764:        br      poswrinf                /* +inf / +f = +inf */
                   1765: FDIVS1piS2nf:
                   1766:        br      negwrinf                /* +inf / -f = -inf */
                   1767: FDIVS1mi:
                   1768:        bb1     sign,r7,FDIVS1miS2nf    /* handle case of negative S2 */
                   1769: FDIVS1miS2pf:
                   1770:        br      negwrinf                /* -inf / +f = -inf */
                   1771: FDIVS1miS2nf:
                   1772:        br      poswrinf                /* -inf / -f = +inf */
                   1773:
                   1774:
                   1775: /* The square root of positive infinity is positive infinity, */
                   1776: /* but the square root of negative infinity is a NaN */
                         /* This handler is compiled out (#if 0), as is its dispatch test in the */
                         /* infinity routine. */
                   1777:
                   1778: #if 0
                   1779: FSQRT:
                   1780:        bb0     sign,r7,poswrinf        /* write sqrt(inf) = inf */
                   1781:        br      excpt                   /* write sqrt(-inf) = NaN */
                   1782: #endif
                   1783:
                   1784: excpt:
                         /* Invalid operation on an infinity: set the oper bit in r2 and return a */
                         /* NaN with every bit set. A field width of 0 selects all 32 bits. */
                   1785:        set     r2,r2,1<oper>   /* flag the invalid operation */
                   1786:        set     r5,r0,0<0>      /* write NaN into r5 */
                   1787:        br.n    inf_return
                   1788:         set    r6,r0,0<0>      /* write NaN into r6, writing NaNs into */
                   1789:                                /* both of these registers is quicker than */
                   1790:                                /* checking for single or double precision */
                   1791:
                   1792:
                   1793: /* Write positive infinity of the correct precision */
                         /* Single result in r6; double result in r5 (high) and r6 (low). */
                   1794:
                   1795: poswrinf:
                   1796:        bb1     dsize,r9,poswrinfd      /* branch to write double precision inf. */
                   1797:        br.n    inf_return
                   1798:         or.u   r6,r0,0x7f80            /* delay slot: r6 = 0x7f800000, single precision pos inf. */
                   1799: poswrinfd:
                   1800:        or.u    r5,r0,0x7ff0            /* r5 = 0x7ff00000, high word of double precision pos inf. */
                   1801:        br.n    inf_return
                   1802:         or     r6,r0,r0                /* delay slot: low word is zero */
                   1803:
                   1804:
                   1805: /* Write negative infinity of the correct precision */
                         /* Single result in r6; double result in r5 (high) and r6 (low). */
                   1806:
                   1807: negwrinf:
                   1808:        bb1     dsize,r9,negwrinfd      /* branch to write double precision inf. */
                   1809:        br.n    inf_return
                   1810:         or.u   r6,r0,0xff80            /* delay slot: r6 = 0xff800000, single precision neg inf. */
                   1811: negwrinfd:
                   1812:        or.u    r5,r0,0xfff0            /* r5 = 0xfff00000, high word of double precision neg inf. */
                   1813:        br.n    inf_return
                   1814:         or     r6,r0,r0                /* delay slot: low word is zero */
                   1815:
                   1816:
                   1817: /* Write a positive zero disregarding precision. */
                         /* Both r5 and r6 are cleared, which covers the single (r6) and the */
                         /* double (r5:r6) result. */
                   1818:
                   1819: poswrzero:
                   1820:        or      r5,r0,r0        /* write to both high word and low word now */
                   1821:        br.n    inf_return      /* it does not matter that both are written */
                   1822:         or     r6,r0,r0        /* delay slot: clear r6 */
                   1823:
                   1824:
                   1825: /* Write a negative zero of the correct precision. */
                         /* Single: r6 = 0x80000000. Double: r5 = 0x80000000 and r6 = 0. */
                   1826:
                   1827: negwrzero:
                   1828:        or      r6,r0,r0        /* clear low word */
                   1829:        bb1     dsize,r9,negwrzerod /* branch to write double precision zero */
                   1830:        br.n    inf_return
                   1831:         set    r6,r6,1<31>     /* delay slot: set sign bit of the single result */
                   1832: negwrzerod:
                   1833:        or      r5,r0,r0        /* clear high word */
                   1834:        br.n    inf_return
                   1835:         set    r5,r5,1<31>     /* delay slot: set sign bit of the double result */
                   1836:
                   1837: FP_inf_overflw:
                         /* Conversion of an infinity to integer (INT, NINT and TRNC are */
                         /* dispatched here): set the oper, overflow and inexact bits in r2 and */
                         /* return the largest integer with the sign of S2 (r7) in r6. */
                   1838:        set     r2,r2,1<oper>
                   1839:        set     r2,r2,1<overflow>
                   1840:        set     r2,r2,1<inexact>
                   1841:
                   1842:        bb0.n   sign,r7,inf_return /* if positive then return */
                   1843:
                   1844:         set    r6,r0,31<0>     /* delay slot (both paths): r6 = 0x7fffffff, */
                                                        /* the largest positive integer. It is built */
                                                        /* from r0 so that a stale bit 31 in r6 */
                                                        /* cannot leak into the result. */
                   1845:        or.c    r6,r0,r6        /* complement r6, giving 0x80000000, the */
                                                        /* largest negative int.; then fall through */
                                                        /* to inf_return */
                   1846:
                   1847: inf_return:
                   1848:        ld      r1,r31,0        /* load return address */
                   1849:        jmp     r1
                   1850:
                   1851: /*
                   1852:  * denorm
                   1853:  */
                   1854:
                   1855: /* Check to see if either S1 or S2 is a denormalized number. First */
                   1856: /* extract the exponent to see if it is zero, and then check to see if */
                   1857: /* the mantissa is not zero. If the number is denormalized, then set */
                   1858: /* bit 1 (for S1) or bit 0 (for S2) in r12. */
                   1859:
                   1860: ASLOCAL(denorm)
                   1861:        st      r1,r31,0        /* save return address */
                   1862: dnmcheckS1:
                   1863:        extu    r10,r5,11<20>   /* extract exponent of S1 */
                   1864:        bcnd    ne0,r10,dnmsetS2 /* S1 is not a denorm, so S2 must be */
                   1865:        bb1.n   9,r9,dnmcheckS1d /* S1 is double precision */
                   1866:         mak    r10,r5,20<3>    /* (delay slot) mak field with only the */
                   1867:                                /* high word mantissa bits */
                   1868: dnmcheckS1s:
                   1869:        extu    r11,r6,3<29>    /* get three low bits of mantissa */
                   1870:        or      r10,r10,r11     /* assemble all of the mantissa bits */
                   1871:        bcnd    eq0,r10,dnmsetS2 /* S1 is not a denorm, so S2 must be */
                   1872:        br      dnmsetS1        /* S1 is a denorm */
                   1873:
                   1874: dnmcheckS1d:
                   1875:        or      r10,r6,r10      /* or all of mantissa bits */
                   1876:        bcnd    eq0,r10,dnmsetS2 /* S1 is not a denorm, so S2 must be */
                   1877: dnmsetS1:
                   1878:        set     r12,r12,1<1>    /* S1 is a denorm: set bit 1 of r12 */
                   1879:
                   1880: dnmcheckS2:
                   1881:        extu    r10,r7,11<20>   /* extract exponent of S2 */
                   1882:        bcnd    ne0,r10,S1form  /* S2 is not a denorm */
                   1883:        bb1.n   7,r9,dnmcheckS2d /* S2 is double precision */
                   1884:         mak    r10,r7,20<3>    /* (delay slot) mak field with only mantissa bits */
                   1885: dnmcheckS2s:
                   1886:        extu    r11,r8,3<29>    /* get three low bits of mantissa */
                   1887:        or      r10,r10,r11     /* assemble all of the mantissa bits */
                   1888:        bcnd    eq0,r10,S1form  /* S2 is not a denorm */
                   1889:        br      dnmsetS2        /* S2 is a denorm */
                   1890: dnmcheckS2d:
                   1891:        or      r10,r8,r10      /* or all of mantissa bits */
                   1892:        bcnd    eq0,r10,S1form  /* S2 is not a denorm */
                   1893: dnmsetS2:
                   1894:        set     r12,r12,1<0>    /* S2 is a denorm: set bit 0 of r12 */
                   1895:
                   1896:
                   1897: /* Since the operations are going to be reperformed with modified denorms, */
                   1898: /* the operands which were initially single precision need to be modified */
                   1899: /* back to single precision.   */
                   1900:
                   1901: S1form:
                   1902:        bb1     9,r9,S2form     /* S1 is double precision, so do not */
                   1903:                                /* modify S1 into single format */
                   1904:        mak     r11,r5,28<3>    /* shift exponent and mantissa left by 3, */
                   1905:                                /* eliminating extra 3 bits of exponent */
                   1906:        extu    r6,r6,3<29>     /* get low 3 bits of mantissa */
                   1907:        or      r11,r6,r11      /* form complete mantissa and exponent */
                   1908:        extu    r10,r5,1<31>    /* get the sign bit (bit 31) */
                   1909:        mak     r10,r10,1<31>   /* place sign bit in correct position */
                   1910:        or      r6,r10,r11      /* or sign, exponent, and all of mantissa */
                   1911:
                   1912: S2form:
                   1913:        bb1     7,r9,checkop    /* S2 is double precision, so do not */
                   1914:                                /* modify S2 into single format */
                   1915:        mak     r11,r7,28<3>    /* shift exponent and mantissa left by 3, */
                   1916:                                /* eliminating extra 3 bits of exponent */
                   1917:        extu    r8,r8,3<29>     /* get low 3 bits of mantissa */
                   1918:        or      r11,r8,r11      /* form complete mantissa and exponent */
                   1919:        extu    r10,r7,1<31>    /* get the sign bit (bit 31) */
                   1920:        mak     r10,r10,1<31>   /* place sign bit in correct position */
                   1921:        or      r8,r10,r11      /* or sign, exponent, and all of mantissa */
                   1922:
                   1923:
                   1924: /* Extract the opcode, compare to a constant, and branch to the code that */
                   1925: /* deals with that opcode. */
                   1926:
                   1927: checkop:
                   1928:        extu    r10,r9,5<11>    /* extract opcode (5 bits at bit 11 of r9) */
                   1929:        cmp     r11,r10,0x05    /* compare to FADD */
                   1930:        bb1     2,r11,denorm_FADD       /* operation is FADD (bit 2 of cmp result = equal) */
                   1931:        cmp     r11,r10,0x06    /* compare to FSUB */
                   1932:        bb1     2,r11,denorm_FSUB       /* operation is FSUB */
                   1933:        cmp     r11,r10,0x07    /* compare to FCMP */
                   1934:        bb1     2,r11,denorm_FCMP       /* operation is FCMP */
                   1935:        cmp     r11,r10,0x00    /* compare to FMUL */
                   1936:        bb1     2,r11,denorm_FMUL       /* operation is FMUL */
                   1937:        cmp     r11,r10,0x0e    /* compare to FDIV */
                   1938:        bb1     2,r11,denorm_FDIV       /* operation is FDIV */
                   1939: #if 0
                   1940:        cmp     r11,r10,0x0f    /* compare to FSQRT */
                   1941:        bb1     2,r11,denorm_FSQRT      /* operation is FSQRT */
                   1942: #endif
                   1943:        cmp     r11,r10,0x09    /* compare to INT */
                   1944:        bb1     2,r11,denorm_INT        /* operation is INT */
                   1945:        cmp     r11,r10,0x0a    /* compare to NINT */
                   1946:        bb1     2,r11,denorm_NINT       /* operation is NINT */
                   1947:        cmp     r11,r10,0x0b    /* compare to TRNC */
                   1948:        bb1     2,r11,denorm_TRNC       /* operation is TRNC; otherwise fall through to denorm_FADD */
                   1949:
                   1950:
                   1951: /* For all the following operations, the denormalized number is set to */
                   1952: /* zero and the operation is reperformed with the correct destination and */
                   1953: /* source sizes. */
                   1954:
                   1955: denorm_FADD:
                   1956:        bb0     1,r12,FADDS2dnm /* S1 is not denorm, so S2 must be */
                   1957:        or      r5,r0,r0        /* set S1 to zero */
                   1958:        or      r6,r0,r0
                   1959: FADDS2chk:
                   1960:        bb0     0,r12,FADDcalc  /* S2 is not a denorm */
                   1961: FADDS2dnm:
                   1962:        or      r7,r0,r0        /* set S2 to zero */
                   1963:        or      r8,r0,r0
                   1964: FADDcalc:
                   1965:        bb1     5,r9,FADDdD     /* branch for double precision destination */
                   1966: FADDsD:
                   1967:        bb1     9,r9,FADDsDdS1  /* branch for double precision S1 */
                   1968: FADDsDsS1:
                   1969:        bb1     7,r9,FADDsDsS1dS2 /* branch for double precision S2 */
                   1970: FADDsDsS1sS2:
                   1971:        br.n    denorm_return
                   1972:         fadd.sss r6,r6,r8      /* (delay slot) add the two sources and place result in S1 */
                   1973: FADDsDsS1dS2:
                   1974:        br.n    denorm_return
                   1975:         fadd.ssd r6,r6,r7      /* (delay slot) add the two sources and place result in S1 */
                   1976: FADDsDdS1:
                   1977:        bb1     7,r9,FADDsDdS1dS2 /* branch for double precision S2 */
                   1978: FADDsDdS1sS2:
                   1979:        br.n    denorm_return
                   1980:         fadd.sds r6,r5,r8      /* (delay slot) add the two sources and place result in S1 */
                   1981: FADDsDdS1dS2:
                   1982:        br.n    denorm_return
                   1983:         fadd.sdd r6,r5,r7      /* (delay slot) add the two sources and place result in S1 */
                   1984: FADDdD:
                   1985:        bb1     9,r9,FADDdDdS1  /* branch for double precision S1 */
                   1986: FADDdDsS1:
                   1987:        bb1     7,r9,FADDdDsS1dS2 /* branch for double precision S2 */
                   1988: FADDdDsS1sS2:
                   1989:        br.n    denorm_return
                   1990:         fadd.dss r5,r6,r8      /* (delay slot) add the two sources and place result in S1 */
                   1991: FADDdDsS1dS2:
                   1992:        br.n    denorm_return
                   1993:         fadd.dsd r5,r6,r7      /* (delay slot) add the two sources and place result in S1 */
                   1994: FADDdDdS1:
                   1995:        bb1     7,r9,FADDdDdS1dS2 /* branch for double precision S2 */
                   1996: FADDdDdS1sS2:
                   1997:        br.n    denorm_return
                   1998:         fadd.dds r5,r5,r8      /* (delay slot) add the two sources and place result in S1 */
                   1999: FADDdDdS1dS2:
                   2000:        br.n    denorm_return
                   2001:         fadd.ddd r5,r5,r7      /* (delay slot) add the two sources and place result in S1 */
                   2002:
                   2003: denorm_FSUB:
                   2004:        bb0     1,r12,FSUBS2dnm /* S1 is not denorm, so S2 must be */
                   2005:        or      r5,r0,r0        /* set S1 to zero */
                   2006:        or      r6,r0,r0
                   2007: FSUBS2chk:
                   2008:        bb0     0,r12,FSUBcalc  /* S2 is not a denorm */
                   2009: FSUBS2dnm:
                   2010:        or      r7,r0,r0        /* set S2 to zero */
                   2011:        or      r8,r0,r0
                   2012: FSUBcalc:
                   2013:        bb1     5,r9,FSUBdD     /* branch for double precision destination */
                   2014: FSUBsD:
                   2015:        bb1     9,r9,FSUBsDdS1  /* branch for double precision S1 */
                   2016: FSUBsDsS1:
                   2017:        bb1     7,r9,FSUBsDsS1dS2 /* branch for double precision S2 */
                   2018: FSUBsDsS1sS2:
                   2019:        br.n    denorm_return
                   2020:         fsub.sss r6,r6,r8      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2021: FSUBsDsS1dS2:
                   2022:        br.n    denorm_return
                   2023:         fsub.ssd r6,r6,r7      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2024: FSUBsDdS1:
                   2025:        bb1     7,r9,FSUBsDdS1dS2 /* branch for double precision S2 */
                   2026: FSUBsDdS1sS2:
                   2027:        br.n    denorm_return
                   2028:         fsub.sds r6,r5,r8      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2029: FSUBsDdS1dS2:
                   2030:        br.n    denorm_return
                   2031:         fsub.sdd r6,r5,r7      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2032: FSUBdD:
                   2033:        bb1     9,r9,FSUBdDdS1  /* branch for double precision S1 */
                   2034: FSUBdDsS1:
                   2035:        bb1     7,r9,FSUBdDsS1dS2 /* branch for double precision S2 */
                   2036: FSUBdDsS1sS2:
                   2037:        br.n    denorm_return
                   2038:         fsub.dss r5,r6,r8      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2039: FSUBdDsS1dS2:
                   2040:        br.n    denorm_return
                   2041:         fsub.dsd r5,r6,r7      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2042: FSUBdDdS1:
                   2043:        bb1     7,r9,FSUBdDdS1dS2 /* branch for double precision S2 */
                   2044: FSUBdDdS1sS2:
                   2045:        br.n    denorm_return
                   2046:         fsub.dds r5,r5,r8      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2047: FSUBdDdS1dS2:
                   2048:        br.n    denorm_return
                   2049:         fsub.ddd r5,r5,r7      /* (delay slot) subtract S2 from S1 and place result in S1 */
                   2050:
                   2051: denorm_FCMP:
                   2052:        bb0     1,r12,FCMPS2dnm /* S1 is not denorm, so S2 must be */
                   2053:        or      r5,r0,r0        /* set S1 to zero */
                   2054:        or      r6,r0,r0
                   2055: FCMPS2chk:
                   2056:        bb0     0,r12,FCMPcalc  /* S2 is not a denorm */
                   2057: FCMPS2dnm:
                   2058:        or      r7,r0,r0        /* set S2 to zero */
                   2059:        or      r8,r0,r0
                   2060: FCMPcalc:
                   2061:        bb1     9,r9,FCMPdS1    /* branch for double precision S1 */
                   2062: FCMPsS1:
                   2063:        bb1     7,r9,FCMPsS1dS2 /* branch for double precision S2 */
                   2064: FCMPsS1sS2:
                   2065:        br.n    denorm_return
                   2066:         fcmp.sss r6,r6,r8      /* (delay slot) compare the two sources and place result in r6 */
                   2067: FCMPsS1dS2:
                   2068:        br.n    denorm_return
                   2069:         fcmp.ssd r6,r6,r7      /* (delay slot) compare the two sources and place result in r6 */
                   2070: FCMPdS1:
                   2071:        bb1     7,r9,FCMPdS1dS2 /* branch for double precision S2 */
                   2072: FCMPdS1sS2:
                   2073:        br.n    denorm_return
                   2074:         fcmp.sds r6,r5,r8      /* (delay slot) compare the two sources and place result in r6 */
                   2075: FCMPdS1dS2:
                   2076:        br.n    denorm_return
                   2077:         fcmp.sdd r6,r5,r7      /* (delay slot) compare the two sources and place result in r6 */
                   2078:
                   2079: denorm_FMUL:
                   2080:        bb0     1,r12,FMULS2dnm /* S1 is not denorm, so S2 must be */
                   2081:        or      r5,r0,r0        /* set S1 to zero */
                   2082:        or      r6,r0,r0
                   2083: FMULS2chk:
                   2084:        bb0     0,r12,FMULcalc  /* S2 is not a denorm */
                   2085: FMULS2dnm:
                   2086:        or      r7,r0,r0        /* set S2 to zero */
                   2087:        or      r8,r0,r0
                   2088: FMULcalc:
                   2089:        bb1     5,r9,FMULdD     /* branch for double precision destination */
                   2090: FMULsD:
                   2091:        bb1     9,r9,FMULsDdS1  /* branch for double precision S1 */
                   2092: FMULsDsS1:
                   2093:        bb1     7,r9,FMULsDsS1dS2 /* branch for double precision S2 */
                   2094: FMULsDsS1sS2:
                   2095:        br.n    denorm_return
                   2096:         fmul.sss r6,r6,r8      /* (delay slot) multiply the two sources and place result in S1 */
                   2097: FMULsDsS1dS2:
                   2098:        br.n    denorm_return
                   2099:         fmul.ssd r6,r6,r7      /* (delay slot) multiply the two sources and place result in S1 */
                   2100: FMULsDdS1:
                   2101:        bb1     7,r9,FMULsDdS1dS2 /* branch for double precision S2 */
                   2102: FMULsDdS1sS2:
                   2103:        br.n    denorm_return
                   2104:         fmul.sds r6,r5,r8      /* (delay slot) multiply the two sources and place result in S1 */
                   2105: FMULsDdS1dS2:
                   2106:        br.n    denorm_return
                   2107:         fmul.sdd r6,r5,r7      /* (delay slot) multiply the two sources and place result in S1 */
                   2108: FMULdD:
                   2109:        bb1     9,r9,FMULdDdS1  /* branch for double precision S1 */
                   2110: FMULdDsS1:
                   2111:        bb1     7,r9,FMULdDsS1dS2 /* branch for double precision S2 */
                   2112: FMULdDsS1sS2:
                   2113:        br.n    denorm_return
                   2114:         fmul.dss r5,r6,r8      /* (delay slot) multiply the two sources and place result in S1 */
                   2115: FMULdDsS1dS2:
                   2116:        br.n    denorm_return
                   2117:         fmul.dsd r5,r6,r7      /* (delay slot) multiply the two sources and place result in S1 */
                   2118: FMULdDdS1:
                   2119:        bb1     7,r9,FMULdDdS1dS2 /* branch for double precision S2 */
                   2120: FMULdDdS1sS2:
                   2121:        br.n    denorm_return
                   2122:         fmul.dds r5,r5,r8      /* (delay slot) multiply the two sources and place result in S1 */
                   2123: FMULdDdS1dS2:
                   2124:        br.n    denorm_return
                   2125:         fmul.ddd r5,r5,r7      /* (delay slot) multiply the two sources and place result in S1 */
                   2126:
                   2127: denorm_FDIV:
                   2128:        bb0     1,r12,FDIVS2dnm /* S1 is not denorm, so S2 must be */
                   2129:        or      r5,r0,r0        /* set S1 to zero */
                   2130:        or      r6,r0,r0
                   2131: FDIVS2chk:
                   2132:        bb0     0,r12,FDIVcalc  /* S2 is not a denorm */
                   2133: FDIVS2dnm:
                   2134:        or      r7,r0,r0        /* set S2 to zero */
                   2135:        or      r8,r0,r0
                   2136: FDIVcalc:
                   2137:        bb1     5,r9,FDIVdD     /* branch for double precision destination */
                   2138: FDIVsD:
                   2139:        bb1     9,r9,FDIVsDdS1  /* branch for double precision S1 */
                   2140: FDIVsDsS1:
                   2141:        bb1     7,r9,FDIVsDsS1dS2 /* branch for double precision S2 */
                   2142: FDIVsDsS1sS2:
                   2143:        fdiv.sss r6,r6,r8       /* divide S1 by S2 and place result in S1 */
                   2144:        br      denorm_return   /* NOTE(review): fdiv is kept out of the delay slot here, unlike the other ops - reason not visible */
                   2145: FDIVsDsS1dS2:
                   2146:        fdiv.ssd r6,r6,r7       /* divide S1 by S2 and place result in S1 */
                   2147:        br      denorm_return
                   2148: FDIVsDdS1:
                   2149:        bb1     7,r9,FDIVsDdS1dS2 /* branch for double precision S2 */
                   2150: FDIVsDdS1sS2:
                   2151:        fdiv.sds r6,r5,r8       /* divide S1 by S2 and place result in S1 */
                   2152:        br      denorm_return
                   2153: FDIVsDdS1dS2:
                   2154:        fdiv.sdd r6,r5,r7       /* divide S1 by S2 and place result in S1 */
                   2155:        br      denorm_return
                   2156: FDIVdD:
                   2157:        bb1     9,r9,FDIVdDdS1  /* branch for double precision S1 */
                   2158: FDIVdDsS1:
                   2159:        bb1     7,r9,FDIVdDsS1dS2 /* branch for double precision S2 */
                   2160: FDIVdDsS1sS2:
                   2161:        fdiv.dss r5,r6,r8       /* divide S1 by S2 and place result in S1 */
                   2162:        br      denorm_return
                   2163: FDIVdDsS1dS2:
                   2164:        fdiv.dsd r5,r6,r7       /* divide S1 by S2 and place result in S1 */
                   2165:        br      denorm_return
                   2166: FDIVdDdS1:
                   2167:        bb1     7,r9,FDIVdDdS1dS2 /* branch for double precision S2 */
                   2168: FDIVdDdS1sS2:
                   2169:        fdiv.dds r5,r5,r8       /* divide S1 by S2 and place result in S1 */
                   2170:        br      denorm_return
                   2171: FDIVdDdS1dS2:
                   2172:        fdiv.ddd r5,r5,r7       /* divide S1 by S2 and place result in S1 */
                   2173:        br      denorm_return
                   2174:
                   2175: #if 0
                   2176: denorm_FSQRT:
                   2177:        or      r7,r0,r0        /* set S2 to zero */
                   2178:        or      r8,r0,r0
                   2179: FSQRTcalc:
                   2180:        bb1     5,r9,FSQRTdD    /* branch for double precision destination */
                   2181: FSQRTsD:
                   2182:        bb1     7,r9,FSQRTsDdS2 /* branch for double precision S2 */
                   2183: FSQRTsDsS2:
                   2184:        br.n    denorm_return
                   2185:         fsqrt.ss r6,r8         /* (delay slot) square root of S2, result in r6 */
                   2186: FSQRTsDdS2:
                   2187:        br.n    denorm_return
                   2188:         fsqrt.sd r6,r7         /* (delay slot) square root of S2, result in r6 */
                   2189: FSQRTdD:
                   2190:        bb1     7,r9,FSQRTdDdS2 /* branch for double precision S2 */
                   2191: FSQRTdDsS2:
                   2192:        br.n    denorm_return
                   2193:         fsqrt.ds r5,r8         /* (delay slot) square root of S2, result in r5 */
                   2194: FSQRTdDdS2:
                   2195:        br.n    denorm_return
                   2196:         fsqrt.dd r5,r7         /* (delay slot) square root of S2, result in r5 */
                   2197: #endif
                   2198:
                   2199: denorm_INT:
                   2200:        or      r7,r0,r0        /* set S2 to zero */
                   2201:        or      r8,r0,r0
                   2202: INTcalc:
                   2203:        bb1     7,r9,INTdS2     /* branch for double precision S2 */
                   2204: INTsS2:
                   2205:        br.n    denorm_return
                   2206:         int.ss r6,r8           /* (delay slot) convert S2 to integer, result in r6 */
                   2207: INTdS2:
                   2208:        br.n    denorm_return
                   2209:         int.sd r6,r7           /* (delay slot) convert S2 to integer, result in r6 */
                   2210:
                   2211: denorm_NINT:
                   2212:        or      r7,r0,r0        /* set S2 to zero */
                   2213:        or      r8,r0,r0
                   2214: NINTcalc:
                   2215:        bb1     7,r9,NINTdS2    /* branch for double precision S2 */
                   2216: NINTsS2:
                   2217:        br.n    denorm_return
                   2218:         nint.ss r6,r8          /* (delay slot) round S2 to nearest integer, result in r6 */
                   2219: NINTdS2:
                   2220:        br.n    denorm_return
                   2221:         nint.sd r6,r7          /* (delay slot) round S2 to nearest integer, result in r6 */
                   2222:
                   2223: denorm_TRNC:
                   2224:        or      r7,r0,r0        /* set S2 to zero */
                   2225:        or      r8,r0,r0
                   2226: TRNCcalc:
                   2227:        bb1     7,r9,TRNCdS2    /* branch for double precision S2 */
                   2228: TRNCsS2:
                   2229:        br.n    denorm_return
                   2230:         trnc.ss r6,r8          /* (delay slot) truncate S2 to integer, result in r6 */
                   2231: TRNCdS2:
                   2232:        trnc.sd r6,r7           /* truncate S2 to integer, result in r6; falls through to denorm_return */
                   2233:
                   2234:
                   2235: /* Return to the routine that detected the reserved operand. */
                   2236:
                   2237: denorm_return:
                   2238:        ld      r1,r31,0        /* load return address */
                   2239:        jmp     r1              /* return to the caller */
                   2240:
                   2241: /* S1 and/or S2 is an infinity, and the other operand may be a zero. */
                   2242: /* Knowing which operands are infinity, check the remaining operands for zeros. */
                   2243:
                   2244: ASLOCAL(zero)
                   2245:        bb0     s1inf,r12,S1noinf       /* S1 is not infinity: check S1 for zero */
                   2246:        bb0     s2inf,r12,S2noinf       /* S2 is not infinity: check S2 for zero */
                   2247:        jmp     r1                      /* both are infinity: nothing to check */
                   2248:
                   2249: /* See if S1 is zero. Whether or not S1 is a zero, being in this routine */
                   2250: /* implies that S2 is infinity, so return to subroutine infinity after */
                   2251: /* completing this code. Set the s1zero flag in r12 if S1 is zero. */
                   2252:
                   2253: S1noinf:
                   2254:        bb1     s1size,r9,S1noinfd      /* work with double precision operand */
                   2255: S1noinfs:
                   2256:        or      r10,r0,r5               /* load high word into r10 */
                   2257:        clr     r10,r10,1<sign>         /* clear the sign bit */
                   2258:        extu    r11,r6,3<29>            /* extract lower 3 bits of mantissa */
                   2259:        or      r10,r10,r11             /* or these 3 bits with high word */
                   2260:        bcnd    ne0,r10,operation       /* S1 is nonzero: do not set zero flag */
                   2261:        jmp.n   r1                      /* since this operand was not */
                   2262:                                        /* infinity, S2 must have been, */
                   2263:                                        /* so return */
                   2264:         set    r12,r12,1<s1zero>       /* (delay slot) set zeroflag */
                   2265: S1noinfd:
                   2266:        clr     r10,r5,1<sign>          /* clear the sign bit */
                   2267:        or      r10,r6,r10              /* or high and low word */
                   2268:        bcnd    ne0,r10,operation       /* S1 is nonzero: do not set zero flag */
                   2269:        jmp.n   r1                      /* since this operand was not */
                   2270:                                        /* infinity, S2 must have been, */
                   2271:                                        /* so return */
                   2272:         set    r12,r12,1<s1zero>       /* (delay slot) set zeroflag */
                   2273:
                   2274:
                   2275: /* Check S2 for zero. If it is zero, then set the s2zero flag in r12. */
                   2276:
                   2277: S2noinf:
                   2278:        bb1     s2size,r9,S2noinfd      /* work with double precision operand */
                   2279: S2noinfs:
                   2280:        or      r10,r0,r7               /* load high word into r10 */
                   2281:        clr     r10,r10,1<sign>         /* clear the sign bit */
                   2282:        extu    r11,r8,3<29>            /* extract lower 3 bits of mantissa */
                   2283:        or      r10,r10,r11             /* or these 3 bits with high word */
                   2284:        bcnd    ne0,r10,operation       /* S2 is nonzero: do not set zero flag */
                   2285:        jmp.n   r1                      /* since this operand was not */
                   2286:                                        /* infinity, S1 must have been, */
                   2287:                                        /* so return */
                   2288:         set    r12,r12,1<s2zero>       /* (delay slot) set zeroflag */
                   2289: S2noinfd:
                   2290:        clr     r10,r7,1<sign>          /* clear the sign bit */
                   2291:        or      r10,r8,r10              /* or high and low word */
                   2292:        bcnd    ne0,r10,operation       /* S2 is nonzero: do not set zero flag */
                   2293:        set     r12,r12,1<s2zero>       /* set zeroflag */
                   2294:                                        /* since this operand was not */
                   2295:                                        /* infinity, S1 must have been, */
                   2296:                                        /* so fall through and return */
                   2297: operation:
                   2298:        jmp     r1                      /* return to the caller */
                   2299:
                   2300: ASENTRY(Xfp_imprecise)
                   2301: /* input: r3 is the exception frame */
                   2302:        or      r29, r3, r0             /* r29 is now the E.F. */
                   2303:        subu    r31, r31, 16            /* make a 16 byte stack frame */
                   2304:        st      r1,  r31, 4             /* save return address */
                   2305:        st      r29, r31, 8             /* save E.F. pointer */
                   2306:
                   2307:        ld      r2 , r29, EF_FPSR  * 4  /* r2  = FPSR saved in the E.F. */
                   2308:        ld      r3 , r29, EF_FPCR  * 4  /* r3  = FPCR saved in the E.F. */
                   2309:        ld      r4 , r29, EF_FPECR * 4  /* r4  = FPECR saved in the E.F. */
                   2310:        ld      r10, r29, EF_FPRH  * 4  /* r10 = FPRH saved in the E.F. */
                   2311:        ld      r11, r29, EF_FPRL  * 4  /* r11 = FPRL saved in the E.F. */
                   2312:        ld      r12, r29, EF_FPIT  * 4  /* r12 = FPIT saved in the E.F. */
                   2313:
                   2314: /* Load into r1 the return address for the exception handlers. Looking */
                   2315: /* at FPECR, branch to the appropriate exception handler. */
                   2316:
                   2317:        or.u    r1,r0,hi16(fpui_wrapup)/* load return address of functions */
                   2318:        or      r1,r1,lo16(fpui_wrapup)
                   2319:
                   2320:        bb0     2,r4,2f                 /* skip unless FPECR bit 2 is set */
                   2321:        br      _ASM_LABEL(FPunderflow) /* bit 2 set: go to FPunderflow */
                   2322: 2:
                   2323:        bb0     1,r4,3f                 /* skip unless FPECR bit 1 is set */
                   2324:        br      _ASM_LABEL(FPoverflow)  /* bit 1 set: go to FPoverflow */
                   2325: 3:
                   2326:        /* XXX handle inexact!!! */
                   2327:
                   2328: fpui_wrapup:
                   2329:        tb1     0,r0,0          /* make sure all floating point operations */
                   2330:                                /* have finished */
                   2331:        ldcr    r4, cr1 /* load the PSR */
                   2332: #if 0
                   2333:        set     r4, r4, 1<PSR_FPU_DISABLE_BIT>
                   2334: #endif
                   2335:        set     r4, r4, 1<PSR_INTERRUPT_DISABLE_BIT>    /* set the interrupt disable bit */
                   2336:        stcr    r4, cr1         /* write the PSR back */
                   2337:        ld      r1, r31, 4      /* restore return address */
                   2338:        ld      r29,r31, 8      /* restore E.F. pointer */
                   2339:        addu    r31, r31, 16    /* release the stack frame */
                   2340:
                   2341:        fstcr   r2, FPSR        /* write revised value of FPSR */
                   2342:        fstcr   r3, FPCR        /* write revised value of FPCR */
                   2343:
                   2344:        /* write back the results */
                   2345:        extu    r2, r12, 5<0>   /* low 5 bits of FPIT (presumably the destination register number) */
                   2346:        bb0.n   destsize, r12, Iwritesingle     /* single size destination: one word only */
                   2347:         addu   r3, r29, EF_R0 * 4      /* (delay slot) r3 = address of the EF_R0 slot in the E.F. */
                   2348:        st      r10, r3 [r2]    /* double: store high word in slot r2 */
                   2349:        addu    r2, r2, 1       /* advance to the next slot ... */
                   2350:        clr     r2, r2, 27<5>   /* ... keeping only the low 5 bits (wrap modulo 32) */
                   2351: Iwritesingle:
                   2352:        jmp.n   r1              /* return to the caller */
                   2353:         st     r11, r3 [r2]    /* (delay slot) store low word in slot r2 */
CVSweb