sys/arch/m68k/fpsp/scale.sa - annotate

Return to scale.sa CVS log
Up to [local] / sys / arch / m68k / fpsp
Annotation of sys/arch/m68k/fpsp/scale.sa, Revision 1.1.1.1

1.1       nbrk        1: *      $OpenBSD: scale.sa,v 1.2 1996/05/29 21:05:36 niklas Exp $
                      2: *      $NetBSD: scale.sa,v 1.3 1994/10/26 07:49:34 cgd Exp $
                      3:
                      4: *      MOTOROLA MICROPROCESSOR & MEMORY TECHNOLOGY GROUP
                      5: *      M68000 Hi-Performance Microprocessor Division
                      6: *      M68040 Software Package
                      7: *
                      8: *      M68040 Software Package Copyright (c) 1993, 1994 Motorola Inc.
                      9: *      All rights reserved.
                     10: *
                     11: *      THE SOFTWARE is provided on an "AS IS" basis and without warranty.
                     12: *      To the maximum extent permitted by applicable law,
                     13: *      MOTOROLA DISCLAIMS ALL WARRANTIES WHETHER EXPRESS OR IMPLIED,
                     14: *      INCLUDING IMPLIED WARRANTIES OF MERCHANTABILITY OR FITNESS FOR A
                     15: *      PARTICULAR PURPOSE and any warranty against infringement with
                     16: *      regard to the SOFTWARE (INCLUDING ANY MODIFIED VERSIONS THEREOF)
                     17: *      and any accompanying written materials.
                     18: *
                     19: *      To the maximum extent permitted by applicable law,
                     20: *      IN NO EVENT SHALL MOTOROLA BE LIABLE FOR ANY DAMAGES WHATSOEVER
                     21: *      (INCLUDING WITHOUT LIMITATION, DAMAGES FOR LOSS OF BUSINESS
                     22: *      PROFITS, BUSINESS INTERRUPTION, LOSS OF BUSINESS INFORMATION, OR
                     23: *      OTHER PECUNIARY LOSS) ARISING OF THE USE OR INABILITY TO USE THE
                     24: *      SOFTWARE.  Motorola assumes no responsibility for the maintenance
                     25: *      and support of the SOFTWARE.
                     26: *
                     27: *      You are hereby granted a copyright license to use, modify, and
                     28: *      distribute the SOFTWARE so long as this entire notice is retained
                     29: *      without alteration in any modified and/or redistributed versions,
                     30: *      and that such modified versions are clearly identified as such.
                     31: *      No licenses are granted by implication, estoppel or otherwise
                     32: *      under any patents or trademarks of Motorola, Inc.
                     33:
                     34: *
                     35: *      scale.sa 3.3 7/30/91
                     36: *
                     37: *      The entry point sSCALE computes the destination operand
                     38: *      scaled by the source operand.  If the absoulute value of
                     39: *      the source operand is (>= 2^14) an overflow or underflow
                     40: *      is returned.
                     41: *
                     42: *      The entry point sscale is called from do_func to emulate
                     43: *      the fscale unimplemented instruction.
                     44: *
                     45: *      Input: Double-extended destination operand in FPTEMP,
                     46: *              double-extended source operand in ETEMP.
                     47: *
                     48: *      Output: The function returns scale(X,Y) to fp0.
                     49: *
                     50: *      Modifies: fp0.
                     51: *
                     52: *      Algorithm:
                     53: *
                     54:
                     55: SCALE    IDNT    2,1 Motorola 040 Floating Point Software Package
                     56:
                     57:        section 8
                     58:
                     59:        include fpsp.h
                     60:
                     61:        xref    t_ovfl2
                     62:        xref    t_unfl
                     63:        xref    round
                     64:        xref    t_resdnrm
                     65:
                     66: SRC_BNDS dc.w  $3fff,$400c
                     67:
                     68: *
                     69: * This entry point is used by the unimplemented instruction exception
                     70: * handler.
                     71: *
                     72: *
                     73: *
                     74: *      FSCALE
                     75: *
                     76:        xdef    sscale
                     77: sscale:
                     78:        fmove.l         #0,fpcr         ;clr user enabled exc
                     79:        clr.l           d1
                     80:        move.w          FPTEMP(a6),d1   ;get dest exponent
                     81:        smi             L_SCR1(a6)      ;use L_SCR1 to hold sign
                     82:        andi.l          #$7fff,d1       ;strip sign
                     83:        move.w          ETEMP(a6),d0    ;check src bounds
                     84:        andi.w          #$7fff,d0       ;clr sign bit
                     85:        cmp2.w          SRC_BNDS,d0
                     86:        bcc.b           src_in
                     87:        cmpi.w          #$400c,d0       ;test for too large
                     88:        bge.w           src_out
                     89: *
                     90: * The source input is below 1, so we check for denormalized numbers
                     91: * and set unfl.
                     92: *
                     93: src_small:
                     94:        move.b          DTAG(a6),d0
                     95:        andi.b          #$e0,d0
                     96:        tst.b           d0
                     97:        beq.b           no_denorm
                     98:        st              STORE_FLG(a6)   ;dest already contains result
                     99:        or.l            #unfl_mask,USER_FPSR(a6) ;set UNFL
                    100: den_done:
                    101:        lea.l           FPTEMP(a6),a0
                    102:        bra             t_resdnrm
                    103: no_denorm:
                    104:        fmove.l         USER_FPCR(a6),FPCR
                    105:        fmove.x         FPTEMP(a6),fp0  ;simply return dest
                    106:        rts
                    107:
                    108:
                    109: *
                    110: * Source is within 2^14 range.  To perform the int operation,
                    111: * move it to d0.
                    112: *
                    113: src_in:
                    114:        fmove.x         ETEMP(a6),fp0   ;move in src for int
                    115:        fmove.l         #rz_mode,fpcr   ;force rz for src conversion
                    116:        fmove.l         fp0,d0          ;int src to d0
                    117:        fmove.l         #0,FPSR         ;clr status from above
                    118:        tst.w           ETEMP(a6)       ;check src sign
                    119:        blt.w           src_neg
                    120: *
                    121: * Source is positive.  Add the src to the dest exponent.
                    122: * The result can be denormalized, if src = 0, or overflow,
                    123: * if the result of the add sets a bit in the upper word.
                    124: *
                    125: src_pos:
                    126:        tst.w           d1              ;check for denorm
                    127:        beq.w           dst_dnrm
                    128:        add.l           d0,d1           ;add src to dest exp
                    129:        beq.b           denorm          ;if zero, result is denorm
                    130:        cmpi.l          #$7fff,d1       ;test for overflow
                    131:        bge.b           ovfl
                    132:        tst.b           L_SCR1(a6)
                    133:        beq.b           spos_pos
                    134:        or.w            #$8000,d1
                    135: spos_pos:
                    136:        move.w          d1,FPTEMP(a6)   ;result in FPTEMP
                    137:        fmove.l         USER_FPCR(a6),FPCR
                    138:        fmove.x         FPTEMP(a6),fp0  ;write result to fp0
                    139:        rts
                    140: ovfl:
                    141:        tst.b           L_SCR1(a6)
                    142:        beq.b           sovl_pos
                    143:        or.w            #$8000,d1
                    144: sovl_pos:
                    145:        move.w          FPTEMP(a6),ETEMP(a6)    ;result in ETEMP
                    146:        move.l          FPTEMP_HI(a6),ETEMP_HI(a6)
                    147:        move.l          FPTEMP_LO(a6),ETEMP_LO(a6)
                    148:        bra             t_ovfl2
                    149:
                    150: denorm:
                    151:        tst.b           L_SCR1(a6)
                    152:        beq.b           den_pos
                    153:        or.w            #$8000,d1
                    154: den_pos:
                    155:        tst.l           FPTEMP_HI(a6)   ;check j bit
                    156:        blt.b           nden_exit       ;if set, not denorm
                    157:        move.w          d1,ETEMP(a6)    ;input expected in ETEMP
                    158:        move.l          FPTEMP_HI(a6),ETEMP_HI(a6)
                    159:        move.l          FPTEMP_LO(a6),ETEMP_LO(a6)
                    160:        or.l            #unfl_bit,USER_FPSR(a6) ;set unfl
                    161:        lea.l           ETEMP(a6),a0
                    162:        bra             t_resdnrm
                    163: nden_exit:
                    164:        move.w          d1,FPTEMP(a6)   ;result in FPTEMP
                    165:        fmove.l         USER_FPCR(a6),FPCR
                    166:        fmove.x         FPTEMP(a6),fp0  ;write result to fp0
                    167:        rts
                    168:
                    169: *
                    170: * Source is negative.  Add the src to the dest exponent.
                    171: * (The result exponent will be reduced).  The result can be
                    172: * denormalized.
                    173: *
                    174: src_neg:
                    175:        add.l           d0,d1           ;add src to dest
                    176:        beq.b           denorm          ;if zero, result is denorm
                    177:        blt.b           fix_dnrm        ;if negative, result is
                    178: *                                      ;needing denormalization
                    179:        tst.b           L_SCR1(a6)
                    180:        beq.b           sneg_pos
                    181:        or.w            #$8000,d1
                    182: sneg_pos:
                    183:        move.w          d1,FPTEMP(a6)   ;result in FPTEMP
                    184:        fmove.l         USER_FPCR(a6),FPCR
                    185:        fmove.x         FPTEMP(a6),fp0  ;write result to fp0
                    186:        rts
                    187:
                    188:
                    189: *
                    190: * The result exponent is below denorm value.  Test for catastrophic
                    191: * underflow and force zero if true.  If not, try to shift the
                    192: * mantissa right until a zero exponent exists.
                    193: *
                    194: fix_dnrm:
                    195:        cmpi.w          #$ffc0,d1       ;lower bound for normalization
                    196:        blt.w           fix_unfl        ;if lower, catastrophic unfl
                    197:        move.w          d1,d0           ;use d0 for exp
                    198:        move.l          d2,-(a7)        ;free d2 for norm
                    199:        move.l          FPTEMP_HI(a6),d1
                    200:        move.l          FPTEMP_LO(a6),d2
                    201:        clr.l           L_SCR2(a6)
                    202: fix_loop:
                    203:        add.w           #1,d0           ;drive d0 to 0
                    204:        lsr.l           #1,d1           ;while shifting the
                    205:        roxr.l          #1,d2           ;mantissa to the right
                    206:        bcc.b           no_carry
                    207:        st              L_SCR2(a6)      ;use L_SCR2 to capture inex
                    208: no_carry:
                    209:        tst.w           d0              ;it is finished when
                    210:        blt.b           fix_loop        ;d0 is zero or the mantissa
                    211:        tst.b           L_SCR2(a6)
                    212:        beq.b           tst_zero
                    213:        or.l            #unfl_inx_mask,USER_FPSR(a6)
                    214: *                                      ;set unfl, aunfl, ainex
                    215: *
                    216: * Test for zero. If zero, simply use fmove to return +/- zero
                    217: * to the fpu.
                    218: *
                    219: tst_zero:
                    220:        clr.w           FPTEMP_EX(a6)
                    221:        tst.b           L_SCR1(a6)      ;test for sign
                    222:        beq.b           tst_con
                    223:        or.w            #$8000,FPTEMP_EX(a6) ;set sign bit
                    224: tst_con:
                    225:        move.l          d1,FPTEMP_HI(a6)
                    226:        move.l          d2,FPTEMP_LO(a6)
                    227:        move.l          (a7)+,d2
                    228:        tst.l           d1
                    229:        bne.b           not_zero
                    230:        tst.l           FPTEMP_LO(a6)
                    231:        bne.b           not_zero
                    232: *
                    233: * Result is zero.  Check for rounding mode to set lsb.  If the
                    234: * mode is rp, and the zero is positive, return smallest denorm.
                    235: * If the mode is rm, and the zero is negative, return smallest
                    236: * negative denorm.
                    237: *
                    238:        btst.b          #5,FPCR_MODE(a6) ;test if rm or rp
                    239:        beq.b           no_dir
                    240:        btst.b          #4,FPCR_MODE(a6) ;check which one
                    241:        beq.b           zer_rm
                    242: zer_rp:
                    243:        tst.b           L_SCR1(a6)      ;check sign
                    244:        bne.b           no_dir          ;if set, neg op, no inc
                    245:        move.l          #1,FPTEMP_LO(a6) ;set lsb
                    246:        bra.b           sm_dnrm
                    247: zer_rm:
                    248:        tst.b           L_SCR1(a6)      ;check sign
                    249:        beq.b           no_dir          ;if clr, neg op, no inc
                    250:        move.l          #1,FPTEMP_LO(a6) ;set lsb
                    251:        or.l            #neg_mask,USER_FPSR(a6) ;set N
                    252:        bra.b           sm_dnrm
                    253: no_dir:
                    254:        fmove.l         USER_FPCR(a6),FPCR
                    255:        fmove.x         FPTEMP(a6),fp0  ;use fmove to set cc's
                    256:        rts
                    257:
                    258: *
                    259: * The rounding mode changed the zero to a smallest denorm. Call
                    260: * t_resdnrm with exceptional operand in ETEMP.
                    261: *
                    262: sm_dnrm:
                    263:        move.l          FPTEMP_EX(a6),ETEMP_EX(a6)
                    264:        move.l          FPTEMP_HI(a6),ETEMP_HI(a6)
                    265:        move.l          FPTEMP_LO(a6),ETEMP_LO(a6)
                    266:        lea.l           ETEMP(a6),a0
                    267:        bra             t_resdnrm
                    268:
                    269: *
                    270: * Result is still denormalized.
                    271: *
                    272: not_zero:
                    273:        or.l            #unfl_mask,USER_FPSR(a6) ;set unfl
                    274:        tst.b           L_SCR1(a6)      ;check for sign
                    275:        beq.b           fix_exit
                    276:        or.l            #neg_mask,USER_FPSR(a6) ;set N
                    277: fix_exit:
                    278:        bra.b           sm_dnrm
                    279:
                    280:
                    281: *
                    282: * The result has underflowed to zero. Return zero and set
                    283: * unfl, aunfl, and ainex.
                    284: *
                    285: fix_unfl:
                    286:        or.l            #unfl_inx_mask,USER_FPSR(a6)
                    287:        btst.b          #5,FPCR_MODE(a6) ;test if rm or rp
                    288:        beq.b           no_dir2
                    289:        btst.b          #4,FPCR_MODE(a6) ;check which one
                    290:        beq.b           zer_rm2
                    291: zer_rp2:
                    292:        tst.b           L_SCR1(a6)      ;check sign
                    293:        bne.b           no_dir2         ;if set, neg op, no inc
                    294:        clr.l           FPTEMP_EX(a6)
                    295:        clr.l           FPTEMP_HI(a6)
                    296:        move.l          #1,FPTEMP_LO(a6) ;set lsb
                    297:        bra.b           sm_dnrm         ;return smallest denorm
                    298: zer_rm2:
                    299:        tst.b           L_SCR1(a6)      ;check sign
                    300:        beq.b           no_dir2         ;if clr, neg op, no inc
                    301:        move.w          #$8000,FPTEMP_EX(a6)
                    302:        clr.l           FPTEMP_HI(a6)
                    303:        move.l          #1,FPTEMP_LO(a6) ;set lsb
                    304:        or.l            #neg_mask,USER_FPSR(a6) ;set N
                    305:        bra.w           sm_dnrm         ;return smallest denorm
                    306:
                    307: no_dir2:
                    308:        tst.b           L_SCR1(a6)
                    309:        bge.b           pos_zero
                    310: neg_zero:
                    311:        clr.l           FP_SCR1(a6)     ;clear the exceptional operand
                    312:        clr.l           FP_SCR1+4(a6)   ;for gen_except.
                    313:        clr.l           FP_SCR1+8(a6)
                    314:        fmove.s         #:80000000,fp0
                    315:        rts
                    316: pos_zero:
                    317:        clr.l           FP_SCR1(a6)     ;clear the exceptional operand
                    318:        clr.l           FP_SCR1+4(a6)   ;for gen_except.
                    319:        clr.l           FP_SCR1+8(a6)
                    320:        fmove.s         #:00000000,fp0
                    321:        rts
                    322:
                    323: *
                    324: * The destination is a denormalized number.  It must be handled
                    325: * by first shifting the bits in the mantissa until it is normalized,
                    326: * then adding the remainder of the source to the exponent.
                    327: *
                    328: dst_dnrm:
                    329:        movem.l         d2/d3,-(a7)
                    330:        move.w          FPTEMP_EX(a6),d1
                    331:        move.l          FPTEMP_HI(a6),d2
                    332:        move.l          FPTEMP_LO(a6),d3
                    333: dst_loop:
                    334:        tst.l           d2              ;test for normalized result
                    335:        blt.b           dst_norm        ;exit loop if so
                    336:        tst.l           d0              ;otherwise, test shift count
                    337:        beq.b           dst_fin         ;if zero, shifting is done
                    338:        subq.l          #1,d0           ;dec src
                    339:        add.l           d3,d3
                    340:        addx.l          d2,d2
                    341:        bra.b           dst_loop
                    342: *
                    343: * Destination became normalized.  Simply add the remaining
                    344: * portion of the src to the exponent.
                    345: *
                    346: dst_norm:
                    347:        add.w           d0,d1           ;dst is normalized; add src
                    348:        tst.b           L_SCR1(a6)
                    349:        beq.b           dnrm_pos
                    350:        or.w            #$8000,d1
                    351: dnrm_pos:
                    352:        movem.w         d1,FPTEMP_EX(a6)
                    353:        movem.l         d2,FPTEMP_HI(a6)
                    354:        movem.l         d3,FPTEMP_LO(a6)
                    355:        fmove.l         USER_FPCR(a6),FPCR
                    356:        fmove.x         FPTEMP(a6),fp0
                    357:        movem.l         (a7)+,d2/d3
                    358:        rts
                    359:
                    360: *
                    361: * Destination remained denormalized.  Call t_excdnrm with
                    362: * exceptional operand in ETEMP.
                    363: *
                    364: dst_fin:
                    365:        tst.b           L_SCR1(a6)      ;check for sign
                    366:        beq.b           dst_exit
                    367:        or.l            #neg_mask,USER_FPSR(a6) ;set N
                    368:        or.w            #$8000,d1
                    369: dst_exit:
                    370:        movem.w         d1,ETEMP_EX(a6)
                    371:        movem.l         d2,ETEMP_HI(a6)
                    372:        movem.l         d3,ETEMP_LO(a6)
                    373:        or.l            #unfl_mask,USER_FPSR(a6) ;set unfl
                    374:        movem.l         (a7)+,d2/d3
                    375:        lea.l           ETEMP(a6),a0
                    376:        bra             t_resdnrm
                    377:
                    378: *
                    379: * Source is outside of 2^14 range.  Test the sign and branch
                    380: * to the appropriate exception handler.
                    381: *
                    382: src_out:
                    383:        tst.b           L_SCR1(a6)
                    384:        beq.b           scro_pos
                    385:        or.w            #$8000,d1
                    386: scro_pos:
                    387:        move.l          FPTEMP_HI(a6),ETEMP_HI(a6)
                    388:        move.l          FPTEMP_LO(a6),ETEMP_LO(a6)
                    389:        tst.w           ETEMP(a6)
                    390:        blt.b           res_neg
                    391: res_pos:
                    392:        move.w          d1,ETEMP(a6)    ;result in ETEMP
                    393:        bra             t_ovfl2
                    394: res_neg:
                    395:        move.w          d1,ETEMP(a6)    ;result in ETEMP
                    396:        lea.l           ETEMP(a6),a0
                    397:        bra             t_unfl
                    398:        end
CVSweb