123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040 |
- |
- | res_func.sa 3.9 7/29/91
- |
- | Normalizes denormalized numbers if necessary and updates the
- | stack frame. The function is then restored back into the
- | machine and the 040 completes the operation. This routine
- | is only used by the unsupported data type/format handler.
- | (Exception vector 55).
- |
- | For packed move out (fmove.p fpm,<ea>) the operation is
- | completed here; data is packed and moved to user memory.
- | The stack is restored to the 040 only in the case of a
- | reportable exception in the conversion.
- |
- |
- | Copyright (C) Motorola, Inc. 1990
- | All Rights Reserved
- |
- | For details on the license for this file, please see the
- | file, README, in this same directory.
- RES_FUNC: |idnt 2,1 | Motorola 040 Floating Point Software Package
- |section 8
- #include "fpsp.h"
- sp_bnds: .short 0x3f81,0x407e
- .short 0x3f6a,0x0000
- dp_bnds: .short 0x3c01,0x43fe
- .short 0x3bcd,0x0000
- |xref mem_write
- |xref bindec
- |xref get_fline
- |xref round
- |xref denorm
- |xref dest_ext
- |xref dest_dbl
- |xref dest_sgl
- |xref unf_sub
- |xref nrm_set
- |xref dnrm_lp
- |xref ovf_res
- |xref reg_dest
- |xref t_ovfl
- |xref t_unfl
- .global res_func
- .global p_move
- res_func:
- clrb DNRM_FLG(%a6)
- clrb RES_FLG(%a6)
- clrb CU_ONLY(%a6)
- tstb DY_MO_FLG(%a6)
- beqs monadic
- dyadic:
- btstb #7,DTAG(%a6) |if dop = norm=000, zero=001,
- | ;inf=010 or nan=011
- beqs monadic |then branch
- | ;else denorm
- | HANDLE DESTINATION DENORM HERE
- | ;set dtag to norm
- | ;write the tag & fpte15 to the fstack
- leal FPTEMP(%a6),%a0
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsr nrm_set |normalize number (exp will go negative)
- bclrb #sign_bit,LOCAL_EX(%a0) |get rid of false sign
- bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format
- beqs dpos
- bsetb #sign_bit,LOCAL_EX(%a0)
- dpos:
- bfclr DTAG(%a6){#0:#4} |set tag to normalized, FPTE15 = 0
- bsetb #4,DTAG(%a6) |set FPTE15
- orb #0x0f,DNRM_FLG(%a6)
- monadic:
- leal ETEMP(%a6),%a0
- btstb #direction_bit,CMDREG1B(%a6) |check direction
- bne opclass3 |it is a mv out
- |
- | At this point, only opclass 0 and 2 possible
- |
- btstb #7,STAG(%a6) |if sop = norm=000, zero=001,
- | ;inf=010 or nan=011
- bne mon_dnrm |else denorm
- tstb DY_MO_FLG(%a6) |all cases of dyadic instructions would
- bne normal |require normalization of denorm
- | At this point:
- | monadic instructions: fabs = $18 fneg = $1a ftst = $3a
- | fmove = $00 fsmove = $40 fdmove = $44
- | fsqrt = $05* fssqrt = $41 fdsqrt = $45
- | (*fsqrt reencoded to $05)
- |
- movew CMDREG1B(%a6),%d0 |get command register
- andil #0x7f,%d0 |strip to only command word
- |
- | At this point, fabs, fneg, fsmove, fdmove, ftst, fsqrt, fssqrt, and
- | fdsqrt are possible.
- | For cases fabs, fneg, fsmove, and fdmove goto spos (do not normalize)
- | For cases fsqrt, fssqrt, and fdsqrt goto nrm_src (do normalize)
- |
- btstl #0,%d0
- bne normal |weed out fsqrt instructions
- |
- | cu_norm handles fmove in instructions with normalized inputs.
- | The routine round is used to correctly round the input for the
- | destination precision and mode.
- |
- cu_norm:
- st CU_ONLY(%a6) |set cu-only inst flag
- movew CMDREG1B(%a6),%d0
- andib #0x3b,%d0 |isolate bits to select inst
- tstb %d0
- beql cu_nmove |if zero, it is an fmove
- cmpib #0x18,%d0
- beql cu_nabs |if $18, it is fabs
- cmpib #0x1a,%d0
- beql cu_nneg |if $1a, it is fneg
- |
- | Inst is ftst. Check the source operand and set the cc's accordingly.
- | No write is done, so simply rts.
- |
- cu_ntst:
- movew LOCAL_EX(%a0),%d0
- bclrl #15,%d0
- sne LOCAL_SGN(%a0)
- beqs cu_ntpo
- orl #neg_mask,USER_FPSR(%a6) |set N
- cu_ntpo:
- cmpiw #0x7fff,%d0 |test for inf/nan
- bnes cu_ntcz
- tstl LOCAL_HI(%a0)
- bnes cu_ntn
- tstl LOCAL_LO(%a0)
- bnes cu_ntn
- orl #inf_mask,USER_FPSR(%a6)
- rts
- cu_ntn:
- orl #nan_mask,USER_FPSR(%a6)
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- rts
- cu_ntcz:
- tstl LOCAL_HI(%a0)
- bnel cu_ntsx
- tstl LOCAL_LO(%a0)
- bnel cu_ntsx
- orl #z_mask,USER_FPSR(%a6)
- cu_ntsx:
- rts
- |
- | Inst is fabs. Execute the absolute value function on the input.
- | Branch to the fmove code. If the operand is NaN, do nothing.
- |
- cu_nabs:
- moveb STAG(%a6),%d0
- btstl #5,%d0 |test for NaN or zero
- bne wr_etemp |if either, simply write it
- bclrb #7,LOCAL_EX(%a0) |do abs
- bras cu_nmove |fmove code will finish
- |
- | Inst is fneg. Execute the negate value function on the input.
- | Fall though to the fmove code. If the operand is NaN, do nothing.
- |
- cu_nneg:
- moveb STAG(%a6),%d0
- btstl #5,%d0 |test for NaN or zero
- bne wr_etemp |if either, simply write it
- bchgb #7,LOCAL_EX(%a0) |do neg
- |
- | Inst is fmove. This code also handles all result writes.
- | If bit 2 is set, round is forced to double. If it is clear,
- | and bit 6 is set, round is forced to single. If both are clear,
- | the round precision is found in the fpcr. If the rounding precision
- | is double or single, round the result before the write.
- |
- cu_nmove:
- moveb STAG(%a6),%d0
- andib #0xe0,%d0 |isolate stag bits
- bne wr_etemp |if not norm, simply write it
- btstb #2,CMDREG1B+1(%a6) |check for rd
- bne cu_nmrd
- btstb #6,CMDREG1B+1(%a6) |check for rs
- bne cu_nmrs
- |
- | The move or operation is not with forced precision. Test for
- | nan or inf as the input; if so, simply write it to FPn. Use the
- | FPCR_MODE byte to get rounding on norms and zeros.
- |
- cu_nmnr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0
- tstb %d0 |check for extended
- beq cu_wrexn |if so, just write result
- cmpib #1,%d0 |check for single
- beq cu_nmrs |fall through to double
- |
- | The move is fdmove or round precision is double.
- |
- cu_nmrd:
- movel #2,%d0 |set up the size for denorm
- movew LOCAL_EX(%a0),%d1 |compare exponent to double threshold
- andw #0x7fff,%d1
- cmpw #0x3c01,%d1
- bls cu_nunfl
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rmode
- orl #0x00020000,%d1 |or in rprec (double)
- clrl %d0 |clear g,r,s for round
- bclrb #sign_bit,LOCAL_EX(%a0) |convert to internal format
- sne LOCAL_SGN(%a0)
- bsrl round
- bfclr LOCAL_SGN(%a0){#0:#8}
- beqs cu_nmrdc
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nmrdc:
- movew LOCAL_EX(%a0),%d1 |check for overflow
- andw #0x7fff,%d1
- cmpw #0x43ff,%d1
- bge cu_novfl |take care of overflow case
- bra cu_wrexn
- |
- | The move is fsmove or round precision is single.
- |
- cu_nmrs:
- movel #1,%d0
- movew LOCAL_EX(%a0),%d1
- andw #0x7fff,%d1
- cmpw #0x3f81,%d1
- bls cu_nunfl
- bfextu FPCR_MODE(%a6){#2:#2},%d1
- orl #0x00010000,%d1
- clrl %d0
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsrl round
- bfclr LOCAL_SGN(%a0){#0:#8}
- beqs cu_nmrsc
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nmrsc:
- movew LOCAL_EX(%a0),%d1
- andw #0x7FFF,%d1
- cmpw #0x407f,%d1
- blt cu_wrexn
- |
- | The operand is above precision boundaries. Use t_ovfl to
- | generate the correct value.
- |
- cu_novfl:
- bsr t_ovfl
- bra cu_wrexn
- |
- | The operand is below precision boundaries. Use denorm to
- | generate the correct value.
- |
- cu_nunfl:
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsr denorm
- bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format
- beqs cu_nucont
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nucont:
- bfextu FPCR_MODE(%a6){#2:#2},%d1
- btstb #2,CMDREG1B+1(%a6) |check for rd
- bne inst_d
- btstb #6,CMDREG1B+1(%a6) |check for rs
- bne inst_s
- swap %d1
- moveb FPCR_MODE(%a6),%d1
- lsrb #6,%d1
- swap %d1
- bra inst_sd
- inst_d:
- orl #0x00020000,%d1
- bra inst_sd
- inst_s:
- orl #0x00010000,%d1
- inst_sd:
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsrl round
- bfclr LOCAL_SGN(%a0){#0:#8}
- beqs cu_nuflp
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nuflp:
- btstb #inex2_bit,FPSR_EXCEPT(%a6)
- beqs cu_nuninx
- orl #aunfl_mask,USER_FPSR(%a6) |if the round was inex, set AUNFL
- cu_nuninx:
- tstl LOCAL_HI(%a0) |test for zero
- bnes cu_nunzro
- tstl LOCAL_LO(%a0)
- bnes cu_nunzro
- |
- | The mantissa is zero from the denorm loop. Check sign and rmode
- | to see if rounding should have occurred which would leave the lsb.
- |
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0 |isolate rmode
- cmpil #0x20,%d0
- blts cu_nzro
- bnes cu_nrp
- cu_nrm:
- tstw LOCAL_EX(%a0) |if positive, set lsb
- bges cu_nzro
- btstb #7,FPCR_MODE(%a6) |check for double
- beqs cu_nincs
- bras cu_nincd
- cu_nrp:
- tstw LOCAL_EX(%a0) |if positive, set lsb
- blts cu_nzro
- btstb #7,FPCR_MODE(%a6) |check for double
- beqs cu_nincs
- cu_nincd:
- orl #0x800,LOCAL_LO(%a0) |inc for double
- bra cu_nunzro
- cu_nincs:
- orl #0x100,LOCAL_HI(%a0) |inc for single
- bra cu_nunzro
- cu_nzro:
- orl #z_mask,USER_FPSR(%a6)
- moveb STAG(%a6),%d0
- andib #0xe0,%d0
- cmpib #0x40,%d0 |check if input was tagged zero
- beqs cu_numv
- cu_nunzro:
- orl #unfl_mask,USER_FPSR(%a6) |set unfl
- cu_numv:
- movel (%a0),ETEMP(%a6)
- movel 4(%a0),ETEMP_HI(%a6)
- movel 8(%a0),ETEMP_LO(%a6)
- |
- | Write the result to memory, setting the fpsr cc bits. NaN and Inf
- | bypass cu_wrexn.
- |
- cu_wrexn:
- tstw LOCAL_EX(%a0) |test for zero
- beqs cu_wrzero
- cmpw #0x8000,LOCAL_EX(%a0) |test for zero
- bnes cu_wreon
- cu_wrzero:
- orl #z_mask,USER_FPSR(%a6) |set Z bit
- cu_wreon:
- tstw LOCAL_EX(%a0)
- bpl wr_etemp
- orl #neg_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | HANDLE SOURCE DENORM HERE
- |
- | ;clear denorm stag to norm
- | ;write the new tag & ete15 to the fstack
- mon_dnrm:
- |
- | At this point, check for the cases in which normalizing the
- | denorm produces incorrect results.
- |
- tstb DY_MO_FLG(%a6) |all cases of dyadic instructions would
- bnes nrm_src |require normalization of denorm
- | At this point:
- | monadic instructions: fabs = $18 fneg = $1a ftst = $3a
- | fmove = $00 fsmove = $40 fdmove = $44
- | fsqrt = $05* fssqrt = $41 fdsqrt = $45
- | (*fsqrt reencoded to $05)
- |
- movew CMDREG1B(%a6),%d0 |get command register
- andil #0x7f,%d0 |strip to only command word
- |
- | At this point, fabs, fneg, fsmove, fdmove, ftst, fsqrt, fssqrt, and
- | fdsqrt are possible.
- | For cases fabs, fneg, fsmove, and fdmove goto spos (do not normalize)
- | For cases fsqrt, fssqrt, and fdsqrt goto nrm_src (do normalize)
- |
- btstl #0,%d0
- bnes nrm_src |weed out fsqrt instructions
- st CU_ONLY(%a6) |set cu-only inst flag
- bra cu_dnrm |fmove, fabs, fneg, ftst
- | ;cases go to cu_dnrm
- nrm_src:
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsr nrm_set |normalize number (exponent will go
- | ; negative)
- bclrb #sign_bit,LOCAL_EX(%a0) |get rid of false sign
- bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format
- beqs spos
- bsetb #sign_bit,LOCAL_EX(%a0)
- spos:
- bfclr STAG(%a6){#0:#4} |set tag to normalized, FPTE15 = 0
- bsetb #4,STAG(%a6) |set ETE15
- orb #0xf0,DNRM_FLG(%a6)
- normal:
- tstb DNRM_FLG(%a6) |check if any of the ops were denorms
- bne ck_wrap |if so, check if it is a potential
- | ;wrap-around case
- fix_stk:
- moveb #0xfe,CU_SAVEPC(%a6)
- bclrb #E1,E_BYTE(%a6)
- clrw NMNEXC(%a6)
- st RES_FLG(%a6) |indicate that a restore is needed
- rts
- |
- | cu_dnrm handles all cu-only instructions (fmove, fabs, fneg, and
- | ftst) completely in software without an frestore to the 040.
- |
- cu_dnrm:
- st CU_ONLY(%a6)
- movew CMDREG1B(%a6),%d0
- andib #0x3b,%d0 |isolate bits to select inst
- tstb %d0
- beql cu_dmove |if zero, it is an fmove
- cmpib #0x18,%d0
- beql cu_dabs |if $18, it is fabs
- cmpib #0x1a,%d0
- beql cu_dneg |if $1a, it is fneg
- |
- | Inst is ftst. Check the source operand and set the cc's accordingly.
- | No write is done, so simply rts.
- |
- cu_dtst:
- movew LOCAL_EX(%a0),%d0
- bclrl #15,%d0
- sne LOCAL_SGN(%a0)
- beqs cu_dtpo
- orl #neg_mask,USER_FPSR(%a6) |set N
- cu_dtpo:
- cmpiw #0x7fff,%d0 |test for inf/nan
- bnes cu_dtcz
- tstl LOCAL_HI(%a0)
- bnes cu_dtn
- tstl LOCAL_LO(%a0)
- bnes cu_dtn
- orl #inf_mask,USER_FPSR(%a6)
- rts
- cu_dtn:
- orl #nan_mask,USER_FPSR(%a6)
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- rts
- cu_dtcz:
- tstl LOCAL_HI(%a0)
- bnel cu_dtsx
- tstl LOCAL_LO(%a0)
- bnel cu_dtsx
- orl #z_mask,USER_FPSR(%a6)
- cu_dtsx:
- rts
- |
- | Inst is fabs. Execute the absolute value function on the input.
- | Branch to the fmove code.
- |
- cu_dabs:
- bclrb #7,LOCAL_EX(%a0) |do abs
- bras cu_dmove |fmove code will finish
- |
- | Inst is fneg. Execute the negate value function on the input.
- | Fall though to the fmove code.
- |
- cu_dneg:
- bchgb #7,LOCAL_EX(%a0) |do neg
- |
- | Inst is fmove. This code also handles all result writes.
- | If bit 2 is set, round is forced to double. If it is clear,
- | and bit 6 is set, round is forced to single. If both are clear,
- | the round precision is found in the fpcr. If the rounding precision
- | is double or single, the result is zero, and the mode is checked
- | to determine if the lsb of the result should be set.
- |
- cu_dmove:
- btstb #2,CMDREG1B+1(%a6) |check for rd
- bne cu_dmrd
- btstb #6,CMDREG1B+1(%a6) |check for rs
- bne cu_dmrs
- |
- | The move or operation is not with forced precision. Use the
- | FPCR_MODE byte to get rounding.
- |
- cu_dmnr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0
- tstb %d0 |check for extended
- beq cu_wrexd |if so, just write result
- cmpib #1,%d0 |check for single
- beq cu_dmrs |fall through to double
- |
- | The move is fdmove or round precision is double. Result is zero.
- | Check rmode for rp or rm and set lsb accordingly.
- |
- cu_dmrd:
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rmode
- tstw LOCAL_EX(%a0) |check sign
- blts cu_dmdn
- cmpib #3,%d1 |check for rp
- bne cu_dpd |load double pos zero
- bra cu_dpdr |load double pos zero w/lsb
- cu_dmdn:
- cmpib #2,%d1 |check for rm
- bne cu_dnd |load double neg zero
- bra cu_dndr |load double neg zero w/lsb
- |
- | The move is fsmove or round precision is single. Result is zero.
- | Check for rp or rm and set lsb accordingly.
- |
- cu_dmrs:
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rmode
- tstw LOCAL_EX(%a0) |check sign
- blts cu_dmsn
- cmpib #3,%d1 |check for rp
- bne cu_spd |load single pos zero
- bra cu_spdr |load single pos zero w/lsb
- cu_dmsn:
- cmpib #2,%d1 |check for rm
- bne cu_snd |load single neg zero
- bra cu_sndr |load single neg zero w/lsb
- |
- | The precision is extended, so the result in etemp is correct.
- | Simply set unfl (not inex2 or aunfl) and write the result to
- | the correct fp register.
- cu_wrexd:
- orl #unfl_mask,USER_FPSR(%a6)
- tstw LOCAL_EX(%a0)
- beq wr_etemp
- orl #neg_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | These routines write +/- zero in double format. The routines
- | cu_dpdr and cu_dndr set the double lsb.
- |
- cu_dpd:
- movel #0x3c010000,LOCAL_EX(%a0) |force pos double zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_dpdr:
- movel #0x3c010000,LOCAL_EX(%a0) |force pos double zero
- clrl LOCAL_HI(%a0)
- movel #0x800,LOCAL_LO(%a0) |with lsb set
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_dnd:
- movel #0xbc010000,LOCAL_EX(%a0) |force pos double zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_dndr:
- movel #0xbc010000,LOCAL_EX(%a0) |force pos double zero
- clrl LOCAL_HI(%a0)
- movel #0x800,LOCAL_LO(%a0) |with lsb set
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | These routines write +/- zero in single format. The routines
- | cu_dpdr and cu_dndr set the single lsb.
- |
- cu_spd:
- movel #0x3f810000,LOCAL_EX(%a0) |force pos single zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_spdr:
- movel #0x3f810000,LOCAL_EX(%a0) |force pos single zero
- movel #0x100,LOCAL_HI(%a0) |with lsb set
- clrl LOCAL_LO(%a0)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_snd:
- movel #0xbf810000,LOCAL_EX(%a0) |force pos single zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_sndr:
- movel #0xbf810000,LOCAL_EX(%a0) |force pos single zero
- movel #0x100,LOCAL_HI(%a0) |with lsb set
- clrl LOCAL_LO(%a0)
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | This code checks for 16-bit overflow conditions on dyadic
- | operations which are not restorable into the floating-point
- | unit and must be completed in software. Basically, this
- | condition exists with a very large norm and a denorm. One
- | of the operands must be denormalized to enter this code.
- |
- | Flags used:
- | DY_MO_FLG contains 0 for monadic op, $ff for dyadic
- | DNRM_FLG contains $00 for neither op denormalized
- | $0f for the destination op denormalized
- | $f0 for the source op denormalized
- | $ff for both ops denormalized
- |
- | The wrap-around condition occurs for add, sub, div, and cmp
- | when
- |
- | abs(dest_exp - src_exp) >= $8000
- |
- | and for mul when
- |
- | (dest_exp + src_exp) < $0
- |
- | we must process the operation here if this case is true.
- |
- | The rts following the frcfpn routine is the exit from res_func
- | for this condition. The restore flag (RES_FLG) is left clear.
- | No frestore is done unless an exception is to be reported.
- |
- | For fadd:
- | if(sign_of(dest) != sign_of(src))
- | replace exponent of src with $3fff (keep sign)
- | use fpu to perform dest+new_src (user's rmode and X)
- | clr sticky
- | else
- | set sticky
- | call round with user's precision and mode
- | move result to fpn and wbtemp
- |
- | For fsub:
- | if(sign_of(dest) == sign_of(src))
- | replace exponent of src with $3fff (keep sign)
- | use fpu to perform dest+new_src (user's rmode and X)
- | clr sticky
- | else
- | set sticky
- | call round with user's precision and mode
- | move result to fpn and wbtemp
- |
- | For fdiv/fsgldiv:
- | if(both operands are denorm)
- | restore_to_fpu;
- | if(dest is norm)
- | force_ovf;
- | else(dest is denorm)
- | force_unf:
- |
- | For fcmp:
- | if(dest is norm)
- | N = sign_of(dest);
- | else(dest is denorm)
- | N = sign_of(src);
- |
- | For fmul:
- | if(both operands are denorm)
- | force_unf;
- | if((dest_exp + src_exp) < 0)
- | force_unf:
- | else
- | restore_to_fpu;
- |
- | local equates:
- .set addcode,0x22
- .set subcode,0x28
- .set mulcode,0x23
- .set divcode,0x20
- .set cmpcode,0x38
- ck_wrap:
- | tstb DY_MO_FLG(%a6) ;check for fsqrt
- beq fix_stk |if zero, it is fsqrt
- movew CMDREG1B(%a6),%d0
- andiw #0x3b,%d0 |strip to command bits
- cmpiw #addcode,%d0
- beq wrap_add
- cmpiw #subcode,%d0
- beq wrap_sub
- cmpiw #mulcode,%d0
- beq wrap_mul
- cmpiw #cmpcode,%d0
- beq wrap_cmp
- |
- | Inst is fdiv.
- |
- wrap_div:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and force the result.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes div_srcd
- div_destd:
- bsrl ckinf_ns
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x7fff,%d0
- blt fix_stk |if less, not wrap case
- clrb WBTEMP_SGN(%a6)
- movew ETEMP_EX(%a6),%d0 |find the sign of the result
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- beq force_unf
- st WBTEMP_SGN(%a6)
- bra force_unf
- ckinf_ns:
- moveb STAG(%a6),%d0 |check source tag for inf or nan
- bra ck_in_com
- ckinf_nd:
- moveb DTAG(%a6),%d0 |check destination tag for inf or nan
- ck_in_com:
- andib #0x60,%d0 |isolate tag bits
- cmpb #0x40,%d0 |is it inf?
- beq nan_or_inf |not wrap case
- cmpb #0x60,%d0 |is it nan?
- beq nan_or_inf |yes, not wrap case?
- cmpb #0x20,%d0 |is it a zero?
- beq nan_or_inf |yes
- clrl %d0
- rts |then ; it is either a zero of norm,
- | ;check wrap case
- nan_or_inf:
- moveql #-1,%d0
- rts
- div_srcd:
- bsrl ckinf_nd
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- clrb WBTEMP_SGN(%a6)
- movew ETEMP_EX(%a6),%d0 |find the sign of the result
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- beqs force_ovf
- st WBTEMP_SGN(%a6)
- |
- | This code handles the case of the instruction resulting in
- | an overflow condition.
- |
- force_ovf:
- bclrb #E1,E_BYTE(%a6)
- orl #ovfl_inx_mask,USER_FPSR(%a6)
- clrw NMNEXC(%a6)
- leal WBTEMP(%a6),%a0 |point a0 to memory location
- movew CMDREG1B(%a6),%d0
- btstl #6,%d0 |test for forced precision
- beqs frcovf_fpcr
- btstl #2,%d0 |check for double
- bnes frcovf_dbl
- movel #0x1,%d0 |inst is forced single
- bras frcovf_rnd
- frcovf_dbl:
- movel #0x2,%d0 |inst is forced double
- bras frcovf_rnd
- frcovf_fpcr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0 |inst not forced - use fpcr prec
- frcovf_rnd:
- | The 881/882 does not set inex2 for the following case, so the
- | line is commented out to be compatible with 881/882
- | tst.b %d0
- | beq.b frcovf_x
- | or.l #inex2_mask,USER_FPSR(%a6) ;if prec is s or d, set inex2
- |frcovf_x:
- bsrl ovf_res |get correct result based on
- | ;round precision/mode. This
- | ;sets FPSR_CC correctly
- | ;returns in external format
- bfclr WBTEMP_SGN(%a6){#0:#8}
- beq frcfpn
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpn
- |
- | Inst is fadd.
- |
- wrap_add:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes add_srcd
- add_destd:
- bsrl ckinf_ns
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- bra add_wrap
- add_srcd:
- bsrl ckinf_nd
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- |
- | Check the signs of the operands. If they are unlike, the fpu
- | can be used to add the norm and 1.0 with the sign of the
- | denorm and it will correctly generate the result in extended
- | precision. We can then call round with no sticky and the result
- | will be correct for the user's rounding mode and precision. If
- | the signs are the same, we call round with the sticky bit set
- | and the result will be correct for the user's rounding mode and
- | precision.
- |
- add_wrap:
- movew ETEMP_EX(%a6),%d0
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- beq add_same
- |
- | The signs are unlike.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes add_u_srcd
- movew FPTEMP_EX(%a6),%d0
- andiw #0x8000,%d0
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,FPTEMP_EX(%a6) |in the denorm
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex ETEMP(%a6),%fp0
- faddx FPTEMP(%a6),%fp0
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fadd
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- bclrb #sign_bit,WBTEMP_EX(%a6)
- sne WBTEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- add_u_srcd:
- movew ETEMP_EX(%a6),%d0
- andiw #0x8000,%d0
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,ETEMP_EX(%a6) |in the denorm
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex ETEMP(%a6),%fp0
- faddx FPTEMP(%a6),%fp0
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fadd
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- bclrb #sign_bit,WBTEMP_EX(%a6)
- sne WBTEMP_SGN(%a6) |use internal format for round
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- |
- | Signs are alike:
- |
- add_same:
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes add_s_srcd
- add_s_destd:
- leal ETEMP(%a6),%a0
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- bclrb #sign_bit,ETEMP_EX(%a6)
- sne ETEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr ETEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs add_s_dclr
- bsetb #sign_bit,ETEMP_EX(%a6)
- add_s_dclr:
- leal WBTEMP(%a6),%a0
- movel ETEMP(%a6),(%a0) |write result to wbtemp
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- tstw ETEMP_EX(%a6)
- bgt add_ckovf
- orl #neg_mask,USER_FPSR(%a6)
- bra add_ckovf
- add_s_srcd:
- leal FPTEMP(%a6),%a0
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- bclrb #sign_bit,FPTEMP_EX(%a6)
- sne FPTEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr FPTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs add_s_sclr
- bsetb #sign_bit,FPTEMP_EX(%a6)
- add_s_sclr:
- leal WBTEMP(%a6),%a0
- movel FPTEMP(%a6),(%a0) |write result to wbtemp
- movel FPTEMP_HI(%a6),4(%a0)
- movel FPTEMP_LO(%a6),8(%a0)
- tstw FPTEMP_EX(%a6)
- bgt add_ckovf
- orl #neg_mask,USER_FPSR(%a6)
- add_ckovf:
- movew WBTEMP_EX(%a6),%d0
- andiw #0x7fff,%d0
- cmpiw #0x7fff,%d0
- bne frcfpnr
- |
- | The result has overflowed to $7fff exponent. Set I, ovfl,
- | and aovfl, and clr the mantissa (incorrectly set by the
- | round routine.)
- |
- orl #inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
- clrl 4(%a0)
- bra frcfpnr
- |
- | Inst is fsub.
- |
- wrap_sub:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes sub_srcd
- sub_destd:
- bsrl ckinf_ns
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- bra sub_wrap
- sub_srcd:
- bsrl ckinf_nd
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- |
- | Check the signs of the operands. If they are alike, the fpu
- | can be used to subtract from the norm 1.0 with the sign of the
- | denorm and it will correctly generate the result in extended
- | precision. We can then call round with no sticky and the result
- | will be correct for the user's rounding mode and precision. If
- | the signs are unlike, we call round with the sticky bit set
- | and the result will be correct for the user's rounding mode and
- | precision.
- |
- sub_wrap:
- movew ETEMP_EX(%a6),%d0
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- bne sub_diff
- |
- | The signs are alike.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes sub_u_srcd
- movew FPTEMP_EX(%a6),%d0
- andiw #0x8000,%d0
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,FPTEMP_EX(%a6) |in the denorm
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex FPTEMP(%a6),%fp0
- fsubx ETEMP(%a6),%fp0
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fadd
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- bclrb #sign_bit,WBTEMP_EX(%a6)
- sne WBTEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- sub_u_srcd:
- movew ETEMP_EX(%a6),%d0
- andiw #0x8000,%d0
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,ETEMP_EX(%a6) |in the denorm
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex FPTEMP(%a6),%fp0
- fsubx ETEMP(%a6),%fp0
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fadd
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- bclrb #sign_bit,WBTEMP_EX(%a6)
- sne WBTEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- |
- | Signs are unlike:
- |
- sub_diff:
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes sub_s_srcd
- sub_s_destd:
- leal ETEMP(%a6),%a0
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- |
- | Since the dest is the denorm, the sign is the opposite of the
- | norm sign.
- |
- eoriw #0x8000,ETEMP_EX(%a6) |flip sign on result
- tstw ETEMP_EX(%a6)
- bgts sub_s_dwr
- orl #neg_mask,USER_FPSR(%a6)
- sub_s_dwr:
- bclrb #sign_bit,ETEMP_EX(%a6)
- sne ETEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr ETEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs sub_s_dclr
- bsetb #sign_bit,ETEMP_EX(%a6)
- sub_s_dclr:
- leal WBTEMP(%a6),%a0
- movel ETEMP(%a6),(%a0) |write result to wbtemp
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- bra sub_ckovf
- sub_s_srcd:
- leal FPTEMP(%a6),%a0
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- bclrb #sign_bit,FPTEMP_EX(%a6)
- sne FPTEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr FPTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs sub_s_sclr
- bsetb #sign_bit,FPTEMP_EX(%a6)
- sub_s_sclr:
- leal WBTEMP(%a6),%a0
- movel FPTEMP(%a6),(%a0) |write result to wbtemp
- movel FPTEMP_HI(%a6),4(%a0)
- movel FPTEMP_LO(%a6),8(%a0)
- tstw FPTEMP_EX(%a6)
- bgt sub_ckovf
- orl #neg_mask,USER_FPSR(%a6)
- sub_ckovf:
- movew WBTEMP_EX(%a6),%d0
- andiw #0x7fff,%d0
- cmpiw #0x7fff,%d0
- bne frcfpnr
- |
- | The result has overflowed to $7fff exponent. Set I, ovfl,
- | and aovfl, and clr the mantissa (incorrectly set by the
- | round routine.)
- |
- orl #inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
- clrl 4(%a0)
- bra frcfpnr
- |
- | Inst is fcmp.
- |
- wrap_cmp:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes cmp_srcd
- cmp_destd:
- bsrl ckinf_ns
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- tstw ETEMP_EX(%a6) |set N to ~sign_of(src)
- bge cmp_setn
- rts
- cmp_srcd:
- bsrl ckinf_nd
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- tstw FPTEMP_EX(%a6) |set N to sign_of(dest)
- blt cmp_setn
- rts
- cmp_setn:
- orl #neg_mask,USER_FPSR(%a6)
- rts
- |
- | Inst is fmul.
- |
- wrap_mul:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq force_unf |force an underflow (really!)
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes mul_srcd
- mul_destd:
- bsrl ckinf_ns
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- addl %d1,%d0 |subtract dest from src
- bgt fix_stk
- bra force_unf
- mul_srcd:
- bsrl ckinf_nd
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- addl %d1,%d0 |subtract src from dest
- bgt fix_stk
- |
- | This code handles the case of the instruction resulting in
- | an underflow condition.
- |
- force_unf:
- bclrb #E1,E_BYTE(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- clrw NMNEXC(%a6)
- clrb WBTEMP_SGN(%a6)
- movew ETEMP_EX(%a6),%d0 |find the sign of the result
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- beqs frcunfcont
- st WBTEMP_SGN(%a6)
- frcunfcont:
- lea WBTEMP(%a6),%a0 |point a0 to memory location
- movew CMDREG1B(%a6),%d0
- btstl #6,%d0 |test for forced precision
- beqs frcunf_fpcr
- btstl #2,%d0 |check for double
- bnes frcunf_dbl
- movel #0x1,%d0 |inst is forced single
- bras frcunf_rnd
- frcunf_dbl:
- movel #0x2,%d0 |inst is forced double
- bras frcunf_rnd
- frcunf_fpcr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0 |inst not forced - use fpcr prec
- frcunf_rnd:
- bsrl unf_sub |get correct result based on
- | ;round precision/mode. This
- | ;sets FPSR_CC correctly
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs frcfpn
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpn
- |
- | Write the result to the user's fpn. All results must be HUGE to be
- | written; otherwise the results would have overflowed or underflowed.
- | If the rounding precision is single or double, the ovf_res routine
- | is needed to correctly supply the max value.
- |
- frcfpnr:
- movew CMDREG1B(%a6),%d0
- btstl #6,%d0 |test for forced precision
- beqs frcfpn_fpcr
- btstl #2,%d0 |check for double
- bnes frcfpn_dbl
- movel #0x1,%d0 |inst is forced single
- bras frcfpn_rnd
- frcfpn_dbl:
- movel #0x2,%d0 |inst is forced double
- bras frcfpn_rnd
- frcfpn_fpcr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0 |inst not forced - use fpcr prec
- tstb %d0
- beqs frcfpn |if extended, write what you got
- frcfpn_rnd:
- bclrb #sign_bit,WBTEMP_EX(%a6)
- sne WBTEMP_SGN(%a6)
- bsrl ovf_res |get correct result based on
- | ;round precision/mode. This
- | ;sets FPSR_CC correctly
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs frcfpn_clr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- frcfpn_clr:
- orl #ovfinx_mask,USER_FPSR(%a6)
- |
- | Perform the write.
- |
- frcfpn:
- bfextu CMDREG1B(%a6){#6:#3},%d0 |extract fp destination register
- cmpib #3,%d0
- bles frc0123 |check if dest is fp0-fp3
- movel #7,%d1
- subl %d0,%d1
- clrl %d0
- bsetl %d1,%d0
- fmovemx WBTEMP(%a6),%d0
- rts
- frc0123:
- cmpib #0,%d0
- beqs frc0_dst
- cmpib #1,%d0
- beqs frc1_dst
- cmpib #2,%d0
- beqs frc2_dst
- frc3_dst:
- movel WBTEMP_EX(%a6),USER_FP3(%a6)
- movel WBTEMP_HI(%a6),USER_FP3+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP3+8(%a6)
- rts
- frc2_dst:
- movel WBTEMP_EX(%a6),USER_FP2(%a6)
- movel WBTEMP_HI(%a6),USER_FP2+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP2+8(%a6)
- rts
- frc1_dst:
- movel WBTEMP_EX(%a6),USER_FP1(%a6)
- movel WBTEMP_HI(%a6),USER_FP1+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP1+8(%a6)
- rts
- frc0_dst:
- movel WBTEMP_EX(%a6),USER_FP0(%a6)
- movel WBTEMP_HI(%a6),USER_FP0+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP0+8(%a6)
- rts
- |
- | Write etemp to fpn.
- | A check is made on enabled and signalled snan exceptions,
- | and the destination is not overwritten if this condition exists.
- | This code is designed to make fmoveins of unsupported data types
- | faster.
- |
- wr_etemp:
- btstb #snan_bit,FPSR_EXCEPT(%a6) |if snan is set, and
- beqs fmoveinc |enabled, force restore
- btstb #snan_bit,FPCR_ENABLE(%a6) |and don't overwrite
- beqs fmoveinc |the dest
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- tstb ETEMP(%a6) |check for negative
- blts snan_neg
- rts
- snan_neg:
- orl #neg_bit,USER_FPSR(%a6) |snan is negative; set N
- rts
- fmoveinc:
- clrw NMNEXC(%a6)
- bclrb #E1,E_BYTE(%a6)
- moveb STAG(%a6),%d0 |check if stag is inf
- andib #0xe0,%d0
- cmpib #0x40,%d0
- bnes fminc_cnan
- orl #inf_mask,USER_FPSR(%a6) |if inf, nothing yet has set I
- tstw LOCAL_EX(%a0) |check sign
- bges fminc_con
- orl #neg_mask,USER_FPSR(%a6)
- bra fminc_con
- fminc_cnan:
- cmpib #0x60,%d0 |check if stag is NaN
- bnes fminc_czero
- orl #nan_mask,USER_FPSR(%a6) |if nan, nothing yet has set NaN
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- tstw LOCAL_EX(%a0) |check sign
- bges fminc_con
- orl #neg_mask,USER_FPSR(%a6)
- bra fminc_con
- fminc_czero:
- cmpib #0x20,%d0 |check if zero
- bnes fminc_con
- orl #z_mask,USER_FPSR(%a6) |if zero, set Z
- tstw LOCAL_EX(%a0) |check sign
- bges fminc_con
- orl #neg_mask,USER_FPSR(%a6)
- fminc_con:
- bfextu CMDREG1B(%a6){#6:#3},%d0 |extract fp destination register
- cmpib #3,%d0
- bles fp0123 |check if dest is fp0-fp3
- movel #7,%d1
- subl %d0,%d1
- clrl %d0
- bsetl %d1,%d0
- fmovemx ETEMP(%a6),%d0
- rts
- fp0123:
- cmpib #0,%d0
- beqs fp0_dst
- cmpib #1,%d0
- beqs fp1_dst
- cmpib #2,%d0
- beqs fp2_dst
- fp3_dst:
- movel ETEMP_EX(%a6),USER_FP3(%a6)
- movel ETEMP_HI(%a6),USER_FP3+4(%a6)
- movel ETEMP_LO(%a6),USER_FP3+8(%a6)
- rts
- fp2_dst:
- movel ETEMP_EX(%a6),USER_FP2(%a6)
- movel ETEMP_HI(%a6),USER_FP2+4(%a6)
- movel ETEMP_LO(%a6),USER_FP2+8(%a6)
- rts
- fp1_dst:
- movel ETEMP_EX(%a6),USER_FP1(%a6)
- movel ETEMP_HI(%a6),USER_FP1+4(%a6)
- movel ETEMP_LO(%a6),USER_FP1+8(%a6)
- rts
- fp0_dst:
- movel ETEMP_EX(%a6),USER_FP0(%a6)
- movel ETEMP_HI(%a6),USER_FP0+4(%a6)
- movel ETEMP_LO(%a6),USER_FP0+8(%a6)
- rts
- opclass3:
- st CU_ONLY(%a6)
- movew CMDREG1B(%a6),%d0 |check if packed moveout
- andiw #0x0c00,%d0 |isolate last 2 bits of size field
- cmpiw #0x0c00,%d0 |if size is 011 or 111, it is packed
- beq pack_out |else it is norm or denorm
- bra mv_out
- |
- | MOVE OUT
- |
- mv_tbl:
- .long li
- .long sgp
- .long xp
- .long mvout_end |should never be taken
- .long wi
- .long dp
- .long bi
- .long mvout_end |should never be taken
- mv_out:
- bfextu CMDREG1B(%a6){#3:#3},%d1 |put source specifier in d1
- leal mv_tbl,%a0
- movel %a0@(%d1:l:4),%a0
- jmp (%a0)
- |
- | This exit is for move-out to memory. The aunfl bit is
- | set if the result is inex and unfl is signalled.
- |
- mvout_end:
- btstb #inex2_bit,FPSR_EXCEPT(%a6)
- beqs no_aufl
- btstb #unfl_bit,FPSR_EXCEPT(%a6)
- beqs no_aufl
- bsetb #aunfl_bit,FPSR_AEXCEPT(%a6)
- no_aufl:
- clrw NMNEXC(%a6)
- bclrb #E1,E_BYTE(%a6)
- fmovel #0,%FPSR |clear any cc bits from res_func
- |
- | Return ETEMP to extended format from internal extended format so
- | that gen_except will have a correctly signed value for ovfl/unfl
- | handlers.
- |
- bfclr ETEMP_SGN(%a6){#0:#8}
- beqs mvout_con
- bsetb #sign_bit,ETEMP_EX(%a6)
- mvout_con:
- rts
- |
- | This exit is for move-out to int register. The aunfl bit is
- | not set in any case for this move.
- |
- mvouti_end:
- clrw NMNEXC(%a6)
- bclrb #E1,E_BYTE(%a6)
- fmovel #0,%FPSR |clear any cc bits from res_func
- |
- | Return ETEMP to extended format from internal extended format so
- | that gen_except will have a correctly signed value for ovfl/unfl
- | handlers.
- |
- bfclr ETEMP_SGN(%a6){#0:#8}
- beqs mvouti_con
- bsetb #sign_bit,ETEMP_EX(%a6)
- mvouti_con:
- rts
- |
- | li is used to handle a long integer source specifier
- |
- li:
- moveql #4,%d0 |set byte count
- btstb #7,STAG(%a6) |check for extended denorm
- bne int_dnrm |if so, branch
- fmovemx ETEMP(%a6),%fp0-%fp0
- fcmpd #0x41dfffffffc00000,%fp0
- | 41dfffffffc00000 in dbl prec = 401d0000fffffffe00000000 in ext prec
- fbge lo_plrg
- fcmpd #0xc1e0000000000000,%fp0
- | c1e0000000000000 in dbl prec = c01e00008000000000000000 in ext prec
- fble lo_nlrg
- |
- | at this point, the answer is between the largest pos and neg values
- |
- movel USER_FPCR(%a6),%d1 |use user's rounding mode
- andil #0x30,%d1
- fmovel %d1,%fpcr
- fmovel %fp0,L_SCR1(%a6) |let the 040 perform conversion
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture inex2/ainex if set
- bra int_wrt
- lo_plrg:
- movel #0x7fffffff,L_SCR1(%a6) |answer is largest positive int
- fbeq int_wrt |exact answer
- fcmpd #0x41dfffffffe00000,%fp0
- | 41dfffffffe00000 in dbl prec = 401d0000ffffffff00000000 in ext prec
- fbge int_operr |set operr
- bra int_inx |set inexact
- lo_nlrg:
- movel #0x80000000,L_SCR1(%a6)
- fbeq int_wrt |exact answer
- fcmpd #0xc1e0000000100000,%fp0
- | c1e0000000100000 in dbl prec = c01e00008000000080000000 in ext prec
- fblt int_operr |set operr
- bra int_inx |set inexact
- |
- | wi is used to handle a word integer source specifier
- |
- wi:
- moveql #2,%d0 |set byte count
- btstb #7,STAG(%a6) |check for extended denorm
- bne int_dnrm |branch if so
- fmovemx ETEMP(%a6),%fp0-%fp0
- fcmps #0x46fffe00,%fp0
- | 46fffe00 in sgl prec = 400d0000fffe000000000000 in ext prec
- fbge wo_plrg
- fcmps #0xc7000000,%fp0
- | c7000000 in sgl prec = c00e00008000000000000000 in ext prec
- fble wo_nlrg
- |
- | at this point, the answer is between the largest pos and neg values
- |
- movel USER_FPCR(%a6),%d1 |use user's rounding mode
- andil #0x30,%d1
- fmovel %d1,%fpcr
- fmovew %fp0,L_SCR1(%a6) |let the 040 perform conversion
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture inex2/ainex if set
- bra int_wrt
- wo_plrg:
- movew #0x7fff,L_SCR1(%a6) |answer is largest positive int
- fbeq int_wrt |exact answer
- fcmps #0x46ffff00,%fp0
- | 46ffff00 in sgl prec = 400d0000ffff000000000000 in ext prec
- fbge int_operr |set operr
- bra int_inx |set inexact
- wo_nlrg:
- movew #0x8000,L_SCR1(%a6)
- fbeq int_wrt |exact answer
- fcmps #0xc7000080,%fp0
- | c7000080 in sgl prec = c00e00008000800000000000 in ext prec
- fblt int_operr |set operr
- bra int_inx |set inexact
- |
- | bi is used to handle a byte integer source specifier
- |
- bi:
- moveql #1,%d0 |set byte count
- btstb #7,STAG(%a6) |check for extended denorm
- bne int_dnrm |branch if so
- fmovemx ETEMP(%a6),%fp0-%fp0
- fcmps #0x42fe0000,%fp0
- | 42fe0000 in sgl prec = 40050000fe00000000000000 in ext prec
- fbge by_plrg
- fcmps #0xc3000000,%fp0
- | c3000000 in sgl prec = c00600008000000000000000 in ext prec
- fble by_nlrg
- |
- | at this point, the answer is between the largest pos and neg values
- |
- movel USER_FPCR(%a6),%d1 |use user's rounding mode
- andil #0x30,%d1
- fmovel %d1,%fpcr
- fmoveb %fp0,L_SCR1(%a6) |let the 040 perform conversion
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture inex2/ainex if set
- bra int_wrt
- by_plrg:
- moveb #0x7f,L_SCR1(%a6) |answer is largest positive int
- fbeq int_wrt |exact answer
- fcmps #0x42ff0000,%fp0
- | 42ff0000 in sgl prec = 40050000ff00000000000000 in ext prec
- fbge int_operr |set operr
- bra int_inx |set inexact
- by_nlrg:
- moveb #0x80,L_SCR1(%a6)
- fbeq int_wrt |exact answer
- fcmps #0xc3008000,%fp0
- | c3008000 in sgl prec = c00600008080000000000000 in ext prec
- fblt int_operr |set operr
- bra int_inx |set inexact
- |
- | Common integer routines
- |
- | int_drnrm---account for possible nonzero result for round up with positive
- | operand and round down for negative answer. In the first case (result = 1)
- | byte-width (store in d0) of result must be honored. In the second case,
- | -1 in L_SCR1(a6) will cover all contingencies (FMOVE.B/W/L out).
- int_dnrm:
- movel #0,L_SCR1(%a6) | initialize result to 0
- bfextu FPCR_MODE(%a6){#2:#2},%d1 | d1 is the rounding mode
- cmpb #2,%d1
- bmis int_inx | if RN or RZ, done
- bnes int_rp | if RP, continue below
- tstw ETEMP(%a6) | RM: store -1 in L_SCR1 if src is negative
- bpls int_inx | otherwise result is 0
- movel #-1,L_SCR1(%a6)
- bras int_inx
- int_rp:
- tstw ETEMP(%a6) | RP: store +1 of proper width in L_SCR1 if
- | ; source is greater than 0
- bmis int_inx | otherwise, result is 0
- lea L_SCR1(%a6),%a1 | a1 is address of L_SCR1
- addal %d0,%a1 | offset by destination width -1
- subal #1,%a1
- bsetb #0,(%a1) | set low bit at a1 address
- int_inx:
- oril #inx2a_mask,USER_FPSR(%a6)
- bras int_wrt
- int_operr:
- fmovemx %fp0-%fp0,FPTEMP(%a6) |FPTEMP must contain the extended
- | ;precision source that needs to be
- | ;converted to integer this is required
- | ;if the operr exception is enabled.
- | ;set operr/aiop (no inex2 on int ovfl)
- oril #opaop_mask,USER_FPSR(%a6)
- | ;fall through to perform int_wrt
- int_wrt:
- movel EXC_EA(%a6),%a1 |load destination address
- tstl %a1 |check to see if it is a dest register
- beqs wrt_dn |write data register
- lea L_SCR1(%a6),%a0 |point to supervisor source address
- bsrl mem_write
- bra mvouti_end
- wrt_dn:
- movel %d0,-(%sp) |d0 currently contains the size to write
- bsrl get_fline |get_fline returns Dn in d0
- andiw #0x7,%d0 |isolate register
- movel (%sp)+,%d1 |get size
- cmpil #4,%d1 |most frequent case
- beqs sz_long
- cmpil #2,%d1
- bnes sz_con
- orl #8,%d0 |add 'word' size to register#
- bras sz_con
- sz_long:
- orl #0x10,%d0 |add 'long' size to register#
- sz_con:
- movel %d0,%d1 |reg_dest expects size:reg in d1
- bsrl reg_dest |load proper data register
- bra mvouti_end
- xp:
- lea ETEMP(%a6),%a0
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- btstb #7,STAG(%a6) |check for extended denorm
- bne xdnrm
- clrl %d0
- bras do_fp |do normal case
- sgp:
- lea ETEMP(%a6),%a0
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- btstb #7,STAG(%a6) |check for extended denorm
- bne sp_catas |branch if so
- movew LOCAL_EX(%a0),%d0
- lea sp_bnds,%a1
- cmpw (%a1),%d0
- blt sp_under
- cmpw 2(%a1),%d0
- bgt sp_over
- movel #1,%d0 |set destination format to single
- bras do_fp |do normal case
- dp:
- lea ETEMP(%a6),%a0
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- btstb #7,STAG(%a6) |check for extended denorm
- bne dp_catas |branch if so
- movew LOCAL_EX(%a0),%d0
- lea dp_bnds,%a1
- cmpw (%a1),%d0
- blt dp_under
- cmpw 2(%a1),%d0
- bgt dp_over
- movel #2,%d0 |set destination format to double
- | ;fall through to do_fp
- |
- do_fp:
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |rnd mode in d1
- swap %d0 |rnd prec in upper word
- addl %d0,%d1 |d1 has PREC/MODE info
- clrl %d0 |clear g,r,s
- bsrl round |round
- movel %a0,%a1
- movel EXC_EA(%a6),%a0
- bfextu CMDREG1B(%a6){#3:#3},%d1 |extract destination format
- | ;at this point only the dest
- | ;formats sgl, dbl, ext are
- | ;possible
- cmpb #2,%d1
- bgts ddbl |double=5, extended=2, single=1
- bnes dsgl
- | ;fall through to dext
- dext:
- bsrl dest_ext
- bra mvout_end
- dsgl:
- bsrl dest_sgl
- bra mvout_end
- ddbl:
- bsrl dest_dbl
- bra mvout_end
- |
- | Handle possible denorm or catastrophic underflow cases here
- |
- xdnrm:
- bsr set_xop |initialize WBTEMP
- bsetb #wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
- movel %a0,%a1
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- bsrl dest_ext |store to memory
- bsetb #unfl_bit,FPSR_EXCEPT(%a6)
- bra mvout_end
- sp_under:
- bsetb #etemp15_bit,STAG(%a6)
- cmpw 4(%a1),%d0
- blts sp_catas |catastrophic underflow case
- movel #1,%d0 |load in round precision
- movel #sgl_thresh,%d1 |load in single denorm threshold
- bsrl dpspdnrm |expects d1 to have the proper
- | ;denorm threshold
- bsrl dest_sgl |stores value to destination
- bsetb #unfl_bit,FPSR_EXCEPT(%a6)
- bra mvout_end |exit
- dp_under:
- bsetb #etemp15_bit,STAG(%a6)
- cmpw 4(%a1),%d0
- blts dp_catas |catastrophic underflow case
- movel #dbl_thresh,%d1 |load in double precision threshold
- movel #2,%d0
- bsrl dpspdnrm |expects d1 to have proper
- | ;denorm threshold
- | ;expects d0 to have round precision
- bsrl dest_dbl |store value to destination
- bsetb #unfl_bit,FPSR_EXCEPT(%a6)
- bra mvout_end |exit
- |
- | Handle catastrophic underflow cases here
- |
- sp_catas:
- | Temp fix for z bit set in unf_sub
- movel USER_FPSR(%a6),-(%a7)
- movel #1,%d0 |set round precision to sgl
- bsrl unf_sub |a0 points to result
- movel (%a7)+,USER_FPSR(%a6)
- movel #1,%d0
- subw %d0,LOCAL_EX(%a0) |account for difference between
- | ;denorm/norm bias
- movel %a0,%a1 |a1 has the operand input
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- bsrl dest_sgl |store the result
- oril #unfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- dp_catas:
- | Temp fix for z bit set in unf_sub
- movel USER_FPSR(%a6),-(%a7)
- movel #2,%d0 |set round precision to dbl
- bsrl unf_sub |a0 points to result
- movel (%a7)+,USER_FPSR(%a6)
- movel #1,%d0
- subw %d0,LOCAL_EX(%a0) |account for difference between
- | ;denorm/norm bias
- movel %a0,%a1 |a1 has the operand input
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- bsrl dest_dbl |store the result
- oril #unfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- |
- | Handle catastrophic overflow cases here
- |
- sp_over:
- | Temp fix for z bit set in unf_sub
- movel USER_FPSR(%a6),-(%a7)
- movel #1,%d0
- leal FP_SCR1(%a6),%a0 |use FP_SCR1 for creating result
- movel ETEMP_EX(%a6),(%a0)
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- bsrl ovf_res
- movel (%a7)+,USER_FPSR(%a6)
- movel %a0,%a1
- movel EXC_EA(%a6),%a0
- bsrl dest_sgl
- orl #ovfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- dp_over:
- | Temp fix for z bit set in ovf_res
- movel USER_FPSR(%a6),-(%a7)
- movel #2,%d0
- leal FP_SCR1(%a6),%a0 |use FP_SCR1 for creating result
- movel ETEMP_EX(%a6),(%a0)
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- bsrl ovf_res
- movel (%a7)+,USER_FPSR(%a6)
- movel %a0,%a1
- movel EXC_EA(%a6),%a0
- bsrl dest_dbl
- orl #ovfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- |
- | DPSPDNRM
- |
- | This subroutine takes an extended normalized number and denormalizes
- | it to the given round precision. This subroutine also decrements
- | the input operand's exponent by 1 to account for the fact that
- | dest_sgl or dest_dbl expects a normalized number's bias.
- |
- | Input: a0 points to a normalized number in internal extended format
- | d0 is the round precision (=1 for sgl; =2 for dbl)
- | d1 is the single precision or double precision
- | denorm threshold
- |
- | Output: (In the format for dest_sgl or dest_dbl)
- | a0 points to the destination
- | a1 points to the operand
- |
- | Exceptions: Reports inexact 2 exception by setting USER_FPSR bits
- |
- dpspdnrm:
- movel %d0,-(%a7) |save round precision
- clrl %d0 |clear initial g,r,s
- bsrl dnrm_lp |careful with d0, it's needed by round
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rounding mode
- swap %d1
- movew 2(%a7),%d1 |set rounding precision
- swap %d1 |at this point d1 has PREC/MODE info
- bsrl round |round result, sets the inex bit in
- | ;USER_FPSR if needed
- movew #1,%d0
- subw %d0,LOCAL_EX(%a0) |account for difference in denorm
- | ;vs norm bias
- movel %a0,%a1 |a1 has the operand input
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- addw #4,%a7 |pop stack
- rts
- |
- | SET_XOP initialized WBTEMP with the value pointed to by a0
- | input: a0 points to input operand in the internal extended format
- |
- set_xop:
- movel LOCAL_EX(%a0),WBTEMP_EX(%a6)
- movel LOCAL_HI(%a0),WBTEMP_HI(%a6)
- movel LOCAL_LO(%a0),WBTEMP_LO(%a6)
- bfclr WBTEMP_SGN(%a6){#0:#8}
- beqs sxop
- bsetb #sign_bit,WBTEMP_EX(%a6)
- sxop:
- bfclr STAG(%a6){#5:#4} |clear wbtm66,wbtm1,wbtm0,sbit
- rts
- |
- | P_MOVE
- |
- p_movet:
- .long p_move
- .long p_movez
- .long p_movei
- .long p_moven
- .long p_move
- p_regd:
- .long p_dyd0
- .long p_dyd1
- .long p_dyd2
- .long p_dyd3
- .long p_dyd4
- .long p_dyd5
- .long p_dyd6
- .long p_dyd7
- pack_out:
- leal p_movet,%a0 |load jmp table address
- movew STAG(%a6),%d0 |get source tag
- bfextu %d0{#16:#3},%d0 |isolate source bits
- movel (%a0,%d0.w*4),%a0 |load a0 with routine label for tag
- jmp (%a0) |go to the routine
- p_write:
- movel #0x0c,%d0 |get byte count
- movel EXC_EA(%a6),%a1 |get the destination address
- bsr mem_write |write the user's destination
- moveb #0,CU_SAVEPC(%a6) |set the cu save pc to all 0's
- |
- | Also note that the dtag must be set to norm here - this is because
- | the 040 uses the dtag to execute the correct microcode.
- |
- bfclr DTAG(%a6){#0:#3} |set dtag to norm
- rts
- | Notes on handling of special case (zero, inf, and nan) inputs:
- | 1. Operr is not signalled if the k-factor is greater than 18.
- | 2. Per the manual, status bits are not set.
- |
- p_move:
- movew CMDREG1B(%a6),%d0
- btstl #kfact_bit,%d0 |test for dynamic k-factor
- beqs statick |if clear, k-factor is static
- dynamick:
- bfextu %d0{#25:#3},%d0 |isolate register for dynamic k-factor
- lea p_regd,%a0
- movel %a0@(%d0:l:4),%a0
- jmp (%a0)
- statick:
- andiw #0x007f,%d0 |get k-factor
- bfexts %d0{#25:#7},%d0 |sign extend d0 for bindec
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- bsrl bindec |perform the convert; data at a6
- leal FP_SCR1(%a6),%a0 |load a0 with result address
- bral p_write
- p_movez:
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- clrw 2(%a0) |clear lower word of exp
- clrl 4(%a0) |load second lword of ZERO
- clrl 8(%a0) |load third lword of ZERO
- bra p_write |go write results
- p_movei:
- fmovel #0,%FPSR |clear aiop
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- clrw 2(%a0) |clear lower word of exp
- bra p_write |go write the result
- p_moven:
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- clrw 2(%a0) |clear lower word of exp
- bra p_write |go write the result
- |
- | Routines to read the dynamic k-factor from Dn.
- |
- p_dyd0:
- movel USER_D0(%a6),%d0
- bras statick
- p_dyd1:
- movel USER_D1(%a6),%d0
- bras statick
- p_dyd2:
- movel %d2,%d0
- bras statick
- p_dyd3:
- movel %d3,%d0
- bras statick
- p_dyd4:
- movel %d4,%d0
- bras statick
- p_dyd5:
- movel %d5,%d0
- bras statick
- p_dyd6:
- movel %d6,%d0
- bra statick
- p_dyd7:
- movel %d7,%d0
- bra statick
- |end
|