- |
- |
- | res_func.sa 3.9 7/29/91
- |
- | Normalizes denormalized numbers if necessary and updates the
- | stack frame. The function is then restored back into the
- | machine and the 040 completes the operation. This routine
- | is only used by the unsupported data type/format handler.
- | (Exception vector 55).
- |
- | For packed move out (fmove.p fpm,<ea>) the operation is
- | completed here; data is packed and moved to user memory.
- | The stack is restored to the 040 only in the case of a
- | reportable exception in the conversion.
- |
- |
- | Copyright (C) Motorola, Inc. 1990
- | All Rights Reserved
- |
- | For details on the license for this file, please see the
- | file, README, in this same directory.
- RES_FUNC: |idnt 2,1 | Motorola 040 Floating Point Software Package
- |section 8
- #include "fpsp.h"
- | Exponent bound tables for single (sp_bnds) and double (dp_bnds)
- | precision. Nothing in the visible part of this file references them
- | by name; 0x3f81 and 0x3c01 are the same biased-exponent thresholds
- | that cu_nmrs and cu_nmrd compare against before branching to cu_nunfl.
- | NOTE(review): the meaning of the second row of each table is not
- | shown in this part of the file - confirm against the users.
- sp_bnds: .short 0x3f81,0x407e
- .short 0x3f6a,0x0000
- dp_bnds: .short 0x3c01,0x43fe
- .short 0x3bcd,0x0000
- |xref mem_write
- |xref bindec
- |xref get_fline
- |xref round
- |xref denorm
- |xref dest_ext
- |xref dest_dbl
- |xref dest_sgl
- |xref unf_sub
- |xref nrm_set
- |xref dnrm_lp
- |xref ovf_res
- |xref reg_dest
- |xref t_ovfl
- |xref t_unfl
- .global res_func
- .global p_move
- res_func:
- | Entry point. a6 addresses the frame holding the flag bytes, tags and
- | operand images used below. The three per-call flags are cleared, then
- | for dyadic ops (DY_MO_FLG != 0) a denormalized destination operand
- | in FPTEMP is normalized before falling into monadic.
- clrb DNRM_FLG(%a6)
- clrb RES_FLG(%a6)
- clrb CU_ONLY(%a6)
- tstb DY_MO_FLG(%a6)
- beqs monadic
- dyadic:
- btstb #7,DTAG(%a6) |if dop = norm=000, zero=001,
- | ;inf=010 or nan=011
- beqs monadic |then branch
- | ;else denorm
- | HANDLE DESTINATION DENORM HERE
- | ;set dtag to norm
- | ;write the tag & fpte15 to the fstack
- leal FPTEMP(%a6),%a0
- | Move the sign out of the exponent word into LOCAL_SGN before calling
- | nrm_set. bclr sets Z from the old bit value and sne does not change
- | the condition codes, so LOCAL_SGN becomes $ff iff the sign was set.
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsr nrm_set |normalize number (exp will go negative)
- bclrb #sign_bit,LOCAL_EX(%a0) |get rid of false sign
- | bfclr sets Z from the field's previous contents, so the branch is
- | taken when the saved sign byte was zero (positive operand).
- bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format
- beqs dpos
- bsetb #sign_bit,LOCAL_EX(%a0)
- dpos:
- bfclr DTAG(%a6){#0:#4} |set tag to normalized, FPTE15 = 0
- bsetb #4,DTAG(%a6) |set FPTE15
- | Record "destination was denormalized" ($0f) for the ck_wrap logic.
- orb #0x0f,DNRM_FLG(%a6)
- monadic:
- | Source-operand dispatch. a0 is pointed at ETEMP. Move-out
- | instructions leave for opclass3; a denormalized source goes to
- | mon_dnrm; dyadic ops and the fsqrt family go to normal; everything
- | else falls through to cu_norm.
- leal ETEMP(%a6),%a0
- btstb #direction_bit,CMDREG1B(%a6) |check direction
- bne opclass3 |it is a mv out
- |
- | At this point, only opclass 0 and 2 possible
- |
- btstb #7,STAG(%a6) |if sop = norm=000, zero=001,
- | ;inf=010 or nan=011
- bne mon_dnrm |else denorm
- tstb DY_MO_FLG(%a6) |all cases of dyadic instructions would
- bne normal |require normalization of denorm
- | At this point:
- | monadic instructions: fabs = $18 fneg = $1a ftst = $3a
- | fmove = $00 fsmove = $40 fdmove = $44
- | fsqrt = $05* fssqrt = $41 fdsqrt = $45
- | (*fsqrt reencoded to $05)
- |
- movew CMDREG1B(%a6),%d0 |get command register
- andil #0x7f,%d0 |strip to only command word
- |
- | At this point, fabs, fneg, fmove, fsmove, fdmove, ftst, fsqrt, fssqrt,
- | and fdsqrt are possible. Bit 0 of the command is set only for the
- | fsqrt encodings ($05, $41, $45).
- | For cases fabs, fneg, ftst, fmove, fsmove, and fdmove fall into cu_norm
- | For cases fsqrt, fssqrt, and fdsqrt goto normal
- |
- btstl #0,%d0
- bne normal |weed out fsqrt instructions
- |
- | cu_norm handles fmove in instructions with normalized inputs.
- | The routine round is used to correctly round the input for the
- | destination precision and mode.
- |
- cu_norm:
- | Select the handler from the command bits left after masking with
- | $3b: $00 -> cu_nmove, $18 -> cu_nabs, $1a -> cu_nneg; anything else
- | falls through to cu_ntst. Masking with $3b drops bits 6 and 2, so
- | the forced-precision moves ($40, $44) also select cu_nmove.
- st CU_ONLY(%a6) |set cu-only inst flag
- movew CMDREG1B(%a6),%d0
- andib #0x3b,%d0 |isolate bits to select inst
- tstb %d0
- beql cu_nmove |if zero, it is an fmove
- cmpib #0x18,%d0
- beql cu_nabs |if $18, it is fabs
- cmpib #0x1a,%d0
- beql cu_nneg |if $1a, it is fneg
- |
- | Inst is ftst. Check the source operand and set the cc's accordingly.
- | No write is done, so simply rts.
- |
- cu_ntst:
- | ftst on a non-denormalized source at (a0). Only USER_FPSR condition
- | bits are updated (N, then one of I / NAN / Z or none); the routine
- | returns with rts on every path.
- movew LOCAL_EX(%a0),%d0
- | bclr sets Z from the old sign bit; sne leaves the condition codes
- | alone, so beqs still tests the sign (taken when positive).
- bclrl #15,%d0
- sne LOCAL_SGN(%a0)
- beqs cu_ntpo
- orl #neg_mask,USER_FPSR(%a6) |set N
- cu_ntpo:
- cmpiw #0x7fff,%d0 |test for inf/nan
- bnes cu_ntcz
- | Exponent is $7fff: any non-zero mantissa longword means NaN.
- tstl LOCAL_HI(%a0)
- bnes cu_ntn
- tstl LOCAL_LO(%a0)
- bnes cu_ntn
- orl #inf_mask,USER_FPSR(%a6)
- rts
- cu_ntn:
- orl #nan_mask,USER_FPSR(%a6)
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- rts
- cu_ntcz:
- | Exponent is not $7fff: set Z only when both mantissa longwords are 0.
- tstl LOCAL_HI(%a0)
- bnel cu_ntsx
- tstl LOCAL_LO(%a0)
- bnel cu_ntsx
- orl #z_mask,USER_FPSR(%a6)
- cu_ntsx:
- rts
- |
- | Inst is fabs. Execute the absolute value function on the input.
- | Branch to the fmove code. If the operand is NaN, do nothing.
- |
- cu_nabs:
- | fabs on a non-denormalized source. With the tag encoding zero=001 and
- | nan=011 (top three STAG bits), bit 5 is set for exactly those two
- | tags; such operands are written unchanged via wr_etemp. Otherwise the
- | sign bit of the exponent word is cleared and cu_nmove finishes.
- moveb STAG(%a6),%d0
- btstl #5,%d0 |test for NaN or zero
- bne wr_etemp |if either, simply write it
- bclrb #7,LOCAL_EX(%a0) |do abs
- bras cu_nmove |fmove code will finish
- |
- | Inst is fneg. Execute the negate value function on the input.
- | Fall though to the fmove code. If the operand is NaN, do nothing.
- |
- cu_nneg:
- | fneg on a non-denormalized source. Operands tagged zero or NaN
- | (STAG bit 5 set) are written unchanged via wr_etemp; otherwise the
- | sign bit is toggled and execution falls through into cu_nmove.
- moveb STAG(%a6),%d0
- btstl #5,%d0 |test for NaN or zero
- bne wr_etemp |if either, simply write it
- bchgb #7,LOCAL_EX(%a0) |do neg
- |
- | Inst is fmove. This code also handles all result writes.
- | If bit 2 is set, round is forced to double. If it is clear,
- | and bit 6 is set, round is forced to single. If both are clear,
- | the round precision is found in the fpcr. If the rounding precision
- | is double or single, round the result before the write.
- |
- cu_nmove:
- | Common tail for fmove/fabs/fneg with a non-denormalized source.
- | Anything whose top three STAG bits are not 000 (norm) is written as
- | is. For norms the rounding precision is chosen: command bit 2 forces
- | double, else bit 6 forces single, else the FPCR precision is used.
- moveb STAG(%a6),%d0
- andib #0xe0,%d0 |isolate stag bits
- bne wr_etemp |if not norm, simply write it
- btstb #2,CMDREG1B+1(%a6) |check for rd
- bne cu_nmrd
- btstb #6,CMDREG1B+1(%a6) |check for rs
- bne cu_nmrs
- |
- | The move or operation is not with forced precision. Test for
- | nan or inf as the input; if so, simply write it to FPn. Use the
- | FPCR_MODE byte to get rounding on norms and zeros.
- |
- cu_nmnr:
- | The top two bits of FPCR_MODE hold the precision: 0 = extended,
- | 1 = single; any other value falls through to the double code.
- bfextu FPCR_MODE(%a6){#0:#2},%d0
- tstb %d0 |check for extended
- beq cu_wrexn |if so, just write result
- cmpib #1,%d0 |check for single
- beq cu_nmrs |fall through to double
- |
- | The move is fdmove or round precision is double.
- |
- cu_nmrd:
- | Round a norm at (a0) to double precision. Operands whose biased
- | exponent is <= $3c01 (unsigned compare) go to cu_nunfl with d0 = 2.
- | Otherwise round is called with d1 = precision (2) in the upper word
- | and the FPCR rounding mode in the lower word, d0 = 0, and the sign
- | held in LOCAL_SGN for the duration of the call.
- movel #2,%d0 |set up the size for denorm
- movew LOCAL_EX(%a0),%d1 |compare exponent to double threshold
- andw #0x7fff,%d1
- cmpw #0x3c01,%d1
- bls cu_nunfl
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rmode
- orl #0x00020000,%d1 |or in rprec (double)
- clrl %d0 |clear g,r,s for round
- bclrb #sign_bit,LOCAL_EX(%a0) |convert to internal format
- sne LOCAL_SGN(%a0)
- bsrl round
- | Restore the sign bit if the saved sign byte was non-zero.
- bfclr LOCAL_SGN(%a0){#0:#8}
- beqs cu_nmrdc
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nmrdc:
- | A rounded exponent of $43ff or more is handed to cu_novfl.
- movew LOCAL_EX(%a0),%d1 |check for overflow
- andw #0x7fff,%d1
- cmpw #0x43ff,%d1
- bge cu_novfl |take care of overflow case
- bra cu_wrexn
- |
- | The move is fsmove or round precision is single.
- |
- cu_nmrs:
- | Round a norm at (a0) to single precision. Same shape as cu_nmrd:
- | biased exponent <= $3f81 goes to cu_nunfl with d0 = 1; otherwise
- | round is called with precision 1 in the upper word of d1, the FPCR
- | rounding mode in the lower word, and d0 = 0.
- movel #1,%d0
- movew LOCAL_EX(%a0),%d1
- andw #0x7fff,%d1
- cmpw #0x3f81,%d1
- bls cu_nunfl
- bfextu FPCR_MODE(%a6){#2:#2},%d1
- orl #0x00010000,%d1
- clrl %d0
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsrl round
- bfclr LOCAL_SGN(%a0){#0:#8}
- beqs cu_nmrsc
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nmrsc:
- | Rounded exponent below $407f: write the result. Otherwise fall
- | through into cu_novfl.
- movew LOCAL_EX(%a0),%d1
- andw #0x7FFF,%d1
- cmpw #0x407f,%d1
- blt cu_wrexn
- |
- | The operand is above precision boundaries. Use t_ovfl to
- | generate the correct value.
- |
- cu_novfl:
- | Reached from cu_nmrdc (branch) and cu_nmrsc (fall-through) when the
- | rounded exponent is at or above the destination limit. t_ovfl is
- | defined elsewhere; after it returns the result is written through
- | cu_wrexn like any other value.
- bsr t_ovfl
- bra cu_wrexn
- |
- | The operand is below precision boundaries. Use denorm to
- | generate the correct value.
- |
- cu_nunfl:
- | Entered from cu_nmrd (d0 = 2) or cu_nmrs (d0 = 1) with a0 -> operand.
- | The sign is parked in LOCAL_SGN around the denorm call and put back
- | into the exponent word afterwards.
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsr denorm
- bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format
- beqs cu_nucont
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nucont:
- | Build d1 for round: rounding mode in the lower word, precision in
- | the upper word (2 if command bit 2 is set, 1 if bit 6 is set,
- | otherwise the FPCR precision field).
- bfextu FPCR_MODE(%a6){#2:#2},%d1
- btstb #2,CMDREG1B+1(%a6) |check for rd
- bne inst_d
- btstb #6,CMDREG1B+1(%a6) |check for rs
- bne inst_s
- | No forced precision: swap the rounding mode into the upper word,
- | shift the top two bits of FPCR_MODE down into the low byte, and
- | swap back so precision ends up in the upper word.
- swap %d1
- moveb FPCR_MODE(%a6),%d1
- lsrb #6,%d1
- swap %d1
- bra inst_sd
- inst_d:
- orl #0x00020000,%d1
- bra inst_sd
- inst_s:
- orl #0x00010000,%d1
- inst_sd:
- | d0 is passed to round exactly as denorm left it.
- | NOTE(review): presumably the guard/round/sticky bits - confirm
- | against denorm, which is not part of this file section.
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsrl round
- bfclr LOCAL_SGN(%a0){#0:#8}
- beqs cu_nuflp
- bsetb #sign_bit,LOCAL_EX(%a0)
- cu_nuflp:
- | Post-processing of an underflowed result at (a0): set AUNFL when the
- | rounding was inexact, patch in an lsb when the mantissa rounded to
- | zero under a directed rounding mode, set Z/UNFL, and copy the three
- | longwords at (a0) into ETEMP.
- btstb #inex2_bit,FPSR_EXCEPT(%a6)
- beqs cu_nuninx
- orl #aunfl_mask,USER_FPSR(%a6) |if the round was inex, set AUNFL
- cu_nuninx:
- tstl LOCAL_HI(%a0) |test for zero
- bnes cu_nunzro
- tstl LOCAL_LO(%a0)
- bnes cu_nunzro
- |
- | The mantissa is zero from the denorm loop. Check sign and rmode
- | to see if rounding should have occurred which would leave the lsb.
- |
- | The rounding mode field is compared with $20: below (values $00 and
- | $10) -> plain zero; equal (rm) -> cu_nrm; above ($30, rp) -> cu_nrp.
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0 |isolate rmode
- cmpil #0x20,%d0
- blts cu_nzro
- bnes cu_nrp
- cu_nrm:
- tstw LOCAL_EX(%a0) |if negative, set lsb
- bges cu_nzro
- btstb #7,FPCR_MODE(%a6) |check for double
- beqs cu_nincs
- bras cu_nincd
- cu_nrp:
- tstw LOCAL_EX(%a0) |if positive, set lsb
- blts cu_nzro
- btstb #7,FPCR_MODE(%a6) |check for double
- beqs cu_nincs
- cu_nincd:
- orl #0x800,LOCAL_LO(%a0) |inc for double
- bra cu_nunzro
- cu_nincs:
- orl #0x100,LOCAL_HI(%a0) |inc for single
- bra cu_nunzro
- cu_nzro:
- orl #z_mask,USER_FPSR(%a6)
- | NOTE(review): with the tag encoding given at dyadic/monadic
- | (zero=001, inf=010 in the top three bits) the value $40 is the inf
- | tag, not zero, and cu_nmove only lets tag 000 reach this code, so
- | this branch looks unreachable from the visible paths - confirm.
- moveb STAG(%a6),%d0
- andib #0xe0,%d0
- cmpib #0x40,%d0 |check if input was tagged zero
- beqs cu_numv
- cu_nunzro:
- orl #unfl_mask,USER_FPSR(%a6) |set unfl
- cu_numv:
- movel (%a0),ETEMP(%a6)
- movel 4(%a0),ETEMP_HI(%a6)
- movel 8(%a0),ETEMP_LO(%a6)
- |
- | Write the result to memory, setting the fpsr cc bits. NaN and Inf
- | bypass cu_wrexn.
- |
- cu_wrexn:
- | Set Z when the exponent word at (a0) is $0000 or $8000, set N when
- | its sign bit is set, then leave through wr_etemp. Only the exponent
- | word is examined here; the mantissa is not tested.
- tstw LOCAL_EX(%a0) |test for zero
- beqs cu_wrzero
- cmpw #0x8000,LOCAL_EX(%a0) |test for zero
- bnes cu_wreon
- cu_wrzero:
- orl #z_mask,USER_FPSR(%a6) |set Z bit
- cu_wreon:
- tstw LOCAL_EX(%a0)
- bpl wr_etemp
- orl #neg_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | HANDLE SOURCE DENORM HERE
- |
- | ;clear denorm stag to norm
- | ;write the new tag & ete15 to the fstack
- mon_dnrm:
- | Source operand is denormalized. Dyadic ops and the fsqrt family are
- | normalized (nrm_src); fmove/fabs/fneg/ftst are completed in software
- | by cu_dnrm without normalizing.
- |
- | At this point, check for the cases in which normalizing the
- | denorm produces incorrect results.
- |
- tstb DY_MO_FLG(%a6) |all cases of dyadic instructions would
- bnes nrm_src |require normalization of denorm
- | At this point:
- | monadic instructions: fabs = $18 fneg = $1a ftst = $3a
- | fmove = $00 fsmove = $40 fdmove = $44
- | fsqrt = $05* fssqrt = $41 fdsqrt = $45
- | (*fsqrt reencoded to $05)
- |
- movew CMDREG1B(%a6),%d0 |get command register
- andil #0x7f,%d0 |strip to only command word
- |
- | At this point, fabs, fneg, fmove, fsmove, fdmove, ftst, fsqrt, fssqrt,
- | and fdsqrt are possible.
- | For cases fabs, fneg, ftst, fmove, fsmove, and fdmove goto cu_dnrm
- | (do not normalize)
- | For cases fsqrt, fssqrt, and fdsqrt goto nrm_src (do normalize)
- |
- btstl #0,%d0
- bnes nrm_src |weed out fsqrt instructions
- st CU_ONLY(%a6) |set cu-only inst flag
- bra cu_dnrm |fmove, fabs, fneg, ftst
- | ;cases go to cu_dnrm
- nrm_src:
- | Normalize the denormalized source at (a0) (a0 -> ETEMP, set at
- | monadic). Mirrors the destination handling at dyadic/dpos: the sign
- | is parked in LOCAL_SGN around nrm_set, the tag is rewritten, and
- | "source was denormalized" ($f0) is recorded in DNRM_FLG.
- bclrb #sign_bit,LOCAL_EX(%a0)
- sne LOCAL_SGN(%a0)
- bsr nrm_set |normalize number (exponent will go
- | ; negative)
- bclrb #sign_bit,LOCAL_EX(%a0) |get rid of false sign
- bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format
- beqs spos
- bsetb #sign_bit,LOCAL_EX(%a0)
- spos:
- bfclr STAG(%a6){#0:#4} |set tag to normalized, ETE15 = 0
- bsetb #4,STAG(%a6) |set ETE15
- orb #0xf0,DNRM_FLG(%a6)
- normal:
- | If either operand was denormalized (DNRM_FLG != 0) the wrap-around
- | screening at ck_wrap runs first; otherwise fall into fix_stk.
- tstb DNRM_FLG(%a6) |check if any of the ops were denorms
- bne ck_wrap |if so, check if it is a potential
- | ;wrap-around case
- fix_stk:
- | Prepare the frame for a restore: store $fe in CU_SAVEPC, clear E1 in
- | E_BYTE, clear NMNEXC, and set RES_FLG so the caller knows a restore
- | is needed. This is the normal exit of res_func.
- moveb #0xfe,CU_SAVEPC(%a6)
- bclrb #E1,E_BYTE(%a6)
- clrw NMNEXC(%a6)
- st RES_FLG(%a6) |indicate that a restore is needed
- rts
- |
- | cu_dnrm handles all cu-only instructions (fmove, fabs, fneg, and
- | ftst) completely in software without an frestore to the 040.
- |
- cu_dnrm:
- | Denormalized-source counterpart of cu_norm: masks the command with
- | $3b and dispatches $00 -> cu_dmove, $18 -> cu_dabs, $1a -> cu_dneg;
- | anything else falls through to cu_dtst. CU_ONLY is set again here
- | (mon_dnrm already set it before branching).
- st CU_ONLY(%a6)
- movew CMDREG1B(%a6),%d0
- andib #0x3b,%d0 |isolate bits to select inst
- tstb %d0
- beql cu_dmove |if zero, it is an fmove
- cmpib #0x18,%d0
- beql cu_dabs |if $18, it is fabs
- cmpib #0x1a,%d0
- beql cu_dneg |if $1a, it is fneg
- |
- | Inst is ftst. Check the source operand and set the cc's accordingly.
- | No write is done, so simply rts.
- |
- cu_dtst:
- | ftst on a denormalized source at (a0). Instruction-for-instruction
- | the same tests as cu_ntst: N from the sign bit, then I / NAN when the
- | exponent is $7fff, else Z when both mantissa longwords are zero.
- | Only USER_FPSR is updated; every path ends in rts.
- movew LOCAL_EX(%a0),%d0
- | bclr sets Z from the old sign bit; sne does not alter the flags.
- bclrl #15,%d0
- sne LOCAL_SGN(%a0)
- beqs cu_dtpo
- orl #neg_mask,USER_FPSR(%a6) |set N
- cu_dtpo:
- cmpiw #0x7fff,%d0 |test for inf/nan
- bnes cu_dtcz
- tstl LOCAL_HI(%a0)
- bnes cu_dtn
- tstl LOCAL_LO(%a0)
- bnes cu_dtn
- orl #inf_mask,USER_FPSR(%a6)
- rts
- cu_dtn:
- orl #nan_mask,USER_FPSR(%a6)
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- rts
- cu_dtcz:
- tstl LOCAL_HI(%a0)
- bnel cu_dtsx
- tstl LOCAL_LO(%a0)
- bnel cu_dtsx
- orl #z_mask,USER_FPSR(%a6)
- cu_dtsx:
- rts
- |
- | Inst is fabs. Execute the absolute value function on the input.
- | Branch to the fmove code.
- |
- cu_dabs:
- | fabs on a denormalized source: clear the sign bit in the exponent
- | word at (a0) and let cu_dmove finish. Unlike cu_nabs there is no
- | tag test on this path.
- bclrb #7,LOCAL_EX(%a0) |do abs
- bras cu_dmove |fmove code will finish
- |
- | Inst is fneg. Execute the negate value function on the input.
- | Fall though to the fmove code.
- |
- cu_dneg:
- | Toggle the sign bit, then fall through into cu_dmove.
- bchgb #7,LOCAL_EX(%a0) |do neg
- |
- | Inst is fmove. This code also handles all result writes.
- | If bit 2 is set, round is forced to double. If it is clear,
- | and bit 6 is set, round is forced to single. If both are clear,
- | the round precision is found in the fpcr. If the rounding precision
- | is double or single, the result is zero, and the mode is checked
- | to determine if the lsb of the result should be set.
- |
- cu_dmove:
- | Pick the rounding precision for a denormalized source: command bit 2
- | forces double (cu_dmrd), else bit 6 forces single (cu_dmrs), else
- | the FPCR precision field decides in cu_dmnr.
- btstb #2,CMDREG1B+1(%a6) |check for rd
- bne cu_dmrd
- btstb #6,CMDREG1B+1(%a6) |check for rs
- bne cu_dmrs
- |
- | The move or operation is not with forced precision. Use the
- | FPCR_MODE byte to get rounding.
- |
- cu_dmnr:
- | Precision field: 0 = extended -> cu_wrexd, 1 = single -> cu_dmrs,
- | anything else falls through to cu_dmrd.
- bfextu FPCR_MODE(%a6){#0:#2},%d0
- tstb %d0 |check for extended
- beq cu_wrexd |if so, just write result
- cmpib #1,%d0 |check for single
- beq cu_dmrs |fall through to double
- |
- | The move is fdmove or round precision is double. Result is zero.
- | Check rmode for rp or rm and set lsb accordingly.
- |
- cu_dmrd:
- | Double-precision result for a denormalized source. d1 = rounding
- | mode (3 = rp, 2 = rm per the compares below). The lsb variant is
- | chosen only when the rounding direction matches the operand's sign:
- | positive with rp, or negative with rm.
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rmode
- tstw LOCAL_EX(%a0) |check sign
- blts cu_dmdn
- cmpib #3,%d1 |check for rp
- bne cu_dpd |load double pos zero
- bra cu_dpdr |load double pos zero w/lsb
- cu_dmdn:
- cmpib #2,%d1 |check for rm
- bne cu_dnd |load double neg zero
- bra cu_dndr |load double neg zero w/lsb
- |
- | The move is fsmove or round precision is single. Result is zero.
- | Check for rp or rm and set lsb accordingly.
- |
- cu_dmrs:
- | Same selection as cu_dmrd, targeting the single-precision writers.
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rmode
- tstw LOCAL_EX(%a0) |check sign
- blts cu_dmsn
- cmpib #3,%d1 |check for rp
- bne cu_spd |load single pos zero
- bra cu_spdr |load single pos zero w/lsb
- cu_dmsn:
- cmpib #2,%d1 |check for rm
- bne cu_snd |load single neg zero
- bra cu_sndr |load single neg zero w/lsb
- |
- | The precision is extended, so the result in etemp is correct.
- | Simply set unfl (not inex2 or aunfl) and write the result to
- | the correct fp register.
- cu_wrexd:
- | Extended precision with a denormalized source: set UNFL, set N when
- | the exponent word at (a0) is non-zero, and write through wr_etemp.
- | NOTE(review): using "word != 0" as the sign test presumably relies on
- | a denorm's exponent bits being zero so only the sign bit can be set -
- | confirm.
- orl #unfl_mask,USER_FPSR(%a6)
- tstw LOCAL_EX(%a0)
- beq wr_etemp
- orl #neg_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | These routines write +/- zero in double format. The routines
- | cu_dpdr and cu_dndr set the double lsb.
- |
- cu_dpd:
- | Each of the four routines below overwrites the operand at (a0) with
- | exponent word $3c01 (sign bit added for the negative variants) and a
- | mantissa that is either all zero or has only bit 11 ($800) of
- | LOCAL_LO set, ORs the matching FPSR bits into USER_FPSR, and leaves
- | through wr_etemp. Z is set only for the all-zero variants.
- movel #0x3c010000,LOCAL_EX(%a0) |force pos double zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_dpdr:
- movel #0x3c010000,LOCAL_EX(%a0) |force pos double zero
- clrl LOCAL_HI(%a0)
- movel #0x800,LOCAL_LO(%a0) |with lsb set
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_dnd:
- movel #0xbc010000,LOCAL_EX(%a0) |force neg double zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_dndr:
- movel #0xbc010000,LOCAL_EX(%a0) |force neg double zero
- clrl LOCAL_HI(%a0)
- movel #0x800,LOCAL_LO(%a0) |with lsb set
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | These routines write +/- zero in single format. The routines
- | cu_spdr and cu_sndr set the single lsb.
- |
- cu_spd:
- | Single-precision counterparts of cu_dpd..cu_dndr: exponent word
- | $3f81 (sign bit added for the negative variants), mantissa all zero
- | or only bit 8 ($100) of LOCAL_HI set, matching FPSR bits ORed into
- | USER_FPSR, exit through wr_etemp.
- movel #0x3f810000,LOCAL_EX(%a0) |force pos single zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_spdr:
- movel #0x3f810000,LOCAL_EX(%a0) |force pos single zero
- movel #0x100,LOCAL_HI(%a0) |with lsb set
- clrl LOCAL_LO(%a0)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_snd:
- movel #0xbf810000,LOCAL_EX(%a0) |force neg single zero
- clrl LOCAL_HI(%a0)
- clrl LOCAL_LO(%a0)
- orl #z_mask,USER_FPSR(%a6)
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- cu_sndr:
- movel #0xbf810000,LOCAL_EX(%a0) |force neg single zero
- movel #0x100,LOCAL_HI(%a0) |with lsb set
- clrl LOCAL_LO(%a0)
- orl #neg_mask,USER_FPSR(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- bra wr_etemp
- |
- | This code checks for 16-bit overflow conditions on dyadic
- | operations which are not restorable into the floating-point
- | unit and must be completed in software. Basically, this
- | condition exists with a very large norm and a denorm. One
- | of the operands must be denormalized to enter this code.
- |
- | Flags used:
- | DY_MO_FLG contains 0 for monadic op, $ff for dyadic
- | DNRM_FLG contains $00 for neither op denormalized
- | $0f for the destination op denormalized
- | $f0 for the source op denormalized
- | $ff for both ops denormalized
- |
- | The wrap-around condition occurs for add, sub, div, and cmp
- | when
- |
- | abs(dest_exp - src_exp) >= $8000
- |
- | and for mul when
- |
- | (dest_exp + src_exp) < $0
- |
- | we must process the operation here if this case is true.
- |
- | The rts following the frcfpn routine is the exit from res_func
- | for this condition. The restore flag (RES_FLG) is left clear.
- | No frestore is done unless an exception is to be reported.
- |
- | For fadd:
- | if(sign_of(dest) != sign_of(src))
- | replace exponent of src with $3fff (keep sign)
- | use fpu to perform dest+new_src (user's rmode and X)
- | clr sticky
- | else
- | set sticky
- | call round with user's precision and mode
- | move result to fpn and wbtemp
- |
- | For fsub:
- | if(sign_of(dest) == sign_of(src))
- | replace exponent of src with $3fff (keep sign)
- | use fpu to perform dest+new_src (user's rmode and X)
- | clr sticky
- | else
- | set sticky
- | call round with user's precision and mode
- | move result to fpn and wbtemp
- |
- | For fdiv/fsgldiv:
- | if(both operands are denorm)
- | restore_to_fpu;
- | if(dest is norm)
- | force_ovf;
- | else(dest is denorm)
- | force_unf:
- |
- | For fcmp:
- | if(dest is norm)
- | N = sign_of(dest);
- | else(dest is denorm)
- | N = sign_of(src);
- |
- | For fmul:
- | if(both operands are denorm)
- | force_unf;
- | if((dest_exp + src_exp) < 0)
- | force_unf:
- | else
- | restore_to_fpu;
- |
- | local equates:
- | Command values as they appear after CMDREG1B is masked with $3b in
- | ck_wrap. divcode is not compared explicitly in ck_wrap: fdiv is the
- | fall-through case after the other four compares.
- .set addcode,0x22
- .set subcode,0x28
- .set mulcode,0x23
- .set divcode,0x20
- .set cmpcode,0x38
- ck_wrap:
- | Wrap-around screening, entered from normal when DNRM_FLG != 0.
- | Monadic ops (only the fsqrt family gets here) are sent straight to
- | fix_stk; dyadic ops are dispatched on the command bits to wrap_add,
- | wrap_sub, wrap_mul or wrap_cmp, with fdiv as the fall-through case
- | (wrap_div).
- |
- | The DY_MO_FLG test must be executed here: the visible entry is
- | "tstb DNRM_FLG / bne ck_wrap", so Z is always clear on arrival and a
- | bare beq could never be taken, sending fsqrt of a denorm into the
- | fdiv wrap logic with an undefined destination operand.
- tstb DY_MO_FLG(%a6) |check for fsqrt (0 = monadic)
- beq fix_stk |if zero, it is fsqrt
- movew CMDREG1B(%a6),%d0
- andiw #0x3b,%d0 |strip to command bits
- cmpiw #addcode,%d0
- beq wrap_add
- cmpiw #subcode,%d0
- beq wrap_sub
- cmpiw #mulcode,%d0
- beq wrap_mul
- cmpiw #cmpcode,%d0
- beq wrap_cmp
- |
- | Inst is fdiv.
- |
- wrap_div:
- | fdiv with at least one denormalized operand. Both denormalized
- | ($ff) -> restore to the FPU. Otherwise pick the path by which
- | operand was the denorm.
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and force the result.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes div_srcd
- div_destd:
- | Destination is the denorm. ckinf_ns returns non-zero (Z clear) when
- | the source is tagged zero, inf or NaN; those go to fix_stk.
- bsrl ckinf_ns
- bne fix_stk
- | d0 = src exponent (unsigned 15 bits) - dest exponent (sign-extended
- | 15 bits).
- | NOTE(review): this path compares against $7fff while div_srcd and
- | the fadd paths use $8000 - presumably intentional; confirm.
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x7fff,%d0
- blt fix_stk |if less, not wrap case
- | Wrap case: WBTEMP_SGN = $ff when the operand signs differ, else 0,
- | then force an underflow result (force_unf is defined elsewhere).
- clrb WBTEMP_SGN(%a6)
- movew ETEMP_EX(%a6),%d0 |find the sign of the result
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- beq force_unf
- st WBTEMP_SGN(%a6)
- bra force_unf
- ckinf_ns:
- | Subroutines ckinf_ns (source tag) and ckinf_nd (destination tag).
- | Return d0 = -1 with Z clear when tag bits 6-5 are non-zero (zero,
- | inf or NaN), or d0 = 0 with Z set when they are 00. Callers test the
- | result with bne immediately after the bsr; rts leaves the condition
- | codes from moveq/clr intact. Only d0 is modified.
- moveb STAG(%a6),%d0 |check source tag for inf or nan
- bra ck_in_com
- ckinf_nd:
- moveb DTAG(%a6),%d0 |check destination tag for inf or nan
- ck_in_com:
- andib #0x60,%d0 |isolate tag bits
- cmpb #0x40,%d0 |is it inf?
- beq nan_or_inf |not wrap case
- cmpb #0x60,%d0 |is it nan?
- beq nan_or_inf |yes, not wrap case?
- cmpb #0x20,%d0 |is it a zero?
- beq nan_or_inf |yes
- clrl %d0
- rts |tag bits are 00 (zero, inf and nan were
- | ;ruled out above); caller checks wrap case
- nan_or_inf:
- moveql #-1,%d0
- rts
- div_srcd:
- | fdiv with a denormalized source. A destination tagged zero, inf or
- | NaN goes to fix_stk. Otherwise the wrap case is dest exponent minus
- | (sign-extended) source exponent >= $8000. In the wrap case
- | WBTEMP_SGN is set to $ff when the operand signs differ, and control
- | reaches force_ovf by branch (like signs) or by falling through.
- bsrl ckinf_nd
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- clrb WBTEMP_SGN(%a6)
- movew ETEMP_EX(%a6),%d0 |find the sign of the result
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- beqs force_ovf
- st WBTEMP_SGN(%a6)
- |
- | This code handles the case of the instruction resulting in
- | an overflow condition.
- |
- force_ovf:
- | Produce an overflow result in WBTEMP. Expects WBTEMP_SGN to hold the
- | result sign ($ff = negative), as set up by div_srcd. Clears E1 and
- | NMNEXC, ORs ovfl_inx_mask into USER_FPSR, and calls ovf_res with
- | a0 -> WBTEMP and d0 = precision: 1 or 2 when command bit 6 marks a
- | forced-precision instruction (bit 2 selects double), otherwise the
- | FPCR precision field. Exits through frcfpn (defined elsewhere).
- bclrb #E1,E_BYTE(%a6)
- orl #ovfl_inx_mask,USER_FPSR(%a6)
- clrw NMNEXC(%a6)
- leal WBTEMP(%a6),%a0 |point a0 to memory location
- movew CMDREG1B(%a6),%d0
- btstl #6,%d0 |test for forced precision
- beqs frcovf_fpcr
- btstl #2,%d0 |check for double
- bnes frcovf_dbl
- movel #0x1,%d0 |inst is forced single
- bras frcovf_rnd
- frcovf_dbl:
- movel #0x2,%d0 |inst is forced double
- bras frcovf_rnd
- frcovf_fpcr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0 |inst not forced - use fpcr prec
- frcovf_rnd:
- | The 881/882 does not set inex2 for the following case, so the
- | line is commented out to be compatible with 881/882
- | tst.b %d0
- | beq.b frcovf_x
- | or.l #inex2_mask,USER_FPSR(%a6) ;if prec is s or d, set inex2
- |frcovf_x:
- bsrl ovf_res |get correct result based on
- | ;round precision/mode. This
- | ;sets FPSR_CC correctly
- | ;returns in external format
- | Fold the saved sign byte back into the exponent word: bfclr sets Z
- | from the byte's previous value, so the bset runs only when it was
- | non-zero.
- bfclr WBTEMP_SGN(%a6){#0:#8}
- beq frcfpn
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpn
- |
- | Inst is fadd.
- |
- wrap_add:
- | fadd with at least one denormalized operand. Both denormalized ->
- | restore to the FPU. Otherwise the other operand's tag is screened
- | (zero/inf/NaN -> fix_stk) and the exponent difference is compared
- | with $8000; smaller differences are not wrap cases and also go to
- | fix_stk. Wrap cases continue at add_wrap.
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes add_srcd
- add_destd:
- bsrl ckinf_ns
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- bra add_wrap
- add_srcd:
- | Source is the denorm; falls through into add_wrap in the wrap case.
- bsrl ckinf_nd
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- |
- | Check the signs of the operands. If they are unlike, the fpu
- | can be used to add the norm and 1.0 with the sign of the
- | denorm and it will correctly generate the result in extended
- | precision. We can then call round with no sticky and the result
- | will be correct for the user's rounding mode and precision. If
- | the signs are the same, we call round with the sticky bit set
- | and the result will be correct for the user's rounding mode and
- | precision.
- |
- add_wrap:
- | Wrap case for fadd. Like signs -> add_same. Unlike signs with a
- | denormalized source -> add_u_srcd. The code that follows handles
- | unlike signs with a denormalized destination.
- movew ETEMP_EX(%a6),%d0
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0
- andiw #0x8000,%d0
- beq add_same
- |
- | The signs are unlike.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes add_u_srcd
- | Replace the denorm's exponent word with $3fff, keeping its sign.
- movew FPTEMP_EX(%a6),%d0
- andiw #0x8000,%d0
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,FPTEMP_EX(%a6) |in the denorm
- | Load the FPCR with only the user's rounding-mode bits ($30 mask),
- | do the add in the FPU, and merge the resulting FPSR into USER_FPSR.
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex ETEMP(%a6),%fp0
- faddx FPTEMP(%a6),%fp0
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fadd
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- | Build d1 for round (precision in the upper word, rounding mode in
- | the lower word) from USER_FPCR; d0 still holds the masked rmode.
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- | Park the sign in WBTEMP_SGN for the round call, restore it after.
- bclrb #sign_bit,WBTEMP_EX(%a6)
- sne WBTEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- add_u_srcd:
- | Unlike signs, denormalized source. Same sequence as the
- | destination-denorm case in add_wrap, except that the exponent word
- | replaced with $3fff (sign kept) is ETEMP's. The FPU add result is
- | stored in WBTEMP, rounded to the user's precision and mode with
- | d0 = 0, and control leaves through frcfpnr.
- movew ETEMP_EX(%a6),%d0
- andiw #0x8000,%d0
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,ETEMP_EX(%a6) |in the denorm
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex ETEMP(%a6),%fp0
- faddx FPTEMP(%a6),%fp0
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fadd
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- | d1 = precision (upper word) | rounding mode (lower word) for round.
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- bclrb #sign_bit,WBTEMP_EX(%a6)
- sne WBTEMP_SGN(%a6) |use internal format for round
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- |
- | Signs are alike:
- |
- add_same:
- | Like signs. The non-denormalized operand is rounded in place with
- | d0 = $20000000 (sticky set) and then copied to WBTEMP. This part
- | handles a denormalized destination, so the operand rounded is ETEMP.
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes add_s_srcd
- add_s_destd:
- leal ETEMP(%a6),%a0
- | d1 = precision (upper word) | rounding mode (lower word) for round.
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- bclrb #sign_bit,ETEMP_EX(%a6)
- sne ETEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr ETEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs add_s_dclr
- bsetb #sign_bit,ETEMP_EX(%a6)
- add_s_dclr:
- leal WBTEMP(%a6),%a0
- movel ETEMP(%a6),(%a0) |write result to wbtemp
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- | bgt is a signed test: N is set unless the exponent word is a
- | positive, non-zero value.
- tstw ETEMP_EX(%a6)
- bgt add_ckovf
- orl #neg_mask,USER_FPSR(%a6)
- bra add_ckovf
- add_s_srcd:
- leal FPTEMP(%a6),%a0
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- bclrb #sign_bit,FPTEMP_EX(%a6)
- sne FPTEMP_SGN(%a6)
- bsrl round |round result to users rmode & prec
- bfclr FPTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs add_s_sclr
- bsetb #sign_bit,FPTEMP_EX(%a6)
- add_s_sclr:
- leal WBTEMP(%a6),%a0
- movel FPTEMP(%a6),(%a0) |write result to wbtemp
- movel FPTEMP_HI(%a6),4(%a0)
- movel FPTEMP_LO(%a6),8(%a0)
- tstw FPTEMP_EX(%a6)
- bgt add_ckovf
- orl #neg_mask,USER_FPSR(%a6)
- add_ckovf:
- movew WBTEMP_EX(%a6),%d0
- andiw #0x7fff,%d0
- cmpiw #0x7fff,%d0
- bne frcfpnr
- |
- | The result has overflowed to $7fff exponent. Set I, ovfl,
- | and aovfl, and clr the mantissa (incorrectly set by the
- | round routine.)
- |
- orl #inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
- clrl 4(%a0)
- bra frcfpnr
- | wrap_sub --- finish an fsub in which exactly one operand is denormalized.
- | Inst is fsub.
- | Non-wrap cases go to fix_stk; wrap results are built in WBTEMP and leave via frcfpnr.
- wrap_sub:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes sub_srcd
- sub_destd:
- bsrl ckinf_ns |helper outside this chunk; Z clear on return -> fix_stk
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- bra sub_wrap
- sub_srcd:
- bsrl ckinf_nd |helper outside this chunk; Z clear on return -> fix_stk
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- |
- | Check the signs of the operands. If they are alike, the fpu
- | can be used to subtract from the norm 1.0 with the sign of the
- | denorm and it will correctly generate the result in extended
- | precision. We can then call round with no sticky and the result
- | will be correct for the user's rounding mode and precision. If
- | the signs are unlike, we call round with the sticky bit set
- | and the result will be correct for the user's rounding mode and
- | precision.
- |
- sub_wrap:
- movew ETEMP_EX(%a6),%d0
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0 |bit 15 of d0 = src sign xor dest sign
- andiw #0x8000,%d0
- bne sub_diff |signs differ
- |
- | The signs are alike.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes sub_u_srcd
- movew FPTEMP_EX(%a6),%d0
- andiw #0x8000,%d0 |keep only the sign of the denorm
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,FPTEMP_EX(%a6) |in the denorm
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex FPTEMP(%a6),%fp0
- fsubx ETEMP(%a6),%fp0 |fp0 = FPTEMP - ETEMP
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fsub
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- bclrb #sign_bit,WBTEMP_EX(%a6) |move the sign out of the exponent word
- sne WBTEMP_SGN(%a6) |and into the SGN byte (internal format for round)
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr |SGN byte was zero: result is positive
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- sub_u_srcd:
- movew ETEMP_EX(%a6),%d0
- andiw #0x8000,%d0 |keep only the sign of the denorm
- orw #0x3fff,%d0 |force the exponent to +/- 1
- movew %d0,ETEMP_EX(%a6) |in the denorm
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- fmovel %d0,%fpcr |set up users rmode and X
- fmovex FPTEMP(%a6),%fp0
- fsubx ETEMP(%a6),%fp0 |fp0 = FPTEMP - ETEMP
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture cc's and inex from fsub
- leal WBTEMP(%a6),%a0 |point a0 to wbtemp in frame
- fmovex %fp0,WBTEMP(%a6) |write result to memory
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- clrl %d0 |force sticky to zero
- bclrb #sign_bit,WBTEMP_EX(%a6) |move the sign out of the exponent word
- sne WBTEMP_SGN(%a6) |and into the SGN byte (internal format for round)
- bsrl round |round result to users rmode & prec
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beq frcfpnr |SGN byte was zero: result is positive
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpnr
- |
- | Signs are unlike:
- |
- sub_diff:
- cmpb #0x0f,DNRM_FLG(%a6) |is dest the denorm?
- bnes sub_s_srcd
- sub_s_destd:
- leal ETEMP(%a6),%a0 |round operates on ETEMP (the norm) in place
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- |
- | Since the dest is the denorm, the sign is the opposite of the
- | norm sign.
- |
- eoriw #0x8000,ETEMP_EX(%a6) |flip sign on result
- tstw ETEMP_EX(%a6)
- bgts sub_s_dwr |positive result: leave N alone
- orl #neg_mask,USER_FPSR(%a6)
- sub_s_dwr:
- bclrb #sign_bit,ETEMP_EX(%a6) |move the sign out of the exponent word
- sne ETEMP_SGN(%a6) |and into the SGN byte (internal format for round)
- bsrl round |round result to users rmode & prec
- bfclr ETEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs sub_s_dclr
- bsetb #sign_bit,ETEMP_EX(%a6)
- sub_s_dclr:
- leal WBTEMP(%a6),%a0
- movel ETEMP(%a6),(%a0) |write result to wbtemp
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- bra sub_ckovf
- sub_s_srcd:
- leal FPTEMP(%a6),%a0 |round operates on FPTEMP (the norm) in place
- movel USER_FPCR(%a6),%d0
- andil #0x30,%d0
- lsrl #4,%d0 |put rmode in lower 2 bits
- movel USER_FPCR(%a6),%d1
- andil #0xc0,%d1
- lsrl #6,%d1 |put precision in upper word
- swap %d1
- orl %d0,%d1 |set up for round call
- movel #0x20000000,%d0 |set sticky for round
- bclrb #sign_bit,FPTEMP_EX(%a6) |move the sign out of the exponent word
- sne FPTEMP_SGN(%a6) |and into the SGN byte (internal format for round)
- bsrl round |round result to users rmode & prec
- bfclr FPTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs sub_s_sclr
- bsetb #sign_bit,FPTEMP_EX(%a6)
- sub_s_sclr:
- leal WBTEMP(%a6),%a0
- movel FPTEMP(%a6),(%a0) |write result to wbtemp
- movel FPTEMP_HI(%a6),4(%a0)
- movel FPTEMP_LO(%a6),8(%a0)
- tstw FPTEMP_EX(%a6)
- bgt sub_ckovf |positive result: leave N alone
- orl #neg_mask,USER_FPSR(%a6)
- sub_ckovf:
- movew WBTEMP_EX(%a6),%d0
- andiw #0x7fff,%d0 |drop the sign, keep the exponent
- cmpiw #0x7fff,%d0
- bne frcfpnr |exponent below $7fff: no overflow
- |
- | The result has overflowed to $7fff exponent. Set I, ovfl,
- | and aovfl, and clr the mantissa (incorrectly set by the
- | round routine.)
- |
- orl #inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
- clrl 4(%a0) |a0 = WBTEMP here; clears the longword copied from the _HI field
- bra frcfpnr
- | wrap_cmp --- finish an fcmp in which exactly one operand is denormalized.
- | Inst is fcmp.
- | Only the N bit of USER_FPSR may be set here; non-wrap cases go to fix_stk.
- wrap_cmp:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq fix_stk |restore to fpu
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes cmp_srcd
- cmp_destd:
- bsrl ckinf_ns |helper outside this chunk; Z clear on return -> fix_stk
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- subl %d1,%d0 |subtract dest from src
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- tstw ETEMP_EX(%a6) |set N to ~sign_of(src)
- bge cmp_setn |src non-negative: set N
- rts
- cmp_srcd:
- bsrl ckinf_nd |helper outside this chunk; Z clear on return -> fix_stk
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- subl %d1,%d0 |subtract src from dest
- cmpl #0x8000,%d0
- blt fix_stk |if less, not wrap case
- tstw FPTEMP_EX(%a6) |set N to sign_of(dest)
- blt cmp_setn |dest negative: set N
- rts
- cmp_setn:
- orl #neg_mask,USER_FPSR(%a6)
- rts
- | wrap_mul --- finish an fmul that has a denormalized operand.
- | Inst is fmul.
- | Either restores to the fpu (fix_stk) or falls into force_unf to build an underflow result.
- wrap_mul:
- cmpb #0xff,DNRM_FLG(%a6) |if both ops denorm,
- beq force_unf |force an underflow (really!)
- |
- | One of the ops is denormalized. Test for wrap condition
- | and complete the instruction.
- |
- cmpb #0x0f,DNRM_FLG(%a6) |check for dest denorm
- bnes mul_srcd
- mul_destd:
- bsrl ckinf_ns |helper outside this chunk; Z clear on return -> fix_stk
- bne fix_stk
- bfextu ETEMP_EX(%a6){#1:#15},%d0 |get src exp (always pos)
- bfexts FPTEMP_EX(%a6){#1:#15},%d1 |get dest exp (always neg)
- addl %d1,%d0 |add dest exp to src exp
- bgt fix_stk |sum > 0: let the fpu redo it
- bra force_unf
- mul_srcd:
- bsrl ckinf_nd |helper outside this chunk; Z clear on return -> fix_stk
- bne fix_stk
- bfextu FPTEMP_EX(%a6){#1:#15},%d0 |get dest exp (always pos)
- bfexts ETEMP_EX(%a6){#1:#15},%d1 |get src exp (always neg)
- addl %d1,%d0 |add src exp to dest exp
- bgt fix_stk |sum > 0: let the fpu redo it
- |
- | This code handles the case of the instruction resulting in
- | an underflow condition.
- |
- force_unf:
- bclrb #E1,E_BYTE(%a6)
- orl #unfinx_mask,USER_FPSR(%a6)
- clrw NMNEXC(%a6)
- clrb WBTEMP_SGN(%a6) |assume a positive result
- movew ETEMP_EX(%a6),%d0 |find the sign of the result
- movew FPTEMP_EX(%a6),%d1
- eorw %d1,%d0 |bit 15 = src sign xor dest sign
- andiw #0x8000,%d0
- beqs frcunfcont |signs alike: result stays positive
- st WBTEMP_SGN(%a6) |signs differ: mark result negative
- frcunfcont:
- lea WBTEMP(%a6),%a0 |point a0 to memory location
- movew CMDREG1B(%a6),%d0
- btstl #6,%d0 |test for forced precision
- beqs frcunf_fpcr
- btstl #2,%d0 |check for double
- bnes frcunf_dbl
- movel #0x1,%d0 |inst is forced single
- bras frcunf_rnd
- frcunf_dbl:
- movel #0x2,%d0 |inst is forced double
- bras frcunf_rnd
- frcunf_fpcr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0 |inst not forced - use fpcr prec
- frcunf_rnd:
- bsrl unf_sub |get correct result based on
- | ;round precision/mode. This
- | ;sets FPSR_CC correctly
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs frcfpn |SGN byte was zero: result is positive
- bsetb #sign_bit,WBTEMP_EX(%a6)
- bra frcfpn
- |
- | Write the result to the user's fpn. All results must be HUGE to be
- | written; otherwise the results would have overflowed or underflowed.
- | If the rounding precision is single or double, the ovf_res routine
- | is needed to correctly supply the max value.
- |
- frcfpnr:
- movew CMDREG1B(%a6),%d0
- btstl #6,%d0 |test for forced precision
- beqs frcfpn_fpcr
- btstl #2,%d0 |check for double
- bnes frcfpn_dbl
- movel #0x1,%d0 |inst is forced single
- bras frcfpn_rnd
- frcfpn_dbl:
- movel #0x2,%d0 |inst is forced double
- bras frcfpn_rnd
- frcfpn_fpcr:
- bfextu FPCR_MODE(%a6){#0:#2},%d0 |inst not forced - use fpcr prec
- tstb %d0
- beqs frcfpn |if extended, write what you got
- frcfpn_rnd:
- bclrb #sign_bit,WBTEMP_EX(%a6) |move the sign out of the exponent word
- sne WBTEMP_SGN(%a6) |and into the SGN byte before calling ovf_res
- bsrl ovf_res |get correct result based on
- | ;round precision/mode. This
- | ;sets FPSR_CC correctly
- bfclr WBTEMP_SGN(%a6){#0:#8} |convert back to IEEE ext format
- beqs frcfpn_clr
- bsetb #sign_bit,WBTEMP_EX(%a6)
- frcfpn_clr:
- orl #ovfinx_mask,USER_FPSR(%a6)
- |
- | Perform the write. fp0-fp3 go to the USER_FPn slots in the frame; fp4-fp7 are loaded directly.
- |
- frcfpn:
- bfextu CMDREG1B(%a6){#6:#3},%d0 |extract fp destination register
- cmpib #3,%d0
- bles frc0123 |check if dest is fp0-fp3
- movel #7,%d1
- subl %d0,%d1 |d1 = 7 - register number
- clrl %d0
- bsetl %d1,%d0 |d0 = one-bit dynamic register list for fmovemx
- fmovemx WBTEMP(%a6),%d0
- rts
- frc0123:
- cmpib #0,%d0
- beqs frc0_dst
- cmpib #1,%d0
- beqs frc1_dst
- cmpib #2,%d0
- beqs frc2_dst
- frc3_dst:
- movel WBTEMP_EX(%a6),USER_FP3(%a6)
- movel WBTEMP_HI(%a6),USER_FP3+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP3+8(%a6)
- rts
- frc2_dst:
- movel WBTEMP_EX(%a6),USER_FP2(%a6)
- movel WBTEMP_HI(%a6),USER_FP2+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP2+8(%a6)
- rts
- frc1_dst:
- movel WBTEMP_EX(%a6),USER_FP1(%a6)
- movel WBTEMP_HI(%a6),USER_FP1+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP1+8(%a6)
- rts
- frc0_dst:
- movel WBTEMP_EX(%a6),USER_FP0(%a6)
- movel WBTEMP_HI(%a6),USER_FP0+4(%a6)
- movel WBTEMP_LO(%a6),USER_FP0+8(%a6)
- rts
- |
- | Write etemp to fpn.
- | A check is made on enabled and signalled snan exceptions,
- | and the destination is not overwritten if this condition exists.
- | This code is designed to make fmoveins of unsupported data types
- | faster.
- |
- | If snan is not both signalled and enabled, control passes to
- | fmoveinc, which performs the actual register write.
- |
- wr_etemp:
- btstb #snan_bit,FPSR_EXCEPT(%a6) |if snan is set, and
- beqs fmoveinc |enabled, force restore
- btstb #snan_bit,FPCR_ENABLE(%a6) |and don't overwrite
- beqs fmoveinc |the dest
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- tstb ETEMP(%a6) |check for negative
- blts snan_neg
- rts
- snan_neg:
- | The N condition code is set with the long-word mask (neg_mask), as at
- | every other orl into USER_FPSR in this file. The previous operand,
- | neg_bit, is a bit number and would OR the wrong low-order bits.
- orl #neg_mask,USER_FPSR(%a6) |snan is negative; set N
- rts
- fmoveinc: |set FPSR cc bits from STAG, then copy ETEMP to the destination fp register
- clrw NMNEXC(%a6)
- bclrb #E1,E_BYTE(%a6)
- moveb STAG(%a6),%d0 |check if stag is inf
- andib #0xe0,%d0 |keep the top three tag bits
- cmpib #0x40,%d0
- bnes fminc_cnan
- orl #inf_mask,USER_FPSR(%a6) |if inf, nothing yet has set I
- tstw LOCAL_EX(%a0) |check sign (a0 is set up by the caller - presumably points at the operand; confirm)
- bges fminc_con
- orl #neg_mask,USER_FPSR(%a6)
- bra fminc_con
- fminc_cnan:
- cmpib #0x60,%d0 |check if stag is NaN
- bnes fminc_czero
- orl #nan_mask,USER_FPSR(%a6) |if nan, nothing yet has set NaN
- movel ETEMP_EX(%a6),FPTEMP_EX(%a6) |set up fptemp sign for
- | ;snan handler
- tstw LOCAL_EX(%a0) |check sign
- bges fminc_con
- orl #neg_mask,USER_FPSR(%a6)
- bra fminc_con
- fminc_czero:
- cmpib #0x20,%d0 |check if zero
- bnes fminc_con
- orl #z_mask,USER_FPSR(%a6) |if zero, set Z
- tstw LOCAL_EX(%a0) |check sign
- bges fminc_con
- orl #neg_mask,USER_FPSR(%a6)
- fminc_con:
- bfextu CMDREG1B(%a6){#6:#3},%d0 |extract fp destination register
- cmpib #3,%d0
- bles fp0123 |check if dest is fp0-fp3
- movel #7,%d1
- subl %d0,%d1 |d1 = 7 - register number
- clrl %d0
- bsetl %d1,%d0 |d0 = one-bit dynamic register list for fmovemx
- fmovemx ETEMP(%a6),%d0
- rts
- fp0123:
- cmpib #0,%d0
- beqs fp0_dst
- cmpib #1,%d0
- beqs fp1_dst
- cmpib #2,%d0
- beqs fp2_dst
- fp3_dst:
- movel ETEMP_EX(%a6),USER_FP3(%a6)
- movel ETEMP_HI(%a6),USER_FP3+4(%a6)
- movel ETEMP_LO(%a6),USER_FP3+8(%a6)
- rts
- fp2_dst:
- movel ETEMP_EX(%a6),USER_FP2(%a6)
- movel ETEMP_HI(%a6),USER_FP2+4(%a6)
- movel ETEMP_LO(%a6),USER_FP2+8(%a6)
- rts
- fp1_dst:
- movel ETEMP_EX(%a6),USER_FP1(%a6)
- movel ETEMP_HI(%a6),USER_FP1+4(%a6)
- movel ETEMP_LO(%a6),USER_FP1+8(%a6)
- rts
- fp0_dst:
- movel ETEMP_EX(%a6),USER_FP0(%a6)
- movel ETEMP_HI(%a6),USER_FP0+4(%a6)
- movel ETEMP_LO(%a6),USER_FP0+8(%a6)
- rts
- opclass3: |opclass 3 (move out): route packed vs. non-packed destination formats
- st CU_ONLY(%a6) |set the CU_ONLY flag byte
- movew CMDREG1B(%a6),%d0 |fetch the command word
- andiw #0x0c00,%d0 |keep the low two bits of the size field
- cmpiw #0x0c00,%d0 |both set (size 011 or 111) means packed
- bne mv_out |anything else is norm or denorm: mv_out
- bra pack_out |packed decimal move out
- | mv_tbl is indexed by the 3-bit field CMDREG1B{3:3}; each entry is a handler address.
- | MOVE OUT
- | Indices 3 and 7 point at mvout_end and are marked as never taken.
- mv_tbl:
- .long li
- .long sgp
- .long xp
- .long mvout_end |should never be taken
- .long wi
- .long dp
- .long bi
- .long mvout_end |should never be taken
- mv_out:
- bfextu CMDREG1B(%a6){#3:#3},%d1 |put source specifier in d1
- leal mv_tbl,%a0
- movel %a0@(%d1:l:4),%a0 |a0 = mv_tbl[d1]
- jmp (%a0)
- |
- | This exit is for move-out to memory. The aunfl bit is
- | set if the result is inex and unfl is signalled.
- |
- mvout_end:
- btstb #inex2_bit,FPSR_EXCEPT(%a6)
- beqs no_aufl |not inexact: skip aunfl
- btstb #unfl_bit,FPSR_EXCEPT(%a6)
- beqs no_aufl |no underflow: skip aunfl
- bsetb #aunfl_bit,FPSR_AEXCEPT(%a6)
- no_aufl:
- clrw NMNEXC(%a6)
- bclrb #E1,E_BYTE(%a6)
- fmovel #0,%FPSR |clear any cc bits from res_func
- |
- | Return ETEMP to extended format from internal extended format so
- | that gen_except will have a correctly signed value for ovfl/unfl
- | handlers.
- |
- bfclr ETEMP_SGN(%a6){#0:#8} |clear the SGN byte; Z reflects its old value
- beqs mvout_con |was zero: positive, nothing to restore
- bsetb #sign_bit,ETEMP_EX(%a6)
- mvout_con:
- rts
- |
- | This exit is for move-out to int register. The aunfl bit is
- | not set in any case for this move.
- |
- mvouti_end:
- clrw NMNEXC(%a6)
- bclrb #E1,E_BYTE(%a6)
- fmovel #0,%FPSR |clear any cc bits from res_func
- |
- | Return ETEMP to extended format from internal extended format so
- | that gen_except will have a correctly signed value for ovfl/unfl
- | handlers.
- |
- bfclr ETEMP_SGN(%a6){#0:#8} |clear the SGN byte; Z reflects its old value
- beqs mvouti_con |was zero: positive, nothing to restore
- bsetb #sign_bit,ETEMP_EX(%a6)
- mvouti_con:
- rts
- | Converts ETEMP to a 32-bit integer in L_SCR1(a6), saturating at the limits; d0 = 4.
- | li is used to handle a long integer source specifier
- | Exits through int_wrt, int_inx, int_operr or int_dnrm.
- li:
- moveql #4,%d0 |set byte count
- btstb #7,STAG(%a6) |check for extended denorm
- bne int_dnrm |if so, branch
- fmovemx ETEMP(%a6),%fp0-%fp0
- fcmpd #0x41dfffffffc00000,%fp0
- | 41dfffffffc00000 in dbl prec = 401d0000fffffffe00000000 in ext prec
- fbge lo_plrg
- fcmpd #0xc1e0000000000000,%fp0
- | c1e0000000000000 in dbl prec = c01e00008000000000000000 in ext prec
- fble lo_nlrg
- |
- | at this point, the answer is between the largest pos and neg values
- |
- movel USER_FPCR(%a6),%d1 |use user's rounding mode
- andil #0x30,%d1
- fmovel %d1,%fpcr
- fmovel %fp0,L_SCR1(%a6) |let the 040 perform conversion
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture inex2/ainex if set
- bra int_wrt
- lo_plrg:
- movel #0x7fffffff,L_SCR1(%a6) |answer is largest positive int
- fbeq int_wrt |exact answer
- fcmpd #0x41dfffffffe00000,%fp0
- | 41dfffffffe00000 in dbl prec = 401d0000ffffffff00000000 in ext prec
- fbge int_operr |set operr
- bra int_inx |set inexact
- lo_nlrg:
- movel #0x80000000,L_SCR1(%a6) |answer is most negative long
- fbeq int_wrt |exact answer
- fcmpd #0xc1e0000000100000,%fp0
- | c1e0000000100000 in dbl prec = c01e00008000000080000000 in ext prec
- fblt int_operr |set operr
- bra int_inx |set inexact
- | Converts ETEMP to a 16-bit integer in L_SCR1(a6), saturating at the limits; d0 = 2.
- | wi is used to handle a word integer source specifier
- | Exits through int_wrt, int_inx, int_operr or int_dnrm.
- wi:
- moveql #2,%d0 |set byte count
- btstb #7,STAG(%a6) |check for extended denorm
- bne int_dnrm |branch if so
- fmovemx ETEMP(%a6),%fp0-%fp0
- fcmps #0x46fffe00,%fp0
- | 46fffe00 in sgl prec = 400d0000fffe000000000000 in ext prec
- fbge wo_plrg
- fcmps #0xc7000000,%fp0
- | c7000000 in sgl prec = c00e00008000000000000000 in ext prec
- fble wo_nlrg
- |
- | at this point, the answer is between the largest pos and neg values
- |
- movel USER_FPCR(%a6),%d1 |use user's rounding mode
- andil #0x30,%d1
- fmovel %d1,%fpcr
- fmovew %fp0,L_SCR1(%a6) |let the 040 perform conversion
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture inex2/ainex if set
- bra int_wrt
- wo_plrg:
- movew #0x7fff,L_SCR1(%a6) |answer is largest positive int
- fbeq int_wrt |exact answer
- fcmps #0x46ffff00,%fp0
- | 46ffff00 in sgl prec = 400d0000ffff000000000000 in ext prec
- fbge int_operr |set operr
- bra int_inx |set inexact
- wo_nlrg:
- movew #0x8000,L_SCR1(%a6) |answer is most negative word
- fbeq int_wrt |exact answer
- fcmps #0xc7000080,%fp0
- | c7000080 in sgl prec = c00e00008000800000000000 in ext prec
- fblt int_operr |set operr
- bra int_inx |set inexact
- | Converts ETEMP to an 8-bit integer in L_SCR1(a6), saturating at the limits; d0 = 1.
- | bi is used to handle a byte integer source specifier
- | Exits through int_wrt, int_inx, int_operr or int_dnrm.
- bi:
- moveql #1,%d0 |set byte count
- btstb #7,STAG(%a6) |check for extended denorm
- bne int_dnrm |branch if so
- fmovemx ETEMP(%a6),%fp0-%fp0
- fcmps #0x42fe0000,%fp0
- | 42fe0000 in sgl prec = 40050000fe00000000000000 in ext prec
- fbge by_plrg
- fcmps #0xc3000000,%fp0
- | c3000000 in sgl prec = c00600008000000000000000 in ext prec
- fble by_nlrg
- |
- | at this point, the answer is between the largest pos and neg values
- |
- movel USER_FPCR(%a6),%d1 |use user's rounding mode
- andil #0x30,%d1
- fmovel %d1,%fpcr
- fmoveb %fp0,L_SCR1(%a6) |let the 040 perform conversion
- fmovel %fpsr,%d1
- orl %d1,USER_FPSR(%a6) |capture inex2/ainex if set
- bra int_wrt
- by_plrg:
- moveb #0x7f,L_SCR1(%a6) |answer is largest positive int
- fbeq int_wrt |exact answer
- fcmps #0x42ff0000,%fp0
- | 42ff0000 in sgl prec = 40050000ff00000000000000 in ext prec
- fbge int_operr |set operr
- bra int_inx |set inexact
- by_nlrg:
- moveb #0x80,L_SCR1(%a6) |answer is most negative byte
- fbeq int_wrt |exact answer
- fcmps #0xc3008000,%fp0
- | c3008000 in sgl prec = c00600008080000000000000 in ext prec
- fblt int_operr |set operr
- bra int_inx |set inexact
- |
- | Common integer routines
- |
- | int_dnrm---account for possible nonzero result for round up with positive
- | operand and round down for negative answer. In the first case (result = 1)
- | byte-width (store in d0) of result must be honored. In the second case,
- | -1 in L_SCR1(a6) will cover all contingencies (FMOVE.B/W/L out).
- int_dnrm:
- movel #0,L_SCR1(%a6) | initialize result to 0
- bfextu FPCR_MODE(%a6){#2:#2},%d1 | d1 is the rounding mode
- cmpb #2,%d1
- bmis int_inx | if RN or RZ, done
- bnes int_rp | if RP, continue below
- tstw ETEMP(%a6) | RM: store -1 in L_SCR1 if src is negative
- bpls int_inx | otherwise result is 0
- movel #-1,L_SCR1(%a6)
- bras int_inx
- int_rp:
- tstw ETEMP(%a6) | RP: store +1 of proper width in L_SCR1 if
- | ; source is greater than 0
- bmis int_inx | otherwise, result is 0
- lea L_SCR1(%a6),%a1 | a1 is address of L_SCR1
- addal %d0,%a1 | offset by destination width -1
- subal #1,%a1
- bsetb #0,(%a1) | set low bit at a1 address
- int_inx: |set the inx2a_mask bits in USER_FPSR, then write the integer
- oril #inx2a_mask,USER_FPSR(%a6)
- bras int_wrt
- int_operr:
- fmovemx %fp0-%fp0,FPTEMP(%a6) |FPTEMP must contain the extended
- | ;precision source that needs to be
- | ;converted to integer this is required
- | ;if the operr exception is enabled.
- | ;set operr/aiop (no inex2 on int ovfl)
- oril #opaop_mask,USER_FPSR(%a6)
- | ;fall through to perform int_wrt
- int_wrt: |write L_SCR1 out; d0 still holds the byte count
- movel EXC_EA(%a6),%a1 |load destination address
- tstl %a1 |check to see if it is a dest register
- beqs wrt_dn |write data register
- lea L_SCR1(%a6),%a0 |point to supervisor source address
- bsrl mem_write
- bra mvouti_end
- wrt_dn: |destination is a data register: build size:reg in d1 and call reg_dest
- movel %d0,-(%sp) |d0 currently contains the size to write
- bsrl get_fline |get_fline returns Dn in d0
- andiw #0x7,%d0 |isolate register
- movel (%sp)+,%d1 |get size
- cmpil #4,%d1 |most frequent case
- beqs sz_long
- cmpil #2,%d1
- bnes sz_con |byte size: register number is used as is
- orl #8,%d0 |add 'word' size to register#
- bras sz_con
- sz_long:
- orl #0x10,%d0 |add 'long' size to register#
- sz_con:
- movel %d0,%d1 |reg_dest expects size:reg in d1
- bsrl reg_dest |load proper data register
- bra mvouti_end
- xp: |move out, extended destination (mv_tbl index 2)
- lea ETEMP(%a6),%a0
- bclrb #sign_bit,LOCAL_EX(%a0) |move the sign out of the exponent word
- sne LOCAL_SGN(%a0) |and into the SGN byte (internal format)
- btstb #7,STAG(%a6) |check for extended denorm
- bne xdnrm
- clrl %d0 |d0 = 0: precision value handed to do_fp
- bras do_fp |do normal case
- sgp: |move out, single precision destination (mv_tbl index 1)
- lea ETEMP(%a6),%a0
- bclrb #sign_bit,LOCAL_EX(%a0) |move the sign out of the exponent word
- sne LOCAL_SGN(%a0) |and into the SGN byte (internal format)
- btstb #7,STAG(%a6) |check for extended denorm
- bne sp_catas |branch if so
- movew LOCAL_EX(%a0),%d0
- lea sp_bnds,%a1 |sp_bnds is defined outside this chunk
- cmpw (%a1),%d0
- blt sp_under |exponent below the first bound word
- cmpw 2(%a1),%d0
- bgt sp_over |exponent above the second bound word
- movel #1,%d0 |set destination format to single
- bras do_fp |do normal case
- dp: |move out, double precision destination (mv_tbl index 5)
- lea ETEMP(%a6),%a0
- bclrb #sign_bit,LOCAL_EX(%a0) |move the sign out of the exponent word
- sne LOCAL_SGN(%a0) |and into the SGN byte (internal format)
- btstb #7,STAG(%a6) |check for extended denorm
- bne dp_catas |branch if so
- movew LOCAL_EX(%a0),%d0
- lea dp_bnds,%a1 |dp_bnds is defined outside this chunk
- cmpw (%a1),%d0
- blt dp_under |exponent below the first bound word
- cmpw 2(%a1),%d0
- bgt dp_over |exponent above the second bound word
- movel #2,%d0 |set destination format to double
- | ;fall through to do_fp
- | do_fp: d0 = round precision, a0 = operand; rounds, then stores via dest_ext/sgl/dbl.
- do_fp:
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |rnd mode in d1
- swap %d0 |rnd prec in upper word
- addl %d0,%d1 |d1 has PREC/MODE info
- clrl %d0 |clear g,r,s
- bsrl round |round
- movel %a0,%a1 |a1 = operand pointer for the dest_* routine
- movel EXC_EA(%a6),%a0 |a0 = destination address
- bfextu CMDREG1B(%a6){#3:#3},%d1 |extract destination format
- | ;at this point only the dest
- | ;formats sgl, dbl, ext are
- | ;possible
- cmpb #2,%d1
- bgts ddbl |double=5, extended=2, single=1
- bnes dsgl
- | ;fall through to dext
- dext:
- bsrl dest_ext
- bra mvout_end
- dsgl:
- bsrl dest_sgl
- bra mvout_end
- ddbl:
- bsrl dest_dbl
- bra mvout_end
- | xdnrm: extended move out of a denorm; stores it and signals underflow.
- | Handle possible denorm or catastrophic underflow cases here
- |
- xdnrm:
- bsr set_xop |initialize WBTEMP
- bsetb #wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
- movel %a0,%a1 |a1 = operand pointer for dest_ext
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- bsrl dest_ext |store to memory
- bsetb #unfl_bit,FPSR_EXCEPT(%a6)
- bra mvout_end
- sp_under: |single precision underflow; a1 = sp_bnds, d0 = exponent word (set in sgp)
- bsetb #etemp15_bit,STAG(%a6)
- cmpw 4(%a1),%d0 |compare with the third bound word
- blts sp_catas |catastrophic underflow case
- movel #1,%d0 |load in round precision
- movel #sgl_thresh,%d1 |load in single denorm threshold
- bsrl dpspdnrm |expects d1 to have the proper
- | ;denorm threshold
- bsrl dest_sgl |stores value to destination
- bsetb #unfl_bit,FPSR_EXCEPT(%a6)
- bra mvout_end |exit
- dp_under: |double precision underflow; a1 = dp_bnds, d0 = exponent word (set in dp)
- bsetb #etemp15_bit,STAG(%a6)
- cmpw 4(%a1),%d0 |compare with the third bound word
- blts dp_catas |catastrophic underflow case
- movel #dbl_thresh,%d1 |load in double precision threshold
- movel #2,%d0 |load in round precision
- bsrl dpspdnrm |expects d1 to have proper
- | ;denorm threshold
- | ;expects d0 to have round precision
- bsrl dest_dbl |store value to destination
- bsetb #unfl_bit,FPSR_EXCEPT(%a6)
- bra mvout_end |exit
- |
- | Handle catastrophic underflow cases here
- |
- sp_catas:
- | Temp fix for z bit set in unf_sub
- movel USER_FPSR(%a6),-(%a7) |save USER_FPSR across the unf_sub call
- movel #1,%d0 |set round precision to sgl
- bsrl unf_sub |a0 points to result
- movel (%a7)+,USER_FPSR(%a6) |restore USER_FPSR, discarding unf_sub's changes
- movel #1,%d0
- subw %d0,LOCAL_EX(%a0) |account for difference between
- | ;denorm/norm bias
- movel %a0,%a1 |a1 has the operand input
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- bsrl dest_sgl |store the result
- oril #unfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- dp_catas: |catastrophic underflow, double precision destination
- | Temp fix for z bit set in unf_sub
- movel USER_FPSR(%a6),-(%a7) |save USER_FPSR across the unf_sub call
- movel #2,%d0 |set round precision to dbl
- bsrl unf_sub |a0 points to result
- movel (%a7)+,USER_FPSR(%a6) |restore USER_FPSR, discarding unf_sub's changes
- movel #1,%d0
- subw %d0,LOCAL_EX(%a0) |account for difference between
- | ;denorm/norm bias
- movel %a0,%a1 |a1 has the operand input
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- bsrl dest_dbl |store the result
- oril #unfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- |
- | Handle catastrophic overflow cases here
- |
- sp_over:
- | Temp fix for z bit set in ovf_res
- movel USER_FPSR(%a6),-(%a7) |save USER_FPSR across the ovf_res call
- movel #1,%d0 |round precision = single
- leal FP_SCR1(%a6),%a0 |use FP_SCR1 for creating result
- movel ETEMP_EX(%a6),(%a0)
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- bsrl ovf_res
- movel (%a7)+,USER_FPSR(%a6) |restore USER_FPSR, discarding ovf_res's changes
- movel %a0,%a1 |a1 = operand pointer for dest_sgl
- movel EXC_EA(%a6),%a0 |a0 = destination address
- bsrl dest_sgl
- orl #ovfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- dp_over: |catastrophic overflow, double precision destination
- | Temp fix for z bit set in ovf_res
- movel USER_FPSR(%a6),-(%a7) |save USER_FPSR across the ovf_res call
- movel #2,%d0 |round precision = double
- leal FP_SCR1(%a6),%a0 |use FP_SCR1 for creating result
- movel ETEMP_EX(%a6),(%a0)
- movel ETEMP_HI(%a6),4(%a0)
- movel ETEMP_LO(%a6),8(%a0)
- bsrl ovf_res
- movel (%a7)+,USER_FPSR(%a6) |restore USER_FPSR, discarding ovf_res's changes
- movel %a0,%a1 |a1 = operand pointer for dest_dbl
- movel EXC_EA(%a6),%a0 |a0 = destination address
- bsrl dest_dbl
- orl #ovfinx_mask,USER_FPSR(%a6)
- bra mvout_end
- |
- | DPSPDNRM
- |
- | This subroutine takes an extended normalized number and denormalizes
- | it to the given round precision. This subroutine also decrements
- | the input operand's exponent by 1 to account for the fact that
- | dest_sgl or dest_dbl expects a normalized number's bias.
- |
- | Input: a0 points to a normalized number in internal extended format
- | d0 is the round precision (=1 for sgl; =2 for dbl)
- | d1 is the single precision or double precision
- | denorm threshold
- |
- | Output: (In the format for dest_sgl or dest_dbl)
- | a0 points to the destination
- | a1 points to the operand
- |
- | Exceptions: Reports inexact 2 exception by setting USER_FPSR bits
- |
- dpspdnrm:
- movel %d0,-(%a7) |save round precision
- clrl %d0 |clear initial g,r,s
- bsrl dnrm_lp |careful with d0, it's needed by round
- bfextu FPCR_MODE(%a6){#2:#2},%d1 |get rounding mode
- swap %d1 |rounding mode to upper word for now
- movew 2(%a7),%d1 |set rounding precision
- swap %d1 |at this point d1 has PREC/MODE info
- bsrl round |round result, sets the inex bit in
- | ;USER_FPSR if needed
- movew #1,%d0
- subw %d0,LOCAL_EX(%a0) |account for difference in denorm
- | ;vs norm bias
- movel %a0,%a1 |a1 has the operand input
- movel EXC_EA(%a6),%a0 |a0 has the destination pointer
- addw #4,%a7 |pop stack
- rts
- |
- | SET_XOP initializes WBTEMP with the value pointed to by a0
- | input: a0 points to input operand in the internal extended format
- |
- set_xop:
- movel LOCAL_EX(%a0),WBTEMP_EX(%a6)
- movel LOCAL_HI(%a0),WBTEMP_HI(%a6)
- movel LOCAL_LO(%a0),WBTEMP_LO(%a6)
- bfclr WBTEMP_SGN(%a6){#0:#8} |clear the copied SGN byte; Z reflects its old value
- beqs sxop |was zero: positive, sign bit stays clear
- bsetb #sign_bit,WBTEMP_EX(%a6)
- sxop:
- bfclr STAG(%a6){#5:#4} |clear wbtm66,wbtm1,wbtm0,sbit
- rts
- | p_movet: handlers indexed by the top three bits of STAG (used by pack_out).
- | P_MOVE
- | p_regd: handlers indexed by data register number for the dynamic k-factor (used by dynamick).
- p_movet:
- .long p_move
- .long p_movez
- .long p_movei
- .long p_moven
- .long p_move
- p_regd:
- .long p_dyd0
- .long p_dyd1
- .long p_dyd2
- .long p_dyd3
- .long p_dyd4
- .long p_dyd5
- .long p_dyd6
- .long p_dyd7
- pack_out:
- leal p_movet,%a0 |load jmp table address
- movew STAG(%a6),%d0 |get source tag
- bfextu %d0{#16:#3},%d0 |isolate source bits
- movel (%a0,%d0.w*4),%a0 |load a0 with routine label for tag
- jmp (%a0) |go to the routine
- p_write: |write the 12-byte packed result at a0 to the user's destination
- movel #0x0c,%d0 |get byte count
- movel EXC_EA(%a6),%a1 |get the destination address
- bsr mem_write |write the user's destination
- moveb #0,CU_SAVEPC(%a6) |set the cu save pc to all 0's
- |
- | Also note that the dtag must be set to norm here - this is because
- | the 040 uses the dtag to execute the correct microcode.
- |
- bfclr DTAG(%a6){#0:#3} |set dtag to norm
- rts
- | Notes on handling of special case (zero, inf, and nan) inputs:
- | 1. Operr is not signalled if the k-factor is greater than 18.
- | 2. Per the manual, status bits are not set.
- |
- p_move: |packed move out: obtain the k-factor, convert with bindec, write the result
- movew CMDREG1B(%a6),%d0
- btstl #kfact_bit,%d0 |test for dynamic k-factor
- beqs statick |if clear, k-factor is static
- dynamick:
- bfextu %d0{#25:#3},%d0 |isolate register for dynamic k-factor
- lea p_regd,%a0
- movel %a0@(%d0:l:4),%a0 |a0 = p_regd[d0]
- jmp (%a0) |the p_dydN routine loads d0 and branches to statick
- statick:
- andiw #0x007f,%d0 |get k-factor
- bfexts %d0{#25:#7},%d0 |sign extend d0 for bindec
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- bsrl bindec |perform the convert; data at a6
- leal FP_SCR1(%a6),%a0 |load a0 with result address
- bral p_write
- p_movez: |packed move out of a zero (p_movet index 1)
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- clrw 2(%a0) |clear lower word of exp
- clrl 4(%a0) |load second lword of ZERO
- clrl 8(%a0) |load third lword of ZERO
- bra p_write |go write results
- p_movei: |packed move out of an infinity (p_movet index 2)
- fmovel #0,%FPSR |clear aiop
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- clrw 2(%a0) |clear lower word of exp
- bra p_write |go write the result
- p_moven: |packed move out of a NaN (p_movet index 3)
- leal ETEMP(%a6),%a0 |a0 will point to the packed decimal
- clrw 2(%a0) |clear lower word of exp
- bra p_write |go write the result
- | Each routine loads the selected data register's value into d0 and joins statick.
- | Routines to read the dynamic k-factor from Dn.
- | d0 and d1 are read from the USER_D0/USER_D1 frame slots; d2-d7 are read from the live registers.
- p_dyd0:
- movel USER_D0(%a6),%d0
- bras statick
- p_dyd1:
- movel USER_D1(%a6),%d0
- bras statick
- p_dyd2:
- movel %d2,%d0
- bras statick
- p_dyd3:
- movel %d3,%d0
- bras statick
- p_dyd4:
- movel %d4,%d0
- bras statick
- p_dyd5:
- movel %d5,%d0
- bras statick
- p_dyd6:
- movel %d6,%d0
- bra statick
- p_dyd7:
- movel %d7,%d0
- bra statick
- |end
|