URL https://opencores.org/ocsvn/or1k/or1k/trunk

Subversion Repositories or1k

[/] [or1k/] [trunk/] [uclinux/] [uClinux-2.0.x/] [arch/] [m68k/] [fpsp040/] [x_unfl.S] - Blame information for rev 1765

Details | Compare with Previous | View Log


|
|       x_unfl.sa 3.4 7/1/91
|
|       fpsp_unfl --- FPSP handler for underflow exception
|
| Trap disabled results
|       For 881/2 compatibility, sw must denormalize the intermediate
| result, then store the result.  Denormalization is accomplished
| by taking the intermediate result (which is always normalized) and
| shifting the mantissa right while incrementing the exponent until
| it is equal to the denormalized exponent for the destination
| format.  After denormalization, the result is rounded to the
| destination format.
|
| Trap enabled results
|       All trap disabled code applies. In addition, the exceptional
| operand needs to be made available to the user with a bias of $6000
| added to the exponent.
|
 
|               Copyright (C) Motorola, Inc. 1990
|                       All Rights Reserved
|
|       THIS IS UNPUBLISHED PROPRIETARY SOURCE CODE OF MOTOROLA
|       The copyright notice above does not evidence any
|       actual or intended publication of such source code.
 
X_UNFL: |idnt    2,1 | Motorola 040 Floating Point Software Package
 
        |section        8
 
        .include "fpsp.h"
 
        |xref   denorm
        |xref   round
        |xref   store
        |xref   g_rndpr
        |xref   g_opcls
        |xref   g_dfmtou
        |xref   real_unfl
        |xref   real_inex
        |xref   fpsp_done
        |xref   b1238_fix
 
        .global fpsp_unfl
|
|       fpsp_unfl --- entry point of the underflow exception handler
|
| Builds a local frame (link/fsave), saves d0-d1/a0-a1, fp0-fp3 and
| fpcr/fpsr/fpiar into the USER_* slots of that frame, then calls
| unf_res to denormalize, round and store the intermediate result.
| Afterwards one of three exits is taken:
|
|   1. unfl enable bit set in FPCR_ENABLE      -> real_unfl
|   2. unfl disabled, but an enabled inexact
|      exception is reported in FPSR_EXCEPT     -> real_inex
|   3. neither of the above                     -> fpsp_done
|
| On every exit the saved registers are reloaded from the USER_*
| slots and the frame is released with unlk.  Whenever the E3 bit of
| E_BYTE is set, the destination register's dirty bit is cleared,
| b1238_fix is called, USER_FPSR is copied to FPSR_SHADOW and sx_mask
| is or-ed into the longword at E_BYTE before the state is restored.
|
fpsp_unfl:
        link            %a6,#-LOCAL_SIZE
        fsave           -(%a7)
        moveml          %d0-%d1/%a0-%a1,USER_DA(%a6)
        fmovemx %fp0-%fp3,USER_FP0(%a6)
        fmoveml %fpcr/%fpsr/%fpiar,USER_FPCR(%a6)

|
        bsrl            unf_res |denormalize, round & store interm op
|
| If underflow exceptions are not enabled, check for inexact
| exception
|
        btstb           #unfl_bit,FPCR_ENABLE(%a6)
        beqs            ck_inex

| Underflow is enabled: apply the E3 fixups (if E3 is set) and hand
| over to the real underflow handler.
        btstb           #E3,E_BYTE(%a6)
        beqs            no_e3_1
|
| Clear dirty bit on dest register in the frame before branching
| to b1238_fix.
|
        bfextu          CMDREG3B(%a6){#6:#3},%d0        |get dest reg no
        bclrb           %d0,FPR_DIRTY_BITS(%a6) |clr dest dirty bit
        bsrl            b1238_fix               |test for bug1238 case
        movel           USER_FPSR(%a6),FPSR_SHADOW(%a6)
        orl             #sx_mask,E_BYTE(%a6)
no_e3_1:
| Restore the user's registers and the FPU state frame, then chain.
        moveml          USER_DA(%a6),%d0-%d1/%a0-%a1
        fmovemx USER_FP0(%a6),%fp0-%fp3
        fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
        frestore        (%a7)+
        unlk            %a6
        bral            real_unfl
|
| It is possible to have either inex2 or inex1 exceptions with the
| unfl.  If the inex enable bit is set in the FPCR, and either
| inex2 or inex1 occurred, we must clean up and branch to the
| real inex handler.
|
ck_inex:
| d0 = enable byte AND reported-exception byte, masked to the low
| two bits; a zero result means no enabled inexact is pending.
        moveb           FPCR_ENABLE(%a6),%d0
        andb            FPSR_EXCEPT(%a6),%d0
        andib           #0x3,%d0
        beqs            unfl_done

|
| Inexact enabled and reported, and we must take an inexact exception
|
take_inex:
        btstb           #E3,E_BYTE(%a6)
        beqs            no_e3_2
|
| Clear dirty bit on dest register in the frame before branching
| to b1238_fix.
|
        bfextu          CMDREG3B(%a6){#6:#3},%d0        |get dest reg no
        bclrb           %d0,FPR_DIRTY_BITS(%a6) |clr dest dirty bit
        bsrl            b1238_fix               |test for bug1238 case
        movel           USER_FPSR(%a6),FPSR_SHADOW(%a6)
        orl             #sx_mask,E_BYTE(%a6)
no_e3_2:
| Rewrite the low byte of the vector field in the frame so that the
| exception is presented as inexact, then restore and chain.
        moveb           #INEX_VEC,EXC_VEC+1(%a6)
        moveml         USER_DA(%a6),%d0-%d1/%a0-%a1
        fmovemx        USER_FP0(%a6),%fp0-%fp3
        fmoveml        USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
        frestore        (%a7)+
        unlk            %a6
        bral            real_inex

|
| No exception is to be reported to the user.  bclr tests the bit
| before clearing it, so the branch below is taken when E3 was
| already clear (the E1 case, going by the label name).
|
unfl_done:
        bclrb           #E3,E_BYTE(%a6)
        beqs            e1_set          |branch if E3 was clear
|
| Clear dirty bit on dest register in the frame before branching
| to b1238_fix.
|
        bfextu          CMDREG3B(%a6){#6:#3},%d0                |get dest reg no
        bclrb           %d0,FPR_DIRTY_BITS(%a6) |clr dest dirty bit
        bsrl            b1238_fix               |test for bug1238 case
        movel           USER_FPSR(%a6),FPSR_SHADOW(%a6)
        orl             #sx_mask,E_BYTE(%a6)
        moveml          USER_DA(%a6),%d0-%d1/%a0-%a1
        fmovemx USER_FP0(%a6),%fp0-%fp3
        fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
        frestore        (%a7)+
        unlk            %a6
        bral            fpsp_done
e1_set:
| NOTE(review): unlike the other exits there is no frestore here;
| unlk reloads a7 from a6 and thereby drops the fsave frame pushed
| at entry without reloading it into the FPU.  Presumably this is
| deliberate (the saved state is simply discarded) -- confirm
| before changing.
        moveml          USER_DA(%a6),%d0-%d1/%a0-%a1
        fmovemx USER_FP0(%a6),%fp0-%fp3
        fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
        unlk            %a6
        bral            fpsp_done
|
|       unf_res --- underflow result calculation
|
| Subroutine called from fpsp_unfl with a6 pointing at the local
| frame.  It
|   1. obtains the rounding precision (g_rndpr) and parks it on the
|      stack as the upper word of a longword whose lower word is 0,
|   2. points a0 at the exceptional operand (WBTEMP when E3 is set
|      in E_BYTE, FPTEMP otherwise),
|   3. strips the sign from the operand's exponent word, recording
|      it in LOCAL_SGN, and calls denorm,
|   4. builds d1 = precision (upper word) / rounding mode (lower
|      word) and calls round,
|   5. calls store, then updates FPSR_CC (register destination
|      only) and the accrued underflow bit.
| The 4 bytes pushed in step 1 are popped again in step 4, so the
| stack is balanced at the rts.  d0, d1 and a0 are written directly
| here; what the called routines clobber is not visible in this file.
|
unf_res:
        bsrl            g_rndpr         |returns RND_PREC in d0 0=ext,
|                                       ;1=sgl, 2=dbl
|                                       ;we need the RND_PREC in the
|                                       ;upper word for round
        movew           #0,-(%a7)       |lower word of the longword = 0
        movew           %d0,-(%a7)      |copy RND_PREC to stack
|
|
| If the exception bit set is E3, the exceptional operand from the
| fpu is in WBTEMP; else it is in FPTEMP.
|
        btstb           #E3,E_BYTE(%a6)
        beqs            unf_E1
unf_E3:
        lea             WBTEMP(%a6),%a0 |a0 now points to operand
|
| Test for fsgldiv and fsglmul.  If the inst was one of these, then
| force the precision to extended for the denorm routine (d0 is
| cleared) and force single precision for the round routine (the
| RND_PREC word on the stack is overwritten with 1).  For any other
| instruction the values returned by g_rndpr are used unchanged.
|
        movew           CMDREG3B(%a6),%d1       |check for fsgldiv or fsglmul
        andiw           #0x7f,%d1               |keep the low 7 bits only
        cmpiw           #0x30,%d1               |check for sgldiv
        beqs            unf_sgl
        cmpiw           #0x33,%d1               |check for sglmul
        bnes            unf_cont        |if not, use fpcr prec in round
unf_sgl:
        clrl            %d0             |d0 = 0 (ext) for denorm
        movew           #0x1,(%a7)      |override g_rndpr precision
|                                       ;force single
        bras            unf_cont
unf_E1:
        lea             FPTEMP(%a6),%a0 |a0 now points to operand
unf_cont:
| bclr leaves Z clear when the bit was 1, so sne writes $ff to
| LOCAL_SGN for a negative operand and $00 for a positive one.
        bclrb           #sign_bit,LOCAL_EX(%a0) |clear sign bit
        sne             LOCAL_SGN(%a0)          |store sign

        bsrl            denorm          |returns denorm, a0 points to it
|
| WARNING:
|                               ;d0 has guard,round sticky bit
|                               ;make sure that it is not corrupted
|                               ;before it reaches the round subroutine
|                               ;also ensure that a0 isn't corrupted

|
| Set up d1 for round subroutine d1 contains the PREC/MODE
| information respectively on upper/lower register halves.
|
        bfextu          FPCR_MODE(%a6){#2:#2},%d1       |get mode from FPCR
|                                               ;mode in lower d1
        addl            (%a7)+,%d1              |merge PREC/MODE
|                                               ;(also pops the longword
|                                               ;pushed at the top)
|
| WARNING: a0 and d0 are assumed to be intact between the denorm and
| round subroutines. All code between these two subroutines
| must not corrupt a0 and d0.
|
|
| Perform Round
|       Input:          a0 points to input operand
|                       d0{31:29} has guard, round, sticky
|                       d1{01:00} has rounding mode
|                       d1{17:16} has rounding precision
|       Output:         a0 points to rounded operand
|

        bsrl            round           |returns rounded denorm at (a0)
|
| Differentiate between store to memory vs. store to register
|
unf_store:
        bsrl            g_opcls         |returns opclass in d0{2:0}
        cmpib           #0x3,%d0        |opclass 3 = store to memory
        bnes            not_opc011
|
| At this point, a store to memory is pending
|
opc011:
        bsrl            g_dfmtou        |d0.b == 0 is treated as extended
        tstb            %d0
        beqs            ext_opc011      |If extended, do not subtract
|                               ;If destination format is sgl/dbl,
        tstb            LOCAL_HI(%a0)   |If rounded result is normal,don't
|                                       ;subtract
        bmis            ext_opc011      |msb of mantissa set -> skip
        subqw           #1,LOCAL_EX(%a0)        |account for denorm bias vs.
|                               ;normalized bias
|                               ;          normalized   denormalized
|                               ;single       $7f           $7e
|                               ;double       $3ff          $3fe
|
ext_opc011:
        bsrl            store           |stores to memory
        bras            unf_done        |finish up

|
| At this point, a store to a float register is pending
|
not_opc011:
        bsrl            store   |stores to float register
|                               ;a0 is not corrupted on a store to a
|                               ;float register.
|
| Set the condition codes according to result: z_bit when both
| mantissa longwords are zero, neg_bit when the sign bit of the
| exponent word is set.
|
        tstl            LOCAL_HI(%a0)   |check upper mantissa
        bnes            ck_sgn
        tstl            LOCAL_LO(%a0)   |check lower mantissa
        bnes            ck_sgn
        bsetb           #z_bit,FPSR_CC(%a6) |set condition codes if zero
ck_sgn:
        btstb           #sign_bit,LOCAL_EX(%a0) |check the sign bit
        beqs            unf_done
        bsetb           #neg_bit,FPSR_CC(%a6)

|
| Finish.  The accrued underflow bit is set only when inex2 is also
| reported in FPSR_EXCEPT.
|
unf_done:
        btstb           #inex2_bit,FPSR_EXCEPT(%a6)
        beqs            no_aunfl
        bsetb           #aunfl_bit,FPSR_AEXCEPT(%a6)
no_aunfl:
        rts
 
        |end

Browse

Tools

Subversion Repositories or1k

[/] [or1k/] [trunk/] [uclinux/] [uClinux-2.0.x/] [arch/] [m68k/] [fpsp040/] [x_unfl.S] - Blame information for rev 1765

Line No.	Rev	Author	Line
1	199	simons	`\|`
2			`\| x_unfl.sa 3.4 7/1/91`
3			`\|`
4			`\| fpsp_unfl --- FPSP handler for underflow exception`
5			`\|`
6			`\| Trap disabled results`
7			`\| For 881/2 compatibility, sw must denormalize the intermediate`
8			`\| result, then store the result. Denormalization is accomplished`
9			`\| by taking the intermediate result (which is always normalized) and`
10			`\| shifting the mantissa right while incrementing the exponent until`
11			`\| it is equal to the denormalized exponent for the destination`
12			`\| format. After denormalization, the result is rounded to the`
13			`\| destination format.`
14			`\|`
15			`\| Trap enabled results`
16			`\| All trap disabled code applies. In addition the exceptional`
17			`\| operand needs to made available to the user with a bias of $6000`
18			`\| added to the exponent.`
19			`\|`
20
21			`\| Copyright (C) Motorola, Inc. 1990`
22			`\| All Rights Reserved`
23			`\|`
24			`\| THIS IS UNPUBLISHED PROPRIETARY SOURCE CODE OF MOTOROLA`
25			`\| The copyright notice above does not evidence any`
26			`\| actual or intended publication of such source code.`
27
28			`X_UNFL: \|idnt 2,1 \| Motorola 040 Floating Point Software Package`
29
30			`\|section 8`
31
32			`.include "fpsp.h"`
33
34			`\|xref denorm`
35			`\|xref round`
36			`\|xref store`
37			`\|xref g_rndpr`
38			`\|xref g_opcls`
39			`\|xref g_dfmtou`
40			`\|xref real_unfl`
41			`\|xref real_inex`
42			`\|xref fpsp_done`
43			`\|xref b1238_fix`
44
45			`.global fpsp_unfl`
46			`fpsp_unfl:`
47			`link %a6,#-LOCAL_SIZE`
48			`fsave -(%a7)`
49			`moveml %d0-%d1/%a0-%a1,USER_DA(%a6)`
50			`fmovemx %fp0-%fp3,USER_FP0(%a6)`
51			`fmoveml %fpcr/%fpsr/%fpiar,USER_FPCR(%a6)`
52
53			`\|`
54			`bsrl unf_res \|denormalize, round & store interm op`
55			`\|`
56			`\| If underflow exceptions are not enabled, check for inexact`
57			`\| exception`
58			`\|`
59			`btstb #unfl_bit,FPCR_ENABLE(%a6)`
60			`beqs ck_inex`
61
62			`btstb #E3,E_BYTE(%a6)`
63			`beqs no_e3_1`
64			`\|`
65			`\| Clear dirty bit on dest resister in the frame before branching`
66			`\| to b1238_fix.`
67			`\|`
68			`bfextu CMDREG3B(%a6){#6:#3},%d0 \|get dest reg no`
69			`bclrb %d0,FPR_DIRTY_BITS(%a6) \|clr dest dirty bit`
70			`bsrl b1238_fix \|test for bug1238 case`
71			`movel USER_FPSR(%a6),FPSR_SHADOW(%a6)`
72			`orl #sx_mask,E_BYTE(%a6)`
73			`no_e3_1:`
74			`moveml USER_DA(%a6),%d0-%d1/%a0-%a1`
75			`fmovemx USER_FP0(%a6),%fp0-%fp3`
76			`fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar`
77			`frestore (%a7)+`
78			`unlk %a6`
79			`bral real_unfl`
80			`\|`
81			`\| It is possible to have either inex2 or inex1 exceptions with the`
82			`\| unfl. If the inex enable bit is set in the FPCR, and either`
83			`\| inex2 or inex1 occurred, we must clean up and branch to the`
84			`\| real inex handler.`
85			`\|`
86			`ck_inex:`
87			`moveb FPCR_ENABLE(%a6),%d0`
88			`andb FPSR_EXCEPT(%a6),%d0`
89			`andib #0x3,%d0`
90			`beqs unfl_done`
91
92			`\|`
93			`\| Inexact enabled and reported, and we must take an inexact exception`
94			`\|`
95			`take_inex:`
96			`btstb #E3,E_BYTE(%a6)`
97			`beqs no_e3_2`
98			`\|`
99			`\| Clear dirty bit on dest resister in the frame before branching`
100			`\| to b1238_fix.`
101			`\|`
102			`bfextu CMDREG3B(%a6){#6:#3},%d0 \|get dest reg no`
103			`bclrb %d0,FPR_DIRTY_BITS(%a6) \|clr dest dirty bit`
104			`bsrl b1238_fix \|test for bug1238 case`
105			`movel USER_FPSR(%a6),FPSR_SHADOW(%a6)`
106			`orl #sx_mask,E_BYTE(%a6)`
107			`no_e3_2:`
108			`moveb #INEX_VEC,EXC_VEC+1(%a6)`
109			`moveml USER_DA(%a6),%d0-%d1/%a0-%a1`
110			`fmovemx USER_FP0(%a6),%fp0-%fp3`
111			`fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar`
112			`frestore (%a7)+`
113			`unlk %a6`
114			`bral real_inex`
115
116			`unfl_done:`
117			`bclrb #E3,E_BYTE(%a6)`
118			`beqs e1_set \|if set then branch`
119			`\|`
120			`\| Clear dirty bit on dest resister in the frame before branching`
121			`\| to b1238_fix.`
122			`\|`
123			`bfextu CMDREG3B(%a6){#6:#3},%d0 \|get dest reg no`
124			`bclrb %d0,FPR_DIRTY_BITS(%a6) \|clr dest dirty bit`
125			`bsrl b1238_fix \|test for bug1238 case`
126			`movel USER_FPSR(%a6),FPSR_SHADOW(%a6)`
127			`orl #sx_mask,E_BYTE(%a6)`
128			`moveml USER_DA(%a6),%d0-%d1/%a0-%a1`
129			`fmovemx USER_FP0(%a6),%fp0-%fp3`
130			`fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar`
131			`frestore (%a7)+`
132			`unlk %a6`
133			`bral fpsp_done`
134			`e1_set:`
135			`moveml USER_DA(%a6),%d0-%d1/%a0-%a1`
136			`fmovemx USER_FP0(%a6),%fp0-%fp3`
137			`fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar`
138			`unlk %a6`
139			`bral fpsp_done`
140			`\|`
141			`\| unf_res --- underflow result calculation`
142			`\|`
143			`unf_res:`
144			`bsrl g_rndpr \|returns RND_PREC in d0 0=ext,`
145			`\| ;1=sgl, 2=dbl`
146			`\| ;we need the RND_PREC in the`
147			`\| ;upper word for round`
148			`movew #0,-(%a7)`
149			`movew %d0,-(%a7) \|copy RND_PREC to stack`
150			`\|`
151			`\|`
152			`\| If the exception bit set is E3, the exceptional operand from the`
153			`\| fpu is in WBTEMP; else it is in FPTEMP.`
154			`\|`
155			`btstb #E3,E_BYTE(%a6)`
156			`beqs unf_E1`
157			`unf_E3:`
158			`lea WBTEMP(%a6),%a0 \|a0 now points to operand`
159			`\|`
160			`\| Test for fsgldiv and fsglmul. If the inst was one of these, then`
161			`\| force the precision to extended for the denorm routine. Use`
162			`\| the user's precision for the round routine.`
163			`\|`
164			`movew CMDREG3B(%a6),%d1 \|check for fsgldiv or fsglmul`
165			`andiw #0x7f,%d1`
166			`cmpiw #0x30,%d1 \|check for sgldiv`
167			`beqs unf_sgl`
168			`cmpiw #0x33,%d1 \|check for sglmul`
169			`bnes unf_cont \|if not, use fpcr prec in round`
170			`unf_sgl:`
171			`clrl %d0`
172			`movew #0x1,(%a7) \|override g_rndpr precision`
173			`\| ;force single`
174			`bras unf_cont`
175			`unf_E1:`
176			`lea FPTEMP(%a6),%a0 \|a0 now points to operand`
177			`unf_cont:`
178			`bclrb #sign_bit,LOCAL_EX(%a0) \|clear sign bit`
179			`sne LOCAL_SGN(%a0) \|store sign`
180
181			`bsrl denorm \|returns denorm, a0 points to it`
182			`\|`
183			`\| WARNING:`
184			`\| ;d0 has guard,round sticky bit`
185			`\| ;make sure that it is not corrupted`
186			`\| ;before it reaches the round subroutine`
187			`\| ;also ensure that a0 isn't corrupted`
188
189			`\|`
190			`\| Set up d1 for round subroutine d1 contains the PREC/MODE`
191			`\| information respectively on upper/lower register halves.`
192			`\|`
193			`bfextu FPCR_MODE(%a6){#2:#2},%d1 \|get mode from FPCR`
194			`\| ;mode in lower d1`
195			`addl (%a7)+,%d1 \|merge PREC/MODE`
196			`\|`
197			`\| WARNING: a0 and d0 are assumed to be intact between the denorm and`
198			`\| round subroutines. All code between these two subroutines`
199			`\| must not corrupt a0 and d0.`
200			`\|`
201			`\|`
202			`\| Perform Round`
203			`\| Input: a0 points to input operand`
204			`\| d0{31:29} has guard, round, sticky`
205			`\| d1{01:00} has rounding mode`
206			`\| d1{17:16} has rounding precision`
207			`\| Output: a0 points to rounded operand`
208			`\|`
209
210			`bsrl round \|returns rounded denorm at (a0)`
211			`\|`
212			`\| Differentiate between store to memory vs. store to register`
213			`\|`
214			`unf_store:`
215			`bsrl g_opcls \|returns opclass in d0{2:0}`
216			`cmpib #0x3,%d0`
217			`bnes not_opc011`
218			`\|`
219			`\| At this point, a store to memory is pending`
220			`\|`
221			`opc011:`
222			`bsrl g_dfmtou`
223			`tstb %d0`
224			`beqs ext_opc011 \|If extended, do not subtract`
225			`\| ;If destination format is sgl/dbl,`
226			`tstb LOCAL_HI(%a0) \|If rounded result is normal,don't`
227			`\| ;subtract`
228			`bmis ext_opc011`
229			`subqw #1,LOCAL_EX(%a0) \|account for denorm bias vs.`
230			`\| ;normalized bias`
231			`\| ; normalized denormalized`
232			`\| ;single $7f $7e`
233			`\| ;double $3ff $3fe`
234			`\|`
235			`ext_opc011:`
236			`bsrl store \|stores to memory`
237			`bras unf_done \|finish up`
238
239			`\|`
240			`\| At this point, a store to a float register is pending`
241			`\|`
242			`not_opc011:`
243			`bsrl store \|stores to float register`
244			`\| ;a0 is not corrupted on a store to a`
245			`\| ;float register.`
246			`\|`
247			`\| Set the condition codes according to result`
248			`\|`
249			`tstl LOCAL_HI(%a0) \|check upper mantissa`
250			`bnes ck_sgn`
251			`tstl LOCAL_LO(%a0) \|check lower mantissa`
252			`bnes ck_sgn`
253			`bsetb #z_bit,FPSR_CC(%a6) \|set condition codes if zero`
254			`ck_sgn:`
255			`btstb #sign_bit,LOCAL_EX(%a0) \|check the sign bit`
256			`beqs unf_done`
257			`bsetb #neg_bit,FPSR_CC(%a6)`
258
259			`\|`
260			`\| Finish.`
261			`\|`
262			`unf_done:`
263			`btstb #inex2_bit,FPSR_EXCEPT(%a6)`
264			`beqs no_aunfl`
265			`bsetb #aunfl_bit,FPSR_AEXCEPT(%a6)`
266			`no_aunfl:`
267			`rts`
268
269			`\|end`