~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

TOMOYO Linux Cross Reference
Linux/arch/m68k/fpsp040/x_unfl.S

Version: ~ [ linux-6.12-rc7 ] ~ [ linux-6.11.7 ] ~ [ linux-6.10.14 ] ~ [ linux-6.9.12 ] ~ [ linux-6.8.12 ] ~ [ linux-6.7.12 ] ~ [ linux-6.6.60 ] ~ [ linux-6.5.13 ] ~ [ linux-6.4.16 ] ~ [ linux-6.3.13 ] ~ [ linux-6.2.16 ] ~ [ linux-6.1.116 ] ~ [ linux-6.0.19 ] ~ [ linux-5.19.17 ] ~ [ linux-5.18.19 ] ~ [ linux-5.17.15 ] ~ [ linux-5.16.20 ] ~ [ linux-5.15.171 ] ~ [ linux-5.14.21 ] ~ [ linux-5.13.19 ] ~ [ linux-5.12.19 ] ~ [ linux-5.11.22 ] ~ [ linux-5.10.229 ] ~ [ linux-5.9.16 ] ~ [ linux-5.8.18 ] ~ [ linux-5.7.19 ] ~ [ linux-5.6.19 ] ~ [ linux-5.5.19 ] ~ [ linux-5.4.285 ] ~ [ linux-5.3.18 ] ~ [ linux-5.2.21 ] ~ [ linux-5.1.21 ] ~ [ linux-5.0.21 ] ~ [ linux-4.20.17 ] ~ [ linux-4.19.323 ] ~ [ linux-4.18.20 ] ~ [ linux-4.17.19 ] ~ [ linux-4.16.18 ] ~ [ linux-4.15.18 ] ~ [ linux-4.14.336 ] ~ [ linux-4.13.16 ] ~ [ linux-4.12.14 ] ~ [ linux-4.11.12 ] ~ [ linux-4.10.17 ] ~ [ linux-4.9.337 ] ~ [ linux-4.4.302 ] ~ [ linux-3.10.108 ] ~ [ linux-2.6.32.71 ] ~ [ linux-2.6.0 ] ~ [ linux-2.4.37.11 ] ~ [ unix-v6-master ] ~ [ ccs-tools-1.8.12 ] ~ [ policy-sample ] ~
Architecture: ~ [ i386 ] ~ [ alpha ] ~ [ m68k ] ~ [ mips ] ~ [ ppc ] ~ [ sparc ] ~ [ sparc64 ] ~

  1 |
  2 |       x_unfl.sa 3.4 7/1/91
  3 |
  4 |       fpsp_unfl --- FPSP handler for underflow exception
  5 |
  6 | Trap disabled results
  7 |       For 881/2 compatibility, sw must denormalize the intermediate
  8 | result, then store the result.  Denormalization is accomplished
  9 | by taking the intermediate result (which is always normalized) and
 10 | shifting the mantissa right while incrementing the exponent until
 11 | it is equal to the denormalized exponent for the destination
 12 | format.  After denormalization, the result is rounded to the
 13 | destination format.
 14 |
 15 | Trap enabled results
 16 |       All trap disabled code applies. In addition the exceptional
 17 | operand needs to made available to the user with a bias of $6000
 18 | added to the exponent.
 19 |
 20 
 21 |               Copyright (C) Motorola, Inc. 1990
 22 |                       All Rights Reserved
 23 |
 24 |       For details on the license for this file, please see the
 25 |       file, README, in this same directory.
 26 
 27 X_UNFL: |idnt    2,1 | Motorola 040 Floating Point Software Package
 28 
 29         |section        8
 30 
 31 #include "fpsp.h"
 32 
 33         |xref   denorm
 34         |xref   round
 35         |xref   store
 36         |xref   g_rndpr
 37         |xref   g_opcls
 38         |xref   g_dfmtou
 39         |xref   real_unfl
 40         |xref   real_inex
 41         |xref   fpsp_done
 42         |xref   b1238_fix
 43 
 44         .global fpsp_unfl
 45 fpsp_unfl:
 46         link            %a6,#-LOCAL_SIZE
 47         fsave           -(%a7)
 48         moveml          %d0-%d1/%a0-%a1,USER_DA(%a6)
 49         fmovemx %fp0-%fp3,USER_FP0(%a6)
 50         fmoveml %fpcr/%fpsr/%fpiar,USER_FPCR(%a6)
 51 
 52 |
 53         bsrl            unf_res |denormalize, round & store interm op
 54 |
 55 | If underflow exceptions are not enabled, check for inexact
 56 | exception
 57 |
 58         btstb           #unfl_bit,FPCR_ENABLE(%a6)
 59         beqs            ck_inex
 60 
 61         btstb           #E3,E_BYTE(%a6)
 62         beqs            no_e3_1
 63 |
 64 | Clear dirty bit on dest resister in the frame before branching
 65 | to b1238_fix.
 66 |
 67         bfextu          CMDREG3B(%a6){#6:#3},%d0        |get dest reg no
 68         bclrb           %d0,FPR_DIRTY_BITS(%a6) |clr dest dirty bit
 69         bsrl            b1238_fix               |test for bug1238 case
 70         movel           USER_FPSR(%a6),FPSR_SHADOW(%a6)
 71         orl             #sx_mask,E_BYTE(%a6)
 72 no_e3_1:
 73         moveml          USER_DA(%a6),%d0-%d1/%a0-%a1
 74         fmovemx USER_FP0(%a6),%fp0-%fp3
 75         fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
 76         frestore        (%a7)+
 77         unlk            %a6
 78         bral            real_unfl
 79 |
 80 | It is possible to have either inex2 or inex1 exceptions with the
 81 | unfl.  If the inex enable bit is set in the FPCR, and either
 82 | inex2 or inex1 occurred, we must clean up and branch to the
 83 | real inex handler.
 84 |
 85 ck_inex:
 86         moveb           FPCR_ENABLE(%a6),%d0
 87         andb            FPSR_EXCEPT(%a6),%d0
 88         andib           #0x3,%d0
 89         beqs            unfl_done
 90 
 91 |
 92 | Inexact enabled and reported, and we must take an inexact exception
 93 |
 94 take_inex:
 95         btstb           #E3,E_BYTE(%a6)
 96         beqs            no_e3_2
 97 |
 98 | Clear dirty bit on dest resister in the frame before branching
 99 | to b1238_fix.
100 |
101         bfextu          CMDREG3B(%a6){#6:#3},%d0        |get dest reg no
102         bclrb           %d0,FPR_DIRTY_BITS(%a6) |clr dest dirty bit
103         bsrl            b1238_fix               |test for bug1238 case
104         movel           USER_FPSR(%a6),FPSR_SHADOW(%a6)
105         orl             #sx_mask,E_BYTE(%a6)
106 no_e3_2:
107         moveb           #INEX_VEC,EXC_VEC+1(%a6)
108         moveml         USER_DA(%a6),%d0-%d1/%a0-%a1
109         fmovemx        USER_FP0(%a6),%fp0-%fp3
110         fmoveml        USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
111         frestore        (%a7)+
112         unlk            %a6
113         bral            real_inex
114 
115 unfl_done:
116         bclrb           #E3,E_BYTE(%a6)
117         beqs            e1_set          |if set then branch
118 |
119 | Clear dirty bit on dest resister in the frame before branching
120 | to b1238_fix.
121 |
122         bfextu          CMDREG3B(%a6){#6:#3},%d0                |get dest reg no
123         bclrb           %d0,FPR_DIRTY_BITS(%a6) |clr dest dirty bit
124         bsrl            b1238_fix               |test for bug1238 case
125         movel           USER_FPSR(%a6),FPSR_SHADOW(%a6)
126         orl             #sx_mask,E_BYTE(%a6)
127         moveml          USER_DA(%a6),%d0-%d1/%a0-%a1
128         fmovemx USER_FP0(%a6),%fp0-%fp3
129         fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
130         frestore        (%a7)+
131         unlk            %a6
132         bral            fpsp_done
133 e1_set:
134         moveml          USER_DA(%a6),%d0-%d1/%a0-%a1
135         fmovemx USER_FP0(%a6),%fp0-%fp3
136         fmoveml USER_FPCR(%a6),%fpcr/%fpsr/%fpiar
137         unlk            %a6
138         bral            fpsp_done
139 |
140 |       unf_res --- underflow result calculation
141 |
142 unf_res:
143         bsrl            g_rndpr         |returns RND_PREC in d0 0=ext,
144 |                                       ;1=sgl, 2=dbl
145 |                                       ;we need the RND_PREC in the
146 |                                       ;upper word for round
147         movew           #0,-(%a7)
148         movew           %d0,-(%a7)      |copy RND_PREC to stack
149 |
150 |
151 | If the exception bit set is E3, the exceptional operand from the
152 | fpu is in WBTEMP; else it is in FPTEMP.
153 |
154         btstb           #E3,E_BYTE(%a6)
155         beqs            unf_E1
156 unf_E3:
157         lea             WBTEMP(%a6),%a0 |a0 now points to operand
158 |
159 | Test for fsgldiv and fsglmul.  If the inst was one of these, then
160 | force the precision to extended for the denorm routine.  Use
161 | the user's precision for the round routine.
162 |
163         movew           CMDREG3B(%a6),%d1       |check for fsgldiv or fsglmul
164         andiw           #0x7f,%d1
165         cmpiw           #0x30,%d1               |check for sgldiv
166         beqs            unf_sgl
167         cmpiw           #0x33,%d1               |check for sglmul
168         bnes            unf_cont        |if not, use fpcr prec in round
169 unf_sgl:
170         clrl            %d0
171         movew           #0x1,(%a7)      |override g_rndpr precision
172 |                                       ;force single
173         bras            unf_cont
174 unf_E1:
175         lea             FPTEMP(%a6),%a0 |a0 now points to operand
176 unf_cont:
177         bclrb           #sign_bit,LOCAL_EX(%a0) |clear sign bit
178         sne             LOCAL_SGN(%a0)          |store sign
179 
180         bsrl            denorm          |returns denorm, a0 points to it
181 |
182 | WARNING:
183 |                               ;d0 has guard,round sticky bit
184 |                               ;make sure that it is not corrupted
185 |                               ;before it reaches the round subroutine
186 |                               ;also ensure that a0 isn't corrupted
187 
188 |
189 | Set up d1 for round subroutine d1 contains the PREC/MODE
190 | information respectively on upper/lower register halves.
191 |
192         bfextu          FPCR_MODE(%a6){#2:#2},%d1       |get mode from FPCR
193 |                                               ;mode in lower d1
194         addl            (%a7)+,%d1              |merge PREC/MODE
195 |
196 | WARNING: a0 and d0 are assumed to be intact between the denorm and
197 | round subroutines. All code between these two subroutines
198 | must not corrupt a0 and d0.
199 |
200 |
201 | Perform Round
202 |       Input:          a0 points to input operand
203 |                       d0{31:29} has guard, round, sticky
204 |                       d1{01:00} has rounding mode
205 |                       d1{17:16} has rounding precision
206 |       Output:         a0 points to rounded operand
207 |
208 
209         bsrl            round           |returns rounded denorm at (a0)
210 |
211 | Differentiate between store to memory vs. store to register
212 |
213 unf_store:
214         bsrl            g_opcls         |returns opclass in d0{2:0}
215         cmpib           #0x3,%d0
216         bnes            not_opc011
217 |
218 | At this point, a store to memory is pending
219 |
220 opc011:
221         bsrl            g_dfmtou
222         tstb            %d0
223         beqs            ext_opc011      |If extended, do not subtract
224 |                               ;If destination format is sgl/dbl,
225         tstb            LOCAL_HI(%a0)   |If rounded result is normal,don't
226 |                                       ;subtract
227         bmis            ext_opc011
228         subqw           #1,LOCAL_EX(%a0)        |account for denorm bias vs.
229 |                               ;normalized bias
230 |                               ;          normalized   denormalized
231 |                               ;single       $7f           $7e
232 |                               ;double       $3ff          $3fe
233 |
234 ext_opc011:
235         bsrl            store           |stores to memory
236         bras            unf_done        |finish up
237 
238 |
239 | At this point, a store to a float register is pending
240 |
241 not_opc011:
242         bsrl            store   |stores to float register
243 |                               ;a0 is not corrupted on a store to a
244 |                               ;float register.
245 |
246 | Set the condition codes according to result
247 |
248         tstl            LOCAL_HI(%a0)   |check upper mantissa
249         bnes            ck_sgn
250         tstl            LOCAL_LO(%a0)   |check lower mantissa
251         bnes            ck_sgn
252         bsetb           #z_bit,FPSR_CC(%a6) |set condition codes if zero
253 ck_sgn:
254         btstb           #sign_bit,LOCAL_EX(%a0) |check the sign bit
255         beqs            unf_done
256         bsetb           #neg_bit,FPSR_CC(%a6)
257 
258 |
259 | Finish.
260 |
261 unf_done:
262         btstb           #inex2_bit,FPSR_EXCEPT(%a6)
263         beqs            no_aunfl
264         bsetb           #aunfl_bit,FPSR_AEXCEPT(%a6)
265 no_aunfl:
266         rts
267 
268         |end

~ [ source navigation ] ~ [ diff markup ] ~ [ identifier search ] ~

kernel.org | git.kernel.org | LWN.net | Project Home | SVN repository | Mail admin

Linux® is a registered trademark of Linus Torvalds in the United States and other countries.
TOMOYO® is a registered trademark of NTT DATA CORPORATION.

sflogo.php