Merge remote-tracking branch 'spi/topic/core' into spi-next
[deliverable/linux.git] / arch / m68k / fpsp040 / kernel_ex.S
1 |
2 | kernel_ex.sa 3.3 12/19/90
3 |
4 | This file contains routines to force exception status in the
5 | fpu for exceptional cases detected or reported within the
6 | transcendental functions. Typically, the t_xx routine will
7 | set the appropriate bits in the USER_FPSR word on the stack.
8 | The bits are tested in gen_except.sa to determine if an exceptional
9 | situation needs to be created on return from the FPSP.
10 |
11
12 | Copyright (C) Motorola, Inc. 1990
13 | All Rights Reserved
14 |
15 | For details on the license for this file, please see the
16 | file, README, in this same directory.
17
18 KERNEL_EX: |idnt 2,1 | Motorola 040 Floating Point Software Package
19
20 |section 8
21
22 #include "fpsp.h"
23
| Constant operands, three longwords (12 bytes) each, loaded into fp0
| with fmovemx by the routines below. Presumably laid out as extended
| precision: sign/exponent in the upper word of the first longword,
| followed by the 64-bit mantissa -- confirm against the format in fpsp.h.
24 mns_inf: .long 0xffff0000,0x00000000,0x00000000
25 pls_inf: .long 0x7fff0000,0x00000000,0x00000000
| nan is the default NaN stored by t_operr when the operr trap is disabled.
26 nan: .long 0x7fff0000,0xffffffff,0xffffffff
| huge is not referenced by the code visible in this file; it is
| presumably the largest finite magnitude (exponent 0x7ffe) -- confirm.
27 huge: .long 0x7ffe0000,0xffffffff,0xffffffff
28
29 |xref ovf_r_k
30 |xref unf_sub
31 |xref nrm_set
32
33 .global t_dz
34 .global t_dz2
35 .global t_operr
36 .global t_unfl
37 .global t_ovfl
38 .global t_ovfl2
39 .global t_inx2
40 .global t_frcinx
41 .global t_extdnrm
42 .global t_resdnrm
43 .global dst_nan
44 .global src_nan
45 |
46 | DZ exception
47 |
48 |
49 | if dz trap disabled
50 | store properly signed inf (use sign of etemp) into fp0
51 | set FPSR exception status dz bit, condition code
52 | inf bit, and accrued dz bit
53 | return
54 | frestore the frame into the machine (done by unimp_hd)
55 |
56 | else dz trap enabled
57 | set exception status bit & accrued bits in FPSR
58 | set flag to disable sto_res from corrupting fp register
59 | return
60 | frestore the frame into the machine (done by unimp_hd)
61 |
62 | t_dz2 is used by monadic functions such as flogn (from do_func).
63 | t_dz is used by monadic functions such as satanh (from the
64 | transcendental function).
65 |
66 t_dz2:
| Entry for callers whose result is always negative: N is set up front,
| so the sign test on ETEMP done by the t_dz path is skipped.
67 bsetb #neg_bit,FPSR_CC(%a6) |set neg bit in FPSR
68 fmovel #0,%FPSR |clr status bits (Z set)
69 btstb #dz_bit,FPCR_ENABLE(%a6) |test FPCR for dz exc enabled
70 bnes dz_ena_end |trap enabled: N already set, skip sign test
71 bras m_inf |flogx always returns -inf
72 t_dz:
| Entry for callers whose result takes the sign of the operand in ETEMP.
73 fmovel #0,%FPSR |clr status bits (Z set)
74 btstb #dz_bit,FPCR_ENABLE(%a6) |test FPCR for dz exc enabled
75 bnes dz_ena
76 |
77 | dz disabled
78 |
79 btstb #sign_bit,ETEMP_EX(%a6) |check sign for neg or pos
80 beqs p_inf |branch if pos sign
81
82 m_inf:
83 fmovemx mns_inf,%fp0-%fp0 |load -inf
84 bsetb #neg_bit,FPSR_CC(%a6) |set neg bit in FPSR
85 bras set_fpsr
86 p_inf:
87 fmovemx pls_inf,%fp0-%fp0 |load +inf
88 set_fpsr:
| Both signs join here: record the status bits in the stacked FPSR image.
89 orl #dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ
90 rts
91 |
92 | dz enabled
93 |
94 dz_ena:
| No infinity is loaded into fp0 on this path; only the status bits and
| the N condition code are updated.
95 btstb #sign_bit,ETEMP_EX(%a6) |check sign for neg or pos
96 beqs dz_ena_end
97 bsetb #neg_bit,FPSR_CC(%a6) |set neg bit in FPSR
98 dz_ena_end:
99 orl #dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ
100 st STORE_FLG(%a6) |flag: sto_res must not write the fp register
101 rts
102 |
103 | OPERR exception
104 |
105 | if (operr trap disabled)
106 | set FPSR exception status operr bit, condition code
107 | nan bit; Store default NAN into fp0
108 | frestore the frame into the machine (done by unimp_hd)
109 |
110 | else (operr trap enabled)
111 | set FPSR exception status operr bit, accrued operr bit
112 | set flag to disable sto_res from corrupting fp register
113 | frestore the frame into the machine (done by unimp_hd)
114 |
115 t_operr:
| The status bits are recorded first, on both the enabled and the
| disabled path; only the handling of the result differs.
116 orl #opnan_mask,USER_FPSR(%a6) |set NaN, OPERR, AIOP
117
118 btstb #operr_bit,FPCR_ENABLE(%a6) |test FPCR for operr enabled
119 bnes op_ena
120
| Trap disabled: the result is the default NaN constant.
121 fmovemx nan,%fp0-%fp0 |load default nan
122 rts
123 op_ena:
| Trap enabled: fp0 is left untouched and the store is suppressed.
124 st STORE_FLG(%a6) |do not corrupt destination
125 rts
126
127 |
128 | t_unfl --- UNFL exception
129 |
130 | This entry point is used by all routines requiring unfl, inex2,
131 | aunfl, and ainex to be set on exit.
132 |
133 | On entry, a0 points to the exceptional operand. The final exceptional
134 | operand is built in FP_SCR1 and only the sign from the original operand
135 | is used.
136 |
137 t_unfl:
| Build a zero exceptional operand in FP_SCR1 that keeps only the sign
| of the caller's operand at (a0), then repoint a0 at FP_SCR1.
138 clrl FP_SCR1(%a6) |set exceptional operand to zero
139 clrl FP_SCR1+4(%a6)
140 clrl FP_SCR1+8(%a6)
141 tstb (%a0) |extract sign from caller's exop
142 bpls unfl_signok
143 bset #sign_bit,FP_SCR1(%a6)
144 unfl_signok:
145 leal FP_SCR1(%a6),%a0
146 orl #unfinx_mask,USER_FPSR(%a6)
147 | ;set UNFL, INEX2, AUNFL, AINEX
148 unfl_con:
149 btstb #unfl_bit,FPCR_ENABLE(%a6)
150 beqs unfl_dis
151
152 unfl_ena:
| Trap enabled: adjust the saved frame fields before computing the
| result, then fall through into the disabled-case code.
| NOTE(review): presumably this makes the frame look like the one the
| hardware would hand to the underflow handler -- confirm.
153 bfclr STAG(%a6){#5:#3} |clear wbtm66,wbtm1,wbtm0
154 bsetb #wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
155 bsetb #sticky_bit,STICKY(%a6) |set sticky bit
156
157 bclrb #E1,E_BYTE(%a6)
158
159 unfl_dis:
| d0 = two-bit rounding-precision field from FPCR_MODE; presumably an
| input to unf_sub (defined elsewhere) -- confirm.
160 bfextu FPCR_MODE(%a6){#0:#2},%d0 |get round precision
161
| bclrb reports the old sign bit in Z, so sne writes 0xff to LOCAL_SGN
| exactly when the operand was negative.
162 bclrb #sign_bit,LOCAL_EX(%a0)
163 sne LOCAL_SGN(%a0) |convert to internal ext format
164
165 bsr unf_sub |returns IEEE result at a0
166 | ;and sets FPSR_CC accordingly
167
| bfclr sets Z from the field's value before clearing it, so the branch
| is taken when the sign byte was zero (positive result).
168 bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format
169 beqs unfl_fin
170
171 bsetb #sign_bit,LOCAL_EX(%a0)
172 bsetb #sign_bit,FP_SCR1(%a6) |set sign bit of exc operand
173
174 unfl_fin:
175 fmovemx (%a0),%fp0-%fp0 |store result in fp0
176 rts
177
178
179 |
180 | t_ovfl2 --- OVFL exception (without inex2 returned)
181 |
182 | This entry is used by scale to force catastrophic overflow. The
183 | ovfl, aovfl, and ainex bits are set, but not the inex2 bit.
184 |
185 t_ovfl2:
| Record the overflow status bits (ovfl_inx_mask), copy the operand in
| ETEMP to FP_SCR1, then decide whether inex2 must also be reported
| before joining the common overflow code at t_work.
186 orl #ovfl_inx_mask,USER_FPSR(%a6)
187 movel ETEMP(%a6),FP_SCR1(%a6)
188 movel ETEMP_HI(%a6),FP_SCR1+4(%a6)
189 movel ETEMP_LO(%a6),FP_SCR1+8(%a6)
190 |
191 | Check for single or double round precision. If single, check if
192 | the lower 40 bits of ETEMP are zero; if not, set inex2. If double,
193 | check if the lower 11 bits are zero; if not, set inex2.
194 |
| The 64-bit mantissa is ETEMP_HI:ETEMP_LO, so the lower 40 bits are the
| low byte of ETEMP_HI together with all 32 bits of ETEMP_LO, and the
| lower 11 bits are the low 11 bits of ETEMP_LO.
195 moveb FPCR_MODE(%a6),%d0
196 andib #0xc0,%d0
197 beq t_work |if extended, finish ovfl processing
198 cmpib #0x40,%d0 |test for single
199 bnes t_dbl
200 t_sgl:
| A long test is required here: a byte test would examine only the most
| significant byte of ETEMP_LO and miss nonzero bits in its low 24 bits.
201 tstl ETEMP_LO(%a6) |all 32 low mantissa bits
202 bnes t_setinx2
203 movel ETEMP_HI(%a6),%d0
204 andil #0xff,%d0 |look at only lower 8 bits
205 bnes t_setinx2
206 bra t_work
207 t_dbl:
208 movel ETEMP_LO(%a6),%d0
209 andil #0x7ff,%d0 |look at only lower 11 bits
210 beq t_work
211 t_setinx2:
212 orl #inex2_mask,USER_FPSR(%a6)
213 bras t_work
214 |
215 | t_ovfl --- OVFL exception
216 |
217 |** Note: the exc operand is returned in ETEMP.
218 |
219 t_ovfl:
220 orl #ovfinx_mask,USER_FPSR(%a6)
221 t_work:
| Common overflow tail; t_ovfl2 also branches here after setting its own
| status bits.
222 btstb #ovfl_bit,FPCR_ENABLE(%a6) |test FPCR for ovfl enabled
223 beqs ovf_dis
224
225 ovf_ena:
| Trap enabled: zero the exceptional operand in FP_SCR1 and adjust the
| saved frame fields, then continue with the disabled-case code.
226 clrl FP_SCR1(%a6) |set exceptional operand
227 clrl FP_SCR1+4(%a6)
228 clrl FP_SCR1+8(%a6)
229
230 bfclr STAG(%a6){#5:#3} |clear wbtm66,wbtm1,wbtm0
231 bclrb #wbtemp15_bit,WB_BYTE(%a6) |clear wbtemp15
232 bsetb #sticky_bit,STICKY(%a6) |set sticky bit
233
234 bclrb #E1,E_BYTE(%a6)
235 | ;fall through to disabled case
236
237 | For disabled overflow call 'ovf_r_k'. This routine loads the
238 | correct result based on the rounding precision, destination
239 | format, rounding mode and sign.
240 |
241 ovf_dis:
242 bsr ovf_r_k |returns unsigned ETEMP_EX
243 | ;and sets FPSR_CC accordingly.
| bfclr sets Z from the sign byte before clearing it: a zero byte means
| a positive result, otherwise the sign bit is put back into both the
| result (ETEMP) and the exceptional operand (FP_SCR1).
244 bfclr ETEMP_SGN(%a6){#0:#8} |fix sign
245 beqs ovf_pos
246 bsetb #sign_bit,ETEMP_EX(%a6)
247 bsetb #sign_bit,FP_SCR1(%a6) |set exceptional operand sign
248 ovf_pos:
249 fmovemx ETEMP(%a6),%fp0-%fp0 |move the result to fp0
250 rts
251
252
253 |
254 | INEX2 exception
255 |
256 | The inex2 and ainex bits are set.
257 |
258 t_inx2:
| Only the stacked FPSR image is modified; no result is loaded here.
259 orl #inx2a_mask,USER_FPSR(%a6) |set INEX2, AINEX
260 rts
261
262 |
263 | Force Inex2
264 |
265 | This routine is called by the transcendental routines to force
266 | the inex2 exception bits set in the FPSR. If the underflow bit
267 | is set, but the underflow trap was not taken, the aunfl bit in
268 | the FPSR must be set.
269 |
270 t_frcinx:
271 orl #inx2a_mask,USER_FPSR(%a6) |set INEX2, AINEX
| If the unfl exception bit is already recorded in the stacked FPSR,
| mirror it into the accrued byte as well.
272 btstb #unfl_bit,FPSR_EXCEPT(%a6) |test for unfl bit set
273 beqs no_uacc1 |if clear, do not set aunfl
274 bsetb #aunfl_bit,FPSR_AEXCEPT(%a6)
275 no_uacc1:
276 rts
277
278 |
279 | DST_NAN
280 |
281 | Determine if the destination nan is signalling or non-signalling,
282 | and set the FPSR bits accordingly. See the MC68040 User's Manual
283 | section 3.2.2.5 NOT-A-NUMBERS.
284 |
285 dst_nan:
| The destination operand is read from FPTEMP. d1 is expected to hold
| the user's FPCR on entry (it is written back to %fpcr below); the
| caller that sets it up is not visible in this file.
286 btstb #sign_bit,FPTEMP_EX(%a6) |test sign of nan
287 beqs dst_pos |if clr, it was positive
288 bsetb #neg_bit,FPSR_CC(%a6) |set N bit
289 dst_pos:
| A clear signan bit marks a signalling nan, hence the beq.
290 btstb #signan_bit,FPTEMP_HI(%a6) |check if signalling
291 beqs dst_snan |branch if signalling
292
293 fmovel %d1,%fpcr |restore user's rmode/prec
294 fmovex FPTEMP(%a6),%fp0 |return the non-signalling nan
295 |
296 | Check the source nan. If it is signalling, snan will be reported.
297 |
| Only the top three bits of STAG are compared; 0x60 is presumably the
| nan tag value -- confirm against fpsp.h.
298 moveb STAG(%a6),%d0
299 andib #0xe0,%d0
300 cmpib #0x60,%d0
301 bnes no_snan
302 btstb #signan_bit,ETEMP_HI(%a6) |check if signalling
303 bnes no_snan
304 orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
305 no_snan:
306 rts
307
308 dst_snan:
309 btstb #snan_bit,FPCR_ENABLE(%a6) |check if trap enabled
310 beqs dst_dis |branch if disabled
311
| Trap enabled: no result is loaded into fp0 and the store is suppressed.
312 orb #nan_tag,DTAG(%a6) |set up dtag for nan
313 st STORE_FLG(%a6) |do not store a result
314 orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
315 rts
316
317 dst_dis:
| Trap disabled: turn the signalling nan into a non-signalling one by
| setting its signan bit, and return that as the result.
318 bsetb #signan_bit,FPTEMP_HI(%a6) |set SNAN bit in dst op
319 fmovel %d1,%fpcr |restore user's rmode/prec
320 fmovex FPTEMP(%a6),%fp0 |load non-sign. nan
321 orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
322 rts
323
324 |
325 | SRC_NAN
326 |
327 | Determine if the source nan is signalling or non-signalling,
328 | and set the FPSR bits accordingly. See the MC68040 User's Manual
329 | section 3.2.2.5 NOT-A-NUMBERS.
330 |
331 src_nan:
| The source operand is read from ETEMP. d1 is expected to hold the
| user's FPCR on entry (it is written back to %fpcr below); the caller
| that sets it up is not visible in this file.
332 btstb #sign_bit,ETEMP_EX(%a6) |test sign of nan
333 beqs src_pos |if clr, it was positive
334 bsetb #neg_bit,FPSR_CC(%a6) |set N bit
335 src_pos:
| A clear signan bit marks a signalling nan, hence the beq.
336 btstb #signan_bit,ETEMP_HI(%a6) |check if signalling
337 beqs src_snan |branch if signalling
338 fmovel %d1,%fpcr |restore user's rmode/prec
339 fmovex ETEMP(%a6),%fp0 |return the non-signalling nan
340 rts
341
342 src_snan:
343 btstb #snan_bit,FPCR_ENABLE(%a6) |check if trap enabled
344 beqs src_dis |branch if disabled
| Trap enabled: the operand in ETEMP is modified and both tags are
| updated, but nothing is loaded into fp0 and the store is suppressed.
345 bsetb #signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop
346 orb #norm_tag,DTAG(%a6) |set up dtag for norm
347 orb #nan_tag,STAG(%a6) |set up stag for nan
348 st STORE_FLG(%a6) |do not store a result
349 orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
350 rts
351
352 src_dis:
| Trap disabled: turn the signalling nan into a non-signalling one by
| setting its signan bit, and return that as the result.
353 bsetb #signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop
354 fmovel %d1,%fpcr |restore user's rmode/prec
355 fmovex ETEMP(%a6),%fp0 |load non-sign. nan
356 orl #snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
357 rts
358
359 |
360 | Entry point for all functions that have a denormalized input and
361 | for which f(x)=x.
362 |
363 t_extdnrm:
| On entry a0 points to the operand; it is read through the LOCAL_*
| offsets and finally loaded into fp0 at xdnrm_store.
364 orl #unfinx_mask,USER_FPSR(%a6)
365 | ;set UNFL, INEX2, AUNFL, AINEX
366 bras xdnrm_con
367 |
368 | Entry point for scale with extended denorm. The function does
369 | not set inex2, aunfl, or ainex.
370 |
371 t_resdnrm:
372 orl #unfl_mask,USER_FPSR(%a6)
373
374 xdnrm_con:
375 btstb #unfl_bit,FPCR_ENABLE(%a6)
376 beqs xdnrm_dis
377
378 |
379 | If exceptions are enabled, the additional task of setting up WBTEMP
380 | is needed so that when the underflow exception handler is entered,
381 | the user perceives no difference between what the 040 provides vs.
382 | what the FPSP provides.
383 |
384 xdnrm_ena:
| The caller's a0 is saved on the stack and restored at the end of this
| section; in between, a0 points at a working copy of the operand in
| FP_SCR1.
385 movel %a0,-(%a7)
386
387 movel LOCAL_EX(%a0),FP_SCR1(%a6)
388 movel LOCAL_HI(%a0),FP_SCR1+4(%a6)
389 movel LOCAL_LO(%a0),FP_SCR1+8(%a6)
390
391 lea FP_SCR1(%a6),%a0
392
| bclrb reports the old sign bit in Z, so sne writes 0xff to LOCAL_SGN
| exactly when the operand was negative.
393 bclrb #sign_bit,LOCAL_EX(%a0)
394 sne LOCAL_SGN(%a0) |convert to internal ext format
395 tstw LOCAL_EX(%a0) |check if input is denorm
396 beqs xdnrm_dn |if so, skip nrm_set
397 bsr nrm_set |normalize the result (exponent
398 | ;will be negative)
399 xdnrm_dn:
400 bclrb #sign_bit,LOCAL_EX(%a0) |take off false sign
401 bfclr LOCAL_SGN(%a0){#0:#8} |change back to IEEE ext format
402 beqs xdep
403 bsetb #sign_bit,LOCAL_EX(%a0)
404 xdep:
405 bfclr STAG(%a6){#5:#3} |clear wbtm66,wbtm1,wbtm0
406 bsetb #wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
407 bclrb #sticky_bit,STICKY(%a6) |clear sticky bit
408 bclrb #E1,E_BYTE(%a6)
409 movel (%a7)+,%a0
410 xdnrm_dis:
| bfextu sets Z when the extracted two-bit precision field is zero, so
| the bnes is taken for any precision other than extended.
411 bfextu FPCR_MODE(%a6){#0:#2},%d0 |get round precision
412 bnes not_ext |if not round extended, store
413 | ;IEEE defaults
414 is_ext:
| Round-to-extended: the operand is returned unchanged; only the N
| condition code is derived from its sign.
415 btstb #sign_bit,LOCAL_EX(%a0)
416 beqs xdnrm_store
417
418 bsetb #neg_bit,FPSR_CC(%a6) |set N bit in FPSR_CC
419
420 bras xdnrm_store
421
422 not_ext:
423 bclrb #sign_bit,LOCAL_EX(%a0)
424 sne LOCAL_SGN(%a0) |convert to internal ext format
425 bsr unf_sub |returns IEEE result pointed by
426 | ;a0; sets FPSR_CC accordingly
427 bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format
428 beqs xdnrm_store
429 bsetb #sign_bit,LOCAL_EX(%a0)
430 xdnrm_store:
431 fmovemx (%a0),%fp0-%fp0 |store result in fp0
432 rts
433
434 |
435 | This subroutine is used for dyadic operations that use an extended
436 | denorm within the kernel. The approach used is to capture the frame,
437 | fix it up, and restore it.
438 |
439 .global t_avoid_unsupp
440 t_avoid_unsupp:
| Unlike the routines above, this one uses a2 (not a6) as the frame
| pointer for the fpsp.h offsets; link/unlk set it up and restore it.
441 link %a2,#-LOCAL_SIZE |so that fpsp.h negative
442 | ;offsets may be used via a2
443 fsave -(%a7)
444 tstb 1(%a7) |check if idle, exit if so
445 beq idle_end
446 btstb #E1,E_BYTE(%a2) |check the E1 exception bit; if
447 | ;set, there is an unsupp
448 beq end_avun |else, exit
449 btstb #7,DTAG(%a2) |check for denorm destination
450 beqs src_den |else, must be a source denorm
451 |
452 | handle destination denorm
453 |
454 lea FPTEMP(%a2),%a0
| btstb sets Z from the sign bit, so sne writes 0xff to LOCAL_SGN
| exactly when the operand is negative.
455 btstb #sign_bit,LOCAL_EX(%a0)
456 sne LOCAL_SGN(%a0) |convert to internal ext format
457 bclrb #7,DTAG(%a2) |set DTAG to norm
458 bsr nrm_set |normalize result, exponent
459 | ;will become negative
460 bclrb #sign_bit,LOCAL_EX(%a0) |get rid of fake sign
461 bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format
462 beqs ck_src_den |check if source is also denorm
463 bsetb #sign_bit,LOCAL_EX(%a0)
464 ck_src_den:
465 btstb #7,STAG(%a2)
466 beqs end_avun
467 src_den:
| Same fix-up as for the destination, applied to the source in ETEMP.
468 lea ETEMP(%a2),%a0
469 btstb #sign_bit,LOCAL_EX(%a0)
470 sne LOCAL_SGN(%a0) |convert to internal ext format
471 bclrb #7,STAG(%a2) |set STAG to norm
472 bsr nrm_set |normalize result, exponent
473 | ;will become negative
474 bclrb #sign_bit,LOCAL_EX(%a0) |get rid of fake sign
475 bfclr LOCAL_SGN(%a0){#0:#8} |convert back to IEEE ext format
476 beqs den_com
477 bsetb #sign_bit,LOCAL_EX(%a0)
478 den_com:
| Reached only after the source fix-up: either by falling through from
| src_den or via its beqs above.
479 moveb #0xfe,CU_SAVEPC(%a2) |set continue frame
480 clrw NMNEXC(%a2) |clear NMNEXC
481 bclrb #E1,E_BYTE(%a2)
482 | fmove.l %FPSR,FPSR_SHADOW(%a2)
483 | bset.b #SFLAG,E_BYTE(%a2)
484 | bset.b #XFLAG,T_BYTE(%a2)
485 end_avun:
| Reload the (possibly modified) frame into the FPU and release the
| link frame.
486 frestore (%a7)+
487 unlk %a2
488 rts
489 idle_end:
| Idle case: no frestore is executed; 4 bytes are dropped from the
| stack (presumably the entire idle fsave frame -- confirm).
490 addl #4,%a7
491 unlk %a2
492 rts
493 |end
This page took 0.058447 seconds and 5 git commands to generate.