[deliverable/linux.git] / arch / m68k / fpsp040 / kernel_ex.S

|
|	kernel_ex.sa 3.3 12/19/90
|
| This file contains routines to force exception status in the
| fpu for exceptional cases detected or reported within the
| transcendental functions.  Typically, the t_xx routine will
| set the appropriate bits in the USER_FPSR word on the stack.
| The bits are tested in gen_except.sa to determine if an exceptional
| situation needs to be created on return from the FPSP.
|

|		Copyright (C) Motorola, Inc. 1990
|			All Rights Reserved
|
|       For details on the license for this file, please see the
|       file, README, in this same directory.

KERNEL_EX:    |idnt    2,1 | Motorola 040 Floating Point Software Package

	|section    8

#include "fpsp.h"

| Extended-precision images, three longwords each, that the routines
| below load into fp0 with fmovemx.
mns_inf:  .long 0xffff0000,0x00000000,0x00000000	| -inf, loaded at m_inf
pls_inf:  .long 0x7fff0000,0x00000000,0x00000000	| +inf, loaded at p_inf
nan:      .long 0x7fff0000,0xffffffff,0xffffffff	| default nan, loaded by t_operr
huge:     .long 0x7ffe0000,0xffffffff,0xffffffff	| no reference visible in this file

	|xref	  ovf_r_k
	|xref	  unf_sub
	|xref	  nrm_set

	.global	  t_dz
	.global      t_dz2
	.global      t_operr
	.global      t_unfl
	.global      t_ovfl
	.global      t_ovfl2
	.global      t_inx2
	.global	  t_frcinx
	.global	  t_extdnrm
	.global	  t_resdnrm
	.global	  dst_nan
	.global	  src_nan
|
|	DZ exception
|
| Entry points t_dz2 and t_dz.  Both clear the hardware FPSR and then
| test the dz enable bit in the FPCR image at FPCR_ENABLE(a6).
|
|	if dz trap disabled
|		store properly signed inf (use sign of etemp) into fp0
|		set FPSR exception status dz bit, condition code
|		inf bit, and accrued dz bit
|		return
|		frestore the frame into the machine (done by unimp_hd)
|
|	else dz trap enabled
|		set exception status bit & accrued bits in FPSR
|		set flag to disable sto_res from corrupting fp register
|		return
|		frestore the frame into the machine (done by unimp_hd)
|
| t_dz2 is used by monadic functions such as flogn (from do_func).
| It never tests the sign of etemp: the neg bit is always set and,
| when the trap is disabled, -inf is always returned.
| t_dz is used by monadic functions such as satanh (from the
| transcendental function).  It takes the sign of the result from
| ETEMP_EX(a6).
|
| Status is recorded in the stack images FPSR_CC(a6) and USER_FPSR(a6).
|
t_dz2:
	bsetb	#neg_bit,FPSR_CC(%a6)	|set neg bit in FPSR
	fmovel	#0,%FPSR			|clr status bits (Z set)
	btstb	#dz_bit,FPCR_ENABLE(%a6)	|test FPCR for dz exc enabled
	bnes	dz_ena_end		|enabled: neg bit is already set, so
|					;skip the sign test at dz_ena
	bras	m_inf			|flogx always returns -inf
t_dz:
	fmovel	#0,%FPSR			|clr status bits (Z set)
	btstb	#dz_bit,FPCR_ENABLE(%a6)	|test FPCR for dz exc enabled
	bnes	dz_ena
|
|	dz disabled
|
	btstb	#sign_bit,ETEMP_EX(%a6)	|check sign for neg or pos
	beqs	p_inf			|branch if pos sign

| m_inf is also the disabled-trap target of t_dz2.
m_inf:
	fmovemx mns_inf,%fp0-%fp0		|load -inf
	bsetb	#neg_bit,FPSR_CC(%a6)	|set neg bit in FPSR
	bras	set_fpsr
p_inf:
	fmovemx pls_inf,%fp0-%fp0		|load +inf
set_fpsr:
	orl	#dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ
	rts
|
|	dz enabled
|
dz_ena:
	btstb	#sign_bit,ETEMP_EX(%a6)	|check sign for neg or pos
	beqs	dz_ena_end
	bsetb	#neg_bit,FPSR_CC(%a6)	|set neg bit in FPSR
| dz_ena_end is also the enabled-trap target of t_dz2.
dz_ena_end:
	orl	#dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ
	st	STORE_FLG(%a6)		|no result is loaded into fp0 on
|					;this path; flag tells sto_res
|					;not to store one
	rts
|
|	OPERR exception
|
| Always ORs opnan_mask (NaN, OPERR, AIOP) into USER_FPSR(a6), then
| looks at the operr enable bit in FPCR_ENABLE(a6):
|
|	trap enabled:	set STORE_FLG so that sto_res does not
|			corrupt the destination fp register
|	trap disabled:	load the default nan into fp0
|
| In both cases the frame is frestored into the machine afterwards
| (done by unimp_hd).
|
t_operr:
	orl	#opnan_mask,USER_FPSR(%a6) |record NaN, OPERR, AIOP
	btstb	#operr_bit,FPCR_ENABLE(%a6) |is the operr trap enabled?
	beqs	operr_dflt		|no: deliver the default result
	st	STORE_FLG(%a6)		|yes: do not corrupt destination
	rts
operr_dflt:
	fmovemx nan,%fp0-%fp0		|fp0 = default nan
	rts

|
|	t_unfl --- UNFL exception
|
| This entry point is used by all routines requiring unfl, inex2,
| aunfl, and ainex to be set on exit.
|
| On entry, a0 points to the exceptional operand.  The final exceptional
| operand is built in FP_SCR1 and only the sign from the original operand
| is used.
|
| On exit fp0 has been loaded from the operand a0 points at after
| unf_sub returns.  d0 is loaded with the round precision before
| unf_sub is called (presumably its argument -- confirm against
| unf_sub).
|
t_unfl:
	clrl	FP_SCR1(%a6)		|set exceptional operand to zero
	clrl	FP_SCR1+4(%a6)
	clrl	FP_SCR1+8(%a6)
	tstb	(%a0)			|extract sign from caller's exop
	bpls	unfl_signok
	bset	#sign_bit,FP_SCR1(%a6)
unfl_signok:
	leal	FP_SCR1(%a6),%a0		|from here on a0 -> FP_SCR1
	orl	#unfinx_mask,USER_FPSR(%a6)
|					;set UNFL, INEX2, AUNFL, AINEX
unfl_con:
	btstb	#unfl_bit,FPCR_ENABLE(%a6)
	beqs	unfl_dis

| Underflow trap enabled: adjust the frame fields below before
| falling into the common code.
unfl_ena:
	bfclr	STAG(%a6){#5:#3}		|clear wbtm66,wbtm1,wbtm0
	bsetb	#wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
	bsetb	#sticky_bit,STICKY(%a6)	|set sticky bit

	bclrb	#E1,E_BYTE(%a6)

unfl_dis:
	bfextu	FPCR_MODE(%a6){#0:#2},%d0	|get round precision

| bclr sets Z from the old sign bit, so sne records the sign as
| 0x00/0xff in LOCAL_SGN while the sign bit itself is removed.
	bclrb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)		|convert to internal ext format

	bsr	unf_sub			|returns IEEE result at a0
|					;and sets FPSR_CC accordingly

| bfclr sets Z from the old LOCAL_SGN byte: zero means positive.
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
	beqs	unfl_fin

	bsetb	#sign_bit,LOCAL_EX(%a0)
	bsetb	#sign_bit,FP_SCR1(%a6)	|set sign bit of exc operand

unfl_fin:
	fmovemx (%a0),%fp0-%fp0		|store result in fp0
	rts


|
|	t_ovfl2 --- OVFL exception (without inex2 returned)
|
| This entry is used by scale to force catastrophic overflow.  The
| ovfl, aovfl, and ainex bits are set, but not the inex2 bit.
|
| ETEMP is copied to FP_SCR1.  inex2 is then added only when the
| round precision in FPCR_MODE(a6) is single or double and the
| mantissa bits of ETEMP below that precision are not all zero.
| Control always continues at t_work, the common overflow code.
|
| Uses d0 as scratch.
|
t_ovfl2:
	orl	#ovfl_inx_mask,USER_FPSR(%a6)
	movel	ETEMP(%a6),FP_SCR1(%a6)
	movel	ETEMP_HI(%a6),FP_SCR1+4(%a6)
	movel	ETEMP_LO(%a6),FP_SCR1+8(%a6)
|
| Check for single or double round precision.  If single, check if
| the lower 40 bits of ETEMP are zero (the low 8 bits of ETEMP_HI and
| all 32 bits of ETEMP_LO); if not, set inex2.  If double, check if
| the lower 11 bits of ETEMP_LO are zero; if not, set inex2.
|
	moveb	FPCR_MODE(%a6),%d0
	andib	#0xc0,%d0		|keep only the round precision bits
	beq	t_work		|if extended, finish ovfl processing
	cmpib	#0x40,%d0		|test for single
	bnes	t_dbl
t_sgl:
	tstl	ETEMP_LO(%a6)		|whole low longword; a byte test
|					;would only see its top 8 bits
	bnes	t_setinx2
	movel	ETEMP_HI(%a6),%d0
	andil	#0xff,%d0		|look at only lower 8 bits
	bnes	t_setinx2
	bra	t_work
t_dbl:
	movel	ETEMP_LO(%a6),%d0
	andil	#0x7ff,%d0	|look at only lower 11 bits
	beq	t_work
t_setinx2:
	orl	#inex2_mask,USER_FPSR(%a6)
	bras	t_work
|
|	t_ovfl --- OVFL exception
|
|** Note: the exc operand is returned in ETEMP.
|
| t_ovfl ORs ovfinx_mask into USER_FPSR(a6) and falls into t_work.
| t_work is also entered directly from t_ovfl2, which sets its own
| status bits first.  The result left in ETEMP by ovf_r_k is given
| its sign back and loaded into fp0.
|
t_ovfl:
	orl	#ovfinx_mask,USER_FPSR(%a6)
t_work:
	btstb	#ovfl_bit,FPCR_ENABLE(%a6) |test FPCR for ovfl enabled
	beqs	ovf_dis

| Overflow trap enabled.  Note that this zeroes FP_SCR1 even when
| t_ovfl2 has just copied ETEMP into it.
ovf_ena:
	clrl	FP_SCR1(%a6)		|set exceptional operand
	clrl	FP_SCR1+4(%a6)
	clrl	FP_SCR1+8(%a6)

	bfclr	STAG(%a6){#5:#3}		|clear wbtm66,wbtm1,wbtm0
	bclrb	#wbtemp15_bit,WB_BYTE(%a6) |clear wbtemp15
	bsetb	#sticky_bit,STICKY(%a6)	|set sticky bit

	bclrb	#E1,E_BYTE(%a6)
|					;fall through to disabled case

| For disabled overflow call 'ovf_r_k'.  This routine loads the
| correct result based on the rounding precision, destination
| format, rounding mode and sign.
|
ovf_dis:
	bsr	ovf_r_k			|returns unsigned ETEMP_EX
|					;and sets FPSR_CC accordingly.
| bfclr sets Z from the old ETEMP_SGN byte: zero means positive.
	bfclr	ETEMP_SGN(%a6){#0:#8}	|fix sign
	beqs	ovf_pos
	bsetb	#sign_bit,ETEMP_EX(%a6)
	bsetb	#sign_bit,FP_SCR1(%a6)	|set exceptional operand sign
ovf_pos:
	fmovemx ETEMP(%a6),%fp0-%fp0		|move the result to fp0
	rts


|
|	INEX2 exception
|
| ORs inx2a_mask (the inex2 and ainex bits) into the FPSR image at
| USER_FPSR(a6) and returns.  Nothing else is touched.
|
t_inx2:
	oril	#inx2a_mask,USER_FPSR(%a6) |INEX2 + AINEX
	rts

|
|	Force Inex2
|
| Called by the transcendental routines to force the inex2 and ainex
| bits in the FPSR image.  When the unfl exception bit is already set
| (underflow seen, but the underflow trap was not taken) the accrued
| underflow bit is set as well.
|
t_frcinx:
	orl	#inx2a_mask,USER_FPSR(%a6) |INEX2 and AINEX
	btstb	#unfl_bit,FPSR_EXCEPT(%a6) |underflow recorded?
	bnes	frcinx_aunfl		|yes: accrue it too
	rts
frcinx_aunfl:
	bsetb	#aunfl_bit,FPSR_AEXCEPT(%a6)
	rts

|
|	DST_NAN
|
| Determine if the destination nan is signalling or non-signalling,
| and set the FPSR bits accordingly.  See the MC68040 User's Manual
| section 3.2.2.5 NOT-A-NUMBERS.
|
| The destination nan is read from FPTEMP(a6).  d1 is written to the
| FPCR before the nan is loaded into fp0, so the caller is expected to
| pass the user's FPCR value in d1.  d0 is used as scratch on the
| non-signalling path.
|
dst_nan:
	btstb	#sign_bit,FPTEMP_EX(%a6) |test sign of nan
	beqs	dst_pos			|if clr, it was positive
	bsetb	#neg_bit,FPSR_CC(%a6)	|set N bit
dst_pos:
	btstb	#signan_bit,FPTEMP_HI(%a6) |check if signalling
	beqs	dst_snan		|branch if signalling

	fmovel	%d1,%fpcr			|restore user's rmode/prec
	fmovex FPTEMP(%a6),%fp0		|return the non-signalling nan
|
| Check the source nan.  If it is signalling, snan will be reported.
|
	moveb	STAG(%a6),%d0
	andib	#0xe0,%d0		|keep the top three bits of STAG
	cmpib	#0x60,%d0		|presumably the nan tag -- confirm
|					;against fpsp.h
	bnes	no_snan
	btstb	#signan_bit,ETEMP_HI(%a6) |check if signalling
	bnes	no_snan			|bit set: source is non-signalling
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
no_snan:
	rts

| Destination is a signalling nan.
dst_snan:
	btstb	#snan_bit,FPCR_ENABLE(%a6) |check if trap enabled
	beqs	dst_dis			|branch if disabled

	orb	#nan_tag,DTAG(%a6)	|set up dtag for nan
	st	STORE_FLG(%a6)		|do not store a result
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
	rts

| Trap disabled: set the bit tested at dst_pos so the nan becomes
| non-signalling, and return that nan in fp0.
dst_dis:
	bsetb	#signan_bit,FPTEMP_HI(%a6) |set SNAN bit in dest operand
	fmovel	%d1,%fpcr			|restore user's rmode/prec
	fmovex FPTEMP(%a6),%fp0		|load non-sign. nan
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
	rts

|
|	SRC_NAN
|
| Determine if the source nan is signalling or non-signalling,
| and set the FPSR bits accordingly.  See the MC68040 User's Manual
| section 3.2.2.5 NOT-A-NUMBERS.
|
| The source nan is read from ETEMP(a6).  d1 is written to the FPCR
| before the nan is loaded into fp0, so the caller is expected to
| pass the user's FPCR value in d1.
|
src_nan:
	btstb	#sign_bit,ETEMP_EX(%a6) |test sign of nan
	beqs	src_pos			|if clr, it was positive
	bsetb	#neg_bit,FPSR_CC(%a6)	|set N bit
src_pos:
	btstb	#signan_bit,ETEMP_HI(%a6) |check if signalling
	beqs	src_snan		|branch if signalling
	fmovel	%d1,%fpcr			|restore user's rmode/prec
	fmovex ETEMP(%a6),%fp0		|return the non-signalling nan
	rts

| Source is a signalling nan.
src_snan:
	btstb	#snan_bit,FPCR_ENABLE(%a6) |check if trap enabled
	beqs	src_dis			|branch if disabled
| Trap enabled: no result is loaded into fp0 on this path.
	bsetb	#signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop
	orb	#norm_tag,DTAG(%a6)	|set up dtag for norm
	orb	#nan_tag,STAG(%a6)	|set up stag for nan
	st	STORE_FLG(%a6)		|do not store a result
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
	rts

| Trap disabled: set the bit tested at src_pos so the nan becomes
| non-signalling, and return that nan in fp0.
src_dis:
	bsetb	#signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop
	fmovel	%d1,%fpcr			|restore user's rmode/prec
	fmovex ETEMP(%a6),%fp0		|load non-sign. nan
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
	rts

|
| For all functions that have a denormalized input and that f(x)=x,
| this is the entry point
|
| On entry a0 points to the operand.  t_extdnrm and t_resdnrm differ
| only in the mask ORed into USER_FPSR(a6); both continue at
| xdnrm_con.  On exit fp0 has been loaded from the operand a0 points
| at.  d0 is overwritten with the round precision.
|
t_extdnrm:
	orl	#unfinx_mask,USER_FPSR(%a6)
|					;set UNFL, INEX2, AUNFL, AINEX
	bras	xdnrm_con
|
| Entry point for scale with extended denorm.  The function does
| not set inex2, aunfl, or ainex.
|
t_resdnrm:
	orl	#unfl_mask,USER_FPSR(%a6)

xdnrm_con:
	btstb	#unfl_bit,FPCR_ENABLE(%a6)
	beqs	xdnrm_dis

|
| If exceptions are enabled, the additional task of setting up WBTEMP
| is needed so that when the underflow exception handler is entered,
| the user perceives no difference between what the 040 provides vs.
| what the FPSP provides.
|
| The operand is copied to FP_SCR1 and worked on there; the caller's
| a0 is saved on the stack and restored before xdnrm_dis.
|
xdnrm_ena:
	movel	%a0,-(%a7)

	movel	LOCAL_EX(%a0),FP_SCR1(%a6)
	movel	LOCAL_HI(%a0),FP_SCR1+4(%a6)
	movel	LOCAL_LO(%a0),FP_SCR1+8(%a6)

	lea	FP_SCR1(%a6),%a0

| bclr sets Z from the old sign bit, so sne records the sign as
| 0x00/0xff in LOCAL_SGN.
	bclrb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
	tstw	LOCAL_EX(%a0)		|check if input is denorm
	beqs	xdnrm_dn		|if so, skip nrm_set
	bsr	nrm_set			|normalize the result (exponent
|					;will be negative
xdnrm_dn:
	bclrb	#sign_bit,LOCAL_EX(%a0)	|take off false sign
	bfclr	LOCAL_SGN(%a0){#0:#8}	|change back to IEEE ext format
	beqs	xdep			|old LOCAL_SGN was zero: positive
	bsetb	#sign_bit,LOCAL_EX(%a0)
xdep:
	bfclr	STAG(%a6){#5:#3}		|clear wbtm66,wbtm1,wbtm0
	bsetb	#wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
	bclrb	#sticky_bit,STICKY(%a6)	|clear sticky bit
	bclrb	#E1,E_BYTE(%a6)
	movel	(%a7)+,%a0		|back to the caller's operand
xdnrm_dis:
| bfextu sets Z when the extracted field is zero.
	bfextu	FPCR_MODE(%a6){#0:#2},%d0	|get round precision
	bnes	not_ext			|if not round extended, store
|					;IEEE defaults
| Round precision is extended: the operand is returned unchanged and
| only the N condition code is derived from its sign.
is_ext:
	btstb	#sign_bit,LOCAL_EX(%a0)
	beqs	xdnrm_store

	bsetb	#neg_bit,FPSR_CC(%a6)	|set N bit in FPSR_CC

	bras	xdnrm_store

not_ext:
	bclrb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
	bsr	unf_sub			|returns IEEE result pointed by
|					;a0; sets FPSR_CC accordingly
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
	beqs	xdnrm_store
	bsetb	#sign_bit,LOCAL_EX(%a0)
xdnrm_store:
	fmovemx (%a0),%fp0-%fp0		|store result in fp0
	rts

|
| This subroutine is used for dyadic operations that use an extended
| denorm within the kernel. The approach used is to capture the frame,
| fix/restore.
|
| A local frame is linked through a2 (not a6), and the FPU state is
| fsaved directly below it so the fpsp.h offsets address that saved
| state relative to a2.  Denormalized FPTEMP/ETEMP operands in the
| saved state are normalized with nrm_set and their tags set to norm.
| a0 is used as the operand pointer for nrm_set.
|
	.global	t_avoid_unsupp
t_avoid_unsupp:
	link	%a2,#-LOCAL_SIZE		|so that a2 fpsp.h negative
|					;offsets may be used
	fsave	-(%a7)
	tstb	1(%a7)			|check if idle, exit if so
	beq	idle_end
	btstb	#E1,E_BYTE(%a2)		|check for an E1 exception if
|					;enabled, there is an unsupp
	beq	end_avun		|else, exit
	btstb	#7,DTAG(%a2)		|check for denorm destination
	beqs	src_den			|else, must be a source denorm
|
| handle destination denorm
|
	lea	FPTEMP(%a2),%a0
	btstb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
	bclrb	#7,DTAG(%a2)		|set DTAG to norm
	bsr	nrm_set			|normalize result, exponent
|					;will become negative
	bclrb	#sign_bit,LOCAL_EX(%a0)	|get rid of fake sign
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
	beqs	ck_src_den		|check if source is also denorm
	bsetb	#sign_bit,LOCAL_EX(%a0)
ck_src_den:
	btstb	#7,STAG(%a2)
| NOTE(review): when only the destination was a denorm this branch
| goes straight to end_avun, so the den_com fix-ups (CU_SAVEPC,
| NMNEXC, E1) are skipped on that path -- confirm this is intended.
	beqs	end_avun
src_den:
	lea	ETEMP(%a2),%a0
	btstb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
	bclrb	#7,STAG(%a2)		|set STAG to norm
	bsr	nrm_set			|normalize result, exponent
|					;will become negative
	bclrb	#sign_bit,LOCAL_EX(%a0)	|get rid of fake sign
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
	beqs	den_com
	bsetb	#sign_bit,LOCAL_EX(%a0)
den_com:
	moveb	#0xfe,CU_SAVEPC(%a2)	|set continue frame
	clrw	NMNEXC(%a2)		|clear NMNEXC
	bclrb	#E1,E_BYTE(%a2)
|	fmove.l	%FPSR,FPSR_SHADOW(%a2)
|	bset.b	#SFLAG,E_BYTE(%a2)
|	bset.b	#XFLAG,T_BYTE(%a2)
end_avun:
	frestore (%a7)+			|reload the (possibly fixed) frame
	unlk	%a2
	rts
| Idle exit: the saved frame is popped as 4 bytes and is not
| frestored.
idle_end:
	addl	#4,%a7
	unlk	%a2
	rts
	|end
Commit	Line	Data
1da177e4 LT	1	\|
	2	\| kernel_ex.sa 3.3 12/19/90
	3	\|
	4	\| This file contains routines to force exception status in the
	5	\| fpu for exceptional cases detected or reported within the
	6	\| transcendental functions. Typically, the t_xx routine will
	7	\| set the appropriate bits in the USER_FPSR word on the stack.
	8	\| The bits are tested in gen_except.sa to determine if an exceptional
	9	\| situation needs to be created on return from the FPSP.
	10	\|
	11
	12	\| Copyright (C) Motorola, Inc. 1990
	13	\| All Rights Reserved
	14	\|
e00d82d0 MW	15	\| For details on the license for this file, please see the
e00d82d0 MW	16	\| file, README, in this same directory.
1da177e4 LT	17
	18	KERNEL_EX: \|idnt 2,1 \| Motorola 040 Floating Point Software Package
	19
	20	\|section 8
	21
	22	#include "fpsp.h"
	23
	24	mns_inf: .long 0xffff0000,0x00000000,0x00000000
	25	pls_inf: .long 0x7fff0000,0x00000000,0x00000000
	26	nan: .long 0x7fff0000,0xffffffff,0xffffffff
	27	huge: .long 0x7ffe0000,0xffffffff,0xffffffff
	28
	29	\|xref ovf_r_k
	30	\|xref unf_sub
	31	\|xref nrm_set
	32
	33	.global t_dz
	34	.global t_dz2
	35	.global t_operr
	36	.global t_unfl
	37	.global t_ovfl
	38	.global t_ovfl2
	39	.global t_inx2
	40	.global t_frcinx
	41	.global t_extdnrm
	42	.global t_resdnrm
	43	.global dst_nan
	44	.global src_nan
	45	\|
	46	\| DZ exception
	47	\|
	48	\|
	49	\| if dz trap disabled
	50	\| store properly signed inf (use sign of etemp) into fp0
	51	\| set FPSR exception status dz bit, condition code
	52	\| inf bit, and accrued dz bit
	53	\| return
	54	\| frestore the frame into the machine (done by unimp_hd)
	55	\|
	56	\| else dz trap enabled
	57	\| set exception status bit & accrued bits in FPSR
	58	\| set flag to disable sto_res from corrupting fp register
	59	\| return
	60	\| frestore the frame into the machine (done by unimp_hd)
	61	\|
	62	\| t_dz2 is used by monadic functions such as flogn (from do_func).
	63	\| t_dz is used by monadic functions such as satanh (from the
	64	\| transcendental function).
	65	\|
	66	t_dz2:
	67	bsetb #neg_bit,FPSR_CC(%a6) \|set neg bit in FPSR
	68	fmovel #0,%FPSR \|clr status bits (Z set)
	69	btstb #dz_bit,FPCR_ENABLE(%a6) \|test FPCR for dz exc enabled
	70	bnes dz_ena_end
	71	bras m_inf \|flogx always returns -inf
	72	t_dz:
	73	fmovel #0,%FPSR \|clr status bits (Z set)
	74	btstb #dz_bit,FPCR_ENABLE(%a6) \|test FPCR for dz exc enabled
	75	bnes dz_ena
	76	\|
	77	\| dz disabled
	78	\|
	79	btstb #sign_bit,ETEMP_EX(%a6) \|check sign for neg or pos
	80	beqs p_inf \|branch if pos sign
81
82	m_inf:
83	fmovemx mns_inf,%fp0-%fp0 \|load -inf
84	bsetb #neg_bit,FPSR_CC(%a6) \|set neg bit in FPSR
85	bras set_fpsr
86	p_inf:
87	fmovemx pls_inf,%fp0-%fp0 \|load +inf
88	set_fpsr:
89	orl #dzinf_mask,USER_FPSR(%a6) \|set I,DZ,ADZ
90	rts
91	\|
92	\| dz enabled
93	\|
94	dz_ena:
95	btstb #sign_bit,ETEMP_EX(%a6) \|check sign for neg or pos
96	beqs dz_ena_end
97	bsetb #neg_bit,FPSR_CC(%a6) \|set neg bit in FPSR
98	dz_ena_end:
99	orl #dzinf_mask,USER_FPSR(%a6) \|set I,DZ,ADZ
100	st STORE_FLG(%a6)
101	rts
102	\|
103	\| OPERR exception
104	\|
105	\| if (operr trap disabled)
106	\| set FPSR exception status operr bit, condition code
107	\| nan bit; Store default NAN into fp0
108	\| frestore the frame into the machine (done by unimp_hd)
109	\|
110	\| else (operr trap enabled)
111	\| set FPSR exception status operr bit, accrued operr bit
112	\| set flag to disable sto_res from corrupting fp register
113	\| frestore the frame into the machine (done by unimp_hd)
114	\|
115	t_operr:
116	orl #opnan_mask,USER_FPSR(%a6) \|set NaN, OPERR, AIOP
117
118	btstb #operr_bit,FPCR_ENABLE(%a6) \|test FPCR for operr enabled
119	bnes op_ena
120
121	fmovemx nan,%fp0-%fp0 \|load default nan
122	rts
123	op_ena:
124	st STORE_FLG(%a6) \|do not corrupt destination
125	rts
126
127	\|
128	\| t_unfl --- UNFL exception
129	\|
130	\| This entry point is used by all routines requiring unfl, inex2,
131	\| aunfl, and ainex to be set on exit.
132	\|
133	\| On entry, a0 points to the exceptional operand. The final exceptional
134	\| operand is built in FP_SCR1 and only the sign from the original operand
135	\| is used.
136	\|
137	t_unfl:
138	clrl FP_SCR1(%a6) \|set exceptional operand to zero
139	clrl FP_SCR1+4(%a6)
140	clrl FP_SCR1+8(%a6)
141	tstb (%a0) \|extract sign from caller's exop
142	bpls unfl_signok
143	bset #sign_bit,FP_SCR1(%a6)
144	unfl_signok:
145	leal FP_SCR1(%a6),%a0
146	orl #unfinx_mask,USER_FPSR(%a6)
147	\| ;set UNFL, INEX2, AUNFL, AINEX
148	unfl_con:
149	btstb #unfl_bit,FPCR_ENABLE(%a6)
150	beqs unfl_dis
151
152	unfl_ena:
153	bfclr STAG(%a6){#5:#3} \|clear wbtm66,wbtm1,wbtm0
154	bsetb #wbtemp15_bit,WB_BYTE(%a6) \|set wbtemp15
155	bsetb #sticky_bit,STICKY(%a6) \|set sticky bit
156
157	bclrb #E1,E_BYTE(%a6)
158
159	unfl_dis:
160	bfextu FPCR_MODE(%a6){#0:#2},%d0 \|get round precision
161
162	bclrb #sign_bit,LOCAL_EX(%a0)
163	sne LOCAL_SGN(%a0) \|convert to internal ext format
164
165	bsr unf_sub \|returns IEEE result at a0
166	\| ;and sets FPSR_CC accordingly
167
168	bfclr LOCAL_SGN(%a0){#0:#8} \|convert back to IEEE ext format
169	beqs unfl_fin
170
171	bsetb #sign_bit,LOCAL_EX(%a0)
172	bsetb #sign_bit,FP_SCR1(%a6) \|set sign bit of exc operand
173
174	unfl_fin:
175	fmovemx (%a0),%fp0-%fp0 \|store result in fp0
176	rts
177
178
179	\|
180	\| t_ovfl2 --- OVFL exception (without inex2 returned)
181	\|
182	\| This entry is used by scale to force catastrophic overflow. The
183	\| ovfl, aovfl, and ainex bits are set, but not the inex2 bit.
184	\|
185	t_ovfl2:
186	orl #ovfl_inx_mask,USER_FPSR(%a6)
187	movel ETEMP(%a6),FP_SCR1(%a6)
188	movel ETEMP_HI(%a6),FP_SCR1+4(%a6)
189	movel ETEMP_LO(%a6),FP_SCR1+8(%a6)
190	\|
191	\| Check for single or double round precision. If single, check if
192	\| the lower 40 bits of ETEMP are zero; if not, set inex2. If double,
193	\| check if the lower 21 bits are zero; if not, set inex2.
194	\|
195	moveb FPCR_MODE(%a6),%d0
196	andib #0xc0,%d0
197	beq t_work \|if extended, finish ovfl processing
198	cmpib #0x40,%d0 \|test for single
199	bnes t_dbl
200	t_sgl:
201	tstb ETEMP_LO(%a6)
202	bnes t_setinx2
203	movel ETEMP_HI(%a6),%d0
204	andil #0xff,%d0 \|look at only lower 8 bits
205	bnes t_setinx2
206	bra t_work
207	t_dbl:
208	movel ETEMP_LO(%a6),%d0
209	andil #0x7ff,%d0 \|look at only lower 11 bits
210	beq t_work
211	t_setinx2:
212	orl #inex2_mask,USER_FPSR(%a6)
213	bras t_work
214	\|
215	\| t_ovfl --- OVFL exception
216	\|
217	\|** Note: the exc operand is returned in ETEMP.
218	\|
219	t_ovfl:
220	orl #ovfinx_mask,USER_FPSR(%a6)
221	t_work:
222	btstb #ovfl_bit,FPCR_ENABLE(%a6) \|test FPCR for ovfl enabled
223	beqs ovf_dis
224
225	ovf_ena:
226	clrl FP_SCR1(%a6) \|set exceptional operand
227	clrl FP_SCR1+4(%a6)
228	clrl FP_SCR1+8(%a6)
229
230	bfclr STAG(%a6){#5:#3} \|clear wbtm66,wbtm1,wbtm0
231	bclrb #wbtemp15_bit,WB_BYTE(%a6) \|clear wbtemp15
232	bsetb #sticky_bit,STICKY(%a6) \|set sticky bit
233
234	bclrb #E1,E_BYTE(%a6)
235	\| ;fall through to disabled case
236
237	\| For disabled overflow call 'ovf_r_k'. This routine loads the
238	\| correct result based on the rounding precision, destination
239	\| format, rounding mode and sign.
240	\|
241	ovf_dis:
242	bsr ovf_r_k \|returns unsigned ETEMP_EX
243	\| ;and sets FPSR_CC accordingly.
244	bfclr ETEMP_SGN(%a6){#0:#8} \|fix sign
245	beqs ovf_pos
246	bsetb #sign_bit,ETEMP_EX(%a6)
247	bsetb #sign_bit,FP_SCR1(%a6) \|set exceptional operand sign
248	ovf_pos:
249	fmovemx ETEMP(%a6),%fp0-%fp0 \|move the result to fp0
250	rts
251
252
253	\|
254	\| INEX2 exception
255	\|
256	\| The inex2 and ainex bits are set.
257	\|
258	t_inx2:
259	orl #inx2a_mask,USER_FPSR(%a6) \|set INEX2, AINEX
260	rts
261
262	\|
263	\| Force Inex2
264	\|
265	\| This routine is called by the transcendental routines to force
266	\| the inex2 exception bits set in the FPSR. If the underflow bit
267	\| is set, but the underflow trap was not taken, the aunfl bit in
268	\| the FPSR must be set.
269	\|
270	t_frcinx:
271	orl #inx2a_mask,USER_FPSR(%a6) \|set INEX2, AINEX
272	btstb #unfl_bit,FPSR_EXCEPT(%a6) \|test for unfl bit set
273	beqs no_uacc1 \|if clear, do not set aunfl
274	bsetb #aunfl_bit,FPSR_AEXCEPT(%a6)
275	no_uacc1:
276	rts
277
278	\|
279	\| DST_NAN
280	\|
281	\| Determine if the destination nan is signalling or non-signalling,
282	\| and set the FPSR bits accordingly. See the MC68040 User's Manual
283	\| section 3.2.2.5 NOT-A-NUMBERS.
284	\|
285	dst_nan:
286	btstb #sign_bit,FPTEMP_EX(%a6) \|test sign of nan
287	beqs dst_pos \|if clr, it was positive
288	bsetb #neg_bit,FPSR_CC(%a6) \|set N bit
289	dst_pos:
290	btstb #signan_bit,FPTEMP_HI(%a6) \|check if signalling
291	beqs dst_snan \|branch if signalling
292
293	fmovel %d1,%fpcr \|restore user's rmode/prec
294	fmovex FPTEMP(%a6),%fp0 \|return the non-signalling nan
295	\|
296	\| Check the source nan. If it is signalling, snan will be reported.
297	\|
298	moveb STAG(%a6),%d0
299	andib #0xe0,%d0
300	cmpib #0x60,%d0
301	bnes no_snan
302	btstb #signan_bit,ETEMP_HI(%a6) \|check if signalling
303	bnes no_snan
304	orl #snaniop_mask,USER_FPSR(%a6) \|set NAN, SNAN, AIOP
305	no_snan:
306	rts
307
308	dst_snan:
309	btstb #snan_bit,FPCR_ENABLE(%a6) \|check if trap enabled
310	beqs dst_dis \|branch if disabled
311
312	orb #nan_tag,DTAG(%a6) \|set up dtag for nan
313	st STORE_FLG(%a6) \|do not store a result
314	orl #snaniop_mask,USER_FPSR(%a6) \|set NAN, SNAN, AIOP
315	rts
316
317	dst_dis:
318	bsetb #signan_bit,FPTEMP_HI(%a6) \|set SNAN bit in sop
319	fmovel %d1,%fpcr \|restore user's rmode/prec
320	fmovex FPTEMP(%a6),%fp0 \|load non-sign. nan
321	orl #snaniop_mask,USER_FPSR(%a6) \|set NAN, SNAN, AIOP
322	rts
323
324	\|
325	\| SRC_NAN
326	\|
327	\| Determine if the source nan is signalling or non-signalling,
328	\| and set the FPSR bits accordingly. See the MC68040 User's Manual
329	\| section 3.2.2.5 NOT-A-NUMBERS.
330	\|
331	src_nan:
332	btstb #sign_bit,ETEMP_EX(%a6) \|test sign of nan
333	beqs src_pos \|if clr, it was positive
334	bsetb #neg_bit,FPSR_CC(%a6) \|set N bit
335	src_pos:
336	btstb #signan_bit,ETEMP_HI(%a6) \|check if signalling
337	beqs src_snan \|branch if signalling
338	fmovel %d1,%fpcr \|restore user's rmode/prec
339	fmovex ETEMP(%a6),%fp0 \|return the non-signalling nan
340	rts
341
342	src_snan:
343	btstb #snan_bit,FPCR_ENABLE(%a6) \|check if trap enabled
344	beqs src_dis \|branch if disabled
345	bsetb #signan_bit,ETEMP_HI(%a6) \|set SNAN bit in sop
346	orb #norm_tag,DTAG(%a6) \|set up dtag for norm
347	orb #nan_tag,STAG(%a6) \|set up stag for nan
348	st STORE_FLG(%a6) \|do not store a result
349	orl #snaniop_mask,USER_FPSR(%a6) \|set NAN, SNAN, AIOP
350	rts
351
352	src_dis:
353	bsetb #signan_bit,ETEMP_HI(%a6) \|set SNAN bit in sop
354	fmovel %d1,%fpcr \|restore user's rmode/prec
355	fmovex ETEMP(%a6),%fp0 \|load non-sign. nan
356	orl #snaniop_mask,USER_FPSR(%a6) \|set NAN, SNAN, AIOP
357	rts
358
359	\|
360	\| For all functions that have a denormalized input and that f(x)=x,
361	\| this is the entry point
362	\|
363	t_extdnrm:
364	orl #unfinx_mask,USER_FPSR(%a6)
365	\| ;set UNFL, INEX2, AUNFL, AINEX
366	bras xdnrm_con
367	\|
368	\| Entry point for scale with extended denorm. The function does
369	\| not set inex2, aunfl, or ainex.
370	\|
371	t_resdnrm:
372	orl #unfl_mask,USER_FPSR(%a6)
373
374	xdnrm_con:
375	btstb #unfl_bit,FPCR_ENABLE(%a6)
376	beqs xdnrm_dis
377
378	\|
379	\| If exceptions are enabled, the additional task of setting up WBTEMP
380	\| is needed so that when the underflow exception handler is entered,
381	\| the user perceives no difference between what the 040 provides vs.
382	\| what the FPSP provides.
383	\|
384	xdnrm_ena:
385	movel %a0,-(%a7)
386
387	movel LOCAL_EX(%a0),FP_SCR1(%a6)
388	movel LOCAL_HI(%a0),FP_SCR1+4(%a6)
389	movel LOCAL_LO(%a0),FP_SCR1+8(%a6)
390
391	lea FP_SCR1(%a6),%a0
392
393	bclrb #sign_bit,LOCAL_EX(%a0)
394	sne LOCAL_SGN(%a0) \|convert to internal ext format
395	tstw LOCAL_EX(%a0) \|check if input is denorm
396	beqs xdnrm_dn \|if so, skip nrm_set
397	bsr nrm_set \|normalize the result (exponent
398	\| ;will be negative
399	xdnrm_dn:
400	bclrb #sign_bit,LOCAL_EX(%a0) \|take off false sign
401	bfclr LOCAL_SGN(%a0){#0:#8} \|change back to IEEE ext format
402	beqs xdep
403	bsetb #sign_bit,LOCAL_EX(%a0)
404	xdep:
405	bfclr STAG(%a6){#5:#3} \|clear wbtm66,wbtm1,wbtm0
406	bsetb #wbtemp15_bit,WB_BYTE(%a6) \|set wbtemp15
407	bclrb #sticky_bit,STICKY(%a6) \|clear sticky bit
408	bclrb #E1,E_BYTE(%a6)
409	movel (%a7)+,%a0
410	xdnrm_dis:
411	bfextu FPCR_MODE(%a6){#0:#2},%d0 \|get round precision
412	bnes not_ext \|if not round extended, store
413	\| ;IEEE defaults
414	is_ext:
415	btstb #sign_bit,LOCAL_EX(%a0)
416	beqs xdnrm_store
417
418	bsetb #neg_bit,FPSR_CC(%a6) \|set N bit in FPSR_CC
419
420	bras xdnrm_store
421
422	not_ext:
423	bclrb #sign_bit,LOCAL_EX(%a0)
424	sne LOCAL_SGN(%a0) \|convert to internal ext format
425	bsr unf_sub \|returns IEEE result pointed by
426	\| ;a0; sets FPSR_CC accordingly
427	bfclr LOCAL_SGN(%a0){#0:#8} \|convert back to IEEE ext format
428	beqs xdnrm_store
429	bsetb #sign_bit,LOCAL_EX(%a0)
430	xdnrm_store:
431	fmovemx (%a0),%fp0-%fp0 \|store result in fp0
432	rts
433
434	\|
435	\| This subroutine is used for dyadic operations that use an extended
436	\| denorm within the kernel. The approach used is to capture the frame,
437	\| fix/restore.
438	\|
439	.global t_avoid_unsupp
440	t_avoid_unsupp:
441	link %a2,#-LOCAL_SIZE \|so that a2 fpsp.h negative
442	\| ;offsets may be used
443	fsave -(%a7)
444	tstb 1(%a7) \|check if idle, exit if so
445	beq idle_end
446	btstb #E1,E_BYTE(%a2) \|check for an E1 exception if
447	\| ;enabled, there is an unsupp
448	beq end_avun \|else, exit
449	btstb #7,DTAG(%a2) \|check for denorm destination
450	beqs src_den \|else, must be a source denorm
451	\|
452	\| handle destination denorm
453	\|
454	lea FPTEMP(%a2),%a0
455	btstb #sign_bit,LOCAL_EX(%a0)
456	sne LOCAL_SGN(%a0) \|convert to internal ext format
457	bclrb #7,DTAG(%a2) \|set DTAG to norm
458	bsr nrm_set \|normalize result, exponent
459	\| ;will become negative
460	bclrb #sign_bit,LOCAL_EX(%a0) \|get rid of fake sign
461	bfclr LOCAL_SGN(%a0){#0:#8} \|convert back to IEEE ext format
462	beqs ck_src_den \|check if source is also denorm
463	bsetb #sign_bit,LOCAL_EX(%a0)
464	ck_src_den:
465	btstb #7,STAG(%a2)
466	beqs end_avun
467	src_den:
468	lea ETEMP(%a2),%a0
469	btstb #sign_bit,LOCAL_EX(%a0)
470	sne LOCAL_SGN(%a0) \|convert to internal ext format
471	bclrb #7,STAG(%a2) \|set STAG to norm
472	bsr nrm_set \|normalize result, exponent
473	\| ;will become negative
474	bclrb #sign_bit,LOCAL_EX(%a0) \|get rid of fake sign
475	bfclr LOCAL_SGN(%a0){#0:#8} \|convert back to IEEE ext format
476	beqs den_com
477	bsetb #sign_bit,LOCAL_EX(%a0)
478	den_com:
479	moveb #0xfe,CU_SAVEPC(%a2) \|set continue frame
480	clrw NMNEXC(%a2) \|clear NMNEXC
481	bclrb #E1,E_BYTE(%a2)
482	\| fmove.l %FPSR,FPSR_SHADOW(%a2)
483	\| bset.b #SFLAG,E_BYTE(%a2)
484	\| bset.b #XFLAG,T_BYTE(%a2)
485	end_avun:
486	frestore (%a7)+
487	unlk %a2
488	rts
489	idle_end:
490	addl #4,%a7
491	unlk %a2
492	rts
493	\|end