[deliverable/linux.git] / arch / parisc / math-emu / dfsqrt.c

/*
 * Linux/PA-RISC Project (http://www.parisc-linux.org/)
 *
 * Floating-point emulation code
 *  Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org>
 *
 *    This program is free software; you can redistribute it and/or modify
 *    it under the terms of the GNU General Public License as published by
 *    the Free Software Foundation; either version 2, or (at your option)
 *    any later version.
 *
 *    This program is distributed in the hope that it will be useful,
 *    but WITHOUT ANY WARRANTY; without even the implied warranty of
 *    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *    GNU General Public License for more details.
 *
 *    You should have received a copy of the GNU General Public License
 *    along with this program; if not, write to the Free Software
 *    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 */
/*
 * BEGIN_DESC
 *
 *  File:
 *	@(#)	pa/spmath/dfsqrt.c		$Revision: 1.1 $
 *
 *  Purpose:
 *	Double Floating-point Square Root
 *
 *  External Interfaces:
 *	dbl_fsqrt(srcptr,nullptr,dstptr,status)
 *
 *  Internal Interfaces:
 *
 *  Theory:
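 *	The source operand is first screened for NaN, infinity, zero and
 *	negative values.  For the remaining operands the root of the
 *	mantissa is developed one bit position per iteration by a
 *	compare/subtract/shift loop, the result is rounded according to
 *	the current rounding mode, and the result exponent is formed by
 *	halving the unbiased source exponent.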
 *
 * END_DESC
*/


#include "float.h"
#include "dbl_float.h"

/*
 *  Double Floating-point Square Root
 *
 *  Reads the double-precision operand at srcptr, computes its square root
 *  and stores the result through dstptr.
 *
 *  Parameters:
 *	srcptr  - source operand
 *	nullptr - not referenced in the visible body of this function
 *	dstptr  - destination for the result
 *	status  - not referenced by name in the visible body; presumably
 *		  consumed by the trap/flag/rounding-mode macros from the
 *		  included headers -- TODO confirm
 *
 *  Returns:
 *	NOEXCEPTION      - a result was stored.  This includes the quiet NaN,
 *			   positive infinity and zero pass-through cases, and
 *			   the invalid/inexact cases when the corresponding
 *			   trap is disabled (the flag is set instead).
 *	INVALIDEXCEPTION - signaling NaN or negative operand while the invalid
 *			   trap is enabled; nothing is stored.
 *	INEXACTEXCEPTION - inexact result while the inexact trap is enabled;
 *			   the rounded result is stored before returning.
 */

/*ARGSUSED*/
unsigned int
dbl_fsqrt(
	    dbl_floating_point *srcptr,
	    unsigned int *nullptr,
	    dbl_floating_point *dstptr,
	    unsigned int *status)
{
	/* srcp1/srcp2 and resultp1/resultp2 are the two words of the operand
	 * and of the result; srcp1/srcp2 is reused as the running remainder
	 * inside the root loop. */
	register unsigned int srcp1, srcp2, resultp1, resultp2;
	/* newbitp1/newbitp2: the single bit currently being tried;
	 * sump1/sump2: trial value result + newbit. */
	register unsigned int newbitp1, newbitp2, sump1, sump2;
	register int src_exponent;
	register boolean guardbit = FALSE, even_exponent;

	Dbl_copyfromptr(srcptr,srcp1,srcp2);
        /*
         * Check the source operand for NaN or infinity.  src_exponent is
         * captured here and reused by the result generation below.
         */
        if ((src_exponent = Dbl_exponent(srcp1)) == DBL_INFINITY_EXPONENT) {
                /*
                 * Is it a signaling NaN?
                 */
                if (Dbl_isone_signaling(srcp1)) {
                        /* trap (without storing a result) if INVALIDTRAP enabled */
                        if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION);
                        /* otherwise raise the invalid flag and make the NaN quiet */
                        Set_invalidflag();
                        Dbl_set_quiet(srcp1);
                }
                /*
                 * Return the (now quiet) NaN or positive infinity unchanged.
                 * Negative infinity (sign set, zero mantissa) falls through
                 * to the negative-operand test below.
                 */
		if (Dbl_iszero_sign(srcp1) || 
		    Dbl_isnotzero_mantissa(srcp1,srcp2)) {
                	Dbl_copytoptr(srcp1,srcp2,dstptr);
                	return(NOEXCEPTION);
		}
        }

        /*
         * Check for a zero source operand.  This test precedes the sign
         * test, so an operand with zero exponent and mantissa is copied to
         * the destination as is.
         */
	if (Dbl_iszero_exponentmantissa(srcp1,srcp2)) {
		Dbl_copytoptr(srcp1,srcp2,dstptr);
		return(NOEXCEPTION);
	}

        /*
         * Check for a negative source operand (including negative infinity,
         * which fell through from the first test).
         */
	if (Dbl_isone_sign(srcp1)) {
		/* trap (without storing a result) if INVALIDTRAP enabled */
		if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION);
		/* otherwise raise the invalid flag and return the value
		 * produced by Dbl_makequietnan */
		Set_invalidflag();
		Dbl_makequietnan(srcp1,srcp2);
		Dbl_copytoptr(srcp1,srcp2,dstptr);
		return(NOEXCEPTION);
	}

	/*
	 * Generate result.
	 *
	 * First reduce the operand to a bare mantissa with the hidden bit
	 * set, and record the low bit of the biased exponent in
	 * even_exponent.
	 */
	if (src_exponent > 0) {
		/* Normalized operand: the hidden-bit position still holds the
		 * lowest exponent bit at this point, so read it before the
		 * exponent field is cleared. */
		even_exponent = Dbl_hidden(srcp1);
		Dbl_clear_signexponent_set_hidden(srcp1);
	}
	else {
		/* Denormalized operand: normalize it, letting Dbl_normalize
		 * adjust src_exponent, then take the parity from the adjusted
		 * exponent. */
		Dbl_clear_signexponent(srcp1);
		src_exponent++;
		Dbl_normalize(srcp1,srcp2,src_exponent);
		even_exponent = src_exponent & 1;
	}
	if (even_exponent) {
		/* exponent is even */
		/* NOTE(review): assuming DBL_BIAS is odd, a set low bit of the
		 * biased exponent means the unbiased exponent is even.  The
		 * mantissa is pre-shifted left by one here and the result is
		 * shifted back right by one after the loop, so that both
		 * parities can share the same loop and the same exponent
		 * halving at the end -- confirm against the field layout in
		 * dbl_float.h. */
		Dbl_leftshiftby1(srcp1,srcp2);
	}
	/*
	 * Develop the root one bit position per iteration.
	 *
	 * newbit starts as the single bit 1 << (DBL_P - 32) in the first
	 * word.  Each pass forms the trial value sum = result + newbit:
	 *
	 *   - if sum does not exceed the remainder (srcp1/srcp2), the bit is
	 *     accepted: twice newbit is added to result, sum is subtracted
	 *     from the remainder, and newbit ends up one position lower
	 *     (left by one, then right by two);
	 *   - otherwise the bit is rejected and newbit simply moves one
	 *     position lower.
	 *
	 * In both cases the remainder is then shifted left by one.  Because
	 * twice newbit is what gets accumulated, result holds the root
	 * scaled up by one bit position; the right shifts after the loop
	 * remove that scaling.  The loop ends when newbit has been shifted
	 * out or the remainder reaches zero (exact root).
	 *
	 * NOTE(review): this looks like the classical shift-and-subtract
	 * square root with the remainder shifted instead of the trial term
	 * -- confirm before relying on that description.
	 */
	Dbl_setzero(resultp1,resultp2);
	Dbl_allp1(newbitp1) = 1 << (DBL_P - 32);
	Dbl_setzero_mantissap2(newbitp2);
	while (Dbl_isnotzero(newbitp1,newbitp2) && Dbl_isnotzero(srcp1,srcp2)) {
		Dbl_addition(resultp1,resultp2,newbitp1,newbitp2,sump1,sump2);
		if(Dbl_isnotgreaterthan(sump1,sump2,srcp1,srcp2)) {
			Dbl_leftshiftby1(newbitp1,newbitp2);
			/* update result with the accepted bit (doubled) */
			Dbl_addition(resultp1,resultp2,newbitp1,newbitp2,
			 resultp1,resultp2);  
			Dbl_subtract(srcp1,srcp2,sump1,sump2,srcp1,srcp2);
			Dbl_rightshiftby2(newbitp1,newbitp2);
		}
		else {
			Dbl_rightshiftby1(newbitp1,newbitp2);
		}
		Dbl_leftshiftby1(srcp1,srcp2);
	}
	/* undo the mantissa pre-shift that was applied for even_exponent */
	if (even_exponent) {
		Dbl_rightshiftby1(resultp1,resultp2);
	}

	/* A non-zero remainder means the root is inexact and must be rounded */
	if (Dbl_isnotzero(srcp1,srcp2)) {
		/* NOTE(review): when the result was not post-shifted above,
		 * this comparison appears to develop one further low-order
		 * result bit so that a guard bit is available -- confirm. */
		if (!even_exponent && Dbl_islessthan(resultp1,resultp2,srcp1,srcp2)) {
			Dbl_increment(resultp1,resultp2);
		}
		/* the lowest result bit is the guard bit; save it, then drop it */
		guardbit = Dbl_lowmantissap2(resultp2);
		Dbl_rightshiftby1(resultp1,resultp2);

		/*  now round result; modes without a case below leave the
		 *  truncated value unchanged  */
		switch (Rounding_mode()) {
		case ROUNDPLUS:
		     /* result is positive and inexact: always round up */
		     Dbl_increment(resultp1,resultp2);
		     break;
		case ROUNDNEAREST:
		     /* stickybit is always true, so guardbit 
		      * is enough to determine rounding */
		     if (guardbit) {
			    Dbl_increment(resultp1,resultp2);
		     }
		     break;
		}
		/* If rounding carried out of the mantissa, bump the source
		 * exponent by 2: it is halved when the result exponent is
		 * formed, so the result exponent goes up by 1. */
		if (Dbl_isone_hiddenoverflow(resultp1)) src_exponent+=2;

		if (Is_inexacttrap_enabled()) {
			/* trap enabled: still deliver the rounded result,
			 * then report the inexact exception */
			Dbl_set_exponent(resultp1,
			 ((src_exponent-DBL_BIAS)>>1)+DBL_BIAS);
			Dbl_copytoptr(resultp1,resultp2,dstptr);
			return(INEXACTEXCEPTION);
		}
		else Set_inexactflag();
	}
	else {
		/* exact root: just drop the extra low-order bit */
		Dbl_rightshiftby1(resultp1,resultp2);
	}
	/* result exponent = half of the unbiased source exponent, re-biased */
	Dbl_set_exponent(resultp1,((src_exponent-DBL_BIAS)>>1)+DBL_BIAS);
	Dbl_copytoptr(resultp1,resultp2,dstptr);
	return(NOEXCEPTION);
}
Commit	Line	Data
1da177e4 LT	1	/*
	2	* Linux/PA-RISC Project (http://www.parisc-linux.org/)
	3	*
	4	* Floating-point emulation code
	5	* Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org>
	6	*
	7	* This program is free software; you can redistribute it and/or modify
	8	* it under the terms of the GNU General Public License as published by
	9	* the Free Software Foundation; either version 2, or (at your option)
	10	* any later version.
	11	*
	12	* This program is distributed in the hope that it will be useful,
	13	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	14	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	15	* GNU General Public License for more details.
	16	*
	17	* You should have received a copy of the GNU General Public License
	18	* along with this program; if not, write to the Free Software
	19	* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
	20	*/
	21	/*
	22	* BEGIN_DESC
	23	*
	24	* File:
	25	* @(#) pa/spmath/dfsqrt.c $Revision: 1.1 $
	26	*
	27	* Purpose:
	28	* Double Floating-point Square Root
	29	*
	30	* External Interfaces:
	31	* dbl_fsqrt(srcptr,nullptr,dstptr,status)
	32	*
	33	* Internal Interfaces:
	34	*
	35	* Theory:
	36	* <<please update with a overview of the operation of this file>>
	37	*
	38	* END_DESC
	39	*/
	40
	41
	42	#include "float.h"
	43	#include "dbl_float.h"
	44
	45	/*
	46	* Double Floating-point Square Root
	47	*/
	48
	49	/*ARGSUSED*/
	50	unsigned int
	51	dbl_fsqrt(
	52	dbl_floating_point *srcptr,
	53	unsigned int *nullptr,
	54	dbl_floating_point *dstptr,
	55	unsigned int *status)
	56	{
	57	register unsigned int srcp1, srcp2, resultp1, resultp2;
	58	register unsigned int newbitp1, newbitp2, sump1, sump2;
	59	register int src_exponent;
	60	register boolean guardbit = FALSE, even_exponent;
	61
	62	Dbl_copyfromptr(srcptr,srcp1,srcp2);
	63	/*
	64	* check source operand for NaN or infinity
65	*/
66	if ((src_exponent = Dbl_exponent(srcp1)) == DBL_INFINITY_EXPONENT) {
67	/*
68	* is signaling NaN?
69	*/
70	if (Dbl_isone_signaling(srcp1)) {
71	/* trap if INVALIDTRAP enabled */
72	if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION);
73	/* make NaN quiet */
74	Set_invalidflag();
75	Dbl_set_quiet(srcp1);
76	}
77	/*
78	* Return quiet NaN or positive infinity.
7022672e	79	* Fall through to negative test if negative infinity.
1da177e4 LT	80	*/
	81	if (Dbl_iszero_sign(srcp1) ||
	82	Dbl_isnotzero_mantissa(srcp1,srcp2)) {
	83	Dbl_copytoptr(srcp1,srcp2,dstptr);
	84	return(NOEXCEPTION);
	85	}
	86	}
	87
	88	/*
	89	* check for zero source operand
	90	*/
	91	if (Dbl_iszero_exponentmantissa(srcp1,srcp2)) {
	92	Dbl_copytoptr(srcp1,srcp2,dstptr);
	93	return(NOEXCEPTION);
	94	}
	95
	96	/*
	97	* check for negative source operand
	98	*/
	99	if (Dbl_isone_sign(srcp1)) {
	100	/* trap if INVALIDTRAP enabled */
	101	if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION);
	102	/* make NaN quiet */
	103	Set_invalidflag();
	104	Dbl_makequietnan(srcp1,srcp2);
	105	Dbl_copytoptr(srcp1,srcp2,dstptr);
	106	return(NOEXCEPTION);
	107	}
	108
	109	/*
	110	* Generate result
	111	*/
	112	if (src_exponent > 0) {
	113	even_exponent = Dbl_hidden(srcp1);
	114	Dbl_clear_signexponent_set_hidden(srcp1);
	115	}
	116	else {
	117	/* normalize operand */
	118	Dbl_clear_signexponent(srcp1);
	119	src_exponent++;
	120	Dbl_normalize(srcp1,srcp2,src_exponent);
	121	even_exponent = src_exponent & 1;
	122	}
	123	if (even_exponent) {
	124	/* exponent is even */
	125	/* Add comment here. Explain why odd exponent needs correction */
	126	Dbl_leftshiftby1(srcp1,srcp2);
	127	}
	128	/*
	129	* Add comment here. Explain following algorithm.
	130	*
	131	* Trust me, it works.
	132	*
	133	*/
	134	Dbl_setzero(resultp1,resultp2);
	135	Dbl_allp1(newbitp1) = 1 << (DBL_P - 32);
	136	Dbl_setzero_mantissap2(newbitp2);
	137	while (Dbl_isnotzero(newbitp1,newbitp2) && Dbl_isnotzero(srcp1,srcp2)) {
	138	Dbl_addition(resultp1,resultp2,newbitp1,newbitp2,sump1,sump2);
	139	if(Dbl_isnotgreaterthan(sump1,sump2,srcp1,srcp2)) {
	140	Dbl_leftshiftby1(newbitp1,newbitp2);
	141	/* update result */
	142	Dbl_addition(resultp1,resultp2,newbitp1,newbitp2,
	143	resultp1,resultp2);
144	Dbl_subtract(srcp1,srcp2,sump1,sump2,srcp1,srcp2);
145	Dbl_rightshiftby2(newbitp1,newbitp2);
146	}
147	else {
148	Dbl_rightshiftby1(newbitp1,newbitp2);
149	}
150	Dbl_leftshiftby1(srcp1,srcp2);
151	}
152	/* correct exponent for pre-shift */
153	if (even_exponent) {
154	Dbl_rightshiftby1(resultp1,resultp2);
155	}
156
157	/* check for inexact */
158	if (Dbl_isnotzero(srcp1,srcp2)) {
159	if (!even_exponent && Dbl_islessthan(resultp1,resultp2,srcp1,srcp2)) {
160	Dbl_increment(resultp1,resultp2);
161	}
162	guardbit = Dbl_lowmantissap2(resultp2);
163	Dbl_rightshiftby1(resultp1,resultp2);
164
165	/* now round result */
166	switch (Rounding_mode()) {
167	case ROUNDPLUS:
168	Dbl_increment(resultp1,resultp2);
169	break;
170	case ROUNDNEAREST:
171	/* stickybit is always true, so guardbit
172	* is enough to determine rounding */
173	if (guardbit) {
174	Dbl_increment(resultp1,resultp2);
175	}
176	break;
177	}
178	/* increment result exponent by 1 if mantissa overflowed */
179	if (Dbl_isone_hiddenoverflow(resultp1)) src_exponent+=2;
180
181	if (Is_inexacttrap_enabled()) {
182	Dbl_set_exponent(resultp1,
183	((src_exponent-DBL_BIAS)>>1)+DBL_BIAS);
184	Dbl_copytoptr(resultp1,resultp2,dstptr);
185	return(INEXACTEXCEPTION);
186	}
187	else Set_inexactflag();
188	}
189	else {
190	Dbl_rightshiftby1(resultp1,resultp2);
191	}
192	Dbl_set_exponent(resultp1,((src_exponent-DBL_BIAS)>>1)+DBL_BIAS);
193	Dbl_copytoptr(resultp1,resultp2,dstptr);
194	return(NOEXCEPTION);
195	}