xref: /openbmc/linux/arch/mips/math-emu/sp_sqrt.c (revision 56a64733)
/* IEEE754 floating point arithmetic
 * single precision square root
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 *
 *  This program is free software; you can distribute it and/or modify it
 *  under the terms of the GNU General Public License (Version 2) as
 *  published by the Free Software Foundation.
 *
 *  This program is distributed in the hope it will be useful, but WITHOUT
 *  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 *  FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 *  for more details.
 *
 *  You should have received a copy of the GNU General Public License along
 *  with this program; if not, write to the Free Software Foundation, Inc.,
 *  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA.
 */
211da177e4SLinus Torvalds 
221da177e4SLinus Torvalds #include "ieee754sp.h"
231da177e4SLinus Torvalds 
242209bcb1SRalf Baechle union ieee754sp ieee754sp_sqrt(union ieee754sp x)
251da177e4SLinus Torvalds {
261da177e4SLinus Torvalds 	int ix, s, q, m, t, i;
271da177e4SLinus Torvalds 	unsigned int r;
281da177e4SLinus Torvalds 	COMPXSP;
291da177e4SLinus Torvalds 
301da177e4SLinus Torvalds 	/* take care of Inf and NaN */
311da177e4SLinus Torvalds 
321da177e4SLinus Torvalds 	EXPLODEXSP;
339e8bad1fSRalf Baechle 	ieee754_clearcx();
341da177e4SLinus Torvalds 	FLUSHXSP;
351da177e4SLinus Torvalds 
361da177e4SLinus Torvalds 	/* x == INF or NAN? */
371da177e4SLinus Torvalds 	switch (xc) {
381da177e4SLinus Torvalds 	case IEEE754_CLASS_QNAN:
391da177e4SLinus Torvalds 		/* sqrt(Nan) = Nan */
4090efba36SRalf Baechle 		return ieee754sp_nanxcpt(x);
413f7cac41SRalf Baechle 
421da177e4SLinus Torvalds 	case IEEE754_CLASS_SNAN:
439e8bad1fSRalf Baechle 		ieee754_setcx(IEEE754_INVALID_OPERATION);
4490efba36SRalf Baechle 		return ieee754sp_nanxcpt(ieee754sp_indef());
453f7cac41SRalf Baechle 
461da177e4SLinus Torvalds 	case IEEE754_CLASS_ZERO:
471da177e4SLinus Torvalds 		/* sqrt(0) = 0 */
481da177e4SLinus Torvalds 		return x;
493f7cac41SRalf Baechle 
501da177e4SLinus Torvalds 	case IEEE754_CLASS_INF:
511da177e4SLinus Torvalds 		if (xs) {
521da177e4SLinus Torvalds 			/* sqrt(-Inf) = Nan */
539e8bad1fSRalf Baechle 			ieee754_setcx(IEEE754_INVALID_OPERATION);
5490efba36SRalf Baechle 			return ieee754sp_nanxcpt(ieee754sp_indef());
551da177e4SLinus Torvalds 		}
561da177e4SLinus Torvalds 		/* sqrt(+Inf) = Inf */
571da177e4SLinus Torvalds 		return x;
583f7cac41SRalf Baechle 
591da177e4SLinus Torvalds 	case IEEE754_CLASS_DNORM:
601da177e4SLinus Torvalds 	case IEEE754_CLASS_NORM:
611da177e4SLinus Torvalds 		if (xs) {
621da177e4SLinus Torvalds 			/* sqrt(-x) = Nan */
639e8bad1fSRalf Baechle 			ieee754_setcx(IEEE754_INVALID_OPERATION);
6490efba36SRalf Baechle 			return ieee754sp_nanxcpt(ieee754sp_indef());
651da177e4SLinus Torvalds 		}
661da177e4SLinus Torvalds 		break;
671da177e4SLinus Torvalds 	}
681da177e4SLinus Torvalds 
691da177e4SLinus Torvalds 	ix = x.bits;
701da177e4SLinus Torvalds 
711da177e4SLinus Torvalds 	/* normalize x */
721da177e4SLinus Torvalds 	m = (ix >> 23);
731da177e4SLinus Torvalds 	if (m == 0) {		/* subnormal x */
741da177e4SLinus Torvalds 		for (i = 0; (ix & 0x00800000) == 0; i++)
751da177e4SLinus Torvalds 			ix <<= 1;
761da177e4SLinus Torvalds 		m -= i - 1;
771da177e4SLinus Torvalds 	}
781da177e4SLinus Torvalds 	m -= 127;		/* unbias exponent */
791da177e4SLinus Torvalds 	ix = (ix & 0x007fffff) | 0x00800000;
801da177e4SLinus Torvalds 	if (m & 1)		/* odd m, double x to make it even */
811da177e4SLinus Torvalds 		ix += ix;
821da177e4SLinus Torvalds 	m >>= 1;		/* m = [m/2] */
831da177e4SLinus Torvalds 
841da177e4SLinus Torvalds 	/* generate sqrt(x) bit by bit */
851da177e4SLinus Torvalds 	ix += ix;
861da177e4SLinus Torvalds 	q = s = 0;		/* q = sqrt(x) */
871da177e4SLinus Torvalds 	r = 0x01000000;		/* r = moving bit from right to left */
881da177e4SLinus Torvalds 
891da177e4SLinus Torvalds 	while (r != 0) {
901da177e4SLinus Torvalds 		t = s + r;
911da177e4SLinus Torvalds 		if (t <= ix) {
921da177e4SLinus Torvalds 			s = t + r;
931da177e4SLinus Torvalds 			ix -= t;
941da177e4SLinus Torvalds 			q += r;
951da177e4SLinus Torvalds 		}
961da177e4SLinus Torvalds 		ix += ix;
971da177e4SLinus Torvalds 		r >>= 1;
981da177e4SLinus Torvalds 	}
991da177e4SLinus Torvalds 
1001da177e4SLinus Torvalds 	if (ix != 0) {
1019e8bad1fSRalf Baechle 		ieee754_setcx(IEEE754_INEXACT);
1021da177e4SLinus Torvalds 		switch (ieee754_csr.rm) {
10356a64733SRalf Baechle 		case FPU_CSR_RU:
1041da177e4SLinus Torvalds 			q += 2;
1051da177e4SLinus Torvalds 			break;
10656a64733SRalf Baechle 		case FPU_CSR_RN:
1071da177e4SLinus Torvalds 			q += (q & 1);
1081da177e4SLinus Torvalds 			break;
1091da177e4SLinus Torvalds 		}
1101da177e4SLinus Torvalds 	}
1111da177e4SLinus Torvalds 	ix = (q >> 1) + 0x3f000000;
1121da177e4SLinus Torvalds 	ix += (m << 23);
1131da177e4SLinus Torvalds 	x.bits = ix;
1141da177e4SLinus Torvalds 	return x;
1151da177e4SLinus Torvalds }
116