xref: /openbmc/linux/arch/mips/math-emu/sp_sub.c (revision 4b4193256c8d3bc3a5397b5cd9494c2ad386317d)
// SPDX-License-Identifier: GPL-2.0-only
/* IEEE754 floating point arithmetic
 * single precision
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 */
91da177e4SLinus Torvalds 
101da177e4SLinus Torvalds #include "ieee754sp.h"
111da177e4SLinus Torvalds 
ieee754sp_sub(union ieee754sp x,union ieee754sp y)122209bcb1SRalf Baechle union ieee754sp ieee754sp_sub(union ieee754sp x, union ieee754sp y)
131da177e4SLinus Torvalds {
143f7cac41SRalf Baechle 	int s;
153f7cac41SRalf Baechle 
161da177e4SLinus Torvalds 	COMPXSP;
171da177e4SLinus Torvalds 	COMPYSP;
181da177e4SLinus Torvalds 
191da177e4SLinus Torvalds 	EXPLODEXSP;
201da177e4SLinus Torvalds 	EXPLODEYSP;
211da177e4SLinus Torvalds 
229e8bad1fSRalf Baechle 	ieee754_clearcx();
231da177e4SLinus Torvalds 
241da177e4SLinus Torvalds 	FLUSHXSP;
251da177e4SLinus Torvalds 	FLUSHYSP;
261da177e4SLinus Torvalds 
271da177e4SLinus Torvalds 	switch (CLPAIR(xc, yc)) {
281da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
291da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
301da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
311da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
321da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
33d5afa7e9SMaciej W. Rozycki 		return ieee754sp_nanxcpt(y);
34d5afa7e9SMaciej W. Rozycki 
35d5afa7e9SMaciej W. Rozycki 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
36d5afa7e9SMaciej W. Rozycki 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
371da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
381da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
391da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
401da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
41d5afa7e9SMaciej W. Rozycki 		return ieee754sp_nanxcpt(x);
421da177e4SLinus Torvalds 
431da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
441da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
451da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
461da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
471da177e4SLinus Torvalds 		return y;
481da177e4SLinus Torvalds 
491da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
501da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
511da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
521da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
531da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
541da177e4SLinus Torvalds 		return x;
551da177e4SLinus Torvalds 
561da177e4SLinus Torvalds 
573f7cac41SRalf Baechle 	/*
583f7cac41SRalf Baechle 	 * Infinity handling
591da177e4SLinus Torvalds 	 */
601da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
611da177e4SLinus Torvalds 		if (xs != ys)
621da177e4SLinus Torvalds 			return x;
639e8bad1fSRalf Baechle 		ieee754_setcx(IEEE754_INVALID_OPERATION);
6490efba36SRalf Baechle 		return ieee754sp_indef();
651da177e4SLinus Torvalds 
661da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
671da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
681da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
691da177e4SLinus Torvalds 		return ieee754sp_inf(ys ^ 1);
701da177e4SLinus Torvalds 
711da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
721da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
731da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
741da177e4SLinus Torvalds 		return x;
751da177e4SLinus Torvalds 
763f7cac41SRalf Baechle 	/*
773f7cac41SRalf Baechle 	 * Zero handling
781da177e4SLinus Torvalds 	 */
791da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
801da177e4SLinus Torvalds 		if (xs != ys)
811da177e4SLinus Torvalds 			return x;
821da177e4SLinus Torvalds 		else
8356a64733SRalf Baechle 			return ieee754sp_zero(ieee754_csr.rm == FPU_CSR_RD);
841da177e4SLinus Torvalds 
851da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
861da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
871da177e4SLinus Torvalds 		return x;
881da177e4SLinus Torvalds 
891da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
901da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
911da177e4SLinus Torvalds 		/* quick fix up */
923e160aadSRalf Baechle 		SPSIGN(y) ^= 1;
931da177e4SLinus Torvalds 		return y;
941da177e4SLinus Torvalds 
951da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
961da177e4SLinus Torvalds 		SPDNORMX;
97*c9b02990SLiangliang Huang 		fallthrough;
981da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
991da177e4SLinus Torvalds 		SPDNORMY;
1001da177e4SLinus Torvalds 		break;
1011da177e4SLinus Torvalds 
1021da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
1031da177e4SLinus Torvalds 		SPDNORMX;
1041da177e4SLinus Torvalds 		break;
1051da177e4SLinus Torvalds 
1061da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
1071da177e4SLinus Torvalds 		break;
1081da177e4SLinus Torvalds 	}
1091da177e4SLinus Torvalds 	/* flip sign of y and handle as add */
1101da177e4SLinus Torvalds 	ys ^= 1;
1111da177e4SLinus Torvalds 
1121da177e4SLinus Torvalds 	assert(xm & SP_HIDDEN_BIT);
1131da177e4SLinus Torvalds 	assert(ym & SP_HIDDEN_BIT);
1141da177e4SLinus Torvalds 
1151da177e4SLinus Torvalds 
1161da177e4SLinus Torvalds 	/* provide guard,round and stick bit space */
1171da177e4SLinus Torvalds 	xm <<= 3;
1181da177e4SLinus Torvalds 	ym <<= 3;
1191da177e4SLinus Torvalds 
1201da177e4SLinus Torvalds 	if (xe > ye) {
1213f7cac41SRalf Baechle 		/*
1223f7cac41SRalf Baechle 		 * have to shift y fraction right to align
1231da177e4SLinus Torvalds 		 */
1243f7cac41SRalf Baechle 		s = xe - ye;
125db57f29dSPaul Burton 		ym = XSPSRS(ym, s);
126db57f29dSPaul Burton 		ye += s;
1271da177e4SLinus Torvalds 	} else if (ye > xe) {
1283f7cac41SRalf Baechle 		/*
1293f7cac41SRalf Baechle 		 * have to shift x fraction right to align
1301da177e4SLinus Torvalds 		 */
1313f7cac41SRalf Baechle 		s = ye - xe;
132db57f29dSPaul Burton 		xm = XSPSRS(xm, s);
133db57f29dSPaul Burton 		xe += s;
1341da177e4SLinus Torvalds 	}
1351da177e4SLinus Torvalds 	assert(xe == ye);
1361da177e4SLinus Torvalds 	assert(xe <= SP_EMAX);
1371da177e4SLinus Torvalds 
1381da177e4SLinus Torvalds 	if (xs == ys) {
1391da177e4SLinus Torvalds 		/* generate 28 bit result of adding two 27 bit numbers
1401da177e4SLinus Torvalds 		 */
1411da177e4SLinus Torvalds 		xm = xm + ym;
1421da177e4SLinus Torvalds 
143ad8fb553SRalf Baechle 		if (xm >> (SP_FBITS + 1 + 3)) { /* carry out */
1441da177e4SLinus Torvalds 			SPXSRSX1();	/* shift preserving sticky */
1451da177e4SLinus Torvalds 		}
1461da177e4SLinus Torvalds 	} else {
1471da177e4SLinus Torvalds 		if (xm >= ym) {
1481da177e4SLinus Torvalds 			xm = xm - ym;
1491da177e4SLinus Torvalds 		} else {
1501da177e4SLinus Torvalds 			xm = ym - xm;
1511da177e4SLinus Torvalds 			xs = ys;
1521da177e4SLinus Torvalds 		}
1531da177e4SLinus Torvalds 		if (xm == 0) {
15456a64733SRalf Baechle 			if (ieee754_csr.rm == FPU_CSR_RD)
1551da177e4SLinus Torvalds 				return ieee754sp_zero(1);	/* round negative inf. => sign = -1 */
1561da177e4SLinus Torvalds 			else
1571da177e4SLinus Torvalds 				return ieee754sp_zero(0);	/* other round modes   => sign = 1 */
1581da177e4SLinus Torvalds 		}
1591da177e4SLinus Torvalds 		/* normalize to rounding precision
1601da177e4SLinus Torvalds 		 */
161ad8fb553SRalf Baechle 		while ((xm >> (SP_FBITS + 3)) == 0) {
1621da177e4SLinus Torvalds 			xm <<= 1;
1631da177e4SLinus Torvalds 			xe--;
1641da177e4SLinus Torvalds 		}
1651da177e4SLinus Torvalds 	}
16690efba36SRalf Baechle 
16790efba36SRalf Baechle 	return ieee754sp_format(xs, xe, xm);
1681da177e4SLinus Torvalds }
169