// SPDX-License-Identifier: GPL-2.0-only
/* IEEE754 floating point arithmetic
 * single precision
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 */

#include "ieee754sp.h"

ieee754sp_sub(union ieee754sp x,union ieee754sp y)122209bcb1SRalf Baechle union ieee754sp ieee754sp_sub(union ieee754sp x, union ieee754sp y)
131da177e4SLinus Torvalds {
143f7cac41SRalf Baechle int s;
153f7cac41SRalf Baechle
161da177e4SLinus Torvalds COMPXSP;
171da177e4SLinus Torvalds COMPYSP;
181da177e4SLinus Torvalds
191da177e4SLinus Torvalds EXPLODEXSP;
201da177e4SLinus Torvalds EXPLODEYSP;
211da177e4SLinus Torvalds
229e8bad1fSRalf Baechle ieee754_clearcx();
231da177e4SLinus Torvalds
241da177e4SLinus Torvalds FLUSHXSP;
251da177e4SLinus Torvalds FLUSHYSP;
261da177e4SLinus Torvalds
271da177e4SLinus Torvalds switch (CLPAIR(xc, yc)) {
281da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
291da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
301da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
311da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
321da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
33d5afa7e9SMaciej W. Rozycki return ieee754sp_nanxcpt(y);
34d5afa7e9SMaciej W. Rozycki
35d5afa7e9SMaciej W. Rozycki case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
36d5afa7e9SMaciej W. Rozycki case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
371da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
381da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
391da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
401da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
41d5afa7e9SMaciej W. Rozycki return ieee754sp_nanxcpt(x);
421da177e4SLinus Torvalds
431da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
441da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
451da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
461da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
471da177e4SLinus Torvalds return y;
481da177e4SLinus Torvalds
491da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
501da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
511da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
521da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
531da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
541da177e4SLinus Torvalds return x;
551da177e4SLinus Torvalds
561da177e4SLinus Torvalds
573f7cac41SRalf Baechle /*
583f7cac41SRalf Baechle * Infinity handling
591da177e4SLinus Torvalds */
601da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
611da177e4SLinus Torvalds if (xs != ys)
621da177e4SLinus Torvalds return x;
639e8bad1fSRalf Baechle ieee754_setcx(IEEE754_INVALID_OPERATION);
6490efba36SRalf Baechle return ieee754sp_indef();
651da177e4SLinus Torvalds
661da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
671da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
681da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
691da177e4SLinus Torvalds return ieee754sp_inf(ys ^ 1);
701da177e4SLinus Torvalds
711da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
721da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
731da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
741da177e4SLinus Torvalds return x;
751da177e4SLinus Torvalds
763f7cac41SRalf Baechle /*
773f7cac41SRalf Baechle * Zero handling
781da177e4SLinus Torvalds */
791da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
801da177e4SLinus Torvalds if (xs != ys)
811da177e4SLinus Torvalds return x;
821da177e4SLinus Torvalds else
8356a64733SRalf Baechle return ieee754sp_zero(ieee754_csr.rm == FPU_CSR_RD);
841da177e4SLinus Torvalds
851da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
861da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
871da177e4SLinus Torvalds return x;
881da177e4SLinus Torvalds
891da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
901da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
911da177e4SLinus Torvalds /* quick fix up */
923e160aadSRalf Baechle SPSIGN(y) ^= 1;
931da177e4SLinus Torvalds return y;
941da177e4SLinus Torvalds
951da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
961da177e4SLinus Torvalds SPDNORMX;
97*c9b02990SLiangliang Huang fallthrough;
981da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
991da177e4SLinus Torvalds SPDNORMY;
1001da177e4SLinus Torvalds break;
1011da177e4SLinus Torvalds
1021da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
1031da177e4SLinus Torvalds SPDNORMX;
1041da177e4SLinus Torvalds break;
1051da177e4SLinus Torvalds
1061da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
1071da177e4SLinus Torvalds break;
1081da177e4SLinus Torvalds }
1091da177e4SLinus Torvalds /* flip sign of y and handle as add */
1101da177e4SLinus Torvalds ys ^= 1;
1111da177e4SLinus Torvalds
1121da177e4SLinus Torvalds assert(xm & SP_HIDDEN_BIT);
1131da177e4SLinus Torvalds assert(ym & SP_HIDDEN_BIT);
1141da177e4SLinus Torvalds
1151da177e4SLinus Torvalds
1161da177e4SLinus Torvalds /* provide guard,round and stick bit space */
1171da177e4SLinus Torvalds xm <<= 3;
1181da177e4SLinus Torvalds ym <<= 3;
1191da177e4SLinus Torvalds
1201da177e4SLinus Torvalds if (xe > ye) {
1213f7cac41SRalf Baechle /*
1223f7cac41SRalf Baechle * have to shift y fraction right to align
1231da177e4SLinus Torvalds */
1243f7cac41SRalf Baechle s = xe - ye;
125db57f29dSPaul Burton ym = XSPSRS(ym, s);
126db57f29dSPaul Burton ye += s;
1271da177e4SLinus Torvalds } else if (ye > xe) {
1283f7cac41SRalf Baechle /*
1293f7cac41SRalf Baechle * have to shift x fraction right to align
1301da177e4SLinus Torvalds */
1313f7cac41SRalf Baechle s = ye - xe;
132db57f29dSPaul Burton xm = XSPSRS(xm, s);
133db57f29dSPaul Burton xe += s;
1341da177e4SLinus Torvalds }
1351da177e4SLinus Torvalds assert(xe == ye);
1361da177e4SLinus Torvalds assert(xe <= SP_EMAX);
1371da177e4SLinus Torvalds
1381da177e4SLinus Torvalds if (xs == ys) {
1391da177e4SLinus Torvalds /* generate 28 bit result of adding two 27 bit numbers
1401da177e4SLinus Torvalds */
1411da177e4SLinus Torvalds xm = xm + ym;
1421da177e4SLinus Torvalds
143ad8fb553SRalf Baechle if (xm >> (SP_FBITS + 1 + 3)) { /* carry out */
1441da177e4SLinus Torvalds SPXSRSX1(); /* shift preserving sticky */
1451da177e4SLinus Torvalds }
1461da177e4SLinus Torvalds } else {
1471da177e4SLinus Torvalds if (xm >= ym) {
1481da177e4SLinus Torvalds xm = xm - ym;
1491da177e4SLinus Torvalds } else {
1501da177e4SLinus Torvalds xm = ym - xm;
1511da177e4SLinus Torvalds xs = ys;
1521da177e4SLinus Torvalds }
1531da177e4SLinus Torvalds if (xm == 0) {
15456a64733SRalf Baechle if (ieee754_csr.rm == FPU_CSR_RD)
1551da177e4SLinus Torvalds return ieee754sp_zero(1); /* round negative inf. => sign = -1 */
1561da177e4SLinus Torvalds else
1571da177e4SLinus Torvalds return ieee754sp_zero(0); /* other round modes => sign = 1 */
1581da177e4SLinus Torvalds }
1591da177e4SLinus Torvalds /* normalize to rounding precision
1601da177e4SLinus Torvalds */
161ad8fb553SRalf Baechle while ((xm >> (SP_FBITS + 3)) == 0) {
1621da177e4SLinus Torvalds xm <<= 1;
1631da177e4SLinus Torvalds xe--;
1641da177e4SLinus Torvalds }
1651da177e4SLinus Torvalds }
16690efba36SRalf Baechle
16790efba36SRalf Baechle return ieee754sp_format(xs, xe, xm);
1681da177e4SLinus Torvalds }
169