// SPDX-License-Identifier: GPL-2.0-only
/* IEEE754 floating point arithmetic
 * single precision
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 */

#include "ieee754sp.h"

ieee754sp_add(union ieee754sp x,union ieee754sp y)122209bcb1SRalf Baechle union ieee754sp ieee754sp_add(union ieee754sp x, union ieee754sp y)
131da177e4SLinus Torvalds {
143f7cac41SRalf Baechle int s;
153f7cac41SRalf Baechle
161da177e4SLinus Torvalds COMPXSP;
171da177e4SLinus Torvalds COMPYSP;
181da177e4SLinus Torvalds
191da177e4SLinus Torvalds EXPLODEXSP;
201da177e4SLinus Torvalds EXPLODEYSP;
211da177e4SLinus Torvalds
229e8bad1fSRalf Baechle ieee754_clearcx();
231da177e4SLinus Torvalds
241da177e4SLinus Torvalds FLUSHXSP;
251da177e4SLinus Torvalds FLUSHYSP;
261da177e4SLinus Torvalds
271da177e4SLinus Torvalds switch (CLPAIR(xc, yc)) {
281da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
291da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
301da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
311da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
321da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
33d5afa7e9SMaciej W. Rozycki return ieee754sp_nanxcpt(y);
34d5afa7e9SMaciej W. Rozycki
35d5afa7e9SMaciej W. Rozycki case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
36d5afa7e9SMaciej W. Rozycki case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
371da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
381da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
391da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
401da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
41d5afa7e9SMaciej W. Rozycki return ieee754sp_nanxcpt(x);
421da177e4SLinus Torvalds
431da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
441da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
451da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
461da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
471da177e4SLinus Torvalds return y;
481da177e4SLinus Torvalds
491da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
501da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
511da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
521da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
531da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
541da177e4SLinus Torvalds return x;
551da177e4SLinus Torvalds
561da177e4SLinus Torvalds
573f7cac41SRalf Baechle /*
583f7cac41SRalf Baechle * Infinity handling
591da177e4SLinus Torvalds */
601da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
611da177e4SLinus Torvalds if (xs == ys)
621da177e4SLinus Torvalds return x;
639e8bad1fSRalf Baechle ieee754_setcx(IEEE754_INVALID_OPERATION);
6490efba36SRalf Baechle return ieee754sp_indef();
651da177e4SLinus Torvalds
661da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
671da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
681da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
691da177e4SLinus Torvalds return y;
701da177e4SLinus Torvalds
711da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
721da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
731da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
741da177e4SLinus Torvalds return x;
751da177e4SLinus Torvalds
763f7cac41SRalf Baechle /*
773f7cac41SRalf Baechle * Zero handling
781da177e4SLinus Torvalds */
791da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
801da177e4SLinus Torvalds if (xs == ys)
811da177e4SLinus Torvalds return x;
821da177e4SLinus Torvalds else
8356a64733SRalf Baechle return ieee754sp_zero(ieee754_csr.rm == FPU_CSR_RD);
841da177e4SLinus Torvalds
851da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
861da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
871da177e4SLinus Torvalds return x;
881da177e4SLinus Torvalds
891da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
901da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
911da177e4SLinus Torvalds return y;
921da177e4SLinus Torvalds
931da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
941da177e4SLinus Torvalds SPDNORMX;
95*c9b02990SLiangliang Huang fallthrough;
961da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
971da177e4SLinus Torvalds SPDNORMY;
981da177e4SLinus Torvalds break;
991da177e4SLinus Torvalds
1001da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
1011da177e4SLinus Torvalds SPDNORMX;
1021da177e4SLinus Torvalds break;
1031da177e4SLinus Torvalds
1041da177e4SLinus Torvalds case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
1051da177e4SLinus Torvalds break;
1061da177e4SLinus Torvalds }
1071da177e4SLinus Torvalds assert(xm & SP_HIDDEN_BIT);
1081da177e4SLinus Torvalds assert(ym & SP_HIDDEN_BIT);
1091da177e4SLinus Torvalds
1103f7cac41SRalf Baechle /*
1113f7cac41SRalf Baechle * Provide guard, round and stick bit space.
1123f7cac41SRalf Baechle */
1131da177e4SLinus Torvalds xm <<= 3;
1141da177e4SLinus Torvalds ym <<= 3;
1151da177e4SLinus Torvalds
1161da177e4SLinus Torvalds if (xe > ye) {
1173f7cac41SRalf Baechle /*
1183f7cac41SRalf Baechle * Have to shift y fraction right to align.
1191da177e4SLinus Torvalds */
1203f7cac41SRalf Baechle s = xe - ye;
121db57f29dSPaul Burton ym = XSPSRS(ym, s);
122db57f29dSPaul Burton ye += s;
1231da177e4SLinus Torvalds } else if (ye > xe) {
1243f7cac41SRalf Baechle /*
1253f7cac41SRalf Baechle * Have to shift x fraction right to align.
1261da177e4SLinus Torvalds */
1273f7cac41SRalf Baechle s = ye - xe;
128db57f29dSPaul Burton xm = XSPSRS(xm, s);
129db57f29dSPaul Burton xe += s;
1301da177e4SLinus Torvalds }
1311da177e4SLinus Torvalds assert(xe == ye);
1321da177e4SLinus Torvalds assert(xe <= SP_EMAX);
1331da177e4SLinus Torvalds
1341da177e4SLinus Torvalds if (xs == ys) {
1353f7cac41SRalf Baechle /*
1363f7cac41SRalf Baechle * Generate 28 bit result of adding two 27 bit numbers
1373f7cac41SRalf Baechle * leaving result in xm, xs and xe.
1381da177e4SLinus Torvalds */
1391da177e4SLinus Torvalds xm = xm + ym;
1401da177e4SLinus Torvalds
141ad8fb553SRalf Baechle if (xm >> (SP_FBITS + 1 + 3)) { /* carry out */
1421da177e4SLinus Torvalds SPXSRSX1();
1431da177e4SLinus Torvalds }
1441da177e4SLinus Torvalds } else {
1451da177e4SLinus Torvalds if (xm >= ym) {
1461da177e4SLinus Torvalds xm = xm - ym;
1471da177e4SLinus Torvalds } else {
1481da177e4SLinus Torvalds xm = ym - xm;
1491da177e4SLinus Torvalds xs = ys;
1501da177e4SLinus Torvalds }
1511da177e4SLinus Torvalds if (xm == 0)
15256a64733SRalf Baechle return ieee754sp_zero(ieee754_csr.rm == FPU_CSR_RD);
1531da177e4SLinus Torvalds
1543f7cac41SRalf Baechle /*
1553f7cac41SRalf Baechle * Normalize in extended single precision
1563f7cac41SRalf Baechle */
157ad8fb553SRalf Baechle while ((xm >> (SP_FBITS + 3)) == 0) {
1581da177e4SLinus Torvalds xm <<= 1;
1591da177e4SLinus Torvalds xe--;
1601da177e4SLinus Torvalds }
1611da177e4SLinus Torvalds }
16290efba36SRalf Baechle
16390efba36SRalf Baechle return ieee754sp_format(xs, xe, xm);
1641da177e4SLinus Torvalds }
165