xref: /linux/arch/mips/math-emu/dp_add.c (revision c9b02990)
// SPDX-License-Identifier: GPL-2.0-only
/* IEEE754 floating point arithmetic
 * double precision: common utilities
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 */
91da177e4SLinus Torvalds 
101da177e4SLinus Torvalds #include "ieee754dp.h"
111da177e4SLinus Torvalds 
ieee754dp_add(union ieee754dp x,union ieee754dp y)122209bcb1SRalf Baechle union ieee754dp ieee754dp_add(union ieee754dp x, union ieee754dp y)
131da177e4SLinus Torvalds {
143f7cac41SRalf Baechle 	int s;
153f7cac41SRalf Baechle 
161da177e4SLinus Torvalds 	COMPXDP;
171da177e4SLinus Torvalds 	COMPYDP;
181da177e4SLinus Torvalds 
191da177e4SLinus Torvalds 	EXPLODEXDP;
201da177e4SLinus Torvalds 	EXPLODEYDP;
211da177e4SLinus Torvalds 
229e8bad1fSRalf Baechle 	ieee754_clearcx();
231da177e4SLinus Torvalds 
241da177e4SLinus Torvalds 	FLUSHXDP;
251da177e4SLinus Torvalds 	FLUSHYDP;
261da177e4SLinus Torvalds 
271da177e4SLinus Torvalds 	switch (CLPAIR(xc, yc)) {
281da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
291da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
301da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
311da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
321da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
33d5afa7e9SMaciej W. Rozycki 		return ieee754dp_nanxcpt(y);
34d5afa7e9SMaciej W. Rozycki 
35d5afa7e9SMaciej W. Rozycki 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
36d5afa7e9SMaciej W. Rozycki 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
371da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
381da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
391da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
401da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
41d5afa7e9SMaciej W. Rozycki 		return ieee754dp_nanxcpt(x);
421da177e4SLinus Torvalds 
431da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
441da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
451da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
461da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
471da177e4SLinus Torvalds 		return y;
481da177e4SLinus Torvalds 
491da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
501da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
511da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
521da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
531da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
541da177e4SLinus Torvalds 		return x;
551da177e4SLinus Torvalds 
561da177e4SLinus Torvalds 
573f7cac41SRalf Baechle 	/*
583f7cac41SRalf Baechle 	 * Infinity handling
591da177e4SLinus Torvalds 	 */
601da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
611da177e4SLinus Torvalds 		if (xs == ys)
621da177e4SLinus Torvalds 			return x;
639e8bad1fSRalf Baechle 		ieee754_setcx(IEEE754_INVALID_OPERATION);
6490efba36SRalf Baechle 		return ieee754dp_indef();
651da177e4SLinus Torvalds 
661da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
671da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
681da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
691da177e4SLinus Torvalds 		return y;
701da177e4SLinus Torvalds 
711da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
721da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
731da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
741da177e4SLinus Torvalds 		return x;
751da177e4SLinus Torvalds 
763f7cac41SRalf Baechle 	/*
773f7cac41SRalf Baechle 	 * Zero handling
781da177e4SLinus Torvalds 	 */
791da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
801da177e4SLinus Torvalds 		if (xs == ys)
811da177e4SLinus Torvalds 			return x;
821da177e4SLinus Torvalds 		else
8356a64733SRalf Baechle 			return ieee754dp_zero(ieee754_csr.rm == FPU_CSR_RD);
841da177e4SLinus Torvalds 
851da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
861da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
871da177e4SLinus Torvalds 		return x;
881da177e4SLinus Torvalds 
891da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
901da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
911da177e4SLinus Torvalds 		return y;
921da177e4SLinus Torvalds 
931da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
941da177e4SLinus Torvalds 		DPDNORMX;
95*c9b02990SLiangliang Huang 		fallthrough;
961da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
971da177e4SLinus Torvalds 		DPDNORMY;
981da177e4SLinus Torvalds 		break;
991da177e4SLinus Torvalds 
1001da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
1011da177e4SLinus Torvalds 		DPDNORMX;
1021da177e4SLinus Torvalds 		break;
1031da177e4SLinus Torvalds 
1041da177e4SLinus Torvalds 	case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
1051da177e4SLinus Torvalds 		break;
1061da177e4SLinus Torvalds 	}
1071da177e4SLinus Torvalds 	assert(xm & DP_HIDDEN_BIT);
1081da177e4SLinus Torvalds 	assert(ym & DP_HIDDEN_BIT);
1091da177e4SLinus Torvalds 
1103f7cac41SRalf Baechle 	/*
1113f7cac41SRalf Baechle 	 * Provide guard,round and stick bit space.
1123f7cac41SRalf Baechle 	 */
1131da177e4SLinus Torvalds 	xm <<= 3;
1141da177e4SLinus Torvalds 	ym <<= 3;
1151da177e4SLinus Torvalds 
1161da177e4SLinus Torvalds 	if (xe > ye) {
1173f7cac41SRalf Baechle 		/*
1183f7cac41SRalf Baechle 		 * Have to shift y fraction right to align.
1191da177e4SLinus Torvalds 		 */
1203f7cac41SRalf Baechle 		s = xe - ye;
1211da177e4SLinus Torvalds 		ym = XDPSRS(ym, s);
1221da177e4SLinus Torvalds 		ye += s;
1231da177e4SLinus Torvalds 	} else if (ye > xe) {
1243f7cac41SRalf Baechle 		/*
1253f7cac41SRalf Baechle 		 * Have to shift x fraction right to align.
1261da177e4SLinus Torvalds 		 */
1273f7cac41SRalf Baechle 		s = ye - xe;
1281da177e4SLinus Torvalds 		xm = XDPSRS(xm, s);
1291da177e4SLinus Torvalds 		xe += s;
1301da177e4SLinus Torvalds 	}
1311da177e4SLinus Torvalds 	assert(xe == ye);
1321da177e4SLinus Torvalds 	assert(xe <= DP_EMAX);
1331da177e4SLinus Torvalds 
1341da177e4SLinus Torvalds 	if (xs == ys) {
1353f7cac41SRalf Baechle 		/*
1363f7cac41SRalf Baechle 		 * Generate 28 bit result of adding two 27 bit numbers
1373f7cac41SRalf Baechle 		 * leaving result in xm, xs and xe.
1381da177e4SLinus Torvalds 		 */
1391da177e4SLinus Torvalds 		xm = xm + ym;
1401da177e4SLinus Torvalds 
141ad8fb553SRalf Baechle 		if (xm >> (DP_FBITS + 1 + 3)) { /* carry out */
1421da177e4SLinus Torvalds 			xm = XDPSRS1(xm);
1431da177e4SLinus Torvalds 			xe++;
1441da177e4SLinus Torvalds 		}
1451da177e4SLinus Torvalds 	} else {
1461da177e4SLinus Torvalds 		if (xm >= ym) {
1471da177e4SLinus Torvalds 			xm = xm - ym;
1481da177e4SLinus Torvalds 		} else {
1491da177e4SLinus Torvalds 			xm = ym - xm;
1501da177e4SLinus Torvalds 			xs = ys;
1511da177e4SLinus Torvalds 		}
1521da177e4SLinus Torvalds 		if (xm == 0)
15356a64733SRalf Baechle 			return ieee754dp_zero(ieee754_csr.rm == FPU_CSR_RD);
1541da177e4SLinus Torvalds 
1553f7cac41SRalf Baechle 		/*
1563f7cac41SRalf Baechle 		 * Normalize to rounding precision.
1573f7cac41SRalf Baechle 		 */
158ad8fb553SRalf Baechle 		while ((xm >> (DP_FBITS + 3)) == 0) {
1591da177e4SLinus Torvalds 			xm <<= 1;
1601da177e4SLinus Torvalds 			xe--;
1611da177e4SLinus Torvalds 		}
1621da177e4SLinus Torvalds 	}
16390efba36SRalf Baechle 
16490efba36SRalf Baechle 	return ieee754dp_format(xs, xe, xm);
1651da177e4SLinus Torvalds }
166