blob: 58b27959a6c460e03d7e4acdec4f1e7df56e6b31 [file] [log] [blame]
/* IEEE754 floating point arithmetic
 * double precision: common utilities
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 *
 * This program is free software; you can distribute it and/or modify it
 * under the terms of the GNU General Public License (Version 2) as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 */
21
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include "ieee754dp.h"
23
Ralf Baechle2209bcb2014-04-16 01:31:11 +020024union ieee754dp ieee754dp_add(union ieee754dp x, union ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -070025{
Ralf Baechle3f7cac42014-04-26 01:49:14 +020026 int s;
27
Linus Torvalds1da177e2005-04-16 15:20:36 -070028 COMPXDP;
29 COMPYDP;
30
31 EXPLODEXDP;
32 EXPLODEYDP;
33
Ralf Baechle9e8bad12014-04-19 00:36:32 +020034 ieee754_clearcx();
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
36 FLUSHXDP;
37 FLUSHYDP;
38
39 switch (CLPAIR(xc, yc)) {
40 case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_QNAN):
41 case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_SNAN):
42 case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_SNAN):
43 case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_SNAN):
44 case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_SNAN):
45 case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_SNAN):
46 case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_SNAN):
47 case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_ZERO):
48 case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_NORM):
49 case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_DNORM):
50 case CLPAIR(IEEE754_CLASS_SNAN, IEEE754_CLASS_INF):
Ralf Baechle9e8bad12014-04-19 00:36:32 +020051 ieee754_setcx(IEEE754_INVALID_OPERATION);
Ralf Baechle90efba32014-04-25 03:19:57 +020052 return ieee754dp_nanxcpt(ieee754dp_indef());
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
54 case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_QNAN):
55 case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_QNAN):
56 case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_QNAN):
57 case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_QNAN):
58 return y;
59
60 case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_QNAN):
61 case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_ZERO):
62 case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_NORM):
63 case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_DNORM):
64 case CLPAIR(IEEE754_CLASS_QNAN, IEEE754_CLASS_INF):
65 return x;
66
67
Ralf Baechle3f7cac42014-04-26 01:49:14 +020068 /*
69 * Infinity handling
70 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070071 case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_INF):
72 if (xs == ys)
73 return x;
Ralf Baechle9e8bad12014-04-19 00:36:32 +020074 ieee754_setcx(IEEE754_INVALID_OPERATION);
Ralf Baechle90efba32014-04-25 03:19:57 +020075 return ieee754dp_indef();
Linus Torvalds1da177e2005-04-16 15:20:36 -070076
77 case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_INF):
78 case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_INF):
79 case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_INF):
80 return y;
81
82 case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_ZERO):
83 case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_NORM):
84 case CLPAIR(IEEE754_CLASS_INF, IEEE754_CLASS_DNORM):
85 return x;
86
Ralf Baechle3f7cac42014-04-26 01:49:14 +020087 /*
88 * Zero handling
89 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070090 case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_ZERO):
91 if (xs == ys)
92 return x;
93 else
Ralf Baechle56a64732014-04-30 11:21:55 +020094 return ieee754dp_zero(ieee754_csr.rm == FPU_CSR_RD);
Linus Torvalds1da177e2005-04-16 15:20:36 -070095
96 case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_ZERO):
97 case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_ZERO):
98 return x;
99
100 case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_NORM):
101 case CLPAIR(IEEE754_CLASS_ZERO, IEEE754_CLASS_DNORM):
102 return y;
103
104 case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_DNORM):
105 DPDNORMX;
106
107 /* FALL THROUGH */
108
109 case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_DNORM):
110 DPDNORMY;
111 break;
112
113 case CLPAIR(IEEE754_CLASS_DNORM, IEEE754_CLASS_NORM):
114 DPDNORMX;
115 break;
116
117 case CLPAIR(IEEE754_CLASS_NORM, IEEE754_CLASS_NORM):
118 break;
119 }
120 assert(xm & DP_HIDDEN_BIT);
121 assert(ym & DP_HIDDEN_BIT);
122
Ralf Baechle3f7cac42014-04-26 01:49:14 +0200123 /*
124 * Provide guard,round and stick bit space.
125 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126 xm <<= 3;
127 ym <<= 3;
128
129 if (xe > ye) {
Ralf Baechle3f7cac42014-04-26 01:49:14 +0200130 /*
131 * Have to shift y fraction right to align.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132 */
Ralf Baechle3f7cac42014-04-26 01:49:14 +0200133 s = xe - ye;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134 ym = XDPSRS(ym, s);
135 ye += s;
136 } else if (ye > xe) {
Ralf Baechle3f7cac42014-04-26 01:49:14 +0200137 /*
138 * Have to shift x fraction right to align.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 */
Ralf Baechle3f7cac42014-04-26 01:49:14 +0200140 s = ye - xe;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700141 xm = XDPSRS(xm, s);
142 xe += s;
143 }
144 assert(xe == ye);
145 assert(xe <= DP_EMAX);
146
147 if (xs == ys) {
Ralf Baechle3f7cac42014-04-26 01:49:14 +0200148 /*
149 * Generate 28 bit result of adding two 27 bit numbers
150 * leaving result in xm, xs and xe.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 */
152 xm = xm + ym;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153
Ralf Baechlead8fb552014-04-22 15:51:55 +0200154 if (xm >> (DP_FBITS + 1 + 3)) { /* carry out */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 xm = XDPSRS1(xm);
156 xe++;
157 }
158 } else {
159 if (xm >= ym) {
160 xm = xm - ym;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161 } else {
162 xm = ym - xm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163 xs = ys;
164 }
165 if (xm == 0)
Ralf Baechle56a64732014-04-30 11:21:55 +0200166 return ieee754dp_zero(ieee754_csr.rm == FPU_CSR_RD);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167
Ralf Baechle3f7cac42014-04-26 01:49:14 +0200168 /*
169 * Normalize to rounding precision.
170 */
Ralf Baechlead8fb552014-04-22 15:51:55 +0200171 while ((xm >> (DP_FBITS + 3)) == 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 xm <<= 1;
173 xe--;
174 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175 }
Ralf Baechle90efba32014-04-25 03:19:57 +0200176
177 return ieee754dp_format(xs, xe, xm);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178}