blob: 465a0342ed4c8ca8028420299ae374952870c63f [file] [log] [blame]
/* IEEE754 floating point arithmetic
 * double precision: common utilities
 */
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 *
 * This program is free software; you can distribute it and/or modify it
 * under the terms of the GNU General Public License (Version 2) as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 */
21
Ralf Baechlecae55062014-04-16 00:47:59 +020022#include <linux/compiler.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023
24#include "ieee754dp.h"
25
Ralf Baechle2209bcb2014-04-16 01:31:11 +020026int ieee754dp_class(union ieee754dp x)
Linus Torvalds1da177e2005-04-16 15:20:36 -070027{
28 COMPXDP;
29 EXPLODEXDP;
30 return xc;
31}
32
Maciej W. Rozyckie06b5302015-04-03 23:25:57 +010033static inline int ieee754dp_isnan(union ieee754dp x)
Linus Torvalds1da177e2005-04-16 15:20:36 -070034{
Maciej W. Rozyckic9a10842015-04-03 23:25:38 +010035 return ieee754_class_nan(ieee754dp_class(x));
Linus Torvalds1da177e2005-04-16 15:20:36 -070036}
37
Ralf Baechlef71baa12014-04-25 00:40:42 +020038static inline int ieee754dp_issnan(union ieee754dp x)
Linus Torvalds1da177e2005-04-16 15:20:36 -070039{
Maciej W. Rozycki90d53a92015-11-13 00:47:28 +000040 int qbit;
41
Linus Torvalds1da177e2005-04-16 15:20:36 -070042 assert(ieee754dp_isnan(x));
Maciej W. Rozycki90d53a92015-11-13 00:47:28 +000043 qbit = (DPMANT(x) & DP_MBIT(DP_FBITS - 1)) == DP_MBIT(DP_FBITS - 1);
44 return ieee754_csr.nan2008 ^ qbit;
Linus Torvalds1da177e2005-04-16 15:20:36 -070045}
46
47
Maciej W. Rozyckid5afa7e2015-04-03 23:25:34 +010048/*
49 * Raise the Invalid Operation IEEE 754 exception
50 * and convert the signaling NaN supplied to a quiet NaN.
51 */
Ralf Baechle90efba32014-04-25 03:19:57 +020052union ieee754dp __cold ieee754dp_nanxcpt(union ieee754dp r)
Linus Torvalds1da177e2005-04-16 15:20:36 -070053{
Maciej W. Rozyckid5afa7e2015-04-03 23:25:34 +010054 assert(ieee754dp_issnan(r));
Linus Torvalds1da177e2005-04-16 15:20:36 -070055
Maciej W. Rozyckid5afa7e2015-04-03 23:25:34 +010056 ieee754_setcx(IEEE754_INVALID_OPERATION);
Maciej W. Rozyckiacd9e202015-11-13 00:48:48 +000057 if (ieee754_csr.nan2008) {
Maciej W. Rozycki90d53a92015-11-13 00:47:28 +000058 DPMANT(r) |= DP_MBIT(DP_FBITS - 1);
Maciej W. Rozyckiacd9e202015-11-13 00:48:48 +000059 } else {
60 DPMANT(r) &= ~DP_MBIT(DP_FBITS - 1);
61 if (!ieee754dp_isnan(r))
62 DPMANT(r) |= DP_MBIT(DP_FBITS - 2);
63 }
Maciej W. Rozycki90d53a92015-11-13 00:47:28 +000064
65 return r;
Linus Torvalds1da177e2005-04-16 15:20:36 -070066}
67
Ralf Baechlede2fc342014-04-25 10:54:06 +020068static u64 ieee754dp_get_rounding(int sn, u64 xm)
Linus Torvalds1da177e2005-04-16 15:20:36 -070069{
70 /* inexact must round of 3 bits
71 */
72 if (xm & (DP_MBIT(3) - 1)) {
73 switch (ieee754_csr.rm) {
Ralf Baechle56a64732014-04-30 11:21:55 +020074 case FPU_CSR_RZ:
Linus Torvalds1da177e2005-04-16 15:20:36 -070075 break;
Ralf Baechle56a64732014-04-30 11:21:55 +020076 case FPU_CSR_RN:
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 xm += 0x3 + ((xm >> 3) & 1);
78 /* xm += (xm&0x8)?0x4:0x3 */
79 break;
Ralf Baechle56a64732014-04-30 11:21:55 +020080 case FPU_CSR_RU: /* toward +Infinity */
Linus Torvalds1da177e2005-04-16 15:20:36 -070081 if (!sn) /* ?? */
82 xm += 0x8;
83 break;
Ralf Baechle56a64732014-04-30 11:21:55 +020084 case FPU_CSR_RD: /* toward -Infinity */
Ralf Baechle70342282013-01-22 12:59:30 +010085 if (sn) /* ?? */
Linus Torvalds1da177e2005-04-16 15:20:36 -070086 xm += 0x8;
87 break;
88 }
89 }
90 return xm;
91}
92
93
94/* generate a normal/denormal number with over,under handling
95 * sn is sign
96 * xe is an unbiased exponent
97 * xm is 3bit extended precision value.
98 */
Ralf Baechle2209bcb2014-04-16 01:31:11 +020099union ieee754dp ieee754dp_format(int sn, int xe, u64 xm)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100{
101 assert(xm); /* we don't gen exact zeros (probably should) */
102
Adam Buchbinder92a76f62016-02-25 00:44:58 -0800103 assert((xm >> (DP_FBITS + 1 + 3)) == 0); /* no excess */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104 assert(xm & (DP_HIDDEN_BIT << 3));
105
106 if (xe < DP_EMIN) {
107 /* strip lower bits */
108 int es = DP_EMIN - xe;
109
110 if (ieee754_csr.nod) {
Ralf Baechle9e8bad12014-04-19 00:36:32 +0200111 ieee754_setcx(IEEE754_UNDERFLOW);
112 ieee754_setcx(IEEE754_INEXACT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113
114 switch(ieee754_csr.rm) {
Ralf Baechle56a64732014-04-30 11:21:55 +0200115 case FPU_CSR_RN:
116 case FPU_CSR_RZ:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117 return ieee754dp_zero(sn);
Ralf Baechle56a64732014-04-30 11:21:55 +0200118 case FPU_CSR_RU: /* toward +Infinity */
Ralf Baechle47fa0c02014-04-16 11:00:12 +0200119 if (sn == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120 return ieee754dp_min(0);
121 else
122 return ieee754dp_zero(1);
Ralf Baechle56a64732014-04-30 11:21:55 +0200123 case FPU_CSR_RD: /* toward -Infinity */
Ralf Baechle47fa0c02014-04-16 11:00:12 +0200124 if (sn == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125 return ieee754dp_zero(0);
126 else
127 return ieee754dp_min(1);
128 }
129 }
130
Ralf Baechlede2fc342014-04-25 10:54:06 +0200131 if (xe == DP_EMIN - 1 &&
132 ieee754dp_get_rounding(sn, xm) >> (DP_FBITS + 1 + 3))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133 {
134 /* Not tiny after rounding */
Ralf Baechle9e8bad12014-04-19 00:36:32 +0200135 ieee754_setcx(IEEE754_INEXACT);
Ralf Baechlede2fc342014-04-25 10:54:06 +0200136 xm = ieee754dp_get_rounding(sn, xm);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137 xm >>= 1;
138 /* Clear grs bits */
139 xm &= ~(DP_MBIT(3) - 1);
140 xe++;
141 }
142 else {
143 /* sticky right shift es bits
144 */
145 xm = XDPSRS(xm, es);
146 xe += es;
147 assert((xm & (DP_HIDDEN_BIT << 3)) == 0);
148 assert(xe == DP_EMIN);
149 }
150 }
151 if (xm & (DP_MBIT(3) - 1)) {
Ralf Baechle9e8bad12014-04-19 00:36:32 +0200152 ieee754_setcx(IEEE754_INEXACT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 if ((xm & (DP_HIDDEN_BIT << 3)) == 0) {
Ralf Baechle9e8bad12014-04-19 00:36:32 +0200154 ieee754_setcx(IEEE754_UNDERFLOW);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 }
156
157 /* inexact must round of 3 bits
158 */
Ralf Baechlede2fc342014-04-25 10:54:06 +0200159 xm = ieee754dp_get_rounding(sn, xm);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160 /* adjust exponent for rounding add overflowing
161 */
Ralf Baechlead8fb552014-04-22 15:51:55 +0200162 if (xm >> (DP_FBITS + 3 + 1)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163 /* add causes mantissa overflow */
164 xm >>= 1;
165 xe++;
166 }
167 }
168 /* strip grs bits */
169 xm >>= 3;
170
Adam Buchbinder92a76f62016-02-25 00:44:58 -0800171 assert((xm >> (DP_FBITS + 1)) == 0); /* no excess */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172 assert(xe >= DP_EMIN);
173
174 if (xe > DP_EMAX) {
Ralf Baechle9e8bad12014-04-19 00:36:32 +0200175 ieee754_setcx(IEEE754_OVERFLOW);
176 ieee754_setcx(IEEE754_INEXACT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 /* -O can be table indexed by (rm,sn) */
178 switch (ieee754_csr.rm) {
Ralf Baechle56a64732014-04-30 11:21:55 +0200179 case FPU_CSR_RN:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 return ieee754dp_inf(sn);
Ralf Baechle56a64732014-04-30 11:21:55 +0200181 case FPU_CSR_RZ:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700182 return ieee754dp_max(sn);
Ralf Baechle56a64732014-04-30 11:21:55 +0200183 case FPU_CSR_RU: /* toward +Infinity */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184 if (sn == 0)
185 return ieee754dp_inf(0);
186 else
187 return ieee754dp_max(1);
Ralf Baechle56a64732014-04-30 11:21:55 +0200188 case FPU_CSR_RD: /* toward -Infinity */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700189 if (sn == 0)
190 return ieee754dp_max(0);
191 else
192 return ieee754dp_inf(1);
193 }
194 }
195 /* gen norm/denorm/zero */
196
197 if ((xm & DP_HIDDEN_BIT) == 0) {
198 /* we underflow (tiny/zero) */
199 assert(xe == DP_EMIN);
200 if (ieee754_csr.mx & IEEE754_UNDERFLOW)
Ralf Baechle9e8bad12014-04-19 00:36:32 +0200201 ieee754_setcx(IEEE754_UNDERFLOW);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202 return builddp(sn, DP_EMIN - 1 + DP_EBIAS, xm);
203 } else {
Adam Buchbinder92a76f62016-02-25 00:44:58 -0800204 assert((xm >> (DP_FBITS + 1)) == 0); /* no excess */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205 assert(xm & DP_HIDDEN_BIT);
206
207 return builddp(sn, xe + DP_EBIAS, xm & ~DP_HIDDEN_BIT);
208 }
209}