blob: d3be351aed151305396723ddfff661837a114cde [file] [log] [blame]
/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 *
 * This program is free software; you can distribute it and/or modify it
 * under the terms of the GNU General Public License (Version 2) as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Nov 7, 2000
 * Modification to allow integration with Linux kernel
 *
 * Kevin D. Kissell, kevink@mips.com and Carsten Langgard, carstenl@mips.com
 * Copyright (C) 2000 MIPS Technologies, Inc. All rights reserved.
 */
Ralf Baechlea663bf92005-10-23 13:44:31 +010024#ifndef __ARCH_MIPS_MATH_EMU_IEEE754_H
25#define __ARCH_MIPS_MATH_EMU_IEEE754_H
Linus Torvalds1da177e2005-04-16 15:20:36 -070026
Ralf Baechlecae55062014-04-16 00:47:59 +020027#include <linux/compiler.h>
Ralf Baechlecd21dfc2005-04-28 13:39:10 +000028#include <asm/byteorder.h>
Ralf Baechlee812a732014-04-19 14:20:54 +020029#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/types.h>
Ralf Baechlecd21dfc2005-04-28 13:39:10 +000031#include <linux/sched.h>
Ralf Baechlef80cc082014-04-16 00:40:02 +020032#include <asm/bitfield.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070033
Ralf Baechle2209bcb2014-04-16 01:31:11 +020034union ieee754dp {
Linus Torvalds1da177e2005-04-16 15:20:36 -070035 struct {
Ralf Baechlef80cc082014-04-16 00:40:02 +020036 __BITFIELD_FIELD(unsigned int sign:1,
37 __BITFIELD_FIELD(unsigned int bexp:11,
38 __BITFIELD_FIELD(u64 mant:52,
39 ;)))
Ralf Baechle49548b02014-04-25 15:48:40 +020040 };
Linus Torvalds1da177e2005-04-16 15:20:36 -070041 u64 bits;
Ralf Baechle2209bcb2014-04-16 01:31:11 +020042};
Linus Torvalds1da177e2005-04-16 15:20:36 -070043
Ralf Baechle2209bcb2014-04-16 01:31:11 +020044union ieee754sp {
Ralf Baechle49548b02014-04-25 15:48:40 +020045 struct {
46 __BITFIELD_FIELD(unsigned sign:1,
47 __BITFIELD_FIELD(unsigned bexp:8,
48 __BITFIELD_FIELD(unsigned mant:23,
49 ;)))
50 };
Linus Torvalds1da177e2005-04-16 15:20:36 -070051 u32 bits;
Ralf Baechle2209bcb2014-04-16 01:31:11 +020052};
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
54/*
55 * single precision (often aka float)
56*/
Ralf Baechle2209bcb2014-04-16 01:31:11 +020057int ieee754sp_class(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070058
Ralf Baechle2209bcb2014-04-16 01:31:11 +020059union ieee754sp ieee754sp_abs(union ieee754sp x);
60union ieee754sp ieee754sp_neg(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
Ralf Baechle2209bcb2014-04-16 01:31:11 +020062union ieee754sp ieee754sp_add(union ieee754sp x, union ieee754sp y);
63union ieee754sp ieee754sp_sub(union ieee754sp x, union ieee754sp y);
64union ieee754sp ieee754sp_mul(union ieee754sp x, union ieee754sp y);
65union ieee754sp ieee754sp_div(union ieee754sp x, union ieee754sp y);
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
Ralf Baechle2209bcb2014-04-16 01:31:11 +020067union ieee754sp ieee754sp_fint(int x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +020068union ieee754sp ieee754sp_flong(s64 x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +020069union ieee754sp ieee754sp_fdp(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070070
Ralf Baechle2209bcb2014-04-16 01:31:11 +020071int ieee754sp_tint(union ieee754sp x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +020072s64 ieee754sp_tlong(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070073
Ralf Baechle2209bcb2014-04-16 01:31:11 +020074int ieee754sp_cmp(union ieee754sp x, union ieee754sp y, int cop, int sig);
Linus Torvalds1da177e2005-04-16 15:20:36 -070075
Ralf Baechle2209bcb2014-04-16 01:31:11 +020076union ieee754sp ieee754sp_sqrt(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070077
Markos Chandrase24c3be2015-08-13 09:56:31 +020078union ieee754sp ieee754sp_maddf(union ieee754sp z, union ieee754sp x,
79 union ieee754sp y);
Markos Chandras83d43302015-08-13 09:56:32 +020080union ieee754sp ieee754sp_msubf(union ieee754sp z, union ieee754sp x,
81 union ieee754sp y);
Markos Chandras38db37b2015-08-13 09:56:34 +020082int ieee754sp_2008class(union ieee754sp x);
Markos Chandras4e9561b2015-08-13 09:56:35 +020083union ieee754sp ieee754sp_fmin(union ieee754sp x, union ieee754sp y);
84union ieee754sp ieee754sp_fmina(union ieee754sp x, union ieee754sp y);
Markos Chandrasa79f5f92015-08-13 09:56:36 +020085union ieee754sp ieee754sp_fmax(union ieee754sp x, union ieee754sp y);
86union ieee754sp ieee754sp_fmaxa(union ieee754sp x, union ieee754sp y);
Markos Chandrase24c3be2015-08-13 09:56:31 +020087
Linus Torvalds1da177e2005-04-16 15:20:36 -070088/*
89 * double precision (often aka double)
90*/
Ralf Baechle2209bcb2014-04-16 01:31:11 +020091int ieee754dp_class(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070092
Ralf Baechle2209bcb2014-04-16 01:31:11 +020093union ieee754dp ieee754dp_add(union ieee754dp x, union ieee754dp y);
94union ieee754dp ieee754dp_sub(union ieee754dp x, union ieee754dp y);
95union ieee754dp ieee754dp_mul(union ieee754dp x, union ieee754dp y);
96union ieee754dp ieee754dp_div(union ieee754dp x, union ieee754dp y);
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
Ralf Baechle2209bcb2014-04-16 01:31:11 +020098union ieee754dp ieee754dp_abs(union ieee754dp x);
99union ieee754dp ieee754dp_neg(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200101union ieee754dp ieee754dp_fint(int x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200102union ieee754dp ieee754dp_flong(s64 x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200103union ieee754dp ieee754dp_fsp(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200105int ieee754dp_tint(union ieee754dp x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200106s64 ieee754dp_tlong(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200108int ieee754dp_cmp(union ieee754dp x, union ieee754dp y, int cop, int sig);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200110union ieee754dp ieee754dp_sqrt(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111
Markos Chandrase24c3be2015-08-13 09:56:31 +0200112union ieee754dp ieee754dp_maddf(union ieee754dp z, union ieee754dp x,
113 union ieee754dp y);
Markos Chandras83d43302015-08-13 09:56:32 +0200114union ieee754dp ieee754dp_msubf(union ieee754dp z, union ieee754dp x,
115 union ieee754dp y);
Markos Chandras38db37b2015-08-13 09:56:34 +0200116int ieee754dp_2008class(union ieee754dp x);
Markos Chandras4e9561b2015-08-13 09:56:35 +0200117union ieee754dp ieee754dp_fmin(union ieee754dp x, union ieee754dp y);
118union ieee754dp ieee754dp_fmina(union ieee754dp x, union ieee754dp y);
Markos Chandrasa79f5f92015-08-13 09:56:36 +0200119union ieee754dp ieee754dp_fmax(union ieee754dp x, union ieee754dp y);
120union ieee754dp ieee754dp_fmaxa(union ieee754dp x, union ieee754dp y);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121
122
/*
 * Classes of floating point number.
 *
 * Six values are defined: normal, zero, denormal, infinity, signalling
 * NaN and quiet NaN.
 */
enum {
	IEEE754_CLASS_NORM	= 0x00,
	IEEE754_CLASS_ZERO	= 0x01,
	IEEE754_CLASS_DNORM	= 0x02,
	IEEE754_CLASS_INF	= 0x03,
	IEEE754_CLASS_SNAN	= 0x04,
	IEEE754_CLASS_QNAN	= 0x05,
};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133
/*
 * exception numbers
 *
 * Each exception is a distinct single bit, so several can be combined in
 * one mask.
 */
#define IEEE754_INEXACT			0x01
#define IEEE754_UNDERFLOW		0x02
#define IEEE754_OVERFLOW		0x04
#define IEEE754_ZERO_DIVIDE		0x08
#define IEEE754_INVALID_OPERATION	0x10
140
/*
 * cmp operators
 *
 * One bit each for less-than, equal, greater-than and unordered, so a
 * compound predicate can be expressed by OR-ing them together.
 */
#define IEEE754_CLT	0x01
#define IEEE754_CEQ	0x02
#define IEEE754_CGT	0x04
#define IEEE754_CUN	0x08
147
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000148/*
149 * The control status register
150 */
151struct _ieee754_csr {
Maciej W. Rozyckif1f3b7e2015-04-03 23:27:38 +0100152 __BITFIELD_FIELD(unsigned fcc:7, /* condition[7:1] */
153 __BITFIELD_FIELD(unsigned nod:1, /* set 1 for no denormals */
154 __BITFIELD_FIELD(unsigned c:1, /* condition[0] */
155 __BITFIELD_FIELD(unsigned pad0:3,
156 __BITFIELD_FIELD(unsigned abs2008:1, /* IEEE 754-2008 ABS/NEG.fmt */
157 __BITFIELD_FIELD(unsigned nan2008:1, /* IEEE 754-2008 NaN mode */
Ralf Baechlef80cc082014-04-16 00:40:02 +0200158 __BITFIELD_FIELD(unsigned cx:6, /* exceptions this operation */
159 __BITFIELD_FIELD(unsigned mx:5, /* exception enable mask */
160 __BITFIELD_FIELD(unsigned sx:5, /* exceptions total */
161 __BITFIELD_FIELD(unsigned rm:2, /* current rounding mode */
Maciej W. Rozyckif1f3b7e2015-04-03 23:27:38 +0100162 ;))))))))))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163};
Atsushi Nemotoeae89072006-05-16 01:26:03 +0900164#define ieee754_csr (*(struct _ieee754_csr *)(&current->thread.fpu.fcr31))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000166static inline unsigned ieee754_getrm(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167{
168 return (ieee754_csr.rm);
169}
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000170static inline unsigned ieee754_setrm(unsigned rm)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171{
172 return (ieee754_csr.rm = rm);
173}
174
175/*
176 * get current exceptions
177 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000178static inline unsigned ieee754_getcx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179{
180 return (ieee754_csr.cx);
181}
182
183/* test for current exception condition
184 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000185static inline int ieee754_cxtest(unsigned n)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186{
187 return (ieee754_csr.cx & n);
188}
189
190/*
191 * get sticky exceptions
192 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000193static inline unsigned ieee754_getsx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700194{
195 return (ieee754_csr.sx);
196}
197
198/* clear sticky conditions
199*/
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000200static inline unsigned ieee754_clrsx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201{
202 return (ieee754_csr.sx = 0);
203}
204
205/* test for sticky exception condition
206 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000207static inline int ieee754_sxtest(unsigned n)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208{
209 return (ieee754_csr.sx & n);
210}
211
/*
 * debugging
 *
 * Only the prototypes are visible here.  Presumably 's' is a label for
 * the dump and the operand is handed back as the return value - TODO
 * confirm with the implementation.
 */
union ieee754sp ieee754sp_dump(char *s, union ieee754sp x);
union ieee754dp ieee754dp_dump(char *s, union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700215
/*
 * Indices of the special values.
 *
 * Signed values come in pairs with the negative entry directly after the
 * positive one, so "positive index + sign" selects the right entry.  The
 * two quiet NaN encodings are adjacent in the same way (legacy first).
 */
#define IEEE754_SPCVAL_PZERO		0	/* +0.0 */
#define IEEE754_SPCVAL_NZERO		1	/* -0.0 */
#define IEEE754_SPCVAL_PONE		2	/* +1.0 */
#define IEEE754_SPCVAL_NONE		3	/* -1.0 */
#define IEEE754_SPCVAL_PTEN		4	/* +10.0 */
#define IEEE754_SPCVAL_NTEN		5	/* -10.0 */
#define IEEE754_SPCVAL_PINFINITY	6	/* +inf */
#define IEEE754_SPCVAL_NINFINITY	7	/* -inf */
#define IEEE754_SPCVAL_INDEF_LEG	8	/* legacy quiet NaN */
#define IEEE754_SPCVAL_INDEF_2008	9	/* IEEE 754-2008 quiet NaN */
#define IEEE754_SPCVAL_PMAX		10	/* +max norm */
#define IEEE754_SPCVAL_NMAX		11	/* -max norm */
#define IEEE754_SPCVAL_PMIN		12	/* +min norm */
#define IEEE754_SPCVAL_NMIN		13	/* -min norm */
#define IEEE754_SPCVAL_PMIND		14	/* +min denorm */
#define IEEE754_SPCVAL_NMIND		15	/* -min denorm */
#define IEEE754_SPCVAL_P1E31		16	/* + 1.0e31 */
#define IEEE754_SPCVAL_P1E63		17	/* + 1.0e63 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234
Ralf Baechle49548b02014-04-25 15:48:40 +0200235extern const union ieee754dp __ieee754dp_spcvals[];
236extern const union ieee754sp __ieee754sp_spcvals[];
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200237#define ieee754dp_spcvals ((const union ieee754dp *)__ieee754dp_spcvals)
238#define ieee754sp_spcvals ((const union ieee754sp *)__ieee754sp_spcvals)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239
/*
 * Double-precision special values.
 *
 * For the macros taking 'sn', sn is added to the index of the positive
 * entry: 0 yields the positive value and 1 the negative one, which sits
 * directly after it in the IEEE754_SPCVAL_* numbering (e.g.
 * ieee754dp_inf(sn) returns infinity with the given sign).
 * ieee754dp_indef() picks the legacy quiet NaN when ieee754_csr.nan2008
 * is 0 and the IEEE 754-2008 quiet NaN when it is 1.
 */
#define ieee754dp_inf(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754dp_zero(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754dp_one(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754dp_ten(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754dp_indef()	(ieee754dp_spcvals[IEEE754_SPCVAL_INDEF_LEG + \
						   ieee754_csr.nan2008])
#define ieee754dp_max(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754dp_min(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754dp_mind(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754dp_1e31()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754dp_1e63()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E63])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254
/*
 * Single-precision special values.
 *
 * For the macros taking 'sn', sn is added to the index of the positive
 * entry: 0 yields the positive value and 1 the negative one, which sits
 * directly after it in the IEEE754_SPCVAL_* numbering.
 * ieee754sp_indef() picks the legacy quiet NaN when ieee754_csr.nan2008
 * is 0 and the IEEE 754-2008 quiet NaN when it is 1.
 */
#define ieee754sp_inf(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754sp_zero(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754sp_one(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754sp_ten(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754sp_indef()	(ieee754sp_spcvals[IEEE754_SPCVAL_INDEF_LEG + \
						   ieee754_csr.nan2008])
#define ieee754sp_max(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754sp_min(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754sp_mind(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754sp_1e31()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754sp_1e63()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E63])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000267/*
268 * Indefinite integer value
269 */
Ralf Baechlee812a732014-04-19 14:20:54 +0200270static inline int ieee754si_indef(void)
271{
Maciej W. Rozycki90d53a92015-11-13 00:47:28 +0000272 return ieee754_csr.nan2008 ? 0 : INT_MAX;
Ralf Baechlee812a732014-04-19 14:20:54 +0200273}
274
275static inline s64 ieee754di_indef(void)
276{
Maciej W. Rozycki90d53a92015-11-13 00:47:28 +0000277 return ieee754_csr.nan2008 ? 0 : S64_MAX;
278}
279
280/*
281 * Overflow integer value
282 */
283static inline int ieee754si_overflow(int xs)
284{
285 return ieee754_csr.nan2008 && xs ? INT_MIN : INT_MAX;
286}
287
288static inline s64 ieee754di_overflow(int xs)
289{
290 return ieee754_csr.nan2008 && xs ? S64_MIN : S64_MAX;
Ralf Baechlee812a732014-04-19 14:20:54 +0200291}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292
/* result types for xctx.rt */
#define IEEE754_RT_SP	0
#define IEEE754_RT_DP	1
#define IEEE754_RT_XP	2
#define IEEE754_RT_SI	3
#define IEEE754_RT_DI	4
299
/*
 * compat
 *
 * The *_fix() names are aliases that expand to the corresponding
 * *_tint() calls.
 */
#define ieee754dp_fix(x)	ieee754dp_tint(x)
#define ieee754sp_fix(x)	ieee754sp_tint(x)
Ralf Baechlea663bf92005-10-23 13:44:31 +0100303
304#endif /* __ARCH_MIPS_MATH_EMU_IEEE754_H */