blob: e87a6361149bee0c06ad19b14c28ba18e69f5222 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * MIPS floating point support
3 * Copyright (C) 1994-2000 Algorithmics Ltd.
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07005 * This program is free software; you can distribute it and/or modify it
6 * under the terms of the GNU General Public License (Version 2) as
7 * published by the Free Software Foundation.
8 *
9 * This program is distributed in the hope it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
12 * for more details.
13 *
14 * You should have received a copy of the GNU General Public License along
15 * with this program; if not, write to the Free Software Foundation, Inc.,
16 * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA.
17 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070018 * Nov 7, 2000
19 * Modification to allow integration with Linux kernel
20 *
21 * Kevin D. Kissell, kevink@mips.com and Carsten Langgard, carstenl@mips.com
22 * Copyright (C) 2000 MIPS Technologies, Inc. All rights reserved.
Ralf Baechlecd21dfc2005-04-28 13:39:10 +000023 */
Ralf Baechlea663bf92005-10-23 13:44:31 +010024#ifndef __ARCH_MIPS_MATH_EMU_IEEE754_H
25#define __ARCH_MIPS_MATH_EMU_IEEE754_H
Linus Torvalds1da177e2005-04-16 15:20:36 -070026
Ralf Baechlecae55062014-04-16 00:47:59 +020027#include <linux/compiler.h>
Ralf Baechlecd21dfc2005-04-28 13:39:10 +000028#include <asm/byteorder.h>
Ralf Baechlee812a732014-04-19 14:20:54 +020029#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/types.h>
Ralf Baechlecd21dfc2005-04-28 13:39:10 +000031#include <linux/sched.h>
Ralf Baechlef80cc082014-04-16 00:40:02 +020032#include <asm/bitfield.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070033
Ralf Baechle23708812014-04-16 01:16:02 +020034struct ieee754dp_const {
Ralf Baechlef80cc082014-04-16 00:40:02 +020035 __BITFIELD_FIELD(unsigned sign:1,
36 __BITFIELD_FIELD(unsigned bexp:11,
37 __BITFIELD_FIELD(unsigned manthi:20,
38 __BITFIELD_FIELD(unsigned mantlo:32,
39 ;))))
Linus Torvalds1da177e2005-04-16 15:20:36 -070040};
41
Ralf Baechle2209bcb2014-04-16 01:31:11 +020042union ieee754dp {
Ralf Baechle23708812014-04-16 01:16:02 +020043 struct ieee754dp_const oparts;
Linus Torvalds1da177e2005-04-16 15:20:36 -070044 struct {
Ralf Baechlef80cc082014-04-16 00:40:02 +020045 __BITFIELD_FIELD(unsigned int sign:1,
46 __BITFIELD_FIELD(unsigned int bexp:11,
47 __BITFIELD_FIELD(u64 mant:52,
48 ;)))
Linus Torvalds1da177e2005-04-16 15:20:36 -070049 } parts;
50 double d;
51 u64 bits;
Ralf Baechle2209bcb2014-04-16 01:31:11 +020052};
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
Ralf Baechle23708812014-04-16 01:16:02 +020054struct ieee754sp_const {
Ralf Baechlef80cc082014-04-16 00:40:02 +020055 __BITFIELD_FIELD(unsigned sign:1,
56 __BITFIELD_FIELD(unsigned bexp:8,
57 __BITFIELD_FIELD(unsigned mant:23,
58 ;)))
Linus Torvalds1da177e2005-04-16 15:20:36 -070059};
60
Ralf Baechle2209bcb2014-04-16 01:31:11 +020061union ieee754sp {
Ralf Baechle23708812014-04-16 01:16:02 +020062 struct ieee754sp_const parts;
Linus Torvalds1da177e2005-04-16 15:20:36 -070063 float f;
64 u32 bits;
Ralf Baechle2209bcb2014-04-16 01:31:11 +020065};
Linus Torvalds1da177e2005-04-16 15:20:36 -070066
67/*
68 * single precision (often aka float)
69*/
Ralf Baechle2209bcb2014-04-16 01:31:11 +020070int ieee754sp_class(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070071
Ralf Baechle2209bcb2014-04-16 01:31:11 +020072union ieee754sp ieee754sp_abs(union ieee754sp x);
73union ieee754sp ieee754sp_neg(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070074
Ralf Baechle2209bcb2014-04-16 01:31:11 +020075union ieee754sp ieee754sp_add(union ieee754sp x, union ieee754sp y);
76union ieee754sp ieee754sp_sub(union ieee754sp x, union ieee754sp y);
77union ieee754sp ieee754sp_mul(union ieee754sp x, union ieee754sp y);
78union ieee754sp ieee754sp_div(union ieee754sp x, union ieee754sp y);
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
Ralf Baechle2209bcb2014-04-16 01:31:11 +020080union ieee754sp ieee754sp_fint(int x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +020081union ieee754sp ieee754sp_flong(s64 x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +020082union ieee754sp ieee754sp_fdp(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070083
Ralf Baechle2209bcb2014-04-16 01:31:11 +020084int ieee754sp_tint(union ieee754sp x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +020085s64 ieee754sp_tlong(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070086
Ralf Baechle2209bcb2014-04-16 01:31:11 +020087int ieee754sp_cmp(union ieee754sp x, union ieee754sp y, int cop, int sig);
Linus Torvalds1da177e2005-04-16 15:20:36 -070088
Ralf Baechle2209bcb2014-04-16 01:31:11 +020089union ieee754sp ieee754sp_sqrt(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070090
91/*
92 * double precision (often aka double)
93*/
Ralf Baechle2209bcb2014-04-16 01:31:11 +020094int ieee754dp_class(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -070095
Ralf Baechle2209bcb2014-04-16 01:31:11 +020096union ieee754dp ieee754dp_add(union ieee754dp x, union ieee754dp y);
97union ieee754dp ieee754dp_sub(union ieee754dp x, union ieee754dp y);
98union ieee754dp ieee754dp_mul(union ieee754dp x, union ieee754dp y);
99union ieee754dp ieee754dp_div(union ieee754dp x, union ieee754dp y);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200101union ieee754dp ieee754dp_abs(union ieee754dp x);
102union ieee754dp ieee754dp_neg(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200104union ieee754dp ieee754dp_fint(int x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200105union ieee754dp ieee754dp_flong(s64 x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200106union ieee754dp ieee754dp_fsp(union ieee754sp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200108int ieee754dp_tint(union ieee754dp x);
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200109s64 ieee754dp_tlong(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200111int ieee754dp_cmp(union ieee754dp x, union ieee754dp y, int cop, int sig);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200113union ieee754dp ieee754dp_sqrt(union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114
115
116
/*
 * The six classes of floating point number.
 * NOTE(review): presumably the values returned by ieee754sp_class() and
 * ieee754dp_class() - confirm against their definitions.
 */
enum {
	IEEE754_CLASS_NORM	= 0x00,
	IEEE754_CLASS_ZERO	= 0x01,
	IEEE754_CLASS_DNORM	= 0x02,
	IEEE754_CLASS_INF	= 0x03,
	IEEE754_CLASS_SNAN	= 0x04,
	IEEE754_CLASS_QNAN	= 0x05,
};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127
/* exception numbers (one bit each, so they can be OR-ed into a mask) */
#define IEEE754_INEXACT			0x01
#define IEEE754_UNDERFLOW		0x02
#define IEEE754_OVERFLOW		0x04
#define IEEE754_ZERO_DIVIDE		0x08
#define IEEE754_INVALID_OPERATION	0x10
134
/*
 * cmp operators: one bit per relation, OR-ed together to form the `cop`
 * argument of ieee754sp_cmp() / ieee754dp_cmp().
 */
#define IEEE754_CLT	0x01
#define IEEE754_CEQ	0x02
#define IEEE754_CGT	0x04
#define IEEE754_CUN	0x08
141
/* rounding mode */
#define IEEE754_RN	0	/* round to nearest */
#define IEEE754_RZ	1	/* round toward zero */
#define IEEE754_RD	2	/* round toward -Infinity */
#define IEEE754_RU	3	/* round toward +Infinity */

/* other naming: RM aliases RD, RP aliases RU */
#define IEEE754_RM	IEEE754_RD
#define IEEE754_RP	IEEE754_RU
152
153/* "normal" comparisons
154*/
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200155static inline int ieee754sp_eq(union ieee754sp x, union ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156{
157 return ieee754sp_cmp(x, y, IEEE754_CEQ, 0);
158}
159
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200160static inline int ieee754sp_ne(union ieee754sp x, union ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161{
162 return ieee754sp_cmp(x, y,
163 IEEE754_CLT | IEEE754_CGT | IEEE754_CUN, 0);
164}
165
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200166static inline int ieee754sp_lt(union ieee754sp x, union ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167{
168 return ieee754sp_cmp(x, y, IEEE754_CLT, 0);
169}
170
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200171static inline int ieee754sp_le(union ieee754sp x, union ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700172{
173 return ieee754sp_cmp(x, y, IEEE754_CLT | IEEE754_CEQ, 0);
174}
175
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200176static inline int ieee754sp_gt(union ieee754sp x, union ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177{
178 return ieee754sp_cmp(x, y, IEEE754_CGT, 0);
179}
180
181
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200182static inline int ieee754sp_ge(union ieee754sp x, union ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183{
184 return ieee754sp_cmp(x, y, IEEE754_CGT | IEEE754_CEQ, 0);
185}
186
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200187static inline int ieee754dp_eq(union ieee754dp x, union ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700188{
189 return ieee754dp_cmp(x, y, IEEE754_CEQ, 0);
190}
191
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200192static inline int ieee754dp_ne(union ieee754dp x, union ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193{
194 return ieee754dp_cmp(x, y,
195 IEEE754_CLT | IEEE754_CGT | IEEE754_CUN, 0);
196}
197
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200198static inline int ieee754dp_lt(union ieee754dp x, union ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199{
200 return ieee754dp_cmp(x, y, IEEE754_CLT, 0);
201}
202
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200203static inline int ieee754dp_le(union ieee754dp x, union ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700204{
205 return ieee754dp_cmp(x, y, IEEE754_CLT | IEEE754_CEQ, 0);
206}
207
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200208static inline int ieee754dp_gt(union ieee754dp x, union ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700209{
210 return ieee754dp_cmp(x, y, IEEE754_CGT, 0);
211}
212
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200213static inline int ieee754dp_ge(union ieee754dp x, union ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214{
215 return ieee754dp_cmp(x, y, IEEE754_CGT | IEEE754_CEQ, 0);
216}
217
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000218/*
219 * The control status register
220 */
221struct _ieee754_csr {
Ralf Baechlef80cc082014-04-16 00:40:02 +0200222 __BITFIELD_FIELD(unsigned pad0:7,
223 __BITFIELD_FIELD(unsigned nod:1, /* set 1 for no denormalised numbers */
224 __BITFIELD_FIELD(unsigned c:1, /* condition */
225 __BITFIELD_FIELD(unsigned pad1:5,
226 __BITFIELD_FIELD(unsigned cx:6, /* exceptions this operation */
227 __BITFIELD_FIELD(unsigned mx:5, /* exception enable mask */
228 __BITFIELD_FIELD(unsigned sx:5, /* exceptions total */
229 __BITFIELD_FIELD(unsigned rm:2, /* current rounding mode */
230 ;))))))))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231};
Atsushi Nemotoeae89072006-05-16 01:26:03 +0900232#define ieee754_csr (*(struct _ieee754_csr *)(&current->thread.fpu.fcr31))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000234static inline unsigned ieee754_getrm(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235{
236 return (ieee754_csr.rm);
237}
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000238static inline unsigned ieee754_setrm(unsigned rm)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239{
240 return (ieee754_csr.rm = rm);
241}
242
243/*
244 * get current exceptions
245 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000246static inline unsigned ieee754_getcx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247{
248 return (ieee754_csr.cx);
249}
250
251/* test for current exception condition
252 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000253static inline int ieee754_cxtest(unsigned n)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254{
255 return (ieee754_csr.cx & n);
256}
257
258/*
259 * get sticky exceptions
260 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000261static inline unsigned ieee754_getsx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262{
263 return (ieee754_csr.sx);
264}
265
266/* clear sticky conditions
267*/
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000268static inline unsigned ieee754_clrsx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269{
270 return (ieee754_csr.sx = 0);
271}
272
273/* test for sticky exception condition
274 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000275static inline int ieee754_sxtest(unsigned n)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276{
277 return (ieee754_csr.sx & n);
278}
279
/*
 * debugging
 *
 * Declarations only; the definitions are outside this header.
 * NOTE(review): s is presumably a label printed with the value, and the
 * return value presumably x itself - confirm against the definitions.
 */
union ieee754sp ieee754sp_dump(char *s, union ieee754sp x);
union ieee754dp ieee754dp_dump(char *s, union ieee754dp x);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283
/*
 * Indices into the special-value tables (ieee754sp_spcvals[] and
 * ieee754dp_spcvals[]).  Where a value has both signs, the negative
 * entry is the positive index + 1, which is what the accessor macros
 * rely on when they add their sign argument.
 */
#define IEEE754_SPCVAL_PZERO		0
#define IEEE754_SPCVAL_NZERO		1
#define IEEE754_SPCVAL_PONE		2
#define IEEE754_SPCVAL_NONE		3
#define IEEE754_SPCVAL_PTEN		4
#define IEEE754_SPCVAL_NTEN		5
#define IEEE754_SPCVAL_PINFINITY	6
#define IEEE754_SPCVAL_NINFINITY	7
#define IEEE754_SPCVAL_INDEF		8
#define IEEE754_SPCVAL_PMAX		9	/* +max norm */
#define IEEE754_SPCVAL_NMAX		10	/* -max norm */
#define IEEE754_SPCVAL_PMIN		11	/* +min norm */
#define IEEE754_SPCVAL_NMIN		12	/* -min norm */
#define IEEE754_SPCVAL_PMIND		13	/* +min denorm */
#define IEEE754_SPCVAL_NMIND		14	/* -min denorm */
#define IEEE754_SPCVAL_P1E31		15	/* + 1.0e31 */
#define IEEE754_SPCVAL_P1E63		16	/* + 1.0e63 */
301
Ralf Baechle23708812014-04-16 01:16:02 +0200302extern const struct ieee754dp_const __ieee754dp_spcvals[];
303extern const struct ieee754sp_const __ieee754sp_spcvals[];
Ralf Baechle2209bcb2014-04-16 01:31:11 +0200304#define ieee754dp_spcvals ((const union ieee754dp *)__ieee754dp_spcvals)
305#define ieee754sp_spcvals ((const union ieee754sp *)__ieee754sp_spcvals)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306
/*
 * Double-precision special values.
 *
 * For the macros taking `sn`, the table index is the positive-value
 * constant plus sn, so sn = 0 selects the positive entry and sn = 1 the
 * negative one.  No range check is done on sn.
 */
#define ieee754dp_inf(sn)     (ieee754dp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754dp_zero(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754dp_one(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754dp_ten(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754dp_indef()	(ieee754dp_spcvals[IEEE754_SPCVAL_INDEF])
#define ieee754dp_max(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754dp_min(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754dp_mind(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754dp_1e31()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754dp_1e63()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E63])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320
/*
 * Single-precision special values.
 *
 * For the macros taking `sn`, the table index is the positive-value
 * constant plus sn, so sn = 0 selects the positive entry and sn = 1 the
 * negative one.  No range check is done on sn.
 */
#define ieee754sp_inf(sn)     (ieee754sp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754sp_zero(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754sp_one(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754sp_ten(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754sp_indef()	(ieee754sp_spcvals[IEEE754_SPCVAL_INDEF])
#define ieee754sp_max(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754sp_min(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754sp_mind(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754sp_1e31()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754sp_1e63()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E63])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331
/*
 * Indefinite integer value (32-bit flavour): always INT_MAX.
 */
static inline int ieee754si_indef(void)
{
	return INT_MAX;
}
339
340static inline s64 ieee754di_indef(void)
341{
342 return S64_MAX;
343}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
/* result types for xctx.rt */
#define IEEE754_RT_SP	0
#define IEEE754_RT_DP	1
#define IEEE754_RT_XP	2
#define IEEE754_RT_SI	3
#define IEEE754_RT_DI	4
351
/* compat: the older *_fix() names forward to the *_tint() conversions */
#define ieee754dp_fix(x)	ieee754dp_tint(x)
#define ieee754sp_fix(x)	ieee754sp_tint(x)
Ralf Baechlea663bf92005-10-23 13:44:31 +0100355
356#endif /* __ARCH_MIPS_MATH_EMU_IEEE754_H */