/*
 * MIPS floating point support
 * Copyright (C) 1994-2000 Algorithmics Ltd.
 * http://www.algor.co.uk
 *
 * This program is free software; you can distribute it and/or modify it
 * under the terms of the GNU General Public License (Version 2) as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 * for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA.
 *
 * Nov 7, 2000
 * Modification to allow integration with Linux kernel
 *
 * Kevin D. Kissell, kevink@mips.com and Carsten Langgard, carstenl@mips.com
 * Copyright (C) 2000 MIPS Technologies, Inc. All rights reserved.
 */

#include <asm/byteorder.h>
#include <linux/types.h>
#include <linux/sched.h>

/*
 * Not very pretty, but the Linux kernel's normal va_list definition
 * does not allow it to be used as a structure element, as it is here.
 */
#ifndef _STDARG_H
#include <stdarg.h>
#endif

#ifdef __LITTLE_ENDIAN
/*
 * Field layout of a double for little-endian builds, declared starting
 * with the low mantissa word.  The 52 mantissa bits are split into
 * mantlo (32 bits) and manthi (20 bits); bexp is the 11-bit exponent field
 * and sign the sign bit.  This is the element type of the
 * __ieee754dp_spcvals constant table.
 */
struct ieee754dp_konst {
	unsigned mantlo:32;
	unsigned manthi:20;
	unsigned bexp:11;
	unsigned sign:1;
};

/*
 * Field layout of a float for little-endian builds: 23-bit mantissa,
 * 8-bit exponent field, sign bit.  Element type of __ieee754sp_spcvals.
 */
struct ieee754sp_konst {
	unsigned mant:23;
	unsigned bexp:8;
	unsigned sign:1;
};

/*
 * Double precision value.  The members are alternative views of the same
 * storage: split-mantissa fields (oparts), fields with a single 52-bit
 * mantissa (parts), the raw 64-bit pattern (bits) and a native double (d).
 */
typedef union _ieee754dp {
	struct ieee754dp_konst oparts;
	struct {
		u64 mant:52;
		unsigned int bexp:11;
		unsigned int sign:1;
	} parts;
	u64 bits;
	double d;
} ieee754dp;

/*
 * Single precision value: bitfield view (parts), native float (f) and
 * raw 32-bit pattern (bits) of the same storage.
 */
typedef union _ieee754sp {
	struct ieee754sp_konst parts;
	float f;
	u32 bits;
} ieee754sp;
#endif

#ifdef __BIG_ENDIAN
/*
 * Field layout of a double for big-endian builds, declared starting with
 * the sign bit.  bexp is the 11-bit exponent field; the 52 mantissa bits
 * are split into manthi (20 bits) and mantlo (32 bits).  This is the
 * element type of the __ieee754dp_spcvals constant table.
 */
struct ieee754dp_konst {
	unsigned sign:1;
	unsigned bexp:11;
	unsigned manthi:20;
	unsigned mantlo:32;
};

/*
 * Double precision value.  The members are alternative views of the same
 * storage: split-mantissa fields (oparts), fields with a single 52-bit
 * mantissa (parts), a native double (d) and the raw 64-bit pattern (bits).
 */
typedef union _ieee754dp {
	struct ieee754dp_konst oparts;
	struct {
		unsigned int sign:1;
		unsigned int bexp:11;
		u64 mant:52;
	} parts;
	double d;
	u64 bits;
} ieee754dp;

/*
 * Field layout of a float for big-endian builds: sign bit, 8-bit exponent
 * field, 23-bit mantissa.  Element type of __ieee754sp_spcvals.
 */
struct ieee754sp_konst {
	unsigned sign:1;
	unsigned bexp:8;
	unsigned mant:23;
};

/*
 * Single precision value: bitfield view (parts), native float (f) and
 * raw 32-bit pattern (bits) of the same storage.
 */
typedef union _ieee754sp {
	struct ieee754sp_konst parts;
	float f;
	u32 bits;
} ieee754sp;
#endif

101/*
102 * single precision (often aka float)
103*/
104int ieee754sp_finite(ieee754sp x);
105int ieee754sp_class(ieee754sp x);
106
107ieee754sp ieee754sp_abs(ieee754sp x);
108ieee754sp ieee754sp_neg(ieee754sp x);
109ieee754sp ieee754sp_scalb(ieee754sp x, int);
110ieee754sp ieee754sp_logb(ieee754sp x);
111
112/* x with sign of y */
113ieee754sp ieee754sp_copysign(ieee754sp x, ieee754sp y);
114
115ieee754sp ieee754sp_add(ieee754sp x, ieee754sp y);
116ieee754sp ieee754sp_sub(ieee754sp x, ieee754sp y);
117ieee754sp ieee754sp_mul(ieee754sp x, ieee754sp y);
118ieee754sp ieee754sp_div(ieee754sp x, ieee754sp y);
119
120ieee754sp ieee754sp_fint(int x);
121ieee754sp ieee754sp_funs(unsigned x);
122ieee754sp ieee754sp_flong(s64 x);
123ieee754sp ieee754sp_fulong(u64 x);
124ieee754sp ieee754sp_fdp(ieee754dp x);
125
126int ieee754sp_tint(ieee754sp x);
127unsigned int ieee754sp_tuns(ieee754sp x);
128s64 ieee754sp_tlong(ieee754sp x);
129u64 ieee754sp_tulong(ieee754sp x);
130
131int ieee754sp_cmp(ieee754sp x, ieee754sp y, int cop, int sig);
132/*
133 * basic sp math
134 */
135ieee754sp ieee754sp_modf(ieee754sp x, ieee754sp * ip);
136ieee754sp ieee754sp_frexp(ieee754sp x, int *exp);
137ieee754sp ieee754sp_ldexp(ieee754sp x, int exp);
138
139ieee754sp ieee754sp_ceil(ieee754sp x);
140ieee754sp ieee754sp_floor(ieee754sp x);
141ieee754sp ieee754sp_trunc(ieee754sp x);
142
143ieee754sp ieee754sp_sqrt(ieee754sp x);
144
145/*
146 * double precision (often aka double)
147*/
148int ieee754dp_finite(ieee754dp x);
149int ieee754dp_class(ieee754dp x);
150
151/* x with sign of y */
152ieee754dp ieee754dp_copysign(ieee754dp x, ieee754dp y);
153
154ieee754dp ieee754dp_add(ieee754dp x, ieee754dp y);
155ieee754dp ieee754dp_sub(ieee754dp x, ieee754dp y);
156ieee754dp ieee754dp_mul(ieee754dp x, ieee754dp y);
157ieee754dp ieee754dp_div(ieee754dp x, ieee754dp y);
158
159ieee754dp ieee754dp_abs(ieee754dp x);
160ieee754dp ieee754dp_neg(ieee754dp x);
161ieee754dp ieee754dp_scalb(ieee754dp x, int);
162
163/* return exponent as integer in floating point format
164 */
165ieee754dp ieee754dp_logb(ieee754dp x);
166
167ieee754dp ieee754dp_fint(int x);
168ieee754dp ieee754dp_funs(unsigned x);
169ieee754dp ieee754dp_flong(s64 x);
170ieee754dp ieee754dp_fulong(u64 x);
171ieee754dp ieee754dp_fsp(ieee754sp x);
172
173ieee754dp ieee754dp_ceil(ieee754dp x);
174ieee754dp ieee754dp_floor(ieee754dp x);
175ieee754dp ieee754dp_trunc(ieee754dp x);
176
177int ieee754dp_tint(ieee754dp x);
178unsigned int ieee754dp_tuns(ieee754dp x);
179s64 ieee754dp_tlong(ieee754dp x);
180u64 ieee754dp_tulong(ieee754dp x);
181
182int ieee754dp_cmp(ieee754dp x, ieee754dp y, int cop, int sig);
183/*
184 * basic sp math
185 */
186ieee754dp ieee754dp_modf(ieee754dp x, ieee754dp * ip);
187ieee754dp ieee754dp_frexp(ieee754dp x, int *exp);
188ieee754dp ieee754dp_ldexp(ieee754dp x, int exp);
189
190ieee754dp ieee754dp_ceil(ieee754dp x);
191ieee754dp ieee754dp_floor(ieee754dp x);
192ieee754dp ieee754dp_trunc(ieee754dp x);
193
194ieee754dp ieee754dp_sqrt(ieee754dp x);
195
196
197
/*
 * The 6 classes of floating point number
 */
#define IEEE754_CLASS_NORM	0x00
#define IEEE754_CLASS_ZERO	0x01
#define IEEE754_CLASS_DNORM	0x02
#define IEEE754_CLASS_INF	0x03
#define IEEE754_CLASS_SNAN	0x04
#define IEEE754_CLASS_QNAN	0x05
/* presumably one name per class value above - TODO confirm at the definition */
extern const char *const ieee754_cname[];

/* exception numbers (one bit each, so they can be OR-ed into a mask) */
#define IEEE754_INEXACT			0x01
#define IEEE754_UNDERFLOW		0x02
#define IEEE754_OVERFLOW		0x04
#define IEEE754_ZERO_DIVIDE		0x08
#define IEEE754_INVALID_OPERATION	0x10

/*
 * cmp operators: relation bits, OR-ed together to form the cop argument
 * of ieee754sp_cmp() / ieee754dp_cmp()
 */
#define IEEE754_CLT	0x01
#define IEEE754_CEQ	0x02
#define IEEE754_CGT	0x04
#define IEEE754_CUN	0x08

/*
 * rounding mode
 */
#define IEEE754_RN	0	/* round to nearest */
#define IEEE754_RZ	1	/* round toward zero */
#define IEEE754_RD	2	/* round toward -Infinity */
#define IEEE754_RU	3	/* round toward +Infinity */

/* other naming */
#define IEEE754_RM	IEEE754_RD
#define IEEE754_RP	IEEE754_RU

233/* "normal" comparisons
234*/
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000235static inline int ieee754sp_eq(ieee754sp x, ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236{
237 return ieee754sp_cmp(x, y, IEEE754_CEQ, 0);
238}
239
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000240static inline int ieee754sp_ne(ieee754sp x, ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241{
242 return ieee754sp_cmp(x, y,
243 IEEE754_CLT | IEEE754_CGT | IEEE754_CUN, 0);
244}
245
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000246static inline int ieee754sp_lt(ieee754sp x, ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247{
248 return ieee754sp_cmp(x, y, IEEE754_CLT, 0);
249}
250
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000251static inline int ieee754sp_le(ieee754sp x, ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252{
253 return ieee754sp_cmp(x, y, IEEE754_CLT | IEEE754_CEQ, 0);
254}
255
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000256static inline int ieee754sp_gt(ieee754sp x, ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257{
258 return ieee754sp_cmp(x, y, IEEE754_CGT, 0);
259}
260
261
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000262static inline int ieee754sp_ge(ieee754sp x, ieee754sp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263{
264 return ieee754sp_cmp(x, y, IEEE754_CGT | IEEE754_CEQ, 0);
265}
266
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000267static inline int ieee754dp_eq(ieee754dp x, ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268{
269 return ieee754dp_cmp(x, y, IEEE754_CEQ, 0);
270}
271
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000272static inline int ieee754dp_ne(ieee754dp x, ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700273{
274 return ieee754dp_cmp(x, y,
275 IEEE754_CLT | IEEE754_CGT | IEEE754_CUN, 0);
276}
277
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000278static inline int ieee754dp_lt(ieee754dp x, ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279{
280 return ieee754dp_cmp(x, y, IEEE754_CLT, 0);
281}
282
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000283static inline int ieee754dp_le(ieee754dp x, ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700284{
285 return ieee754dp_cmp(x, y, IEEE754_CLT | IEEE754_CEQ, 0);
286}
287
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000288static inline int ieee754dp_gt(ieee754dp x, ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289{
290 return ieee754dp_cmp(x, y, IEEE754_CGT, 0);
291}
292
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000293static inline int ieee754dp_ge(ieee754dp x, ieee754dp y)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294{
295 return ieee754dp_cmp(x, y, IEEE754_CGT | IEEE754_CEQ, 0);
296}
297
298
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000299/*
300 * Like strtod
301 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302ieee754dp ieee754dp_fstr(const char *s, char **endp);
303char *ieee754dp_tstr(ieee754dp x, int prec, int fmt, int af);
304
305
/*
 * The control status register
 *
 * Bitfield view of a 32-bit word.  The two variants list the same fields
 * in opposite order, selected by the endianness macros.
 */
struct _ieee754_csr {
#ifdef __BIG_ENDIAN
	unsigned pad0:7;
	unsigned nod:1;		/* set 1 for no denormalised numbers */
	unsigned c:1;		/* condition */
	unsigned pad1:5;
	unsigned cx:6;		/* exceptions this operation */
	unsigned mx:5;		/* exception enable mask */
	unsigned sx:5;		/* exceptions total */
	unsigned rm:2;		/* current rounding mode */
#endif
#ifdef __LITTLE_ENDIAN
	unsigned rm:2;		/* current rounding mode */
	unsigned sx:5;		/* exceptions total */
	unsigned mx:5;		/* exception enable mask */
	unsigned cx:6;		/* exceptions this operation */
	unsigned pad1:5;
	unsigned c:1;		/* condition */
	unsigned nod:1;		/* set 1 for no denormalised numbers */
	unsigned pad0:7;
#endif
};

/*
 * The current task's soft-FPU fcr31 word, accessed through the bitfield
 * layout above.  Expands to an lvalue, so fields can be read and assigned.
 */
#define ieee754_csr (*(struct _ieee754_csr *)(&current->thread.fpu.soft.fcr31))

Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000333static inline unsigned ieee754_getrm(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334{
335 return (ieee754_csr.rm);
336}
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000337static inline unsigned ieee754_setrm(unsigned rm)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338{
339 return (ieee754_csr.rm = rm);
340}
341
342/*
343 * get current exceptions
344 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000345static inline unsigned ieee754_getcx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346{
347 return (ieee754_csr.cx);
348}
349
350/* test for current exception condition
351 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000352static inline int ieee754_cxtest(unsigned n)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353{
354 return (ieee754_csr.cx & n);
355}
356
357/*
358 * get sticky exceptions
359 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000360static inline unsigned ieee754_getsx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361{
362 return (ieee754_csr.sx);
363}
364
365/* clear sticky conditions
366*/
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000367static inline unsigned ieee754_clrsx(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700368{
369 return (ieee754_csr.sx = 0);
370}
371
372/* test for sticky exception condition
373 */
Ralf Baechlecd21dfc2005-04-28 13:39:10 +0000374static inline int ieee754_sxtest(unsigned n)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700375{
376 return (ieee754_csr.sx & n);
377}
378
379/* debugging */
380ieee754sp ieee754sp_dump(char *s, ieee754sp x);
381ieee754dp ieee754dp_dump(char *s, ieee754dp x);
382
/*
 * Indices into the special-value tables.  Where a constant exists in both
 * signs, the negative one is numbered directly after the positive one.
 */
#define IEEE754_SPCVAL_PZERO		0
#define IEEE754_SPCVAL_NZERO		1
#define IEEE754_SPCVAL_PONE		2
#define IEEE754_SPCVAL_NONE		3
#define IEEE754_SPCVAL_PTEN		4
#define IEEE754_SPCVAL_NTEN		5
#define IEEE754_SPCVAL_PINFINITY	6
#define IEEE754_SPCVAL_NINFINITY	7
#define IEEE754_SPCVAL_INDEF		8
#define IEEE754_SPCVAL_PMAX		9	/* +max norm */
#define IEEE754_SPCVAL_NMAX		10	/* -max norm */
#define IEEE754_SPCVAL_PMIN		11	/* +min norm */
#define IEEE754_SPCVAL_NMIN		12	/* -min norm */
#define IEEE754_SPCVAL_PMIND		13	/* +min denorm */
#define IEEE754_SPCVAL_NMIND		14	/* -min denorm */
#define IEEE754_SPCVAL_P1E31		15	/* + 1.0e31 */
#define IEEE754_SPCVAL_P1E63		16	/* + 1.0e63 */

401extern const struct ieee754dp_konst __ieee754dp_spcvals[];
402extern const struct ieee754sp_konst __ieee754sp_spcvals[];
403#define ieee754dp_spcvals ((const ieee754dp *)__ieee754dp_spcvals)
404#define ieee754sp_spcvals ((const ieee754sp *)__ieee754sp_spcvals)
405
/*
 * Double precision special values.
 *
 * For the macros taking sn, sn is added to the index of the positive
 * constant, so sn == 0 selects the positive value and sn == 1 the negative
 * one.  indef, 1e31 and 1e63 exist in one form only.
 */
#define ieee754dp_inf(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754dp_zero(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754dp_one(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754dp_ten(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754dp_indef()	(ieee754dp_spcvals[IEEE754_SPCVAL_INDEF])
#define ieee754dp_max(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754dp_min(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754dp_mind(sn)	(ieee754dp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754dp_1e31()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754dp_1e63()	(ieee754dp_spcvals[IEEE754_SPCVAL_P1E63])

/*
 * Single precision special values.
 *
 * For the macros taking sn, sn is added to the index of the positive
 * constant, so sn == 0 selects the positive value and sn == 1 the negative
 * one.  indef, 1e31 and 1e63 exist in one form only.
 */
#define ieee754sp_inf(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PINFINITY+(sn)])
#define ieee754sp_zero(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PZERO+(sn)])
#define ieee754sp_one(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PONE+(sn)])
#define ieee754sp_ten(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PTEN+(sn)])
#define ieee754sp_indef()	(ieee754sp_spcvals[IEEE754_SPCVAL_INDEF])
#define ieee754sp_max(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMAX+(sn)])
#define ieee754sp_min(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIN+(sn)])
#define ieee754sp_mind(sn)	(ieee754sp_spcvals[IEEE754_SPCVAL_PMIND+(sn)])
#define ieee754sp_1e31()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E31])
#define ieee754sp_1e63()	(ieee754sp_spcvals[IEEE754_SPCVAL_P1E63])

/*
 * Indefinite integer value
 *
 * Both are the largest positive value of their type: INT_MAX for the
 * 32-bit case, and for the 64-bit case LONG_LONG_MAX when the
 * environment defines it, otherwise all ones shifted right by one.
 */
#define ieee754si_indef()	INT_MAX
#ifdef LONG_LONG_MAX
#define ieee754di_indef()	LONG_LONG_MAX
#else
#define ieee754di_indef()	((s64)(~0ULL>>1))
#endif

441/* IEEE exception context, passed to handler */
442struct ieee754xctx {
443 const char *op; /* operation name */
444 int rt; /* result type */
445 union {
446 ieee754sp sp; /* single precision */
447 ieee754dp dp; /* double precision */
448#ifdef IEEE854_XP
449 ieee754xp xp; /* extended precision */
450#endif
451 int si; /* standard signed integer (32bits) */
452 s64 di; /* extended signed integer (64bits) */
453 } rv; /* default result format implied by op */
454 va_list ap;
455};
456
/* result types for xctx.rt */
#define IEEE754_RT_SP	0
#define IEEE754_RT_DP	1
#define IEEE754_RT_XP	2
#define IEEE754_RT_SI	3
#define IEEE754_RT_DI	4

/* exception handler entry point; receives the context described by struct ieee754xctx */
extern void ieee754_xcpt(struct ieee754xctx *xcp);

/* compat: older "fix" names forwarded to the *_tint() conversions */
#define ieee754dp_fix(x)	ieee754dp_tint(x)
#define ieee754sp_fix(x)	ieee754sp_tint(x)