Blame - arch/mips/math-emu/ieee754dp.c - kernel/msm-4.9

blob: ad3c73436777f0c3103c887827c4547d888f5941 [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/* IEEE754 floating point arithmetic
				2	* double precision: common utilities
				3	*/
				4	/*
				5	* MIPS floating point support
				6	* Copyright (C) 1994-2000 Algorithmics Ltd.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	7	*
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	8	* This program is free software; you can distribute it and/or modify it
				9	* under the terms of the GNU General Public License (Version 2) as
				10	* published by the Free Software Foundation.
				11	*
				12	* This program is distributed in the hope it will be useful, but WITHOUT
				13	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
				14	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
				15	* for more details.
				16	*
				17	* You should have received a copy of the GNU General Public License along
				18	* with this program; if not, write to the Free Software Foundation, Inc.,
Ralf Baechle	3f7cac4	2014-04-26 01:49:14 +0200	[diff] [blame]	19	* 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	20	*/
				21
Ralf Baechle	cae5506	2014-04-16 00:47:59 +0200	[diff] [blame]	22	#include <linux/compiler.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	23
				24	#include "ieee754dp.h"
				25
Ralf Baechle	2209bcb	2014-04-16 01:31:11 +0200	[diff] [blame]	26	int ieee754dp_class(union ieee754dp x)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	27	{
				28	COMPXDP;
				29	EXPLODEXDP;
				30	return xc;
				31	}
				32
Maciej W. Rozycki	e06b530	2015-04-03 23:25:57 +0100	[diff] [blame]	33	static inline int ieee754dp_isnan(union ieee754dp x)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	34	{
Maciej W. Rozycki	c9a1084	2015-04-03 23:25:38 +0100	[diff] [blame]	35	return ieee754_class_nan(ieee754dp_class(x));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	36	}
				37
Ralf Baechle	f71baa1	2014-04-25 00:40:42 +0200	[diff] [blame]	38	static inline int ieee754dp_issnan(union ieee754dp x)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	39	{
Maciej W. Rozycki	90d53a9	2015-11-13 00:47:28 +0000	[diff] [blame]	40	int qbit;
				41
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	42	assert(ieee754dp_isnan(x));
Maciej W. Rozycki	90d53a9	2015-11-13 00:47:28 +0000	[diff] [blame]	43	qbit = (DPMANT(x) & DP_MBIT(DP_FBITS - 1)) == DP_MBIT(DP_FBITS - 1);
				44	return ieee754_csr.nan2008 ^ qbit;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	45	}
				46
				47
Maciej W. Rozycki	d5afa7e	2015-04-03 23:25:34 +0100	[diff] [blame]	48	/*
				49	* Raise the Invalid Operation IEEE 754 exception
				50	* and convert the signaling NaN supplied to a quiet NaN.
				51	*/
Ralf Baechle	90efba3	2014-04-25 03:19:57 +0200	[diff] [blame]	52	union ieee754dp __cold ieee754dp_nanxcpt(union ieee754dp r)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	53	{
Maciej W. Rozycki	d5afa7e	2015-04-03 23:25:34 +0100	[diff] [blame]	54	assert(ieee754dp_issnan(r));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	55
Maciej W. Rozycki	d5afa7e	2015-04-03 23:25:34 +0100	[diff] [blame]	56	ieee754_setcx(IEEE754_INVALID_OPERATION);
Maciej W. Rozycki	90d53a9	2015-11-13 00:47:28 +0000	[diff] [blame]	57	if (ieee754_csr.nan2008)
				58	DPMANT(r) \|= DP_MBIT(DP_FBITS - 1);
				59	else
				60	r = ieee754dp_indef();
				61
				62	return r;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	63	}
				64
Ralf Baechle	de2fc34	2014-04-25 10:54:06 +0200	[diff] [blame]	65	static u64 ieee754dp_get_rounding(int sn, u64 xm)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	66	{
				67	/* inexact must round of 3 bits
				68	*/
				69	if (xm & (DP_MBIT(3) - 1)) {
				70	switch (ieee754_csr.rm) {
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	71	case FPU_CSR_RZ:
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	72	break;
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	73	case FPU_CSR_RN:
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	74	xm += 0x3 + ((xm >> 3) & 1);
				75	/* xm += (xm&0x8)?0x4:0x3 */
				76	break;
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	77	case FPU_CSR_RU: /* toward +Infinity */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	78	if (!sn) /* ?? */
				79	xm += 0x8;
				80	break;
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	81	case FPU_CSR_RD: /* toward -Infinity */
Ralf Baechle	7034228	2013-01-22 12:59:30 +0100	[diff] [blame]	82	if (sn) /* ?? */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	83	xm += 0x8;
				84	break;
				85	}
				86	}
				87	return xm;
				88	}
				89
				90
				91	/* generate a normal/denormal number with over,under handling
				92	* sn is sign
				93	* xe is an unbiased exponent
				94	* xm is 3bit extended precision value.
				95	*/
Ralf Baechle	2209bcb	2014-04-16 01:31:11 +0200	[diff] [blame]	96	union ieee754dp ieee754dp_format(int sn, int xe, u64 xm)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	97	{
				98	assert(xm); /* we don't gen exact zeros (probably should) */
				99
Ralf Baechle	ad8fb55	2014-04-22 15:51:55 +0200	[diff] [blame]	100	assert((xm >> (DP_FBITS + 1 + 3)) == 0); /* no execess */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	101	assert(xm & (DP_HIDDEN_BIT << 3));
				102
				103	if (xe < DP_EMIN) {
				104	/* strip lower bits */
				105	int es = DP_EMIN - xe;
				106
				107	if (ieee754_csr.nod) {
Ralf Baechle	9e8bad1	2014-04-19 00:36:32 +0200	[diff] [blame]	108	ieee754_setcx(IEEE754_UNDERFLOW);
				109	ieee754_setcx(IEEE754_INEXACT);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	110
				111	switch(ieee754_csr.rm) {
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	112	case FPU_CSR_RN:
				113	case FPU_CSR_RZ:
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	114	return ieee754dp_zero(sn);
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	115	case FPU_CSR_RU: /* toward +Infinity */
Ralf Baechle	47fa0c0	2014-04-16 11:00:12 +0200	[diff] [blame]	116	if (sn == 0)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	117	return ieee754dp_min(0);
				118	else
				119	return ieee754dp_zero(1);
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	120	case FPU_CSR_RD: /* toward -Infinity */
Ralf Baechle	47fa0c0	2014-04-16 11:00:12 +0200	[diff] [blame]	121	if (sn == 0)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	122	return ieee754dp_zero(0);
				123	else
				124	return ieee754dp_min(1);
				125	}
				126	}
				127
Ralf Baechle	de2fc34	2014-04-25 10:54:06 +0200	[diff] [blame]	128	if (xe == DP_EMIN - 1 &&
				129	ieee754dp_get_rounding(sn, xm) >> (DP_FBITS + 1 + 3))
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	130	{
				131	/* Not tiny after rounding */
Ralf Baechle	9e8bad1	2014-04-19 00:36:32 +0200	[diff] [blame]	132	ieee754_setcx(IEEE754_INEXACT);
Ralf Baechle	de2fc34	2014-04-25 10:54:06 +0200	[diff] [blame]	133	xm = ieee754dp_get_rounding(sn, xm);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	134	xm >>= 1;
				135	/* Clear grs bits */
				136	xm &= ~(DP_MBIT(3) - 1);
				137	xe++;
				138	}
				139	else {
				140	/* sticky right shift es bits
				141	*/
				142	xm = XDPSRS(xm, es);
				143	xe += es;
				144	assert((xm & (DP_HIDDEN_BIT << 3)) == 0);
				145	assert(xe == DP_EMIN);
				146	}
				147	}
				148	if (xm & (DP_MBIT(3) - 1)) {
Ralf Baechle	9e8bad1	2014-04-19 00:36:32 +0200	[diff] [blame]	149	ieee754_setcx(IEEE754_INEXACT);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	150	if ((xm & (DP_HIDDEN_BIT << 3)) == 0) {
Ralf Baechle	9e8bad1	2014-04-19 00:36:32 +0200	[diff] [blame]	151	ieee754_setcx(IEEE754_UNDERFLOW);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	152	}
				153
				154	/* inexact must round of 3 bits
				155	*/
Ralf Baechle	de2fc34	2014-04-25 10:54:06 +0200	[diff] [blame]	156	xm = ieee754dp_get_rounding(sn, xm);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	157	/* adjust exponent for rounding add overflowing
				158	*/
Ralf Baechle	ad8fb55	2014-04-22 15:51:55 +0200	[diff] [blame]	159	if (xm >> (DP_FBITS + 3 + 1)) {
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	160	/* add causes mantissa overflow */
				161	xm >>= 1;
				162	xe++;
				163	}
				164	}
				165	/* strip grs bits */
				166	xm >>= 3;
				167
Ralf Baechle	ad8fb55	2014-04-22 15:51:55 +0200	[diff] [blame]	168	assert((xm >> (DP_FBITS + 1)) == 0); /* no execess */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	169	assert(xe >= DP_EMIN);
				170
				171	if (xe > DP_EMAX) {
Ralf Baechle	9e8bad1	2014-04-19 00:36:32 +0200	[diff] [blame]	172	ieee754_setcx(IEEE754_OVERFLOW);
				173	ieee754_setcx(IEEE754_INEXACT);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	174	/* -O can be table indexed by (rm,sn) */
				175	switch (ieee754_csr.rm) {
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	176	case FPU_CSR_RN:
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	177	return ieee754dp_inf(sn);
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	178	case FPU_CSR_RZ:
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	179	return ieee754dp_max(sn);
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	180	case FPU_CSR_RU: /* toward +Infinity */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	181	if (sn == 0)
				182	return ieee754dp_inf(0);
				183	else
				184	return ieee754dp_max(1);
Ralf Baechle	56a6473	2014-04-30 11:21:55 +0200	[diff] [blame]	185	case FPU_CSR_RD: /* toward -Infinity */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	186	if (sn == 0)
				187	return ieee754dp_max(0);
				188	else
				189	return ieee754dp_inf(1);
				190	}
				191	}
				192	/* gen norm/denorm/zero */
				193
				194	if ((xm & DP_HIDDEN_BIT) == 0) {
				195	/* we underflow (tiny/zero) */
				196	assert(xe == DP_EMIN);
				197	if (ieee754_csr.mx & IEEE754_UNDERFLOW)
Ralf Baechle	9e8bad1	2014-04-19 00:36:32 +0200	[diff] [blame]	198	ieee754_setcx(IEEE754_UNDERFLOW);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	199	return builddp(sn, DP_EMIN - 1 + DP_EBIAS, xm);
				200	} else {
Ralf Baechle	ad8fb55	2014-04-22 15:51:55 +0200	[diff] [blame]	201	assert((xm >> (DP_FBITS + 1)) == 0); /* no execess */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	202	assert(xm & DP_HIDDEN_BIT);
				203
				204	return builddp(sn, xe + DP_EBIAS, xm & ~DP_HIDDEN_BIT);
				205	}
				206	}