Blame - src/util/rounding.h - platform/external/mesa3d

blob: 7b5608b8a7844dc7f9b09381dec1a2ab1baa3665 [file] [log] [blame]

Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	1	/*
				2	* Copyright © 2015 Intel Corporation
				3	*
				4	* Permission is hereby granted, free of charge, to any person obtaining a
				5	* copy of this software and associated documentation files (the "Software"),
				6	* to deal in the Software without restriction, including without limitation
				7	* the rights to use, copy, modify, merge, publish, distribute, sublicense,
				8	* and/or sell copies of the Software, and to permit persons to whom the
				9	* Software is furnished to do so, subject to the following conditions:
				10	*
				11	* The above copyright notice and this permission notice (including the next
				12	* paragraph) shall be included in all copies or substantial portions of the
				13	* Software.
				14	*
				15	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				16	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				17	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
				18	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				19	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
				20	* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
				21	* IN THE SOFTWARE.
				22	*/
				23
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	24	#ifndef _ROUNDING_H
				25	#define _ROUNDING_H
				26
Jose Fonseca	497a22a	2015-08-09 11:55:28 +0100	[diff] [blame]	27	#include "c99_compat.h" // inline
				28
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	29	#include <math.h>
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	30	#include <limits.h>
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame^]	31	#include <stdint.h>
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	32
				33	#ifdef __x86_64__
				34	#include <xmmintrin.h>
				35	#include <emmintrin.h>
				36	#endif
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	37
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	38	#ifdef __SSE4_1__
				39	#include <smmintrin.h>
				40	#endif
				41
/* The C standard library has functions rint()/nearbyint() that round their
 * arguments according to the rounding mode set in the floating-point control
 * register, and round(), which always rounds halfway cases away from zero
 * regardless of that mode. While there are trunc()/ceil()/floor() functions
 * that do a specific operation without modifying the rounding mode, there is
 * no roundeven() in any version of C.
				47	*
				48	* Technical Specification 18661 (ISO/IEC TS 18661-1:2014) adds roundeven(),
				49	* but it's unfortunately not implemented by glibc.
				50	*
				51	* This implementation differs in that it does not raise the inexact exception.
				52	*
				53	* We use rint() to implement these functions, with the assumption that the
				54	* floating-point rounding mode has not been changed from the default Round
				55	* to Nearest.
				56	*/
				57
				58	/**
				59	* \brief Rounds \c x to the nearest integer, with ties to the even integer.
				60	*/
				61	static inline float
				62	_mesa_roundevenf(float x)
				63	{
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	64	#ifdef __SSE4_1__
				65	float ret;
				66	__m128 m = _mm_load_ss(&x);
				67	m = _mm_round_ss(m, m, _MM_FROUND_CUR_DIRECTION \| _MM_FROUND_NO_EXC);
				68	_mm_store_ss(&ret, m);
				69	return ret;
				70	#else
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	71	return rintf(x);
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	72	#endif
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	73	}
				74
				75	/**
				76	* \brief Rounds \c x to the nearest integer, with ties to the even integer.
				77	*/
				78	static inline double
				79	_mesa_roundeven(double x)
				80	{
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	81	#ifdef __SSE4_1__
				82	double ret;
				83	__m128d m = _mm_load_sd(&x);
				84	m = _mm_round_sd(m, m, _MM_FROUND_CUR_DIRECTION \| _MM_FROUND_NO_EXC);
				85	_mm_store_sd(&ret, m);
				86	return ret;
				87	#else
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	88	return rint(x);
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	89	#endif
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	90	}
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	91
				92	/**
				93	* \brief Rounds \c x to the nearest integer, with ties to the even integer,
				94	* and returns the value as a long int.
				95	*/
				96	static inline long
				97	_mesa_lroundevenf(float x)
				98	{
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	99	#ifdef __x86_64__
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame^]	100	#if LONG_MAX == INT64_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	101	return _mm_cvtss_si64(_mm_load_ss(&x));
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame^]	102	#elif LONG_MAX == INT32_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	103	return _mm_cvtss_si32(_mm_load_ss(&x));
Jose Fonseca	21ccdbd	2015-08-09 11:25:41 +0100	[diff] [blame]	104	#else
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame^]	105	#error "Unsupported long size"
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	106	#endif
				107	#else
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	108	return lrintf(x);
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	109	#endif
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	110	}
				111
				112	/**
				113	* \brief Rounds \c x to the nearest integer, with ties to the even integer,
				114	* and returns the value as a long int.
				115	*/
				116	static inline long
				117	_mesa_lroundeven(double x)
				118	{
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	119	#ifdef __x86_64__
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame^]	120	#if LONG_MAX == INT64_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	121	return _mm_cvtsd_si64(_mm_load_sd(&x));
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame^]	122	#elif LONG_MAX == INT32_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	123	return _mm_cvtsd_si32(_mm_load_sd(&x));
Jose Fonseca	21ccdbd	2015-08-09 11:25:41 +0100	[diff] [blame]	124	#else
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame^]	125	#error "Unsupported long size"
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	126	#endif
				127	#else
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	128	return lrint(x);
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	129	#endif
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	130	}
				131
				132	#endif