Blame - src/util/rounding.h - platform/external/mesa3d

blob: afb38fbdb56b31188b50529a8f8006e12188329c [file] [log] [blame]

Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	1	/*
				2	* Copyright © 2015 Intel Corporation
				3	*
				4	* Permission is hereby granted, free of charge, to any person obtaining a
				5	* copy of this software and associated documentation files (the "Software"),
				6	* to deal in the Software without restriction, including without limitation
				7	* the rights to use, copy, modify, merge, publish, distribute, sublicense,
				8	* and/or sell copies of the Software, and to permit persons to whom the
				9	* Software is furnished to do so, subject to the following conditions:
				10	*
				11	* The above copyright notice and this permission notice (including the next
				12	* paragraph) shall be included in all copies or substantial portions of the
				13	* Software.
				14	*
				15	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				16	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				17	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
				18	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				19	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
				20	* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
				21	* IN THE SOFTWARE.
				22	*/
				23
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	24	#ifndef _ROUNDING_H
				25	#define _ROUNDING_H
				26
Roland Scheidegger	3f797ef	2015-08-19 04:17:36 +0200	[diff] [blame]	27	#include "c99_math.h"
Jose Fonseca	497a22a	2015-08-09 11:55:28 +0100	[diff] [blame]	28
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	29	#include <limits.h>
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame]	30	#include <stdint.h>
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	31
				32	#ifdef __x86_64__
				33	#include <xmmintrin.h>
				34	#include <emmintrin.h>
				35	#endif
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	36
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	37	#ifdef __SSE4_1__
				38	#include <smmintrin.h>
				39	#endif
				40
/* The C standard library has functions rint()/nearbyint() that round their
 * arguments according to the rounding mode set in the floating-point control
 * register, and round(), which always rounds halfway cases away from zero
 * regardless of that mode. While there are trunc()/ceil()/floor() functions
 * that do a specific operation without modifying the rounding mode, there is
 * no roundeven() in any version of C.
 *
 * Technical Specification 18661 (ISO/IEC TS 18661-1:2014) adds roundeven(),
 * but it's unfortunately not implemented by glibc.
 *
 * This implementation differs in that it does not raise the inexact exception.
 *
 * We use rint() to implement these functions, with the assumption that the
 * floating-point rounding mode has not been changed from the default Round
 * to Nearest.
 */
				56
				57	/**
				58	* \brief Rounds \c x to the nearest integer, with ties to the even integer.
				59	*/
				60	static inline float
				61	_mesa_roundevenf(float x)
				62	{
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	63	#ifdef __SSE4_1__
				64	float ret;
				65	__m128 m = _mm_load_ss(&x);
				66	m = _mm_round_ss(m, m, _MM_FROUND_CUR_DIRECTION \| _MM_FROUND_NO_EXC);
				67	_mm_store_ss(&ret, m);
				68	return ret;
				69	#else
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	70	return rintf(x);
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	71	#endif
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	72	}
				73
				74	/**
				75	* \brief Rounds \c x to the nearest integer, with ties to the even integer.
				76	*/
				77	static inline double
				78	_mesa_roundeven(double x)
				79	{
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	80	#ifdef __SSE4_1__
				81	double ret;
				82	__m128d m = _mm_load_sd(&x);
				83	m = _mm_round_sd(m, m, _MM_FROUND_CUR_DIRECTION \| _MM_FROUND_NO_EXC);
				84	_mm_store_sd(&ret, m);
				85	return ret;
				86	#else
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	87	return rint(x);
Matt Turner	036e347	2015-03-18 14:23:41 -0700	[diff] [blame]	88	#endif
Matt Turner	dd0d3a2	2015-03-10 17:55:21 -0700	[diff] [blame]	89	}
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	90
				91	/**
				92	* \brief Rounds \c x to the nearest integer, with ties to the even integer,
				93	* and returns the value as a long int.
				94	*/
				95	static inline long
				96	_mesa_lroundevenf(float x)
				97	{
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	98	#ifdef __x86_64__
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame]	99	#if LONG_MAX == INT64_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	100	return _mm_cvtss_si64(_mm_load_ss(&x));
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame]	101	#elif LONG_MAX == INT32_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	102	return _mm_cvtss_si32(_mm_load_ss(&x));
Jose Fonseca	21ccdbd	2015-08-09 11:25:41 +0100	[diff] [blame]	103	#else
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame]	104	#error "Unsupported long size"
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	105	#endif
				106	#else
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	107	return lrintf(x);
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	108	#endif
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	109	}
				110
				111	/**
				112	* \brief Rounds \c x to the nearest integer, with ties to the even integer,
				113	* and returns the value as a long int.
				114	*/
				115	static inline long
				116	_mesa_lroundeven(double x)
				117	{
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	118	#ifdef __x86_64__
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame]	119	#if LONG_MAX == INT64_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	120	return _mm_cvtsd_si64(_mm_load_sd(&x));
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame]	121	#elif LONG_MAX == INT32_MAX
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	122	return _mm_cvtsd_si32(_mm_load_sd(&x));
Jose Fonseca	21ccdbd	2015-08-09 11:25:41 +0100	[diff] [blame]	123	#else
Jose Fonseca	1eaa29c	2015-08-09 22:36:37 +0100	[diff] [blame]	124	#error "Unsupported long size"
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	125	#endif
				126	#else
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	127	return lrint(x);
Matt Turner	680de24	2015-06-29 09:38:34 -0700	[diff] [blame]	128	#endif
Matt Turner	594fc0f	2015-06-25 16:47:52 -0700	[diff] [blame]	129	}
				130
				131	#endif