blob: ef307c9d01f54f762b559675f903800fffab442a [file] [log] [blame]
// SwiftShader Software Renderer
//
// Copyright(c) 2005-2012 TransGaming Inc.
//
// All rights reserved. No part of this software may be copied, distributed, transmitted,
// transcribed, stored in a retrieval system, translated into any human or computer
// language by any means, or disclosed to third parties without the explicit written
// agreement of TransGaming Inc. Without such an agreement, no rights or licenses, express
// or implied, including but not limited to any patent rights, are granted to you.
//
#ifndef sw_Math_hpp
#define sw_Math_hpp
#include "Types.hpp"
#include <cmath>
#if defined(_MSC_VER)
#include <intrin.h>
#endif
namespace sw
{
using std::abs;
#undef min
#undef max
template<class T>
inline T max(T a, T b)
{
return a > b ? a : b;
}
template<class T>
inline T min(T a, T b)
{
return a < b ? a : b;
}
template<class T>
inline T max(T a, T b, T c)
{
return max(max(a, b), c);
}
template<class T>
inline T min(T a, T b, T c)
{
return min(min(a, b), c);
}
template<class T>
inline T max(T a, T b, T c, T d)
{
return max(max(a, b), max(c, d));
}
template<class T>
inline T min(T a, T b, T c, T d)
{
return min(min(a, b), min(c, d));
}
template<class T>
inline void swap(T &a, T &b)
{
T t = a;
a = b;
b = t;
}
inline int iround(float x)
{
return (int)floor(x + 0.5f);
// return _mm_cvtss_si32(_mm_load_ss(&x)); // FIXME: Demands SSE support
}
inline int ifloor(float x)
{
return (int)floor(x);
}
inline int ceilFix4(int x)
{
return (x + 0xF) & 0xFFFFFFF0;
}
inline int ceilInt4(int x)
{
return (x + 0xF) >> 4;
}
#define BITS(x) ( \
!!(x & 0x80000000) + \
!!(x & 0xC0000000) + \
!!(x & 0xE0000000) + \
!!(x & 0xF0000000) + \
!!(x & 0xF8000000) + \
!!(x & 0xFC000000) + \
!!(x & 0xFE000000) + \
!!(x & 0xFF000000) + \
!!(x & 0xFF800000) + \
!!(x & 0xFFC00000) + \
!!(x & 0xFFE00000) + \
!!(x & 0xFFF00000) + \
!!(x & 0xFFF80000) + \
!!(x & 0xFFFC0000) + \
!!(x & 0xFFFE0000) + \
!!(x & 0xFFFF0000) + \
!!(x & 0xFFFF8000) + \
!!(x & 0xFFFFC000) + \
!!(x & 0xFFFFE000) + \
!!(x & 0xFFFFF000) + \
!!(x & 0xFFFFF800) + \
!!(x & 0xFFFFFC00) + \
!!(x & 0xFFFFFE00) + \
!!(x & 0xFFFFFF00) + \
!!(x & 0xFFFFFF80) + \
!!(x & 0xFFFFFFC0) + \
!!(x & 0xFFFFFFE0) + \
!!(x & 0xFFFFFFF0) + \
!!(x & 0xFFFFFFF8) + \
!!(x & 0xFFFFFFFC) + \
!!(x & 0xFFFFFFFE) + \
!!(x & 0xFFFFFFFF))
inline float exp2(float x)
{
return exp2f(x);
}
inline int exp2(int x)
{
return 1 << x;
}
inline unsigned long log2(int x)
{
#if defined(_MSC_VER)
unsigned long y;
_BitScanReverse(&y, x);
return y;
#else
return 31 - __builtin_clz(x);
#endif
}
inline int ilog2(float x)
{
unsigned int y = *(unsigned int*)&x;
return ((y & 0x7F800000) >> 23) - 127;
}
inline float log2(float x)
{
unsigned int y = (*(unsigned int*)&x);
return (float)((y & 0x7F800000) >> 23) - 127 + (float)((*(unsigned int*)&x) & 0x007FFFFF) / 16777216.0f;
}
inline bool isPow2(int x)
{
return (x & -x) == x;
}
template<class T>
inline T clamp(T x, T a, T b)
{
if(x < a) x = a;
if(x > b) x = b;
return x;
}
inline int ceilPow2(int x)
{
int i = 1;
while(i < x)
{
i <<= 1;
}
return i;
}
inline int floorDiv(int a, int b)
{
return a / b + ((a % b) >> 31);
}
inline int floorMod(int a, int b)
{
int r = a % b;
return r + ((r >> 31) & b);
}
inline int ceilDiv(int a, int b)
{
return a / b - (-(a % b) >> 31);
}
inline int ceilMod(int a, int b)
{
int r = a % b;
return r - ((-r >> 31) & b);
}
template<const int n>
inline unsigned int unorm(float x)
{
static const unsigned int max = 0xFFFFFFFF >> (32 - n);
static const float maxf = static_cast<float>(max);
if(x >= 1.0f)
{
return max;
}
else if(x <= 0.0f)
{
return 0;
}
else
{
return static_cast<unsigned int>(maxf * x + 0.5f);
}
}
template<const int n>
inline int snorm(float x)
{
static const unsigned int min = 0x80000000 >> (32 - n);
static const unsigned int max = 0xFFFFFFFF >> (32 - n + 1);
static const float maxf = static_cast<float>(max);
static const unsigned int range = 0xFFFFFFFF >> (32 - n);
if(x >= 0.0f)
{
if(x >= 1.0f)
{
return max;
}
else
{
return static_cast<int>(maxf * x + 0.5f);
}
}
else
{
if(x <= -1.0f)
{
return min;
}
else
{
return static_cast<int>(maxf * x - 0.5f) & range;
}
}
}
template<const int n>
inline unsigned int ucast(float x)
{
static const unsigned int max = 0xFFFFFFFF >> (32 - n);
static const float maxf = static_cast<float>(max);
if(x >= maxf)
{
return max;
}
else if(x <= 0.0f)
{
return 0;
}
else
{
return static_cast<unsigned int>(x + 0.5f);
}
}
template<const int n>
inline int scast(float x)
{
static const unsigned int min = 0x80000000 >> (32 - n);
static const unsigned int max = 0xFFFFFFFF >> (32 - n + 1);
static const float maxf = static_cast<float>(max);
static const unsigned int range = 0xFFFFFFFF >> (32 - n);
if(x > 0.0f)
{
if(x >= maxf)
{
return max;
}
else
{
return static_cast<int>(maxf * x + 0.5f);
}
}
else
{
if(x <= -1.0f)
{
return min;
}
else
{
return static_cast<int>(maxf * x - 0.5f) & range;
}
}
}
inline float sRGBtoLinear(float c)
{
if(c <= 0.04045f)
{
return c * 0.07739938f; // 1.0f / 12.92f;
}
else
{
return powf((c + 0.055f) * 0.9478673f, 2.4f); // 1.0f / 1.055f
}
}
inline float linearToSRGB(float c)
{
if(c <= 0.0031308f)
{
return c * 12.92f;
}
else
{
return 1.055f * powf(c, 0.4166667f) - 0.055f; // 1.0f / 2.4f
}
}
unsigned char sRGB8toLinear8(unsigned char value);
uint64_t FNV_1a(const unsigned char *data, int size); // Fowler-Noll-Vo hash function
// Round up to the next multiple of alignment
inline unsigned int align(unsigned int value, unsigned int alignment)
{
return ((value + alignment - 1) / alignment) * alignment;
}
class RGB9E5Data
{
unsigned int R : 9;
unsigned int G : 9;
unsigned int B : 9;
unsigned int E : 5;
public:
void toRGBFloats(float* rgb) const
{
static const float Offset = -24.0f; // Exponent Bias (15) + Number of mantissa bits per component (9) = 24
const float factor = powf(2.0f, static_cast<float>(E) + Offset);
rgb[0] = static_cast<float>(R) * factor;
rgb[1] = static_cast<float>(G) * factor;
rgb[2] = static_cast<float>(B) * factor;
}
};
class R11G11B10FData
{
unsigned int R : 11;
unsigned int G : 11;
unsigned int B : 10;
static inline float float11ToFloat32(unsigned short fp11)
{
unsigned short exponent = (fp11 >> 6) & 0x1F;
unsigned short mantissa = fp11 & 0x3F;
unsigned int output;
if(exponent == 0x1F)
{
// INF or NAN
output = 0x7f800000 | (mantissa << 17);
}
else
{
if(exponent != 0)
{
// normalized
}
else if(mantissa != 0)
{
// The value is denormalized
exponent = 1;
do
{
exponent--;
mantissa <<= 1;
} while((mantissa & 0x40) == 0);
mantissa = mantissa & 0x3F;
}
else // The value is zero
{
exponent = static_cast<unsigned short>(-112);
}
output = ((exponent + 112) << 23) | (mantissa << 17);
}
return *(float*)(&output);
}
static inline float float10ToFloat32(unsigned short fp10)
{
unsigned short exponent = (fp10 >> 5) & 0x1F;
unsigned short mantissa = fp10 & 0x1F;
unsigned int output;
if(exponent == 0x1F)
{
// INF or NAN
output = 0x7f800000 | (mantissa << 17);
}
else
{
if(exponent != 0)
{
// normalized
}
else if(mantissa != 0)
{
// The value is denormalized
exponent = 1;
do
{
exponent--;
mantissa <<= 1;
} while((mantissa & 0x20) == 0);
mantissa = mantissa & 0x1F;
}
else // The value is zero
{
exponent = static_cast<unsigned short>(-112);
}
output = ((exponent + 112) << 23) | (mantissa << 18);
}
return *(float*)(&output);
}
public:
void toRGBFloats(float* rgb) const
{
rgb[0] = float11ToFloat32(R);
rgb[1] = float11ToFloat32(G);
rgb[2] = float10ToFloat32(B);
}
};
}
#endif // sw_Math_hpp