blob: 69e7902d2ab2829901f8503a93dde0629bf1e9db [file] [log] [blame]
Jason Sams1b937f52010-06-09 14:26:16 -07001#ifndef __RS_CL_RSH__
2#define __RS_CL_RSH__
3
// Pi as a single-precision literal (note the 'f' suffix); used by the *pi,
// degrees and radians helpers in this header.
#define M_PI 3.14159265358979323846264338327950288f /* pi */
5
6
7// Conversions
/*
 * CVT_FUNC_2(typeout, typein)
 * Emits convert_<typeout>2, convert_<typeout>3 and convert_<typeout>4
 * overloads taking a <typein> vector of the same width. The result is
 * brace-initialized from the individual components of the argument.
 */
#define CVT_FUNC_2(typeout, typein) \
static typeout##2 __attribute__((overloadable)) convert_##typeout##2(typein##2 src) { \
    typeout##2 dst = {src.x, src.y}; \
    return dst; \
} \
static typeout##3 __attribute__((overloadable)) convert_##typeout##3(typein##3 src) { \
    typeout##3 dst = {src.x, src.y, src.z}; \
    return dst; \
} \
static typeout##4 __attribute__((overloadable)) convert_##typeout##4(typein##4 src) { \
    typeout##4 dst = {src.x, src.y, src.z, src.w}; \
    return dst; \
}
21
22#define CVT_FUNC(type) CVT_FUNC_2(type, uchar) \
23 CVT_FUNC_2(type, char) \
24 CVT_FUNC_2(type, ushort) \
25 CVT_FUNC_2(type, short) \
26 CVT_FUNC_2(type, int) \
27 CVT_FUNC_2(type, uint) \
28 CVT_FUNC_2(type, float)
29
30CVT_FUNC(char)
31CVT_FUNC(uchar)
32CVT_FUNC(short)
33CVT_FUNC(ushort)
34CVT_FUNC(int)
35CVT_FUNC(uint)
36CVT_FUNC(float)
37
38
39
Jason Sams22fa3712010-05-19 17:22:57 -070040// Float ops, 6.11.2
41
/*
 * DEF_FUNC_1(fnc)
 * Requires a scalar overload fnc(float) to be visible already. Defines the
 * float2, float3 and float4 overloads of fnc by calling the scalar overload
 * on each component in turn.
 */
#define DEF_FUNC_1(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 arg) { \
    float2 res; \
    res.x = fnc(arg.x); \
    res.y = fnc(arg.y); \
    return res; \
} \
static float3 __attribute__((overloadable)) fnc(float3 arg) { \
    float3 res; \
    res.x = fnc(arg.x); \
    res.y = fnc(arg.y); \
    res.z = fnc(arg.z); \
    return res; \
} \
static float4 __attribute__((overloadable)) fnc(float4 arg) { \
    float4 res; \
    res.x = fnc(arg.x); \
    res.y = fnc(arg.y); \
    res.z = fnc(arg.z); \
    res.w = fnc(arg.w); \
    return res; \
}
64
/*
 * DEF_FUNC_2(fnc)
 * Requires a scalar overload fnc(float, float) to be visible already.
 * Defines the float2, float3 and float4 overloads of fnc; component i of the
 * result is fnc(v1[i], v2[i]).
 *
 * Fix: the float4 overload previously paired v1.w with v2.z, so the last
 * lane of every 4-wide binary function used the wrong second operand.
 */
#define DEF_FUNC_2(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 v1, float2 v2) { \
    float2 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    return r; \
} \
static float3 __attribute__((overloadable)) fnc(float3 v1, float3 v2) { \
    float3 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    return r; \
} \
static float4 __attribute__((overloadable)) fnc(float4 v1, float4 v2) { \
    float4 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    r.w = fnc(v1.w, v2.w); \
    return r; \
}
87
/*
 * DEF_FUNC_2F(fnc)
 * Requires a scalar overload fnc(float, float) to be visible already.
 * Defines (floatN, float) overloads of fnc for N = 2, 3, 4: the same scalar
 * second argument is paired with every component of the vector.
 */
#define DEF_FUNC_2F(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 vec, float s) { \
    float2 res; \
    res.x = fnc(vec.x, s); \
    res.y = fnc(vec.y, s); \
    return res; \
} \
static float3 __attribute__((overloadable)) fnc(float3 vec, float s) { \
    float3 res; \
    res.x = fnc(vec.x, s); \
    res.y = fnc(vec.y, s); \
    res.z = fnc(vec.z, s); \
    return res; \
} \
static float4 __attribute__((overloadable)) fnc(float4 vec, float s) { \
    float4 res; \
    res.x = fnc(vec.x, s); \
    res.y = fnc(vec.y, s); \
    res.z = fnc(vec.z, s); \
    res.w = fnc(vec.w, s); \
    return res; \
}
110
111
Jason Sams22fa3712010-05-19 17:22:57 -0700112extern float __attribute__((overloadable)) acos(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700113DEF_FUNC_1(acos)
Jason Sams22fa3712010-05-19 17:22:57 -0700114
115extern float __attribute__((overloadable)) acosh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700116DEF_FUNC_1(acosh)
Jason Sams22fa3712010-05-19 17:22:57 -0700117
Jason Sams1b937f52010-06-09 14:26:16 -0700118static float __attribute__((overloadable)) acospi(float v) {
119 return acos(v) / M_PI;
120}
121DEF_FUNC_1(acospi)
Jason Sams22fa3712010-05-19 17:22:57 -0700122
123extern float __attribute__((overloadable)) asin(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700124DEF_FUNC_1(asin)
Jason Sams22fa3712010-05-19 17:22:57 -0700125
126extern float __attribute__((overloadable)) asinh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700127DEF_FUNC_1(asinh)
Jason Sams22fa3712010-05-19 17:22:57 -0700128
Jason Sams1b937f52010-06-09 14:26:16 -0700129static float __attribute__((overloadable)) asinpi(float v) {
130 return asin(v) / M_PI;
131}
132DEF_FUNC_1(asinpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700133
134extern float __attribute__((overloadable)) atan(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700135DEF_FUNC_1(atan)
Jason Sams22fa3712010-05-19 17:22:57 -0700136
137extern float __attribute__((overloadable)) atan2(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700138DEF_FUNC_2(atan2)
Jason Sams22fa3712010-05-19 17:22:57 -0700139
140extern float __attribute__((overloadable)) atanh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700141DEF_FUNC_1(atanh)
Jason Sams22fa3712010-05-19 17:22:57 -0700142
Jason Sams1b937f52010-06-09 14:26:16 -0700143static float __attribute__((overloadable)) atanpi(float v) {
144 return atan(v) / M_PI;
145}
146DEF_FUNC_1(atanpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700147
Jason Sams1b937f52010-06-09 14:26:16 -0700148static float __attribute__((overloadable)) atan2pi(float y, float x) {
149 return atan2(y, x) / M_PI;
150}
151DEF_FUNC_2(atan2pi)
Jason Sams22fa3712010-05-19 17:22:57 -0700152
153extern float __attribute__((overloadable)) cbrt(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700154DEF_FUNC_1(cbrt)
Jason Sams22fa3712010-05-19 17:22:57 -0700155
156extern float __attribute__((overloadable)) ceil(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700157DEF_FUNC_1(ceil)
Jason Sams22fa3712010-05-19 17:22:57 -0700158
159extern float __attribute__((overloadable)) copysign(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700160DEF_FUNC_2(copysign)
Jason Sams22fa3712010-05-19 17:22:57 -0700161
162extern float __attribute__((overloadable)) cos(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700163DEF_FUNC_1(cos)
Jason Sams22fa3712010-05-19 17:22:57 -0700164
165extern float __attribute__((overloadable)) cosh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700166DEF_FUNC_1(cosh)
Jason Sams22fa3712010-05-19 17:22:57 -0700167
Jason Sams1b937f52010-06-09 14:26:16 -0700168static float __attribute__((overloadable)) cospi(float v) {
169 return cos(v * M_PI);
170}
171DEF_FUNC_1(cospi)
Jason Sams22fa3712010-05-19 17:22:57 -0700172
173extern float __attribute__((overloadable)) erfc(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700174DEF_FUNC_1(erfc)
Jason Sams22fa3712010-05-19 17:22:57 -0700175
176extern float __attribute__((overloadable)) erf(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700177DEF_FUNC_1(erf)
Jason Sams22fa3712010-05-19 17:22:57 -0700178
179extern float __attribute__((overloadable)) exp(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700180DEF_FUNC_1(exp)
Jason Sams22fa3712010-05-19 17:22:57 -0700181
182extern float __attribute__((overloadable)) exp2(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700183DEF_FUNC_1(exp2)
Jason Sams22fa3712010-05-19 17:22:57 -0700184
Jason Sams1b937f52010-06-09 14:26:16 -0700185extern float __attribute__((overloadable)) pow(float, float);
186static float __attribute__((overloadable)) exp10(float v) {
187 return pow(10.f, v);
188}
189DEF_FUNC_1(exp10)
Jason Sams22fa3712010-05-19 17:22:57 -0700190
191extern float __attribute__((overloadable)) expm1(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700192DEF_FUNC_1(expm1)
Jason Sams22fa3712010-05-19 17:22:57 -0700193
194extern float __attribute__((overloadable)) fabs(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700195DEF_FUNC_1(fabs)
Jason Sams22fa3712010-05-19 17:22:57 -0700196
197extern float __attribute__((overloadable)) fdim(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700198DEF_FUNC_2(fdim)
Jason Sams22fa3712010-05-19 17:22:57 -0700199
200extern float __attribute__((overloadable)) floor(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700201DEF_FUNC_1(floor)
Jason Sams22fa3712010-05-19 17:22:57 -0700202
203extern float __attribute__((overloadable)) fma(float, float, float);
204extern float2 __attribute__((overloadable)) fma(float2, float2, float2);
205extern float3 __attribute__((overloadable)) fma(float3, float3, float3);
206extern float4 __attribute__((overloadable)) fma(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700207
208extern float __attribute__((overloadable)) fmax(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700209DEF_FUNC_2(fmax);
210DEF_FUNC_2F(fmax);
Jason Sams22fa3712010-05-19 17:22:57 -0700211
212extern float __attribute__((overloadable)) fmin(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700213DEF_FUNC_2(fmin);
214DEF_FUNC_2F(fmin);
Jason Sams22fa3712010-05-19 17:22:57 -0700215
216extern float __attribute__((overloadable)) fmod(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700217DEF_FUNC_2(fmod)
Jason Sams22fa3712010-05-19 17:22:57 -0700218
// Splits v into floor(v) and the remaining fraction.
//   v     value to split
//   iptr  receives floor(v)
// Returns v - floor(v), capped at 0x1.fffffep-1f (the largest float below 1).
//
// floor(v) is kept as a float: the earlier round trip through int overflowed
// for magnitudes beyond the int range and produced a bogus integral part.
static float __attribute__((overloadable)) fract(float v, float *iptr) {
    const float whole = floor(v);
    *iptr = whole;
    return fmin(v - whole, 0x1.fffffep-1f);
}
224static float2 __attribute__((overloadable)) fract(float2 v, float2 *iptr) {
225 float t[2];
226 float2 r;
227 r.x = fract(v.x, &t[0]);
228 r.y = fract(v.y, &t[1]);
229 iptr[0] = t[0];
230 iptr[1] = t[1];
231 return r;
232}
233static float3 __attribute__((overloadable)) fract(float3 v, float3 *iptr) {
234 float t[3];
235 float3 r;
236 r.x = fract(v.x, &t[0]);
237 r.y = fract(v.y, &t[1]);
238 r.z = fract(v.z, &t[2]);
239 iptr[0] = t[0];
240 iptr[1] = t[1];
241 iptr[2] = t[2];
242 return r;
243}
244static float4 __attribute__((overloadable)) fract(float4 v, float4 *iptr) {
245 float t[4];
246 float4 r;
247 r.x = fract(v.x, &t[0]);
248 r.y = fract(v.y, &t[1]);
249 r.z = fract(v.z, &t[2]);
250 r.w = fract(v.w, &t[3]);
251 iptr[0] = t[0];
252 iptr[1] = t[1];
253 iptr[2] = t[2];
254 iptr[3] = t[3];
255 return r;
256}
Jason Sams22fa3712010-05-19 17:22:57 -0700257
258extern float __attribute__((overloadable)) frexp(float, float *);
259extern float2 __attribute__((overloadable)) frexp(float2, float2 *);
260extern float3 __attribute__((overloadable)) frexp(float3, float3 *);
261extern float4 __attribute__((overloadable)) frexp(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700262
263extern float __attribute__((overloadable)) hypot(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700264DEF_FUNC_2(hypot)
Jason Sams22fa3712010-05-19 17:22:57 -0700265
266extern int __attribute__((overloadable)) ilogb(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700267DEF_FUNC_1(ilogb)
Jason Sams22fa3712010-05-19 17:22:57 -0700268
269extern float __attribute__((overloadable)) ldexp(float, int);
270extern float2 __attribute__((overloadable)) ldexp(float2, int2);
271extern float3 __attribute__((overloadable)) ldexp(float3, int3);
272extern float4 __attribute__((overloadable)) ldexp(float4, int4);
Jason Sams22fa3712010-05-19 17:22:57 -0700273extern float2 __attribute__((overloadable)) ldexp(float2, int);
274extern float3 __attribute__((overloadable)) ldexp(float3, int);
275extern float4 __attribute__((overloadable)) ldexp(float4, int);
Jason Sams22fa3712010-05-19 17:22:57 -0700276
277extern float __attribute__((overloadable)) lgamma(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700278DEF_FUNC_1(lgamma)
Jason Sams22fa3712010-05-19 17:22:57 -0700279extern float __attribute__((overloadable)) lgamma(float, float *);
280extern float2 __attribute__((overloadable)) lgamma(float2, float2 *);
281extern float3 __attribute__((overloadable)) lgamma(float3, float3 *);
282extern float4 __attribute__((overloadable)) lgamma(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700283
284extern float __attribute__((overloadable)) log(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700285DEF_FUNC_1(log)
Jason Sams22fa3712010-05-19 17:22:57 -0700286
Jason Sams22fa3712010-05-19 17:22:57 -0700287
288extern float __attribute__((overloadable)) log10(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700289DEF_FUNC_1(log10)
290
291static float __attribute__((overloadable)) log2(float v) {
292 return log10(v) / log10(2.f);
293}
294DEF_FUNC_1(log2)
Jason Sams22fa3712010-05-19 17:22:57 -0700295
296extern float __attribute__((overloadable)) log1p(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700297DEF_FUNC_1(log1p)
Jason Sams22fa3712010-05-19 17:22:57 -0700298
299extern float __attribute__((overloadable)) logb(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700300DEF_FUNC_1(logb)
Jason Sams22fa3712010-05-19 17:22:57 -0700301
302extern float __attribute__((overloadable)) mad(float, float, float);
303extern float2 __attribute__((overloadable)) mad(float2, float2, float2);
304extern float3 __attribute__((overloadable)) mad(float3, float3, float3);
305extern float4 __attribute__((overloadable)) mad(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700306
307extern float __attribute__((overloadable)) modf(float, float *);
308extern float2 __attribute__((overloadable)) modf(float2, float2 *);
309extern float3 __attribute__((overloadable)) modf(float3, float3 *);
310extern float4 __attribute__((overloadable)) modf(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700311
Jason Sams1b937f52010-06-09 14:26:16 -0700312//extern float __attribute__((overloadable)) nan(uint);
Jason Sams22fa3712010-05-19 17:22:57 -0700313
314extern float __attribute__((overloadable)) nextafter(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700315DEF_FUNC_2(nextafter)
Jason Sams22fa3712010-05-19 17:22:57 -0700316
Jason Sams1b937f52010-06-09 14:26:16 -0700317DEF_FUNC_2(pow)
Jason Sams22fa3712010-05-19 17:22:57 -0700318
Jason Sams1b937f52010-06-09 14:26:16 -0700319static float __attribute__((overloadable)) pown(float v, int p) {
320 return pow(v, (float)p);
321}
322static float2 __attribute__((overloadable)) pown(float2 v, int2 p) {
323 return pow(v, (float2)p);
324}
325static float3 __attribute__((overloadable)) pown(float3 v, int3 p) {
326 return pow(v, (float3)p);
327}
328static float4 __attribute__((overloadable)) pown(float4 v, int4 p) {
329 return pow(v, (float4)p);
330}
Jason Sams22fa3712010-05-19 17:22:57 -0700331
Jason Sams1b937f52010-06-09 14:26:16 -0700332static float __attribute__((overloadable)) powr(float v, float p) {
333 return pow(v, p);
334}
335static float2 __attribute__((overloadable)) powr(float2 v, float2 p) {
336 return pow(v, p);
337}
338static float3 __attribute__((overloadable)) powr(float3 v, float3 p) {
339 return pow(v, p);
340}
341static float4 __attribute__((overloadable)) powr(float4 v, float4 p) {
342 return pow(v, p);
343}
Jason Sams22fa3712010-05-19 17:22:57 -0700344
345extern float __attribute__((overloadable)) remainder(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700346DEF_FUNC_2(remainder)
Jason Sams22fa3712010-05-19 17:22:57 -0700347
348extern float __attribute__((overloadable)) remquo(float, float, float *);
349extern float2 __attribute__((overloadable)) remquo(float2, float2, float2 *);
350extern float3 __attribute__((overloadable)) remquo(float3, float3, float3 *);
351extern float4 __attribute__((overloadable)) remquo(float4, float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700352
353extern float __attribute__((overloadable)) rint(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700354DEF_FUNC_1(rint)
Jason Sams22fa3712010-05-19 17:22:57 -0700355
Jason Sams1b937f52010-06-09 14:26:16 -0700356static float __attribute__((overloadable)) rootn(float v, int r) {
357 return pow(v, 1.f / r);
358}
359static float2 __attribute__((overloadable)) rootn(float2 v, int2 r) {
360 float2 t = {1.f / r.x, 1.f / r.y};
361 return pow(v, t);
362}
363static float3 __attribute__((overloadable)) rootn(float3 v, int3 r) {
364 float3 t = {1.f / r.x, 1.f / r.y, 1.f / r.z};
365 return pow(v, t);
366}
367static float4 __attribute__((overloadable)) rootn(float4 v, int4 r) {
368 float4 t = {1.f / r.x, 1.f / r.y, 1.f / r.z, 1.f / r.w};
369 return pow(v, t);
370}
Jason Sams22fa3712010-05-19 17:22:57 -0700371
372extern float __attribute__((overloadable)) round(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700373DEF_FUNC_1(round)
Jason Sams22fa3712010-05-19 17:22:57 -0700374
375extern float __attribute__((overloadable)) sqrt(float);
Shih-wei Liaof1e6ec32010-06-14 17:34:25 -0700376/*static float __attribute__((overloadable)) rsqrt(float v) {
Jason Sams1b937f52010-06-09 14:26:16 -0700377 return 1.f / sqrt(v);
378}
Shih-wei Liaof1e6ec32010-06-14 17:34:25 -0700379DEF_FUNC_1(rsqrt)*/
Jason Sams1b937f52010-06-09 14:26:16 -0700380
381extern float __attribute__((overloadable)) sin(float);
382DEF_FUNC_1(sin)
383
384static float __attribute__((overloadable)) sincos(float v, float *cosptr) {
385 *cosptr = cos(v);
386 return sin(v);
387}
388static float2 __attribute__((overloadable)) sincos(float2 v, float2 *cosptr) {
389 *cosptr = cos(v);
390 return sin(v);
391}
392static float3 __attribute__((overloadable)) sincos(float3 v, float3 *cosptr) {
393 *cosptr = cos(v);
394 return sin(v);
395}
396static float4 __attribute__((overloadable)) sincos(float4 v, float4 *cosptr) {
397 *cosptr = cos(v);
398 return sin(v);
399}
400
401extern float __attribute__((overloadable)) sinh(float);
402DEF_FUNC_1(sinh)
403
404static float __attribute__((overloadable)) sinpi(float v) {
405 return sin(v * M_PI);
406}
407DEF_FUNC_1(sinpi)
408
409DEF_FUNC_1(sqrt)
Jason Sams22fa3712010-05-19 17:22:57 -0700410
411extern float __attribute__((overloadable)) tan(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700412DEF_FUNC_1(tan)
Jason Sams22fa3712010-05-19 17:22:57 -0700413
414extern float __attribute__((overloadable)) tanh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700415DEF_FUNC_1(tanh)
Jason Sams22fa3712010-05-19 17:22:57 -0700416
Jason Sams1b937f52010-06-09 14:26:16 -0700417static float __attribute__((overloadable)) tanpi(float v) {
418 return tan(v * M_PI);
419}
420DEF_FUNC_1(tanpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700421
422extern float __attribute__((overloadable)) tgamma(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700423DEF_FUNC_1(tgamma)
Jason Sams22fa3712010-05-19 17:22:57 -0700424
425extern float __attribute__((overloadable)) trunc(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700426DEF_FUNC_1(trunc)
Jason Sams22fa3712010-05-19 17:22:57 -0700427
428// Int ops (partial), 6.11.3
429extern uint __attribute__((overloadable)) abs(int);
430extern ushort __attribute__((overloadable)) abs(short);
431extern uchar __attribute__((overloadable)) abs(char);
432
433extern uint __attribute__((overloadable)) clz(uint);
434extern int __attribute__((overloadable)) clz(int);
435extern ushort __attribute__((overloadable)) clz(ushort);
436extern short __attribute__((overloadable)) clz(short);
437extern uchar __attribute__((overloadable)) clz(uchar);
438extern char __attribute__((overloadable)) clz(char);
439
Jason Sams1b937f52010-06-09 14:26:16 -0700440static uint __attribute__((overloadable)) min(uint v1, uint v2) {
441 return v1 < v2 ? v1 : v2;
442}
443static int __attribute__((overloadable)) min(int v1, int v2) {
444 return v1 < v2 ? v1 : v2;
445}
446static ushort __attribute__((overloadable)) min(ushort v1, ushort v2) {
447 return v1 < v2 ? v1 : v2;
448}
449static short __attribute__((overloadable)) min(short v1, short v2) {
450 return v1 < v2 ? v1 : v2;
451}
452static uchar __attribute__((overloadable)) min(uchar v1, uchar v2) {
453 return v1 < v2 ? v1 : v2;
454}
455static char __attribute__((overloadable)) min(char v1, char v2) {
456 return v1 < v2 ? v1 : v2;
457}
Jason Sams22fa3712010-05-19 17:22:57 -0700458
Jason Sams1b937f52010-06-09 14:26:16 -0700459static uint __attribute__((overloadable)) max(uint v1, uint v2) {
460 return v1 > v2 ? v1 : v2;
461}
462static int __attribute__((overloadable)) max(int v1, int v2) {
463 return v1 > v2 ? v1 : v2;
464}
465static ushort __attribute__((overloadable)) max(ushort v1, ushort v2) {
466 return v1 > v2 ? v1 : v2;
467}
468static short __attribute__((overloadable)) max(short v1, short v2) {
469 return v1 > v2 ? v1 : v2;
470}
471static uchar __attribute__((overloadable)) max(uchar v1, uchar v2) {
472 return v1 > v2 ? v1 : v2;
473}
474static char __attribute__((overloadable)) max(char v1, char v2) {
475 return v1 > v2 ? v1 : v2;
476}
Jason Sams22fa3712010-05-19 17:22:57 -0700477
478
479
480
// Common ops (clamp, degrees, max, min, mix, radians, step, smoothstep, sign), 6.11.4
482
// Scalar clamp: low when amount < low, high when amount > high, otherwise
// amount itself. The low bound is tested first.
static float __attribute__((overloadable)) clamp(float amount, float low, float high) {
    if (amount < low) {
        return low;
    }
    if (amount > high) {
        return high;
    }
    return amount;
}
486static float2 __attribute__((overloadable)) clamp(float2 amount, float2 low, float2 high) {
487 float2 r;
488 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
489 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
490 return r;
491}
492static float3 __attribute__((overloadable)) clamp(float3 amount, float3 low, float3 high) {
493 float3 r;
494 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
495 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
496 r.z = amount.z < low.z ? low.z : (amount.z > high.z ? high.z : amount.z);
497 return r;
498}
499static float4 __attribute__((overloadable)) clamp(float4 amount, float4 low, float4 high) {
500 float4 r;
501 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
502 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
503 r.z = amount.z < low.z ? low.z : (amount.z > high.z ? high.z : amount.z);
504 r.w = amount.w < low.w ? low.w : (amount.w > high.w ? high.w : amount.w);
505 return r;
506}
507static float2 __attribute__((overloadable)) clamp(float2 amount, float low, float high) {
508 float2 r;
509 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
510 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
511 return r;
512}
513static float3 __attribute__((overloadable)) clamp(float3 amount, float low, float high) {
514 float3 r;
515 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
516 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
517 r.z = amount.z < low ? low : (amount.z > high ? high : amount.z);
518 return r;
519}
520static float4 __attribute__((overloadable)) clamp(float4 amount, float low, float high) {
521 float4 r;
522 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
523 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
524 r.z = amount.z < low ? low : (amount.z > high ? high : amount.z);
525 r.w = amount.w < low ? low : (amount.w > high ? high : amount.w);
526 return r;
527}
Jason Sams22fa3712010-05-19 17:22:57 -0700528
Jason Sams1b937f52010-06-09 14:26:16 -0700529static float __attribute__((overloadable)) degrees(float radians) {
530 return radians * (180.f / M_PI);
531}
532DEF_FUNC_1(degrees)
Jason Sams22fa3712010-05-19 17:22:57 -0700533
Jason Sams1b937f52010-06-09 14:26:16 -0700534static float __attribute__((overloadable)) max(float v1, float v2) {
535 return v1 > v2 ? v1 : v2;
536}
537static float2 __attribute__((overloadable)) max(float2 v1, float2 v2) {
538 float2 r;
539 r.x = v1.x > v2.x ? v1.x : v2.x;
540 r.y = v1.y > v2.y ? v1.y : v2.y;
541 return r;
542}
543static float3 __attribute__((overloadable)) max(float3 v1, float3 v2) {
544 float3 r;
545 r.x = v1.x > v2.x ? v1.x : v2.x;
546 r.y = v1.y > v2.y ? v1.y : v2.y;
547 r.z = v1.z > v2.z ? v1.z : v2.z;
548 return r;
549}
550static float4 __attribute__((overloadable)) max(float4 v1, float4 v2) {
551 float4 r;
552 r.x = v1.x > v2.x ? v1.x : v2.x;
553 r.y = v1.y > v2.y ? v1.y : v2.y;
554 r.z = v1.z > v2.z ? v1.z : v2.z;
555 r.w = v1.w > v2.w ? v1.w : v2.w;
556 return r;
557}
558static float2 __attribute__((overloadable)) max(float2 v1, float v2) {
559 float2 r;
560 r.x = v1.x > v2 ? v1.x : v2;
561 r.y = v1.y > v2 ? v1.y : v2;
562 return r;
563}
564static float3 __attribute__((overloadable)) max(float3 v1, float v2) {
565 float3 r;
566 r.x = v1.x > v2 ? v1.x : v2;
567 r.y = v1.y > v2 ? v1.y : v2;
568 r.z = v1.z > v2 ? v1.z : v2;
569 return r;
570}
571static float4 __attribute__((overloadable)) max(float4 v1, float v2) {
572 float4 r;
573 r.x = v1.x > v2 ? v1.x : v2;
574 r.y = v1.y > v2 ? v1.y : v2;
575 r.z = v1.z > v2 ? v1.z : v2;
576 r.w = v1.w > v2 ? v1.w : v2;
577 return r;
578}
Jason Sams22fa3712010-05-19 17:22:57 -0700579
Jason Sams1b937f52010-06-09 14:26:16 -0700580static float __attribute__((overloadable)) min(float v1, float v2) {
581 return v1 < v2 ? v1 : v2;
582}
583static float2 __attribute__((overloadable)) min(float2 v1, float2 v2) {
584 float2 r;
585 r.x = v1.x < v2.x ? v1.x : v2.x;
586 r.y = v1.y < v2.y ? v1.y : v2.y;
587 return r;
588}
589static float3 __attribute__((overloadable)) min(float3 v1, float3 v2) {
590 float3 r;
591 r.x = v1.x < v2.x ? v1.x : v2.x;
592 r.y = v1.y < v2.y ? v1.y : v2.y;
593 r.z = v1.z < v2.z ? v1.z : v2.z;
594 return r;
595}
596static float4 __attribute__((overloadable)) min(float4 v1, float4 v2) {
597 float4 r;
598 r.x = v1.x < v2.x ? v1.x : v2.x;
599 r.y = v1.y < v2.y ? v1.y : v2.y;
600 r.z = v1.z < v2.z ? v1.z : v2.z;
601 r.w = v1.w < v2.w ? v1.w : v2.w;
602 return r;
603}
604static float2 __attribute__((overloadable)) min(float2 v1, float v2) {
605 float2 r;
606 r.x = v1.x < v2 ? v1.x : v2;
607 r.y = v1.y < v2 ? v1.y : v2;
608 return r;
609}
610static float3 __attribute__((overloadable)) min(float3 v1, float v2) {
611 float3 r;
612 r.x = v1.x < v2 ? v1.x : v2;
613 r.y = v1.y < v2 ? v1.y : v2;
614 r.z = v1.z < v2 ? v1.z : v2;
615 return r;
616}
617static float4 __attribute__((overloadable)) min(float4 v1, float v2) {
618 float4 r;
619 r.x = v1.x < v2 ? v1.x : v2;
620 r.y = v1.y < v2 ? v1.y : v2;
621 r.z = v1.z < v2 ? v1.z : v2;
622 r.w = v1.w < v2 ? v1.w : v2;
623 return r;
624}
Jason Sams22fa3712010-05-19 17:22:57 -0700625
Jason Sams1b937f52010-06-09 14:26:16 -0700626static float __attribute__((overloadable)) mix(float start, float stop, float amount) {
627 return start + (stop - start) * amount;
628}
629static float2 __attribute__((overloadable)) mix(float2 start, float2 stop, float2 amount) {
630 return start + (stop - start) * amount;
631}
632static float3 __attribute__((overloadable)) mix(float3 start, float3 stop, float3 amount) {
633 return start + (stop - start) * amount;
634}
635static float4 __attribute__((overloadable)) mix(float4 start, float4 stop, float4 amount) {
636 return start + (stop - start) * amount;
637}
638static float2 __attribute__((overloadable)) mix(float2 start, float2 stop, float amount) {
639 return start + (stop - start) * amount;
640}
641static float3 __attribute__((overloadable)) mix(float3 start, float3 stop, float amount) {
642 return start + (stop - start) * amount;
643}
644static float4 __attribute__((overloadable)) mix(float4 start, float4 stop, float amount) {
645 return start + (stop - start) * amount;
646}
Jason Sams22fa3712010-05-19 17:22:57 -0700647
Jason Sams1b937f52010-06-09 14:26:16 -0700648static float __attribute__((overloadable)) radians(float degrees) {
649 return degrees * (M_PI / 180.f);
650}
651DEF_FUNC_1(radians)
Jason Sams22fa3712010-05-19 17:22:57 -0700652
Jason Sams1b937f52010-06-09 14:26:16 -0700653static float __attribute__((overloadable)) step(float edge, float v) {
654 return (v < edge) ? 0.f : 1.f;
655}
656static float2 __attribute__((overloadable)) step(float2 edge, float2 v) {
657 float2 r;
658 r.x = (v.x < edge.x) ? 0.f : 1.f;
659 r.y = (v.y < edge.y) ? 0.f : 1.f;
660 return r;
661}
662static float3 __attribute__((overloadable)) step(float3 edge, float3 v) {
663 float3 r;
664 r.x = (v.x < edge.x) ? 0.f : 1.f;
665 r.y = (v.y < edge.y) ? 0.f : 1.f;
666 r.z = (v.z < edge.z) ? 0.f : 1.f;
667 return r;
668}
669static float4 __attribute__((overloadable)) step(float4 edge, float4 v) {
670 float4 r;
671 r.x = (v.x < edge.x) ? 0.f : 1.f;
672 r.y = (v.y < edge.y) ? 0.f : 1.f;
673 r.z = (v.z < edge.z) ? 0.f : 1.f;
674 r.w = (v.w < edge.w) ? 0.f : 1.f;
675 return r;
676}
677static float2 __attribute__((overloadable)) step(float2 edge, float v) {
678 float2 r;
679 r.x = (v < edge.x) ? 0.f : 1.f;
680 r.y = (v < edge.y) ? 0.f : 1.f;
681 return r;
682}
683static float3 __attribute__((overloadable)) step(float3 edge, float v) {
684 float3 r;
685 r.x = (v < edge.x) ? 0.f : 1.f;
686 r.y = (v < edge.y) ? 0.f : 1.f;
687 r.z = (v < edge.z) ? 0.f : 1.f;
688 return r;
689}
690static float4 __attribute__((overloadable)) step(float4 edge, float v) {
691 float4 r;
692 r.x = (v < edge.x) ? 0.f : 1.f;
693 r.y = (v < edge.y) ? 0.f : 1.f;
694 r.z = (v < edge.z) ? 0.f : 1.f;
695 r.w = (v < edge.w) ? 0.f : 1.f;
696 return r;
697}
Jason Sams22fa3712010-05-19 17:22:57 -0700698
699extern float __attribute__((overloadable)) smoothstep(float, float, float);
700extern float2 __attribute__((overloadable)) smoothstep(float2, float2, float2);
701extern float3 __attribute__((overloadable)) smoothstep(float3, float3, float3);
702extern float4 __attribute__((overloadable)) smoothstep(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700703extern float2 __attribute__((overloadable)) smoothstep(float, float, float2);
704extern float3 __attribute__((overloadable)) smoothstep(float, float, float3);
705extern float4 __attribute__((overloadable)) smoothstep(float, float, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700706
Jason Sams1b937f52010-06-09 14:26:16 -0700707static float __attribute__((overloadable)) sign(float v) {
708 if (v > 0) return 1.f;
709 if (v < 0) return -1.f;
710 return v;
711}
712DEF_FUNC_1(sign)
Jason Sams22fa3712010-05-19 17:22:57 -0700713
// Geometric ops (cross, dot, length, distance, normalize), 6.11.5
Jason Sams1b937f52010-06-09 14:26:16 -0700715static float3 __attribute__((overloadable)) cross(float3 lhs, float3 rhs) {
716 float3 r;
717 r.x = lhs.y * rhs.z - lhs.z * rhs.y;
718 r.y = lhs.z * rhs.x - lhs.x * rhs.z;
719 r.z = lhs.x * rhs.y - lhs.y * rhs.x;
720 return r;
721}
Jason Sams22fa3712010-05-19 17:22:57 -0700722
Jason Sams1b937f52010-06-09 14:26:16 -0700723static float4 __attribute__((overloadable)) cross(float4 lhs, float4 rhs) {
724 float4 r;
725 r.x = lhs.y * rhs.z - lhs.z * rhs.y;
726 r.y = lhs.z * rhs.x - lhs.x * rhs.z;
727 r.z = lhs.x * rhs.y - lhs.y * rhs.x;
728 r.w = 0.f;
729 return r;
730}
Jason Sams22fa3712010-05-19 17:22:57 -0700731
Jason Sams1b937f52010-06-09 14:26:16 -0700732static float __attribute__((overloadable)) dot(float lhs, float rhs) {
733 return lhs * rhs;
734}
735static float __attribute__((overloadable)) dot(float2 lhs, float2 rhs) {
736 return lhs.x*rhs.x + lhs.y*rhs.y;
737}
738static float __attribute__((overloadable)) dot(float3 lhs, float3 rhs) {
739 return lhs.x*rhs.x + lhs.y*rhs.y + lhs.z*rhs.z;
740}
741static float __attribute__((overloadable)) dot(float4 lhs, float4 rhs) {
742 return lhs.x*rhs.x + lhs.y*rhs.y + lhs.z*rhs.z + lhs.w*rhs.w;
743}
Jason Sams22fa3712010-05-19 17:22:57 -0700744
// Length of a 1-component "vector": the absolute value of v.
// Fix: this used to return v unchanged, so a negative input produced a
// negative length (and the scalar distance(), which calls this, could be
// negative too). The vector overloads always return a non-negative sqrt.
static float __attribute__((overloadable)) length(float v) {
    return fabs(v);
}
748static float __attribute__((overloadable)) length(float2 v) {
749 return sqrt(v.x*v.x + v.y*v.y);
750}
751static float __attribute__((overloadable)) length(float3 v) {
752 return sqrt(v.x*v.x + v.y*v.y + v.z*v.z);
753}
754static float __attribute__((overloadable)) length(float4 v) {
755 return sqrt(v.x*v.x + v.y*v.y + v.z*v.z + v.w*v.w);
756}
Jason Sams22fa3712010-05-19 17:22:57 -0700757
Jason Sams1b937f52010-06-09 14:26:16 -0700758static float __attribute__((overloadable)) distance(float lhs, float rhs) {
759 return length(lhs - rhs);
760}
761static float __attribute__((overloadable)) distance(float2 lhs, float2 rhs) {
762 return length(lhs - rhs);
763}
764static float __attribute__((overloadable)) distance(float3 lhs, float3 rhs) {
765 return length(lhs - rhs);
766}
767static float __attribute__((overloadable)) distance(float4 lhs, float4 rhs) {
768 return length(lhs - rhs);
769}
Jason Sams22fa3712010-05-19 17:22:57 -0700770
// Normalizes a 1-component "vector": the result keeps the direction (sign)
// of v and has magnitude 1.
//   v > 0  ->  1.f
//   v < 0  -> -1.f
//   otherwise (zero, or a value that compares neither way) v is returned
//   unchanged, since there is no direction to preserve.
// Fix: this used to return 1.f unconditionally, flipping the direction of
// every negative input.
static float __attribute__((overloadable)) normalize(float v) {
    if (v > 0.f) {
        return 1.f;
    }
    if (v < 0.f) {
        return -1.f;
    }
    return v;
}
774static float2 __attribute__((overloadable)) normalize(float2 v) {
775 return v / length(v);
776}
777static float3 __attribute__((overloadable)) normalize(float3 v) {
778 return v / length(v);
779}
780static float4 __attribute__((overloadable)) normalize(float4 v) {
781 return v / length(v);
782}
783
784
785#endif