blob: a5092b36fff0e6adcd3a0466b3159f002cc0c919 [file] [log] [blame]
Jason Sams1b937f52010-06-09 14:26:16 -07001#ifndef __RS_CL_RSH__
2#define __RS_CL_RSH__
3
4#define M_PI 3.14159265358979323846264338327950288f /* pi */
5
6
// Conversions

/*
 * CVT_FUNC_2(typeout, typein) defines convert_<typeout>N(<typein>N) for
 * N = 2, 3 and 4.  Every component is converted with a plain C cast to
 * <typeout>.
 */
#define CVT_FUNC_2(typeout, typein) \
static typeout##2 __attribute__((overloadable)) convert_##typeout##2(typein##2 v) { \
    typeout##2 r = {(typeout)v.x, (typeout)v.y}; \
    return r; \
} \
static typeout##3 __attribute__((overloadable)) convert_##typeout##3(typein##3 v) { \
    typeout##3 r = {(typeout)v.x, (typeout)v.y, (typeout)v.z}; \
    return r; \
} \
static typeout##4 __attribute__((overloadable)) convert_##typeout##4(typein##4 v) { \
    typeout##4 r = {(typeout)v.x, (typeout)v.y, (typeout)v.z, (typeout)v.w}; \
    return r; \
}

/*
 * CVT_FUNC(type) instantiates CVT_FUNC_2 with <type> as the destination and
 * each of the seven supported element types as the source.
 */
#define CVT_FUNC(type)  CVT_FUNC_2(type, uchar) \
                        CVT_FUNC_2(type, char) \
                        CVT_FUNC_2(type, ushort) \
                        CVT_FUNC_2(type, short) \
                        CVT_FUNC_2(type, uint) \
                        CVT_FUNC_2(type, int) \
                        CVT_FUNC_2(type, float)

30CVT_FUNC(char)
31CVT_FUNC(uchar)
32CVT_FUNC(short)
33CVT_FUNC(ushort)
34CVT_FUNC(int)
35CVT_FUNC(uint)
36CVT_FUNC(float)
37
38
39
// Float ops, 6.11.2

/*
 * DEF_FUNC_1(fnc) defines the float2/float3/float4 overloads of a unary
 * function by applying the scalar float overload of fnc to each component.
 * The scalar overload must already be declared.
 */
#define DEF_FUNC_1(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 v) { \
    float2 r; \
    r.x = fnc(v.x); \
    r.y = fnc(v.y); \
    return r; \
} \
static float3 __attribute__((overloadable)) fnc(float3 v) { \
    float3 r; \
    r.x = fnc(v.x); \
    r.y = fnc(v.y); \
    r.z = fnc(v.z); \
    return r; \
} \
static float4 __attribute__((overloadable)) fnc(float4 v) { \
    float4 r; \
    r.x = fnc(v.x); \
    r.y = fnc(v.y); \
    r.z = fnc(v.z); \
    r.w = fnc(v.w); \
    return r; \
}

/*
 * DEF_FUNC_1_RI(fnc) is the "returns int" variant of DEF_FUNC_1: it defines
 * int2/int3/int4 fnc(float2/float3/float4) by applying the scalar overload
 * of fnc to each component.
 */
#define DEF_FUNC_1_RI(fnc) \
static int2 __attribute__((overloadable)) fnc(float2 v) { \
    int2 r; \
    r.x = fnc(v.x); \
    r.y = fnc(v.y); \
    return r; \
} \
static int3 __attribute__((overloadable)) fnc(float3 v) { \
    int3 r; \
    r.x = fnc(v.x); \
    r.y = fnc(v.y); \
    r.z = fnc(v.z); \
    return r; \
} \
static int4 __attribute__((overloadable)) fnc(float4 v) { \
    int4 r; \
    r.x = fnc(v.x); \
    r.y = fnc(v.y); \
    r.z = fnc(v.z); \
    r.w = fnc(v.w); \
    return r; \
}

/*
 * DEF_FUNC_2(fnc) defines the float2/float3/float4 overloads of a binary
 * function by applying the scalar fnc(float, float) to matching components
 * of v1 and v2.  The scalar overload must already be declared.
 */
#define DEF_FUNC_2(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 v1, float2 v2) { \
    float2 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    return r; \
} \
static float3 __attribute__((overloadable)) fnc(float3 v1, float3 v2) { \
    float3 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    return r; \
} \
static float4 __attribute__((overloadable)) fnc(float4 v1, float4 v2) { \
    float4 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    r.w = fnc(v1.w, v2.w); \
    return r; \
}

/*
 * DEF_FUNC_2F(fnc) defines the vector-with-scalar overloads of a binary
 * function: each component of v1 is combined with the same float v2 through
 * the scalar fnc(float, float).
 */
#define DEF_FUNC_2F(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 v1, float v2) { \
    float2 r; \
    r.x = fnc(v1.x, v2); \
    r.y = fnc(v1.y, v2); \
    return r; \
} \
static float3 __attribute__((overloadable)) fnc(float3 v1, float v2) { \
    float3 r; \
    r.x = fnc(v1.x, v2); \
    r.y = fnc(v1.y, v2); \
    r.z = fnc(v1.z, v2); \
    return r; \
} \
static float4 __attribute__((overloadable)) fnc(float4 v1, float v2) { \
    float4 r; \
    r.x = fnc(v1.x, v2); \
    r.y = fnc(v1.y, v2); \
    r.z = fnc(v1.z, v2); \
    r.w = fnc(v1.w, v2); \
    return r; \
}

Jason Sams22fa3712010-05-19 17:22:57 -0700135extern float __attribute__((overloadable)) acos(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700136DEF_FUNC_1(acos)
Jason Sams22fa3712010-05-19 17:22:57 -0700137
138extern float __attribute__((overloadable)) acosh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700139DEF_FUNC_1(acosh)
Jason Sams22fa3712010-05-19 17:22:57 -0700140
Jason Sams1b937f52010-06-09 14:26:16 -0700141static float __attribute__((overloadable)) acospi(float v) {
142 return acos(v) / M_PI;
143}
144DEF_FUNC_1(acospi)
Jason Sams22fa3712010-05-19 17:22:57 -0700145
146extern float __attribute__((overloadable)) asin(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700147DEF_FUNC_1(asin)
Jason Sams22fa3712010-05-19 17:22:57 -0700148
149extern float __attribute__((overloadable)) asinh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700150DEF_FUNC_1(asinh)
Jason Sams22fa3712010-05-19 17:22:57 -0700151
Jason Sams1b937f52010-06-09 14:26:16 -0700152static float __attribute__((overloadable)) asinpi(float v) {
153 return asin(v) / M_PI;
154}
155DEF_FUNC_1(asinpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700156
157extern float __attribute__((overloadable)) atan(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700158DEF_FUNC_1(atan)
Jason Sams22fa3712010-05-19 17:22:57 -0700159
160extern float __attribute__((overloadable)) atan2(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700161DEF_FUNC_2(atan2)
Jason Sams22fa3712010-05-19 17:22:57 -0700162
163extern float __attribute__((overloadable)) atanh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700164DEF_FUNC_1(atanh)
Jason Sams22fa3712010-05-19 17:22:57 -0700165
Jason Sams1b937f52010-06-09 14:26:16 -0700166static float __attribute__((overloadable)) atanpi(float v) {
167 return atan(v) / M_PI;
168}
169DEF_FUNC_1(atanpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700170
Jason Sams1b937f52010-06-09 14:26:16 -0700171static float __attribute__((overloadable)) atan2pi(float y, float x) {
172 return atan2(y, x) / M_PI;
173}
174DEF_FUNC_2(atan2pi)
Jason Sams22fa3712010-05-19 17:22:57 -0700175
176extern float __attribute__((overloadable)) cbrt(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700177DEF_FUNC_1(cbrt)
Jason Sams22fa3712010-05-19 17:22:57 -0700178
179extern float __attribute__((overloadable)) ceil(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700180DEF_FUNC_1(ceil)
Jason Sams22fa3712010-05-19 17:22:57 -0700181
182extern float __attribute__((overloadable)) copysign(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700183DEF_FUNC_2(copysign)
Jason Sams22fa3712010-05-19 17:22:57 -0700184
185extern float __attribute__((overloadable)) cos(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700186DEF_FUNC_1(cos)
Jason Sams22fa3712010-05-19 17:22:57 -0700187
188extern float __attribute__((overloadable)) cosh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700189DEF_FUNC_1(cosh)
Jason Sams22fa3712010-05-19 17:22:57 -0700190
Jason Sams1b937f52010-06-09 14:26:16 -0700191static float __attribute__((overloadable)) cospi(float v) {
192 return cos(v * M_PI);
193}
194DEF_FUNC_1(cospi)
Jason Sams22fa3712010-05-19 17:22:57 -0700195
196extern float __attribute__((overloadable)) erfc(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700197DEF_FUNC_1(erfc)
Jason Sams22fa3712010-05-19 17:22:57 -0700198
199extern float __attribute__((overloadable)) erf(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700200DEF_FUNC_1(erf)
Jason Sams22fa3712010-05-19 17:22:57 -0700201
202extern float __attribute__((overloadable)) exp(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700203DEF_FUNC_1(exp)
Jason Sams22fa3712010-05-19 17:22:57 -0700204
205extern float __attribute__((overloadable)) exp2(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700206DEF_FUNC_1(exp2)
Jason Sams22fa3712010-05-19 17:22:57 -0700207
Jason Sams1b937f52010-06-09 14:26:16 -0700208extern float __attribute__((overloadable)) pow(float, float);
209static float __attribute__((overloadable)) exp10(float v) {
210 return pow(10.f, v);
211}
212DEF_FUNC_1(exp10)
Jason Sams22fa3712010-05-19 17:22:57 -0700213
214extern float __attribute__((overloadable)) expm1(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700215DEF_FUNC_1(expm1)
Jason Sams22fa3712010-05-19 17:22:57 -0700216
217extern float __attribute__((overloadable)) fabs(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700218DEF_FUNC_1(fabs)
Jason Sams22fa3712010-05-19 17:22:57 -0700219
220extern float __attribute__((overloadable)) fdim(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700221DEF_FUNC_2(fdim)
Jason Sams22fa3712010-05-19 17:22:57 -0700222
223extern float __attribute__((overloadable)) floor(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700224DEF_FUNC_1(floor)
Jason Sams22fa3712010-05-19 17:22:57 -0700225
226extern float __attribute__((overloadable)) fma(float, float, float);
227extern float2 __attribute__((overloadable)) fma(float2, float2, float2);
228extern float3 __attribute__((overloadable)) fma(float3, float3, float3);
229extern float4 __attribute__((overloadable)) fma(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700230
231extern float __attribute__((overloadable)) fmax(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700232DEF_FUNC_2(fmax);
233DEF_FUNC_2F(fmax);
Jason Sams22fa3712010-05-19 17:22:57 -0700234
235extern float __attribute__((overloadable)) fmin(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700236DEF_FUNC_2(fmin);
237DEF_FUNC_2F(fmin);
Jason Sams22fa3712010-05-19 17:22:57 -0700238
239extern float __attribute__((overloadable)) fmod(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700240DEF_FUNC_2(fmod)
Jason Sams22fa3712010-05-19 17:22:57 -0700241
/*
 * fract (scalar): stores floor(v) through iptr and returns v - floor(v),
 * capped at 0x1.fffffep-1f (the largest float below 1.0).
 * The floor is kept as a float so that no float-to-int conversion is done;
 * that conversion is undefined when floor(v) does not fit in an int.
 */
static float __attribute__((overloadable)) fract(float v, float *iptr) {
    float whole = floor(v);
    *iptr = whole;
    return fmin(v - whole, 0x1.fffffep-1f);
}
247static float2 __attribute__((overloadable)) fract(float2 v, float2 *iptr) {
248 float t[2];
249 float2 r;
250 r.x = fract(v.x, &t[0]);
251 r.y = fract(v.y, &t[1]);
252 iptr[0] = t[0];
253 iptr[1] = t[1];
254 return r;
255}
256static float3 __attribute__((overloadable)) fract(float3 v, float3 *iptr) {
257 float t[3];
258 float3 r;
259 r.x = fract(v.x, &t[0]);
260 r.y = fract(v.y, &t[1]);
261 r.z = fract(v.z, &t[2]);
262 iptr[0] = t[0];
263 iptr[1] = t[1];
264 iptr[2] = t[2];
265 return r;
266}
267static float4 __attribute__((overloadable)) fract(float4 v, float4 *iptr) {
268 float t[4];
269 float4 r;
270 r.x = fract(v.x, &t[0]);
271 r.y = fract(v.y, &t[1]);
272 r.z = fract(v.z, &t[2]);
273 r.w = fract(v.w, &t[3]);
274 iptr[0] = t[0];
275 iptr[1] = t[1];
276 iptr[2] = t[2];
277 iptr[3] = t[3];
278 return r;
279}
Jason Sams22fa3712010-05-19 17:22:57 -0700280
281extern float __attribute__((overloadable)) frexp(float, float *);
282extern float2 __attribute__((overloadable)) frexp(float2, float2 *);
283extern float3 __attribute__((overloadable)) frexp(float3, float3 *);
284extern float4 __attribute__((overloadable)) frexp(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700285
286extern float __attribute__((overloadable)) hypot(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700287DEF_FUNC_2(hypot)
Jason Sams22fa3712010-05-19 17:22:57 -0700288
289extern int __attribute__((overloadable)) ilogb(float);
Stephen Hines47416532011-01-11 14:38:18 -0800290DEF_FUNC_1_RI(ilogb)
Jason Sams22fa3712010-05-19 17:22:57 -0700291
292extern float __attribute__((overloadable)) ldexp(float, int);
293extern float2 __attribute__((overloadable)) ldexp(float2, int2);
294extern float3 __attribute__((overloadable)) ldexp(float3, int3);
295extern float4 __attribute__((overloadable)) ldexp(float4, int4);
Jason Sams22fa3712010-05-19 17:22:57 -0700296extern float2 __attribute__((overloadable)) ldexp(float2, int);
297extern float3 __attribute__((overloadable)) ldexp(float3, int);
298extern float4 __attribute__((overloadable)) ldexp(float4, int);
Jason Sams22fa3712010-05-19 17:22:57 -0700299
300extern float __attribute__((overloadable)) lgamma(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700301DEF_FUNC_1(lgamma)
Jason Sams22fa3712010-05-19 17:22:57 -0700302extern float __attribute__((overloadable)) lgamma(float, float *);
303extern float2 __attribute__((overloadable)) lgamma(float2, float2 *);
304extern float3 __attribute__((overloadable)) lgamma(float3, float3 *);
305extern float4 __attribute__((overloadable)) lgamma(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700306
307extern float __attribute__((overloadable)) log(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700308DEF_FUNC_1(log)
Jason Sams22fa3712010-05-19 17:22:57 -0700309
Jason Sams22fa3712010-05-19 17:22:57 -0700310
311extern float __attribute__((overloadable)) log10(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700312DEF_FUNC_1(log10)
313
314static float __attribute__((overloadable)) log2(float v) {
315 return log10(v) / log10(2.f);
316}
317DEF_FUNC_1(log2)
Jason Sams22fa3712010-05-19 17:22:57 -0700318
319extern float __attribute__((overloadable)) log1p(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700320DEF_FUNC_1(log1p)
Jason Sams22fa3712010-05-19 17:22:57 -0700321
322extern float __attribute__((overloadable)) logb(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700323DEF_FUNC_1(logb)
Jason Sams22fa3712010-05-19 17:22:57 -0700324
325extern float __attribute__((overloadable)) mad(float, float, float);
326extern float2 __attribute__((overloadable)) mad(float2, float2, float2);
327extern float3 __attribute__((overloadable)) mad(float3, float3, float3);
328extern float4 __attribute__((overloadable)) mad(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700329
330extern float __attribute__((overloadable)) modf(float, float *);
331extern float2 __attribute__((overloadable)) modf(float2, float2 *);
332extern float3 __attribute__((overloadable)) modf(float3, float3 *);
333extern float4 __attribute__((overloadable)) modf(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700334
Jason Sams1b937f52010-06-09 14:26:16 -0700335//extern float __attribute__((overloadable)) nan(uint);
Jason Sams22fa3712010-05-19 17:22:57 -0700336
337extern float __attribute__((overloadable)) nextafter(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700338DEF_FUNC_2(nextafter)
Jason Sams22fa3712010-05-19 17:22:57 -0700339
Jason Sams1b937f52010-06-09 14:26:16 -0700340DEF_FUNC_2(pow)
Jason Sams22fa3712010-05-19 17:22:57 -0700341
Jason Sams1b937f52010-06-09 14:26:16 -0700342static float __attribute__((overloadable)) pown(float v, int p) {
343 return pow(v, (float)p);
344}
345static float2 __attribute__((overloadable)) pown(float2 v, int2 p) {
346 return pow(v, (float2)p);
347}
348static float3 __attribute__((overloadable)) pown(float3 v, int3 p) {
349 return pow(v, (float3)p);
350}
351static float4 __attribute__((overloadable)) pown(float4 v, int4 p) {
352 return pow(v, (float4)p);
353}
Jason Sams22fa3712010-05-19 17:22:57 -0700354
Jason Sams1b937f52010-06-09 14:26:16 -0700355static float __attribute__((overloadable)) powr(float v, float p) {
356 return pow(v, p);
357}
358static float2 __attribute__((overloadable)) powr(float2 v, float2 p) {
359 return pow(v, p);
360}
361static float3 __attribute__((overloadable)) powr(float3 v, float3 p) {
362 return pow(v, p);
363}
364static float4 __attribute__((overloadable)) powr(float4 v, float4 p) {
365 return pow(v, p);
366}
Jason Sams22fa3712010-05-19 17:22:57 -0700367
368extern float __attribute__((overloadable)) remainder(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700369DEF_FUNC_2(remainder)
Jason Sams22fa3712010-05-19 17:22:57 -0700370
Stephen Hines47416532011-01-11 14:38:18 -0800371extern float __attribute__((overloadable)) remquo(float, float, int *);
372extern float2 __attribute__((overloadable)) remquo(float2, float2, int2 *);
373extern float3 __attribute__((overloadable)) remquo(float3, float3, int3 *);
374extern float4 __attribute__((overloadable)) remquo(float4, float4, int4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700375
376extern float __attribute__((overloadable)) rint(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700377DEF_FUNC_1(rint)
Jason Sams22fa3712010-05-19 17:22:57 -0700378
Jason Sams1b937f52010-06-09 14:26:16 -0700379static float __attribute__((overloadable)) rootn(float v, int r) {
380 return pow(v, 1.f / r);
381}
382static float2 __attribute__((overloadable)) rootn(float2 v, int2 r) {
383 float2 t = {1.f / r.x, 1.f / r.y};
384 return pow(v, t);
385}
386static float3 __attribute__((overloadable)) rootn(float3 v, int3 r) {
387 float3 t = {1.f / r.x, 1.f / r.y, 1.f / r.z};
388 return pow(v, t);
389}
390static float4 __attribute__((overloadable)) rootn(float4 v, int4 r) {
391 float4 t = {1.f / r.x, 1.f / r.y, 1.f / r.z, 1.f / r.w};
392 return pow(v, t);
393}
Jason Sams22fa3712010-05-19 17:22:57 -0700394
395extern float __attribute__((overloadable)) round(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700396DEF_FUNC_1(round)
Jason Sams22fa3712010-05-19 17:22:57 -0700397
398extern float __attribute__((overloadable)) sqrt(float);
Stephen Hines47416532011-01-11 14:38:18 -0800399static float __attribute__((overloadable)) rsqrt(float v) {
Jason Sams1b937f52010-06-09 14:26:16 -0700400 return 1.f / sqrt(v);
401}
Stephen Hines47416532011-01-11 14:38:18 -0800402DEF_FUNC_1(rsqrt)
Jason Sams1b937f52010-06-09 14:26:16 -0700403
404extern float __attribute__((overloadable)) sin(float);
405DEF_FUNC_1(sin)
406
407static float __attribute__((overloadable)) sincos(float v, float *cosptr) {
408 *cosptr = cos(v);
409 return sin(v);
410}
411static float2 __attribute__((overloadable)) sincos(float2 v, float2 *cosptr) {
412 *cosptr = cos(v);
413 return sin(v);
414}
415static float3 __attribute__((overloadable)) sincos(float3 v, float3 *cosptr) {
416 *cosptr = cos(v);
417 return sin(v);
418}
419static float4 __attribute__((overloadable)) sincos(float4 v, float4 *cosptr) {
420 *cosptr = cos(v);
421 return sin(v);
422}
423
424extern float __attribute__((overloadable)) sinh(float);
425DEF_FUNC_1(sinh)
426
427static float __attribute__((overloadable)) sinpi(float v) {
428 return sin(v * M_PI);
429}
430DEF_FUNC_1(sinpi)
431
432DEF_FUNC_1(sqrt)
Jason Sams22fa3712010-05-19 17:22:57 -0700433
434extern float __attribute__((overloadable)) tan(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700435DEF_FUNC_1(tan)
Jason Sams22fa3712010-05-19 17:22:57 -0700436
437extern float __attribute__((overloadable)) tanh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700438DEF_FUNC_1(tanh)
Jason Sams22fa3712010-05-19 17:22:57 -0700439
Jason Sams1b937f52010-06-09 14:26:16 -0700440static float __attribute__((overloadable)) tanpi(float v) {
441 return tan(v * M_PI);
442}
443DEF_FUNC_1(tanpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700444
445extern float __attribute__((overloadable)) tgamma(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700446DEF_FUNC_1(tgamma)
Jason Sams22fa3712010-05-19 17:22:57 -0700447
448extern float __attribute__((overloadable)) trunc(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700449DEF_FUNC_1(trunc)
Jason Sams22fa3712010-05-19 17:22:57 -0700450
451// Int ops (partial), 6.11.3
452extern uint __attribute__((overloadable)) abs(int);
453extern ushort __attribute__((overloadable)) abs(short);
454extern uchar __attribute__((overloadable)) abs(char);
455
456extern uint __attribute__((overloadable)) clz(uint);
457extern int __attribute__((overloadable)) clz(int);
458extern ushort __attribute__((overloadable)) clz(ushort);
459extern short __attribute__((overloadable)) clz(short);
460extern uchar __attribute__((overloadable)) clz(uchar);
461extern char __attribute__((overloadable)) clz(char);
462
Jason Sams1b937f52010-06-09 14:26:16 -0700463static uint __attribute__((overloadable)) min(uint v1, uint v2) {
464 return v1 < v2 ? v1 : v2;
465}
466static int __attribute__((overloadable)) min(int v1, int v2) {
467 return v1 < v2 ? v1 : v2;
468}
469static ushort __attribute__((overloadable)) min(ushort v1, ushort v2) {
470 return v1 < v2 ? v1 : v2;
471}
472static short __attribute__((overloadable)) min(short v1, short v2) {
473 return v1 < v2 ? v1 : v2;
474}
475static uchar __attribute__((overloadable)) min(uchar v1, uchar v2) {
476 return v1 < v2 ? v1 : v2;
477}
478static char __attribute__((overloadable)) min(char v1, char v2) {
479 return v1 < v2 ? v1 : v2;
480}
Jason Sams22fa3712010-05-19 17:22:57 -0700481
Jason Sams1b937f52010-06-09 14:26:16 -0700482static uint __attribute__((overloadable)) max(uint v1, uint v2) {
483 return v1 > v2 ? v1 : v2;
484}
485static int __attribute__((overloadable)) max(int v1, int v2) {
486 return v1 > v2 ? v1 : v2;
487}
488static ushort __attribute__((overloadable)) max(ushort v1, ushort v2) {
489 return v1 > v2 ? v1 : v2;
490}
491static short __attribute__((overloadable)) max(short v1, short v2) {
492 return v1 > v2 ? v1 : v2;
493}
494static uchar __attribute__((overloadable)) max(uchar v1, uchar v2) {
495 return v1 > v2 ? v1 : v2;
496}
497static char __attribute__((overloadable)) max(char v1, char v2) {
498 return v1 > v2 ? v1 : v2;
499}
Jason Sams22fa3712010-05-19 17:22:57 -0700500
501
502
503
// 6.11.4

// clamp (scalar): returns low when amount < low, high when amount > high,
// and amount otherwise.  The low bound is tested first.
static float __attribute__((overloadable)) clamp(float amount, float low, float high) {
    if (amount < low) {
        return low;
    }
    return amount > high ? high : amount;
}
509static float2 __attribute__((overloadable)) clamp(float2 amount, float2 low, float2 high) {
510 float2 r;
511 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
512 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
513 return r;
514}
515static float3 __attribute__((overloadable)) clamp(float3 amount, float3 low, float3 high) {
516 float3 r;
517 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
518 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
519 r.z = amount.z < low.z ? low.z : (amount.z > high.z ? high.z : amount.z);
520 return r;
521}
522static float4 __attribute__((overloadable)) clamp(float4 amount, float4 low, float4 high) {
523 float4 r;
524 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
525 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
526 r.z = amount.z < low.z ? low.z : (amount.z > high.z ? high.z : amount.z);
527 r.w = amount.w < low.w ? low.w : (amount.w > high.w ? high.w : amount.w);
528 return r;
529}
530static float2 __attribute__((overloadable)) clamp(float2 amount, float low, float high) {
531 float2 r;
532 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
533 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
534 return r;
535}
536static float3 __attribute__((overloadable)) clamp(float3 amount, float low, float high) {
537 float3 r;
538 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
539 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
540 r.z = amount.z < low ? low : (amount.z > high ? high : amount.z);
541 return r;
542}
543static float4 __attribute__((overloadable)) clamp(float4 amount, float low, float high) {
544 float4 r;
545 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
546 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
547 r.z = amount.z < low ? low : (amount.z > high ? high : amount.z);
548 r.w = amount.w < low ? low : (amount.w > high ? high : amount.w);
549 return r;
550}
Jason Sams22fa3712010-05-19 17:22:57 -0700551
Jason Sams1b937f52010-06-09 14:26:16 -0700552static float __attribute__((overloadable)) degrees(float radians) {
553 return radians * (180.f / M_PI);
554}
555DEF_FUNC_1(degrees)
Jason Sams22fa3712010-05-19 17:22:57 -0700556
Jason Sams1b937f52010-06-09 14:26:16 -0700557static float __attribute__((overloadable)) max(float v1, float v2) {
558 return v1 > v2 ? v1 : v2;
559}
560static float2 __attribute__((overloadable)) max(float2 v1, float2 v2) {
561 float2 r;
562 r.x = v1.x > v2.x ? v1.x : v2.x;
563 r.y = v1.y > v2.y ? v1.y : v2.y;
564 return r;
565}
566static float3 __attribute__((overloadable)) max(float3 v1, float3 v2) {
567 float3 r;
568 r.x = v1.x > v2.x ? v1.x : v2.x;
569 r.y = v1.y > v2.y ? v1.y : v2.y;
570 r.z = v1.z > v2.z ? v1.z : v2.z;
571 return r;
572}
573static float4 __attribute__((overloadable)) max(float4 v1, float4 v2) {
574 float4 r;
575 r.x = v1.x > v2.x ? v1.x : v2.x;
576 r.y = v1.y > v2.y ? v1.y : v2.y;
577 r.z = v1.z > v2.z ? v1.z : v2.z;
578 r.w = v1.w > v2.w ? v1.w : v2.w;
579 return r;
580}
581static float2 __attribute__((overloadable)) max(float2 v1, float v2) {
582 float2 r;
583 r.x = v1.x > v2 ? v1.x : v2;
584 r.y = v1.y > v2 ? v1.y : v2;
585 return r;
586}
587static float3 __attribute__((overloadable)) max(float3 v1, float v2) {
588 float3 r;
589 r.x = v1.x > v2 ? v1.x : v2;
590 r.y = v1.y > v2 ? v1.y : v2;
591 r.z = v1.z > v2 ? v1.z : v2;
592 return r;
593}
594static float4 __attribute__((overloadable)) max(float4 v1, float v2) {
595 float4 r;
596 r.x = v1.x > v2 ? v1.x : v2;
597 r.y = v1.y > v2 ? v1.y : v2;
598 r.z = v1.z > v2 ? v1.z : v2;
599 r.w = v1.w > v2 ? v1.w : v2;
600 return r;
601}
Jason Sams22fa3712010-05-19 17:22:57 -0700602
Jason Sams1b937f52010-06-09 14:26:16 -0700603static float __attribute__((overloadable)) min(float v1, float v2) {
604 return v1 < v2 ? v1 : v2;
605}
606static float2 __attribute__((overloadable)) min(float2 v1, float2 v2) {
607 float2 r;
608 r.x = v1.x < v2.x ? v1.x : v2.x;
609 r.y = v1.y < v2.y ? v1.y : v2.y;
610 return r;
611}
612static float3 __attribute__((overloadable)) min(float3 v1, float3 v2) {
613 float3 r;
614 r.x = v1.x < v2.x ? v1.x : v2.x;
615 r.y = v1.y < v2.y ? v1.y : v2.y;
616 r.z = v1.z < v2.z ? v1.z : v2.z;
617 return r;
618}
619static float4 __attribute__((overloadable)) min(float4 v1, float4 v2) {
620 float4 r;
621 r.x = v1.x < v2.x ? v1.x : v2.x;
622 r.y = v1.y < v2.y ? v1.y : v2.y;
623 r.z = v1.z < v2.z ? v1.z : v2.z;
624 r.w = v1.w < v2.w ? v1.w : v2.w;
625 return r;
626}
627static float2 __attribute__((overloadable)) min(float2 v1, float v2) {
628 float2 r;
629 r.x = v1.x < v2 ? v1.x : v2;
630 r.y = v1.y < v2 ? v1.y : v2;
631 return r;
632}
633static float3 __attribute__((overloadable)) min(float3 v1, float v2) {
634 float3 r;
635 r.x = v1.x < v2 ? v1.x : v2;
636 r.y = v1.y < v2 ? v1.y : v2;
637 r.z = v1.z < v2 ? v1.z : v2;
638 return r;
639}
640static float4 __attribute__((overloadable)) min(float4 v1, float v2) {
641 float4 r;
642 r.x = v1.x < v2 ? v1.x : v2;
643 r.y = v1.y < v2 ? v1.y : v2;
644 r.z = v1.z < v2 ? v1.z : v2;
645 r.w = v1.w < v2 ? v1.w : v2;
646 return r;
647}
Jason Sams22fa3712010-05-19 17:22:57 -0700648
Jason Sams1b937f52010-06-09 14:26:16 -0700649static float __attribute__((overloadable)) mix(float start, float stop, float amount) {
650 return start + (stop - start) * amount;
651}
652static float2 __attribute__((overloadable)) mix(float2 start, float2 stop, float2 amount) {
653 return start + (stop - start) * amount;
654}
655static float3 __attribute__((overloadable)) mix(float3 start, float3 stop, float3 amount) {
656 return start + (stop - start) * amount;
657}
658static float4 __attribute__((overloadable)) mix(float4 start, float4 stop, float4 amount) {
659 return start + (stop - start) * amount;
660}
661static float2 __attribute__((overloadable)) mix(float2 start, float2 stop, float amount) {
662 return start + (stop - start) * amount;
663}
664static float3 __attribute__((overloadable)) mix(float3 start, float3 stop, float amount) {
665 return start + (stop - start) * amount;
666}
667static float4 __attribute__((overloadable)) mix(float4 start, float4 stop, float amount) {
668 return start + (stop - start) * amount;
669}
Jason Sams22fa3712010-05-19 17:22:57 -0700670
Jason Sams1b937f52010-06-09 14:26:16 -0700671static float __attribute__((overloadable)) radians(float degrees) {
672 return degrees * (M_PI / 180.f);
673}
674DEF_FUNC_1(radians)
Jason Sams22fa3712010-05-19 17:22:57 -0700675
// step (scalar): 0 when v < edge, 1 otherwise (including v == edge).
static float __attribute__((overloadable)) step(float edge, float v) {
    if (v < edge) {
        return 0.f;
    }
    return 1.f;
}
679static float2 __attribute__((overloadable)) step(float2 edge, float2 v) {
680 float2 r;
681 r.x = (v.x < edge.x) ? 0.f : 1.f;
682 r.y = (v.y < edge.y) ? 0.f : 1.f;
683 return r;
684}
685static float3 __attribute__((overloadable)) step(float3 edge, float3 v) {
686 float3 r;
687 r.x = (v.x < edge.x) ? 0.f : 1.f;
688 r.y = (v.y < edge.y) ? 0.f : 1.f;
689 r.z = (v.z < edge.z) ? 0.f : 1.f;
690 return r;
691}
692static float4 __attribute__((overloadable)) step(float4 edge, float4 v) {
693 float4 r;
694 r.x = (v.x < edge.x) ? 0.f : 1.f;
695 r.y = (v.y < edge.y) ? 0.f : 1.f;
696 r.z = (v.z < edge.z) ? 0.f : 1.f;
697 r.w = (v.w < edge.w) ? 0.f : 1.f;
698 return r;
699}
700static float2 __attribute__((overloadable)) step(float2 edge, float v) {
701 float2 r;
702 r.x = (v < edge.x) ? 0.f : 1.f;
703 r.y = (v < edge.y) ? 0.f : 1.f;
704 return r;
705}
706static float3 __attribute__((overloadable)) step(float3 edge, float v) {
707 float3 r;
708 r.x = (v < edge.x) ? 0.f : 1.f;
709 r.y = (v < edge.y) ? 0.f : 1.f;
710 r.z = (v < edge.z) ? 0.f : 1.f;
711 return r;
712}
713static float4 __attribute__((overloadable)) step(float4 edge, float v) {
714 float4 r;
715 r.x = (v < edge.x) ? 0.f : 1.f;
716 r.y = (v < edge.y) ? 0.f : 1.f;
717 r.z = (v < edge.z) ? 0.f : 1.f;
718 r.w = (v < edge.w) ? 0.f : 1.f;
719 return r;
720}
Jason Sams22fa3712010-05-19 17:22:57 -0700721
722extern float __attribute__((overloadable)) smoothstep(float, float, float);
723extern float2 __attribute__((overloadable)) smoothstep(float2, float2, float2);
724extern float3 __attribute__((overloadable)) smoothstep(float3, float3, float3);
725extern float4 __attribute__((overloadable)) smoothstep(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700726extern float2 __attribute__((overloadable)) smoothstep(float, float, float2);
727extern float3 __attribute__((overloadable)) smoothstep(float, float, float3);
728extern float4 __attribute__((overloadable)) smoothstep(float, float, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700729
// sign (scalar): 1 for positive v, -1 for negative v; any other value
// (zero of either sign, NaN) is returned unchanged.
static float __attribute__((overloadable)) sign(float v) {
    if (v > 0) {
        return 1.f;
    }
    if (v < 0) {
        return -1.f;
    }
    return v;
}
735DEF_FUNC_1(sign)
Jason Sams22fa3712010-05-19 17:22:57 -0700736
737// 6.11.5
Jason Sams1b937f52010-06-09 14:26:16 -0700738static float3 __attribute__((overloadable)) cross(float3 lhs, float3 rhs) {
739 float3 r;
740 r.x = lhs.y * rhs.z - lhs.z * rhs.y;
741 r.y = lhs.z * rhs.x - lhs.x * rhs.z;
742 r.z = lhs.x * rhs.y - lhs.y * rhs.x;
743 return r;
744}
Jason Sams22fa3712010-05-19 17:22:57 -0700745
Jason Sams1b937f52010-06-09 14:26:16 -0700746static float4 __attribute__((overloadable)) cross(float4 lhs, float4 rhs) {
747 float4 r;
748 r.x = lhs.y * rhs.z - lhs.z * rhs.y;
749 r.y = lhs.z * rhs.x - lhs.x * rhs.z;
750 r.z = lhs.x * rhs.y - lhs.y * rhs.x;
751 r.w = 0.f;
752 return r;
753}
Jason Sams22fa3712010-05-19 17:22:57 -0700754
Jason Sams1b937f52010-06-09 14:26:16 -0700755static float __attribute__((overloadable)) dot(float lhs, float rhs) {
756 return lhs * rhs;
757}
758static float __attribute__((overloadable)) dot(float2 lhs, float2 rhs) {
759 return lhs.x*rhs.x + lhs.y*rhs.y;
760}
761static float __attribute__((overloadable)) dot(float3 lhs, float3 rhs) {
762 return lhs.x*rhs.x + lhs.y*rhs.y + lhs.z*rhs.z;
763}
764static float __attribute__((overloadable)) dot(float4 lhs, float4 rhs) {
765 return lhs.x*rhs.x + lhs.y*rhs.y + lhs.z*rhs.z + lhs.w*rhs.w;
766}
Jason Sams22fa3712010-05-19 17:22:57 -0700767
// length (scalar): the magnitude of v.  A length is never negative, so a
// negative input is negated rather than returned as-is.
static float __attribute__((overloadable)) length(float v) {
    return v < 0.f ? -v : v;
}
771static float __attribute__((overloadable)) length(float2 v) {
772 return sqrt(v.x*v.x + v.y*v.y);
773}
774static float __attribute__((overloadable)) length(float3 v) {
775 return sqrt(v.x*v.x + v.y*v.y + v.z*v.z);
776}
777static float __attribute__((overloadable)) length(float4 v) {
778 return sqrt(v.x*v.x + v.y*v.y + v.z*v.z + v.w*v.w);
779}
Jason Sams22fa3712010-05-19 17:22:57 -0700780
// distance (scalar): magnitude of lhs - rhs.  Computed directly so the
// result is non-negative regardless of argument order.
static float __attribute__((overloadable)) distance(float lhs, float rhs) {
    float d = lhs - rhs;
    return d < 0.f ? -d : d;
}
784static float __attribute__((overloadable)) distance(float2 lhs, float2 rhs) {
785 return length(lhs - rhs);
786}
787static float __attribute__((overloadable)) distance(float3 lhs, float3 rhs) {
788 return length(lhs - rhs);
789}
790static float __attribute__((overloadable)) distance(float4 lhs, float4 rhs) {
791 return length(lhs - rhs);
792}
Jason Sams22fa3712010-05-19 17:22:57 -0700793
// normalize (scalar): the unit "vector" pointing the same way as v, i.e.
// 1 for positive v and -1 for negative v.  Zero (and NaN) is returned
// unchanged, since it has no direction to preserve.
static float __attribute__((overloadable)) normalize(float v) {
    if (v > 0.f) {
        return 1.f;
    }
    if (v < 0.f) {
        return -1.f;
    }
    return v;
}
797static float2 __attribute__((overloadable)) normalize(float2 v) {
798 return v / length(v);
799}
800static float3 __attribute__((overloadable)) normalize(float3 v) {
801 return v / length(v);
802}
803static float4 __attribute__((overloadable)) normalize(float4 v) {
804 return v / length(v);
805}
806
Stephen Hines47416532011-01-11 14:38:18 -0800807#undef CVT_FUNC
808#undef CVT_FUNC_2
809#undef DEF_FUNC_1
810#undef DEF_FUNC_1_RI
811#undef DEF_FUNC_2
812#undef DEF_FUNC_2F
Jason Sams1b937f52010-06-09 14:26:16 -0700813
814#endif