blob: b9bb1f729f4235f2b4e198937f6a0d67334cf34b [file] [log] [blame]
Jason Sams1b937f52010-06-09 14:26:16 -07001#ifndef __RS_CL_RSH__
2#define __RS_CL_RSH__
3
4#define M_PI 3.14159265358979323846264338327950288f /* pi */
5
6
7// Conversions
/*
 * CVT_FUNC_2(typeout, typein)
 * Emits convert_<typeout>2/3/4() overloads taking a <typein>2/3/4 vector.
 * Each component is converted with a plain C cast to <typeout>.
 */
#define CVT_FUNC_2(typeout, typein) \
static typeout##2 __attribute__((overloadable)) convert_##typeout##2(typein##2 v) { \
    typeout##2 out; \
    out.x = (typeout)v.x; \
    out.y = (typeout)v.y; \
    return out; \
} \
static typeout##3 __attribute__((overloadable)) convert_##typeout##3(typein##3 v) { \
    typeout##3 out; \
    out.x = (typeout)v.x; \
    out.y = (typeout)v.y; \
    out.z = (typeout)v.z; \
    return out; \
} \
static typeout##4 __attribute__((overloadable)) convert_##typeout##4(typein##4 v) { \
    typeout##4 out; \
    out.x = (typeout)v.x; \
    out.y = (typeout)v.y; \
    out.z = (typeout)v.z; \
    out.w = (typeout)v.w; \
    return out; \
}
21
22#define CVT_FUNC(type) CVT_FUNC_2(type, uchar) \
23 CVT_FUNC_2(type, char) \
24 CVT_FUNC_2(type, ushort) \
25 CVT_FUNC_2(type, short) \
Jason Sams1b937f52010-06-09 14:26:16 -070026 CVT_FUNC_2(type, uint) \
Stephen Hines47416532011-01-11 14:38:18 -080027 CVT_FUNC_2(type, int) \
Jason Sams1b937f52010-06-09 14:26:16 -070028 CVT_FUNC_2(type, float)
29
30CVT_FUNC(char)
31CVT_FUNC(uchar)
32CVT_FUNC(short)
33CVT_FUNC(ushort)
34CVT_FUNC(int)
35CVT_FUNC(uint)
36CVT_FUNC(float)
37
38
39
Jason Sams22fa3712010-05-19 17:22:57 -070040// Float ops, 6.11.2
41
/*
 * DEF_FUNC_1(fnc)
 * Given an existing scalar overload float fnc(float), emits float2/float3/
 * float4 overloads that apply fnc to each component independently.
 */
#define DEF_FUNC_1(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 v) { \
    float2 out = {fnc(v.x), fnc(v.y)}; \
    return out; \
} \
static float3 __attribute__((overloadable)) fnc(float3 v) { \
    float3 out = {fnc(v.x), fnc(v.y), fnc(v.z)}; \
    return out; \
} \
static float4 __attribute__((overloadable)) fnc(float4 v) { \
    float4 out = {fnc(v.x), fnc(v.y), fnc(v.z), fnc(v.w)}; \
    return out; \
}
64
/*
 * DEF_FUNC_1_RI(fnc)
 * Like DEF_FUNC_1, but for functions that take float components and whose
 * vector overloads return int2/int3/int4.
 */
#define DEF_FUNC_1_RI(fnc) \
static int2 __attribute__((overloadable)) fnc(float2 v) { \
    int2 out = {fnc(v.x), fnc(v.y)}; \
    return out; \
} \
static int3 __attribute__((overloadable)) fnc(float3 v) { \
    int3 out = {fnc(v.x), fnc(v.y), fnc(v.z)}; \
    return out; \
} \
static int4 __attribute__((overloadable)) fnc(float4 v) { \
    int4 out = {fnc(v.x), fnc(v.y), fnc(v.z), fnc(v.w)}; \
    return out; \
}
87
/*
 * DEF_FUNC_2(fnc)
 * Given an existing scalar overload float fnc(float, float), emits float2/
 * float3/float4 overloads that apply fnc to matching components of v1 and v2.
 *
 * The float4 overload pairs v1.w with v2.w; it previously paired v1.w with
 * v2.z, giving a wrong fourth lane for every function built from this macro.
 */
#define DEF_FUNC_2(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 v1, float2 v2) { \
    float2 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    return r; \
} \
static float3 __attribute__((overloadable)) fnc(float3 v1, float3 v2) { \
    float3 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    return r; \
} \
static float4 __attribute__((overloadable)) fnc(float4 v1, float4 v2) { \
    float4 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    r.w = fnc(v1.w, v2.w); \
    return r; \
}
110
/*
 * DEF_FUNC_2F(fnc)
 * Given an existing scalar overload fnc(float, float), emits overloads whose
 * first argument is a float2/float3/float4 and whose second argument is a
 * single float applied to every component.
 */
#define DEF_FUNC_2F(fnc) \
static float2 __attribute__((overloadable)) fnc(float2 v1, float v2) { \
    float2 out = {fnc(v1.x, v2), fnc(v1.y, v2)}; \
    return out; \
} \
static float3 __attribute__((overloadable)) fnc(float3 v1, float v2) { \
    float3 out = {fnc(v1.x, v2), fnc(v1.y, v2), fnc(v1.z, v2)}; \
    return out; \
} \
static float4 __attribute__((overloadable)) fnc(float4 v1, float v2) { \
    float4 out = {fnc(v1.x, v2), fnc(v1.y, v2), fnc(v1.z, v2), fnc(v1.w, v2)}; \
    return out; \
}
133
134
Jason Sams22fa3712010-05-19 17:22:57 -0700135extern float __attribute__((overloadable)) acos(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700136DEF_FUNC_1(acos)
Jason Sams22fa3712010-05-19 17:22:57 -0700137
138extern float __attribute__((overloadable)) acosh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700139DEF_FUNC_1(acosh)
Jason Sams22fa3712010-05-19 17:22:57 -0700140
Jason Sams1b937f52010-06-09 14:26:16 -0700141static float __attribute__((overloadable)) acospi(float v) {
142 return acos(v) / M_PI;
143}
144DEF_FUNC_1(acospi)
Jason Sams22fa3712010-05-19 17:22:57 -0700145
146extern float __attribute__((overloadable)) asin(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700147DEF_FUNC_1(asin)
Jason Sams22fa3712010-05-19 17:22:57 -0700148
149extern float __attribute__((overloadable)) asinh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700150DEF_FUNC_1(asinh)
Jason Sams22fa3712010-05-19 17:22:57 -0700151
Jason Sams1b937f52010-06-09 14:26:16 -0700152static float __attribute__((overloadable)) asinpi(float v) {
153 return asin(v) / M_PI;
154}
155DEF_FUNC_1(asinpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700156
157extern float __attribute__((overloadable)) atan(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700158DEF_FUNC_1(atan)
Jason Sams22fa3712010-05-19 17:22:57 -0700159
160extern float __attribute__((overloadable)) atan2(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700161DEF_FUNC_2(atan2)
Jason Sams22fa3712010-05-19 17:22:57 -0700162
163extern float __attribute__((overloadable)) atanh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700164DEF_FUNC_1(atanh)
Jason Sams22fa3712010-05-19 17:22:57 -0700165
Jason Sams1b937f52010-06-09 14:26:16 -0700166static float __attribute__((overloadable)) atanpi(float v) {
167 return atan(v) / M_PI;
168}
169DEF_FUNC_1(atanpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700170
Jason Sams1b937f52010-06-09 14:26:16 -0700171static float __attribute__((overloadable)) atan2pi(float y, float x) {
172 return atan2(y, x) / M_PI;
173}
174DEF_FUNC_2(atan2pi)
Jason Sams22fa3712010-05-19 17:22:57 -0700175
176extern float __attribute__((overloadable)) cbrt(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700177DEF_FUNC_1(cbrt)
Jason Sams22fa3712010-05-19 17:22:57 -0700178
179extern float __attribute__((overloadable)) ceil(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700180DEF_FUNC_1(ceil)
Jason Sams22fa3712010-05-19 17:22:57 -0700181
182extern float __attribute__((overloadable)) copysign(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700183DEF_FUNC_2(copysign)
Jason Sams22fa3712010-05-19 17:22:57 -0700184
185extern float __attribute__((overloadable)) cos(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700186DEF_FUNC_1(cos)
Jason Sams22fa3712010-05-19 17:22:57 -0700187
188extern float __attribute__((overloadable)) cosh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700189DEF_FUNC_1(cosh)
Jason Sams22fa3712010-05-19 17:22:57 -0700190
Jason Sams1b937f52010-06-09 14:26:16 -0700191static float __attribute__((overloadable)) cospi(float v) {
192 return cos(v * M_PI);
193}
194DEF_FUNC_1(cospi)
Jason Sams22fa3712010-05-19 17:22:57 -0700195
196extern float __attribute__((overloadable)) erfc(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700197DEF_FUNC_1(erfc)
Jason Sams22fa3712010-05-19 17:22:57 -0700198
199extern float __attribute__((overloadable)) erf(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700200DEF_FUNC_1(erf)
Jason Sams22fa3712010-05-19 17:22:57 -0700201
202extern float __attribute__((overloadable)) exp(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700203DEF_FUNC_1(exp)
Jason Sams22fa3712010-05-19 17:22:57 -0700204
205extern float __attribute__((overloadable)) exp2(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700206DEF_FUNC_1(exp2)
Jason Sams22fa3712010-05-19 17:22:57 -0700207
Jason Sams1b937f52010-06-09 14:26:16 -0700208extern float __attribute__((overloadable)) pow(float, float);
209static float __attribute__((overloadable)) exp10(float v) {
210 return pow(10.f, v);
211}
212DEF_FUNC_1(exp10)
Jason Sams22fa3712010-05-19 17:22:57 -0700213
214extern float __attribute__((overloadable)) expm1(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700215DEF_FUNC_1(expm1)
Jason Sams22fa3712010-05-19 17:22:57 -0700216
217extern float __attribute__((overloadable)) fabs(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700218DEF_FUNC_1(fabs)
Jason Sams22fa3712010-05-19 17:22:57 -0700219
220extern float __attribute__((overloadable)) fdim(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700221DEF_FUNC_2(fdim)
Jason Sams22fa3712010-05-19 17:22:57 -0700222
223extern float __attribute__((overloadable)) floor(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700224DEF_FUNC_1(floor)
Jason Sams22fa3712010-05-19 17:22:57 -0700225
226extern float __attribute__((overloadable)) fma(float, float, float);
227extern float2 __attribute__((overloadable)) fma(float2, float2, float2);
228extern float3 __attribute__((overloadable)) fma(float3, float3, float3);
229extern float4 __attribute__((overloadable)) fma(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700230
231extern float __attribute__((overloadable)) fmax(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700232DEF_FUNC_2(fmax);
233DEF_FUNC_2F(fmax);
Jason Sams22fa3712010-05-19 17:22:57 -0700234
235extern float __attribute__((overloadable)) fmin(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700236DEF_FUNC_2(fmin);
237DEF_FUNC_2F(fmin);
Jason Sams22fa3712010-05-19 17:22:57 -0700238
239extern float __attribute__((overloadable)) fmod(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700240DEF_FUNC_2(fmod)
Jason Sams22fa3712010-05-19 17:22:57 -0700241
Jason Sams1b937f52010-06-09 14:26:16 -0700242static float __attribute__((overloadable)) fract(float v, float *iptr) {
243 int i = (int)floor(v);
244 iptr[0] = i;
245 return fmin(v - i, 0x1.fffffep-1f);
246}
247static float2 __attribute__((overloadable)) fract(float2 v, float2 *iptr) {
248 float t[2];
249 float2 r;
250 r.x = fract(v.x, &t[0]);
251 r.y = fract(v.y, &t[1]);
252 iptr[0] = t[0];
253 iptr[1] = t[1];
254 return r;
255}
256static float3 __attribute__((overloadable)) fract(float3 v, float3 *iptr) {
257 float t[3];
258 float3 r;
259 r.x = fract(v.x, &t[0]);
260 r.y = fract(v.y, &t[1]);
261 r.z = fract(v.z, &t[2]);
262 iptr[0] = t[0];
263 iptr[1] = t[1];
264 iptr[2] = t[2];
265 return r;
266}
267static float4 __attribute__((overloadable)) fract(float4 v, float4 *iptr) {
268 float t[4];
269 float4 r;
270 r.x = fract(v.x, &t[0]);
271 r.y = fract(v.y, &t[1]);
272 r.z = fract(v.z, &t[2]);
273 r.w = fract(v.w, &t[3]);
274 iptr[0] = t[0];
275 iptr[1] = t[1];
276 iptr[2] = t[2];
277 iptr[3] = t[3];
278 return r;
279}
Jason Sams22fa3712010-05-19 17:22:57 -0700280
281extern float __attribute__((overloadable)) frexp(float, float *);
282extern float2 __attribute__((overloadable)) frexp(float2, float2 *);
283extern float3 __attribute__((overloadable)) frexp(float3, float3 *);
284extern float4 __attribute__((overloadable)) frexp(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700285
286extern float __attribute__((overloadable)) hypot(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700287DEF_FUNC_2(hypot)
Jason Sams22fa3712010-05-19 17:22:57 -0700288
289extern int __attribute__((overloadable)) ilogb(float);
Stephen Hines47416532011-01-11 14:38:18 -0800290DEF_FUNC_1_RI(ilogb)
Jason Sams22fa3712010-05-19 17:22:57 -0700291
292extern float __attribute__((overloadable)) ldexp(float, int);
293extern float2 __attribute__((overloadable)) ldexp(float2, int2);
294extern float3 __attribute__((overloadable)) ldexp(float3, int3);
295extern float4 __attribute__((overloadable)) ldexp(float4, int4);
Jason Sams22fa3712010-05-19 17:22:57 -0700296extern float2 __attribute__((overloadable)) ldexp(float2, int);
297extern float3 __attribute__((overloadable)) ldexp(float3, int);
298extern float4 __attribute__((overloadable)) ldexp(float4, int);
Jason Sams22fa3712010-05-19 17:22:57 -0700299
300extern float __attribute__((overloadable)) lgamma(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700301DEF_FUNC_1(lgamma)
Jason Sams22fa3712010-05-19 17:22:57 -0700302extern float __attribute__((overloadable)) lgamma(float, float *);
303extern float2 __attribute__((overloadable)) lgamma(float2, float2 *);
304extern float3 __attribute__((overloadable)) lgamma(float3, float3 *);
305extern float4 __attribute__((overloadable)) lgamma(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700306
307extern float __attribute__((overloadable)) log(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700308DEF_FUNC_1(log)
Jason Sams22fa3712010-05-19 17:22:57 -0700309
Jason Sams22fa3712010-05-19 17:22:57 -0700310
311extern float __attribute__((overloadable)) log10(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700312DEF_FUNC_1(log10)
313
314static float __attribute__((overloadable)) log2(float v) {
315 return log10(v) / log10(2.f);
316}
317DEF_FUNC_1(log2)
Jason Sams22fa3712010-05-19 17:22:57 -0700318
319extern float __attribute__((overloadable)) log1p(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700320DEF_FUNC_1(log1p)
Jason Sams22fa3712010-05-19 17:22:57 -0700321
322extern float __attribute__((overloadable)) logb(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700323DEF_FUNC_1(logb)
Jason Sams22fa3712010-05-19 17:22:57 -0700324
325extern float __attribute__((overloadable)) mad(float, float, float);
326extern float2 __attribute__((overloadable)) mad(float2, float2, float2);
327extern float3 __attribute__((overloadable)) mad(float3, float3, float3);
328extern float4 __attribute__((overloadable)) mad(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700329
330extern float __attribute__((overloadable)) modf(float, float *);
331extern float2 __attribute__((overloadable)) modf(float2, float2 *);
332extern float3 __attribute__((overloadable)) modf(float3, float3 *);
333extern float4 __attribute__((overloadable)) modf(float4, float4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700334
Jason Sams1b937f52010-06-09 14:26:16 -0700335//extern float __attribute__((overloadable)) nan(uint);
Jason Sams22fa3712010-05-19 17:22:57 -0700336
337extern float __attribute__((overloadable)) nextafter(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700338DEF_FUNC_2(nextafter)
Jason Sams22fa3712010-05-19 17:22:57 -0700339
Jason Sams1b937f52010-06-09 14:26:16 -0700340DEF_FUNC_2(pow)
Jason Sams22fa3712010-05-19 17:22:57 -0700341
Jason Sams1b937f52010-06-09 14:26:16 -0700342static float __attribute__((overloadable)) pown(float v, int p) {
343 return pow(v, (float)p);
344}
345static float2 __attribute__((overloadable)) pown(float2 v, int2 p) {
346 return pow(v, (float2)p);
347}
348static float3 __attribute__((overloadable)) pown(float3 v, int3 p) {
349 return pow(v, (float3)p);
350}
351static float4 __attribute__((overloadable)) pown(float4 v, int4 p) {
352 return pow(v, (float4)p);
353}
Jason Sams22fa3712010-05-19 17:22:57 -0700354
Jason Sams1b937f52010-06-09 14:26:16 -0700355static float __attribute__((overloadable)) powr(float v, float p) {
356 return pow(v, p);
357}
358static float2 __attribute__((overloadable)) powr(float2 v, float2 p) {
359 return pow(v, p);
360}
361static float3 __attribute__((overloadable)) powr(float3 v, float3 p) {
362 return pow(v, p);
363}
364static float4 __attribute__((overloadable)) powr(float4 v, float4 p) {
365 return pow(v, p);
366}
Jason Sams22fa3712010-05-19 17:22:57 -0700367
368extern float __attribute__((overloadable)) remainder(float, float);
Jason Sams1b937f52010-06-09 14:26:16 -0700369DEF_FUNC_2(remainder)
Jason Sams22fa3712010-05-19 17:22:57 -0700370
Stephen Hines47416532011-01-11 14:38:18 -0800371extern float __attribute__((overloadable)) remquo(float, float, int *);
372extern float2 __attribute__((overloadable)) remquo(float2, float2, int2 *);
373extern float3 __attribute__((overloadable)) remquo(float3, float3, int3 *);
374extern float4 __attribute__((overloadable)) remquo(float4, float4, int4 *);
Jason Sams22fa3712010-05-19 17:22:57 -0700375
376extern float __attribute__((overloadable)) rint(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700377DEF_FUNC_1(rint)
Jason Sams22fa3712010-05-19 17:22:57 -0700378
Jason Sams1b937f52010-06-09 14:26:16 -0700379static float __attribute__((overloadable)) rootn(float v, int r) {
380 return pow(v, 1.f / r);
381}
382static float2 __attribute__((overloadable)) rootn(float2 v, int2 r) {
383 float2 t = {1.f / r.x, 1.f / r.y};
384 return pow(v, t);
385}
386static float3 __attribute__((overloadable)) rootn(float3 v, int3 r) {
387 float3 t = {1.f / r.x, 1.f / r.y, 1.f / r.z};
388 return pow(v, t);
389}
390static float4 __attribute__((overloadable)) rootn(float4 v, int4 r) {
391 float4 t = {1.f / r.x, 1.f / r.y, 1.f / r.z, 1.f / r.w};
392 return pow(v, t);
393}
Jason Sams22fa3712010-05-19 17:22:57 -0700394
395extern float __attribute__((overloadable)) round(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700396DEF_FUNC_1(round)
Jason Sams22fa3712010-05-19 17:22:57 -0700397
398extern float __attribute__((overloadable)) sqrt(float);
Stephen Hines47416532011-01-11 14:38:18 -0800399static float __attribute__((overloadable)) rsqrt(float v) {
Jason Sams1b937f52010-06-09 14:26:16 -0700400 return 1.f / sqrt(v);
401}
Stephen Hines47416532011-01-11 14:38:18 -0800402DEF_FUNC_1(rsqrt)
Jason Sams1b937f52010-06-09 14:26:16 -0700403
404extern float __attribute__((overloadable)) sin(float);
405DEF_FUNC_1(sin)
406
407static float __attribute__((overloadable)) sincos(float v, float *cosptr) {
408 *cosptr = cos(v);
409 return sin(v);
410}
411static float2 __attribute__((overloadable)) sincos(float2 v, float2 *cosptr) {
412 *cosptr = cos(v);
413 return sin(v);
414}
415static float3 __attribute__((overloadable)) sincos(float3 v, float3 *cosptr) {
416 *cosptr = cos(v);
417 return sin(v);
418}
419static float4 __attribute__((overloadable)) sincos(float4 v, float4 *cosptr) {
420 *cosptr = cos(v);
421 return sin(v);
422}
423
424extern float __attribute__((overloadable)) sinh(float);
425DEF_FUNC_1(sinh)
426
427static float __attribute__((overloadable)) sinpi(float v) {
428 return sin(v * M_PI);
429}
430DEF_FUNC_1(sinpi)
431
432DEF_FUNC_1(sqrt)
Jason Sams22fa3712010-05-19 17:22:57 -0700433
434extern float __attribute__((overloadable)) tan(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700435DEF_FUNC_1(tan)
Jason Sams22fa3712010-05-19 17:22:57 -0700436
437extern float __attribute__((overloadable)) tanh(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700438DEF_FUNC_1(tanh)
Jason Sams22fa3712010-05-19 17:22:57 -0700439
Jason Sams1b937f52010-06-09 14:26:16 -0700440static float __attribute__((overloadable)) tanpi(float v) {
441 return tan(v * M_PI);
442}
443DEF_FUNC_1(tanpi)
Jason Sams22fa3712010-05-19 17:22:57 -0700444
445extern float __attribute__((overloadable)) tgamma(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700446DEF_FUNC_1(tgamma)
Jason Sams22fa3712010-05-19 17:22:57 -0700447
448extern float __attribute__((overloadable)) trunc(float);
Jason Sams1b937f52010-06-09 14:26:16 -0700449DEF_FUNC_1(trunc)
Jason Sams22fa3712010-05-19 17:22:57 -0700450
451// Int ops (partial), 6.11.3
Jason Sams22fa3712010-05-19 17:22:57 -0700452
/*
 * DEF_RIFUNC_1(typeout, typein, fnc)
 * Declares the extern scalar overload typeout fnc(typein) and emits 2/3/4-wide
 * vector overloads that apply it to each component.
 */
#define DEF_RIFUNC_1(typeout, typein, fnc) \
extern typeout __attribute__((overloadable)) fnc(typein); \
static typeout##2 __attribute__((overloadable)) fnc(typein##2 v) { \
    typeout##2 out = {fnc(v.x), fnc(v.y)}; \
    return out; \
} \
static typeout##3 __attribute__((overloadable)) fnc(typein##3 v) { \
    typeout##3 out = {fnc(v.x), fnc(v.y), fnc(v.z)}; \
    return out; \
} \
static typeout##4 __attribute__((overloadable)) fnc(typein##4 v) { \
    typeout##4 out = {fnc(v.x), fnc(v.y), fnc(v.z), fnc(v.w)}; \
    return out; \
}

/* DEF_UIFUNC_1(fnc): signed char/short/int input, unsigned result of the same width. */
#define DEF_UIFUNC_1(fnc) \
    DEF_RIFUNC_1(uchar, char, fnc) \
    DEF_RIFUNC_1(ushort, short, fnc) \
    DEF_RIFUNC_1(uint, int, fnc)

/* DEF_IFUNC_1(fnc): result type equals input type, for all six integer element types. */
#define DEF_IFUNC_1(fnc) \
    DEF_RIFUNC_1(uchar, uchar, fnc) \
    DEF_RIFUNC_1(char, char, fnc) \
    DEF_RIFUNC_1(ushort, ushort, fnc) \
    DEF_RIFUNC_1(short, short, fnc) \
    DEF_RIFUNC_1(uint, uint, fnc) \
    DEF_RIFUNC_1(int, int, fnc)
Jason Sams22fa3712010-05-19 17:22:57 -0700489
/*
 * DEF_RIFUNC_2(type, fnc, body)
 * Emits a scalar overload type fnc(type v1, type v2) that returns `body`
 * (an expression over v1 and v2), plus 2/3/4-wide vector overloads that apply
 * the scalar overload to matching components.
 *
 * The macro ends on its final '}' with no line continuation. It previously
 * ended with a dangling backslash, so it only terminated correctly because
 * the following source line happened to be blank.
 */
#define DEF_RIFUNC_2(type, fnc, body) \
static type __attribute__((overloadable)) fnc(type v1, type v2) { \
    return body; \
} \
static type##2 __attribute__((overloadable)) fnc(type##2 v1, type##2 v2) { \
    type##2 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    return r; \
} \
static type##3 __attribute__((overloadable)) fnc(type##3 v1, type##3 v2) { \
    type##3 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    return r; \
} \
static type##4 __attribute__((overloadable)) fnc(type##4 v1, type##4 v2) { \
    type##4 r; \
    r.x = fnc(v1.x, v2.x); \
    r.y = fnc(v1.y, v2.y); \
    r.z = fnc(v1.z, v2.z); \
    r.w = fnc(v1.w, v2.w); \
    return r; \
}

/*
 * DEF_IFUNC_2(fnc, body)
 * Instantiates DEF_RIFUNC_2 for uchar, char, ushort, short, uint, int and float.
 */
#define DEF_IFUNC_2(fnc, body) \
DEF_RIFUNC_2(uchar, fnc, body) \
DEF_RIFUNC_2(char, fnc, body) \
DEF_RIFUNC_2(ushort, fnc, body) \
DEF_RIFUNC_2(short, fnc, body) \
DEF_RIFUNC_2(uint, fnc, body) \
DEF_RIFUNC_2(int, fnc, body) \
DEF_RIFUNC_2(float, fnc, body)
524
525DEF_UIFUNC_1(abs)
526DEF_IFUNC_1(clz)
527
528DEF_IFUNC_2(min, (v1 < v2 ? v1 : v2))
529DEF_FUNC_2F(min)
530
531DEF_IFUNC_2(max, (v1 > v2 ? v1 : v2))
532DEF_FUNC_2F(max)
Jason Sams22fa3712010-05-19 17:22:57 -0700533
534// 6.11.4
535
/*
 * clamp(amount, low, high): returns low when amount < low, high when
 * amount > high, and amount otherwise. The low bound is tested first.
 */
static float __attribute__((overloadable)) clamp(float amount, float low, float high) {
    if (amount < low) {
        return low;
    }
    if (amount > high) {
        return high;
    }
    return amount;
}
539static float2 __attribute__((overloadable)) clamp(float2 amount, float2 low, float2 high) {
540 float2 r;
541 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
542 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
543 return r;
544}
545static float3 __attribute__((overloadable)) clamp(float3 amount, float3 low, float3 high) {
546 float3 r;
547 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
548 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
549 r.z = amount.z < low.z ? low.z : (amount.z > high.z ? high.z : amount.z);
550 return r;
551}
552static float4 __attribute__((overloadable)) clamp(float4 amount, float4 low, float4 high) {
553 float4 r;
554 r.x = amount.x < low.x ? low.x : (amount.x > high.x ? high.x : amount.x);
555 r.y = amount.y < low.y ? low.y : (amount.y > high.y ? high.y : amount.y);
556 r.z = amount.z < low.z ? low.z : (amount.z > high.z ? high.z : amount.z);
557 r.w = amount.w < low.w ? low.w : (amount.w > high.w ? high.w : amount.w);
558 return r;
559}
560static float2 __attribute__((overloadable)) clamp(float2 amount, float low, float high) {
561 float2 r;
562 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
563 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
564 return r;
565}
566static float3 __attribute__((overloadable)) clamp(float3 amount, float low, float high) {
567 float3 r;
568 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
569 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
570 r.z = amount.z < low ? low : (amount.z > high ? high : amount.z);
571 return r;
572}
573static float4 __attribute__((overloadable)) clamp(float4 amount, float low, float high) {
574 float4 r;
575 r.x = amount.x < low ? low : (amount.x > high ? high : amount.x);
576 r.y = amount.y < low ? low : (amount.y > high ? high : amount.y);
577 r.z = amount.z < low ? low : (amount.z > high ? high : amount.z);
578 r.w = amount.w < low ? low : (amount.w > high ? high : amount.w);
579 return r;
580}
Jason Sams22fa3712010-05-19 17:22:57 -0700581
Jason Sams1b937f52010-06-09 14:26:16 -0700582static float __attribute__((overloadable)) degrees(float radians) {
583 return radians * (180.f / M_PI);
584}
585DEF_FUNC_1(degrees)
Jason Sams22fa3712010-05-19 17:22:57 -0700586
/* mix(start, stop, amount): start + (stop - start) * amount. */
static float __attribute__((overloadable)) mix(float start, float stop, float amount) {
    const float span = stop - start;
    return start + span * amount;
}
590static float2 __attribute__((overloadable)) mix(float2 start, float2 stop, float2 amount) {
591 return start + (stop - start) * amount;
592}
593static float3 __attribute__((overloadable)) mix(float3 start, float3 stop, float3 amount) {
594 return start + (stop - start) * amount;
595}
596static float4 __attribute__((overloadable)) mix(float4 start, float4 stop, float4 amount) {
597 return start + (stop - start) * amount;
598}
599static float2 __attribute__((overloadable)) mix(float2 start, float2 stop, float amount) {
600 return start + (stop - start) * amount;
601}
602static float3 __attribute__((overloadable)) mix(float3 start, float3 stop, float amount) {
603 return start + (stop - start) * amount;
604}
605static float4 __attribute__((overloadable)) mix(float4 start, float4 stop, float amount) {
606 return start + (stop - start) * amount;
607}
Jason Sams22fa3712010-05-19 17:22:57 -0700608
Jason Sams1b937f52010-06-09 14:26:16 -0700609static float __attribute__((overloadable)) radians(float degrees) {
610 return degrees * (M_PI / 180.f);
611}
612DEF_FUNC_1(radians)
Jason Sams22fa3712010-05-19 17:22:57 -0700613
/* step(edge, v): 0 when v < edge, otherwise 1. */
static float __attribute__((overloadable)) step(float edge, float v) {
    if (v < edge) {
        return 0.f;
    }
    return 1.f;
}
617static float2 __attribute__((overloadable)) step(float2 edge, float2 v) {
618 float2 r;
619 r.x = (v.x < edge.x) ? 0.f : 1.f;
620 r.y = (v.y < edge.y) ? 0.f : 1.f;
621 return r;
622}
623static float3 __attribute__((overloadable)) step(float3 edge, float3 v) {
624 float3 r;
625 r.x = (v.x < edge.x) ? 0.f : 1.f;
626 r.y = (v.y < edge.y) ? 0.f : 1.f;
627 r.z = (v.z < edge.z) ? 0.f : 1.f;
628 return r;
629}
630static float4 __attribute__((overloadable)) step(float4 edge, float4 v) {
631 float4 r;
632 r.x = (v.x < edge.x) ? 0.f : 1.f;
633 r.y = (v.y < edge.y) ? 0.f : 1.f;
634 r.z = (v.z < edge.z) ? 0.f : 1.f;
635 r.w = (v.w < edge.w) ? 0.f : 1.f;
636 return r;
637}
638static float2 __attribute__((overloadable)) step(float2 edge, float v) {
639 float2 r;
640 r.x = (v < edge.x) ? 0.f : 1.f;
641 r.y = (v < edge.y) ? 0.f : 1.f;
642 return r;
643}
644static float3 __attribute__((overloadable)) step(float3 edge, float v) {
645 float3 r;
646 r.x = (v < edge.x) ? 0.f : 1.f;
647 r.y = (v < edge.y) ? 0.f : 1.f;
648 r.z = (v < edge.z) ? 0.f : 1.f;
649 return r;
650}
651static float4 __attribute__((overloadable)) step(float4 edge, float v) {
652 float4 r;
653 r.x = (v < edge.x) ? 0.f : 1.f;
654 r.y = (v < edge.y) ? 0.f : 1.f;
655 r.z = (v < edge.z) ? 0.f : 1.f;
656 r.w = (v < edge.w) ? 0.f : 1.f;
657 return r;
658}
Jason Sams22fa3712010-05-19 17:22:57 -0700659
660extern float __attribute__((overloadable)) smoothstep(float, float, float);
661extern float2 __attribute__((overloadable)) smoothstep(float2, float2, float2);
662extern float3 __attribute__((overloadable)) smoothstep(float3, float3, float3);
663extern float4 __attribute__((overloadable)) smoothstep(float4, float4, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700664extern float2 __attribute__((overloadable)) smoothstep(float, float, float2);
665extern float3 __attribute__((overloadable)) smoothstep(float, float, float3);
666extern float4 __attribute__((overloadable)) smoothstep(float, float, float4);
Jason Sams22fa3712010-05-19 17:22:57 -0700667
/*
 * sign(v): 1 for v > 0, -1 for v < 0; any other input (neither greater nor
 * less than zero) is returned unchanged.
 */
static float __attribute__((overloadable)) sign(float v) {
    return (v > 0) ? 1.f : ((v < 0) ? -1.f : v);
}
673DEF_FUNC_1(sign)
Jason Sams22fa3712010-05-19 17:22:57 -0700674
675// 6.11.5
Jason Sams1b937f52010-06-09 14:26:16 -0700676static float3 __attribute__((overloadable)) cross(float3 lhs, float3 rhs) {
677 float3 r;
678 r.x = lhs.y * rhs.z - lhs.z * rhs.y;
679 r.y = lhs.z * rhs.x - lhs.x * rhs.z;
680 r.z = lhs.x * rhs.y - lhs.y * rhs.x;
681 return r;
682}
Jason Sams22fa3712010-05-19 17:22:57 -0700683
Jason Sams1b937f52010-06-09 14:26:16 -0700684static float4 __attribute__((overloadable)) cross(float4 lhs, float4 rhs) {
685 float4 r;
686 r.x = lhs.y * rhs.z - lhs.z * rhs.y;
687 r.y = lhs.z * rhs.x - lhs.x * rhs.z;
688 r.z = lhs.x * rhs.y - lhs.y * rhs.x;
689 r.w = 0.f;
690 return r;
691}
Jason Sams22fa3712010-05-19 17:22:57 -0700692
/* dot(lhs, rhs) for scalars: the plain product of the two values. */
static float __attribute__((overloadable)) dot(float lhs, float rhs) {
    const float product = lhs * rhs;
    return product;
}
696static float __attribute__((overloadable)) dot(float2 lhs, float2 rhs) {
697 return lhs.x*rhs.x + lhs.y*rhs.y;
698}
699static float __attribute__((overloadable)) dot(float3 lhs, float3 rhs) {
700 return lhs.x*rhs.x + lhs.y*rhs.y + lhs.z*rhs.z;
701}
702static float __attribute__((overloadable)) dot(float4 lhs, float4 rhs) {
703 return lhs.x*rhs.x + lhs.y*rhs.y + lhs.z*rhs.z + lhs.w*rhs.w;
704}
Jason Sams22fa3712010-05-19 17:22:57 -0700705
/*
 * length(v) for a scalar: the magnitude |v|.
 *
 * This previously returned v unchanged, so a negative input produced a
 * negative length, unlike the vector overloads, which take a square root
 * and so are non-negative for finite input.
 */
static float __attribute__((overloadable)) length(float v) {
    return fabs(v);
}
709static float __attribute__((overloadable)) length(float2 v) {
710 return sqrt(v.x*v.x + v.y*v.y);
711}
712static float __attribute__((overloadable)) length(float3 v) {
713 return sqrt(v.x*v.x + v.y*v.y + v.z*v.z);
714}
715static float __attribute__((overloadable)) length(float4 v) {
716 return sqrt(v.x*v.x + v.y*v.y + v.z*v.z + v.w*v.w);
717}
Jason Sams22fa3712010-05-19 17:22:57 -0700718
/*
 * distance(lhs, rhs) for scalars: |lhs - rhs|.
 *
 * The absolute value is taken here directly, so the result is non-negative
 * regardless of argument order (it was negative whenever lhs < rhs).
 */
static float __attribute__((overloadable)) distance(float lhs, float rhs) {
    return fabs(lhs - rhs);
}
722static float __attribute__((overloadable)) distance(float2 lhs, float2 rhs) {
723 return length(lhs - rhs);
724}
725static float __attribute__((overloadable)) distance(float3 lhs, float3 rhs) {
726 return length(lhs - rhs);
727}
728static float __attribute__((overloadable)) distance(float4 lhs, float4 rhs) {
729 return length(lhs - rhs);
730}
Jason Sams22fa3712010-05-19 17:22:57 -0700731
/*
 * normalize(v) for a scalar: 1 for v > 0, -1 for v < 0; any other input
 * (zero, or a value that compares neither way) is returned unchanged.
 *
 * This previously ignored v and always returned 1, which flipped the
 * direction of negative inputs and gave 1 for zero.
 */
static float __attribute__((overloadable)) normalize(float v) {
    if (v > 0.f) {
        return 1.f;
    }
    if (v < 0.f) {
        return -1.f;
    }
    return v;
}
735static float2 __attribute__((overloadable)) normalize(float2 v) {
736 return v / length(v);
737}
738static float3 __attribute__((overloadable)) normalize(float3 v) {
739 return v / length(v);
740}
741static float4 __attribute__((overloadable)) normalize(float4 v) {
742 return v / length(v);
743}
744
/* Remove the generator macros so they do not leak to code including this header. */

/* Integer-function generators. */
#undef DEF_IFUNC_2
#undef DEF_RIFUNC_2
#undef DEF_IFUNC_1
#undef DEF_UIFUNC_1
#undef DEF_RIFUNC_1

/* Float-function generators. */
#undef DEF_FUNC_2F
#undef DEF_FUNC_2
#undef DEF_FUNC_1_RI
#undef DEF_FUNC_1

/* Conversion generators. */
#undef CVT_FUNC_2
#undef CVT_FUNC
Jason Sams1b937f52010-06-09 14:26:16 -0700756
757#endif