blob: 55887fa5bdf00008f6b41fb30c08bce6f2bf867d [file] [log] [blame]
Jason Sams87fe59a2011-04-20 15:09:01 -07001/*
Jason Sams709a0972012-11-15 18:18:04 -08002 * Copyright (C) 2011-2012 The Android Open Source Project
Jason Sams87fe59a2011-04-20 15:09:01 -07003 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
Stephen Hines43cfc0c2013-08-15 10:02:11 -070017#if !defined(RS_SERVER) && !defined(RS_COMPATIBILITY_LIB)
Glenn Kasten72f4f4c2011-12-15 09:51:17 -080018#include <cutils/compiler.h>
Tim Murray0b575de2013-03-15 15:56:43 -070019#endif
Glenn Kasten72f4f4c2011-12-15 09:51:17 -080020
Jason Sams87fe59a2011-04-20 15:09:01 -070021#include "rsContext.h"
22#include "rsScriptC.h"
23#include "rsMatrix4x4.h"
24#include "rsMatrix3x3.h"
25#include "rsMatrix2x2.h"
26
Jason Sams709a0972012-11-15 18:18:04 -080027#include "rsCpuCore.h"
28#include "rsCpuScript.h"
Jason Sams87fe59a2011-04-20 15:09:01 -070029
Jason Sams87fe59a2011-04-20 15:09:01 -070030using namespace android;
31using namespace android::renderscript;
32
// Defines SC_<fn>(float): a wrapper that passes its single float argument to
// the function named by `fn` and returns that function's result as a float.
#define EXPORT_F32_FN_F32(fn)                                   \
    float __attribute__((overloadable)) SC_##fn(float x) {      \
        return fn(x);                                           \
    }
37
// Defines SC_<fn>(float, float): a wrapper that passes both float arguments,
// in order, to the function named by `fn` and returns its result as a float.
#define EXPORT_F32_FN_F32_F32(fn)                                       \
    float __attribute__((overloadable)) SC_##fn(float a, float b) {     \
        return fn(a, b);                                                \
    }
Jason Sams87fe59a2011-04-20 15:09:01 -070042
Jason Sams87fe59a2011-04-20 15:09:01 -070043//////////////////////////////////////////////////////////////////////////////
44// Float util
45//////////////////////////////////////////////////////////////////////////////
46
// Gamma function wrapper registered in the symbol table for "_Z6tgammaf".
// When RS_COMPATIBILITY_LIB is defined the call goes to tgamma() instead of
// tgammaf(), to cope with platforms (e.g. Gingerbread) that lack tgammaf.
float SC_tgammaf(float x) {
#if !defined(RS_COMPATIBILITY_LIB)
    return tgammaf(x);
#else
    return tgamma(x);
#endif
}
55
// Returns the magnitude of v as an unsigned 32-bit value.
//
// The magnitude is computed in unsigned arithmetic rather than via abs():
// abs(INT32_MIN) overflows a signed int (undefined behaviour), whereas
// 0u - bits wraps modulo 2^32 and yields the correct result 2147483648.
uint32_t SC_abs_i32(int32_t v) {
    const uint32_t bits = static_cast<uint32_t>(v);
    return (v < 0) ? (0u - bits) : bits;
}
Jason Sams87fe59a2011-04-20 15:09:01 -070057
58static void SC_MatrixLoadRotate(Matrix4x4 *m, float rot, float x, float y, float z) {
59 m->loadRotate(rot, x, y, z);
60}
61static void SC_MatrixLoadScale(Matrix4x4 *m, float x, float y, float z) {
62 m->loadScale(x, y, z);
63}
64static void SC_MatrixLoadTranslate(Matrix4x4 *m, float x, float y, float z) {
65 m->loadTranslate(x, y, z);
66}
67static void SC_MatrixRotate(Matrix4x4 *m, float rot, float x, float y, float z) {
68 m->rotate(rot, x, y, z);
69}
70static void SC_MatrixScale(Matrix4x4 *m, float x, float y, float z) {
71 m->scale(x, y, z);
72}
73static void SC_MatrixTranslate(Matrix4x4 *m, float x, float y, float z) {
74 m->translate(x, y, z);
75}
76
Jason Sams87fe59a2011-04-20 15:09:01 -070077static void SC_MatrixLoadOrtho(Matrix4x4 *m, float l, float r, float b, float t, float n, float f) {
78 m->loadOrtho(l, r, b, t, n, f);
79}
80static void SC_MatrixLoadFrustum(Matrix4x4 *m, float l, float r, float b, float t, float n, float f) {
81 m->loadFrustum(l, r, b, t, n, f);
82}
83static void SC_MatrixLoadPerspective(Matrix4x4 *m, float fovy, float aspect, float near, float far) {
84 m->loadPerspective(fovy, aspect, near, far);
85}
86
87static bool SC_MatrixInverse_4x4(Matrix4x4 *m) {
88 return m->inverse();
89}
90static bool SC_MatrixInverseTranspose_4x4(Matrix4x4 *m) {
91 return m->inverseTranspose();
92}
93static void SC_MatrixTranspose_4x4(Matrix4x4 *m) {
94 m->transpose();
95}
96static void SC_MatrixTranspose_3x3(Matrix3x3 *m) {
97 m->transpose();
98}
99static void SC_MatrixTranspose_2x2(Matrix2x2 *m) {
100 m->transpose();
101}
102
// Returns a pseudo-random float obtained by scaling rand() / RAND_MAX
// (a value in [0, 1]) onto the interval between min and max.
// Draws from the C library's rand() state.
float SC_randf2(float min, float max) {
    const float unit = static_cast<float>(rand()) / RAND_MAX;
    return unit * (max - min) + min;
}
109
// Returns the fractional part of v, i.e. v - floor(v), clamped so the result
// never reaches 1.0f (the cap 0x1.fffffep-1f is the largest float below 1).
//
// The floor is taken in float with floorf() instead of being cast to int:
// converting a value outside the int range (|v| >= 2^31) or NaN to int is
// undefined behaviour and produced garbage fractions for large inputs.
// The clamp matters for tiny negative inputs, where v - floorf(v) rounds up
// to exactly 1.0f.
static float SC_frac(float v) {
    const float fraction = v - floorf(v);
    return fminf(fraction, 0x1.fffffep-1f);
}
114
Tim Murrayd6f1f462013-03-25 16:36:59 -0700115EXPORT_F32_FN_F32(acosf)
116EXPORT_F32_FN_F32(acoshf)
117EXPORT_F32_FN_F32(asinf)
118EXPORT_F32_FN_F32(asinhf)
119EXPORT_F32_FN_F32(atanf)
120EXPORT_F32_FN_F32_F32(atan2f)
121EXPORT_F32_FN_F32(atanhf)
122EXPORT_F32_FN_F32(cbrtf)
123EXPORT_F32_FN_F32(ceilf)
124EXPORT_F32_FN_F32_F32(copysignf)
125EXPORT_F32_FN_F32(cosf)
126EXPORT_F32_FN_F32(coshf)
127EXPORT_F32_FN_F32(erfcf)
128EXPORT_F32_FN_F32(erff)
129EXPORT_F32_FN_F32(expf)
130EXPORT_F32_FN_F32(exp2f)
131EXPORT_F32_FN_F32(expm1f)
132EXPORT_F32_FN_F32_F32(fdimf)
133EXPORT_F32_FN_F32(floorf)
134float SC_fmaf(float u, float t, float v) {return fmaf(u, t, v);}
135EXPORT_F32_FN_F32_F32(fmaxf)
136EXPORT_F32_FN_F32_F32(fminf)
137EXPORT_F32_FN_F32_F32(fmodf)
138float SC_frexpf(float v, int* ptr) {return frexpf(v, ptr);}
139EXPORT_F32_FN_F32_F32(hypotf)
Pirama Arumuga Nainar6fdd0602015-01-13 11:21:13 -0800140int SC_ilogbf(float v) {return ilogbf(v); }
Tim Murrayd6f1f462013-03-25 16:36:59 -0700141float SC_ldexpf(float v, int i) {return ldexpf(v, i);}
142EXPORT_F32_FN_F32(lgammaf)
143float SC_lgammaf_r(float v, int* ptr) {return lgammaf_r(v, ptr);}
144EXPORT_F32_FN_F32(logf)
145EXPORT_F32_FN_F32(log10f)
146EXPORT_F32_FN_F32(log1pf)
147EXPORT_F32_FN_F32(logbf)
148float SC_modff(float v, float* ptr) {return modff(v, ptr);}
149EXPORT_F32_FN_F32_F32(nextafterf)
150EXPORT_F32_FN_F32_F32(powf)
151EXPORT_F32_FN_F32_F32(remainderf)
152float SC_remquof(float t, float v, int* ptr) {return remquof(t, v, ptr);}
153EXPORT_F32_FN_F32(rintf)
154EXPORT_F32_FN_F32(roundf)
155EXPORT_F32_FN_F32(sinf)
156EXPORT_F32_FN_F32(sinhf)
157EXPORT_F32_FN_F32(sqrtf)
158EXPORT_F32_FN_F32(tanf)
159EXPORT_F32_FN_F32(tanhf)
160EXPORT_F32_FN_F32(truncf)
Stephen Hinescadee382013-12-12 13:21:00 -0800161float __attribute__((overloadable)) rsFrac(float f) {
162 return SC_frac(f);
163}
164void __attribute__((overloadable)) rsMatrixLoadRotate(rs_matrix4x4 *m,
165 float rot, float x, float y, float z) {
166 SC_MatrixLoadRotate((Matrix4x4 *) m, rot, x, y, z);
167}
168void __attribute__((overloadable)) rsMatrixLoadScale(rs_matrix4x4 *m,
169 float x, float y, float z) {
170 SC_MatrixLoadScale((Matrix4x4 *) m, x, y, z);
171}
172void __attribute__((overloadable)) rsMatrixLoadTranslate(rs_matrix4x4 *m,
173 float x, float y, float z) {
174 SC_MatrixLoadTranslate((Matrix4x4 *) m, x, y, z);
175}
176void __attribute__((overloadable)) rsMatrixRotate(rs_matrix4x4 *m, float rot,
177 float x, float y, float z) {
178 SC_MatrixRotate((Matrix4x4 *) m, rot, x, y, z);
179}
180void __attribute__((overloadable)) rsMatrixScale(rs_matrix4x4 *m, float x,
181 float y, float z) {
182 SC_MatrixScale((Matrix4x4 *) m, x, y, z);
183}
184void __attribute__((overloadable)) rsMatrixTranslate(rs_matrix4x4 *m, float x,
185 float y, float z) {
186 SC_MatrixTranslate((Matrix4x4 *) m, x, y, z);
187}
188void __attribute__((overloadable)) rsMatrixLoadOrtho(rs_matrix4x4 *m, float l,
189 float r, float b, float t, float n, float f) {
190 SC_MatrixLoadOrtho((Matrix4x4 *) m, l, r, b, t, n, f);
191}
192void __attribute__((overloadable)) rsMatrixLoadFrustum(rs_matrix4x4 *m,
193 float l, float r, float b, float t, float n, float f) {
194 SC_MatrixLoadFrustum((Matrix4x4 *) m, l, r, b, t, n, f);
195}
196void __attribute__((overloadable)) rsMatrixLoadPerspective(rs_matrix4x4 *m,
197 float fovy, float aspect, float near, float far) {
198 SC_MatrixLoadPerspective((Matrix4x4 *) m, fovy, aspect, near, far);
199}
200bool __attribute__((overloadable)) rsMatrixInverse(rs_matrix4x4 *m) {
201 return SC_MatrixInverse_4x4((Matrix4x4 *) m);
202}
203bool __attribute__((overloadable)) rsMatrixInverseTranspose(rs_matrix4x4 *m) {
204 return SC_MatrixInverseTranspose_4x4((Matrix4x4 *) m);
205}
206void __attribute__((overloadable)) rsMatrixTranspose(rs_matrix4x4 *m) {
207 SC_MatrixTranspose_4x4((Matrix4x4 *) m);
208}
209void __attribute__((overloadable)) rsMatrixTranspose(rs_matrix3x3 *m) {
210 SC_MatrixTranspose_3x3((Matrix3x3 *) m);
211}
212void __attribute__((overloadable)) rsMatrixTranspose(rs_matrix2x2 *m) {
213 SC_MatrixTranspose_2x2((Matrix2x2 *) m);
214}
Jason Sams87fe59a2011-04-20 15:09:01 -0700215
216//////////////////////////////////////////////////////////////////////////////
217// Class implementation
218//////////////////////////////////////////////////////////////////////////////
219
// LLVM name mangling reference (Itanium C++ ABI builtin type codes).
// Example: "_Z5atan2ff" is atan2(float, float).
// <builtin-type> ::= v  # void
//                ::= b  # bool
//                ::= c  # char
//                ::= a  # signed char
//                ::= h  # unsigned char
//                ::= s  # short
//                ::= t  # unsigned short
//                ::= i  # int
//                ::= j  # unsigned int
//                ::= l  # long
//                ::= m  # unsigned long
//                ::= x  # long long, __int64
//                ::= y  # unsigned long long, unsigned __int64
//                ::= f  # float
//                ::= d  # double
236
Jason Sams709a0972012-11-15 18:18:04 -0800237static RsdCpuReference::CpuSymbol gSyms[] = {
Jason Sams87fe59a2011-04-20 15:09:01 -0700238 { "_Z4acosf", (void *)&acosf, true },
239 { "_Z5acoshf", (void *)&acoshf, true },
240 { "_Z4asinf", (void *)&asinf, true },
241 { "_Z5asinhf", (void *)&asinhf, true },
242 { "_Z4atanf", (void *)&atanf, true },
243 { "_Z5atan2ff", (void *)&atan2f, true },
244 { "_Z5atanhf", (void *)&atanhf, true },
245 { "_Z4cbrtf", (void *)&cbrtf, true },
246 { "_Z4ceilf", (void *)&ceilf, true },
247 { "_Z8copysignff", (void *)&copysignf, true },
248 { "_Z3cosf", (void *)&cosf, true },
249 { "_Z4coshf", (void *)&coshf, true },
250 { "_Z4erfcf", (void *)&erfcf, true },
251 { "_Z3erff", (void *)&erff, true },
252 { "_Z3expf", (void *)&expf, true },
253 { "_Z4exp2f", (void *)&exp2f, true },
Tim Murray6a9cc722014-05-30 15:07:30 -0700254 { "exp2f", (void *)&exp2f, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700255 { "_Z5expm1f", (void *)&expm1f, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700256 { "_Z4fdimff", (void *)&fdimf, true },
257 { "_Z5floorf", (void *)&floorf, true },
258 { "_Z3fmafff", (void *)&fmaf, true },
259 { "_Z4fmaxff", (void *)&fmaxf, true },
260 { "_Z4fminff", (void *)&fminf, true }, // float fmin(float, float)
261 { "_Z4fmodff", (void *)&fmodf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700262 { "_Z5frexpfPi", (void *)&frexpf, true },
263 { "_Z5hypotff", (void *)&hypotf, true },
264 { "_Z5ilogbf", (void *)&ilogbf, true },
265 { "_Z5ldexpfi", (void *)&ldexpf, true },
266 { "_Z6lgammaf", (void *)&lgammaf, true },
267 { "_Z6lgammafPi", (void *)&lgammaf_r, true },
268 { "_Z3logf", (void *)&logf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700269 { "_Z5log10f", (void *)&log10f, true },
270 { "_Z5log1pf", (void *)&log1pf, true },
271 { "_Z4logbf", (void *)&logbf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700272 { "_Z4modffPf", (void *)&modff, true },
273 //{ "_Z3nanj", (void *)&SC_nan, true },
274 { "_Z9nextafterff", (void *)&nextafterf, true },
275 { "_Z3powff", (void *)&powf, true },
Tim Murray60fe47d2014-05-27 13:29:32 -0700276 { "powf", (void *)&powf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700277 { "_Z9remainderff", (void *)&remainderf, true },
278 { "_Z6remquoffPi", (void *)&remquof, true },
279 { "_Z4rintf", (void *)&rintf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700280 { "_Z5roundf", (void *)&roundf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700281 { "_Z3sinf", (void *)&sinf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700282 { "_Z4sinhf", (void *)&sinhf, true },
283 { "_Z4sqrtf", (void *)&sqrtf, true },
284 { "_Z3tanf", (void *)&tanf, true },
285 { "_Z4tanhf", (void *)&tanhf, true },
Stephen Hines11418c82013-08-14 16:46:21 -0700286 { "_Z6tgammaf", (void *)&SC_tgammaf, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700287 { "_Z5truncf", (void *)&truncf, true },
288
Jason Sams87fe59a2011-04-20 15:09:01 -0700289 //{ "smoothstep", (void *)&, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700290
291 // matrix
Jason Sams87fe59a2011-04-20 15:09:01 -0700292 { "_Z18rsMatrixLoadRotateP12rs_matrix4x4ffff", (void *)&SC_MatrixLoadRotate, true },
293 { "_Z17rsMatrixLoadScaleP12rs_matrix4x4fff", (void *)&SC_MatrixLoadScale, true },
294 { "_Z21rsMatrixLoadTranslateP12rs_matrix4x4fff", (void *)&SC_MatrixLoadTranslate, true },
295 { "_Z14rsMatrixRotateP12rs_matrix4x4ffff", (void *)&SC_MatrixRotate, true },
296 { "_Z13rsMatrixScaleP12rs_matrix4x4fff", (void *)&SC_MatrixScale, true },
297 { "_Z17rsMatrixTranslateP12rs_matrix4x4fff", (void *)&SC_MatrixTranslate, true },
298
Jason Sams87fe59a2011-04-20 15:09:01 -0700299 { "_Z17rsMatrixLoadOrthoP12rs_matrix4x4ffffff", (void *)&SC_MatrixLoadOrtho, true },
300 { "_Z19rsMatrixLoadFrustumP12rs_matrix4x4ffffff", (void *)&SC_MatrixLoadFrustum, true },
301 { "_Z23rsMatrixLoadPerspectiveP12rs_matrix4x4ffff", (void *)&SC_MatrixLoadPerspective, true },
302
303 { "_Z15rsMatrixInverseP12rs_matrix4x4", (void *)&SC_MatrixInverse_4x4, true },
304 { "_Z24rsMatrixInverseTransposeP12rs_matrix4x4", (void *)&SC_MatrixInverseTranspose_4x4, true },
305 { "_Z17rsMatrixTransposeP12rs_matrix4x4", (void *)&SC_MatrixTranspose_4x4, true },
yuyanc84b56e2012-09-11 15:10:14 +0800306 { "_Z17rsMatrixTransposeP12rs_matrix3x3", (void *)&SC_MatrixTranspose_3x3, true },
307 { "_Z17rsMatrixTransposeP12rs_matrix2x2", (void *)&SC_MatrixTranspose_2x2, true },
Jason Sams87fe59a2011-04-20 15:09:01 -0700308
309 // RS Math
Jason Sams87fe59a2011-04-20 15:09:01 -0700310 { "_Z6rsRandff", (void *)&SC_randf2, true },
311 { "_Z6rsFracf", (void *)&SC_frac, true },
312
Chris Wailes44bef6f2014-08-12 13:51:10 -0700313 { nullptr, nullptr, false }
Jason Sams87fe59a2011-04-20 15:09:01 -0700314};
315
Jason Sams709a0972012-11-15 18:18:04 -0800316const RsdCpuReference::CpuSymbol * RsdCpuScriptImpl::lookupSymbolMath(const char *sym) {
317 const RsdCpuReference::CpuSymbol *syms = gSyms;
Jason Sams87fe59a2011-04-20 15:09:01 -0700318
Jason Sams709a0972012-11-15 18:18:04 -0800319 while (syms->fnPtr) {
320 if (!strcmp(syms->name, sym)) {
Jason Sams87fe59a2011-04-20 15:09:01 -0700321 return syms;
322 }
323 syms++;
324 }
Chris Wailes44bef6f2014-08-12 13:51:10 -0700325 return nullptr;
Jason Sams87fe59a2011-04-20 15:09:01 -0700326}
327