blob: 00d9cb1eab65848bab798af83a4f3993904e34ba [file] [log] [blame]
/*
 * Copyright (C) 2011-2012 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
Jason Samsbad80742011-03-16 16:29:28 -070017#include "rsdCore.h"
18#include "rsdBcc.h"
Jason Sams87fe59a2011-04-20 15:09:01 -070019#include "rsdRuntime.h"
Jason Sams807fdc42012-07-25 17:55:39 -070020#include "rsdAllocation.h"
Jason Samsbad80742011-03-16 16:29:28 -070021
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -070022#include <bcc/BCCContext.h>
23#include <bcc/RenderScript/RSCompilerDriver.h>
24#include <bcc/RenderScript/RSExecutable.h>
25#include <bcc/RenderScript/RSInfo.h>
Stephen Hines689821f2011-07-18 17:24:11 -070026
Jason Samsbad80742011-03-16 16:29:28 -070027#include "rsContext.h"
Stephen Hines2980f072012-04-09 18:26:29 -070028#include "rsElement.h"
Jason Samsbad80742011-03-16 16:29:28 -070029#include "rsScriptC.h"
30
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -070031#include "utils/Vector.h"
Jason Samsbad80742011-03-16 16:29:28 -070032#include "utils/Timers.h"
33#include "utils/StopWatch.h"
Jason Samsbad80742011-03-16 16:29:28 -070034
Jason Samsbad80742011-03-16 16:29:28 -070035using namespace android;
36using namespace android::renderscript;
37
38struct DrvScript {
39 int (*mRoot)();
Stephen Hinesee7aa2e2012-01-12 18:56:23 -080040 int (*mRootExpand)();
Jason Samsbad80742011-03-16 16:29:28 -070041 void (*mInit)();
Stephen Hines4ee16ff2011-08-31 17:41:39 -070042 void (*mFreeChildren)();
Jason Samsbad80742011-03-16 16:29:28 -070043
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -070044 bcc::BCCContext *mCompilerContext;
45 bcc::RSCompilerDriver *mCompilerDriver;
46 bcc::RSExecutable *mExecutable;
Jason Sams807fdc42012-07-25 17:55:39 -070047
48 Allocation **mBoundAllocs;
Jason Samsbad80742011-03-16 16:29:28 -070049};
50
Stephen Hinesee7aa2e2012-01-12 18:56:23 -080051typedef void (*outer_foreach_t)(
52 const android::renderscript::RsForEachStubParamStruct *,
53 uint32_t x1, uint32_t x2,
54 uint32_t instep, uint32_t outstep);
Jason Sams83c451a2011-04-21 11:46:50 -070055
Jason Samscdfdb8f2011-03-17 16:12:47 -070056static Script * setTLS(Script *sc) {
Jason Sams83c451a2011-04-21 11:46:50 -070057 ScriptTLSStruct * tls = (ScriptTLSStruct *)pthread_getspecific(rsdgThreadTLSKey);
Jason Samscdfdb8f2011-03-17 16:12:47 -070058 rsAssert(tls);
59 Script *old = tls->mScript;
60 tls->mScript = sc;
61 return old;
62}
63
64
Jason Samsbad80742011-03-16 16:29:28 -070065bool rsdScriptInit(const Context *rsc,
66 ScriptC *script,
67 char const *resName,
68 char const *cacheDir,
69 uint8_t const *bitcode,
70 size_t bitcodeSize,
Jason Sams87fe59a2011-04-20 15:09:01 -070071 uint32_t flags) {
Steve Blockaf12ac62012-01-06 19:20:56 +000072 //ALOGE("rsdScriptCreate %p %p %p %p %i %i %p", rsc, resName, cacheDir, bitcode, bitcodeSize, flags, lookupFunc);
Jason Sams0ab9f9f2012-06-15 16:10:17 -070073 //ALOGE("rsdScriptInit %p %p", rsc, script);
Jason Samsbad80742011-03-16 16:29:28 -070074
Jason Sams83c451a2011-04-21 11:46:50 -070075 pthread_mutex_lock(&rsdgInitMutex);
Logan Chien1415ca42011-11-27 08:41:23 +080076
Stephen Hinesebee9482012-05-09 11:53:24 -070077 const char* coreLib = "/system/lib/libclcore.bc";
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -070078 bcc::RSInfo::FloatPrecision prec;
79 bcc::RSExecutable *exec;
80 const bcc::RSInfo *info;
Jason Samsbad80742011-03-16 16:29:28 -070081 DrvScript *drv = (DrvScript *)calloc(1, sizeof(DrvScript));
82 if (drv == NULL) {
Jason Sams83c451a2011-04-21 11:46:50 -070083 goto error;
Jason Samsbad80742011-03-16 16:29:28 -070084 }
85 script->mHal.drv = drv;
86
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -070087 drv->mCompilerContext = NULL;
88 drv->mCompilerDriver = NULL;
89 drv->mExecutable = NULL;
Jason Samsbad80742011-03-16 16:29:28 -070090
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -070091 drv->mCompilerContext = new bcc::BCCContext();
92 if (drv->mCompilerContext == NULL) {
93 ALOGE("bcc: FAILS to create compiler context (out of memory)");
Jason Samsbad80742011-03-16 16:29:28 -070094 goto error;
95 }
96
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -070097 drv->mCompilerDriver = new bcc::RSCompilerDriver();
98 if (drv->mCompilerDriver == NULL) {
99 ALOGE("bcc: FAILS to create compiler driver (out of memory)");
Stephen Hines070cb232012-05-03 12:33:35 -0700100 goto error;
Jason Samsbad80742011-03-16 16:29:28 -0700101 }
102
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700103 script->mHal.info.isThreadable = true;
104
105 drv->mCompilerDriver->setRSRuntimeLookupFunction(rsdLookupRuntimeStub);
106 drv->mCompilerDriver->setRSRuntimeLookupContext(script);
107
108 exec = drv->mCompilerDriver->build(*drv->mCompilerContext,
109 cacheDir, resName,
110 (const char *)bitcode, bitcodeSize);
111
112 if (exec == NULL) {
113 ALOGE("bcc: FAILS to prepare executable for '%s'", resName);
Stephen Hines070cb232012-05-03 12:33:35 -0700114 goto error;
115 }
Jason Samsbad80742011-03-16 16:29:28 -0700116
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700117 drv->mExecutable = exec;
118
119 exec->setThreadable(script->mHal.info.isThreadable);
120 if (!exec->syncInfo()) {
121 ALOGW("bcc: FAILS to synchronize the RS info file to the disk");
Stephen Hines070cb232012-05-03 12:33:35 -0700122 }
123
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700124 drv->mRoot = reinterpret_cast<int (*)()>(exec->getSymbolAddress("root"));
125 drv->mRootExpand =
126 reinterpret_cast<int (*)()>(exec->getSymbolAddress("root.expand"));
127 drv->mInit = reinterpret_cast<void (*)()>(exec->getSymbolAddress("init"));
128 drv->mFreeChildren =
129 reinterpret_cast<void (*)()>(exec->getSymbolAddress(".rs.dtor"));
Stephen Hines070cb232012-05-03 12:33:35 -0700130
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700131 info = &drv->mExecutable->getInfo();
Jason Samsbad80742011-03-16 16:29:28 -0700132 // Copy info over to runtime
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700133 script->mHal.info.exportedFunctionCount = info->getExportFuncNames().size();
134 script->mHal.info.exportedVariableCount = info->getExportVarNames().size();
135 script->mHal.info.exportedPragmaCount = info->getPragmas().size();
136 script->mHal.info.exportedPragmaKeyList =
137 const_cast<const char**>(exec->getPragmaKeys().array());
138 script->mHal.info.exportedPragmaValueList =
139 const_cast<const char**>(exec->getPragmaValues().array());
Stephen Hinesee7aa2e2012-01-12 18:56:23 -0800140
141 if (drv->mRootExpand) {
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700142 script->mHal.info.root = drv->mRootExpand;
Stephen Hinesee7aa2e2012-01-12 18:56:23 -0800143 } else {
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700144 script->mHal.info.root = drv->mRoot;
Stephen Hinesee7aa2e2012-01-12 18:56:23 -0800145 }
Jason Samsbad80742011-03-16 16:29:28 -0700146
Jason Sams807fdc42012-07-25 17:55:39 -0700147 if (script->mHal.info.exportedVariableCount) {
148 drv->mBoundAllocs = new Allocation *[script->mHal.info.exportedVariableCount];
149 memset(drv->mBoundAllocs, 0, sizeof(void *) * script->mHal.info.exportedVariableCount);
150 }
151
Jason Sams83c451a2011-04-21 11:46:50 -0700152 pthread_mutex_unlock(&rsdgInitMutex);
Jason Samsbad80742011-03-16 16:29:28 -0700153 return true;
154
155error:
156
Jason Sams83c451a2011-04-21 11:46:50 -0700157 pthread_mutex_unlock(&rsdgInitMutex);
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700158 if (drv) {
159 delete drv->mCompilerContext;
160 delete drv->mCompilerDriver;
161 delete drv->mExecutable;
Jason Sams807fdc42012-07-25 17:55:39 -0700162 delete[] drv->mBoundAllocs;
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700163 free(drv);
Stephen Hinescbb0b8a2011-08-01 15:02:34 -0700164 }
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700165 script->mHal.drv = NULL;
Jason Samsbad80742011-03-16 16:29:28 -0700166 return false;
167
168}
169
Jason Samscdfdb8f2011-03-17 16:12:47 -0700170typedef struct {
171 Context *rsc;
172 Script *script;
Stephen Hines44199772012-02-21 20:13:12 -0800173 ForEachFunc_t kernel;
Stephen Hines3815bad2011-08-18 19:33:01 -0700174 uint32_t sig;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700175 const Allocation * ain;
176 Allocation * aout;
177 const void * usr;
Jason Sams451cf2e2011-08-17 13:46:46 -0700178 size_t usrLen;
Jason Samsbad80742011-03-16 16:29:28 -0700179
Jason Samscdfdb8f2011-03-17 16:12:47 -0700180 uint32_t mSliceSize;
181 volatile int mSliceNum;
182
183 const uint8_t *ptrIn;
184 uint32_t eStrideIn;
185 uint8_t *ptrOut;
186 uint32_t eStrideOut;
187
Jason Samsf22c8ac2012-04-03 19:31:36 -0700188 uint32_t yStrideIn;
189 uint32_t yStrideOut;
190
Jason Samscdfdb8f2011-03-17 16:12:47 -0700191 uint32_t xStart;
192 uint32_t xEnd;
193 uint32_t yStart;
194 uint32_t yEnd;
195 uint32_t zStart;
196 uint32_t zEnd;
197 uint32_t arrayStart;
198 uint32_t arrayEnd;
199
200 uint32_t dimX;
201 uint32_t dimY;
202 uint32_t dimZ;
203 uint32_t dimArray;
204} MTLaunchStruct;
Stephen Hines3815bad2011-08-18 19:33:01 -0700205typedef void (*rs_t)(const void *, void *, const void *, uint32_t, uint32_t, uint32_t, uint32_t);
Jason Samscdfdb8f2011-03-17 16:12:47 -0700206
207static void wc_xy(void *usr, uint32_t idx) {
208 MTLaunchStruct *mtls = (MTLaunchStruct *)usr;
Jason Sams451cf2e2011-08-17 13:46:46 -0700209 RsForEachStubParamStruct p;
210 memset(&p, 0, sizeof(p));
211 p.usr = mtls->usr;
212 p.usr_len = mtls->usrLen;
Stephen Hines3815bad2011-08-18 19:33:01 -0700213 RsdHal * dc = (RsdHal *)mtls->rsc->mHal.drv;
214 uint32_t sig = mtls->sig;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700215
Stephen Hines44199772012-02-21 20:13:12 -0800216 outer_foreach_t fn = (outer_foreach_t) mtls->kernel;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700217 while (1) {
218 uint32_t slice = (uint32_t)android_atomic_inc(&mtls->mSliceNum);
219 uint32_t yStart = mtls->yStart + slice * mtls->mSliceSize;
220 uint32_t yEnd = yStart + mtls->mSliceSize;
221 yEnd = rsMin(yEnd, mtls->yEnd);
222 if (yEnd <= yStart) {
223 return;
224 }
225
Steve Blockaf12ac62012-01-06 19:20:56 +0000226 //ALOGE("usr idx %i, x %i,%i y %i,%i", idx, mtls->xStart, mtls->xEnd, yStart, yEnd);
227 //ALOGE("usr ptr in %p, out %p", mtls->ptrIn, mtls->ptrOut);
Jason Sams451cf2e2011-08-17 13:46:46 -0700228 for (p.y = yStart; p.y < yEnd; p.y++) {
Jason Samsf22c8ac2012-04-03 19:31:36 -0700229 p.out = mtls->ptrOut + (mtls->yStrideOut * p.y);
230 p.in = mtls->ptrIn + (mtls->yStrideIn * p.y);
Stephen Hinesee7aa2e2012-01-12 18:56:23 -0800231 fn(&p, mtls->xStart, mtls->xEnd, mtls->eStrideIn, mtls->eStrideOut);
Jason Samscdfdb8f2011-03-17 16:12:47 -0700232 }
233 }
Jason Samsbad80742011-03-16 16:29:28 -0700234}
235
Jason Samscdfdb8f2011-03-17 16:12:47 -0700236static void wc_x(void *usr, uint32_t idx) {
237 MTLaunchStruct *mtls = (MTLaunchStruct *)usr;
Jason Sams451cf2e2011-08-17 13:46:46 -0700238 RsForEachStubParamStruct p;
239 memset(&p, 0, sizeof(p));
240 p.usr = mtls->usr;
241 p.usr_len = mtls->usrLen;
Stephen Hines3815bad2011-08-18 19:33:01 -0700242 RsdHal * dc = (RsdHal *)mtls->rsc->mHal.drv;
243 uint32_t sig = mtls->sig;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700244
Stephen Hines44199772012-02-21 20:13:12 -0800245 outer_foreach_t fn = (outer_foreach_t) mtls->kernel;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700246 while (1) {
247 uint32_t slice = (uint32_t)android_atomic_inc(&mtls->mSliceNum);
248 uint32_t xStart = mtls->xStart + slice * mtls->mSliceSize;
249 uint32_t xEnd = xStart + mtls->mSliceSize;
250 xEnd = rsMin(xEnd, mtls->xEnd);
251 if (xEnd <= xStart) {
252 return;
253 }
254
Steve Blockaf12ac62012-01-06 19:20:56 +0000255 //ALOGE("usr slice %i idx %i, x %i,%i", slice, idx, xStart, xEnd);
256 //ALOGE("usr ptr in %p, out %p", mtls->ptrIn, mtls->ptrOut);
Jason Sams96cd1362011-10-12 18:33:01 -0700257
Jason Sams70415112011-10-11 18:44:05 -0700258 p.out = mtls->ptrOut + (mtls->eStrideOut * xStart);
259 p.in = mtls->ptrIn + (mtls->eStrideIn * xStart);
Stephen Hinesee7aa2e2012-01-12 18:56:23 -0800260 fn(&p, xStart, xEnd, mtls->eStrideIn, mtls->eStrideOut);
Jason Samscdfdb8f2011-03-17 16:12:47 -0700261 }
262}
263
264void rsdScriptInvokeForEach(const Context *rsc,
265 Script *s,
Jason Sams35e429e2011-07-13 11:26:26 -0700266 uint32_t slot,
Jason Samscdfdb8f2011-03-17 16:12:47 -0700267 const Allocation * ain,
268 Allocation * aout,
269 const void * usr,
270 uint32_t usrLen,
271 const RsScriptCall *sc) {
272
Jason Sams87fe59a2011-04-20 15:09:01 -0700273 RsdHal * dc = (RsdHal *)rsc->mHal.drv;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700274
275 MTLaunchStruct mtls;
276 memset(&mtls, 0, sizeof(mtls));
277
Jason Sams0ab9f9f2012-06-15 16:10:17 -0700278 //ALOGE("for each script %p in %p out %p", s, ain, aout);
279
Stephen Hines3815bad2011-08-18 19:33:01 -0700280 DrvScript *drv = (DrvScript *)s->mHal.drv;
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700281 rsAssert(slot < drv->mExecutable->getExportForeachFuncAddrs().size());
282 mtls.kernel = reinterpret_cast<ForEachFunc_t>(
283 drv->mExecutable->getExportForeachFuncAddrs()[slot]);
Stephen Hines44199772012-02-21 20:13:12 -0800284 rsAssert(mtls.kernel != NULL);
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700285 mtls.sig = drv->mExecutable->getInfo().getExportForeachFuncs()[slot].second;
286
Jason Samscdfdb8f2011-03-17 16:12:47 -0700287 if (ain) {
288 mtls.dimX = ain->getType()->getDimX();
289 mtls.dimY = ain->getType()->getDimY();
290 mtls.dimZ = ain->getType()->getDimZ();
291 //mtls.dimArray = ain->getType()->getDimArray();
292 } else if (aout) {
293 mtls.dimX = aout->getType()->getDimX();
294 mtls.dimY = aout->getType()->getDimY();
295 mtls.dimZ = aout->getType()->getDimZ();
296 //mtls.dimArray = aout->getType()->getDimArray();
297 } else {
298 rsc->setError(RS_ERROR_BAD_SCRIPT, "rsForEach called with null allocations");
299 return;
300 }
301
302 if (!sc || (sc->xEnd == 0)) {
303 mtls.xEnd = mtls.dimX;
304 } else {
305 rsAssert(sc->xStart < mtls.dimX);
306 rsAssert(sc->xEnd <= mtls.dimX);
307 rsAssert(sc->xStart < sc->xEnd);
308 mtls.xStart = rsMin(mtls.dimX, sc->xStart);
309 mtls.xEnd = rsMin(mtls.dimX, sc->xEnd);
310 if (mtls.xStart >= mtls.xEnd) return;
311 }
312
313 if (!sc || (sc->yEnd == 0)) {
314 mtls.yEnd = mtls.dimY;
315 } else {
316 rsAssert(sc->yStart < mtls.dimY);
317 rsAssert(sc->yEnd <= mtls.dimY);
318 rsAssert(sc->yStart < sc->yEnd);
319 mtls.yStart = rsMin(mtls.dimY, sc->yStart);
320 mtls.yEnd = rsMin(mtls.dimY, sc->yEnd);
321 if (mtls.yStart >= mtls.yEnd) return;
322 }
323
324 mtls.xEnd = rsMax((uint32_t)1, mtls.xEnd);
325 mtls.yEnd = rsMax((uint32_t)1, mtls.yEnd);
326 mtls.zEnd = rsMax((uint32_t)1, mtls.zEnd);
327 mtls.arrayEnd = rsMax((uint32_t)1, mtls.arrayEnd);
328
Stephen Hineseed1b152011-04-11 14:02:22 -0700329 rsAssert(!ain || (ain->getType()->getDimZ() == 0));
Jason Samscdfdb8f2011-03-17 16:12:47 -0700330
331 Context *mrsc = (Context *)rsc;
332 Script * oldTLS = setTLS(s);
333
334 mtls.rsc = mrsc;
335 mtls.ain = ain;
336 mtls.aout = aout;
337 mtls.script = s;
338 mtls.usr = usr;
Jason Sams451cf2e2011-08-17 13:46:46 -0700339 mtls.usrLen = usrLen;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700340 mtls.mSliceSize = 10;
341 mtls.mSliceNum = 0;
342
343 mtls.ptrIn = NULL;
344 mtls.eStrideIn = 0;
345 if (ain) {
Jason Sams807fdc42012-07-25 17:55:39 -0700346 DrvAllocation *aindrv = (DrvAllocation *)ain->mHal.drv;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700347 mtls.ptrIn = (const uint8_t *)ain->getPtr();
348 mtls.eStrideIn = ain->getType()->getElementSizeBytes();
Jason Sams807fdc42012-07-25 17:55:39 -0700349 mtls.yStrideIn = aindrv->lod[0].stride;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700350 }
351
352 mtls.ptrOut = NULL;
353 mtls.eStrideOut = 0;
354 if (aout) {
Jason Sams807fdc42012-07-25 17:55:39 -0700355 DrvAllocation *aoutdrv = (DrvAllocation *)aout->mHal.drv;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700356 mtls.ptrOut = (uint8_t *)aout->getPtr();
357 mtls.eStrideOut = aout->getType()->getElementSizeBytes();
Jason Sams807fdc42012-07-25 17:55:39 -0700358 mtls.yStrideOut = aoutdrv->lod[0].stride;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700359 }
360
Jason Samsaa152102012-06-13 15:16:44 -0700361 if ((dc->mWorkers.mCount > 1) && s->mHal.info.isThreadable && !dc->mInForEach) {
362 dc->mInForEach = true;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700363 if (mtls.dimY > 1) {
Jason Sams0ab9f9f2012-06-15 16:10:17 -0700364 mtls.mSliceSize = mtls.dimY / (dc->mWorkers.mCount * 4);
365 if(mtls.mSliceSize < 1) {
366 mtls.mSliceSize = 1;
367 }
368
Jason Samscdfdb8f2011-03-17 16:12:47 -0700369 rsdLaunchThreads(mrsc, wc_xy, &mtls);
370 } else {
Jason Sams0ab9f9f2012-06-15 16:10:17 -0700371 mtls.mSliceSize = mtls.dimX / (dc->mWorkers.mCount * 4);
372 if(mtls.mSliceSize < 1) {
373 mtls.mSliceSize = 1;
374 }
375
Jason Samscdfdb8f2011-03-17 16:12:47 -0700376 rsdLaunchThreads(mrsc, wc_x, &mtls);
377 }
Jason Samsaa152102012-06-13 15:16:44 -0700378 dc->mInForEach = false;
Jason Samscdfdb8f2011-03-17 16:12:47 -0700379
Steve Blockaf12ac62012-01-06 19:20:56 +0000380 //ALOGE("launch 1");
Jason Samscdfdb8f2011-03-17 16:12:47 -0700381 } else {
Jason Sams451cf2e2011-08-17 13:46:46 -0700382 RsForEachStubParamStruct p;
383 memset(&p, 0, sizeof(p));
384 p.usr = mtls.usr;
385 p.usr_len = mtls.usrLen;
Stephen Hines3815bad2011-08-18 19:33:01 -0700386 uint32_t sig = mtls.sig;
Jason Sams451cf2e2011-08-17 13:46:46 -0700387
Steve Blockaf12ac62012-01-06 19:20:56 +0000388 //ALOGE("launch 3");
Stephen Hines44199772012-02-21 20:13:12 -0800389 outer_foreach_t fn = (outer_foreach_t) mtls.kernel;
Jason Sams451cf2e2011-08-17 13:46:46 -0700390 for (p.ar[0] = mtls.arrayStart; p.ar[0] < mtls.arrayEnd; p.ar[0]++) {
391 for (p.z = mtls.zStart; p.z < mtls.zEnd; p.z++) {
392 for (p.y = mtls.yStart; p.y < mtls.yEnd; p.y++) {
393 uint32_t offset = mtls.dimX * mtls.dimY * mtls.dimZ * p.ar[0] +
394 mtls.dimX * mtls.dimY * p.z +
395 mtls.dimX * p.y;
Jason Sams70415112011-10-11 18:44:05 -0700396 p.out = mtls.ptrOut + (mtls.eStrideOut * offset);
397 p.in = mtls.ptrIn + (mtls.eStrideIn * offset);
Stephen Hinesee7aa2e2012-01-12 18:56:23 -0800398 fn(&p, mtls.xStart, mtls.xEnd, mtls.eStrideIn,
399 mtls.eStrideOut);
Jason Samscdfdb8f2011-03-17 16:12:47 -0700400 }
401 }
402 }
403 }
404
405 setTLS(oldTLS);
406}
407
408
409int rsdScriptInvokeRoot(const Context *dc, Script *script) {
410 DrvScript *drv = (DrvScript *)script->mHal.drv;
411
412 Script * oldTLS = setTLS(script);
413 int ret = drv->mRoot();
414 setTLS(oldTLS);
415
416 return ret;
417}
418
419void rsdScriptInvokeInit(const Context *dc, Script *script) {
Jason Samsbad80742011-03-16 16:29:28 -0700420 DrvScript *drv = (DrvScript *)script->mHal.drv;
421
422 if (drv->mInit) {
423 drv->mInit();
424 }
425}
426
Stephen Hines4ee16ff2011-08-31 17:41:39 -0700427void rsdScriptInvokeFreeChildren(const Context *dc, Script *script) {
428 DrvScript *drv = (DrvScript *)script->mHal.drv;
429
430 if (drv->mFreeChildren) {
431 drv->mFreeChildren();
432 }
433}
Jason Samsbad80742011-03-16 16:29:28 -0700434
Jason Samscdfdb8f2011-03-17 16:12:47 -0700435void rsdScriptInvokeFunction(const Context *dc, Script *script,
Jason Samsbad80742011-03-16 16:29:28 -0700436 uint32_t slot,
437 const void *params,
438 size_t paramLength) {
439 DrvScript *drv = (DrvScript *)script->mHal.drv;
Steve Blockaf12ac62012-01-06 19:20:56 +0000440 //ALOGE("invoke %p %p %i %p %i", dc, script, slot, params, paramLength);
Jason Samsbad80742011-03-16 16:29:28 -0700441
Jason Samscdfdb8f2011-03-17 16:12:47 -0700442 Script * oldTLS = setTLS(script);
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700443 reinterpret_cast<void (*)(const void *, uint32_t)>(
444 drv->mExecutable->getExportFuncAddrs()[slot])(params, paramLength);
Jason Samscdfdb8f2011-03-17 16:12:47 -0700445 setTLS(oldTLS);
Jason Samsbad80742011-03-16 16:29:28 -0700446}
447
448void rsdScriptSetGlobalVar(const Context *dc, const Script *script,
449 uint32_t slot, void *data, size_t dataLength) {
450 DrvScript *drv = (DrvScript *)script->mHal.drv;
451 //rsAssert(!script->mFieldIsObject[slot]);
Steve Blockaf12ac62012-01-06 19:20:56 +0000452 //ALOGE("setGlobalVar %p %p %i %p %i", dc, script, slot, data, dataLength);
Jason Samsbad80742011-03-16 16:29:28 -0700453
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700454 int32_t *destPtr = reinterpret_cast<int32_t *>(
455 drv->mExecutable->getExportVarAddrs()[slot]);
Jason Samsbad80742011-03-16 16:29:28 -0700456 if (!destPtr) {
Steve Block65982012011-10-20 11:56:00 +0100457 //ALOGV("Calling setVar on slot = %i which is null", slot);
Jason Samsbad80742011-03-16 16:29:28 -0700458 return;
459 }
460
461 memcpy(destPtr, data, dataLength);
462}
463
Stephen Hines2980f072012-04-09 18:26:29 -0700464void rsdScriptSetGlobalVarWithElemDims(
465 const android::renderscript::Context *dc,
466 const android::renderscript::Script *script,
467 uint32_t slot, void *data, size_t dataLength,
468 const android::renderscript::Element *elem,
469 const size_t *dims, size_t dimLength) {
470 DrvScript *drv = (DrvScript *)script->mHal.drv;
471
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700472 int32_t *destPtr = reinterpret_cast<int32_t *>(
473 drv->mExecutable->getExportVarAddrs()[slot]);
Stephen Hines2980f072012-04-09 18:26:29 -0700474 if (!destPtr) {
475 //ALOGV("Calling setVar on slot = %i which is null", slot);
476 return;
477 }
478
479 // We want to look at dimension in terms of integer components,
480 // but dimLength is given in terms of bytes.
481 dimLength /= sizeof(int);
482
483 // Only a single dimension is currently supported.
484 rsAssert(dimLength == 1);
485 if (dimLength == 1) {
486 // First do the increment loop.
487 size_t stride = elem->getSizeBytes();
488 char *cVal = reinterpret_cast<char *>(data);
489 for (size_t i = 0; i < dims[0]; i++) {
490 elem->incRefs(cVal);
491 cVal += stride;
492 }
493
494 // Decrement loop comes after (to prevent race conditions).
495 char *oldVal = reinterpret_cast<char *>(destPtr);
496 for (size_t i = 0; i < dims[0]; i++) {
497 elem->decRefs(oldVal);
498 oldVal += stride;
499 }
500 }
501
502 memcpy(destPtr, data, dataLength);
503}
504
Jason Sams807fdc42012-07-25 17:55:39 -0700505void rsdScriptSetGlobalBind(const Context *dc, const Script *script, uint32_t slot, Allocation *data) {
Jason Samsbad80742011-03-16 16:29:28 -0700506 DrvScript *drv = (DrvScript *)script->mHal.drv;
Jason Sams807fdc42012-07-25 17:55:39 -0700507
Jason Samsbad80742011-03-16 16:29:28 -0700508 //rsAssert(!script->mFieldIsObject[slot]);
Steve Blockaf12ac62012-01-06 19:20:56 +0000509 //ALOGE("setGlobalBind %p %p %i %p", dc, script, slot, data);
Jason Samsbad80742011-03-16 16:29:28 -0700510
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700511 int32_t *destPtr = reinterpret_cast<int32_t *>(
512 drv->mExecutable->getExportVarAddrs()[slot]);
Jason Samsbad80742011-03-16 16:29:28 -0700513 if (!destPtr) {
Steve Block65982012011-10-20 11:56:00 +0100514 //ALOGV("Calling setVar on slot = %i which is null", slot);
Jason Samsbad80742011-03-16 16:29:28 -0700515 return;
516 }
517
Jason Sams807fdc42012-07-25 17:55:39 -0700518 void *ptr = NULL;
519 drv->mBoundAllocs[slot] = data;
520 if(data) {
521 DrvAllocation *allocDrv = (DrvAllocation *)data->mHal.drv;
522 ptr = allocDrv->lod[0].mallocPtr;
523 }
524 memcpy(destPtr, &ptr, sizeof(void *));
Jason Samsbad80742011-03-16 16:29:28 -0700525}
526
527void rsdScriptSetGlobalObj(const Context *dc, const Script *script, uint32_t slot, ObjectBase *data) {
528 DrvScript *drv = (DrvScript *)script->mHal.drv;
529 //rsAssert(script->mFieldIsObject[slot]);
Steve Blockaf12ac62012-01-06 19:20:56 +0000530 //ALOGE("setGlobalObj %p %p %i %p", dc, script, slot, data);
Jason Samsbad80742011-03-16 16:29:28 -0700531
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700532 int32_t *destPtr = reinterpret_cast<int32_t *>(
533 drv->mExecutable->getExportVarAddrs()[slot]);
Jason Samsbad80742011-03-16 16:29:28 -0700534 if (!destPtr) {
Steve Block65982012011-10-20 11:56:00 +0100535 //ALOGV("Calling setVar on slot = %i which is null", slot);
Jason Samsbad80742011-03-16 16:29:28 -0700536 return;
537 }
538
Jason Sams87fe59a2011-04-20 15:09:01 -0700539 rsrSetObject(dc, script, (ObjectBase **)destPtr, data);
Jason Samsbad80742011-03-16 16:29:28 -0700540}
541
542void rsdScriptDestroy(const Context *dc, Script *script) {
543 DrvScript *drv = (DrvScript *)script->mHal.drv;
544
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700545 if (drv == NULL) {
546 return;
547 }
548
549 if (drv->mExecutable) {
550 Vector<void *>::const_iterator var_addr_iter =
551 drv->mExecutable->getExportVarAddrs().begin();
552 Vector<void *>::const_iterator var_addr_end =
553 drv->mExecutable->getExportVarAddrs().end();
554
555 bcc::RSInfo::ObjectSlotListTy::const_iterator is_object_iter =
556 drv->mExecutable->getInfo().getObjectSlots().begin();
557 bcc::RSInfo::ObjectSlotListTy::const_iterator is_object_end =
558 drv->mExecutable->getInfo().getObjectSlots().end();
559
560 while ((var_addr_iter != var_addr_end) &&
561 (is_object_iter != is_object_end)) {
562 // The field address can be NULL if the script-side has optimized
563 // the corresponding global variable away.
564 ObjectBase **obj_addr =
565 reinterpret_cast<ObjectBase **>(*var_addr_iter);
566 if (*is_object_iter) {
567 if (*var_addr_iter != NULL) {
568 rsrClearObject(dc, script, obj_addr);
Stephen Hines8d43eaf2011-03-24 20:03:49 -0700569 }
Jason Samsbad80742011-03-16 16:29:28 -0700570 }
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700571 var_addr_iter++;
572 is_object_iter++;
Jason Samsbad80742011-03-16 16:29:28 -0700573 }
Jason Samsbad80742011-03-16 16:29:28 -0700574 }
Stephen Hines689821f2011-07-18 17:24:11 -0700575
Shih-wei Liaoa3af2cd2012-04-25 04:18:31 -0700576 delete drv->mCompilerContext;
577 delete drv->mCompilerDriver;
578 delete drv->mExecutable;
Jason Sams807fdc42012-07-25 17:55:39 -0700579 delete[] drv->mBoundAllocs;
Jason Samsbad80742011-03-16 16:29:28 -0700580 free(drv);
581 script->mHal.drv = NULL;
Jason Samsbad80742011-03-16 16:29:28 -0700582}
Jason Sams807fdc42012-07-25 17:55:39 -0700583
584Allocation * rsdScriptGetAllocationForPointer(const android::renderscript::Context *dc,
585 const android::renderscript::Script *sc,
586 const void *ptr) {
587 DrvScript *drv = (DrvScript *)sc->mHal.drv;
588 if (!ptr) {
589 return NULL;
590 }
591
592 for (uint32_t ct=0; ct < sc->mHal.info.exportedVariableCount; ct++) {
593 Allocation *a = drv->mBoundAllocs[ct];
594 if (!a) continue;
595 DrvAllocation *adrv = (DrvAllocation *)a->mHal.drv;
596 if (adrv->lod[0].mallocPtr == ptr) {
597 return a;
598 }
599 }
600 ALOGE("rsGetAllocation, failed to find %p", ptr);
601 return NULL;
602}
603