• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (C) 2011 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 
18 #include "rsdCore.h"
19 #include "rsdBcc.h"
20 #include "rsdRuntime.h"
21 
22 #include <bcinfo/MetadataExtractor.h>
23 
24 #include "rsContext.h"
25 #include "rsScriptC.h"
26 
27 #include "utils/Timers.h"
28 #include "utils/StopWatch.h"
29 extern "C" {
30 #include "libdex/ZipArchive.h"
31 }
32 
33 
34 using namespace android;
35 using namespace android::renderscript;
36 
37 struct DrvScript {
38     int (*mRoot)();
39     void (*mInit)();
40     void (*mFreeChildren)();
41 
42     BCCScriptRef mBccScript;
43 
44     bcinfo::MetadataExtractor *ME;
45 
46     InvokeFunc_t *mInvokeFunctions;
47     void ** mFieldAddress;
48     bool * mFieldIsObject;
49     const uint32_t *mExportForEachSignatureList;
50 
51     const uint8_t * mScriptText;
52     uint32_t mScriptTextLength;
53 };
54 
55 
setTLS(Script * sc)56 static Script * setTLS(Script *sc) {
57     ScriptTLSStruct * tls = (ScriptTLSStruct *)pthread_getspecific(rsdgThreadTLSKey);
58     rsAssert(tls);
59     Script *old = tls->mScript;
60     tls->mScript = sc;
61     return old;
62 }
63 
64 
rsdScriptInit(const Context * rsc,ScriptC * script,char const * resName,char const * cacheDir,uint8_t const * bitcode,size_t bitcodeSize,uint32_t flags)65 bool rsdScriptInit(const Context *rsc,
66                      ScriptC *script,
67                      char const *resName,
68                      char const *cacheDir,
69                      uint8_t const *bitcode,
70                      size_t bitcodeSize,
71                      uint32_t flags) {
72     //LOGE("rsdScriptCreate %p %p %p %p %i %i %p", rsc, resName, cacheDir, bitcode, bitcodeSize, flags, lookupFunc);
73 
74     pthread_mutex_lock(&rsdgInitMutex);
75     char *cachePath = NULL;
76     size_t exportFuncCount = 0;
77     size_t exportVarCount = 0;
78     size_t objectSlotCount = 0;
79     size_t exportForEachSignatureCount = 0;
80 
81     DrvScript *drv = (DrvScript *)calloc(1, sizeof(DrvScript));
82     if (drv == NULL) {
83         goto error;
84     }
85     script->mHal.drv = drv;
86 
87     drv->mBccScript = bccCreateScript();
88     script->mHal.info.isThreadable = true;
89     drv->mScriptText = bitcode;
90     drv->mScriptTextLength = bitcodeSize;
91 
92 
93     drv->ME = new bcinfo::MetadataExtractor((const char*)drv->mScriptText,
94                                             drv->mScriptTextLength);
95     if (!drv->ME->extract()) {
96       LOGE("bcinfo: failed to read script metadata");
97       goto error;
98     }
99 
100     //LOGE("mBccScript %p", script->mBccScript);
101 
102     if (bccRegisterSymbolCallback(drv->mBccScript, &rsdLookupRuntimeStub, script) != 0) {
103         LOGE("bcc: FAILS to register symbol callback");
104         goto error;
105     }
106 
107     if (bccReadBC(drv->mBccScript,
108                   resName,
109                   (char const *)drv->mScriptText,
110                   drv->mScriptTextLength, 0) != 0) {
111         LOGE("bcc: FAILS to read bitcode");
112         goto error;
113     }
114 
115     if (bccLinkFile(drv->mBccScript, "/system/lib/libclcore.bc", 0) != 0) {
116         LOGE("bcc: FAILS to link bitcode");
117         goto error;
118     }
119 
120     if (bccPrepareExecutable(drv->mBccScript, cacheDir, resName, 0) != 0) {
121         LOGE("bcc: FAILS to prepare executable");
122         goto error;
123     }
124 
125     free(cachePath);
126 
127     drv->mRoot = reinterpret_cast<int (*)()>(bccGetFuncAddr(drv->mBccScript, "root"));
128     drv->mInit = reinterpret_cast<void (*)()>(bccGetFuncAddr(drv->mBccScript, "init"));
129     drv->mFreeChildren = reinterpret_cast<void (*)()>(bccGetFuncAddr(drv->mBccScript, ".rs.dtor"));
130 
131     exportFuncCount = drv->ME->getExportFuncCount();
132     if (exportFuncCount > 0) {
133         drv->mInvokeFunctions = (InvokeFunc_t*) calloc(exportFuncCount,
134                                                        sizeof(InvokeFunc_t));
135         bccGetExportFuncList(drv->mBccScript, exportFuncCount,
136                              (void **) drv->mInvokeFunctions);
137     } else {
138         drv->mInvokeFunctions = NULL;
139     }
140 
141     exportVarCount = drv->ME->getExportVarCount();
142     if (exportVarCount > 0) {
143         drv->mFieldAddress = (void **) calloc(exportVarCount, sizeof(void*));
144         drv->mFieldIsObject = (bool *) calloc(exportVarCount, sizeof(bool));
145         bccGetExportVarList(drv->mBccScript, exportVarCount,
146                             (void **) drv->mFieldAddress);
147     } else {
148         drv->mFieldAddress = NULL;
149         drv->mFieldIsObject = NULL;
150     }
151 
152     objectSlotCount = drv->ME->getObjectSlotCount();
153     if (objectSlotCount > 0) {
154         const uint32_t *objectSlotList = drv->ME->getObjectSlotList();
155         for (uint32_t ct=0; ct < objectSlotCount; ct++) {
156             drv->mFieldIsObject[objectSlotList[ct]] = true;
157         }
158     }
159 
160     exportForEachSignatureCount = drv->ME->getExportForEachSignatureCount();
161     rsAssert(exportForEachSignatureCount <= 1);
162     drv->mExportForEachSignatureList = drv->ME->getExportForEachSignatureList();
163 
164     // Copy info over to runtime
165     script->mHal.info.exportedFunctionCount = drv->ME->getExportFuncCount();
166     script->mHal.info.exportedVariableCount = drv->ME->getExportVarCount();
167     script->mHal.info.exportedPragmaCount = drv->ME->getPragmaCount();
168     script->mHal.info.exportedPragmaKeyList = drv->ME->getPragmaKeyList();
169     script->mHal.info.exportedPragmaValueList = drv->ME->getPragmaValueList();
170     script->mHal.info.root = drv->mRoot;
171 
172     pthread_mutex_unlock(&rsdgInitMutex);
173     return true;
174 
175 error:
176 
177     pthread_mutex_unlock(&rsdgInitMutex);
178     if (drv->ME) {
179         delete drv->ME;
180         drv->ME = NULL;
181     }
182     free(drv);
183     return false;
184 
185 }
186 
187 typedef struct {
188     Context *rsc;
189     Script *script;
190     uint32_t sig;
191     const Allocation * ain;
192     Allocation * aout;
193     const void * usr;
194     size_t usrLen;
195 
196     uint32_t mSliceSize;
197     volatile int mSliceNum;
198 
199     const uint8_t *ptrIn;
200     uint32_t eStrideIn;
201     uint8_t *ptrOut;
202     uint32_t eStrideOut;
203 
204     uint32_t xStart;
205     uint32_t xEnd;
206     uint32_t yStart;
207     uint32_t yEnd;
208     uint32_t zStart;
209     uint32_t zEnd;
210     uint32_t arrayStart;
211     uint32_t arrayEnd;
212 
213     uint32_t dimX;
214     uint32_t dimY;
215     uint32_t dimZ;
216     uint32_t dimArray;
217 } MTLaunchStruct;
218 typedef void (*rs_t)(const void *, void *, const void *, uint32_t, uint32_t, uint32_t, uint32_t);
219 
wc_xy(void * usr,uint32_t idx)220 static void wc_xy(void *usr, uint32_t idx) {
221     MTLaunchStruct *mtls = (MTLaunchStruct *)usr;
222     RsForEachStubParamStruct p;
223     memset(&p, 0, sizeof(p));
224     p.usr = mtls->usr;
225     p.usr_len = mtls->usrLen;
226     RsdHal * dc = (RsdHal *)mtls->rsc->mHal.drv;
227     uint32_t sig = mtls->sig;
228 
229     while (1) {
230         uint32_t slice = (uint32_t)android_atomic_inc(&mtls->mSliceNum);
231         uint32_t yStart = mtls->yStart + slice * mtls->mSliceSize;
232         uint32_t yEnd = yStart + mtls->mSliceSize;
233         yEnd = rsMin(yEnd, mtls->yEnd);
234         if (yEnd <= yStart) {
235             return;
236         }
237 
238         //LOGE("usr idx %i, x %i,%i  y %i,%i", idx, mtls->xStart, mtls->xEnd, yStart, yEnd);
239         //LOGE("usr ptr in %p,  out %p", mtls->ptrIn, mtls->ptrOut);
240         for (p.y = yStart; p.y < yEnd; p.y++) {
241             uint32_t offset = mtls->dimX * p.y;
242             uint8_t *xPtrOut = mtls->ptrOut + (mtls->eStrideOut * offset);
243             const uint8_t *xPtrIn = mtls->ptrIn + (mtls->eStrideIn * offset);
244 
245             for (p.x = mtls->xStart; p.x < mtls->xEnd; p.x++) {
246                 p.in = xPtrIn;
247                 p.out = xPtrOut;
248                 dc->mForEachLaunch[sig](&mtls->script->mHal.info.root, &p);
249                 xPtrIn += mtls->eStrideIn;
250                 xPtrOut += mtls->eStrideOut;
251             }
252         }
253     }
254 }
255 
wc_x(void * usr,uint32_t idx)256 static void wc_x(void *usr, uint32_t idx) {
257     MTLaunchStruct *mtls = (MTLaunchStruct *)usr;
258     RsForEachStubParamStruct p;
259     memset(&p, 0, sizeof(p));
260     p.usr = mtls->usr;
261     p.usr_len = mtls->usrLen;
262     RsdHal * dc = (RsdHal *)mtls->rsc->mHal.drv;
263     uint32_t sig = mtls->sig;
264 
265     while (1) {
266         uint32_t slice = (uint32_t)android_atomic_inc(&mtls->mSliceNum);
267         uint32_t xStart = mtls->xStart + slice * mtls->mSliceSize;
268         uint32_t xEnd = xStart + mtls->mSliceSize;
269         xEnd = rsMin(xEnd, mtls->xEnd);
270         if (xEnd <= xStart) {
271             return;
272         }
273 
274         //LOGE("usr idx %i, x %i,%i  y %i,%i", idx, mtls->xStart, mtls->xEnd, yStart, yEnd);
275         //LOGE("usr ptr in %p,  out %p", mtls->ptrIn, mtls->ptrOut);
276         uint8_t *xPtrOut = mtls->ptrOut + (mtls->eStrideOut * xStart);
277         const uint8_t *xPtrIn = mtls->ptrIn + (mtls->eStrideIn * xStart);
278         for (p.x = xStart; p.x < xEnd; p.x++) {
279             p.in = xPtrIn;
280             p.out = xPtrOut;
281             dc->mForEachLaunch[sig](&mtls->script->mHal.info.root, &p);
282             xPtrIn += mtls->eStrideIn;
283             xPtrOut += mtls->eStrideOut;
284         }
285     }
286 }
287 
rsdScriptInvokeForEach(const Context * rsc,Script * s,uint32_t slot,const Allocation * ain,Allocation * aout,const void * usr,uint32_t usrLen,const RsScriptCall * sc)288 void rsdScriptInvokeForEach(const Context *rsc,
289                             Script *s,
290                             uint32_t slot,
291                             const Allocation * ain,
292                             Allocation * aout,
293                             const void * usr,
294                             uint32_t usrLen,
295                             const RsScriptCall *sc) {
296 
297     RsdHal * dc = (RsdHal *)rsc->mHal.drv;
298 
299     MTLaunchStruct mtls;
300     memset(&mtls, 0, sizeof(mtls));
301 
302     DrvScript *drv = (DrvScript *)s->mHal.drv;
303     // We only support slot 0 (root) at this point in time.
304     rsAssert(slot == 0);
305     mtls.sig = 0x1f;  // temp fix for old apps, full table in slang_rs_export_foreach.cpp
306     if (drv->mExportForEachSignatureList) {
307         mtls.sig = drv->mExportForEachSignatureList[slot];
308     }
309     if (ain) {
310         mtls.dimX = ain->getType()->getDimX();
311         mtls.dimY = ain->getType()->getDimY();
312         mtls.dimZ = ain->getType()->getDimZ();
313         //mtls.dimArray = ain->getType()->getDimArray();
314     } else if (aout) {
315         mtls.dimX = aout->getType()->getDimX();
316         mtls.dimY = aout->getType()->getDimY();
317         mtls.dimZ = aout->getType()->getDimZ();
318         //mtls.dimArray = aout->getType()->getDimArray();
319     } else {
320         rsc->setError(RS_ERROR_BAD_SCRIPT, "rsForEach called with null allocations");
321         return;
322     }
323 
324     if (!sc || (sc->xEnd == 0)) {
325         mtls.xEnd = mtls.dimX;
326     } else {
327         rsAssert(sc->xStart < mtls.dimX);
328         rsAssert(sc->xEnd <= mtls.dimX);
329         rsAssert(sc->xStart < sc->xEnd);
330         mtls.xStart = rsMin(mtls.dimX, sc->xStart);
331         mtls.xEnd = rsMin(mtls.dimX, sc->xEnd);
332         if (mtls.xStart >= mtls.xEnd) return;
333     }
334 
335     if (!sc || (sc->yEnd == 0)) {
336         mtls.yEnd = mtls.dimY;
337     } else {
338         rsAssert(sc->yStart < mtls.dimY);
339         rsAssert(sc->yEnd <= mtls.dimY);
340         rsAssert(sc->yStart < sc->yEnd);
341         mtls.yStart = rsMin(mtls.dimY, sc->yStart);
342         mtls.yEnd = rsMin(mtls.dimY, sc->yEnd);
343         if (mtls.yStart >= mtls.yEnd) return;
344     }
345 
346     mtls.xEnd = rsMax((uint32_t)1, mtls.xEnd);
347     mtls.yEnd = rsMax((uint32_t)1, mtls.yEnd);
348     mtls.zEnd = rsMax((uint32_t)1, mtls.zEnd);
349     mtls.arrayEnd = rsMax((uint32_t)1, mtls.arrayEnd);
350 
351     rsAssert(!ain || (ain->getType()->getDimZ() == 0));
352 
353     Context *mrsc = (Context *)rsc;
354     Script * oldTLS = setTLS(s);
355 
356     mtls.rsc = mrsc;
357     mtls.ain = ain;
358     mtls.aout = aout;
359     mtls.script = s;
360     mtls.usr = usr;
361     mtls.usrLen = usrLen;
362     mtls.mSliceSize = 10;
363     mtls.mSliceNum = 0;
364 
365     mtls.ptrIn = NULL;
366     mtls.eStrideIn = 0;
367     if (ain) {
368         mtls.ptrIn = (const uint8_t *)ain->getPtr();
369         mtls.eStrideIn = ain->getType()->getElementSizeBytes();
370     }
371 
372     mtls.ptrOut = NULL;
373     mtls.eStrideOut = 0;
374     if (aout) {
375         mtls.ptrOut = (uint8_t *)aout->getPtr();
376         mtls.eStrideOut = aout->getType()->getElementSizeBytes();
377     }
378 
379     if ((dc->mWorkers.mCount > 1) && s->mHal.info.isThreadable) {
380         if (mtls.dimY > 1) {
381             rsdLaunchThreads(mrsc, wc_xy, &mtls);
382         } else {
383             rsdLaunchThreads(mrsc, wc_x, &mtls);
384         }
385 
386         //LOGE("launch 1");
387     } else {
388         RsForEachStubParamStruct p;
389         memset(&p, 0, sizeof(p));
390         p.usr = mtls.usr;
391         p.usr_len = mtls.usrLen;
392         uint32_t sig = mtls.sig;
393 
394         //LOGE("launch 3");
395         for (p.ar[0] = mtls.arrayStart; p.ar[0] < mtls.arrayEnd; p.ar[0]++) {
396             for (p.z = mtls.zStart; p.z < mtls.zEnd; p.z++) {
397                 for (p.y = mtls.yStart; p.y < mtls.yEnd; p.y++) {
398                     uint32_t offset = mtls.dimX * mtls.dimY * mtls.dimZ * p.ar[0] +
399                                       mtls.dimX * mtls.dimY * p.z +
400                                       mtls.dimX * p.y;
401                     uint8_t *xPtrOut = mtls.ptrOut + (mtls.eStrideOut * offset);
402                     const uint8_t *xPtrIn = mtls.ptrIn + (mtls.eStrideIn * offset);
403 
404                     for (p.x = mtls.xStart; p.x < mtls.xEnd; p.x++) {
405                         p.in = xPtrIn;
406                         p.out = xPtrOut;
407                         dc->mForEachLaunch[sig](&s->mHal.info.root, &p);
408                         xPtrIn += mtls.eStrideIn;
409                         xPtrOut += mtls.eStrideOut;
410                     }
411                 }
412             }
413         }
414     }
415 
416     setTLS(oldTLS);
417 }
418 
419 
rsdScriptInvokeRoot(const Context * dc,Script * script)420 int rsdScriptInvokeRoot(const Context *dc, Script *script) {
421     DrvScript *drv = (DrvScript *)script->mHal.drv;
422 
423     Script * oldTLS = setTLS(script);
424     int ret = drv->mRoot();
425     setTLS(oldTLS);
426 
427     return ret;
428 }
429 
rsdScriptInvokeInit(const Context * dc,Script * script)430 void rsdScriptInvokeInit(const Context *dc, Script *script) {
431     DrvScript *drv = (DrvScript *)script->mHal.drv;
432 
433     if (drv->mInit) {
434         drv->mInit();
435     }
436 }
437 
rsdScriptInvokeFreeChildren(const Context * dc,Script * script)438 void rsdScriptInvokeFreeChildren(const Context *dc, Script *script) {
439     DrvScript *drv = (DrvScript *)script->mHal.drv;
440 
441     if (drv->mFreeChildren) {
442         drv->mFreeChildren();
443     }
444 }
445 
rsdScriptInvokeFunction(const Context * dc,Script * script,uint32_t slot,const void * params,size_t paramLength)446 void rsdScriptInvokeFunction(const Context *dc, Script *script,
447                             uint32_t slot,
448                             const void *params,
449                             size_t paramLength) {
450     DrvScript *drv = (DrvScript *)script->mHal.drv;
451     //LOGE("invoke %p %p %i %p %i", dc, script, slot, params, paramLength);
452 
453     Script * oldTLS = setTLS(script);
454     ((void (*)(const void *, uint32_t))
455         drv->mInvokeFunctions[slot])(params, paramLength);
456     setTLS(oldTLS);
457 }
458 
rsdScriptSetGlobalVar(const Context * dc,const Script * script,uint32_t slot,void * data,size_t dataLength)459 void rsdScriptSetGlobalVar(const Context *dc, const Script *script,
460                            uint32_t slot, void *data, size_t dataLength) {
461     DrvScript *drv = (DrvScript *)script->mHal.drv;
462     //rsAssert(!script->mFieldIsObject[slot]);
463     //LOGE("setGlobalVar %p %p %i %p %i", dc, script, slot, data, dataLength);
464 
465     int32_t *destPtr = ((int32_t **)drv->mFieldAddress)[slot];
466     if (!destPtr) {
467         //LOGV("Calling setVar on slot = %i which is null", slot);
468         return;
469     }
470 
471     memcpy(destPtr, data, dataLength);
472 }
473 
rsdScriptSetGlobalBind(const Context * dc,const Script * script,uint32_t slot,void * data)474 void rsdScriptSetGlobalBind(const Context *dc, const Script *script, uint32_t slot, void *data) {
475     DrvScript *drv = (DrvScript *)script->mHal.drv;
476     //rsAssert(!script->mFieldIsObject[slot]);
477     //LOGE("setGlobalBind %p %p %i %p", dc, script, slot, data);
478 
479     int32_t *destPtr = ((int32_t **)drv->mFieldAddress)[slot];
480     if (!destPtr) {
481         //LOGV("Calling setVar on slot = %i which is null", slot);
482         return;
483     }
484 
485     memcpy(destPtr, &data, sizeof(void *));
486 }
487 
rsdScriptSetGlobalObj(const Context * dc,const Script * script,uint32_t slot,ObjectBase * data)488 void rsdScriptSetGlobalObj(const Context *dc, const Script *script, uint32_t slot, ObjectBase *data) {
489     DrvScript *drv = (DrvScript *)script->mHal.drv;
490     //rsAssert(script->mFieldIsObject[slot]);
491     //LOGE("setGlobalObj %p %p %i %p", dc, script, slot, data);
492 
493     int32_t *destPtr = ((int32_t **)drv->mFieldAddress)[slot];
494     if (!destPtr) {
495         //LOGV("Calling setVar on slot = %i which is null", slot);
496         return;
497     }
498 
499     rsrSetObject(dc, script, (ObjectBase **)destPtr, data);
500 }
501 
rsdScriptDestroy(const Context * dc,Script * script)502 void rsdScriptDestroy(const Context *dc, Script *script) {
503     DrvScript *drv = (DrvScript *)script->mHal.drv;
504 
505     if (drv->mFieldAddress) {
506         size_t exportVarCount = drv->ME->getExportVarCount();
507         for (size_t ct = 0; ct < exportVarCount; ct++) {
508             if (drv->mFieldIsObject[ct]) {
509                 // The field address can be NULL if the script-side has
510                 // optimized the corresponding global variable away.
511                 if (drv->mFieldAddress[ct]) {
512                     rsrClearObject(dc, script, (ObjectBase **)drv->mFieldAddress[ct]);
513                 }
514             }
515         }
516         free(drv->mFieldAddress);
517         drv->mFieldAddress = NULL;
518         free(drv->mFieldIsObject);
519         drv->mFieldIsObject = NULL;    }
520 
521     if (drv->mInvokeFunctions) {
522         free(drv->mInvokeFunctions);
523         drv->mInvokeFunctions = NULL;
524     }
525 
526     delete drv->ME;
527     drv->ME = NULL;
528 
529     free(drv);
530     script->mHal.drv = NULL;
531 
532 }
533 
534 
535