/* * Copyright (C) 2009 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "rsContext.h" #include "rsScriptC.h" #include "rsMatrix.h" #include "utils/Timers.h" #include "utils/StopWatch.h" extern "C" { #include "libdex/ZipArchive.h" } #include #include using namespace android; using namespace android::renderscript; #define GET_TLS() Context::ScriptTLSStruct * tls = \ (Context::ScriptTLSStruct *)pthread_getspecific(Context::gThreadTLSKey); \ Context * rsc = tls->mContext; \ ScriptC * sc = (ScriptC *) tls->mScript // Input: cacheDir // Input: resName // Input: extName // // Note: cacheFile = resName + extName // // Output: Returns cachePath == cacheDir + cacheFile char *genCacheFileName(const char *cacheDir, const char *resName, const char *extName) { char cachePath[512]; char cacheFile[sizeof(cachePath)]; const size_t kBufLen = sizeof(cachePath) - 1; cacheFile[0] = '\0'; // Note: resName today is usually something like // "/com.android.fountain:raw/fountain" if (resName[0] != '/') { // Get the absolute path of the raw/***.bc file. // Generate the absolute path. This doesn't do everything it // should, e.g. if resName is "./out/whatever" it doesn't crunch // the leading "./" out because this if-block is not triggered, // but it'll make do. // if (getcwd(cacheFile, kBufLen) == NULL) { LOGE("Can't get CWD while opening raw/***.bc file\n"); return NULL; } // Append "/" at the end of cacheFile so far. strncat(cacheFile, "/", kBufLen); } // cacheFile = resName + extName // strncat(cacheFile, resName, kBufLen); if (extName != NULL) { // TODO(srhines): strncat() is a bit dangerous strncat(cacheFile, extName, kBufLen); } // Turn the path into a flat filename by replacing // any slashes after the first one with '@' characters. char *cp = cacheFile + 1; while (*cp != '\0') { if (*cp == '/') { *cp = '@'; } cp++; } // Tack on the file name for the actual cache file path. strncpy(cachePath, cacheDir, kBufLen); strncat(cachePath, cacheFile, kBufLen); LOGV("Cache file for '%s' '%s' is '%s'\n", resName, extName, cachePath); return strdup(cachePath); } ScriptC::ScriptC(Context *rsc) : Script(rsc) { mBccScript = NULL; memset(&mProgram, 0, sizeof(mProgram)); } ScriptC::~ScriptC() { if (mBccScript) { if (mProgram.mObjectSlotList) { for (size_t ct=0; ct < mProgram.mObjectSlotCount; ct++) { setVarObj(mProgram.mObjectSlotList[ct], NULL); } delete [] mProgram.mObjectSlotList; mProgram.mObjectSlotList = NULL; mProgram.mObjectSlotCount = 0; } LOGD(">>>> ~ScriptC bccDisposeScript(%p)", mBccScript); bccDisposeScript(mBccScript); } free(mEnviroment.mScriptText); mEnviroment.mScriptText = NULL; } void ScriptC::setupScript(Context *rsc) { mEnviroment.mStartTimeMillis = nanoseconds_to_milliseconds(systemTime(SYSTEM_TIME_MONOTONIC)); for (uint32_t ct=0; ct < mEnviroment.mFieldCount; ct++) { if (mSlots[ct].get() && !mTypes[ct].get()) { mTypes[ct].set(mSlots[ct]->getType()); } if (!mTypes[ct].get()) continue; void *ptr = NULL; if (mSlots[ct].get()) { ptr = mSlots[ct]->getPtr(); } void **dest = ((void ***)mEnviroment.mFieldAddress)[ct]; if (rsc->props.mLogScripts) { if (mSlots[ct].get() != NULL) { LOGV("%p ScriptC::setupScript slot=%i dst=%p src=%p type=%p", rsc, ct, dest, ptr, mSlots[ct]->getType()); } else { LOGV("%p ScriptC::setupScript slot=%i dst=%p src=%p type=null", rsc, ct, dest, ptr); } } if (dest) { *dest = ptr; } } } const Allocation *ScriptC::ptrToAllocation(const void *ptr) const { if (!ptr) { return NULL; } for (uint32_t ct=0; ct < mEnviroment.mFieldCount; ct++) { if (!mSlots[ct].get()) continue; if (mSlots[ct]->getPtr() == ptr) { return mSlots[ct].get(); } } LOGE("ScriptC::ptrToAllocation, failed to find %p", ptr); return NULL; } Script * ScriptC::setTLS(Script *sc) { Context::ScriptTLSStruct * tls = (Context::ScriptTLSStruct *) pthread_getspecific(Context::gThreadTLSKey); rsAssert(tls); Script *old = tls->mScript; tls->mScript = sc; return old; } void ScriptC::setupGLState(Context *rsc) { if (mEnviroment.mFragmentStore.get()) { rsc->setProgramStore(mEnviroment.mFragmentStore.get()); } if (mEnviroment.mFragment.get()) { rsc->setProgramFragment(mEnviroment.mFragment.get()); } if (mEnviroment.mVertex.get()) { rsc->setProgramVertex(mEnviroment.mVertex.get()); } if (mEnviroment.mRaster.get()) { rsc->setProgramRaster(mEnviroment.mRaster.get()); } } uint32_t ScriptC::run(Context *rsc) { if (mProgram.mRoot == NULL) { rsc->setError(RS_ERROR_BAD_SCRIPT, "Attempted to run bad script"); return 0; } setupGLState(rsc); setupScript(rsc); uint32_t ret = 0; Script * oldTLS = setTLS(this); if (rsc->props.mLogScripts) { LOGV("%p ScriptC::run invoking root, ptr %p", rsc, mProgram.mRoot); } ret = mProgram.mRoot(); if (rsc->props.mLogScripts) { LOGV("%p ScriptC::run invoking complete, ret=%i", rsc, ret); } setTLS(oldTLS); return ret; } typedef struct { Context *rsc; ScriptC *script; const Allocation * ain; Allocation * aout; const void * usr; uint32_t mSliceSize; volatile int mSliceNum; const uint8_t *ptrIn; uint32_t eStrideIn; uint8_t *ptrOut; uint32_t eStrideOut; uint32_t xStart; uint32_t xEnd; uint32_t yStart; uint32_t yEnd; uint32_t zStart; uint32_t zEnd; uint32_t arrayStart; uint32_t arrayEnd; uint32_t dimX; uint32_t dimY; uint32_t dimZ; uint32_t dimArray; } MTLaunchStruct; typedef int (*rs_t)(const void *, void *, const void *, uint32_t, uint32_t, uint32_t, uint32_t); static void wc_xy(void *usr, uint32_t idx) { MTLaunchStruct *mtls = (MTLaunchStruct *)usr; while (1) { uint32_t slice = (uint32_t)android_atomic_inc(&mtls->mSliceNum); uint32_t yStart = mtls->yStart + slice * mtls->mSliceSize; uint32_t yEnd = yStart + mtls->mSliceSize; yEnd = rsMin(yEnd, mtls->yEnd); if (yEnd <= yStart) { return; } //LOGE("usr idx %i, x %i,%i y %i,%i", idx, mtls->xStart, mtls->xEnd, yStart, yEnd); //LOGE("usr ptr in %p, out %p", mtls->ptrIn, mtls->ptrOut); for (uint32_t y = yStart; y < yEnd; y++) { uint32_t offset = mtls->dimX * y; uint8_t *xPtrOut = mtls->ptrOut + (mtls->eStrideOut * offset); const uint8_t *xPtrIn = mtls->ptrIn + (mtls->eStrideIn * offset); for (uint32_t x = mtls->xStart; x < mtls->xEnd; x++) { ((rs_t)mtls->script->mProgram.mRoot) (xPtrIn, xPtrOut, mtls->usr, x, y, 0, 0); xPtrIn += mtls->eStrideIn; xPtrOut += mtls->eStrideOut; } } } } static void wc_x(void *usr, uint32_t idx) { MTLaunchStruct *mtls = (MTLaunchStruct *)usr; while (1) { uint32_t slice = (uint32_t)android_atomic_inc(&mtls->mSliceNum); uint32_t xStart = mtls->xStart + slice * mtls->mSliceSize; uint32_t xEnd = xStart + mtls->mSliceSize; xEnd = rsMin(xEnd, mtls->xEnd); if (xEnd <= xStart) { return; } //LOGE("usr idx %i, x %i,%i y %i,%i", idx, mtls->xStart, mtls->xEnd, yStart, yEnd); //LOGE("usr ptr in %p, out %p", mtls->ptrIn, mtls->ptrOut); uint8_t *xPtrOut = mtls->ptrOut + (mtls->eStrideOut * xStart); const uint8_t *xPtrIn = mtls->ptrIn + (mtls->eStrideIn * xStart); for (uint32_t x = xStart; x < xEnd; x++) { ((rs_t)mtls->script->mProgram.mRoot) (xPtrIn, xPtrOut, mtls->usr, x, 0, 0, 0); xPtrIn += mtls->eStrideIn; xPtrOut += mtls->eStrideOut; } } } void ScriptC::runForEach(Context *rsc, const Allocation * ain, Allocation * aout, const void * usr, const RsScriptCall *sc) { MTLaunchStruct mtls; memset(&mtls, 0, sizeof(mtls)); Context::PushState ps(rsc); if (ain) { mtls.dimX = ain->getType()->getDimX(); mtls.dimY = ain->getType()->getDimY(); mtls.dimZ = ain->getType()->getDimZ(); //mtls.dimArray = ain->getType()->getDimArray(); } else if (aout) { mtls.dimX = aout->getType()->getDimX(); mtls.dimY = aout->getType()->getDimY(); mtls.dimZ = aout->getType()->getDimZ(); //mtls.dimArray = aout->getType()->getDimArray(); } else { rsc->setError(RS_ERROR_BAD_SCRIPT, "rsForEach called with null allocations"); return; } if (!sc || (sc->xEnd == 0)) { mtls.xEnd = mtls.dimX; } else { rsAssert(sc->xStart < mtls.dimX); rsAssert(sc->xEnd <= mtls.dimX); rsAssert(sc->xStart < sc->xEnd); mtls.xStart = rsMin(mtls.dimX, sc->xStart); mtls.xEnd = rsMin(mtls.dimX, sc->xEnd); if (mtls.xStart >= mtls.xEnd) return; } if (!sc || (sc->yEnd == 0)) { mtls.yEnd = mtls.dimY; } else { rsAssert(sc->yStart < mtls.dimY); rsAssert(sc->yEnd <= mtls.dimY); rsAssert(sc->yStart < sc->yEnd); mtls.yStart = rsMin(mtls.dimY, sc->yStart); mtls.yEnd = rsMin(mtls.dimY, sc->yEnd); if (mtls.yStart >= mtls.yEnd) return; } mtls.xEnd = rsMax((uint32_t)1, mtls.xEnd); mtls.yEnd = rsMax((uint32_t)1, mtls.yEnd); mtls.zEnd = rsMax((uint32_t)1, mtls.zEnd); mtls.arrayEnd = rsMax((uint32_t)1, mtls.arrayEnd); rsAssert(ain->getType()->getDimZ() == 0); setupGLState(rsc); setupScript(rsc); Script * oldTLS = setTLS(this); mtls.rsc = rsc; mtls.ain = ain; mtls.aout = aout; mtls.script = this; mtls.usr = usr; mtls.mSliceSize = 10; mtls.mSliceNum = 0; mtls.ptrIn = NULL; mtls.eStrideIn = 0; if (ain) { mtls.ptrIn = (const uint8_t *)ain->getPtr(); mtls.eStrideIn = ain->getType()->getElementSizeBytes(); } mtls.ptrOut = NULL; mtls.eStrideOut = 0; if (aout) { mtls.ptrOut = (uint8_t *)aout->getPtr(); mtls.eStrideOut = aout->getType()->getElementSizeBytes(); } if ((rsc->getWorkerPoolSize() > 1) && mEnviroment.mIsThreadable) { if (mtls.dimY > 1) { rsc->launchThreads(wc_xy, &mtls); } else { rsc->launchThreads(wc_x, &mtls); } //LOGE("launch 1"); } else { //LOGE("launch 3"); for (uint32_t ar = mtls.arrayStart; ar < mtls.arrayEnd; ar++) { for (uint32_t z = mtls.zStart; z < mtls.zEnd; z++) { for (uint32_t y = mtls.yStart; y < mtls.yEnd; y++) { uint32_t offset = mtls.dimX * mtls.dimY * mtls.dimZ * ar + mtls.dimX * mtls.dimY * z + mtls.dimX * y; uint8_t *xPtrOut = mtls.ptrOut + (mtls.eStrideOut * offset); const uint8_t *xPtrIn = mtls.ptrIn + (mtls.eStrideIn * offset); for (uint32_t x = mtls.xStart; x < mtls.xEnd; x++) { ((rs_t)mProgram.mRoot) (xPtrIn, xPtrOut, usr, x, y, z, ar); xPtrIn += mtls.eStrideIn; xPtrOut += mtls.eStrideOut; } } } } } setTLS(oldTLS); } void ScriptC::Invoke(Context *rsc, uint32_t slot, const void *data, uint32_t len) { if ((slot >= mEnviroment.mInvokeFunctionCount) || (mEnviroment.mInvokeFunctions[slot] == NULL)) { rsc->setError(RS_ERROR_BAD_SCRIPT, "Calling invoke on bad script"); return; } setupScript(rsc); Script * oldTLS = setTLS(this); if (rsc->props.mLogScripts) { LOGV("%p ScriptC::Invoke invoking slot %i, ptr %p", rsc, slot, mEnviroment.mInvokeFunctions[slot]); } ((void (*)(const void *, uint32_t)) mEnviroment.mInvokeFunctions[slot])(data, len); if (rsc->props.mLogScripts) { LOGV("%p ScriptC::Invoke complete", rsc); } setTLS(oldTLS); } ScriptCState::ScriptCState() { } ScriptCState::~ScriptCState() { } static void* symbolLookup(void* pContext, char const* name) { const ScriptCState::SymbolTable_t *sym; ScriptC *s = (ScriptC *)pContext; if (!strcmp(name, "__isThreadable")) { return (void*) s->mEnviroment.mIsThreadable; } else if (!strcmp(name, "__clearThreadable")) { s->mEnviroment.mIsThreadable = false; return NULL; } sym = ScriptCState::lookupSymbol(name); if (!sym) { sym = ScriptCState::lookupSymbolCL(name); } if (!sym) { sym = ScriptCState::lookupSymbolGL(name); } if (sym) { s->mEnviroment.mIsThreadable &= sym->threadable; return sym->mPtr; } LOGE("ScriptC sym lookup failed for %s", name); return NULL; } #if 0 extern const char rs_runtime_lib_bc[]; extern unsigned rs_runtime_lib_bc_size; #endif bool ScriptCState::runCompiler(Context *rsc, ScriptC *s, const char *resName, const char *cacheDir) { s->mBccScript = bccCreateScript(); s->mEnviroment.mIsThreadable = true; if (bccRegisterSymbolCallback(s->mBccScript, symbolLookup, s) != 0) { LOGE("bcc: FAILS to register symbol callback"); return false; } if (bccReadBC(s->mBccScript, resName, s->mEnviroment.mScriptText, s->mEnviroment.mScriptTextLength, 0) != 0) { LOGE("bcc: FAILS to read bitcode"); return false; } #if 1 if (bccLinkFile(s->mBccScript, "/system/lib/libclcore.bc", 0) != 0) { LOGE("bcc: FAILS to link bitcode"); return false; } #endif char *cachePath = genCacheFileName(cacheDir, resName, ".oBCC"); if (bccPrepareExecutable(s->mBccScript, cachePath, 0) != 0) { LOGE("bcc: FAILS to prepare executable"); return false; } free(cachePath); s->mProgram.mRoot = reinterpret_cast(bccGetFuncAddr(s->mBccScript, "root")); s->mProgram.mInit = reinterpret_cast(bccGetFuncAddr(s->mBccScript, "init")); if (s->mProgram.mInit) { s->mProgram.mInit(); } s->mEnviroment.mInvokeFunctionCount = bccGetExportFuncCount(s->mBccScript); if (s->mEnviroment.mInvokeFunctionCount <= 0) s->mEnviroment.mInvokeFunctions = NULL; else { s->mEnviroment.mInvokeFunctions = (Script::InvokeFunc_t*) calloc(s->mEnviroment.mInvokeFunctionCount, sizeof(Script::InvokeFunc_t)); bccGetExportFuncList(s->mBccScript, s->mEnviroment.mInvokeFunctionCount, (void **) s->mEnviroment.mInvokeFunctions); } s->mEnviroment.mFieldCount = bccGetExportVarCount(s->mBccScript); if (s->mEnviroment.mFieldCount <= 0) s->mEnviroment.mFieldAddress = NULL; else { s->mEnviroment.mFieldAddress = (void **) calloc(s->mEnviroment.mFieldCount, sizeof(void *)); bccGetExportVarList(s->mBccScript, s->mEnviroment.mFieldCount, (void **) s->mEnviroment.mFieldAddress); s->initSlots(); } s->mEnviroment.mFragment.set(rsc->getDefaultProgramFragment()); s->mEnviroment.mVertex.set(rsc->getDefaultProgramVertex()); s->mEnviroment.mFragmentStore.set(rsc->getDefaultProgramStore()); s->mEnviroment.mRaster.set(rsc->getDefaultProgramRaster()); const static int pragmaMax = 16; size_t pragmaCount = bccGetPragmaCount(s->mBccScript); char const *keys[pragmaMax]; char const *values[pragmaMax]; bccGetPragmaList(s->mBccScript, pragmaMax, keys, values); for (size_t i=0; i < pragmaCount; ++i) { //LOGE("pragma %s %s", keys[i], values[i]); if (!strcmp(keys[i], "version")) { if (!strcmp(values[i], "1")) { continue; } LOGE("Invalid version pragma value: %s\n", values[i]); return false; } if (!strcmp(keys[i], "stateVertex")) { if (!strcmp(values[i], "default")) { continue; } if (!strcmp(values[i], "parent")) { s->mEnviroment.mVertex.clear(); continue; } LOGE("Unrecognized value %s passed to stateVertex", values[i]); return false; } if (!strcmp(keys[i], "stateRaster")) { if (!strcmp(values[i], "default")) { continue; } if (!strcmp(values[i], "parent")) { s->mEnviroment.mRaster.clear(); continue; } LOGE("Unrecognized value %s passed to stateRaster", values[i]); return false; } if (!strcmp(keys[i], "stateFragment")) { if (!strcmp(values[i], "default")) { continue; } if (!strcmp(values[i], "parent")) { s->mEnviroment.mFragment.clear(); continue; } LOGE("Unrecognized value %s passed to stateFragment", values[i]); return false; } if (!strcmp(keys[i], "stateStore")) { if (!strcmp(values[i], "default")) { continue; } if (!strcmp(values[i], "parent")) { s->mEnviroment.mFragmentStore.clear(); continue; } LOGE("Unrecognized value %s passed to stateStore", values[i]); return false; } } size_t objectSlotCount = bccGetObjectSlotCount(s->mBccScript); uint32_t *objectSlots = NULL; if (objectSlotCount) { objectSlots = new uint32_t[objectSlotCount]; bccGetObjectSlotList(s->mBccScript, objectSlotCount, objectSlots); s->mProgram.mObjectSlotList = objectSlots; s->mProgram.mObjectSlotCount = objectSlotCount; } return true; } namespace android { namespace renderscript { void rsi_ScriptCBegin(Context * rsc) { } void rsi_ScriptCSetText(Context *rsc, const char *text, uint32_t len) { ScriptCState *ss = &rsc->mScriptC; char *t = (char *)malloc(len + 1); memcpy(t, text, len); t[len] = 0; ss->mScriptText = t; ss->mScriptLen = len; } RsScript rsi_ScriptCCreate(Context *rsc, const char *packageName /* deprecated */, const char *resName, const char *cacheDir) { ScriptCState *ss = &rsc->mScriptC; ScriptC *s = new ScriptC(rsc); s->mEnviroment.mScriptText = ss->mScriptText; s->mEnviroment.mScriptTextLength = ss->mScriptLen; ss->mScriptText = NULL; ss->mScriptLen = 0; s->incUserRef(); if (!ss->runCompiler(rsc, s, resName, cacheDir)) { // Error during compile, destroy s and return null. delete s; return NULL; } return s; } } }