xref: /aosp_15_r20/frameworks/rs/cpu_ref/rsCpuScriptGroup2.cpp (revision e1eccf28f96817838ad6867f7f39d2351ec11f56)
1*e1eccf28SAndroid Build Coastguard Worker #include "rsCpuScriptGroup2.h"
2*e1eccf28SAndroid Build Coastguard Worker 
3*e1eccf28SAndroid Build Coastguard Worker #include <dlfcn.h>
4*e1eccf28SAndroid Build Coastguard Worker #include <stdio.h>
5*e1eccf28SAndroid Build Coastguard Worker #include <stdlib.h>
6*e1eccf28SAndroid Build Coastguard Worker #include <unistd.h>
7*e1eccf28SAndroid Build Coastguard Worker 
8*e1eccf28SAndroid Build Coastguard Worker #include <set>
9*e1eccf28SAndroid Build Coastguard Worker #include <sstream>
10*e1eccf28SAndroid Build Coastguard Worker #include <string>
11*e1eccf28SAndroid Build Coastguard Worker #include <vector>
12*e1eccf28SAndroid Build Coastguard Worker 
13*e1eccf28SAndroid Build Coastguard Worker #ifndef RS_COMPATIBILITY_LIB
14*e1eccf28SAndroid Build Coastguard Worker #include "bcc/Config.h"
15*e1eccf28SAndroid Build Coastguard Worker #endif
16*e1eccf28SAndroid Build Coastguard Worker 
17*e1eccf28SAndroid Build Coastguard Worker #include "cpu_ref/rsCpuCore.h"
18*e1eccf28SAndroid Build Coastguard Worker #include "rsClosure.h"
19*e1eccf28SAndroid Build Coastguard Worker #include "rsContext.h"
20*e1eccf28SAndroid Build Coastguard Worker #include "rsCpuCore.h"
21*e1eccf28SAndroid Build Coastguard Worker #include "rsCpuExecutable.h"
22*e1eccf28SAndroid Build Coastguard Worker #include "rsCpuScript.h"
23*e1eccf28SAndroid Build Coastguard Worker #include "rsScript.h"
24*e1eccf28SAndroid Build Coastguard Worker #include "rsScriptGroup2.h"
25*e1eccf28SAndroid Build Coastguard Worker #include "rsScriptIntrinsic.h"
26*e1eccf28SAndroid Build Coastguard Worker 
27*e1eccf28SAndroid Build Coastguard Worker using std::string;
28*e1eccf28SAndroid Build Coastguard Worker using std::vector;
29*e1eccf28SAndroid Build Coastguard Worker 
30*e1eccf28SAndroid Build Coastguard Worker namespace android {
31*e1eccf28SAndroid Build Coastguard Worker namespace renderscript {
32*e1eccf28SAndroid Build Coastguard Worker 
33*e1eccf28SAndroid Build Coastguard Worker namespace {
34*e1eccf28SAndroid Build Coastguard Worker 
35*e1eccf28SAndroid Build Coastguard Worker const size_t DefaultKernelArgCount = 2;
36*e1eccf28SAndroid Build Coastguard Worker 
groupRoot(const RsExpandKernelDriverInfo * kinfo,uint32_t xstart,uint32_t xend,uint32_t outstep)37*e1eccf28SAndroid Build Coastguard Worker void groupRoot(const RsExpandKernelDriverInfo *kinfo, uint32_t xstart,
38*e1eccf28SAndroid Build Coastguard Worker                uint32_t xend, uint32_t outstep) {
39*e1eccf28SAndroid Build Coastguard Worker     const List<CPUClosure*>& closures = *(List<CPUClosure*>*)kinfo->usr;
40*e1eccf28SAndroid Build Coastguard Worker     RsExpandKernelDriverInfo *mutable_kinfo = const_cast<RsExpandKernelDriverInfo *>(kinfo);
41*e1eccf28SAndroid Build Coastguard Worker 
42*e1eccf28SAndroid Build Coastguard Worker     const size_t oldInLen = mutable_kinfo->inLen;
43*e1eccf28SAndroid Build Coastguard Worker 
44*e1eccf28SAndroid Build Coastguard Worker     decltype(mutable_kinfo->inStride) oldInStride;
45*e1eccf28SAndroid Build Coastguard Worker     memcpy(&oldInStride, &mutable_kinfo->inStride, sizeof(oldInStride));
46*e1eccf28SAndroid Build Coastguard Worker 
47*e1eccf28SAndroid Build Coastguard Worker     for (CPUClosure* cpuClosure : closures) {
48*e1eccf28SAndroid Build Coastguard Worker         const Closure* closure = cpuClosure->mClosure;
49*e1eccf28SAndroid Build Coastguard Worker 
50*e1eccf28SAndroid Build Coastguard Worker         // There had better be enough space in mutable_kinfo
51*e1eccf28SAndroid Build Coastguard Worker         rsAssert(closure->mNumArg <= RS_KERNEL_INPUT_LIMIT);
52*e1eccf28SAndroid Build Coastguard Worker 
53*e1eccf28SAndroid Build Coastguard Worker         for (size_t i = 0; i < closure->mNumArg; i++) {
54*e1eccf28SAndroid Build Coastguard Worker             const void* arg = closure->mArgs[i];
55*e1eccf28SAndroid Build Coastguard Worker             const Allocation* a = (const Allocation*)arg;
56*e1eccf28SAndroid Build Coastguard Worker             const uint32_t eStride = a->mHal.state.elementSizeBytes;
57*e1eccf28SAndroid Build Coastguard Worker             const uint8_t* ptr = (uint8_t*)(a->mHal.drvState.lod[0].mallocPtr) +
58*e1eccf28SAndroid Build Coastguard Worker                     eStride * xstart;
59*e1eccf28SAndroid Build Coastguard Worker             if (kinfo->dim.y > 1) {
60*e1eccf28SAndroid Build Coastguard Worker                 ptr += a->mHal.drvState.lod[0].stride * kinfo->current.y;
61*e1eccf28SAndroid Build Coastguard Worker             }
62*e1eccf28SAndroid Build Coastguard Worker             mutable_kinfo->inPtr[i] = ptr;
63*e1eccf28SAndroid Build Coastguard Worker             mutable_kinfo->inStride[i] = eStride;
64*e1eccf28SAndroid Build Coastguard Worker         }
65*e1eccf28SAndroid Build Coastguard Worker         mutable_kinfo->inLen = closure->mNumArg;
66*e1eccf28SAndroid Build Coastguard Worker 
67*e1eccf28SAndroid Build Coastguard Worker         const Allocation* out = closure->mReturnValue;
68*e1eccf28SAndroid Build Coastguard Worker         const uint32_t ostep = out->mHal.state.elementSizeBytes;
69*e1eccf28SAndroid Build Coastguard Worker         const uint8_t* ptr = (uint8_t *)(out->mHal.drvState.lod[0].mallocPtr) +
70*e1eccf28SAndroid Build Coastguard Worker                 ostep * xstart;
71*e1eccf28SAndroid Build Coastguard Worker         if (kinfo->dim.y > 1) {
72*e1eccf28SAndroid Build Coastguard Worker             ptr += out->mHal.drvState.lod[0].stride * kinfo->current.y;
73*e1eccf28SAndroid Build Coastguard Worker         }
74*e1eccf28SAndroid Build Coastguard Worker 
75*e1eccf28SAndroid Build Coastguard Worker         mutable_kinfo->outPtr[0] = const_cast<uint8_t*>(ptr);
76*e1eccf28SAndroid Build Coastguard Worker 
77*e1eccf28SAndroid Build Coastguard Worker         // The implementation of an intrinsic relies on kinfo->usr being
78*e1eccf28SAndroid Build Coastguard Worker         // the "this" pointer to the intrinsic (an RsdCpuScriptIntrinsic object)
79*e1eccf28SAndroid Build Coastguard Worker         mutable_kinfo->usr = cpuClosure->mSi;
80*e1eccf28SAndroid Build Coastguard Worker 
81*e1eccf28SAndroid Build Coastguard Worker         cpuClosure->mFunc(kinfo, xstart, xend, ostep);
82*e1eccf28SAndroid Build Coastguard Worker     }
83*e1eccf28SAndroid Build Coastguard Worker 
84*e1eccf28SAndroid Build Coastguard Worker     mutable_kinfo->inLen = oldInLen;
85*e1eccf28SAndroid Build Coastguard Worker     mutable_kinfo->usr = &closures;
86*e1eccf28SAndroid Build Coastguard Worker     memcpy(&mutable_kinfo->inStride, &oldInStride, sizeof(oldInStride));
87*e1eccf28SAndroid Build Coastguard Worker }
88*e1eccf28SAndroid Build Coastguard Worker 
89*e1eccf28SAndroid Build Coastguard Worker }  // namespace
90*e1eccf28SAndroid Build Coastguard Worker 
Batch(CpuScriptGroup2Impl * group,const char * name)91*e1eccf28SAndroid Build Coastguard Worker Batch::Batch(CpuScriptGroup2Impl* group, const char* name) :
92*e1eccf28SAndroid Build Coastguard Worker     mGroup(group), mFunc(nullptr) {
93*e1eccf28SAndroid Build Coastguard Worker     mName = strndup(name, strlen(name));
94*e1eccf28SAndroid Build Coastguard Worker }
95*e1eccf28SAndroid Build Coastguard Worker 
~Batch()96*e1eccf28SAndroid Build Coastguard Worker Batch::~Batch() {
97*e1eccf28SAndroid Build Coastguard Worker     for (CPUClosure* c : mClosures) {
98*e1eccf28SAndroid Build Coastguard Worker         delete c;
99*e1eccf28SAndroid Build Coastguard Worker     }
100*e1eccf28SAndroid Build Coastguard Worker     free(mName);
101*e1eccf28SAndroid Build Coastguard Worker }
102*e1eccf28SAndroid Build Coastguard Worker 
conflict(CPUClosure * cpuClosure) const103*e1eccf28SAndroid Build Coastguard Worker bool Batch::conflict(CPUClosure* cpuClosure) const {
104*e1eccf28SAndroid Build Coastguard Worker     if (mClosures.empty()) {
105*e1eccf28SAndroid Build Coastguard Worker         return false;
106*e1eccf28SAndroid Build Coastguard Worker     }
107*e1eccf28SAndroid Build Coastguard Worker 
108*e1eccf28SAndroid Build Coastguard Worker     const Closure* closure = cpuClosure->mClosure;
109*e1eccf28SAndroid Build Coastguard Worker 
110*e1eccf28SAndroid Build Coastguard Worker     if (!closure->mIsKernel || !mClosures.front()->mClosure->mIsKernel) {
111*e1eccf28SAndroid Build Coastguard Worker         // An invoke should be in a batch by itself, so it conflicts with any other
112*e1eccf28SAndroid Build Coastguard Worker         // closure.
113*e1eccf28SAndroid Build Coastguard Worker         return true;
114*e1eccf28SAndroid Build Coastguard Worker     }
115*e1eccf28SAndroid Build Coastguard Worker 
116*e1eccf28SAndroid Build Coastguard Worker     const auto& globalDeps = closure->mGlobalDeps;
117*e1eccf28SAndroid Build Coastguard Worker     const auto& argDeps = closure->mArgDeps;
118*e1eccf28SAndroid Build Coastguard Worker 
119*e1eccf28SAndroid Build Coastguard Worker     for (CPUClosure* c : mClosures) {
120*e1eccf28SAndroid Build Coastguard Worker         const Closure* batched = c->mClosure;
121*e1eccf28SAndroid Build Coastguard Worker         if (globalDeps.find(batched) != globalDeps.end()) {
122*e1eccf28SAndroid Build Coastguard Worker             return true;
123*e1eccf28SAndroid Build Coastguard Worker         }
124*e1eccf28SAndroid Build Coastguard Worker         const auto& it = argDeps.find(batched);
125*e1eccf28SAndroid Build Coastguard Worker         if (it != argDeps.end()) {
126*e1eccf28SAndroid Build Coastguard Worker             const auto& args = (*it).second;
127*e1eccf28SAndroid Build Coastguard Worker             for (const auto &p1 : *args) {
128*e1eccf28SAndroid Build Coastguard Worker                 if (p1.second.get() != nullptr) {
129*e1eccf28SAndroid Build Coastguard Worker                     return true;
130*e1eccf28SAndroid Build Coastguard Worker                 }
131*e1eccf28SAndroid Build Coastguard Worker             }
132*e1eccf28SAndroid Build Coastguard Worker         }
133*e1eccf28SAndroid Build Coastguard Worker     }
134*e1eccf28SAndroid Build Coastguard Worker 
135*e1eccf28SAndroid Build Coastguard Worker     // The compiler fusion pass in bcc expects that kernels chained up through
136*e1eccf28SAndroid Build Coastguard Worker     // (1st) input and output.
137*e1eccf28SAndroid Build Coastguard Worker 
138*e1eccf28SAndroid Build Coastguard Worker     const Closure* lastBatched = mClosures.back()->mClosure;
139*e1eccf28SAndroid Build Coastguard Worker     const auto& it = argDeps.find(lastBatched);
140*e1eccf28SAndroid Build Coastguard Worker 
141*e1eccf28SAndroid Build Coastguard Worker     if (it == argDeps.end()) {
142*e1eccf28SAndroid Build Coastguard Worker         return true;
143*e1eccf28SAndroid Build Coastguard Worker     }
144*e1eccf28SAndroid Build Coastguard Worker 
145*e1eccf28SAndroid Build Coastguard Worker     const auto& args = (*it).second;
146*e1eccf28SAndroid Build Coastguard Worker     for (const auto &p1 : *args) {
147*e1eccf28SAndroid Build Coastguard Worker         if (p1.first == 0 && p1.second.get() == nullptr) {
148*e1eccf28SAndroid Build Coastguard Worker             // The new closure depends on the last batched closure's return
149*e1eccf28SAndroid Build Coastguard Worker             // value (fieldId being nullptr) for its first argument (argument 0)
150*e1eccf28SAndroid Build Coastguard Worker             return false;
151*e1eccf28SAndroid Build Coastguard Worker         }
152*e1eccf28SAndroid Build Coastguard Worker     }
153*e1eccf28SAndroid Build Coastguard Worker 
154*e1eccf28SAndroid Build Coastguard Worker     return true;
155*e1eccf28SAndroid Build Coastguard Worker }
156*e1eccf28SAndroid Build Coastguard Worker 
CpuScriptGroup2Impl(RsdCpuReferenceImpl * cpuRefImpl,const ScriptGroupBase * sg)157*e1eccf28SAndroid Build Coastguard Worker CpuScriptGroup2Impl::CpuScriptGroup2Impl(RsdCpuReferenceImpl *cpuRefImpl,
158*e1eccf28SAndroid Build Coastguard Worker                                          const ScriptGroupBase *sg) :
159*e1eccf28SAndroid Build Coastguard Worker     mCpuRefImpl(cpuRefImpl), mGroup((const ScriptGroup2*)(sg)),
160*e1eccf28SAndroid Build Coastguard Worker     mExecutable(nullptr), mScriptObj(nullptr) {
161*e1eccf28SAndroid Build Coastguard Worker     rsAssert(!mGroup->mClosures.empty());
162*e1eccf28SAndroid Build Coastguard Worker 
163*e1eccf28SAndroid Build Coastguard Worker     mCpuRefImpl->lockMutex();
164*e1eccf28SAndroid Build Coastguard Worker     Batch* batch = new Batch(this, "Batch0");
165*e1eccf28SAndroid Build Coastguard Worker     int i = 0;
166*e1eccf28SAndroid Build Coastguard Worker     for (Closure* closure: mGroup->mClosures) {
167*e1eccf28SAndroid Build Coastguard Worker         CPUClosure* cc;
168*e1eccf28SAndroid Build Coastguard Worker         const IDBase* funcID = closure->mFunctionID.get();
169*e1eccf28SAndroid Build Coastguard Worker         RsdCpuScriptImpl* si =
170*e1eccf28SAndroid Build Coastguard Worker                 (RsdCpuScriptImpl *)mCpuRefImpl->lookupScript(funcID->mScript);
171*e1eccf28SAndroid Build Coastguard Worker         if (closure->mIsKernel) {
172*e1eccf28SAndroid Build Coastguard Worker             MTLaunchStructForEach mtls;
173*e1eccf28SAndroid Build Coastguard Worker             si->forEachKernelSetup(funcID->mSlot, &mtls);
174*e1eccf28SAndroid Build Coastguard Worker             cc = new CPUClosure(closure, si, (ExpandFuncTy)mtls.kernel);
175*e1eccf28SAndroid Build Coastguard Worker         } else {
176*e1eccf28SAndroid Build Coastguard Worker             cc = new CPUClosure(closure, si);
177*e1eccf28SAndroid Build Coastguard Worker         }
178*e1eccf28SAndroid Build Coastguard Worker 
179*e1eccf28SAndroid Build Coastguard Worker         if (batch->conflict(cc)) {
180*e1eccf28SAndroid Build Coastguard Worker             mBatches.push_back(batch);
181*e1eccf28SAndroid Build Coastguard Worker             std::stringstream ss;
182*e1eccf28SAndroid Build Coastguard Worker             ss << "Batch" << ++i;
183*e1eccf28SAndroid Build Coastguard Worker             std::string batchStr(ss.str());
184*e1eccf28SAndroid Build Coastguard Worker             batch = new Batch(this, batchStr.c_str());
185*e1eccf28SAndroid Build Coastguard Worker         }
186*e1eccf28SAndroid Build Coastguard Worker 
187*e1eccf28SAndroid Build Coastguard Worker         batch->mClosures.push_back(cc);
188*e1eccf28SAndroid Build Coastguard Worker     }
189*e1eccf28SAndroid Build Coastguard Worker 
190*e1eccf28SAndroid Build Coastguard Worker     rsAssert(!batch->mClosures.empty());
191*e1eccf28SAndroid Build Coastguard Worker     mBatches.push_back(batch);
192*e1eccf28SAndroid Build Coastguard Worker 
193*e1eccf28SAndroid Build Coastguard Worker #ifndef RS_COMPATIBILITY_LIB
194*e1eccf28SAndroid Build Coastguard Worker     compile(mGroup->mCacheDir);
195*e1eccf28SAndroid Build Coastguard Worker     if (mScriptObj != nullptr && mExecutable != nullptr) {
196*e1eccf28SAndroid Build Coastguard Worker         for (Batch* batch : mBatches) {
197*e1eccf28SAndroid Build Coastguard Worker             batch->resolveFuncPtr(mScriptObj);
198*e1eccf28SAndroid Build Coastguard Worker         }
199*e1eccf28SAndroid Build Coastguard Worker     }
200*e1eccf28SAndroid Build Coastguard Worker #endif  // RS_COMPATIBILITY_LIB
201*e1eccf28SAndroid Build Coastguard Worker     mCpuRefImpl->unlockMutex();
202*e1eccf28SAndroid Build Coastguard Worker }
203*e1eccf28SAndroid Build Coastguard Worker 
resolveFuncPtr(void * sharedObj)204*e1eccf28SAndroid Build Coastguard Worker void Batch::resolveFuncPtr(void* sharedObj) {
205*e1eccf28SAndroid Build Coastguard Worker     std::string funcName(mName);
206*e1eccf28SAndroid Build Coastguard Worker     if (mClosures.front()->mClosure->mIsKernel) {
207*e1eccf28SAndroid Build Coastguard Worker         funcName.append(".expand");
208*e1eccf28SAndroid Build Coastguard Worker     }
209*e1eccf28SAndroid Build Coastguard Worker     mFunc = dlsym(sharedObj, funcName.c_str());
210*e1eccf28SAndroid Build Coastguard Worker     rsAssert (mFunc != nullptr);
211*e1eccf28SAndroid Build Coastguard Worker }
212*e1eccf28SAndroid Build Coastguard Worker 
~CpuScriptGroup2Impl()213*e1eccf28SAndroid Build Coastguard Worker CpuScriptGroup2Impl::~CpuScriptGroup2Impl() {
214*e1eccf28SAndroid Build Coastguard Worker     for (Batch* batch : mBatches) {
215*e1eccf28SAndroid Build Coastguard Worker         delete batch;
216*e1eccf28SAndroid Build Coastguard Worker     }
217*e1eccf28SAndroid Build Coastguard Worker     delete mExecutable;
218*e1eccf28SAndroid Build Coastguard Worker     // TODO: move this dlclose into ~ScriptExecutable().
219*e1eccf28SAndroid Build Coastguard Worker     if (mScriptObj != nullptr) {
220*e1eccf28SAndroid Build Coastguard Worker         dlclose(mScriptObj);
221*e1eccf28SAndroid Build Coastguard Worker     }
222*e1eccf28SAndroid Build Coastguard Worker }
223*e1eccf28SAndroid Build Coastguard Worker 
224*e1eccf28SAndroid Build Coastguard Worker namespace {
225*e1eccf28SAndroid Build Coastguard Worker 
226*e1eccf28SAndroid Build Coastguard Worker #ifndef RS_COMPATIBILITY_LIB
227*e1eccf28SAndroid Build Coastguard Worker 
getCoreLibPath(Context * context,string * coreLibRelaxedPath)228*e1eccf28SAndroid Build Coastguard Worker string getCoreLibPath(Context* context, string* coreLibRelaxedPath) {
229*e1eccf28SAndroid Build Coastguard Worker     *coreLibRelaxedPath = "";
230*e1eccf28SAndroid Build Coastguard Worker 
231*e1eccf28SAndroid Build Coastguard Worker     // If we're debugging, use the debug library.
232*e1eccf28SAndroid Build Coastguard Worker     if (context->getContextType() == RS_CONTEXT_TYPE_DEBUG) {
233*e1eccf28SAndroid Build Coastguard Worker         return SYSLIBPATH_BC"/libclcore_debug.bc";
234*e1eccf28SAndroid Build Coastguard Worker     }
235*e1eccf28SAndroid Build Coastguard Worker 
236*e1eccf28SAndroid Build Coastguard Worker     // Check for a platform specific library
237*e1eccf28SAndroid Build Coastguard Worker 
238*e1eccf28SAndroid Build Coastguard Worker #if defined(ARCH_ARM_HAVE_NEON) && !defined(DISABLE_CLCORE_NEON)
239*e1eccf28SAndroid Build Coastguard Worker     // NEON-capable ARMv7a devices can use an accelerated math library
240*e1eccf28SAndroid Build Coastguard Worker     // for all reduced precision scripts.
241*e1eccf28SAndroid Build Coastguard Worker     // ARMv8 does not use NEON, as ASIMD can be used with all precision
242*e1eccf28SAndroid Build Coastguard Worker     // levels.
243*e1eccf28SAndroid Build Coastguard Worker     *coreLibRelaxedPath = SYSLIBPATH_BC"/libclcore_neon.bc";
244*e1eccf28SAndroid Build Coastguard Worker #endif
245*e1eccf28SAndroid Build Coastguard Worker 
246*e1eccf28SAndroid Build Coastguard Worker #if defined(__i386__) || defined(__x86_64__)
247*e1eccf28SAndroid Build Coastguard Worker     // x86 devices will use an optimized library.
248*e1eccf28SAndroid Build Coastguard Worker     return SYSLIBPATH_BC"/libclcore_x86.bc";
249*e1eccf28SAndroid Build Coastguard Worker #else
250*e1eccf28SAndroid Build Coastguard Worker     return SYSLIBPATH_BC"/libclcore.bc";
251*e1eccf28SAndroid Build Coastguard Worker #endif
252*e1eccf28SAndroid Build Coastguard Worker }
253*e1eccf28SAndroid Build Coastguard Worker 
setupCompileArguments(const vector<const char * > & inputs,const vector<string> & kernelBatches,const vector<string> & invokeBatches,const char * outputDir,const char * outputFileName,const char * coreLibPath,const char * coreLibRelaxedPath,const bool emitGlobalInfo,const bool emitGlobalInfoSkipConstant,int optLevel,vector<const char * > * args)254*e1eccf28SAndroid Build Coastguard Worker void setupCompileArguments(
255*e1eccf28SAndroid Build Coastguard Worker         const vector<const char*>& inputs, const vector<string>& kernelBatches,
256*e1eccf28SAndroid Build Coastguard Worker         const vector<string>& invokeBatches,
257*e1eccf28SAndroid Build Coastguard Worker         const char* outputDir, const char* outputFileName,
258*e1eccf28SAndroid Build Coastguard Worker         const char* coreLibPath, const char* coreLibRelaxedPath,
259*e1eccf28SAndroid Build Coastguard Worker         const bool emitGlobalInfo, const bool emitGlobalInfoSkipConstant,
260*e1eccf28SAndroid Build Coastguard Worker         int optLevel, vector<const char*>* args) {
261*e1eccf28SAndroid Build Coastguard Worker     args->push_back(RsdCpuScriptImpl::BCC_EXE_PATH);
262*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-fPIC");
263*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-embedRSInfo");
264*e1eccf28SAndroid Build Coastguard Worker     if (emitGlobalInfo) {
265*e1eccf28SAndroid Build Coastguard Worker         args->push_back("-rs-global-info");
266*e1eccf28SAndroid Build Coastguard Worker         if (emitGlobalInfoSkipConstant) {
267*e1eccf28SAndroid Build Coastguard Worker             args->push_back("-rs-global-info-skip-constant");
268*e1eccf28SAndroid Build Coastguard Worker         }
269*e1eccf28SAndroid Build Coastguard Worker     }
270*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-mtriple");
271*e1eccf28SAndroid Build Coastguard Worker     args->push_back(DEFAULT_TARGET_TRIPLE_STRING);
272*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-bclib");
273*e1eccf28SAndroid Build Coastguard Worker     args->push_back(coreLibPath);
274*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-bclib_relaxed");
275*e1eccf28SAndroid Build Coastguard Worker     args->push_back(coreLibRelaxedPath);
276*e1eccf28SAndroid Build Coastguard Worker     for (const char* input : inputs) {
277*e1eccf28SAndroid Build Coastguard Worker         args->push_back(input);
278*e1eccf28SAndroid Build Coastguard Worker     }
279*e1eccf28SAndroid Build Coastguard Worker     for (const string& batch : kernelBatches) {
280*e1eccf28SAndroid Build Coastguard Worker         args->push_back("-merge");
281*e1eccf28SAndroid Build Coastguard Worker         args->push_back(batch.c_str());
282*e1eccf28SAndroid Build Coastguard Worker     }
283*e1eccf28SAndroid Build Coastguard Worker     for (const string& batch : invokeBatches) {
284*e1eccf28SAndroid Build Coastguard Worker         args->push_back("-invoke");
285*e1eccf28SAndroid Build Coastguard Worker         args->push_back(batch.c_str());
286*e1eccf28SAndroid Build Coastguard Worker     }
287*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-output_path");
288*e1eccf28SAndroid Build Coastguard Worker     args->push_back(outputDir);
289*e1eccf28SAndroid Build Coastguard Worker 
290*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-O");
291*e1eccf28SAndroid Build Coastguard Worker     switch (optLevel) {
292*e1eccf28SAndroid Build Coastguard Worker     case 0:
293*e1eccf28SAndroid Build Coastguard Worker         args->push_back("0");
294*e1eccf28SAndroid Build Coastguard Worker         break;
295*e1eccf28SAndroid Build Coastguard Worker     case 3:
296*e1eccf28SAndroid Build Coastguard Worker         args->push_back("3");
297*e1eccf28SAndroid Build Coastguard Worker         break;
298*e1eccf28SAndroid Build Coastguard Worker     default:
299*e1eccf28SAndroid Build Coastguard Worker         ALOGW("Expected optimization level of 0 or 3. Received %d", optLevel);
300*e1eccf28SAndroid Build Coastguard Worker         args->push_back("3");
301*e1eccf28SAndroid Build Coastguard Worker         break;
302*e1eccf28SAndroid Build Coastguard Worker     }
303*e1eccf28SAndroid Build Coastguard Worker 
304*e1eccf28SAndroid Build Coastguard Worker     // The output filename has to be the last, in case we need to pop it out and
305*e1eccf28SAndroid Build Coastguard Worker     // replace with a different name.
306*e1eccf28SAndroid Build Coastguard Worker     args->push_back("-o");
307*e1eccf28SAndroid Build Coastguard Worker     args->push_back(outputFileName);
308*e1eccf28SAndroid Build Coastguard Worker }
309*e1eccf28SAndroid Build Coastguard Worker 
generateSourceSlot(RsdCpuReferenceImpl * ctxt,const Closure & closure,const std::vector<const char * > & inputs,std::stringstream & ss)310*e1eccf28SAndroid Build Coastguard Worker void generateSourceSlot(RsdCpuReferenceImpl* ctxt,
311*e1eccf28SAndroid Build Coastguard Worker                         const Closure& closure,
312*e1eccf28SAndroid Build Coastguard Worker                         const std::vector<const char*>& inputs,
313*e1eccf28SAndroid Build Coastguard Worker                         std::stringstream& ss) {
314*e1eccf28SAndroid Build Coastguard Worker     const IDBase* funcID = (const IDBase*)closure.mFunctionID.get();
315*e1eccf28SAndroid Build Coastguard Worker     const Script* script = funcID->mScript;
316*e1eccf28SAndroid Build Coastguard Worker 
317*e1eccf28SAndroid Build Coastguard Worker     rsAssert (!script->isIntrinsic());
318*e1eccf28SAndroid Build Coastguard Worker 
319*e1eccf28SAndroid Build Coastguard Worker     const RsdCpuScriptImpl *cpuScript =
320*e1eccf28SAndroid Build Coastguard Worker             (const RsdCpuScriptImpl *)ctxt->lookupScript(script);
321*e1eccf28SAndroid Build Coastguard Worker     const string& bitcodeFilename = cpuScript->getBitcodeFilePath();
322*e1eccf28SAndroid Build Coastguard Worker 
323*e1eccf28SAndroid Build Coastguard Worker     const int index = find(inputs.begin(), inputs.end(), bitcodeFilename) -
324*e1eccf28SAndroid Build Coastguard Worker             inputs.begin();
325*e1eccf28SAndroid Build Coastguard Worker 
326*e1eccf28SAndroid Build Coastguard Worker     ss << index << "," << funcID->mSlot << ".";
327*e1eccf28SAndroid Build Coastguard Worker }
328*e1eccf28SAndroid Build Coastguard Worker 
329*e1eccf28SAndroid Build Coastguard Worker #endif  // RS_COMPATIBILTY_LIB
330*e1eccf28SAndroid Build Coastguard Worker 
331*e1eccf28SAndroid Build Coastguard Worker }  // anonymous namespace
332*e1eccf28SAndroid Build Coastguard Worker 
333*e1eccf28SAndroid Build Coastguard Worker // This function is used by the debugger to inspect ScriptGroup
334*e1eccf28SAndroid Build Coastguard Worker // compilations.
335*e1eccf28SAndroid Build Coastguard Worker //
336*e1eccf28SAndroid Build Coastguard Worker // "__attribute__((noinline))" and "__asm__" are used to prevent the
337*e1eccf28SAndroid Build Coastguard Worker // function call from being eliminated as a no-op (see the "noinline"
338*e1eccf28SAndroid Build Coastguard Worker // attribute in gcc documentation).
339*e1eccf28SAndroid Build Coastguard Worker //
340*e1eccf28SAndroid Build Coastguard Worker // "__attribute__((weak))" is used to prevent callers from recognizing
341*e1eccf28SAndroid Build Coastguard Worker // that this is guaranteed to be the function definition, recognizing
342*e1eccf28SAndroid Build Coastguard Worker // that certain arguments are unused, and optimizing away the passing
343*e1eccf28SAndroid Build Coastguard Worker // of those arguments (see the LLVM optimization
344*e1eccf28SAndroid Build Coastguard Worker // DeadArgumentElimination).  Theoretically, the compiler could get
345*e1eccf28SAndroid Build Coastguard Worker // aggressive enough with link-time optimization that even marking the
346*e1eccf28SAndroid Build Coastguard Worker // entry point as a weak definition wouldn't solve the problem.
347*e1eccf28SAndroid Build Coastguard Worker //
348*e1eccf28SAndroid Build Coastguard Worker extern __attribute__((noinline)) __attribute__((weak))
debugHintScriptGroup2(const char * groupName,const uint32_t groupNameSize,const ExpandFuncTy * kernel,const uint32_t kernelCount)349*e1eccf28SAndroid Build Coastguard Worker void debugHintScriptGroup2(const char* groupName,
350*e1eccf28SAndroid Build Coastguard Worker                            const uint32_t groupNameSize,
351*e1eccf28SAndroid Build Coastguard Worker                            const ExpandFuncTy* kernel,
352*e1eccf28SAndroid Build Coastguard Worker                            const uint32_t kernelCount) {
353*e1eccf28SAndroid Build Coastguard Worker     ALOGV("group name: %d:%s\n", groupNameSize, groupName);
354*e1eccf28SAndroid Build Coastguard Worker     for (uint32_t i=0; i < kernelCount; ++i) {
355*e1eccf28SAndroid Build Coastguard Worker         const char* f1 = (const char*)(kernel[i]);
356*e1eccf28SAndroid Build Coastguard Worker         __asm__ __volatile__("");
357*e1eccf28SAndroid Build Coastguard Worker         ALOGV("  closure: %p\n", (const void*)f1);
358*e1eccf28SAndroid Build Coastguard Worker     }
359*e1eccf28SAndroid Build Coastguard Worker     // do nothing, this is just a hook point for the debugger.
360*e1eccf28SAndroid Build Coastguard Worker     return;
361*e1eccf28SAndroid Build Coastguard Worker }
362*e1eccf28SAndroid Build Coastguard Worker 
compile(const char * cacheDir)363*e1eccf28SAndroid Build Coastguard Worker void CpuScriptGroup2Impl::compile(const char* cacheDir) {
364*e1eccf28SAndroid Build Coastguard Worker #ifndef RS_COMPATIBILITY_LIB
365*e1eccf28SAndroid Build Coastguard Worker     if (mGroup->mClosures.size() < 2) {
366*e1eccf28SAndroid Build Coastguard Worker         return;
367*e1eccf28SAndroid Build Coastguard Worker     }
368*e1eccf28SAndroid Build Coastguard Worker 
369*e1eccf28SAndroid Build Coastguard Worker     const int optLevel = getCpuRefImpl()->getContext()->getOptLevel();
370*e1eccf28SAndroid Build Coastguard Worker     if (optLevel == 0) {
371*e1eccf28SAndroid Build Coastguard Worker         std::vector<ExpandFuncTy> kernels;
372*e1eccf28SAndroid Build Coastguard Worker         for (const Batch* b : mBatches)
373*e1eccf28SAndroid Build Coastguard Worker             for (const CPUClosure* c : b->mClosures)
374*e1eccf28SAndroid Build Coastguard Worker                 kernels.push_back(c->mFunc);
375*e1eccf28SAndroid Build Coastguard Worker 
376*e1eccf28SAndroid Build Coastguard Worker         if (kernels.size()) {
377*e1eccf28SAndroid Build Coastguard Worker             // pass this information on to the debugger via a hint function.
378*e1eccf28SAndroid Build Coastguard Worker             debugHintScriptGroup2(mGroup->mName,
379*e1eccf28SAndroid Build Coastguard Worker                                   strlen(mGroup->mName),
380*e1eccf28SAndroid Build Coastguard Worker                                   kernels.data(),
381*e1eccf28SAndroid Build Coastguard Worker                                   kernels.size());
382*e1eccf28SAndroid Build Coastguard Worker         }
383*e1eccf28SAndroid Build Coastguard Worker 
384*e1eccf28SAndroid Build Coastguard Worker         // skip script group compilation forcing the driver to use the fallback
385*e1eccf28SAndroid Build Coastguard Worker         // execution path which currently has better support for debugging.
386*e1eccf28SAndroid Build Coastguard Worker         return;
387*e1eccf28SAndroid Build Coastguard Worker     }
388*e1eccf28SAndroid Build Coastguard Worker 
389*e1eccf28SAndroid Build Coastguard Worker     auto comparator = [](const char* str1, const char* str2) -> bool {
390*e1eccf28SAndroid Build Coastguard Worker         return strcmp(str1, str2) < 0;
391*e1eccf28SAndroid Build Coastguard Worker     };
392*e1eccf28SAndroid Build Coastguard Worker     std::set<const char*, decltype(comparator)> inputSet(comparator);
393*e1eccf28SAndroid Build Coastguard Worker 
394*e1eccf28SAndroid Build Coastguard Worker     for (Closure* closure : mGroup->mClosures) {
395*e1eccf28SAndroid Build Coastguard Worker         const Script* script = closure->mFunctionID.get()->mScript;
396*e1eccf28SAndroid Build Coastguard Worker 
397*e1eccf28SAndroid Build Coastguard Worker         // If any script is an intrinsic, give up trying fusing the kernels.
398*e1eccf28SAndroid Build Coastguard Worker         if (script->isIntrinsic()) {
399*e1eccf28SAndroid Build Coastguard Worker             return;
400*e1eccf28SAndroid Build Coastguard Worker         }
401*e1eccf28SAndroid Build Coastguard Worker 
402*e1eccf28SAndroid Build Coastguard Worker         const RsdCpuScriptImpl *cpuScript =
403*e1eccf28SAndroid Build Coastguard Worker             (const RsdCpuScriptImpl *)mCpuRefImpl->lookupScript(script);
404*e1eccf28SAndroid Build Coastguard Worker 
405*e1eccf28SAndroid Build Coastguard Worker         const char* bitcodeFilename = cpuScript->getBitcodeFilePath();
406*e1eccf28SAndroid Build Coastguard Worker         inputSet.insert(bitcodeFilename);
407*e1eccf28SAndroid Build Coastguard Worker     }
408*e1eccf28SAndroid Build Coastguard Worker 
409*e1eccf28SAndroid Build Coastguard Worker     std::vector<const char*> inputs(inputSet.begin(), inputSet.end());
410*e1eccf28SAndroid Build Coastguard Worker 
411*e1eccf28SAndroid Build Coastguard Worker     std::vector<string> kernelBatches;
412*e1eccf28SAndroid Build Coastguard Worker     std::vector<string> invokeBatches;
413*e1eccf28SAndroid Build Coastguard Worker 
414*e1eccf28SAndroid Build Coastguard Worker     int i = 0;
415*e1eccf28SAndroid Build Coastguard Worker     for (const auto& batch : mBatches) {
416*e1eccf28SAndroid Build Coastguard Worker         rsAssert(batch->size() > 0);
417*e1eccf28SAndroid Build Coastguard Worker 
418*e1eccf28SAndroid Build Coastguard Worker         std::stringstream ss;
419*e1eccf28SAndroid Build Coastguard Worker         ss << batch->mName << ":";
420*e1eccf28SAndroid Build Coastguard Worker 
421*e1eccf28SAndroid Build Coastguard Worker         if (!batch->mClosures.front()->mClosure->mIsKernel) {
422*e1eccf28SAndroid Build Coastguard Worker             rsAssert(batch->size() == 1);
423*e1eccf28SAndroid Build Coastguard Worker             generateSourceSlot(mCpuRefImpl, *batch->mClosures.front()->mClosure, inputs, ss);
424*e1eccf28SAndroid Build Coastguard Worker             invokeBatches.push_back(ss.str());
425*e1eccf28SAndroid Build Coastguard Worker         } else {
426*e1eccf28SAndroid Build Coastguard Worker             for (const auto& cpuClosure : batch->mClosures) {
427*e1eccf28SAndroid Build Coastguard Worker                 generateSourceSlot(mCpuRefImpl, *cpuClosure->mClosure, inputs, ss);
428*e1eccf28SAndroid Build Coastguard Worker             }
429*e1eccf28SAndroid Build Coastguard Worker             kernelBatches.push_back(ss.str());
430*e1eccf28SAndroid Build Coastguard Worker         }
431*e1eccf28SAndroid Build Coastguard Worker     }
432*e1eccf28SAndroid Build Coastguard Worker 
433*e1eccf28SAndroid Build Coastguard Worker     rsAssert(cacheDir != nullptr);
434*e1eccf28SAndroid Build Coastguard Worker     string objFilePath(cacheDir);
435*e1eccf28SAndroid Build Coastguard Worker     objFilePath.append("/");
436*e1eccf28SAndroid Build Coastguard Worker     objFilePath.append(mGroup->mName);
437*e1eccf28SAndroid Build Coastguard Worker     objFilePath.append(".o");
438*e1eccf28SAndroid Build Coastguard Worker 
439*e1eccf28SAndroid Build Coastguard Worker     const char* resName = mGroup->mName;
440*e1eccf28SAndroid Build Coastguard Worker     string coreLibRelaxedPath;
441*e1eccf28SAndroid Build Coastguard Worker     const string& coreLibPath = getCoreLibPath(getCpuRefImpl()->getContext(),
442*e1eccf28SAndroid Build Coastguard Worker                                                &coreLibRelaxedPath);
443*e1eccf28SAndroid Build Coastguard Worker 
444*e1eccf28SAndroid Build Coastguard Worker     vector<const char*> arguments;
445*e1eccf28SAndroid Build Coastguard Worker     bool emitGlobalInfo = getCpuRefImpl()->getEmbedGlobalInfo();
446*e1eccf28SAndroid Build Coastguard Worker     bool emitGlobalInfoSkipConstant = getCpuRefImpl()->getEmbedGlobalInfoSkipConstant();
447*e1eccf28SAndroid Build Coastguard Worker     setupCompileArguments(inputs, kernelBatches, invokeBatches, cacheDir,
448*e1eccf28SAndroid Build Coastguard Worker                           resName, coreLibPath.c_str(), coreLibRelaxedPath.c_str(),
449*e1eccf28SAndroid Build Coastguard Worker                           emitGlobalInfo, emitGlobalInfoSkipConstant,
450*e1eccf28SAndroid Build Coastguard Worker                           optLevel, &arguments);
451*e1eccf28SAndroid Build Coastguard Worker 
452*e1eccf28SAndroid Build Coastguard Worker     std::unique_ptr<const char> cmdLine(rsuJoinStrings(arguments.size() - 1,
453*e1eccf28SAndroid Build Coastguard Worker                                                        arguments.data()));
454*e1eccf28SAndroid Build Coastguard Worker 
455*e1eccf28SAndroid Build Coastguard Worker     inputs.push_back(coreLibPath.c_str());
456*e1eccf28SAndroid Build Coastguard Worker     inputs.push_back(coreLibRelaxedPath.c_str());
457*e1eccf28SAndroid Build Coastguard Worker 
458*e1eccf28SAndroid Build Coastguard Worker     uint32_t checksum = constructBuildChecksum(nullptr, 0, cmdLine.get(),
459*e1eccf28SAndroid Build Coastguard Worker                                                inputs.data(), inputs.size());
460*e1eccf28SAndroid Build Coastguard Worker 
461*e1eccf28SAndroid Build Coastguard Worker     if (checksum == 0) {
462*e1eccf28SAndroid Build Coastguard Worker         return;
463*e1eccf28SAndroid Build Coastguard Worker     }
464*e1eccf28SAndroid Build Coastguard Worker 
465*e1eccf28SAndroid Build Coastguard Worker     std::stringstream ss;
466*e1eccf28SAndroid Build Coastguard Worker     ss << std::hex << checksum;
467*e1eccf28SAndroid Build Coastguard Worker     std::string checksumStr(ss.str());
468*e1eccf28SAndroid Build Coastguard Worker 
469*e1eccf28SAndroid Build Coastguard Worker     //===--------------------------------------------------------------------===//
470*e1eccf28SAndroid Build Coastguard Worker     // Try to load a shared lib from code cache matching filename and checksum
471*e1eccf28SAndroid Build Coastguard Worker     //===--------------------------------------------------------------------===//
472*e1eccf28SAndroid Build Coastguard Worker 
473*e1eccf28SAndroid Build Coastguard Worker     bool alreadyLoaded = false;
474*e1eccf28SAndroid Build Coastguard Worker     std::string cloneName;
475*e1eccf28SAndroid Build Coastguard Worker 
476*e1eccf28SAndroid Build Coastguard Worker     const bool useRSDebugContext =
477*e1eccf28SAndroid Build Coastguard Worker             (mCpuRefImpl->getContext()->getContextType() == RS_CONTEXT_TYPE_DEBUG);
478*e1eccf28SAndroid Build Coastguard Worker     const bool reuse = !is_force_recompile() && !useRSDebugContext;
479*e1eccf28SAndroid Build Coastguard Worker     if (reuse) {
480*e1eccf28SAndroid Build Coastguard Worker         mScriptObj = SharedLibraryUtils::loadSharedLibrary(cacheDir, resName, nullptr,
481*e1eccf28SAndroid Build Coastguard Worker                                                            &alreadyLoaded);
482*e1eccf28SAndroid Build Coastguard Worker     }
483*e1eccf28SAndroid Build Coastguard Worker     if (mScriptObj != nullptr) {
484*e1eccf28SAndroid Build Coastguard Worker         // A shared library named resName is found in code cache directory
485*e1eccf28SAndroid Build Coastguard Worker         // cacheDir, and loaded with the handle stored in mScriptObj.
486*e1eccf28SAndroid Build Coastguard Worker 
487*e1eccf28SAndroid Build Coastguard Worker         mExecutable = ScriptExecutable::createFromSharedObject(
488*e1eccf28SAndroid Build Coastguard Worker             mScriptObj, checksum);
489*e1eccf28SAndroid Build Coastguard Worker 
490*e1eccf28SAndroid Build Coastguard Worker         if (mExecutable != nullptr) {
491*e1eccf28SAndroid Build Coastguard Worker             // The loaded shared library in mScriptObj has a matching checksum.
492*e1eccf28SAndroid Build Coastguard Worker             // An executable object has been created.
493*e1eccf28SAndroid Build Coastguard Worker             return;
494*e1eccf28SAndroid Build Coastguard Worker         }
495*e1eccf28SAndroid Build Coastguard Worker 
496*e1eccf28SAndroid Build Coastguard Worker         ALOGV("Failed to create an executable object from so file due to "
497*e1eccf28SAndroid Build Coastguard Worker               "mismatching checksum");
498*e1eccf28SAndroid Build Coastguard Worker 
499*e1eccf28SAndroid Build Coastguard Worker         if (alreadyLoaded) {
500*e1eccf28SAndroid Build Coastguard Worker             // The shared object found in code cache has already been loaded.
501*e1eccf28SAndroid Build Coastguard Worker             // A different file name is needed for the new shared library, to
502*e1eccf28SAndroid Build Coastguard Worker             // avoid corrupting the currently loaded instance.
503*e1eccf28SAndroid Build Coastguard Worker 
504*e1eccf28SAndroid Build Coastguard Worker             cloneName.append(resName);
505*e1eccf28SAndroid Build Coastguard Worker             cloneName.append("#");
506*e1eccf28SAndroid Build Coastguard Worker             cloneName.append(SharedLibraryUtils::getRandomString(6).c_str());
507*e1eccf28SAndroid Build Coastguard Worker 
508*e1eccf28SAndroid Build Coastguard Worker             // The last element in arguments is the output filename.
509*e1eccf28SAndroid Build Coastguard Worker             arguments.pop_back();
510*e1eccf28SAndroid Build Coastguard Worker             arguments.push_back(cloneName.c_str());
511*e1eccf28SAndroid Build Coastguard Worker         }
512*e1eccf28SAndroid Build Coastguard Worker 
513*e1eccf28SAndroid Build Coastguard Worker         dlclose(mScriptObj);
514*e1eccf28SAndroid Build Coastguard Worker         mScriptObj = nullptr;
515*e1eccf28SAndroid Build Coastguard Worker     }
516*e1eccf28SAndroid Build Coastguard Worker 
517*e1eccf28SAndroid Build Coastguard Worker     //===--------------------------------------------------------------------===//
518*e1eccf28SAndroid Build Coastguard Worker     // Fuse the input kernels and generate native code in an object file
519*e1eccf28SAndroid Build Coastguard Worker     //===--------------------------------------------------------------------===//
520*e1eccf28SAndroid Build Coastguard Worker 
521*e1eccf28SAndroid Build Coastguard Worker     arguments.push_back("-build-checksum");
522*e1eccf28SAndroid Build Coastguard Worker     arguments.push_back(checksumStr.c_str());
523*e1eccf28SAndroid Build Coastguard Worker     arguments.push_back(nullptr);
524*e1eccf28SAndroid Build Coastguard Worker 
525*e1eccf28SAndroid Build Coastguard Worker     bool compiled = rsuExecuteCommand(RsdCpuScriptImpl::BCC_EXE_PATH,
526*e1eccf28SAndroid Build Coastguard Worker                                       arguments.size()-1,
527*e1eccf28SAndroid Build Coastguard Worker                                       arguments.data());
528*e1eccf28SAndroid Build Coastguard Worker     if (!compiled) {
529*e1eccf28SAndroid Build Coastguard Worker         return;
530*e1eccf28SAndroid Build Coastguard Worker     }
531*e1eccf28SAndroid Build Coastguard Worker 
532*e1eccf28SAndroid Build Coastguard Worker     //===--------------------------------------------------------------------===//
533*e1eccf28SAndroid Build Coastguard Worker     // Create and load the shared lib
534*e1eccf28SAndroid Build Coastguard Worker     //===--------------------------------------------------------------------===//
535*e1eccf28SAndroid Build Coastguard Worker 
536*e1eccf28SAndroid Build Coastguard Worker     std::string SOPath;
537*e1eccf28SAndroid Build Coastguard Worker 
538*e1eccf28SAndroid Build Coastguard Worker     if (!SharedLibraryUtils::createSharedLibrary(
539*e1eccf28SAndroid Build Coastguard Worker             getCpuRefImpl()->getContext()->getDriverName(), cacheDir, resName,
540*e1eccf28SAndroid Build Coastguard Worker             reuse, &SOPath)) {
541*e1eccf28SAndroid Build Coastguard Worker         ALOGE("Failed to link object file '%s'", resName);
542*e1eccf28SAndroid Build Coastguard Worker         unlink(objFilePath.c_str());
543*e1eccf28SAndroid Build Coastguard Worker         return;
544*e1eccf28SAndroid Build Coastguard Worker     }
545*e1eccf28SAndroid Build Coastguard Worker 
546*e1eccf28SAndroid Build Coastguard Worker     unlink(objFilePath.c_str());
547*e1eccf28SAndroid Build Coastguard Worker 
548*e1eccf28SAndroid Build Coastguard Worker     if (reuse) {
549*e1eccf28SAndroid Build Coastguard Worker         mScriptObj = SharedLibraryUtils::loadSharedLibrary(cacheDir, resName);
550*e1eccf28SAndroid Build Coastguard Worker     } else {
551*e1eccf28SAndroid Build Coastguard Worker         mScriptObj = SharedLibraryUtils::loadAndDeleteSharedLibrary(SOPath.c_str());
552*e1eccf28SAndroid Build Coastguard Worker     }
553*e1eccf28SAndroid Build Coastguard Worker     if (mScriptObj == nullptr) {
554*e1eccf28SAndroid Build Coastguard Worker         ALOGE("Unable to load '%s'", resName);
555*e1eccf28SAndroid Build Coastguard Worker         return;
556*e1eccf28SAndroid Build Coastguard Worker     }
557*e1eccf28SAndroid Build Coastguard Worker 
558*e1eccf28SAndroid Build Coastguard Worker     if (alreadyLoaded) {
559*e1eccf28SAndroid Build Coastguard Worker         // Delete the temporary, random-named file that we created to avoid
560*e1eccf28SAndroid Build Coastguard Worker         // interfering with an already loaded shared library.
561*e1eccf28SAndroid Build Coastguard Worker         string cloneFilePath(cacheDir);
562*e1eccf28SAndroid Build Coastguard Worker         cloneFilePath.append("/");
563*e1eccf28SAndroid Build Coastguard Worker         cloneFilePath.append(cloneName.c_str());
564*e1eccf28SAndroid Build Coastguard Worker         cloneFilePath.append(".so");
565*e1eccf28SAndroid Build Coastguard Worker         unlink(cloneFilePath.c_str());
566*e1eccf28SAndroid Build Coastguard Worker     }
567*e1eccf28SAndroid Build Coastguard Worker 
568*e1eccf28SAndroid Build Coastguard Worker     mExecutable = ScriptExecutable::createFromSharedObject(mScriptObj);
569*e1eccf28SAndroid Build Coastguard Worker 
570*e1eccf28SAndroid Build Coastguard Worker #endif  // RS_COMPATIBILITY_LIB
571*e1eccf28SAndroid Build Coastguard Worker }
572*e1eccf28SAndroid Build Coastguard Worker 
execute()573*e1eccf28SAndroid Build Coastguard Worker void CpuScriptGroup2Impl::execute() {
574*e1eccf28SAndroid Build Coastguard Worker     for (auto batch : mBatches) {
575*e1eccf28SAndroid Build Coastguard Worker         batch->setGlobalsForBatch();
576*e1eccf28SAndroid Build Coastguard Worker         batch->run();
577*e1eccf28SAndroid Build Coastguard Worker     }
578*e1eccf28SAndroid Build Coastguard Worker }
579*e1eccf28SAndroid Build Coastguard Worker 
setGlobalsForBatch()580*e1eccf28SAndroid Build Coastguard Worker void Batch::setGlobalsForBatch() {
581*e1eccf28SAndroid Build Coastguard Worker     for (CPUClosure* cpuClosure : mClosures) {
582*e1eccf28SAndroid Build Coastguard Worker         const Closure* closure = cpuClosure->mClosure;
583*e1eccf28SAndroid Build Coastguard Worker         const IDBase* funcID = closure->mFunctionID.get();
584*e1eccf28SAndroid Build Coastguard Worker         Script* s = funcID->mScript;;
585*e1eccf28SAndroid Build Coastguard Worker         for (const auto& p : closure->mGlobals) {
586*e1eccf28SAndroid Build Coastguard Worker             const int64_t value = p.second.first;
587*e1eccf28SAndroid Build Coastguard Worker             int size = p.second.second;
588*e1eccf28SAndroid Build Coastguard Worker             if (value == 0 && size == 0) {
589*e1eccf28SAndroid Build Coastguard Worker                 // This indicates the current closure depends on another closure for a
590*e1eccf28SAndroid Build Coastguard Worker                 // global in their shared module (script). In this case we don't need to
591*e1eccf28SAndroid Build Coastguard Worker                 // copy the value. For example, an invoke intializes a global variable
592*e1eccf28SAndroid Build Coastguard Worker                 // which a kernel later reads.
593*e1eccf28SAndroid Build Coastguard Worker                 continue;
594*e1eccf28SAndroid Build Coastguard Worker             }
595*e1eccf28SAndroid Build Coastguard Worker             rsAssert(p.first != nullptr);
596*e1eccf28SAndroid Build Coastguard Worker             Script* script = p.first->mScript;
597*e1eccf28SAndroid Build Coastguard Worker             rsAssert(script == s);
598*e1eccf28SAndroid Build Coastguard Worker             RsdCpuReferenceImpl* ctxt = mGroup->getCpuRefImpl();
599*e1eccf28SAndroid Build Coastguard Worker             const RsdCpuScriptImpl *cpuScript =
600*e1eccf28SAndroid Build Coastguard Worker                     (const RsdCpuScriptImpl *)ctxt->lookupScript(script);
601*e1eccf28SAndroid Build Coastguard Worker             int slot = p.first->mSlot;
602*e1eccf28SAndroid Build Coastguard Worker             ScriptExecutable* exec = mGroup->getExecutable();
603*e1eccf28SAndroid Build Coastguard Worker             if (exec != nullptr) {
604*e1eccf28SAndroid Build Coastguard Worker                 const char* varName = cpuScript->getFieldName(slot);
605*e1eccf28SAndroid Build Coastguard Worker                 void* addr = exec->getFieldAddress(varName);
606*e1eccf28SAndroid Build Coastguard Worker                 if (size < 0) {
607*e1eccf28SAndroid Build Coastguard Worker                     rsrSetObject(mGroup->getCpuRefImpl()->getContext(),
608*e1eccf28SAndroid Build Coastguard Worker                                  (rs_object_base*)addr, (ObjectBase*)value);
609*e1eccf28SAndroid Build Coastguard Worker                 } else {
610*e1eccf28SAndroid Build Coastguard Worker                     memcpy(addr, (const void*)&value, size);
611*e1eccf28SAndroid Build Coastguard Worker                 }
612*e1eccf28SAndroid Build Coastguard Worker             } else {
613*e1eccf28SAndroid Build Coastguard Worker                 // We use -1 size to indicate an ObjectBase rather than a primitive type
614*e1eccf28SAndroid Build Coastguard Worker                 if (size < 0) {
615*e1eccf28SAndroid Build Coastguard Worker                     s->setVarObj(slot, (ObjectBase*)value);
616*e1eccf28SAndroid Build Coastguard Worker                 } else {
617*e1eccf28SAndroid Build Coastguard Worker                     s->setVar(slot, (const void*)&value, size);
618*e1eccf28SAndroid Build Coastguard Worker                 }
619*e1eccf28SAndroid Build Coastguard Worker             }
620*e1eccf28SAndroid Build Coastguard Worker         }
621*e1eccf28SAndroid Build Coastguard Worker     }
622*e1eccf28SAndroid Build Coastguard Worker }
623*e1eccf28SAndroid Build Coastguard Worker 
run()624*e1eccf28SAndroid Build Coastguard Worker void Batch::run() {
625*e1eccf28SAndroid Build Coastguard Worker     if (!mClosures.front()->mClosure->mIsKernel) {
626*e1eccf28SAndroid Build Coastguard Worker         rsAssert(mClosures.size() == 1);
627*e1eccf28SAndroid Build Coastguard Worker 
628*e1eccf28SAndroid Build Coastguard Worker         // This batch contains a single closure for an invoke function
629*e1eccf28SAndroid Build Coastguard Worker         CPUClosure* cc = mClosures.front();
630*e1eccf28SAndroid Build Coastguard Worker         const Closure* c = cc->mClosure;
631*e1eccf28SAndroid Build Coastguard Worker 
632*e1eccf28SAndroid Build Coastguard Worker         if (mFunc != nullptr) {
633*e1eccf28SAndroid Build Coastguard Worker             // TODO: Need align pointers for x86_64.
634*e1eccf28SAndroid Build Coastguard Worker             // See RsdCpuScriptImpl::invokeFunction in rsCpuScript.cpp
635*e1eccf28SAndroid Build Coastguard Worker             ((InvokeFuncTy)mFunc)(c->mParams, c->mParamLength);
636*e1eccf28SAndroid Build Coastguard Worker         } else {
637*e1eccf28SAndroid Build Coastguard Worker             const ScriptInvokeID* invokeID = (const ScriptInvokeID*)c->mFunctionID.get();
638*e1eccf28SAndroid Build Coastguard Worker             rsAssert(invokeID != nullptr);
639*e1eccf28SAndroid Build Coastguard Worker             cc->mSi->invokeFunction(invokeID->mSlot, c->mParams, c->mParamLength);
640*e1eccf28SAndroid Build Coastguard Worker         }
641*e1eccf28SAndroid Build Coastguard Worker 
642*e1eccf28SAndroid Build Coastguard Worker         return;
643*e1eccf28SAndroid Build Coastguard Worker     }
644*e1eccf28SAndroid Build Coastguard Worker 
645*e1eccf28SAndroid Build Coastguard Worker     if (mFunc != nullptr) {
646*e1eccf28SAndroid Build Coastguard Worker         MTLaunchStructForEach mtls;
647*e1eccf28SAndroid Build Coastguard Worker         const CPUClosure* firstCpuClosure = mClosures.front();
648*e1eccf28SAndroid Build Coastguard Worker         const CPUClosure* lastCpuClosure = mClosures.back();
649*e1eccf28SAndroid Build Coastguard Worker 
650*e1eccf28SAndroid Build Coastguard Worker         firstCpuClosure->mSi->forEachMtlsSetup(
651*e1eccf28SAndroid Build Coastguard Worker                 (const Allocation**)firstCpuClosure->mClosure->mArgs,
652*e1eccf28SAndroid Build Coastguard Worker                 firstCpuClosure->mClosure->mNumArg,
653*e1eccf28SAndroid Build Coastguard Worker                 lastCpuClosure->mClosure->mReturnValue,
654*e1eccf28SAndroid Build Coastguard Worker                 nullptr, 0, nullptr, &mtls);
655*e1eccf28SAndroid Build Coastguard Worker 
656*e1eccf28SAndroid Build Coastguard Worker         mtls.script = nullptr;
657*e1eccf28SAndroid Build Coastguard Worker         mtls.fep.usr = nullptr;
658*e1eccf28SAndroid Build Coastguard Worker         mtls.kernel = (ForEachFunc_t)mFunc;
659*e1eccf28SAndroid Build Coastguard Worker 
660*e1eccf28SAndroid Build Coastguard Worker         mGroup->getCpuRefImpl()->launchForEach(
661*e1eccf28SAndroid Build Coastguard Worker                 (const Allocation**)firstCpuClosure->mClosure->mArgs,
662*e1eccf28SAndroid Build Coastguard Worker                 firstCpuClosure->mClosure->mNumArg,
663*e1eccf28SAndroid Build Coastguard Worker                 lastCpuClosure->mClosure->mReturnValue,
664*e1eccf28SAndroid Build Coastguard Worker                 nullptr, &mtls);
665*e1eccf28SAndroid Build Coastguard Worker 
666*e1eccf28SAndroid Build Coastguard Worker         return;
667*e1eccf28SAndroid Build Coastguard Worker     }
668*e1eccf28SAndroid Build Coastguard Worker 
669*e1eccf28SAndroid Build Coastguard Worker     for (CPUClosure* cpuClosure : mClosures) {
670*e1eccf28SAndroid Build Coastguard Worker         const Closure* closure = cpuClosure->mClosure;
671*e1eccf28SAndroid Build Coastguard Worker         const ScriptKernelID* kernelID =
672*e1eccf28SAndroid Build Coastguard Worker                 (const ScriptKernelID*)closure->mFunctionID.get();
673*e1eccf28SAndroid Build Coastguard Worker         cpuClosure->mSi->preLaunch(kernelID->mSlot,
674*e1eccf28SAndroid Build Coastguard Worker                                    (const Allocation**)closure->mArgs,
675*e1eccf28SAndroid Build Coastguard Worker                                    closure->mNumArg, closure->mReturnValue,
676*e1eccf28SAndroid Build Coastguard Worker                                    nullptr, 0, nullptr);
677*e1eccf28SAndroid Build Coastguard Worker     }
678*e1eccf28SAndroid Build Coastguard Worker 
679*e1eccf28SAndroid Build Coastguard Worker     const CPUClosure* cpuClosure = mClosures.front();
680*e1eccf28SAndroid Build Coastguard Worker     const Closure* closure = cpuClosure->mClosure;
681*e1eccf28SAndroid Build Coastguard Worker     MTLaunchStructForEach mtls;
682*e1eccf28SAndroid Build Coastguard Worker 
683*e1eccf28SAndroid Build Coastguard Worker     if (cpuClosure->mSi->forEachMtlsSetup((const Allocation**)closure->mArgs,
684*e1eccf28SAndroid Build Coastguard Worker                                           closure->mNumArg,
685*e1eccf28SAndroid Build Coastguard Worker                                           closure->mReturnValue,
686*e1eccf28SAndroid Build Coastguard Worker                                           nullptr, 0, nullptr, &mtls)) {
687*e1eccf28SAndroid Build Coastguard Worker 
688*e1eccf28SAndroid Build Coastguard Worker         mtls.script = nullptr;
689*e1eccf28SAndroid Build Coastguard Worker         mtls.kernel = &groupRoot;
690*e1eccf28SAndroid Build Coastguard Worker         mtls.fep.usr = &mClosures;
691*e1eccf28SAndroid Build Coastguard Worker 
692*e1eccf28SAndroid Build Coastguard Worker         mGroup->getCpuRefImpl()->launchForEach(nullptr, 0, nullptr, nullptr, &mtls);
693*e1eccf28SAndroid Build Coastguard Worker     }
694*e1eccf28SAndroid Build Coastguard Worker 
695*e1eccf28SAndroid Build Coastguard Worker     for (CPUClosure* cpuClosure : mClosures) {
696*e1eccf28SAndroid Build Coastguard Worker         const Closure* closure = cpuClosure->mClosure;
697*e1eccf28SAndroid Build Coastguard Worker         const ScriptKernelID* kernelID =
698*e1eccf28SAndroid Build Coastguard Worker                 (const ScriptKernelID*)closure->mFunctionID.get();
699*e1eccf28SAndroid Build Coastguard Worker         cpuClosure->mSi->postLaunch(kernelID->mSlot,
700*e1eccf28SAndroid Build Coastguard Worker                                     (const Allocation**)closure->mArgs,
701*e1eccf28SAndroid Build Coastguard Worker                                     closure->mNumArg, closure->mReturnValue,
702*e1eccf28SAndroid Build Coastguard Worker                                     nullptr, 0, nullptr);
703*e1eccf28SAndroid Build Coastguard Worker     }
704*e1eccf28SAndroid Build Coastguard Worker }
705*e1eccf28SAndroid Build Coastguard Worker 
706*e1eccf28SAndroid Build Coastguard Worker }  // namespace renderscript
707*e1eccf28SAndroid Build Coastguard Worker }  // namespace android
708