1 /*
2  * Copyright 2012, The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *     http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #include "bcc/RSCompilerDriver.h"
18 
19 #include "Assert.h"
20 #include "FileMutex.h"
21 #include "Log.h"
22 #include "RSScriptGroupFusion.h"
23 #include "slang_version.h"
24 
25 #include "bcc/BCCContext.h"
26 #include "bcc/Compiler.h"
27 #include "bcc/CompilerConfig.h"
28 #include "bcc/Config.h"
29 #include "bcc/Initialization.h"
30 #include "bcc/Script.h"
31 #include "bcc/Source.h"
32 #include "bcinfo/BitcodeWrapper.h"
33 #include "bcinfo/MetadataExtractor.h"
34 
35 #include "llvm/ADT/STLExtras.h"
36 #include "llvm/IR/AssemblyAnnotationWriter.h"
37 #include <llvm/IR/Module.h>
38 #include "llvm/Linker/Linker.h"
39 #include <llvm/Support/CommandLine.h>
40 #include <llvm/Support/FileSystem.h>
41 #include <llvm/Support/Path.h>
42 #include <llvm/Support/raw_ostream.h>
43 #include <llvm/Target/TargetMachine.h>
44 
45 #include <sstream>
46 #include <string>
47 
48 using namespace bcc;
49 
RSCompilerDriver()50 RSCompilerDriver::RSCompilerDriver() :
51     mConfig(nullptr), mCompiler(), mDebugContext(false),
52     mLinkRuntimeCallback(nullptr), mEnableGlobalMerge(true),
53     mEmbedGlobalInfo(false), mEmbedGlobalInfoSkipConstant(false) {
54   init::Initialize();
55 }
56 
~RSCompilerDriver()57 RSCompilerDriver::~RSCompilerDriver() {
58   delete mConfig;
59 }
60 
61 
62 #if defined(PROVIDE_ARM_CODEGEN)
63 extern llvm::cl::opt<bool> EnableGlobalMerge;
64 #endif
65 
setupConfig(const Script & pScript)66 bool RSCompilerDriver::setupConfig(const Script &pScript) {
67   bool changed = false;
68 
69   const llvm::CodeGenOpt::Level script_opt_level = pScript.getOptimizationLevel();
70 
71 #if defined(PROVIDE_ARM_CODEGEN)
72   EnableGlobalMerge = mEnableGlobalMerge;
73 #endif
74 
75   if (mConfig != nullptr) {
76     // Renderscript bitcode may have their optimization flag configuration
77     // different than the previous run of RS compilation.
78     if (mConfig->getOptimizationLevel() != script_opt_level) {
79       mConfig->setOptimizationLevel(script_opt_level);
80       changed = true;
81     }
82   } else {
83     // Haven't run the compiler ever.
84     mConfig = new (std::nothrow) CompilerConfig(DEFAULT_TARGET_TRIPLE_STRING);
85     if (mConfig == nullptr) {
86       // Return false since mConfig remains NULL and out-of-memory.
87       return false;
88     }
89     mConfig->setOptimizationLevel(script_opt_level);
90     changed = true;
91   }
92 
93 #if defined(PROVIDE_ARM_CODEGEN)
94   bcinfo::MetadataExtractor me(&pScript.getSource().getModule());
95   if (!me.extract()) {
96     bccAssert("Could not extract RS pragma metadata for module!");
97   }
98 
99   bool script_full_prec = (me.getRSFloatPrecision() == bcinfo::RS_FP_Full);
100   if (mConfig->getFullPrecision() != script_full_prec) {
101     mConfig->setFullPrecision(script_full_prec);
102     changed = true;
103   }
104 #endif
105 
106   return changed;
107 }
108 
compileScript(Script & pScript,const char * pScriptName,const char * pOutputPath,const char * pRuntimePath,const char * pBuildChecksum,bool pDumpIR)109 Compiler::ErrorCode RSCompilerDriver::compileScript(Script& pScript, const char* pScriptName,
110                                                     const char* pOutputPath,
111                                                     const char* pRuntimePath,
112                                                     const char* pBuildChecksum,
113                                                     bool pDumpIR) {
114   // embed build checksum metadata into the source
115   if (pBuildChecksum != nullptr && strlen(pBuildChecksum) > 0) {
116     pScript.getSource().addBuildChecksumMetadata(pBuildChecksum);
117   }
118 
119   // Verify that the only external functions in pScript are Renderscript
120   // functions.  Fail if verification returns an error.
121   if (mCompiler.screenGlobalFunctions(pScript) != Compiler::kSuccess) {
122     return Compiler::kErrInvalidSource;
123   }
124 
125   // For (32-bit) x86, translate GEPs on structs or arrays of structs to GEPs on
126   // int8* with byte offsets.  This is to ensure that layout of structs with
127   // 64-bit scalar fields matches frontend-generated code that adheres to ARM
128   // data layout.
129   //
130   // The translation is done before RenderScript runtime library is linked
131   // (during LinkRuntime below) to ensure that RenderScript-driver-provided
132   // structs (like Allocation_t) don't get forced into using the ARM layout
133   // rules.
134   if (!pScript.isStructExplicitlyPaddedBySlang() &&
135       (mCompiler.getTargetMachine().getTargetTriple().getArch() == llvm::Triple::x86)) {
136     mCompiler.translateGEPs(pScript);
137   }
138 
139   //===--------------------------------------------------------------------===//
140   // Link RS script with Renderscript runtime.
141   //===--------------------------------------------------------------------===//
142   if (!pScript.LinkRuntime(pRuntimePath)) {
143     ALOGE("Failed to link script '%s' with Renderscript runtime %s!",
144           pScriptName, pRuntimePath);
145     return Compiler::kErrInvalidSource;
146   }
147 
148   {
149     // FIXME(srhines): Windows compilation can't use locking like this, but
150     // we also don't need to worry about concurrent writers of the same file.
151 #ifndef _WIN32
152     //===------------------------------------------------------------------===//
153     // Acquire the write lock for writing output object file.
154     //===------------------------------------------------------------------===//
155     FileMutex write_output_mutex(pOutputPath);
156 
157     if (write_output_mutex.hasError() || !write_output_mutex.lockMutex()) {
158       ALOGE("Unable to acquire the lock for writing %s! (%s)",
159             pOutputPath, write_output_mutex.getErrorMessage().c_str());
160       return Compiler::kErrInvalidOutputFileState;
161     }
162 #endif
163 
164     // Open the output file for write.
165     std::error_code error;
166     llvm::raw_fd_ostream out_stream(pOutputPath, error, llvm::sys::fs::F_RW);
167     if (error) {
168       ALOGE("Unable to open %s for write! (%s)", pOutputPath,
169             error.message().c_str());
170       return Compiler::kErrPrepareOutput;
171     }
172 
173     // Setup the config to the compiler.
174     bool compiler_need_reconfigure = setupConfig(pScript);
175 
176     if (mConfig == nullptr) {
177       ALOGE("Failed to setup config for RS compiler to compile %s!",
178             pOutputPath);
179       return Compiler::kErrInvalidSource;
180     }
181 
182     if (compiler_need_reconfigure) {
183       Compiler::ErrorCode err = mCompiler.config(*mConfig);
184       if (err != Compiler::kSuccess) {
185         ALOGE("Failed to config the RS compiler for %s! (%s)",pOutputPath,
186               Compiler::GetErrorString(err));
187         return Compiler::kErrInvalidSource;
188       }
189     }
190 
191     std::unique_ptr<llvm::raw_fd_ostream> IRStream;
192     if (pDumpIR) {
193       std::string path(pOutputPath);
194       path.append(".ll");
195       IRStream.reset(new llvm::raw_fd_ostream(
196           path.c_str(), error, llvm::sys::fs::F_RW | llvm::sys::fs::F_Text));
197       if (error) {
198         ALOGE("Unable to open %s for write! (%s)", path.c_str(),
199               error.message().c_str());
200         return Compiler::kErrPrepareOutput;
201       }
202     }
203 
204     // Run the compiler.
205     Compiler::ErrorCode compile_result =
206         mCompiler.compile(pScript, out_stream, IRStream.get());
207 
208     if (compile_result != Compiler::kSuccess) {
209       ALOGE("Unable to compile the source to file %s! (%s)", pOutputPath,
210             Compiler::GetErrorString(compile_result));
211       return Compiler::kErrInvalidSource;
212     }
213   }
214 
215   return Compiler::kSuccess;
216 }
217 
build(BCCContext & pContext,const char * pCacheDir,const char * pResName,const char * pBitcode,size_t pBitcodeSize,const char * pBuildChecksum,const char * pRuntimePath,RSLinkRuntimeCallback pLinkRuntimeCallback,bool pDumpIR)218 bool RSCompilerDriver::build(BCCContext &pContext,
219                              const char *pCacheDir,
220                              const char *pResName,
221                              const char *pBitcode,
222                              size_t pBitcodeSize,
223                              const char *pBuildChecksum,
224                              const char *pRuntimePath,
225                              RSLinkRuntimeCallback pLinkRuntimeCallback,
226                              bool pDumpIR) {
227     //  android::StopWatch build_time("bcc: RSCompilerDriver::build time");
228   //===--------------------------------------------------------------------===//
229   // Check parameters.
230   //===--------------------------------------------------------------------===//
231   if ((pCacheDir == nullptr) || (pResName == nullptr)) {
232     ALOGE("Invalid parameter passed to RSCompilerDriver::build()! (cache dir: "
233           "%s, resource name: %s)", ((pCacheDir) ? pCacheDir : "(null)"),
234                                     ((pResName) ? pResName : "(null)"));
235     return false;
236   }
237 
238   if ((pBitcode == nullptr) || (pBitcodeSize <= 0)) {
239     ALOGE("No bitcode supplied! (bitcode: %p, size of bitcode: %u)",
240           pBitcode, static_cast<unsigned>(pBitcodeSize));
241     return false;
242   }
243 
244   //===--------------------------------------------------------------------===//
245   // Construct output path.
246   // {pCacheDir}/{pResName}.o
247   //===--------------------------------------------------------------------===//
248   llvm::SmallString<80> output_path(pCacheDir);
249   llvm::sys::path::append(output_path, pResName);
250   llvm::sys::path::replace_extension(output_path, ".o");
251 
252   //===--------------------------------------------------------------------===//
253   // Load the bitcode and create script.
254   //===--------------------------------------------------------------------===//
255   Source *source = Source::CreateFromBuffer(pContext, pResName,
256                                             pBitcode, pBitcodeSize);
257   if (source == nullptr) {
258     return false;
259   }
260 
261   Script script(source);
262   script.setOptimizationLevel(getConfig()->getOptimizationLevel());
263   if (pLinkRuntimeCallback) {
264     setLinkRuntimeCallback(pLinkRuntimeCallback);
265   }
266 
267   script.setLinkRuntimeCallback(getLinkRuntimeCallback());
268 
269   script.setEmbedGlobalInfo(mEmbedGlobalInfo);
270   script.setEmbedGlobalInfoSkipConstant(mEmbedGlobalInfoSkipConstant);
271 
272   // Read optimization level from bitcode wrapper.
273   bcinfo::BitcodeWrapper wrapper(pBitcode, pBitcodeSize);
274   script.setOptimizationLevel(static_cast<llvm::CodeGenOpt::Level>(
275                               wrapper.getOptimizationLevel()));
276 
277 // Assertion-enabled builds can't compile legacy bitcode (due to the use of
278 // getName() with anonymous structure definitions).
279 #ifdef _DEBUG
280   static const uint32_t kSlangMinimumFixedStructureNames = SlangVersion::M_RS_OBJECT;
281   uint32_t version = wrapper.getCompilerVersion();
282   if (version < kSlangMinimumFixedStructureNames) {
283     ALOGE("Found invalid legacy bitcode compiled with a version %u llvm-rs-cc "
284           "used with an assertion build", version);
285     ALOGE("Please recompile this apk with a more recent llvm-rs-cc "
286           "(at least %u)", kSlangMinimumFixedStructureNames);
287     return false;
288   }
289 #endif
290 
291   //===--------------------------------------------------------------------===//
292   // Compile the script
293   //===--------------------------------------------------------------------===//
294   Compiler::ErrorCode status = compileScript(script, pResName,
295                                              output_path.c_str(),
296                                              pRuntimePath,
297                                              pBuildChecksum,
298                                              pDumpIR);
299 
300   return status == Compiler::kSuccess;
301 }
302 
buildScriptGroup(BCCContext & Context,const char * pOutputFilepath,const char * pRuntimePath,const char * pRuntimeRelaxedPath,bool dumpIR,const char * buildChecksum,const std::vector<Source * > & sources,const std::list<std::list<std::pair<int,int>>> & toFuse,const std::list<std::string> & fused,const std::list<std::list<std::pair<int,int>>> & invokes,const std::list<std::string> & invokeBatchNames)303 bool RSCompilerDriver::buildScriptGroup(
304     BCCContext& Context, const char* pOutputFilepath, const char* pRuntimePath,
305     const char* pRuntimeRelaxedPath, bool dumpIR, const char* buildChecksum,
306     const std::vector<Source*>& sources,
307     const std::list<std::list<std::pair<int, int>>>& toFuse,
308     const std::list<std::string>& fused,
309     const std::list<std::list<std::pair<int, int>>>& invokes,
310     const std::list<std::string>& invokeBatchNames) {
311 
312   // Read and store metadata before linking the modules together
313   std::vector<bcinfo::MetadataExtractor*> metadata;
314   for (Source* source : sources) {
315     if (!source->extractMetadata()) {
316       ALOGE("Cannot extract metadata from module");
317       return false;
318     }
319   }
320 
321   // ---------------------------------------------------------------------------
322   // Link all input modules into a single module
323   // ---------------------------------------------------------------------------
324 
325   llvm::LLVMContext& context = Context.getLLVMContext();
326   llvm::Module module("Merged Script Group", context);
327 
328   unsigned wrapperCompilerVersion = 0, wrapperOptimizationLevel = 0;
329   bool gotFirstSource = false;
330   llvm::Linker linker(module);
331   for (Source* source : sources) {
332     unsigned sourceWrapperCompilerVersion, sourceWrapperOptimizationLevel;
333     source->getWrapperInformation(&sourceWrapperCompilerVersion, &sourceWrapperOptimizationLevel);
334     if (gotFirstSource) {
335       if ((wrapperCompilerVersion != sourceWrapperCompilerVersion) ||
336           (wrapperOptimizationLevel != sourceWrapperOptimizationLevel))
337         ALOGE("ScriptGroup source files have inconsistent metadata");
338         return false;
339     } else {
340       wrapperCompilerVersion = sourceWrapperCompilerVersion;
341       wrapperOptimizationLevel = sourceWrapperOptimizationLevel;
342       gotFirstSource = true;
343     }
344     std::unique_ptr<llvm::Module> sourceModule(&source->getModule());
345     if (linker.linkInModule(std::move(sourceModule))) {
346       ALOGE("Linking for module in source failed.");
347       return false;
348     }
349     // source->getModule() is destroyed after linking.
350     source->markModuleDestroyed();
351     // linking copies metadata from source->getModule(), but we don't
352     // want the wrapper metadata (we'll be reconstructing this when we
353     // instantiate a Source instance from the new Module).
354     llvm::NamedMDNode *const wrapperMDNode =
355         module.getNamedMetadata(bcinfo::MetadataExtractor::kWrapperMetadataName);
356     bccAssert(wrapperMDNode != nullptr);
357     module.eraseNamedMetadata(wrapperMDNode);
358   }
359 
360   // ---------------------------------------------------------------------------
361   // Create fused kernels
362   // ---------------------------------------------------------------------------
363 
364   auto inputIter = toFuse.begin();
365   for (const std::string& nameOfFused : fused) {
366     auto inputKernels = *inputIter++;
367     std::vector<Source*> sourcesToFuse;
368     std::vector<int> slots;
369 
370     for (auto p : inputKernels) {
371       sourcesToFuse.push_back(sources[p.first]);
372       slots.push_back(p.second);
373     }
374 
375     if (!fuseKernels(Context, sourcesToFuse, slots, nameOfFused, &module)) {
376       return false;
377     }
378   }
379 
380   // ---------------------------------------------------------------------------
381   // Rename invokes
382   // ---------------------------------------------------------------------------
383 
384   auto invokeIter = invokes.begin();
385   for (const std::string& newName : invokeBatchNames) {
386     auto inputInvoke = *invokeIter++;
387     auto p = inputInvoke.front();
388     Source* source = sources[p.first];
389     int slot = p.second;
390 
391     if (!renameInvoke(Context, source, slot, newName, &module)) {
392       return false;
393     }
394   }
395 
396   // ---------------------------------------------------------------------------
397   // Compile the new module with fused kernels
398   // ---------------------------------------------------------------------------
399 
400   const std::unique_ptr<Source> source(
401       Source::CreateFromModule(Context, pOutputFilepath, module,
402                                wrapperCompilerVersion, wrapperOptimizationLevel,
403                                true));
404   Script script(source.get());
405 
406   // Embed the info string directly in the ELF
407   script.setEmbedInfo(true);
408   // TODO jeanluc Should we override the config's optimization?
409   // i.e., why not script.setOptimizationLevel(getConfig()->getOptimizationLevel)?
410   script.setOptimizationLevel(llvm::CodeGenOpt::Level::Aggressive);
411   script.setEmbedGlobalInfo(mEmbedGlobalInfo);
412   script.setEmbedGlobalInfoSkipConstant(mEmbedGlobalInfoSkipConstant);
413 
414   llvm::SmallString<80> output_path(pOutputFilepath);
415   llvm::sys::path::replace_extension(output_path, ".o");
416 
417   // Pick the right runtime lib
418   const char* coreLibPath = pRuntimePath;
419   if (strcmp(pRuntimeRelaxedPath, "")) {
420       bcinfo::MetadataExtractor me(&module);
421       me.extract();
422       if (me.getRSFloatPrecision() == bcinfo::RS_FP_Relaxed) {
423           coreLibPath = pRuntimeRelaxedPath;
424       }
425   }
426 
427   compileScript(script, pOutputFilepath, output_path.c_str(), coreLibPath,
428                 buildChecksum, dumpIR);
429 
430   return true;
431 }
432 
buildForCompatLib(Script & pScript,const char * pOut,const char * pBuildChecksum,const char * pRuntimePath,bool pDumpIR)433 bool RSCompilerDriver::buildForCompatLib(Script &pScript, const char *pOut,
434                                          const char *pBuildChecksum,
435                                          const char *pRuntimePath,
436                                          bool pDumpIR) {
437   // Embed the info string directly in the ELF, since this path is for an
438   // offline (host) compilation.
439   pScript.setEmbedInfo(true);
440 
441   pScript.setEmbedGlobalInfo(mEmbedGlobalInfo);
442   pScript.setEmbedGlobalInfoSkipConstant(mEmbedGlobalInfoSkipConstant);
443   pScript.setLinkRuntimeCallback(getLinkRuntimeCallback());
444 
445   Compiler::ErrorCode status = compileScript(pScript, pOut, pOut, pRuntimePath,
446                                              pBuildChecksum, pDumpIR);
447   if (status != Compiler::kSuccess) {
448     return false;
449   }
450 
451   return true;
452 }
453