RSCompilerDriver.cpp revision 8486498c5f6083b8ab0f7aebb1944eaed33bd290
10dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh/*
20dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * Copyright 2012, The Android Open Source Project
30dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh *
40dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * Licensed under the Apache License, Version 2.0 (the "License");
50dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * you may not use this file except in compliance with the License.
60dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * You may obtain a copy of the License at
70dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh *
80dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh *     http://www.apache.org/licenses/LICENSE-2.0
90dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh *
100dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * Unless required by applicable law or agreed to in writing, software
110dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * distributed under the License is distributed on an "AS IS" BASIS,
120dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
130dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * See the License for the specific language governing permissions and
140dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh * limitations under the License.
150dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh */
160dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh
170dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "bcc/RSCompilerDriver.h"
180dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh
190dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "Assert.h"
200dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "FileMutex.h"
210dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "InputFile.h"
220dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "Log.h"
23ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "OutputFile.h"
24ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "RSScriptGroupFusion.h"
25ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh
26ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "bcc/BCCContext.h"
27ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "bcc/Compiler.h"
28ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "bcc/CompilerConfig.h"
29ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "bcc/Config.h"
30ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "bcc/Initialization.h"
31ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "bcc/Script.h"
32ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include "bcc/Source.h"
330dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "bcinfo/BitcodeWrapper.h"
340dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "bcinfo/MetadataExtractor.h"
350dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh
360dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "llvm/ADT/STLExtras.h"
37c360382bf257d815b2a411152485d3c3b37a9f46Yin-Chia Yeh#include "llvm/IR/AssemblyAnnotationWriter.h"
38d56db1d2bee182d1851097a9c712712fc094d117Eino-Ville Talvala#include <llvm/IR/Module.h>
390dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include "llvm/Linker/Linker.h"
400dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include <llvm/Support/CommandLine.h>
4102bf03287652923b5bb5316667b065423565d6b4Eino-Ville Talvala#include <llvm/Support/Path.h>
420dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include <llvm/Support/raw_ostream.h>
430dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include <llvm/Target/TargetMachine.h>
440dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh
450dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include <sstream>
46ead9146f844ee194a4f4244ba8ae1a3aece12b63Yin-Chia Yeh#include <string>
470dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh
480dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#ifdef __ANDROID__
490dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include <cutils/properties.h>
500dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#endif
510dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh#include <utils/StopWatch.h>
528aac03f4d6c66749803d5708086ba5f509aa88c6Yin-Chia Yeh
530dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yehusing namespace bcc;
540dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh
550dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia YehRSCompilerDriver::RSCompilerDriver() :
560dea57fd9fc4b2ccaab97d9477359fbd5a626f5cYin-Chia Yeh    mConfig(nullptr), mCompiler(), mDebugContext(false),
57    mLinkRuntimeCallback(nullptr), mEnableGlobalMerge(true),
58    mEmbedGlobalInfo(false), mEmbedGlobalInfoSkipConstant(false) {
59  init::Initialize();
60}
61
62RSCompilerDriver::~RSCompilerDriver() {
63  delete mConfig;
64}
65
66
67#if defined(PROVIDE_ARM_CODEGEN)
68extern llvm::cl::opt<bool> EnableGlobalMerge;
69#endif
70
71bool RSCompilerDriver::setupConfig(const Script &pScript) {
72  bool changed = false;
73
74  const llvm::CodeGenOpt::Level script_opt_level = pScript.getOptimizationLevel();
75
76#if defined(PROVIDE_ARM_CODEGEN)
77  EnableGlobalMerge = mEnableGlobalMerge;
78#endif
79
80  if (mConfig != nullptr) {
81    // Renderscript bitcode may have their optimization flag configuration
82    // different than the previous run of RS compilation.
83    if (mConfig->getOptimizationLevel() != script_opt_level) {
84      mConfig->setOptimizationLevel(script_opt_level);
85      changed = true;
86    }
87  } else {
88    // Haven't run the compiler ever.
89    mConfig = new (std::nothrow) CompilerConfig(DEFAULT_TARGET_TRIPLE_STRING);
90    if (mConfig == nullptr) {
91      // Return false since mConfig remains NULL and out-of-memory.
92      return false;
93    }
94    mConfig->setOptimizationLevel(script_opt_level);
95    changed = true;
96  }
97
98#if defined(PROVIDE_ARM_CODEGEN)
99  bcinfo::MetadataExtractor me(&pScript.getSource().getModule());
100  if (!me.extract()) {
101    bccAssert("Could not extract RS pragma metadata for module!");
102  }
103
104  bool script_full_prec = (me.getRSFloatPrecision() == bcinfo::RS_FP_Full);
105  if (mConfig->getFullPrecision() != script_full_prec) {
106    mConfig->setFullPrecision(script_full_prec);
107    changed = true;
108  }
109#endif
110
111  return changed;
112}
113
114Compiler::ErrorCode RSCompilerDriver::compileScript(Script& pScript, const char* pScriptName,
115                                                    const char* pOutputPath,
116                                                    const char* pRuntimePath,
117                                                    const char* pBuildChecksum,
118                                                    bool pDumpIR) {
119  // embed build checksum metadata into the source
120  if (pBuildChecksum != nullptr && strlen(pBuildChecksum) > 0) {
121    pScript.getSource().addBuildChecksumMetadata(pBuildChecksum);
122  }
123
124  // Verify that the only external functions in pScript are Renderscript
125  // functions.  Fail if verification returns an error.
126  if (mCompiler.screenGlobalFunctions(pScript) != Compiler::kSuccess) {
127    return Compiler::kErrInvalidSource;
128  }
129
130  // For (32-bit) x86, translate GEPs on structs or arrays of structs to GEPs on
131  // int8* with byte offsets.  This is to ensure that layout of structs with
132  // 64-bit scalar fields matches frontend-generated code that adheres to ARM
133  // data layout.
134  //
135  // The translation is done before RenderScript runtime library is linked
136  // (during LinkRuntime below) to ensure that RenderScript-driver-provided
137  // structs (like Allocation_t) don't get forced into using the ARM layout
138  // rules.
139  if (mCompiler.getTargetMachine().getTargetTriple().getArch() == llvm::Triple::x86) {
140    mCompiler.translateGEPs(pScript);
141  }
142
143  //===--------------------------------------------------------------------===//
144  // Link RS script with Renderscript runtime.
145  //===--------------------------------------------------------------------===//
146  if (!pScript.LinkRuntime(pRuntimePath)) {
147    ALOGE("Failed to link script '%s' with Renderscript runtime %s!",
148          pScriptName, pRuntimePath);
149    return Compiler::kErrInvalidSource;
150  }
151
152  {
153    // FIXME(srhines): Windows compilation can't use locking like this, but
154    // we also don't need to worry about concurrent writers of the same file.
155#ifndef _WIN32
156    //===------------------------------------------------------------------===//
157    // Acquire the write lock for writing output object file.
158    //===------------------------------------------------------------------===//
159    FileMutex write_output_mutex(pOutputPath);
160
161    if (write_output_mutex.hasError() || !write_output_mutex.lockMutex()) {
162      ALOGE("Unable to acquire the lock for writing %s! (%s)",
163            pOutputPath, write_output_mutex.getErrorMessage().c_str());
164      return Compiler::kErrInvalidSource;
165    }
166#endif
167
168    // Open the output file for write.
169    OutputFile output_file(pOutputPath,
170                           FileBase::kTruncate | FileBase::kBinary);
171
172    if (output_file.hasError()) {
173        ALOGE("Unable to open %s for write! (%s)", pOutputPath,
174              output_file.getErrorMessage().c_str());
175      return Compiler::kErrInvalidSource;
176    }
177
178    // Setup the config to the compiler.
179    bool compiler_need_reconfigure = setupConfig(pScript);
180
181    if (mConfig == nullptr) {
182      ALOGE("Failed to setup config for RS compiler to compile %s!",
183            pOutputPath);
184      return Compiler::kErrInvalidSource;
185    }
186
187    if (compiler_need_reconfigure) {
188      Compiler::ErrorCode err = mCompiler.config(*mConfig);
189      if (err != Compiler::kSuccess) {
190        ALOGE("Failed to config the RS compiler for %s! (%s)",pOutputPath,
191              Compiler::GetErrorString(err));
192        return Compiler::kErrInvalidSource;
193      }
194    }
195
196    OutputFile *ir_file = nullptr;
197    llvm::raw_fd_ostream *IRStream = nullptr;
198    if (pDumpIR) {
199      std::string path(pOutputPath);
200      path.append(".ll");
201      ir_file = new OutputFile(path.c_str(), FileBase::kTruncate);
202      IRStream = ir_file->dup();
203    }
204
205    // Run the compiler.
206    Compiler::ErrorCode compile_result =
207        mCompiler.compile(pScript, output_file, IRStream);
208
209    if (ir_file) {
210      ir_file->close();
211      delete ir_file;
212    }
213
214    if (compile_result != Compiler::kSuccess) {
215      ALOGE("Unable to compile the source to file %s! (%s)", pOutputPath,
216            Compiler::GetErrorString(compile_result));
217      return Compiler::kErrInvalidSource;
218    }
219  }
220
221  return Compiler::kSuccess;
222}
223
224bool RSCompilerDriver::build(BCCContext &pContext,
225                             const char *pCacheDir,
226                             const char *pResName,
227                             const char *pBitcode,
228                             size_t pBitcodeSize,
229                             const char *pBuildChecksum,
230                             const char *pRuntimePath,
231                             RSLinkRuntimeCallback pLinkRuntimeCallback,
232                             bool pDumpIR) {
233    //  android::StopWatch build_time("bcc: RSCompilerDriver::build time");
234  //===--------------------------------------------------------------------===//
235  // Check parameters.
236  //===--------------------------------------------------------------------===//
237  if ((pCacheDir == nullptr) || (pResName == nullptr)) {
238    ALOGE("Invalid parameter passed to RSCompilerDriver::build()! (cache dir: "
239          "%s, resource name: %s)", ((pCacheDir) ? pCacheDir : "(null)"),
240                                    ((pResName) ? pResName : "(null)"));
241    return false;
242  }
243
244  if ((pBitcode == nullptr) || (pBitcodeSize <= 0)) {
245    ALOGE("No bitcode supplied! (bitcode: %p, size of bitcode: %u)",
246          pBitcode, static_cast<unsigned>(pBitcodeSize));
247    return false;
248  }
249
250  //===--------------------------------------------------------------------===//
251  // Construct output path.
252  // {pCacheDir}/{pResName}.o
253  //===--------------------------------------------------------------------===//
254  llvm::SmallString<80> output_path(pCacheDir);
255  llvm::sys::path::append(output_path, pResName);
256  llvm::sys::path::replace_extension(output_path, ".o");
257
258  //===--------------------------------------------------------------------===//
259  // Load the bitcode and create script.
260  //===--------------------------------------------------------------------===//
261  Source *source = Source::CreateFromBuffer(pContext, pResName,
262                                            pBitcode, pBitcodeSize);
263  if (source == nullptr) {
264    return false;
265  }
266
267  Script script(source);
268  script.setOptimizationLevel(getConfig()->getOptimizationLevel());
269  if (pLinkRuntimeCallback) {
270    setLinkRuntimeCallback(pLinkRuntimeCallback);
271  }
272
273  script.setLinkRuntimeCallback(getLinkRuntimeCallback());
274
275  script.setEmbedGlobalInfo(mEmbedGlobalInfo);
276  script.setEmbedGlobalInfoSkipConstant(mEmbedGlobalInfoSkipConstant);
277
278  // Read information from bitcode wrapper.
279  bcinfo::BitcodeWrapper wrapper(pBitcode, pBitcodeSize);
280  script.setOptimizationLevel(static_cast<llvm::CodeGenOpt::Level>(
281                              wrapper.getOptimizationLevel()));
282
283// Assertion-enabled builds can't compile legacy bitcode (due to the use of
284// getName() with anonymous structure definitions).
285#ifdef _DEBUG
286  static const uint32_t kSlangMinimumFixedStructureNames = 2310;
287  uint32_t version = wrapper.getCompilerVersion();
288  if (version < kSlangMinimumFixedStructureNames) {
289    ALOGE("Found invalid legacy bitcode compiled with a version %u llvm-rs-cc "
290          "used with an assertion build", version);
291    ALOGE("Please recompile this apk with a more recent llvm-rs-cc "
292          "(at least %u)", kSlangMinimumFixedStructureNames);
293    return false;
294  }
295#endif
296
297  //===--------------------------------------------------------------------===//
298  // Compile the script
299  //===--------------------------------------------------------------------===//
300  Compiler::ErrorCode status = compileScript(script, pResName,
301                                             output_path.c_str(),
302                                             pRuntimePath,
303                                             pBuildChecksum,
304                                             pDumpIR);
305
306  return status == Compiler::kSuccess;
307}
308
309bool RSCompilerDriver::buildScriptGroup(
310    BCCContext& Context, const char* pOutputFilepath, const char* pRuntimePath,
311    const char* pRuntimeRelaxedPath, bool dumpIR, const char* buildChecksum,
312    const std::vector<Source*>& sources,
313    const std::list<std::list<std::pair<int, int>>>& toFuse,
314    const std::list<std::string>& fused,
315    const std::list<std::list<std::pair<int, int>>>& invokes,
316    const std::list<std::string>& invokeBatchNames) {
317
318  // Read and store metadata before linking the modules together
319  std::vector<bcinfo::MetadataExtractor*> metadata;
320  for (Source* source : sources) {
321    if (!source->extractMetadata()) {
322      ALOGE("Cannot extract metadata from module");
323      return false;
324    }
325  }
326
327  // ---------------------------------------------------------------------------
328  // Link all input modules into a single module
329  // ---------------------------------------------------------------------------
330
331  llvm::LLVMContext& context = Context.getLLVMContext();
332  llvm::Module module("Merged Script Group", context);
333
334  llvm::Linker linker(module);
335  for (Source* source : sources) {
336    std::unique_ptr<llvm::Module> sourceModule(&source->getModule());
337    if (linker.linkInModule(std::move(sourceModule))) {
338      ALOGE("Linking for module in source failed.");
339      return false;
340    }
341    // source->getModule() is destroyed after linking.
342    source->markModuleDestroyed();
343  }
344
345  // ---------------------------------------------------------------------------
346  // Create fused kernels
347  // ---------------------------------------------------------------------------
348
349  auto inputIter = toFuse.begin();
350  for (const std::string& nameOfFused : fused) {
351    auto inputKernels = *inputIter++;
352    std::vector<Source*> sourcesToFuse;
353    std::vector<int> slots;
354
355    for (auto p : inputKernels) {
356      sourcesToFuse.push_back(sources[p.first]);
357      slots.push_back(p.second);
358    }
359
360    if (!fuseKernels(Context, sourcesToFuse, slots, nameOfFused, &module)) {
361      return false;
362    }
363  }
364
365  // ---------------------------------------------------------------------------
366  // Rename invokes
367  // ---------------------------------------------------------------------------
368
369  auto invokeIter = invokes.begin();
370  for (const std::string& newName : invokeBatchNames) {
371    auto inputInvoke = *invokeIter++;
372    auto p = inputInvoke.front();
373    Source* source = sources[p.first];
374    int slot = p.second;
375
376    if (!renameInvoke(Context, source, slot, newName, &module)) {
377      return false;
378    }
379  }
380
381  // ---------------------------------------------------------------------------
382  // Compile the new module with fused kernels
383  // ---------------------------------------------------------------------------
384
385  const std::unique_ptr<Source> source(
386      Source::CreateFromModule(Context, pOutputFilepath, module, true));
387  Script script(source.get());
388
389  // Embed the info string directly in the ELF
390  script.setEmbedInfo(true);
391  // TODO jeanluc Should we override the config's optimization?
392  // i.e., why not script.setOptimizationLevel(getConfig()->getOptimizationLevel)?
393  script.setOptimizationLevel(llvm::CodeGenOpt::Level::Aggressive);
394  script.setEmbedGlobalInfo(mEmbedGlobalInfo);
395  script.setEmbedGlobalInfoSkipConstant(mEmbedGlobalInfoSkipConstant);
396
397  llvm::SmallString<80> output_path(pOutputFilepath);
398  llvm::sys::path::replace_extension(output_path, ".o");
399
400  // Pick the right runtime lib
401  const char* coreLibPath = pRuntimePath;
402  if (strcmp(pRuntimeRelaxedPath, "")) {
403      bcinfo::MetadataExtractor me(&module);
404      me.extract();
405      if (me.getRSFloatPrecision() == bcinfo::RS_FP_Relaxed) {
406          coreLibPath = pRuntimeRelaxedPath;
407      }
408  }
409
410  compileScript(script, pOutputFilepath, output_path.c_str(), coreLibPath,
411                buildChecksum, dumpIR);
412
413  return true;
414}
415
416bool RSCompilerDriver::buildForCompatLib(Script &pScript, const char *pOut,
417                                         const char *pBuildChecksum,
418                                         const char *pRuntimePath,
419                                         bool pDumpIR) {
420  // Embed the info string directly in the ELF, since this path is for an
421  // offline (host) compilation.
422  pScript.setEmbedInfo(true);
423
424  pScript.setEmbedGlobalInfo(mEmbedGlobalInfo);
425  pScript.setEmbedGlobalInfoSkipConstant(mEmbedGlobalInfoSkipConstant);
426  pScript.setLinkRuntimeCallback(getLinkRuntimeCallback());
427
428  Compiler::ErrorCode status = compileScript(pScript, pOut, pOut, pRuntimePath,
429                                             pBuildChecksum, pDumpIR);
430  if (status != Compiler::kSuccess) {
431    return false;
432  }
433
434  return true;
435}
436