/*
* Copyright 2012, The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "bcc/CompilerConfig.h"
#include "Log.h"
#include "Properties.h"
#include "bcc/Config.h"
#include <llvm/CodeGen/SchedulerRegistry.h>
#include <llvm/MC/SubtargetFeature.h>
#include <llvm/Support/Host.h>
#include <llvm/Support/TargetRegistry.h>
using namespace bcc;
#if defined (PROVIDE_X86_CODEGEN) && !defined(__HOST__)
namespace {
// Utility function to add feature flags supported by the running CPU.
// This function is only needed for on-device bcc for x86.
void AddX86NativeCPUFeatures(std::vector<std::string>* attributes) {
llvm::StringMap<bool> features;
if (llvm::sys::getHostCPUFeatures(features)) {
for (const auto& f : features)
attributes->push_back((f.second ? '+' : '-') + f.first().str());
}
// LLVM generates AVX code that treats a long3 as 256 bits, while
// RenderScript considers a long3 192 bits (http://b/28879581)
attributes->push_back("-avx");
}
}
#endif // (PROVIDE_X86_CODEGEN) && !defined(__HOST__)
// Builds a configuration for the target triple |pTriple|: installs the
// default option values below, then resolves the LLVM target and applies the
// architecture-specific settings. The results of initializeTarget() and
// initializeArch() are not inspected here.
CompilerConfig::CompilerConfig(const std::string &pTriple)
    : mTriple(pTriple), mFullPrecision(true), mTarget(nullptr) {
  // --- Target options -------------------------------------------------------
  // Use soft-float ABI. This only selects the ABI (and is applicable only to
  // ARM targets). Codegen still uses hardware FPU by default. To use software
  // floating point, add 'soft-float' feature to mFeatureString below.
  mTargetOpts.FloatABIType = llvm::FloatABI::Soft;

  // --- Code model -----------------------------------------------------------
  mCodeModel = llvm::CodeModel::Small;

  // --- Optimization level (-O2) ---------------------------------------------
  mOptLevel = llvm::CodeGenOpt::Default;

  // --- Architecture type ----------------------------------------------------
  // Starts out unknown; initializeArch() replaces it once a target is found.
  mArchType = llvm::Triple::UnknownArch;

  // The defaults above must be in place before these run, since
  // initializeArch() may adjust some of them per architecture.
  initializeTarget();
  initializeArch();
}
// Looks up the llvm::Target registered for mTriple and stores it in mTarget.
// Returns true when a target was found; otherwise logs the lookup error and
// returns false (mTarget is then null).
bool CompilerConfig::initializeTarget() {
  std::string lookupError;
  mTarget = llvm::TargetRegistry::lookupTarget(mTriple, lookupError);

  if (mTarget == nullptr) {
    ALOGE("Cannot initialize llvm::Target for given triple '%s'! (%s)",
          mTriple.c_str(), lookupError.c_str());
    return false;
  }

  return true;
}
// Derives mArchType from the already-resolved mTarget and applies the
// architecture-specific configuration: a list of subtarget feature attributes
// and, depending on the case, the CPU name, code model, relocation model or
// target options.
//
// Returns false, without calling setFeatureString(), when mTarget is null or
// when mArchType matches no case compiled into this build. Otherwise the
// collected attributes are handed to setFeatureString() and true is returned.
bool CompilerConfig::initializeArch() {
if (mTarget != nullptr) {
mArchType = llvm::Triple::getArchTypeForLLVMName(mTarget->getName());
} else {
// No target was resolved, so there is nothing to configure.
mArchType = llvm::Triple::UnknownArch;
return false;
}
// Configure each architecture for any necessary additional flags.
// Each case below only exists when its PROVIDE_*_CODEGEN macro is defined;
// an architecture whose case is compiled out falls through to 'default'.
std::vector<std::string> attributes;
switch (mArchType) {
#if defined(PROVIDE_ARM_CODEGEN)
case llvm::Triple::arm: {
// Query the features of the CPU this process is running on. The return
// value is not checked; every lookup below tests count() first, so a
// feature that is absent from the map is treated as unsupported.
llvm::StringMap<bool> features;
llvm::sys::getHostCPUFeatures(features);
// "+vfp3" is added for host builds or when ARCH_ARM_HAVE_VFP is defined;
// "+d16" is added on top of that only for non-host builds that do not
// define ARCH_ARM_HAVE_VFP_D32.
#if defined(__HOST__) || defined(ARCH_ARM_HAVE_VFP)
attributes.push_back("+vfp3");
#if !defined(__HOST__) && !defined(ARCH_ARM_HAVE_VFP_D32)
attributes.push_back("+d16");
#endif // !__HOST__ && !ARCH_ARM_HAVE_VFP_D32
#endif // __HOST__ || ARCH_ARM_HAVE_VFP
// NOTE: the if/else below is split across preprocessor regions. With
// __HOST__ or ARCH_ARM_HAVE_NEON defined it is a real if/else on
// mFullPrecision; without them the 'if', 'else' and closing brace are
// compiled out and the two "-neon*" attributes are added unconditionally.
#if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
// Only enable NEON on ARM if we have relaxed precision floats.
if (!mFullPrecision) {
attributes.push_back("+neon");
} else {
#endif // __HOST__ || ARCH_ARM_HAVE_NEON
attributes.push_back("-neon");
attributes.push_back("-neonfp");
#if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
}
#endif // __HOST__ || ARCH_ARM_HAVE_NEON
// Hardware divide is enabled per detected feature unless
// getProperty("debug.rs.arm-no-hwdiv") evaluates to true.
if (!getProperty("debug.rs.arm-no-hwdiv")) {
if (features.count("hwdiv-arm") && features["hwdiv-arm"])
attributes.push_back("+hwdiv-arm");
if (features.count("hwdiv") && features["hwdiv"])
attributes.push_back("+hwdiv");
}
// Enable fp16 attribute if available in the feature list. This feature
// will not be added in the host version of bcc or bcc_compat since
// 'features' would correspond to features in an x86 host.
if (features.count("fp16") && features["fp16"])
attributes.push_back("+fp16");
#if defined(PROVIDE_ARM64_CODEGEN)
// On AArch64, asimd in /proc/cpuinfo signals the presence of hardware
// half-precision conversion instructions. getHostCPUFeatures translates
// this to "neon". If PROVIDE_ARM64_CODEGEN is set, enable "+fp16" for ARM
// codegen if "neon" is present in features.
// (If "fp16" was also detected above, "+fp16" ends up in the list twice.)
if (features.count("neon") && features["neon"])
attributes.push_back("+fp16");
#endif // PROVIDE_ARM64_CODEGEN
// The CPU is set to the host CPU name only when both TARGET_BUILD and
// DEFAULT_ARM_CODEGEN are defined and
// getProperty("debug.rs.arm-no-tune-for-cpu") does not evaluate to true.
#if defined(TARGET_BUILD)
if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
#ifdef DEFAULT_ARM_CODEGEN
setCPU(llvm::sys::getHostCPUName());
#endif
}
#endif // TARGET_BUILD
break;
}
#endif // PROVIDE_ARM_CODEGEN
#if defined(PROVIDE_ARM64_CODEGEN)
// AArch64 adds no feature attributes; it only optionally sets the CPU to the
// host CPU name, under the same kind of guards as the 32-bit ARM case
// (TARGET_BUILD, DEFAULT_ARM64_CODEGEN and the same property check).
case llvm::Triple::aarch64:
#if defined(TARGET_BUILD)
if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
#ifdef DEFAULT_ARM64_CODEGEN
setCPU(llvm::sys::getHostCPUName());
#endif
}
#endif // TARGET_BUILD
break;
#endif // PROVIDE_ARM64_CODEGEN
#if defined (PROVIDE_MIPS_CODEGEN)
case llvm::Triple::mips:
case llvm::Triple::mipsel:
// Default to the static relocation model, but keep any model that has
// already been set.
if (!mRelocModel.hasValue()) {
mRelocModel = llvm::Reloc::Static;
}
break;
#endif // PROVIDE_MIPS_CODEGEN
#if defined (PROVIDE_MIPS64_CODEGEN)
case llvm::Triple::mips64:
case llvm::Triple::mips64el:
// Default revision for MIPS64 Android is R6.
setCPU("mips64r6");
break;
#endif // PROVIDE_MIPS64_CODEGEN
#if defined (PROVIDE_X86_CODEGEN)
case llvm::Triple::x86:
getTargetOptions().UseInitArray = true;
// On-device builds with DEFAULT_X86_CODEGEN use the host CPU name and its
// detected features; every other configuration uses the fixed "atom" CPU.
#if defined (DEFAULT_X86_CODEGEN) && !defined (__HOST__)
setCPU(llvm::sys::getHostCPUName());
AddX86NativeCPUFeatures(&attributes);
#else
// generic fallback for 32bit x86 targets
setCPU("atom");
#endif // DEFAULT_X86_CODEGEN && !__HOST__
break;
#endif // PROVIDE_X86_CODEGEN
#if defined (PROVIDE_X86_CODEGEN)
// PROVIDE_X86_CODEGEN is defined for both x86 and x86_64
case llvm::Triple::x86_64:
// On-device builds with DEFAULT_X86_64_CODEGEN use the host CPU name and its
// detected features; every other configuration uses the fixed "core2" CPU.
#if defined(DEFAULT_X86_64_CODEGEN) && !defined(__HOST__)
setCPU(llvm::sys::getHostCPUName());
AddX86NativeCPUFeatures(&attributes);
#else
// generic fallback for 64bit x86 targets
setCPU("core2");
#endif
// x86_64 needs the small code model when the PIC_ relocation model is used,
// or else dlopen fails with TEXTREL. In every other situation (including no
// relocation model being set) the medium code model is selected.
if (mRelocModel.hasValue() && mRelocModel.getValue() == llvm::Reloc::PIC_) {
setCodeModel(llvm::CodeModel::Small);
} else {
setCodeModel(llvm::CodeModel::Medium);
}
getTargetOptions().UseInitArray = true;
break;
#endif // PROVIDE_X86_CODEGEN
default:
// mTarget is known to be non-null here because of the check at the top of
// this function. The feature string is left untouched on this path.
ALOGE("Unsupported architecture type: %s", mTarget->getName());
return false;
}
// Turn the collected attributes into the feature string.
setFeatureString(attributes);
return true;
}
void CompilerConfig::setFeatureString(const std::vector<std::string> &pAttrs) {
llvm::SubtargetFeatures f;
for (std::vector<std::string>::const_iterator attr_iter = pAttrs.begin(),
attr_end = pAttrs.end();
attr_iter != attr_end; attr_iter++) {
f.AddFeature(*attr_iter);
}
mFeatureString = f.getString();
return;
}