/*
* Copyright 2012, The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "bcc/Support/CompilerConfig.h"
#include "bcc/Config/Config.h"
#include "bcc/Support/Properties.h"
#include <llvm/CodeGen/SchedulerRegistry.h>
#include <llvm/MC/SubtargetFeature.h>
#include <llvm/Support/Host.h>
#include <llvm/Support/TargetRegistry.h>
#include "bcc/Support/Log.h"
using namespace bcc;
#if defined (PROVIDE_X86_CODEGEN) && !defined(__HOST__)
namespace {
// Utility function to test for f16c feature. This function is only needed for
// on-device bcc for x86
bool HasF16C() {
llvm::StringMap<bool> features;
if (!llvm::sys::getHostCPUFeatures(features))
return false;
if (features.count("f16c") && features["f16c"])
return true;
else
return false;
}
}
#endif // (PROVIDE_X86_CODEGEN) && !defined(__HOST__)
CompilerConfig::CompilerConfig(const std::string &pTriple)
: mTriple(pTriple), mFullPrecision(true), mTarget(nullptr) {
//===--------------------------------------------------------------------===//
// Default setting of target options
//===--------------------------------------------------------------------===//
// Use soft-float ABI. This only selects the ABI (and is applicable only to
// ARM targets). Codegen still uses hardware FPU by default. To use software
// floating point, add 'soft-float' feature to mFeatureString below.
mTargetOpts.FloatABIType = llvm::FloatABI::Soft;
//===--------------------------------------------------------------------===//
// Default setting for code model
//===--------------------------------------------------------------------===//
mCodeModel = llvm::CodeModel::Small;
//===--------------------------------------------------------------------===//
// Default setting for relocation model
//===--------------------------------------------------------------------===//
mRelocModel = llvm::Reloc::Default;
//===--------------------------------------------------------------------===//
// Default setting for optimization level (-O2)
//===--------------------------------------------------------------------===//
mOptLevel = llvm::CodeGenOpt::Default;
//===--------------------------------------------------------------------===//
// Default setting for architecture type
//===--------------------------------------------------------------------===//
mArchType = llvm::Triple::UnknownArch;
initializeTarget();
initializeArch();
return;
}
bool CompilerConfig::initializeTarget() {
std::string error;
mTarget = llvm::TargetRegistry::lookupTarget(mTriple, error);
if (mTarget != nullptr) {
return true;
} else {
ALOGE("Cannot initialize llvm::Target for given triple '%s'! (%s)",
mTriple.c_str(), error.c_str());
return false;
}
}
bool CompilerConfig::initializeArch() {
if (mTarget != nullptr) {
mArchType = llvm::Triple::getArchTypeForLLVMName(mTarget->getName());
} else {
mArchType = llvm::Triple::UnknownArch;
return false;
}
// Configure each architecture for any necessary additional flags.
std::vector<std::string> attributes;
switch (mArchType) {
#if defined(PROVIDE_ARM_CODEGEN)
case llvm::Triple::arm: {
llvm::StringMap<bool> features;
llvm::sys::getHostCPUFeatures(features);
#if defined(__HOST__) || defined(ARCH_ARM_HAVE_VFP)
attributes.push_back("+vfp3");
#if !defined(__HOST__) && !defined(ARCH_ARM_HAVE_VFP_D32)
attributes.push_back("+d16");
#endif // !__HOST__ && !ARCH_ARM_HAVE_VFP_D32
#endif // __HOST__ || ARCH_ARM_HAVE_VFP
#if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
// Only enable NEON on ARM if we have relaxed precision floats.
if (!mFullPrecision) {
attributes.push_back("+neon");
} else {
#endif // __HOST__ || ARCH_ARM_HAVE_NEON
attributes.push_back("-neon");
attributes.push_back("-neonfp");
#if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
}
#endif // __HOST__ || ARCH_ARM_HAVE_NEON
if (!getProperty("debug.rs.arm-no-hwdiv")) {
if (features.count("hwdiv-arm") && features["hwdiv-arm"])
attributes.push_back("+hwdiv-arm");
if (features.count("hwdiv") && features["hwdiv"])
attributes.push_back("+hwdiv");
}
// Enable fp16 attribute if available in the feature list. This feature
// will not be added in the host version of bcc or bcc_compat since
// 'features' would correspond to features in an x86 host.
if (features.count("fp16") && features["fp16"])
attributes.push_back("+fp16");
#if defined(PROVIDE_ARM64_CODEGEN)
// On AArch64, asimd in /proc/cpuinfo signals the presence of hardware
// half-precision conversion instructions. getHostCPUFeatures translates
// this to "neon". If PROVIDE_ARM64_CODEGEN is set, enable "+fp16" for ARM
// codegen if "neon" is present in features.
if (features.count("neon") && features["neon"])
attributes.push_back("+fp16");
#endif // PROVIDE_ARM64_CODEGEN
#if defined(TARGET_BUILD)
if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
#ifndef FORCE_CPU_VARIANT_32
#ifdef DEFAULT_ARM_CODEGEN
setCPU(llvm::sys::getHostCPUName());
#endif
#else
#define XSTR(S) #S
#define STR(S) XSTR(S)
setCPU(STR(FORCE_CPU_VARIANT_32));
#undef STR
#undef XSTR
#endif
}
#endif // TARGET_BUILD
break;
}
#endif // PROVIDE_ARM_CODEGEN
#if defined(PROVIDE_ARM64_CODEGEN)
case llvm::Triple::aarch64:
#if defined(TARGET_BUILD)
if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
#ifndef FORCE_CPU_VARIANT_64
#ifdef DEFAULT_ARM64_CODEGEN
setCPU(llvm::sys::getHostCPUName());
#endif
#else
#define XSTR(S) #S
#define STR(S) XSTR(S)
setCPU(STR(FORCE_CPU_VARIANT_64));
#undef STR
#undef XSTR
#endif
}
#endif // TARGET_BUILD
break;
#endif // PROVIDE_ARM64_CODEGEN
#if defined (PROVIDE_MIPS_CODEGEN)
case llvm::Triple::mips:
case llvm::Triple::mipsel:
if (getRelocationModel() == llvm::Reloc::Default) {
setRelocationModel(llvm::Reloc::Static);
}
break;
#endif // PROVIDE_MIPS_CODEGEN
#if defined (PROVIDE_MIPS64_CODEGEN)
case llvm::Triple::mips64:
case llvm::Triple::mips64el:
// Default revision for MIPS64 Android is R6.
setCPU("mips64r6");
break;
#endif // PROVIDE_MIPS64_CODEGEN
#if defined (PROVIDE_X86_CODEGEN)
case llvm::Triple::x86:
getTargetOptions().UseInitArray = true;
#if defined (DEFAULT_X86_CODEGEN) && !defined (DEFAULT_X86_64_CODEGEN)
setCPU(llvm::sys::getHostCPUName());
#else
// generic fallback for 32bit x86 targets
setCPU("atom");
#endif // DEFAULT_X86_CODEGEN && !DEFAULT_X86_64_CODEGEN
#ifndef __HOST__
// If not running on the host, and f16c is available, set it in the feature
// string
if (HasF16C())
attributes.push_back("+f16c");
#if defined(__SSE3__)
attributes.push_back("+sse3");
attributes.push_back("+ssse3");
#endif
#if defined(__SSE4_1__)
attributes.push_back("+sse4.1");
#endif
#if defined(__SSE4_2__)
attributes.push_back("+sse4.2");
#endif
#endif // __HOST__
break;
#endif // PROVIDE_X86_CODEGEN
#if defined (PROVIDE_X86_CODEGEN)
// PROVIDE_X86_CODEGEN is defined for both x86 and x86_64
case llvm::Triple::x86_64:
#if defined(DEFAULT_X86_64_CODEGEN) && !defined(__HOST__)
setCPU(llvm::sys::getHostCPUName());
#else
// generic fallback for 64bit x86 targets
setCPU("core2");
#endif
// x86_64 needs small CodeModel if use PIC_ reloc, or else dlopen failed with TEXTREL.
if (getRelocationModel() == llvm::Reloc::PIC_) {
setCodeModel(llvm::CodeModel::Small);
} else {
setCodeModel(llvm::CodeModel::Medium);
}
getTargetOptions().UseInitArray = true;
#ifndef __HOST__
// If not running on the host, and f16c is available, set it in the feature
// string
if (HasF16C())
attributes.push_back("+f16c");
#endif // __HOST__
break;
#endif // PROVIDE_X86_CODEGEN
default:
ALOGE("Unsupported architecture type: %s", mTarget->getName());
return false;
}
setFeatureString(attributes);
return true;
}
void CompilerConfig::setFeatureString(const std::vector<std::string> &pAttrs) {
llvm::SubtargetFeatures f;
for (std::vector<std::string>::const_iterator attr_iter = pAttrs.begin(),
attr_end = pAttrs.end();
attr_iter != attr_end; attr_iter++) {
f.AddFeature(*attr_iter);
}
mFeatureString = f.getString();
return;
}