lib/CompilerConfig.cpp - platform/frameworks/compile/libbcc - Git at Google

 /*
  * Copyright 2012, The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #include "bcc/CompilerConfig.h"

 #include "Log.h"
 #include "Properties.h"

 #include "bcc/Config.h"

 #include <llvm/CodeGen/SchedulerRegistry.h>
 #include <llvm/MC/SubtargetFeature.h>
 #include <llvm/Support/Host.h>
 #include <llvm/Support/TargetRegistry.h>

 using namespace bcc;

 #if defined (PROVIDE_X86_CODEGEN) && !defined(__HOST__)

 namespace {

 // Utility function to add feature flags supported by the running CPU.
 // This function is only needed for on-device bcc for x86.
 void AddX86NativeCPUFeatures(std::vector<std::string>* attributes) {
   llvm::StringMap<bool> features;
   if (llvm::sys::getHostCPUFeatures(features)) {
     for (const auto& f : features)
       attributes->push_back((f.second ? '+' : '-') + f.first().str());
   }

   // LLVM generates AVX code that treats a long3 as 256 bits, while
   // RenderScript considers a long3 192 bits (http://b/28879581)
   attributes->push_back("-avx");
 }

 }
 #endif // (PROVIDE_X86_CODEGEN) && !defined(__HOST__)

 // Builds a configuration for the target triple `pTriple`: installs the
 // default target options, code model, optimization level and architecture
 // type, then resolves the LLVM target and runs the per-architecture setup.
 // The results of the two initialize*() calls are not propagated from here.
 CompilerConfig::CompilerConfig(const std::string &pTriple)
     : mTriple(pTriple), mFullPrecision(true), mTarget(nullptr) {
   // Target options: select the soft-float ABI.  This affects only the ABI
   // (and only ARM targets); codegen still uses the hardware FPU by default.
   // To use software floating point, add the 'soft-float' feature to
   // mFeatureString.
   mTargetOpts.FloatABIType = llvm::FloatABI::Soft;

   // Code model.
   mCodeModel = llvm::CodeModel::Small;

   // Optimization level (-O2).
   mOptLevel = llvm::CodeGenOpt::Default;

   // Architecture type; initializeArch() replaces it when a target is found.
   mArchType = llvm::Triple::UnknownArch;

   initializeTarget();
   initializeArch();
 }

 // Looks up the llvm::Target registered for mTriple and stores it in mTarget.
 // Returns true on success; on failure logs the lookup error and returns false.
 bool CompilerConfig::initializeTarget() {
   std::string lookupError;
   mTarget = llvm::TargetRegistry::lookupTarget(mTriple, lookupError);

   if (mTarget == nullptr) {
     ALOGE("Cannot initialize llvm::Target for given triple '%s'! (%s)",
           mTriple.c_str(), lookupError.c_str());
     return false;
   }

   return true;
 }

 // Derives mArchType from the previously looked-up mTarget and applies the
 // per-architecture defaults (CPU name, feature attributes, relocation model,
 // code model, target options).  Which cases exist is decided at build time by
 // the PROVIDE_*_CODEGEN macros.
 //
 // Returns false without calling setFeatureString() when mTarget is null or
 // when the architecture has no case compiled into this build.  Otherwise the
 // collected attributes are passed to setFeatureString() and true is returned.
 bool CompilerConfig::initializeArch() {
   if (mTarget != nullptr) {
     mArchType = llvm::Triple::getArchTypeForLLVMName(mTarget->getName());
   } else {
     mArchType = llvm::Triple::UnknownArch;
     return false;
   }

   // Configure each architecture for any necessary additional flags.
   std::vector<std::string> attributes;
   switch (mArchType) {
 #if defined(PROVIDE_ARM_CODEGEN)
   case llvm::Triple::arm: {
     // The boolean result is ignored here.  Every lookup below goes through
     // features.count() first, so a map without the key adds nothing.
     // NOTE(review): presumably the map stays empty on failure - confirm.
     llvm::StringMap<bool> features;
     llvm::sys::getHostCPUFeatures(features);

 #if defined(__HOST__) || defined(ARCH_ARM_HAVE_VFP)
     attributes.push_back("+vfp3");
 #if !defined(__HOST__) && !defined(ARCH_ARM_HAVE_VFP_D32)
     attributes.push_back("+d16");
 #endif  // !__HOST__ && !ARCH_ARM_HAVE_VFP_D32
 #endif  // __HOST__ || ARCH_ARM_HAVE_VFP

     // The if/else braces below are split across two #if regions: when neither
     // __HOST__ nor ARCH_ARM_HAVE_NEON is defined, only the two "-neon" /
     // "-neonfp" push_back calls remain and they run unconditionally.
     // The constructor sets mFullPrecision to true before calling this
     // function, so on that path the else-branch is the one taken.
 #if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
     // Only enable NEON on ARM if we have relaxed precision floats.
     if (!mFullPrecision) {
       attributes.push_back("+neon");
     } else {
 #endif  // __HOST__ || ARCH_ARM_HAVE_NEON
       attributes.push_back("-neon");
       attributes.push_back("-neonfp");
 #if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
     }
 #endif  // __HOST__ || ARCH_ARM_HAVE_NEON

     // A truthy "debug.rs.arm-no-hwdiv" property suppresses both hardware
     // divide attributes; otherwise each is added only if the host reports it.
     if (!getProperty("debug.rs.arm-no-hwdiv")) {
       if (features.count("hwdiv-arm") && features["hwdiv-arm"])
         attributes.push_back("+hwdiv-arm");

       if (features.count("hwdiv") && features["hwdiv"])
         attributes.push_back("+hwdiv");
     }

     // Enable fp16 attribute if available in the feature list.  This feature
     // will not be added in the host version of bcc or bcc_compat since
     // 'features' would correspond to features in an x86 host.
     if (features.count("fp16") && features["fp16"])
       attributes.push_back("+fp16");

 #if defined(PROVIDE_ARM64_CODEGEN)
     // On AArch64, asimd in /proc/cpuinfo signals the presence of hardware
     // half-precision conversion instructions.  getHostCPUFeatures translates
     // this to "neon".  If PROVIDE_ARM64_CODEGEN is set, enable "+fp16" for ARM
     // codegen if "neon" is present in features.
     // Note: if both "fp16" and "neon" are reported, "+fp16" is appended to
     // attributes twice.
     if (features.count("neon") && features["neon"])
       attributes.push_back("+fp16");
 #endif // PROVIDE_ARM64_CODEGEN

     // Tune for the running CPU on target builds unless the
     // "debug.rs.arm-no-tune-for-cpu" property is truthy.  The setCPU() call is
     // compiled in only when DEFAULT_ARM_CODEGEN is defined; otherwise the
     // if-body is empty.
 #if defined(TARGET_BUILD)
     if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
 #ifdef DEFAULT_ARM_CODEGEN
       setCPU(llvm::sys::getHostCPUName());
 #endif
     }
 #endif  // TARGET_BUILD

     break;
   }
 #endif  // PROVIDE_ARM_CODEGEN

 #if defined(PROVIDE_ARM64_CODEGEN)
   // AArch64 adds no feature attributes; it only optionally tunes for the host
   // CPU, under the same property and TARGET_BUILD gating as the ARM case.
   case llvm::Triple::aarch64:
 #if defined(TARGET_BUILD)
     if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
 #ifdef DEFAULT_ARM64_CODEGEN
       setCPU(llvm::sys::getHostCPUName());
 #endif
     }
 #endif  // TARGET_BUILD
     break;
 #endif  // PROVIDE_ARM64_CODEGEN

 #if defined (PROVIDE_MIPS_CODEGEN)
   // 32-bit MIPS: use the static relocation model unless a relocation model
   // has already been set on this config.
   case llvm::Triple::mips:
   case llvm::Triple::mipsel:
     if (!mRelocModel.hasValue()) {
       mRelocModel = llvm::Reloc::Static;
     }
     break;
 #endif  // PROVIDE_MIPS_CODEGEN

 #if defined (PROVIDE_MIPS64_CODEGEN)
   case llvm::Triple::mips64:
   case llvm::Triple::mips64el:
     // Default revision for MIPS64 Android is R6.
     setCPU("mips64r6");
     break;
 #endif // PROVIDE_MIPS64_CODEGEN

 #if defined (PROVIDE_X86_CODEGEN)
   // 32-bit x86: on-device default-x86 builds use the host CPU name and its
   // reported features; every other configuration uses the fixed "atom" CPU.
   case llvm::Triple::x86:
     getTargetOptions().UseInitArray = true;
 #if defined (DEFAULT_X86_CODEGEN) && !defined (__HOST__)
     setCPU(llvm::sys::getHostCPUName());
     AddX86NativeCPUFeatures(&attributes);
 #else
     // generic fallback for 32bit x86 targets
     setCPU("atom");
 #endif // DEFAULT_X86_CODEGEN && !__HOST__
     break;
 #endif  // PROVIDE_X86_CODEGEN

 #if defined (PROVIDE_X86_CODEGEN)
 // PROVIDE_X86_CODEGEN is defined for both x86 and x86_64
   case llvm::Triple::x86_64:
 #if defined(DEFAULT_X86_64_CODEGEN) && !defined(__HOST__)
     setCPU(llvm::sys::getHostCPUName());
     AddX86NativeCPUFeatures(&attributes);
 #else
     // generic fallback for 64bit x86 targets
     setCPU("core2");
 #endif
     // x86_64 needs small CodeModel if use PIC_ reloc, or else dlopen failed with TEXTREL.
     // Any other relocation model, including an unset one, selects Medium.
     if (mRelocModel.hasValue() && mRelocModel.getValue() == llvm::Reloc::PIC_) {
       setCodeModel(llvm::CodeModel::Small);
     } else {
       setCodeModel(llvm::CodeModel::Medium);
     }
     getTargetOptions().UseInitArray = true;
     break;
 #endif  // PROVIDE_X86_CODEGEN

   default:
     // mTarget is non-null here (checked at the top), so getName() is safe.
     ALOGE("Unsupported architecture type: %s", mTarget->getName());
     return false;
   }

   setFeatureString(attributes);
   return true;
 }

 void CompilerConfig::setFeatureString(const std::vector<std::string> &pAttrs) {
   llvm::SubtargetFeatures f;

   for (std::vector<std::string>::const_iterator attr_iter = pAttrs.begin(),
            attr_end = pAttrs.end();
        attr_iter != attr_end; attr_iter++) {
     f.AddFeature(*attr_iter);
   }

   mFeatureString = f.getString();
   return;
 }
	/*
	* Copyright 2012, The Android Open Source Project
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	#include "bcc/CompilerConfig.h"

	#include "Log.h"
	#include "Properties.h"

	#include "bcc/Config.h"

	#include <llvm/CodeGen/SchedulerRegistry.h>
	#include <llvm/MC/SubtargetFeature.h>
	#include <llvm/Support/Host.h>
	#include <llvm/Support/TargetRegistry.h>

	using namespace bcc;

	#if defined (PROVIDE_X86_CODEGEN) && !defined(__HOST__)

	namespace {

	// Utility function to add feature flags supported by the running CPU.
	// This function is only needed for on-device bcc for x86.
	void AddX86NativeCPUFeatures(std::vector<std::string>* attributes) {
	llvm::StringMap<bool> features;
	if (llvm::sys::getHostCPUFeatures(features)) {
	for (const auto& f : features)
	attributes->push_back((f.second ? '+' : '-') + f.first().str());
	}

	// LLVM generates AVX code that treats a long3 as 256 bits, while
	// RenderScript considers a long3 192 bits (http://b/28879581)
	attributes->push_back("-avx");
	}

	}
	#endif // (PROVIDE_X86_CODEGEN) && !defined(__HOST__)

	// Constructs the configuration for target triple `pTriple` with default
	// settings, then looks up the LLVM target and configures the architecture.
	// The return values of initializeTarget() / initializeArch() are discarded.
	CompilerConfig::CompilerConfig(const std::string &pTriple)
	    : mTriple(pTriple), mFullPrecision(true), mTarget(nullptr) {
	  // Default target options: use the soft-float ABI. This only selects the
	  // ABI (and is applicable only to ARM targets). Codegen still uses the
	  // hardware FPU by default. To use software floating point, add the
	  // 'soft-float' feature to mFeatureString.
	  mTargetOpts.FloatABIType = llvm::FloatABI::Soft;

	  // Default code model.
	  mCodeModel = llvm::CodeModel::Small;

	  // Default optimization level (-O2).
	  mOptLevel = llvm::CodeGenOpt::Default;

	  // Default architecture type, until initializeArch() determines it.
	  mArchType = llvm::Triple::UnknownArch;

	  initializeTarget();
	  initializeArch();
	}

	// Resolves mTriple to an llvm::Target via the target registry and stores the
	// result in mTarget.  Logs the registry's error text and returns false when
	// no target is found; returns true otherwise.
	bool CompilerConfig::initializeTarget() {
	  std::string errorText;
	  mTarget = llvm::TargetRegistry::lookupTarget(mTriple, errorText);

	  const bool found = (mTarget != nullptr);
	  if (!found) {
	    ALOGE("Cannot initialize llvm::Target for given triple '%s'! (%s)",
	          mTriple.c_str(), errorText.c_str());
	  }
	  return found;
	}

	// Derives mArchType from the previously looked-up mTarget and applies the
	// per-architecture defaults (CPU name, feature attributes, relocation model,
	// code model, target options).  Which cases exist is decided at build time
	// by the PROVIDE_*_CODEGEN macros.
	//
	// Returns false without calling setFeatureString() when mTarget is null or
	// when the architecture has no case compiled into this build.  Otherwise the
	// collected attributes are passed to setFeatureString() and true is returned.
	bool CompilerConfig::initializeArch() {
	  if (mTarget != nullptr) {
	    mArchType = llvm::Triple::getArchTypeForLLVMName(mTarget->getName());
	  } else {
	    mArchType = llvm::Triple::UnknownArch;
	    return false;
	  }

	  // Configure each architecture for any necessary additional flags.
	  std::vector<std::string> attributes;
	  switch (mArchType) {
	#if defined(PROVIDE_ARM_CODEGEN)
	  case llvm::Triple::arm: {
	    // The boolean result is ignored here.  Every lookup below goes through
	    // features.count() first, so a map without the key adds nothing.
	    llvm::StringMap<bool> features;
	    llvm::sys::getHostCPUFeatures(features);

	#if defined(__HOST__) || defined(ARCH_ARM_HAVE_VFP)
	    attributes.push_back("+vfp3");
	#if !defined(__HOST__) && !defined(ARCH_ARM_HAVE_VFP_D32)
	    attributes.push_back("+d16");
	#endif  // !__HOST__ && !ARCH_ARM_HAVE_VFP_D32
	#endif  // __HOST__ || ARCH_ARM_HAVE_VFP

	    // The if/else braces below are split across two #if regions: when
	    // neither __HOST__ nor ARCH_ARM_HAVE_NEON is defined, only the two
	    // "-neon" / "-neonfp" push_back calls remain and run unconditionally.
	#if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
	    // Only enable NEON on ARM if we have relaxed precision floats.
	    if (!mFullPrecision) {
	      attributes.push_back("+neon");
	    } else {
	#endif  // __HOST__ || ARCH_ARM_HAVE_NEON
	      attributes.push_back("-neon");
	      attributes.push_back("-neonfp");
	#if defined(__HOST__) || defined(ARCH_ARM_HAVE_NEON)
	    }
	#endif  // __HOST__ || ARCH_ARM_HAVE_NEON

	    // A truthy "debug.rs.arm-no-hwdiv" property suppresses both hardware
	    // divide attributes; otherwise each is added only if the host reports it.
	    if (!getProperty("debug.rs.arm-no-hwdiv")) {
	      if (features.count("hwdiv-arm") && features["hwdiv-arm"])
	        attributes.push_back("+hwdiv-arm");

	      if (features.count("hwdiv") && features["hwdiv"])
	        attributes.push_back("+hwdiv");
	    }

	    // Enable fp16 attribute if available in the feature list. This feature
	    // will not be added in the host version of bcc or bcc_compat since
	    // 'features' would correspond to features in an x86 host.
	    if (features.count("fp16") && features["fp16"])
	      attributes.push_back("+fp16");

	#if defined(PROVIDE_ARM64_CODEGEN)
	    // On AArch64, asimd in /proc/cpuinfo signals the presence of hardware
	    // half-precision conversion instructions. getHostCPUFeatures translates
	    // this to "neon". If PROVIDE_ARM64_CODEGEN is set, enable "+fp16" for ARM
	    // codegen if "neon" is present in features.
	    if (features.count("neon") && features["neon"])
	      attributes.push_back("+fp16");
	#endif  // PROVIDE_ARM64_CODEGEN

	    // Tune for the running CPU on target builds unless the
	    // "debug.rs.arm-no-tune-for-cpu" property is truthy.  The setCPU() call
	    // is compiled in only when DEFAULT_ARM_CODEGEN is defined.
	#if defined(TARGET_BUILD)
	    if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
	#ifdef DEFAULT_ARM_CODEGEN
	      setCPU(llvm::sys::getHostCPUName());
	#endif
	    }
	#endif  // TARGET_BUILD

	    break;
	  }
	#endif  // PROVIDE_ARM_CODEGEN

	#if defined(PROVIDE_ARM64_CODEGEN)
	  // AArch64 adds no feature attributes; it only optionally tunes for the
	  // host CPU, under the same gating as the ARM case.
	  case llvm::Triple::aarch64:
	#if defined(TARGET_BUILD)
	    if (!getProperty("debug.rs.arm-no-tune-for-cpu")) {
	#ifdef DEFAULT_ARM64_CODEGEN
	      setCPU(llvm::sys::getHostCPUName());
	#endif
	    }
	#endif  // TARGET_BUILD
	    break;
	#endif  // PROVIDE_ARM64_CODEGEN

	#if defined (PROVIDE_MIPS_CODEGEN)
	  // 32-bit MIPS: use the static relocation model unless a relocation model
	  // has already been set on this config.
	  case llvm::Triple::mips:
	  case llvm::Triple::mipsel:
	    if (!mRelocModel.hasValue()) {
	      mRelocModel = llvm::Reloc::Static;
	    }
	    break;
	#endif  // PROVIDE_MIPS_CODEGEN

	#if defined (PROVIDE_MIPS64_CODEGEN)
	  case llvm::Triple::mips64:
	  case llvm::Triple::mips64el:
	    // Default revision for MIPS64 Android is R6.
	    setCPU("mips64r6");
	    break;
	#endif  // PROVIDE_MIPS64_CODEGEN

	#if defined (PROVIDE_X86_CODEGEN)
	  // 32-bit x86: on-device default-x86 builds use the host CPU name and its
	  // reported features; every other configuration uses the fixed "atom" CPU.
	  case llvm::Triple::x86:
	    getTargetOptions().UseInitArray = true;
	#if defined (DEFAULT_X86_CODEGEN) && !defined (__HOST__)
	    setCPU(llvm::sys::getHostCPUName());
	    AddX86NativeCPUFeatures(&attributes);
	#else
	    // generic fallback for 32bit x86 targets
	    setCPU("atom");
	#endif  // DEFAULT_X86_CODEGEN && !__HOST__
	    break;
	#endif  // PROVIDE_X86_CODEGEN

	#if defined (PROVIDE_X86_CODEGEN)
	  // PROVIDE_X86_CODEGEN is defined for both x86 and x86_64
	  case llvm::Triple::x86_64:
	#if defined(DEFAULT_X86_64_CODEGEN) && !defined(__HOST__)
	    setCPU(llvm::sys::getHostCPUName());
	    AddX86NativeCPUFeatures(&attributes);
	#else
	    // generic fallback for 64bit x86 targets
	    setCPU("core2");
	#endif
	    // x86_64 needs small CodeModel if use PIC_ reloc, or else dlopen failed with TEXTREL.
	    // Any other relocation model, including an unset one, selects Medium.
	    if (mRelocModel.hasValue() && mRelocModel.getValue() == llvm::Reloc::PIC_) {
	      setCodeModel(llvm::CodeModel::Small);
	    } else {
	      setCodeModel(llvm::CodeModel::Medium);
	    }
	    getTargetOptions().UseInitArray = true;
	    break;
	#endif  // PROVIDE_X86_CODEGEN

	  default:
	    // mTarget is non-null here (checked at the top), so getName() is safe.
	    ALOGE("Unsupported architecture type: %s", mTarget->getName());
	    return false;
	  }

	  setFeatureString(attributes);
	  return true;
	}

	void CompilerConfig::setFeatureString(const std::vector<std::string> &pAttrs) {
	llvm::SubtargetFeatures f;

	for (std::vector<std::string>::const_iterator attr_iter = pAttrs.begin(),
	attr_end = pAttrs.end();
	attr_iter != attr_end; attr_iter++) {
	f.AddFeature(*attr_iter);
	}

	mFeatureString = f.getString();
	return;
	}