lib/Target/ARM/ARMTargetMachine.cpp - llvm - Git at Google

 //===-- ARMTargetMachine.cpp - Define TargetMachine for ARM ---------------===//
 //
 //                     The LLVM Compiler Infrastructure
 //
 // This file is distributed under the University of Illinois Open Source
 // License. See LICENSE.TXT for details.
 //
 //===----------------------------------------------------------------------===//
 //
 //
 //===----------------------------------------------------------------------===//

 #include "ARM.h"
 #include "ARMFrameLowering.h"
 #include "ARMTargetMachine.h"
 #include "ARMTargetObjectFile.h"
 #include "ARMTargetTransformInfo.h"
 #include "llvm/CodeGen/Passes.h"
 #include "llvm/IR/Function.h"
 #include "llvm/IR/LegacyPassManager.h"
 #include "llvm/MC/MCAsmInfo.h"
 #include "llvm/Support/CommandLine.h"
 #include "llvm/Support/FormattedStream.h"
 #include "llvm/Support/TargetRegistry.h"
 #include "llvm/Target/TargetOptions.h"
 #include "llvm/Transforms/Scalar.h"
 using namespace llvm;

 static cl::opt<bool>
 DisableA15SDOptimization("disable-a15-sd-optimization", cl::Hidden,
                    cl::desc("Inhibit optimization of S->D register accesses on A15"),
                    cl::init(false));

 static cl::opt<bool>
 EnableAtomicTidy("arm-atomic-cfg-tidy", cl::Hidden,
                  cl::desc("Run SimplifyCFG after expanding atomic operations"
                           " to make use of cmpxchg flow-based information"),
                  cl::init(true));

 static cl::opt<bool>
 EnableARMLoadStoreOpt("arm-load-store-opt", cl::Hidden,
                       cl::desc("Enable ARM load/store optimization pass"),
                       cl::init(true));

 // FIXME: Unify control over GlobalMerge.
 static cl::opt<cl::boolOrDefault>
 EnableGlobalMerge("arm-global-merge", cl::Hidden,
                   cl::desc("Enable the global merge pass"));

 extern "C" void LLVMInitializeARMTarget() {
   // Register the target.
   RegisterTargetMachine<ARMLETargetMachine> X(TheARMLETarget);
   RegisterTargetMachine<ARMBETargetMachine> Y(TheARMBETarget);
   RegisterTargetMachine<ThumbLETargetMachine> A(TheThumbLETarget);
   RegisterTargetMachine<ThumbBETargetMachine> B(TheThumbBETarget);
 }

 static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) {
   if (TT.isOSBinFormatMachO())
     return make_unique<TargetLoweringObjectFileMachO>();
   if (TT.isOSWindows())
     return make_unique<TargetLoweringObjectFileCOFF>();
   return make_unique<ARMElfTargetObjectFile>();
 }

 static ARMBaseTargetMachine::ARMABI
 computeTargetABI(const Triple &TT, StringRef CPU,
                  const TargetOptions &Options) {
   if (Options.MCOptions.getABIName().startswith("aapcs"))
     return ARMBaseTargetMachine::ARM_ABI_AAPCS;
   else if (Options.MCOptions.getABIName().startswith("apcs"))
     return ARMBaseTargetMachine::ARM_ABI_APCS;

   assert(Options.MCOptions.getABIName().empty() &&
          "Unknown target-abi option!");

   ARMBaseTargetMachine::ARMABI TargetABI =
       ARMBaseTargetMachine::ARM_ABI_UNKNOWN;

   // FIXME: This is duplicated code from the front end and should be unified.
   if (TT.isOSBinFormatMachO()) {
     if (TT.getEnvironment() == llvm::Triple::EABI ||
         (TT.getOS() == llvm::Triple::UnknownOS && TT.isOSBinFormatMachO()) ||
         CPU.startswith("cortex-m")) {
       TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
     } else {
       TargetABI = ARMBaseTargetMachine::ARM_ABI_APCS;
     }
   } else if (TT.isOSWindows()) {
     // FIXME: this is invalid for WindowsCE
     TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
   } else {
     // Select the default based on the platform.
     switch (TT.getEnvironment()) {
     case llvm::Triple::Android:
     case llvm::Triple::GNUEABI:
     case llvm::Triple::GNUEABIHF:
     case llvm::Triple::EABIHF:
     case llvm::Triple::EABI:
       TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
       break;
     case llvm::Triple::GNU:
       TargetABI = ARMBaseTargetMachine::ARM_ABI_APCS;
       break;
     default:
       if (TT.isOSNetBSD())
         TargetABI = ARMBaseTargetMachine::ARM_ABI_APCS;
       else
 	TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
       break;
     }
   }

   return TargetABI;
 }

 static std::string computeDataLayout(const Triple &TT, StringRef CPU,
                                      const TargetOptions &Options,
                                      bool isLittle) {
   auto ABI = computeTargetABI(TT, CPU, Options);
   std::string Ret = "";

   if (isLittle)
     // Little endian.
     Ret += "e";
   else
     // Big endian.
     Ret += "E";

   Ret += DataLayout::getManglingComponent(TT);

   // Pointers are 32 bits and aligned to 32 bits.
   Ret += "-p:32:32";

   // ABIs other than APCS have 64 bit integers with natural alignment.
   if (ABI != ARMBaseTargetMachine::ARM_ABI_APCS)
     Ret += "-i64:64";

   // We have 64 bits floats. The APCS ABI requires them to be aligned to 32
   // bits, others to 64 bits. We always try to align to 64 bits.
   if (ABI == ARMBaseTargetMachine::ARM_ABI_APCS)
     Ret += "-f64:32:64";

   // We have 128 and 64 bit vectors. The APCS ABI aligns them to 32 bits, others
   // to 64. We always ty to give them natural alignment.
   if (ABI == ARMBaseTargetMachine::ARM_ABI_APCS)
     Ret += "-v64:32:64-v128:32:128";
   else
     Ret += "-v128:64:128";

   // Try to align aggregates to 32 bits (the default is 64 bits, which has no
   // particular hardware support on 32-bit ARM).
   Ret += "-a:0:32";

   // Integer registers are 32 bits.
   Ret += "-n32";

   // The stack is 128 bit aligned on NaCl, 64 bit aligned on AAPCS and 32 bit
   // aligned everywhere else.
   if (TT.isOSNaCl())
     Ret += "-S128";
   else if (ABI == ARMBaseTargetMachine::ARM_ABI_AAPCS)
     Ret += "-S64";
   else
     Ret += "-S32";

   return Ret;
 }

 /// TargetMachine ctor - Create an ARM architecture model.
 ///
 ARMBaseTargetMachine::ARMBaseTargetMachine(const Target &T, const Triple &TT,
                                            StringRef CPU, StringRef FS,
                                            const TargetOptions &Options,
                                            Reloc::Model RM, CodeModel::Model CM,
                                            CodeGenOpt::Level OL, bool isLittle)
     : LLVMTargetMachine(T, computeDataLayout(TT, CPU, Options, isLittle), TT,
                         CPU, FS, Options, RM, CM, OL),
       TargetABI(computeTargetABI(TT, CPU, Options)),
       TLOF(createTLOF(getTargetTriple())),
       Subtarget(TT, CPU, FS, *this, isLittle), isLittle(isLittle) {

   // Default to triple-appropriate float ABI
   if (Options.FloatABIType == FloatABI::Default)
     this->Options.FloatABIType =
         Subtarget.isTargetHardFloat() ? FloatABI::Hard : FloatABI::Soft;
 }

 ARMBaseTargetMachine::~ARMBaseTargetMachine() {}

 const ARMSubtarget *
 ARMBaseTargetMachine::getSubtargetImpl(const Function &F) const {
   Attribute CPUAttr = F.getFnAttribute("target-cpu");
   Attribute FSAttr = F.getFnAttribute("target-features");

   std::string CPU = !CPUAttr.hasAttribute(Attribute::None)
                         ? CPUAttr.getValueAsString().str()
                         : TargetCPU;
   std::string FS = !FSAttr.hasAttribute(Attribute::None)
                        ? FSAttr.getValueAsString().str()
                        : TargetFS;

   // FIXME: This is related to the code below to reset the target options,
   // we need to know whether or not the soft float flag is set on the
   // function before we can generate a subtarget. We also need to use
   // it as a key for the subtarget since that can be the only difference
   // between two functions.
   bool SoftFloat =
       F.hasFnAttribute("use-soft-float") &&
       F.getFnAttribute("use-soft-float").getValueAsString() == "true";
   // If the soft float attribute is set on the function turn on the soft float
   // subtarget feature.
   if (SoftFloat)
     FS += FS.empty() ? "+soft-float" : ",+soft-float";

   auto &I = SubtargetMap[CPU + FS];
   if (!I) {
     // This needs to be done before we create a new subtarget since any
     // creation will depend on the TM and the code generation flags on the
     // function that reside in TargetOptions.
     resetTargetOptions(F);
     I = llvm::make_unique<ARMSubtarget>(TargetTriple, CPU, FS, *this, isLittle);
   }
   return I.get();
 }

 TargetIRAnalysis ARMBaseTargetMachine::getTargetIRAnalysis() {
   return TargetIRAnalysis(
       [this](Function &F) { return TargetTransformInfo(ARMTTIImpl(this, F)); });
 }


 void ARMTargetMachine::anchor() { }

 ARMTargetMachine::ARMTargetMachine(const Target &T, const Triple &TT,
                                    StringRef CPU, StringRef FS,
                                    const TargetOptions &Options,
                                    Reloc::Model RM, CodeModel::Model CM,
                                    CodeGenOpt::Level OL, bool isLittle)
     : ARMBaseTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, isLittle) {
   initAsmInfo();
   if (!Subtarget.hasARMOps())
     report_fatal_error("CPU: '" + Subtarget.getCPUString() + "' does not "
                        "support ARM mode execution!");
 }

 void ARMLETargetMachine::anchor() { }

 ARMLETargetMachine::ARMLETargetMachine(const Target &T, const Triple &TT,
                                        StringRef CPU, StringRef FS,
                                        const TargetOptions &Options,
                                        Reloc::Model RM, CodeModel::Model CM,
                                        CodeGenOpt::Level OL)
     : ARMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {}

 void ARMBETargetMachine::anchor() { }

 ARMBETargetMachine::ARMBETargetMachine(const Target &T, const Triple &TT,
                                        StringRef CPU, StringRef FS,
                                        const TargetOptions &Options,
                                        Reloc::Model RM, CodeModel::Model CM,
                                        CodeGenOpt::Level OL)
     : ARMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {}

 void ThumbTargetMachine::anchor() { }

 ThumbTargetMachine::ThumbTargetMachine(const Target &T, const Triple &TT,
                                        StringRef CPU, StringRef FS,
                                        const TargetOptions &Options,
                                        Reloc::Model RM, CodeModel::Model CM,
                                        CodeGenOpt::Level OL, bool isLittle)
     : ARMBaseTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, isLittle) {
   initAsmInfo();
 }

 void ThumbLETargetMachine::anchor() { }

 ThumbLETargetMachine::ThumbLETargetMachine(const Target &T, const Triple &TT,
                                            StringRef CPU, StringRef FS,
                                            const TargetOptions &Options,
                                            Reloc::Model RM, CodeModel::Model CM,
                                            CodeGenOpt::Level OL)
     : ThumbTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {}

 void ThumbBETargetMachine::anchor() { }

 ThumbBETargetMachine::ThumbBETargetMachine(const Target &T, const Triple &TT,
                                            StringRef CPU, StringRef FS,
                                            const TargetOptions &Options,
                                            Reloc::Model RM, CodeModel::Model CM,
                                            CodeGenOpt::Level OL)
     : ThumbTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {}

 namespace {
 /// ARM Code Generator Pass Configuration Options.
 class ARMPassConfig : public TargetPassConfig {
 public:
   ARMPassConfig(ARMBaseTargetMachine *TM, PassManagerBase &PM)
     : TargetPassConfig(TM, PM) {}

   ARMBaseTargetMachine &getARMTargetMachine() const {
     return getTM<ARMBaseTargetMachine>();
   }

   void addIRPasses() override;
   bool addPreISel() override;
   bool addInstSelector() override;
   void addPreRegAlloc() override;
   void addPreSched2() override;
   void addPreEmitPass() override;
 };
 } // namespace

 TargetPassConfig *ARMBaseTargetMachine::createPassConfig(PassManagerBase &PM) {
   return new ARMPassConfig(this, PM);
 }

 void ARMPassConfig::addIRPasses() {
   if (TM->Options.ThreadModel == ThreadModel::Single)
     addPass(createLowerAtomicPass());
   else
     addPass(createAtomicExpandPass(TM));

   // Cmpxchg instructions are often used with a subsequent comparison to
   // determine whether it succeeded. We can exploit existing control-flow in
   // ldrex/strex loops to simplify this, but it needs tidying up.
   if (TM->getOptLevel() != CodeGenOpt::None && EnableAtomicTidy)
     addPass(createCFGSimplificationPass(-1, [this](const Function &F) {
       const auto &ST = this->TM->getSubtarget<ARMSubtarget>(F);
       return ST.hasAnyDataBarrier() && !ST.isThumb1Only();
     }));

   TargetPassConfig::addIRPasses();

   // Match interleaved memory accesses to ldN/stN intrinsics.
   if (TM->getOptLevel() != CodeGenOpt::None)
     addPass(createInterleavedAccessPass(TM));
 }

 bool ARMPassConfig::addPreISel() {
   if ((TM->getOptLevel() != CodeGenOpt::None &&
        EnableGlobalMerge == cl::BOU_UNSET) ||
       EnableGlobalMerge == cl::BOU_TRUE) {
     // FIXME: This is using the thumb1 only constant value for
     // maximal global offset for merging globals. We may want
     // to look into using the old value for non-thumb1 code of
     // 4095 based on the TargetMachine, but this starts to become
     // tricky when doing code gen per function.
     bool OnlyOptimizeForSize = (TM->getOptLevel() < CodeGenOpt::Aggressive) &&
                                (EnableGlobalMerge == cl::BOU_UNSET);
     addPass(createGlobalMergePass(TM, 127, OnlyOptimizeForSize));
   }

   return false;
 }

 bool ARMPassConfig::addInstSelector() {
   addPass(createARMISelDag(getARMTargetMachine(), getOptLevel()));

   if (TM->getTargetTriple().isOSBinFormatELF() && TM->Options.EnableFastISel)
     addPass(createARMGlobalBaseRegPass());
   return false;
 }

 void ARMPassConfig::addPreRegAlloc() {
   if (getOptLevel() != CodeGenOpt::None) {
     addPass(createMLxExpansionPass());

     if (EnableARMLoadStoreOpt)
       addPass(createARMLoadStoreOptimizationPass(/* pre-register alloc */ true));

     if (!DisableA15SDOptimization)
       addPass(createA15SDOptimizerPass());
   }
 }

 void ARMPassConfig::addPreSched2() {
   if (getOptLevel() != CodeGenOpt::None) {
     if (EnableARMLoadStoreOpt)
       addPass(createARMLoadStoreOptimizationPass());

     addPass(createExecutionDependencyFixPass(&ARM::DPRRegClass));
   }

   // Expand some pseudo instructions into multiple instructions to allow
   // proper scheduling.
   addPass(createARMExpandPseudoPass());

   if (getOptLevel() != CodeGenOpt::None) {
     // in v8, IfConversion depends on Thumb instruction widths
     addPass(createThumb2SizeReductionPass([this](const Function &F) {
       return this->TM->getSubtarget<ARMSubtarget>(F).restrictIT();
     }));

     addPass(createIfConverter([this](const Function &F) {
       return !this->TM->getSubtarget<ARMSubtarget>(F).isThumb1Only();
     }));
   }
   addPass(createThumb2ITBlockPass());
 }

 void ARMPassConfig::addPreEmitPass() {
   addPass(createThumb2SizeReductionPass());

   // Constant island pass work on unbundled instructions.
   addPass(createUnpackMachineBundles([this](const Function &F) {
     return this->TM->getSubtarget<ARMSubtarget>(F).isThumb2();
   }));

   // Don't optimize barriers at -O0.
   if (getOptLevel() != CodeGenOpt::None)
     addPass(createARMOptimizeBarriersPass());

   addPass(createARMConstantIslandPass());
 }
	//===-- ARMTargetMachine.cpp - Define TargetMachine for ARM ---------------===//
	//
	// The LLVM Compiler Infrastructure
	//
	// This file is distributed under the University of Illinois Open Source
	// License. See LICENSE.TXT for details.
	//
	//===----------------------------------------------------------------------===//
	//
	//
	//===----------------------------------------------------------------------===//

	#include "ARM.h"
	#include "ARMFrameLowering.h"
	#include "ARMTargetMachine.h"
	#include "ARMTargetObjectFile.h"
	#include "ARMTargetTransformInfo.h"
	#include "llvm/CodeGen/Passes.h"
	#include "llvm/IR/Function.h"
	#include "llvm/IR/LegacyPassManager.h"
	#include "llvm/MC/MCAsmInfo.h"
	#include "llvm/Support/CommandLine.h"
	#include "llvm/Support/FormattedStream.h"
	#include "llvm/Support/TargetRegistry.h"
	#include "llvm/Target/TargetOptions.h"
	#include "llvm/Transforms/Scalar.h"
	using namespace llvm;

	static cl::opt<bool>
	DisableA15SDOptimization("disable-a15-sd-optimization", cl::Hidden,
	cl::desc("Inhibit optimization of S->D register accesses on A15"),
	cl::init(false));

	static cl::opt<bool>
	EnableAtomicTidy("arm-atomic-cfg-tidy", cl::Hidden,
	cl::desc("Run SimplifyCFG after expanding atomic operations"
	" to make use of cmpxchg flow-based information"),
	cl::init(true));

	static cl::opt<bool>
	EnableARMLoadStoreOpt("arm-load-store-opt", cl::Hidden,
	cl::desc("Enable ARM load/store optimization pass"),
	cl::init(true));

	// FIXME: Unify control over GlobalMerge.
	static cl::opt<cl::boolOrDefault>
	EnableGlobalMerge("arm-global-merge", cl::Hidden,
	cl::desc("Enable the global merge pass"));

	extern "C" void LLVMInitializeARMTarget() {
	// Register the target.
	RegisterTargetMachine<ARMLETargetMachine> X(TheARMLETarget);
	RegisterTargetMachine<ARMBETargetMachine> Y(TheARMBETarget);
	RegisterTargetMachine<ThumbLETargetMachine> A(TheThumbLETarget);
	RegisterTargetMachine<ThumbBETargetMachine> B(TheThumbBETarget);
	}

	static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) {
	if (TT.isOSBinFormatMachO())
	return make_unique<TargetLoweringObjectFileMachO>();
	if (TT.isOSWindows())
	return make_unique<TargetLoweringObjectFileCOFF>();
	return make_unique<ARMElfTargetObjectFile>();
	}

	static ARMBaseTargetMachine::ARMABI
	computeTargetABI(const Triple &TT, StringRef CPU,
	const TargetOptions &Options) {
	if (Options.MCOptions.getABIName().startswith("aapcs"))
	return ARMBaseTargetMachine::ARM_ABI_AAPCS;
	else if (Options.MCOptions.getABIName().startswith("apcs"))
	return ARMBaseTargetMachine::ARM_ABI_APCS;

	assert(Options.MCOptions.getABIName().empty() &&
	"Unknown target-abi option!");

	ARMBaseTargetMachine::ARMABI TargetABI =
	ARMBaseTargetMachine::ARM_ABI_UNKNOWN;

	// FIXME: This is duplicated code from the front end and should be unified.
	if (TT.isOSBinFormatMachO()) {
	if (TT.getEnvironment() == llvm::Triple::EABI \|\|
	(TT.getOS() == llvm::Triple::UnknownOS && TT.isOSBinFormatMachO()) \|\|
	CPU.startswith("cortex-m")) {
	TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
	} else {
	TargetABI = ARMBaseTargetMachine::ARM_ABI_APCS;
	}
	} else if (TT.isOSWindows()) {
	// FIXME: this is invalid for WindowsCE
	TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
	} else {
	// Select the default based on the platform.
	switch (TT.getEnvironment()) {
	case llvm::Triple::Android:
	case llvm::Triple::GNUEABI:
	case llvm::Triple::GNUEABIHF:
	case llvm::Triple::EABIHF:
	case llvm::Triple::EABI:
	TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
	break;
	case llvm::Triple::GNU:
	TargetABI = ARMBaseTargetMachine::ARM_ABI_APCS;
	break;
	default:
	if (TT.isOSNetBSD())
	TargetABI = ARMBaseTargetMachine::ARM_ABI_APCS;
	else
	TargetABI = ARMBaseTargetMachine::ARM_ABI_AAPCS;
	break;
	}
	}

	return TargetABI;
	}

	static std::string computeDataLayout(const Triple &TT, StringRef CPU,
	const TargetOptions &Options,
	bool isLittle) {
	auto ABI = computeTargetABI(TT, CPU, Options);
	std::string Ret = "";

	if (isLittle)
	// Little endian.
	Ret += "e";
	else
	// Big endian.
	Ret += "E";

	Ret += DataLayout::getManglingComponent(TT);

	// Pointers are 32 bits and aligned to 32 bits.
	Ret += "-p:32:32";

	// ABIs other than APCS have 64 bit integers with natural alignment.
	if (ABI != ARMBaseTargetMachine::ARM_ABI_APCS)
	Ret += "-i64:64";

	// We have 64 bits floats. The APCS ABI requires them to be aligned to 32
	// bits, others to 64 bits. We always try to align to 64 bits.
	if (ABI == ARMBaseTargetMachine::ARM_ABI_APCS)
	Ret += "-f64:32:64";

	// We have 128 and 64 bit vectors. The APCS ABI aligns them to 32 bits, others
	// to 64. We always ty to give them natural alignment.
	if (ABI == ARMBaseTargetMachine::ARM_ABI_APCS)
	Ret += "-v64:32:64-v128:32:128";
	else
	Ret += "-v128:64:128";

	// Try to align aggregates to 32 bits (the default is 64 bits, which has no
	// particular hardware support on 32-bit ARM).
	Ret += "-a:0:32";

	// Integer registers are 32 bits.
	Ret += "-n32";

	// The stack is 128 bit aligned on NaCl, 64 bit aligned on AAPCS and 32 bit
	// aligned everywhere else.
	if (TT.isOSNaCl())
	Ret += "-S128";
	else if (ABI == ARMBaseTargetMachine::ARM_ABI_AAPCS)
	Ret += "-S64";
	else
	Ret += "-S32";

	return Ret;
	}

	/// TargetMachine ctor - Create an ARM architecture model.
	///
	ARMBaseTargetMachine::ARMBaseTargetMachine(const Target &T, const Triple &TT,
	StringRef CPU, StringRef FS,
	const TargetOptions &Options,
	Reloc::Model RM, CodeModel::Model CM,
	CodeGenOpt::Level OL, bool isLittle)
	: LLVMTargetMachine(T, computeDataLayout(TT, CPU, Options, isLittle), TT,
	CPU, FS, Options, RM, CM, OL),
	TargetABI(computeTargetABI(TT, CPU, Options)),
	TLOF(createTLOF(getTargetTriple())),
	Subtarget(TT, CPU, FS, *this, isLittle), isLittle(isLittle) {

	// Default to triple-appropriate float ABI
	if (Options.FloatABIType == FloatABI::Default)
	this->Options.FloatABIType =
	Subtarget.isTargetHardFloat() ? FloatABI::Hard : FloatABI::Soft;
	}

	ARMBaseTargetMachine::~ARMBaseTargetMachine() {}

	const ARMSubtarget *
	ARMBaseTargetMachine::getSubtargetImpl(const Function &F) const {
	Attribute CPUAttr = F.getFnAttribute("target-cpu");
	Attribute FSAttr = F.getFnAttribute("target-features");

	std::string CPU = !CPUAttr.hasAttribute(Attribute::None)
	? CPUAttr.getValueAsString().str()
	: TargetCPU;
	std::string FS = !FSAttr.hasAttribute(Attribute::None)
	? FSAttr.getValueAsString().str()
	: TargetFS;

	// FIXME: This is related to the code below to reset the target options,
	// we need to know whether or not the soft float flag is set on the
	// function before we can generate a subtarget. We also need to use
	// it as a key for the subtarget since that can be the only difference
	// between two functions.
	bool SoftFloat =
	F.hasFnAttribute("use-soft-float") &&
	F.getFnAttribute("use-soft-float").getValueAsString() == "true";
	// If the soft float attribute is set on the function turn on the soft float
	// subtarget feature.
	if (SoftFloat)
	FS += FS.empty() ? "+soft-float" : ",+soft-float";

	auto &I = SubtargetMap[CPU + FS];
	if (!I) {
	// This needs to be done before we create a new subtarget since any
	// creation will depend on the TM and the code generation flags on the
	// function that reside in TargetOptions.
	resetTargetOptions(F);
	I = llvm::make_unique<ARMSubtarget>(TargetTriple, CPU, FS, *this, isLittle);
	}
	return I.get();
	}

	TargetIRAnalysis ARMBaseTargetMachine::getTargetIRAnalysis() {
	return TargetIRAnalysis(
	[this](Function &F) { return TargetTransformInfo(ARMTTIImpl(this, F)); });
	}


	void ARMTargetMachine::anchor() { }

	ARMTargetMachine::ARMTargetMachine(const Target &T, const Triple &TT,
	StringRef CPU, StringRef FS,
	const TargetOptions &Options,
	Reloc::Model RM, CodeModel::Model CM,
	CodeGenOpt::Level OL, bool isLittle)
	: ARMBaseTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, isLittle) {
	initAsmInfo();
	if (!Subtarget.hasARMOps())
	report_fatal_error("CPU: '" + Subtarget.getCPUString() + "' does not "
	"support ARM mode execution!");
	}

	void ARMLETargetMachine::anchor() { }

	ARMLETargetMachine::ARMLETargetMachine(const Target &T, const Triple &TT,
	StringRef CPU, StringRef FS,
	const TargetOptions &Options,
	Reloc::Model RM, CodeModel::Model CM,
	CodeGenOpt::Level OL)
	: ARMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {}

	void ARMBETargetMachine::anchor() { }

	ARMBETargetMachine::ARMBETargetMachine(const Target &T, const Triple &TT,
	StringRef CPU, StringRef FS,
	const TargetOptions &Options,
	Reloc::Model RM, CodeModel::Model CM,
	CodeGenOpt::Level OL)
	: ARMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {}

	void ThumbTargetMachine::anchor() { }

	ThumbTargetMachine::ThumbTargetMachine(const Target &T, const Triple &TT,
	StringRef CPU, StringRef FS,
	const TargetOptions &Options,
	Reloc::Model RM, CodeModel::Model CM,
	CodeGenOpt::Level OL, bool isLittle)
	: ARMBaseTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, isLittle) {
	initAsmInfo();
	}

	void ThumbLETargetMachine::anchor() { }

	ThumbLETargetMachine::ThumbLETargetMachine(const Target &T, const Triple &TT,
	StringRef CPU, StringRef FS,
	const TargetOptions &Options,
	Reloc::Model RM, CodeModel::Model CM,
	CodeGenOpt::Level OL)
	: ThumbTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {}

	void ThumbBETargetMachine::anchor() { }

	ThumbBETargetMachine::ThumbBETargetMachine(const Target &T, const Triple &TT,
	StringRef CPU, StringRef FS,
	const TargetOptions &Options,
	Reloc::Model RM, CodeModel::Model CM,
	CodeGenOpt::Level OL)
	: ThumbTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {}

	namespace {
	/// ARM Code Generator Pass Configuration Options.
	class ARMPassConfig : public TargetPassConfig {
	public:
	ARMPassConfig(ARMBaseTargetMachine *TM, PassManagerBase &PM)
	: TargetPassConfig(TM, PM) {}

	ARMBaseTargetMachine &getARMTargetMachine() const {
	return getTM<ARMBaseTargetMachine>();
	}

	void addIRPasses() override;
	bool addPreISel() override;
	bool addInstSelector() override;
	void addPreRegAlloc() override;
	void addPreSched2() override;
	void addPreEmitPass() override;
	};
	} // namespace

	TargetPassConfig *ARMBaseTargetMachine::createPassConfig(PassManagerBase &PM) {
	return new ARMPassConfig(this, PM);
	}

	void ARMPassConfig::addIRPasses() {
	if (TM->Options.ThreadModel == ThreadModel::Single)
	addPass(createLowerAtomicPass());
	else
	addPass(createAtomicExpandPass(TM));

	// Cmpxchg instructions are often used with a subsequent comparison to
	// determine whether it succeeded. We can exploit existing control-flow in
	// ldrex/strex loops to simplify this, but it needs tidying up.
	if (TM->getOptLevel() != CodeGenOpt::None && EnableAtomicTidy)
	addPass(createCFGSimplificationPass(-1, [this](const Function &F) {
	const auto &ST = this->TM->getSubtarget<ARMSubtarget>(F);
	return ST.hasAnyDataBarrier() && !ST.isThumb1Only();
	}));

	TargetPassConfig::addIRPasses();

	// Match interleaved memory accesses to ldN/stN intrinsics.
	if (TM->getOptLevel() != CodeGenOpt::None)
	addPass(createInterleavedAccessPass(TM));
	}

	bool ARMPassConfig::addPreISel() {
	if ((TM->getOptLevel() != CodeGenOpt::None &&
	EnableGlobalMerge == cl::BOU_UNSET) \|\|
	EnableGlobalMerge == cl::BOU_TRUE) {
	// FIXME: This is using the thumb1 only constant value for
	// maximal global offset for merging globals. We may want
	// to look into using the old value for non-thumb1 code of
	// 4095 based on the TargetMachine, but this starts to become
	// tricky when doing code gen per function.
	bool OnlyOptimizeForSize = (TM->getOptLevel() < CodeGenOpt::Aggressive) &&
	(EnableGlobalMerge == cl::BOU_UNSET);
	addPass(createGlobalMergePass(TM, 127, OnlyOptimizeForSize));
	}

	return false;
	}

	bool ARMPassConfig::addInstSelector() {
	addPass(createARMISelDag(getARMTargetMachine(), getOptLevel()));

	if (TM->getTargetTriple().isOSBinFormatELF() && TM->Options.EnableFastISel)
	addPass(createARMGlobalBaseRegPass());
	return false;
	}

	void ARMPassConfig::addPreRegAlloc() {
	if (getOptLevel() != CodeGenOpt::None) {
	addPass(createMLxExpansionPass());

	if (EnableARMLoadStoreOpt)
	addPass(createARMLoadStoreOptimizationPass(/* pre-register alloc */ true));

	if (!DisableA15SDOptimization)
	addPass(createA15SDOptimizerPass());
	}
	}

	void ARMPassConfig::addPreSched2() {
	if (getOptLevel() != CodeGenOpt::None) {
	if (EnableARMLoadStoreOpt)
	addPass(createARMLoadStoreOptimizationPass());

	addPass(createExecutionDependencyFixPass(&ARM::DPRRegClass));
	}

	// Expand some pseudo instructions into multiple instructions to allow
	// proper scheduling.
	addPass(createARMExpandPseudoPass());

	if (getOptLevel() != CodeGenOpt::None) {
	// in v8, IfConversion depends on Thumb instruction widths
	addPass(createThumb2SizeReductionPass([this](const Function &F) {
	return this->TM->getSubtarget<ARMSubtarget>(F).restrictIT();
	}));

	addPass(createIfConverter([this](const Function &F) {
	return !this->TM->getSubtarget<ARMSubtarget>(F).isThumb1Only();
	}));
	}
	addPass(createThumb2ITBlockPass());
	}

	void ARMPassConfig::addPreEmitPass() {
	addPass(createThumb2SizeReductionPass());

	// Constant island pass work on unbundled instructions.
	addPass(createUnpackMachineBundles([this](const Function &F) {
	return this->TM->getSubtarget<ARMSubtarget>(F).isThumb2();
	}));

	// Don't optimize barriers at -O0.
	if (getOptLevel() != CodeGenOpt::None)
	addPass(createARMOptimizeBarriersPass());

	addPass(createARMConstantIslandPass());
	}