UseFusedMulOps("arm-use-mulops",
cl::init(true), cl::Hidden);
+namespace {
enum AlignMode {
  DefaultAlign,
  StrictAlign,
  NoStrictAlign
};
+}
static cl::opt<AlignMode>
Align(cl::desc("Load/store alignment support"),
InThumbMode = false;
HasThumb2 = false;
NoARM = false;
- PostRAScheduler = false;
IsR9Reserved = ReserveR9;
UseMovt = false;
SupportsTailCall = false;
SupportsTailCall = !isThumb1Only();
}
-  if (!isThumb() || hasThumb2())
-    PostRAScheduler = true;
-
switch (Align) {
case DefaultAlign:
// Assume pre-ARMv6 doesn't support unaligned accesses.
!getTargetTriple().isOSVersionLT(7, 0);
}
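
A minimal standalone sketch of what the three AlignMode values are meant to select, using a hypothetical allowsUnalignedMem helper and a made-up HasV6OrLater flag rather than the real subtarget query; it assumes DefaultAlign falls back to the hardware/OS check suggested by the comment above:

    // Hypothetical model of the three AlignMode values; not the patch's code.
    // StrictAlign forbids unaligned accesses, NoStrictAlign always allows them,
    // and DefaultAlign guesses from the architecture (pre-ARMv6 is assumed not
    // to support unaligned accesses).
    #include <cassert>

    enum AlignMode { DefaultAlign, StrictAlign, NoStrictAlign };

    bool allowsUnalignedMem(AlignMode Mode, bool HasV6OrLater) {
      switch (Mode) {
      case StrictAlign:   return false;
      case NoStrictAlign: return true;
      case DefaultAlign:  return HasV6OrLater;
      }
      return false;
    }

    int main() {
      assert(!allowsUnalignedMem(StrictAlign, true));
      assert(allowsUnalignedMem(NoStrictAlign, false));
      assert(allowsUnalignedMem(DefaultAlign, true));
      assert(!allowsUnalignedMem(DefaultAlign, false));
    }
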
-// Enable the PostMachineScheduler if the target selects it instead of
-// PostRAScheduler. Currently only available on the command line via
-// -misched-postra.
+// This overrides the PostRAScheduler bit in the SchedModel for any CPU.
bool ARMSubtarget::enablePostMachineScheduler() const {
- return PostRAScheduler;
+ return (!isThumb() || hasThumb2());
}
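
The new return value encodes a simple truth table: the post-RA machine scheduler is enabled for ARM-mode cores and for Thumb cores with Thumb2, and disabled only for Thumb1-only targets. A standalone sketch of that predicate, with plain stand-in booleans rather than the ARMSubtarget API:

    #include <cassert>

    // Mirrors (!isThumb() || hasThumb2()) with plain booleans (stand-ins only).
    static bool enablePostMachineSched(bool IsThumb, bool HasThumb2) {
      return !IsThumb || HasThumb2;
    }

    int main() {
      assert(enablePostMachineSched(false, false));  // ARM mode: enabled
      assert(enablePostMachineSched(true, true));    // Thumb2: enabled
      assert(!enablePostMachineSched(true, false));  // Thumb1-only: disabled
    }
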
bool ARMSubtarget::enableAtomicExpandLoadLinked() const {
return hasAnyDataBarrier() && !isThumb1Only();
}
-bool ARMSubtarget::enablePostRAScheduler(
-    CodeGenOpt::Level OptLevel,
-    TargetSubtargetInfo::AntiDepBreakMode& Mode,
-    RegClassVector& CriticalPathRCs) const {
-  Mode = TargetSubtargetInfo::ANTIDEP_NONE;
-  return PostRAScheduler && OptLevel >= CodeGenOpt::Default;
-}
-
bool ARMSubtarget::useMovt(const MachineFunction &MF) const {
  // NOTE Windows on ARM needs to use movw/movt pairs to materialise 32-bit
  // immediates as it is inherently position independent, and may be out of
  // range otherwise.
  return UseMovt && (isTargetWindows() ||
                     !MF.getFunction()->getAttributes().hasAttribute(
                         AttributeSet::FunctionIndex, Attribute::MinSize));
}
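
The return expression reduces to: honour the UseMovt setting, and additionally skip movw/movt pairs for functions marked minsize, except on Windows where the pair is required for position independence. A standalone sketch of that decision with plain booleans and a hypothetical helper, not the real API:

    #include <cassert>

    // Mirrors UseMovt && (isTargetWindows() || !MinSize) with stand-in booleans.
    static bool useMovwMovt(bool UseMovt, bool IsWindows, bool MinSize) {
      return UseMovt && (IsWindows || !MinSize);
    }

    int main() {
      assert(useMovwMovt(true, true, true));    // Windows: pair even at minsize
      assert(!useMovwMovt(true, false, true));  // minsize elsewhere: prefer smaller code
      assert(useMovwMovt(true, false, false));  // normal case: use the pair
      assert(!useMovwMovt(false, true, false)); // movw/movt disabled or unavailable
    }
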
-
-bool ARMSubtarget::shouldCoalesce(MachineInstr *MI,
-                                  const TargetRegisterClass *SrcRC,
-                                  unsigned SubReg,
-                                  const TargetRegisterClass *DstRC,
-                                  unsigned DstSubReg,
-                                  const TargetRegisterClass *NewRC) const {
-  auto MBB = MI->getParent();
-  auto MF = MBB->getParent();
-  const MachineRegisterInfo &MRI = MF->getRegInfo();
-  // If not copying into a sub-register this should be ok because we shouldn't
-  // need to split the reg.
-  if (!DstSubReg)
-    return true;
-  // Small registers don't frequently cause a problem, so we can coalesce them.
-  if (NewRC->getSize() < 32 && DstRC->getSize() < 32 && SrcRC->getSize() < 32)
-    return true;
-
-  auto NewRCWeight =
-      MRI.getTargetRegisterInfo()->getRegClassWeight(NewRC);
-  auto SrcRCWeight =
-      MRI.getTargetRegisterInfo()->getRegClassWeight(SrcRC);
-  auto DstRCWeight =
-      MRI.getTargetRegisterInfo()->getRegClassWeight(DstRC);
-  // If the source register class is more expensive than the destination, the
-  // coalescing is probably profitable.
-  if (SrcRCWeight.RegWeight > NewRCWeight.RegWeight)
-    return true;
-  if (DstRCWeight.RegWeight > NewRCWeight.RegWeight)
-    return true;
-
-  // If the register allocator isn't constrained, we can always allow coalescing
-  // unfortunately we don't know yet if we will be constrained.
-  // The goal of this heuristic is to restrict how many expensive registers
-  // we allow to coalesce in a given basic block.
-  auto AFI = MF->getInfo<ARMFunctionInfo>();
-  auto It = AFI->getCoalescedWeight(MBB);
-
-  DEBUG(dbgs() << "\tARM::shouldCoalesce - Coalesced Weight: " << It->second << "\n");
-  DEBUG(dbgs() << "\tARM::shouldCoalesce - Reg Weight: " << NewRCWeight.RegWeight << "\n");
-  unsigned SizeMultiplier = MBB->size()/100;
-  SizeMultiplier = SizeMultiplier ? SizeMultiplier : 1;
-  if (It->second < NewRCWeight.WeightLimit * SizeMultiplier) {
-    It->second += NewRCWeight.RegWeight;
-    return true;
-  }
-  return false;
-}
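
The final block of the deleted hook implements a per-basic-block budget: expensive register classes may keep coalescing only while their accumulated weight stays under the class's weight limit scaled by block size (one extra unit of limit per 100 instructions). A standalone sketch of just that budget logic, with made-up types and numbers rather than LLVM's RegClassWeight API:

    #include <algorithm>
    #include <cassert>

    struct RegClassWeight { unsigned RegWeight, WeightLimit; };  // stand-in type

    // Charge the block's coalescing budget; allow while under the scaled limit.
    static bool allowCoalesce(unsigned &CoalescedWeight, const RegClassWeight &RC,
                              unsigned BlockSize) {
      unsigned SizeMultiplier = std::max(1u, BlockSize / 100);
      if (CoalescedWeight < RC.WeightLimit * SizeMultiplier) {
        CoalescedWeight += RC.RegWeight;
        return true;
      }
      return false;
    }

    int main() {
      unsigned Budget = 0;
      RegClassWeight BigRC{16, 32};               // made-up weight and limit
      assert(allowCoalesce(Budget, BigRC, 50));   // 0 < 32: allowed
      assert(allowCoalesce(Budget, BigRC, 50));   // 16 < 32: allowed
      assert(!allowCoalesce(Budget, BigRC, 50));  // 32 < 32 fails: rejected
    }
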