NFC: Fix indentation and add braces to clarify nested of else-statement.

[oota-llvm.git] / lib / Target / ARM / ARMLoadStoreOptimizer.cpp
diff --git a/lib/Target/ARM/ARMLoadStoreOptimizer.cpp b/lib/Target/ARM/ARMLoadStoreOptimizer.cpp

index c64c190ed158a922ffc596864be72e5ff15e5da2..d099deda26cd65ea22043d5d4c191f295ae28087 100644 (file)
--- a/lib/Target/ARM/ARMLoadStoreOptimizer.cpp
+++ b/lib/Target/ARM/ARMLoadStoreOptimizer.cpp
@@ -60,17 +60,24 @@ STATISTIC(NumSTRD2STM,  "Number of strd instructions turned back into stm");
  STATISTIC(NumLDRD2LDR,  "Number of ldrd instructions turned back into ldr's");
  STATISTIC(NumSTRD2STR,  "Number of strd instructions turned back into str's");
  
+namespace llvm {
+void initializeARMLoadStoreOptPass(PassRegistry &);
+}
+
+#define ARM_LOAD_STORE_OPT_NAME "ARM load / store optimization pass"
+
  namespace {
    /// Post- register allocation pass the combine load / store instructions to
    /// form ldm / stm instructions.
    struct ARMLoadStoreOpt : public MachineFunctionPass {
      static char ID;
-    ARMLoadStoreOpt() : MachineFunctionPass(ID) {}
+    ARMLoadStoreOpt() : MachineFunctionPass(ID) {
+      initializeARMLoadStoreOptPass(*PassRegistry::getPassRegistry());
+    }
  
      const MachineFunction *MF;
      const TargetInstrInfo *TII;
      const TargetRegisterInfo *TRI;
-    const MachineRegisterInfo *MRI;
      const ARMSubtarget *STI;
      const TargetLowering *TL;
      ARMFunctionInfo *AFI;
@@ -84,7 +91,7 @@ namespace {
      bool runOnMachineFunction(MachineFunction &Fn) override;
  
      const char *getPassName() const override {
-      return "ARM load / store optimization pass";
+      return ARM_LOAD_STORE_OPT_NAME;
      }
  
    private:
@@ -116,7 +123,7 @@ namespace {
        /// Whether the instructions can be merged into a ldrd/strd instruction.
        bool CanMergeToLSDouble;
      };
-    BumpPtrAllocator Allocator;
+    SpecificBumpPtrAllocator<MergeCandidate> Allocator;
      SmallVector<const MergeCandidate*,4> Candidates;
      SmallVector<MachineInstr*,4> MergeBaseCandidates;
  
@@ -148,6 +155,8 @@ namespace {
    char ARMLoadStoreOpt::ID = 0;
  }
  
+INITIALIZE_PASS(ARMLoadStoreOpt, "arm-load-store-opt", ARM_LOAD_STORE_OPT_NAME, false, false)
+
  static bool definesCPSR(const MachineInstr *MI) {
    for (const auto &MO : MI->operands()) {
      if (!MO.isReg())
@@ -786,6 +795,7 @@ MachineInstr *ARMLoadStoreOpt::MergeOpsUpdate(const MergeCandidate &Cand) {
    SmallVector<std::pair<unsigned, bool>, 8> Regs;
    SmallVector<unsigned, 4> ImpDefs;
    DenseSet<unsigned> KilledRegs;
+  DenseSet<unsigned> UsedRegs;
    // Determine list of registers and list of implicit super-register defs.
    for (const MachineInstr *MI : Cand.Instrs) {
      const MachineOperand &MO = getLoadStoreRegOp(*MI);
@@ -794,6 +804,7 @@ MachineInstr *ARMLoadStoreOpt::MergeOpsUpdate(const MergeCandidate &Cand) {
      if (IsKill)
        KilledRegs.insert(Reg);
      Regs.push_back(std::make_pair(Reg, IsKill));
+    UsedRegs.insert(Reg);
  
      if (IsLoad) {
        // Collect any implicit defs of super-registers, after merging we can't
@@ -883,7 +894,7 @@ MachineInstr *ARMLoadStoreOpt::MergeOpsUpdate(const MergeCandidate &Cand) {
        for (MachineOperand &MO : MI.uses()) {
          if (!MO.isReg() || !MO.isKill())
            continue;
-        if (KilledRegs.count(MO.getReg()))
+        if (UsedRegs.count(MO.getReg()))
            MO.setIsKill(false);
        }
      }
@@ -906,25 +917,6 @@ void ARMLoadStoreOpt::FormCandidates(const MemOpQueue &MemOps) {
    unsigned Opcode = FirstMI->getOpcode();
    bool isNotVFP = isi32Load(Opcode) || isi32Store(Opcode);
    unsigned Size = getLSMultipleTransferSize(FirstMI);
-  // vldm / vstm limit are 32 for S variants, 16 for D variants.
-  unsigned Limit;
-  switch (Opcode) {
-  default:
-    Limit = UINT_MAX;
-    break;
-  case ARM::VSTRS:
-    Limit = 32;
-    break;
-  case ARM::VSTRD:
-    Limit = 16;
-    break;
-  case ARM::VLDRD:
-    Limit = 16;
-    break;
-  case ARM::VLDRS:
-    Limit = 32;
-    break;
-  }
  
    unsigned SIndex = 0;
    unsigned EIndex = MemOps.size();
@@ -952,6 +944,11 @@ void ARMLoadStoreOpt::FormCandidates(const MemOpQueue &MemOps) {
      if (STI->isSwift() && !isNotVFP && (PRegNum % 2) == 1)
        CanMergeToLSMulti = false;
  
+    // LDRD/STRD do not allow SP/PC. LDM/STM do not support it or have it
+    // deprecated; LDM to PC is fine but cannot happen here.
+    if (PReg == ARM::SP || PReg == ARM::PC)
+      CanMergeToLSMulti = CanMergeToLSDouble = false;
+
      // Merge following instructions where possible.
      for (unsigned I = SIndex+1; I < EIndex; ++I, ++Count) {
        int NewOffset = MemOps[I].Offset;
@@ -959,16 +956,15 @@ void ARMLoadStoreOpt::FormCandidates(const MemOpQueue &MemOps) {
          break;
        const MachineOperand &MO = getLoadStoreRegOp(*MemOps[I].MI);
        unsigned Reg = MO.getReg();
-      unsigned RegNum = MO.isUndef() ? UINT_MAX : TRI->getEncodingValue(Reg);
+      if (Reg == ARM::SP || Reg == ARM::PC)
+        break;
  
        // See if the current load/store may be part of a multi load/store.
+      unsigned RegNum = MO.isUndef() ? UINT_MAX : TRI->getEncodingValue(Reg);
        bool PartOfLSMulti = CanMergeToLSMulti;
        if (PartOfLSMulti) {
-        // Cannot load from SP
-        if (Reg == ARM::SP)
-          PartOfLSMulti = false;
          // Register numbers must be in ascending order.
-        else if (RegNum <= PRegNum)
+        if (RegNum <= PRegNum)
            PartOfLSMulti = false;
          // For VFP / NEON load/store multiples, the registers must be
          // consecutive and within the limit on the number of registers per
@@ -996,7 +992,7 @@ void ARMLoadStoreOpt::FormCandidates(const MemOpQueue &MemOps) {
      }
  
      // Form a candidate from the Ops collected so far.
-    MergeCandidate *Candidate = new(Allocator) MergeCandidate;
+    MergeCandidate *Candidate = new(Allocator.Allocate()) MergeCandidate;
      for (unsigned C = SIndex, CE = SIndex + Count; C < CE; ++C)
        Candidate->Instrs.push_back(MemOps[C].MI);
      Candidate->LatestMIIdx = Latest - SIndex;
@@ -1634,9 +1630,7 @@ bool ARMLoadStoreOpt::LoadStoreMultipleOpti(MachineBasicBlock &MBB) {
    MemOpQueue MemOps;
    unsigned CurrBase = 0;
    unsigned CurrOpc = ~0u;
-  unsigned CurrSize = 0;
    ARMCC::CondCodes CurrPred = ARMCC::AL;
-  unsigned CurrPredReg = 0;
    unsigned Position = 0;
    assert(Candidates.size() == 0);
    assert(MergeBaseCandidates.size() == 0);
@@ -1652,7 +1646,6 @@ bool ARMLoadStoreOpt::LoadStoreMultipleOpti(MachineBasicBlock &MBB) {
  
      if (isMemoryOp(MBBI)) {
        unsigned Opcode = MBBI->getOpcode();
-      unsigned Size = getLSMultipleTransferSize(MBBI);
        const MachineOperand &MO = MBBI->getOperand(0);
        unsigned Reg = MO.getReg();
        unsigned Base = getLoadStoreBaseOp(*MBBI).getReg();
@@ -1663,9 +1656,7 @@ bool ARMLoadStoreOpt::LoadStoreMultipleOpti(MachineBasicBlock &MBB) {
          // Start of a new chain.
          CurrBase = Base;
          CurrOpc  = Opcode;
-        CurrSize = Size;
          CurrPred = Pred;
-        CurrPredReg = PredReg;
          MemOps.push_back(MemOpQueueEntry(MBBI, Offset, Position));
          continue;
        }
@@ -1737,9 +1728,7 @@ bool ARMLoadStoreOpt::LoadStoreMultipleOpti(MachineBasicBlock &MBB) {
        // Reset for the next chain.
        CurrBase = 0;
        CurrOpc = ~0u;
-      CurrSize = 0;
        CurrPred = ARMCC::AL;
-      CurrPredReg = 0;
        MemOps.clear();
      }
    }
@@ -1835,7 +1824,7 @@ bool ARMLoadStoreOpt::runOnMachineFunction(MachineFunction &Fn) {
    AFI = Fn.getInfo<ARMFunctionInfo>();
    TII = STI->getInstrInfo();
    TRI = STI->getRegisterInfo();
-  MRI = &Fn.getRegInfo();
+
    RegClassInfoValid = false;
    isThumb2 = AFI->isThumb2Function();
    isThumb1 = AFI->isThumbFunction() && !isThumb2;
@@ -1849,16 +1838,25 @@ bool ARMLoadStoreOpt::runOnMachineFunction(MachineFunction &Fn) {
        Modified |= MergeReturnIntoLDM(MBB);
    }
  
-  Allocator.Reset();
+  Allocator.DestroyAll();
    return Modified;
  }
  
+namespace llvm {
+void initializeARMPreAllocLoadStoreOptPass(PassRegistry &);
+}
+
+#define ARM_PREALLOC_LOAD_STORE_OPT_NAME                                       \
+  "ARM pre- register allocation load / store optimization pass"
+
  namespace {
    /// Pre- register allocation pass that move load / stores from consecutive
    /// locations close to make it more likely they will be combined later.
    struct ARMPreAllocLoadStoreOpt : public MachineFunctionPass{
      static char ID;
-    ARMPreAllocLoadStoreOpt() : MachineFunctionPass(ID) {}
+    ARMPreAllocLoadStoreOpt() : MachineFunctionPass(ID) {
+      initializeARMPreAllocLoadStoreOptPass(*PassRegistry::getPassRegistry());
+    }
  
      const DataLayout *TD;
      const TargetInstrInfo *TII;
@@ -1870,7 +1868,7 @@ namespace {
      bool runOnMachineFunction(MachineFunction &Fn) override;
  
      const char *getPassName() const override {
-      return "ARM pre- register allocation load / store optimization pass";
+      return ARM_PREALLOC_LOAD_STORE_OPT_NAME;
      }
  
    private:
@@ -1889,8 +1887,11 @@ namespace {
    char ARMPreAllocLoadStoreOpt::ID = 0;
  }
  
+INITIALIZE_PASS(ARMPreAllocLoadStoreOpt, "arm-prera-load-store-opt",
+                ARM_PREALLOC_LOAD_STORE_OPT_NAME, false, false)
+
  bool ARMPreAllocLoadStoreOpt::runOnMachineFunction(MachineFunction &Fn) {
-  TD = Fn.getTarget().getDataLayout();
+  TD = &Fn.getDataLayout();
    STI = &static_cast<const ARMSubtarget &>(Fn.getSubtarget());
    TII = STI->getInstrInfo();
    TRI = STI->getRegisterInfo();
@@ -2317,3 +2318,4 @@ FunctionPass *llvm::createARMLoadStoreOptimizationPass(bool PreAlloc) {
      return new ARMPreAllocLoadStoreOpt();
    return new ARMLoadStoreOpt();
  }
+