Constify arguments in AliasSetTracker methods. NFC

[oota-llvm.git] / lib / Analysis / LoopAccessAnalysis.cpp
diff --git a/lib/Analysis/LoopAccessAnalysis.cpp b/lib/Analysis/LoopAccessAnalysis.cpp

index 4bedccf8d01b226396781567be8c2fc87791f9b8..cfa8fbe4a8c59c0a5a3f1c81bb1a4ee700819e37 100644 (file)
--- a/lib/Analysis/LoopAccessAnalysis.cpp
+++ b/lib/Analysis/LoopAccessAnalysis.cpp
@@ -15,11 +15,13 @@
  #include "llvm/Analysis/LoopAccessAnalysis.h"
  #include "llvm/Analysis/LoopInfo.h"
  #include "llvm/Analysis/ScalarEvolutionExpander.h"
+#include "llvm/Analysis/TargetLibraryInfo.h"
  #include "llvm/Analysis/ValueTracking.h"
  #include "llvm/IR/DiagnosticInfo.h"
  #include "llvm/IR/Dominators.h"
  #include "llvm/IR/IRBuilder.h"
  #include "llvm/Support/Debug.h"
+#include "llvm/Support/raw_ostream.h"
  #include "llvm/Transforms/Utils/VectorUtils.h"
  using namespace llvm;
  
@@ -175,6 +177,17 @@ void LoopAccessInfo::RuntimePointerCheck::print(
        }
  }
  
+bool LoopAccessInfo::RuntimePointerCheck::needsAnyChecking(
+    const SmallVectorImpl<int> *PtrPartition) const {
+  unsigned NumPointers = Pointers.size();
+  // True iff needsChecking() holds for some pair; PtrPartition is forwarded.
+  for (unsigned I = 0; I < NumPointers; ++I)
+    for (unsigned J = I + 1; J < NumPointers; ++J) // J > I: each pair once.
+      if (needsChecking(I, J, PtrPartition))
+        return true;
+  return false; // No pair qualified (also the result for < 2 pointers).
+}
+
  namespace {
  /// \brief Analyses memory accesses in a loop.
  ///
@@ -186,9 +199,9 @@ public:
    typedef PointerIntPair<Value *, 1, bool> MemAccessInfo;
    typedef SmallPtrSet<MemAccessInfo, 8> MemAccessInfoSet;
  
-  AccessAnalysis(const DataLayout &Dl, AliasAnalysis *AA,
+  AccessAnalysis(const DataLayout &Dl, AliasAnalysis *AA, LoopInfo *LI,
                   MemoryDepChecker::DepCandidates &DA)
-      : DL(Dl), AST(*AA), DepCands(DA), IsRTCheckNeeded(false) {}
+      : DL(Dl), AST(*AA), LI(LI), DepCands(DA), IsRTCheckNeeded(false) {}
  
    /// \brief Register a load  and whether it is only read from.
    void addLoad(AliasAnalysis::Location &Loc, bool IsReadOnly) {
@@ -248,6 +261,8 @@ private:
    //intrinsic property (such as TBAA metadata).
    AliasSetTracker AST;
  
+  LoopInfo *LI;
+
    /// Sets of potentially dependent accesses - members of one set share an
    /// underlying pointer. The set "CheckDeps" identfies which sets really need a
    /// dependence check.
@@ -464,7 +479,9 @@ void AccessAnalysis::processMemAccesses() {
            // underlying object.
            typedef SmallVector<Value *, 16> ValueVector;
            ValueVector TempObjects;
-          GetUnderlyingObjects(Ptr, TempObjects, DL);
+
+          GetUnderlyingObjects(Ptr, TempObjects, DL, LI);
+          DEBUG(dbgs() << "Underlying objects for pointer " << *Ptr << "\n");
            for (Value *UnderlyingObj : TempObjects) {
              UnderlyingObjToAccessMap::iterator Prev =
                  ObjToLastAccess.find(UnderlyingObj);
@@ -472,6 +489,7 @@ void AccessAnalysis::processMemAccesses() {
                DepCands.unionSets(Access, Prev->second);
  
              ObjToLastAccess[UnderlyingObj] = Access;
+            DEBUG(dbgs() << "  " << *UnderlyingObj << "\n");
            }
          }
        }
@@ -580,6 +598,7 @@ bool MemoryDepChecker::Dependence::isSafeForVectorization(DepType Type) {
    case BackwardVectorizableButPreventsForwarding:
      return false;
    }
+  llvm_unreachable("unexpected DepType!");
  }
  
  bool MemoryDepChecker::Dependence::isInterestingDependence(DepType Type) {
@@ -595,6 +614,7 @@ bool MemoryDepChecker::Dependence::isInterestingDependence(DepType Type) {
    case BackwardVectorizableButPreventsForwarding:
      return true;
    }
+  llvm_unreachable("unexpected DepType!");
  }
  
  bool MemoryDepChecker::Dependence::isPossiblyBackward() const {
@@ -610,6 +630,7 @@ bool MemoryDepChecker::Dependence::isPossiblyBackward() const {
    case BackwardVectorizableButPreventsForwarding:
      return true;
    }
+  llvm_unreachable("unexpected DepType!");
  }
  
  bool MemoryDepChecker::couldPreventStoreLoadForward(unsigned Distance,
@@ -874,14 +895,20 @@ void MemoryDepChecker::Dependence::print(
  }
  
  bool LoopAccessInfo::canAnalyzeLoop() {
+  // We need to have a loop header.
+  DEBUG(dbgs() << "LAA: Found a loop: " <<
+        TheLoop->getHeader()->getName() << '\n');
+
      // We can only analyze innermost loops.
    if (!TheLoop->empty()) {
+    DEBUG(dbgs() << "LAA: loop is not the innermost loop\n");
      emitAnalysis(LoopAccessReport() << "loop is not the innermost loop");
      return false;
    }
  
    // We must have a single backedge.
    if (TheLoop->getNumBackEdges() != 1) {
+    DEBUG(dbgs() << "LAA: loop control flow is not understood by analyzer\n");
      emitAnalysis(
          LoopAccessReport() <<
          "loop control flow is not understood by analyzer");
@@ -890,6 +917,7 @@ bool LoopAccessInfo::canAnalyzeLoop() {
  
    // We must have a single exiting block.
    if (!TheLoop->getExitingBlock()) {
+    DEBUG(dbgs() << "LAA: loop control flow is not understood by analyzer\n");
      emitAnalysis(
          LoopAccessReport() <<
          "loop control flow is not understood by analyzer");
@@ -900,16 +928,13 @@ bool LoopAccessInfo::canAnalyzeLoop() {
    // checked at the end of each iteration. With that we can assume that all
    // instructions in the loop are executed the same number of times.
    if (TheLoop->getExitingBlock() != TheLoop->getLoopLatch()) {
+    DEBUG(dbgs() << "LAA: loop control flow is not understood by analyzer\n");
      emitAnalysis(
          LoopAccessReport() <<
          "loop control flow is not understood by analyzer");
      return false;
    }
  
-  // We need to have a loop header.
-  DEBUG(dbgs() << "LAA: Found a loop: " <<
-        TheLoop->getHeader()->getName() << '\n');
-
    // ScalarEvolution needs to be able to find the exit count.
    const SCEV *ExitCount = SE->getBackedgeTakenCount(TheLoop);
    if (ExitCount == SE->getCouldNotCompute()) {
@@ -959,6 +984,12 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
          if (Call && getIntrinsicIDForCall(Call, TLI))
            continue;
  
+        // If the function has an explicit vectorized counterpart, we can safely
+        // assume that it can be vectorized.
+        if (Call && !Call->isNoBuiltin() && Call->getCalledFunction() &&
+            TLI->isFunctionVectorizable(Call->getCalledFunction()->getName()))
+          continue;
+
          LoadInst *Ld = dyn_cast<LoadInst>(it);
          if (!Ld || (!Ld->isSimple() && !IsAnnotatedParallel)) {
            emitAnalysis(LoopAccessReport(Ld)
@@ -1009,7 +1040,7 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
  
    MemoryDepChecker::DepCandidates DependentAccesses;
    AccessAnalysis Accesses(TheLoop->getHeader()->getModule()->getDataLayout(),
-                          AA, DependentAccesses);
+                          AA, LI, DependentAccesses);
  
    // Holds the analyzed pointers. We don't want to call GetUnderlyingObjects
    // multiple times on the same object. If the ptr is accessed twice, once
@@ -1022,16 +1053,8 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
    for (I = Stores.begin(), IE = Stores.end(); I != IE; ++I) {
      StoreInst *ST = cast<StoreInst>(*I);
      Value* Ptr = ST->getPointerOperand();
-
-    if (isUniform(Ptr)) {
-      emitAnalysis(
-          LoopAccessReport(ST)
-          << "write to a loop invariant address could not be vectorized");
-      DEBUG(dbgs() << "LAA: We don't allow storing to uniform addresses\n");
-      CanVecMem = false;
-      return;
-    }
-
+    // Check for store to loop invariant address.
+    StoreToLoopInvariantAddress |= isUniform(Ptr);
      // If we did *not* see this pointer before, insert it to  the read-write
      // list. At this phase it is only a 'write' list.
      if (Seen.insert(Ptr).second) {
@@ -1111,7 +1134,7 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
    if (NumComparisons == 0 && NeedRTCheck)
      NeedRTCheck = false;
  
-  // Check that we did not find an unsizeable pointer.
+  // Check that we found the bounds for the pointer.
    if (CanDoRT)
      DEBUG(dbgs() << "LAA: We can perform a memory runtime check if needed.\n");
    else if (NeedRTCheck) {
@@ -1144,7 +1167,7 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
  
        CanDoRT = Accesses.canCheckPtrAtRT(PtrRtCheck, NumComparisons, SE,
                                           TheLoop, Strides, true);
-      // Check that we didn't find an unsizeable pointer.
+      // Check that we found the bounds for the pointer.
        if (!CanDoRT && NumComparisons > 0) {
          emitAnalysis(LoopAccessReport()
                       << "cannot check memory dependencies at runtime");
@@ -1158,12 +1181,15 @@ void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
      }
    }
  
-  if (!CanVecMem)
+  if (CanVecMem)
+    DEBUG(dbgs() << "LAA: No unsafe dependent memory operations in loop.  We"
+                 << (NeedRTCheck ? "" : " don't")
+                 << " need a runtime memory check.\n");
+  else {
      emitAnalysis(LoopAccessReport() <<
                   "unsafe dependent memory operations in loop");
-
-  DEBUG(dbgs() << "LAA: We" << (NeedRTCheck ? "" : " don't") <<
-        " need a runtime memory check.\n");
+    DEBUG(dbgs() << "LAA: unsafe dependent memory operations in loop\n");
+  }
  }
  
  bool LoopAccessInfo::blockNeedsPredication(BasicBlock *BB, Loop *TheLoop,
@@ -1197,9 +1223,8 @@ static Instruction *getFirstInst(Instruction *FirstInst, Value *V,
  
  std::pair<Instruction *, Instruction *> LoopAccessInfo::addRuntimeCheck(
      Instruction *Loc, const SmallVectorImpl<int> *PtrPartition) const {
-  Instruction *tnullptr = nullptr;
    if (!PtrRtCheck.Need)
-    return std::pair<Instruction *, Instruction *>(tnullptr, tnullptr);
+    return std::make_pair(nullptr, nullptr);
  
    unsigned NumPointers = PtrRtCheck.Pointers.size();
    SmallVector<TrackingVH<Value> , 2> Starts;
@@ -1270,6 +1295,9 @@ std::pair<Instruction *, Instruction *> LoopAccessInfo::addRuntimeCheck(
      }
    }
  
+  if (!MemoryRuntimeCheck)
+    return std::make_pair(nullptr, nullptr);
+
    // We have to do this trickery because the IRBuilder might fold the check to a
    // constant expression in which case there is no Instruction anchored in a
    // the block.
@@ -1283,23 +1311,28 @@ std::pair<Instruction *, Instruction *> LoopAccessInfo::addRuntimeCheck(
  LoopAccessInfo::LoopAccessInfo(Loop *L, ScalarEvolution *SE,
                                 const DataLayout &DL,
                                 const TargetLibraryInfo *TLI, AliasAnalysis *AA,
-                               DominatorTree *DT,
+                               DominatorTree *DT, LoopInfo *LI,
                                 const ValueToValueMap &Strides)
      : DepChecker(SE, L), NumComparisons(0), TheLoop(L), SE(SE), DL(DL),
-      TLI(TLI), AA(AA), DT(DT), NumLoads(0), NumStores(0),
-      MaxSafeDepDistBytes(-1U), CanVecMem(false) {
+      TLI(TLI), AA(AA), DT(DT), LI(LI), NumLoads(0), NumStores(0),
+      MaxSafeDepDistBytes(-1U), CanVecMem(false),
+      StoreToLoopInvariantAddress(false) { // analyzeLoop ORs in isUniform(Ptr).
    if (canAnalyzeLoop())
      analyzeLoop(Strides);
  }
  
  void LoopAccessInfo::print(raw_ostream &OS, unsigned Depth) const {
    if (CanVecMem) {
-    if (PtrRtCheck.empty())
-      OS.indent(Depth) << "Memory dependences are safe\n";
-    else
+    if (PtrRtCheck.Need)
        OS.indent(Depth) << "Memory dependences are safe with run-time checks\n";
+    else
+      OS.indent(Depth) << "Memory dependences are safe\n";
    }
  
+  OS.indent(Depth) << "Store to invariant address was "
+                   << (StoreToLoopInvariantAddress ? "" : "not ")
+                   << "found in loop.\n";
+
    if (Report)
      OS.indent(Depth) << "Report: " << Report->str() << "\n";
  
@@ -1328,7 +1361,8 @@ LoopAccessAnalysis::getInfo(Loop *L, const ValueToValueMap &Strides) {
  
    if (!LAI) {
      const DataLayout &DL = L->getHeader()->getModule()->getDataLayout();
-    LAI = llvm::make_unique<LoopAccessInfo>(L, SE, DL, TLI, AA, DT, Strides);
+    LAI = llvm::make_unique<LoopAccessInfo>(L, SE, DL, TLI, AA, DT, LI,
+                                            Strides);
  #ifndef NDEBUG
      LAI->NumSymbolicStrides = Strides.size();
  #endif
@@ -1339,7 +1373,6 @@ LoopAccessAnalysis::getInfo(Loop *L, const ValueToValueMap &Strides) {
  void LoopAccessAnalysis::print(raw_ostream &OS, const Module *M) const {
    LoopAccessAnalysis &LAA = *const_cast<LoopAccessAnalysis *>(this);
  
-  LoopInfo *LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
    ValueToValueMap NoSymbolicStrides;
  
    for (Loop *TopLevelLoop : *LI)
@@ -1356,6 +1389,7 @@ bool LoopAccessAnalysis::runOnFunction(Function &F) {
    TLI = TLIP ? &TLIP->getTLI() : nullptr;
    AA = &getAnalysis<AliasAnalysis>();
    DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
+  LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
  
    return false;
  }