Make some intrinsics safe to speculatively execute.

[oota-llvm.git] / lib / Transforms / Utils / Local.cpp
diff --git a/lib/Transforms/Utils/Local.cpp b/lib/Transforms/Utils/Local.cpp

index b1dd733ffe54f0494ff1ee9f63e051f1c2bb7d03..4dd93cf2c7599d04d4117e507ec3169d54ef1f9f 100644 (file)
--- a/lib/Transforms/Utils/Local.cpp
+++ b/lib/Transforms/Utils/Local.cpp
@@ -27,8 +27,8 @@
  #include "llvm/Analysis/DebugInfo.h"
  #include "llvm/Analysis/DIBuilder.h"
  #include "llvm/Analysis/Dominators.h"
-#include "llvm/Analysis/ConstantFolding.h"
  #include "llvm/Analysis/InstructionSimplify.h"
+#include "llvm/Analysis/MemoryBuiltins.h"
  #include "llvm/Analysis/ProfileInfo.h"
  #include "llvm/Analysis/ValueTracking.h"
  #include "llvm/Target/TargetData.h"
@@ -227,13 +227,17 @@ bool llvm::ConstantFoldTerminator(BasicBlock *BB, bool DeleteDeadConditions) {
  bool llvm::isInstructionTriviallyDead(Instruction *I) {
    if (!I->use_empty() || isa<TerminatorInst>(I)) return false;
  
+  // We don't want the landingpad instruction removed by anything this general.
+  if (isa<LandingPadInst>(I))
+    return false;
+
    // We don't want debug info removed by anything this general, unless
    // debug info is empty.
    if (DbgDeclareInst *DDI = dyn_cast<DbgDeclareInst>(I)) {
-    if (DDI->getAddress()) 
+    if (DDI->getAddress())
        return false;
      return true;
-  } 
+  }
    if (DbgValueInst *DVI = dyn_cast<DbgValueInst>(I)) {
      if (DVI->getValue())
        return false;
@@ -244,10 +248,23 @@ bool llvm::isInstructionTriviallyDead(Instruction *I) {
  
    // Special case intrinsics that "may have side effects" but can be deleted
    // when dead.
-  if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(I))
+  if (IntrinsicInst *II = dyn_cast<IntrinsicInst>(I)) {
      // Safe to delete llvm.stacksave if dead.
      if (II->getIntrinsicID() == Intrinsic::stacksave)
        return true;
+
+    // Lifetime intrinsics are dead when their right-hand is undef.
+    if (II->getIntrinsicID() == Intrinsic::lifetime_start ||
+        II->getIntrinsicID() == Intrinsic::lifetime_end)
+      return isa<UndefValue>(II->getArgOperand(1));
+  }
+
+  if (extractMallocCall(I)) return true;
+
+  if (CallInst *CI = isFreeCall(I))
+    if (Constant *C = dyn_cast<Constant>(CI->getArgOperand(0)))
+      return C->isNullValue() || isa<UndefValue>(C);
+
    return false;
  }
  
@@ -477,22 +494,8 @@ static bool CanPropagatePredecessorsForPHIs(BasicBlock *BB, BasicBlock *Succ) {
    if (Succ->getSinglePredecessor()) return true;
  
    // Make a list of the predecessors of BB
-  typedef SmallPtrSet<BasicBlock*, 16> BlockSet;
-  BlockSet BBPreds(pred_begin(BB), pred_end(BB));
-
-  // Use that list to make another list of common predecessors of BB and Succ
-  BlockSet CommonPreds;
-  for (pred_iterator PI = pred_begin(Succ), PE = pred_end(Succ);
-       PI != PE; ++PI) {
-    BasicBlock *P = *PI;
-    if (BBPreds.count(P))
-      CommonPreds.insert(P);
-  }
+  SmallPtrSet<BasicBlock*, 16> BBPreds(pred_begin(BB), pred_end(BB));
  
-  // Shortcut, if there are no common predecessors, merging is always safe
-  if (CommonPreds.empty())
-    return true;
-  
    // Look at all the phi nodes in Succ, to see if they present a conflict when
    // merging these blocks
    for (BasicBlock::iterator I = Succ->begin(); isa<PHINode>(I); ++I) {
@@ -503,28 +506,28 @@ static bool CanPropagatePredecessorsForPHIs(BasicBlock *BB, BasicBlock *Succ) {
      // merge the phi nodes and then the blocks can still be merged
      PHINode *BBPN = dyn_cast<PHINode>(PN->getIncomingValueForBlock(BB));
      if (BBPN && BBPN->getParent() == BB) {
-      for (BlockSet::iterator PI = CommonPreds.begin(), PE = CommonPreds.end();
-            PI != PE; PI++) {
-        if (BBPN->getIncomingValueForBlock(*PI) 
-              != PN->getIncomingValueForBlock(*PI)) {
+      for (unsigned PI = 0, PE = PN->getNumIncomingValues(); PI != PE; ++PI) {
+        BasicBlock *IBB = PN->getIncomingBlock(PI);
+        if (BBPreds.count(IBB) &&
+            BBPN->getIncomingValueForBlock(IBB) != PN->getIncomingValue(PI)) {
            DEBUG(dbgs() << "Can't fold, phi node " << PN->getName() << " in " 
                  << Succ->getName() << " is conflicting with " 
                  << BBPN->getName() << " with regard to common predecessor "
-                << (*PI)->getName() << "\n");
+                << IBB->getName() << "\n");
            return false;
          }
        }
      } else {
        Value* Val = PN->getIncomingValueForBlock(BB);
-      for (BlockSet::iterator PI = CommonPreds.begin(), PE = CommonPreds.end();
-            PI != PE; PI++) {
+      for (unsigned PI = 0, PE = PN->getNumIncomingValues(); PI != PE; ++PI) {
          // See if the incoming value for the common predecessor is equal to the
          // one for BB, in which case this phi node will not prevent the merging
          // of the block.
-        if (Val != PN->getIncomingValueForBlock(*PI)) {
+        BasicBlock *IBB = PN->getIncomingBlock(PI);
+        if (BBPreds.count(IBB) && Val != PN->getIncomingValue(PI)) {
            DEBUG(dbgs() << "Can't fold, phi node " << PN->getName() << " in " 
                  << Succ->getName() << " is conflicting with regard to common "
-                << "predecessor " << (*PI)->getName() << "\n");
+                << "predecessor " << IBB->getName() << "\n");
            return false;
          }
        }
@@ -536,9 +539,9 @@ static bool CanPropagatePredecessorsForPHIs(BasicBlock *BB, BasicBlock *Succ) {
  
  /// TryToSimplifyUncondBranchFromEmptyBlock - BB is known to contain an
  /// unconditional branch, and contains no instructions other than PHI nodes,
-/// potential debug intrinsics and the branch.  If possible, eliminate BB by
-/// rewriting all the predecessors to branch to the successor block and return
-/// true.  If we can't transform, return false.
+/// potential side-effect free intrinsics and the branch.  If possible,
+/// eliminate BB by rewriting all the predecessors to branch to the successor
+/// block and return true.  If we can't transform, return false.
  bool llvm::TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB) {
    assert(BB != &BB->getParent()->getEntryBlock() &&
           "TryToSimplifyUncondBranchFromEmptyBlock called on entry block!");
@@ -613,13 +616,15 @@ bool llvm::TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB) {
      }
    }
    
-  while (PHINode *PN = dyn_cast<PHINode>(&BB->front())) {
-    if (Succ->getSinglePredecessor()) {
-      // BB is the only predecessor of Succ, so Succ will end up with exactly
-      // the same predecessors BB had.
-      Succ->getInstList().splice(Succ->begin(),
-                                 BB->getInstList(), BB->begin());
-    } else {
+  if (Succ->getSinglePredecessor()) {
+    // BB is the only predecessor of Succ, so Succ will end up with exactly
+    // the same predecessors BB had.
+
+    // Copy over any phi, debug or lifetime instruction.
+    BB->getTerminator()->eraseFromParent();
+    Succ->getInstList().splice(Succ->getFirstNonPHI(), BB->getInstList());
+  } else {
+    while (PHINode *PN = dyn_cast<PHINode>(&BB->front())) {
        // We explicitly check for such uses in CanPropagatePredecessorsForPHIs.
        assert(PN->use_empty() && "There shouldn't be any uses here!");
        PN->eraseFromParent();
@@ -710,10 +715,14 @@ bool llvm::EliminateDuplicatePHINodes(BasicBlock *BB) {
  /// their preferred alignment from the beginning.
  ///
  static unsigned enforceKnownAlignment(Value *V, unsigned Align,
-                                      unsigned PrefAlign) {
+                                      unsigned PrefAlign, const TargetData *TD) {
    V = V->stripPointerCasts();
  
    if (AllocaInst *AI = dyn_cast<AllocaInst>(V)) {
+    // If the preferred alignment is greater than the natural stack alignment
+    // then don't round up. This avoids dynamic stack realignment.
+    if (TD && TD->exceedsNaturalStackAlignment(PrefAlign))
+      return Align;
      // If there is a requested alignment and if this is an alloca, round up.
      if (AI->getAlignment() >= PrefAlign)
        return AI->getAlignment();
@@ -725,6 +734,10 @@ static unsigned enforceKnownAlignment(Value *V, unsigned Align,
      // If there is a large requested alignment and we can, bump up the alignment
      // of the global.
      if (GV->isDeclaration()) return Align;
+    // If the memory we set aside for the global may not be the memory used by
+    // the final program then it is impossible for us to reliably enforce the
+    // preferred alignment.
+    if (GV->isWeakForLinker()) return Align;
      
      if (GV->getAlignment() >= PrefAlign)
        return GV->getAlignment();
@@ -764,7 +777,7 @@ unsigned llvm::getOrEnforceKnownAlignment(Value *V, unsigned PrefAlign,
    Align = std::min(Align, +Value::MaximumAlignment);
    
    if (PrefAlign > Align)
-    Align = enforceKnownAlignment(V, Align, PrefAlign);
+    Align = enforceKnownAlignment(V, Align, PrefAlign, TD);
      
    // We don't need to make any adjustment.
    return Align;