Add some additional fields to TTI::UnrollingPreferences

[oota-llvm.git] / lib / Transforms / Scalar / SROA.cpp
diff --git a/lib/Transforms/Scalar/SROA.cpp b/lib/Transforms/Scalar/SROA.cpp

index 01320e22a3d5f3a7c6942b229d061d9f0de2e61e..ed5e61823e4f3abd06fbdf1e83d361283c9b2215 100644 (file)
--- a/lib/Transforms/Scalar/SROA.cpp
+++ b/lib/Transforms/Scalar/SROA.cpp
@@ -32,19 +32,19 @@
  #include "llvm/Analysis/Loads.h"
  #include "llvm/Analysis/PtrUseVisitor.h"
  #include "llvm/Analysis/ValueTracking.h"
-#include "llvm/DIBuilder.h"
-#include "llvm/DebugInfo.h"
  #include "llvm/IR/Constants.h"
+#include "llvm/IR/DIBuilder.h"
  #include "llvm/IR/DataLayout.h"
+#include "llvm/IR/DebugInfo.h"
  #include "llvm/IR/DerivedTypes.h"
  #include "llvm/IR/Dominators.h"
  #include "llvm/IR/Function.h"
  #include "llvm/IR/IRBuilder.h"
+#include "llvm/IR/InstVisitor.h"
  #include "llvm/IR/Instructions.h"
  #include "llvm/IR/IntrinsicInst.h"
  #include "llvm/IR/LLVMContext.h"
  #include "llvm/IR/Operator.h"
-#include "llvm/InstVisitor.h"
  #include "llvm/Pass.h"
  #include "llvm/Support/CommandLine.h"
  #include "llvm/Support/Compiler.h"
@@ -356,7 +356,7 @@ private:
                   bool IsSplittable = false) {
      // Completely skip uses which have a zero size or start either before or
      // past the end of the allocation.
-    if (Size == 0 || Offset.isNegative() || Offset.uge(AllocSize)) {
+    if (Size == 0 || Offset.uge(AllocSize)) {
        DEBUG(dbgs() << "WARNING: Ignoring " << Size << " byte use @" << Offset
                     << " which has zero size or starts outside of the "
                     << AllocSize << " byte alloca:\n"
@@ -480,8 +480,7 @@ private:
      // risk of overflow.
      // FIXME: We should instead consider the pointer to have escaped if this
      // function is being instrumented for addressing bugs or race conditions.
-    if (Offset.isNegative() || Size > AllocSize ||
-        Offset.ugt(AllocSize - Size)) {
+    if (Size > AllocSize || Offset.ugt(AllocSize - Size)) {
        DEBUG(dbgs() << "WARNING: Ignoring " << Size << " byte store @" << Offset
                     << " which extends past the end of the " << AllocSize
                     << " byte alloca:\n"
@@ -500,7 +499,7 @@ private:
      assert(II.getRawDest() == *U && "Pointer use is not the destination?");
      ConstantInt *Length = dyn_cast<ConstantInt>(II.getLength());
      if ((Length && Length->getValue() == 0) ||
-        (IsOffsetKnown && !Offset.isNegative() && Offset.uge(AllocSize)))
+        (IsOffsetKnown && Offset.uge(AllocSize)))
        // Zero-length mem transfer intrinsics can be ignored entirely.
        return markAsDead(II);
  
@@ -532,7 +531,7 @@ private:
      // if already added to our partitions.
      // FIXME: Yet another place we really should bypass this when
      // instrumenting for ASan.
-    if (!Offset.isNegative() && Offset.uge(AllocSize)) {
+    if (Offset.uge(AllocSize)) {
        SmallDenseMap<Instruction *, unsigned>::iterator MTPI = MemTransferSliceMap.find(&II);
        if (MTPI != MemTransferSliceMap.end())
          S.Slices[MTPI->second].kill();
@@ -557,7 +556,7 @@ private:
      // they both point to the same alloca.
      bool Inserted;
      SmallDenseMap<Instruction *, unsigned>::iterator MTPI;
-    llvm::tie(MTPI, Inserted) =
+    std::tie(MTPI, Inserted) =
          MemTransferSliceMap.insert(std::make_pair(&II, S.Slices.size()));
      unsigned PrevIdx = MTPI->second;
      if (!Inserted) {
@@ -616,7 +615,7 @@ private:
      Size = 0;
      do {
        Instruction *I, *UsedI;
-      llvm::tie(UsedI, I) = Uses.pop_back_val();
+      std::tie(UsedI, I) = Uses.pop_back_val();
  
        if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
          Size = std::max(Size, DL.getTypeStoreSize(LI->getType()));
@@ -638,10 +637,9 @@ private:
          return I;
        }
  
-      for (Value::use_iterator UI = I->use_begin(), UE = I->use_end(); UI != UE;
-           ++UI)
-        if (Visited.insert(cast<Instruction>(*UI)))
-          Uses.push_back(std::make_pair(I, cast<Instruction>(*UI)));
+      for (User *U : I->users())
+        if (Visited.insert(cast<Instruction>(U)))
+          Uses.push_back(std::make_pair(I, cast<Instruction>(U)));
      } while (!Uses.empty());
  
      return 0;
@@ -667,8 +665,7 @@ private:
      // themselves which should be replaced with undef.
      // FIXME: This should instead be escaped in the event we're instrumenting
      // for address sanitization.
-    if ((Offset.isNegative() && (-Offset).uge(PHISize)) ||
-        (!Offset.isNegative() && Offset.uge(AllocSize))) {
+    if (Offset.uge(AllocSize)) {
        S.DeadOperands.push_back(U);
        return;
      }
@@ -708,8 +705,7 @@ private:
      // themselves which should be replaced with undef.
      // FIXME: This should instead be escaped in the event we're instrumenting
      // for address sanitization.
-    if ((Offset.isNegative() && Offset.uge(SelectSize)) ||
-        (!Offset.isNegative() && Offset.uge(AllocSize))) {
+    if (Offset.uge(AllocSize)) {
        S.DeadOperands.push_back(U);
        return;
      }
@@ -820,12 +816,10 @@ public:
      // Retain the debug information attached to the alloca for use when
      // rewriting loads and stores.
      if (MDNode *DebugNode = MDNode::getIfExists(AI.getContext(), &AI)) {
-      for (Value::use_iterator UI = DebugNode->use_begin(),
-                               UE = DebugNode->use_end();
-           UI != UE; ++UI)
-        if (DbgDeclareInst *DDI = dyn_cast<DbgDeclareInst>(*UI))
+      for (User *U : DebugNode->users())
+        if (DbgDeclareInst *DDI = dyn_cast<DbgDeclareInst>(U))
            DDIs.push_back(DDI);
-        else if (DbgValueInst *DVI = dyn_cast<DbgValueInst>(*UI))
+        else if (DbgValueInst *DVI = dyn_cast<DbgValueInst>(U))
            DVIs.push_back(DVI);
      }
  
@@ -839,8 +833,8 @@ public:
        DVIs.pop_back_val()->eraseFromParent();
    }
  
-  virtual bool isInstInList(Instruction *I,
-                            const SmallVectorImpl<Instruction*> &Insts) const {
+  bool isInstInList(Instruction *I,
+                    const SmallVectorImpl<Instruction*> &Insts) const override {
      Value *Ptr;
      if (LoadInst *LI = dyn_cast<LoadInst>(I))
        Ptr = LI->getOperand(0);
@@ -867,7 +861,7 @@ public:
      return false;
    }
  
-  virtual void updateDebugInfo(Instruction *Inst) const {
+  void updateDebugInfo(Instruction *Inst) const override {
      for (SmallVectorImpl<DbgDeclareInst *>::const_iterator I = DDIs.begin(),
             E = DDIs.end(); I != E; ++I) {
        DbgDeclareInst *DDI = *I;
@@ -978,10 +972,10 @@ public:
          C(0), DL(0), DT(0) {
      initializeSROAPass(*PassRegistry::getPassRegistry());
    }
-  bool runOnFunction(Function &F);
-  void getAnalysisUsage(AnalysisUsage &AU) const;
+  bool runOnFunction(Function &F) override;
+  void getAnalysisUsage(AnalysisUsage &AU) const override;
  
-  const char *getPassName() const { return "SROA"; }
+  const char *getPassName() const override { return "SROA"; }
    static char ID;
  
  private:
@@ -1088,9 +1082,8 @@ static bool isSafePHIToSpeculate(PHINode &PN,
    BasicBlock *BB = PN.getParent();
    unsigned MaxAlign = 0;
    bool HaveLoad = false;
-  for (Value::use_iterator UI = PN.use_begin(), UE = PN.use_end(); UI != UE;
-       ++UI) {
-    LoadInst *LI = dyn_cast<LoadInst>(*UI);
+  for (User *U : PN.users()) {
+    LoadInst *LI = dyn_cast<LoadInst>(U);
      if (LI == 0 || !LI->isSimple())
        return false;
  
@@ -1154,13 +1147,13 @@ static void speculatePHINodeLoads(PHINode &PN) {
  
    // Get the TBAA tag and alignment to use from one of the loads.  It doesn't
    // matter which one we get and if any differ.
-  LoadInst *SomeLoad = cast<LoadInst>(*PN.use_begin());
+  LoadInst *SomeLoad = cast<LoadInst>(PN.user_back());
    MDNode *TBAATag = SomeLoad->getMetadata(LLVMContext::MD_tbaa);
    unsigned Align = SomeLoad->getAlignment();
  
    // Rewrite all loads of the PN to use the new PHI.
    while (!PN.use_empty()) {
-    LoadInst *LI = cast<LoadInst>(*PN.use_begin());
+    LoadInst *LI = cast<LoadInst>(PN.user_back());
      LI->replaceAllUsesWith(NewPN);
      LI->eraseFromParent();
    }
@@ -1204,9 +1197,8 @@ static bool isSafeSelectToSpeculate(SelectInst &SI, const DataLayout *DL = 0) {
    bool TDerefable = TValue->isDereferenceablePointer();
    bool FDerefable = FValue->isDereferenceablePointer();
  
-  for (Value::use_iterator UI = SI.use_begin(), UE = SI.use_end(); UI != UE;
-       ++UI) {
-    LoadInst *LI = dyn_cast<LoadInst>(*UI);
+  for (User *U : SI.users()) {
+    LoadInst *LI = dyn_cast<LoadInst>(U);
      if (LI == 0 || !LI->isSimple())
        return false;
  
@@ -1232,7 +1224,7 @@ static void speculateSelectInstLoads(SelectInst &SI) {
    Value *FV = SI.getFalseValue();
    // Replace the loads of the select with a select of two loads.
    while (!SI.use_empty()) {
-    LoadInst *LI = cast<LoadInst>(*SI.use_begin());
+    LoadInst *LI = cast<LoadInst>(SI.user_back());
      assert(LI->isSimple() && "We only speculate simple loads");
  
      IRB.SetInsertPoint(LI);
@@ -1293,6 +1285,9 @@ static Value *getNaturalGEPWithType(IRBuilderTy &IRB, const DataLayout &DL,
    if (Ty == TargetTy)
      return buildGEP(IRB, BasePtr, Indices, NamePrefix);
  
+  // Pointer size to use for the indices.
+  unsigned PtrSize = DL.getPointerTypeSizeInBits(BasePtr->getType());
+
    // See if we can descend into a struct and locate a field with the correct
    // type.
    unsigned NumLayers = 0;
@@ -1300,11 +1295,13 @@ static Value *getNaturalGEPWithType(IRBuilderTy &IRB, const DataLayout &DL,
    do {
      if (ElementTy->isPointerTy())
        break;
-    if (SequentialType *SeqTy = dyn_cast<SequentialType>(ElementTy)) {
-      ElementTy = SeqTy->getElementType();
-      // Note that we use the default address space as this index is over an
-      // array or a vector, not a pointer.
-      Indices.push_back(IRB.getInt(APInt(DL.getPointerSizeInBits(0), 0)));
+
+    if (ArrayType *ArrayTy = dyn_cast<ArrayType>(ElementTy)) {
+      ElementTy = ArrayTy->getElementType();
+      Indices.push_back(IRB.getIntN(PtrSize, 0));
+    } else if (VectorType *VectorTy = dyn_cast<VectorType>(ElementTy)) {
+      ElementTy = VectorTy->getElementType();
+      Indices.push_back(IRB.getInt32(0));
      } else if (StructType *STy = dyn_cast<StructType>(ElementTy)) {
        if (STy->element_begin() == STy->element_end())
          break; // Nothing left to descend into.
@@ -1404,7 +1401,7 @@ static Value *getNaturalGEPWithOffset(IRBuilderTy &IRB, const DataLayout &DL,
  
    // Don't consider any GEPs through an i8* as natural unless the TargetTy is
    // an i8.
-  if (Ty == IRB.getInt8PtrTy() && TargetTy->isIntegerTy(8))
+  if (Ty == IRB.getInt8PtrTy(Ty->getAddressSpace()) && TargetTy->isIntegerTy(8))
      return 0;
  
    Type *ElementTy = Ty->getElementType();
@@ -1506,8 +1503,9 @@ static Value *getAdjustedPtr(IRBuilderTy &IRB, const DataLayout &DL, Value *Ptr,
  
    if (!OffsetPtr) {
      if (!Int8Ptr) {
-      Int8Ptr = IRB.CreateBitCast(Ptr, IRB.getInt8PtrTy(),
-                                  NamePrefix + "sroa_raw_cast");
+      Int8Ptr = IRB.CreateBitCast(
+          Ptr, IRB.getInt8PtrTy(PointerTy->getPointerAddressSpace()),
+          NamePrefix + "sroa_raw_cast");
        Int8PtrOffset = Offset;
      }
  
@@ -2012,8 +2010,14 @@ class AllocaSliceRewriter : public InstVisitor<AllocaSliceRewriter, bool> {
    // integer type will be stored here for easy access during rewriting.
    IntegerType *IntTy;
  
-  // The offset of the slice currently being rewritten.
+  // The original offset of the slice currently being rewritten relative to
+  // the original alloca.
    uint64_t BeginOffset, EndOffset;
+  // The new offsets of the slice currently being rewritten relative to the
+  // original alloca.
+  uint64_t NewBeginOffset, NewEndOffset;
+
+  uint64_t SliceSize;
    bool IsSplittable;
    bool IsSplit;
    Use *OldUse;
@@ -2030,12 +2034,14 @@ class AllocaSliceRewriter : public InstVisitor<AllocaSliceRewriter, bool> {
  public:
    AllocaSliceRewriter(const DataLayout &DL, AllocaSlices &S, SROA &Pass,
                        AllocaInst &OldAI, AllocaInst &NewAI,
-                      uint64_t NewBeginOffset, uint64_t NewEndOffset,
-                      bool IsVectorPromotable, bool IsIntegerPromotable,
+                      uint64_t NewAllocaBeginOffset,
+                      uint64_t NewAllocaEndOffset, bool IsVectorPromotable,
+                      bool IsIntegerPromotable,
                        SmallPtrSetImpl<PHINode *> &PHIUsers,
                        SmallPtrSetImpl<SelectInst *> &SelectUsers)
        : DL(DL), S(S), Pass(Pass), OldAI(OldAI), NewAI(NewAI),
-        NewAllocaBeginOffset(NewBeginOffset), NewAllocaEndOffset(NewEndOffset),
+        NewAllocaBeginOffset(NewAllocaBeginOffset),
+        NewAllocaEndOffset(NewAllocaEndOffset),
          NewAllocaTy(NewAI.getAllocatedType()),
          VecTy(IsVectorPromotable ? cast<VectorType>(NewAllocaTy) : 0),
          ElementTy(VecTy ? VecTy->getElementType() : 0),
@@ -2065,6 +2071,14 @@ public:
      IsSplit =
          BeginOffset < NewAllocaBeginOffset || EndOffset > NewAllocaEndOffset;
  
+    // Compute the intersecting offset range.
+    assert(BeginOffset < NewAllocaEndOffset);
+    assert(EndOffset > NewAllocaBeginOffset);
+    NewBeginOffset = std::max(BeginOffset, NewAllocaBeginOffset);
+    NewEndOffset = std::min(EndOffset, NewAllocaEndOffset);
+
+    SliceSize = NewEndOffset - NewBeginOffset;
+
      OldUse = I->getUse();
      OldPtr = cast<Instruction>(OldUse->get());
  
@@ -2089,9 +2103,12 @@ private:
      llvm_unreachable("No rewrite rule for this instruction!");
    }
  
-  Value *getAdjustedAllocaPtr(IRBuilderTy &IRB, uint64_t Offset,
-                              Type *PointerTy) {
-    assert(Offset >= NewAllocaBeginOffset);
+  Value *getNewAllocaSlicePtr(IRBuilderTy &IRB, Type *PointerTy) {
+    // Note that the offset computation can use BeginOffset or NewBeginOffset
+    // interchangeably for unsplit slices.
+    assert(IsSplit || BeginOffset == NewBeginOffset);
+    uint64_t Offset = NewBeginOffset - NewAllocaBeginOffset;
+
  #ifndef NDEBUG
      StringRef OldName = OldPtr->getName();
      // Skip through the last '.sroa.' component of the name.
@@ -2112,9 +2129,9 @@ private:
      // Strip any SROA suffixes as well.
      OldName = OldName.substr(0, OldName.find(".sroa_"));
  #endif
-    return getAdjustedPtr(IRB, DL, &NewAI, APInt(DL.getPointerSizeInBits(),
-                                                 Offset - NewAllocaBeginOffset),
-                          PointerTy,
+
+    return getAdjustedPtr(IRB, DL, &NewAI,
+                          APInt(DL.getPointerSizeInBits(), Offset), PointerTy,
  #ifndef NDEBUG
                            Twine(OldName) + "."
  #else
@@ -2123,22 +2140,16 @@ private:
                            );
    }
  
-  /// \brief Compute suitable alignment to access an offset into the new alloca.
-  unsigned getOffsetAlign(uint64_t Offset) {
+  /// \brief Compute suitable alignment to access this slice of the *new* alloca.
+  ///
+  /// You can optionally pass a type to this routine and if that type's ABI
+  /// alignment is itself suitable, this will return zero.
+  unsigned getSliceAlign(Type *Ty = 0) {
      unsigned NewAIAlign = NewAI.getAlignment();
      if (!NewAIAlign)
        NewAIAlign = DL.getABITypeAlignment(NewAI.getAllocatedType());
-    return MinAlign(NewAIAlign, Offset);
-  }
-
-  /// \brief Compute suitable alignment to access a type at an offset of the
-  /// new alloca.
-  ///
-  /// \returns zero if the type's ABI alignment is a suitable alignment,
-  /// otherwise returns the maximal suitable alignment.
-  unsigned getOffsetTypeAlign(Type *Ty, uint64_t Offset) {
-    unsigned Align = getOffsetAlign(Offset);
-    return Align == DL.getABITypeAlignment(Ty) ? 0 : Align;
+    unsigned Align = MinAlign(NewAIAlign, NewBeginOffset - NewAllocaBeginOffset);
+    return (Ty && Align == DL.getABITypeAlignment(Ty)) ? 0 : Align;
    }
  
    unsigned getIndex(uint64_t Offset) {
@@ -2156,8 +2167,7 @@ private:
        Pass.DeadInsts.insert(I);
    }
  
-  Value *rewriteVectorizedLoadInst(uint64_t NewBeginOffset,
-                                   uint64_t NewEndOffset) {
+  Value *rewriteVectorizedLoadInst() {
      unsigned BeginIndex = getIndex(NewBeginOffset);
      unsigned EndIndex = getIndex(NewEndOffset);
      assert(EndIndex > BeginIndex && "Empty vector!");
@@ -2167,8 +2177,7 @@ private:
      return extractVector(IRB, V, BeginIndex, EndIndex, "vec");
    }
  
-  Value *rewriteIntegerLoad(LoadInst &LI, uint64_t NewBeginOffset,
-                            uint64_t NewEndOffset) {
+  Value *rewriteIntegerLoad(LoadInst &LI) {
      assert(IntTy && "We cannot insert an integer to the alloca");
      assert(!LI.isVolatile());
      Value *V = IRB.CreateAlignedLoad(&NewAI, NewAI.getAlignment(),
@@ -2187,32 +2196,23 @@ private:
      Value *OldOp = LI.getOperand(0);
      assert(OldOp == OldPtr);
  
-    // Compute the intersecting offset range.
-    assert(BeginOffset < NewAllocaEndOffset);
-    assert(EndOffset > NewAllocaBeginOffset);
-    uint64_t NewBeginOffset = std::max(BeginOffset, NewAllocaBeginOffset);
-    uint64_t NewEndOffset = std::min(EndOffset, NewAllocaEndOffset);
-
-    uint64_t Size = NewEndOffset - NewBeginOffset;
-
-    Type *TargetTy = IsSplit ? Type::getIntNTy(LI.getContext(), Size * 8)
+    Type *TargetTy = IsSplit ? Type::getIntNTy(LI.getContext(), SliceSize * 8)
                               : LI.getType();
      bool IsPtrAdjusted = false;
      Value *V;
      if (VecTy) {
-      V = rewriteVectorizedLoadInst(NewBeginOffset, NewEndOffset);
+      V = rewriteVectorizedLoadInst();
      } else if (IntTy && LI.getType()->isIntegerTy()) {
-      V = rewriteIntegerLoad(LI, NewBeginOffset, NewEndOffset);
+      V = rewriteIntegerLoad(LI);
      } else if (NewBeginOffset == NewAllocaBeginOffset &&
                 canConvertValue(DL, NewAllocaTy, LI.getType())) {
        V = IRB.CreateAlignedLoad(&NewAI, NewAI.getAlignment(),
                                  LI.isVolatile(), LI.getName());
      } else {
        Type *LTy = TargetTy->getPointerTo();
-      V = IRB.CreateAlignedLoad(
-          getAdjustedAllocaPtr(IRB, NewBeginOffset, LTy),
-          getOffsetTypeAlign(TargetTy, NewBeginOffset - NewAllocaBeginOffset),
-          LI.isVolatile(), LI.getName());
+      V = IRB.CreateAlignedLoad(getNewAllocaSlicePtr(IRB, LTy),
+                                getSliceAlign(TargetTy), LI.isVolatile(),
+                                LI.getName());
        IsPtrAdjusted = true;
      }
      V = convertValue(DL, IRB, V, TargetTy);
@@ -2221,13 +2221,13 @@ private:
        assert(!LI.isVolatile());
        assert(LI.getType()->isIntegerTy() &&
               "Only integer type loads and stores are split");
-      assert(Size < DL.getTypeStoreSize(LI.getType()) &&
+      assert(SliceSize < DL.getTypeStoreSize(LI.getType()) &&
               "Split load isn't smaller than original load");
        assert(LI.getType()->getIntegerBitWidth() ==
               DL.getTypeStoreSizeInBits(LI.getType()) &&
               "Non-byte-multiple bit width");
        // Move the insertion point just past the load so that we can refer to it.
-      IRB.SetInsertPoint(llvm::next(BasicBlock::iterator(&LI)));
+      IRB.SetInsertPoint(std::next(BasicBlock::iterator(&LI)));
        // Create a placeholder value with the same type as LI to use as the
        // basis for the new value. This allows us to replace the uses of LI with
        // the computed value, and then replace the placeholder with LI, leaving
@@ -2249,9 +2249,7 @@ private:
      return !LI.isVolatile() && !IsPtrAdjusted;
    }
  
-  bool rewriteVectorizedStoreInst(Value *V, StoreInst &SI, Value *OldOp,
-                                  uint64_t NewBeginOffset,
-                                  uint64_t NewEndOffset) {
+  bool rewriteVectorizedStoreInst(Value *V, StoreInst &SI, Value *OldOp) {
      if (V->getType() != VecTy) {
        unsigned BeginIndex = getIndex(NewBeginOffset);
        unsigned EndIndex = getIndex(NewEndOffset);
@@ -2277,8 +2275,7 @@ private:
      return true;
    }
  
-  bool rewriteIntegerStore(Value *V, StoreInst &SI,
-                           uint64_t NewBeginOffset, uint64_t NewEndOffset) {
+  bool rewriteIntegerStore(Value *V, StoreInst &SI) {
      assert(IntTy && "We cannot extract an integer from the alloca");
      assert(!SI.isVolatile());
      if (DL.getTypeSizeInBits(V->getType()) != IntTy->getBitWidth()) {
@@ -2311,30 +2308,22 @@ private:
        if (AllocaInst *AI = dyn_cast<AllocaInst>(V->stripInBoundsOffsets()))
          Pass.PostPromotionWorklist.insert(AI);
  
-    // Compute the intersecting offset range.
-    assert(BeginOffset < NewAllocaEndOffset);
-    assert(EndOffset > NewAllocaBeginOffset);
-    uint64_t NewBeginOffset = std::max(BeginOffset, NewAllocaBeginOffset);
-    uint64_t NewEndOffset = std::min(EndOffset, NewAllocaEndOffset);
-
-    uint64_t Size = NewEndOffset - NewBeginOffset;
-    if (Size < DL.getTypeStoreSize(V->getType())) {
+    if (SliceSize < DL.getTypeStoreSize(V->getType())) {
        assert(!SI.isVolatile());
        assert(V->getType()->isIntegerTy() &&
               "Only integer type loads and stores are split");
        assert(V->getType()->getIntegerBitWidth() ==
               DL.getTypeStoreSizeInBits(V->getType()) &&
               "Non-byte-multiple bit width");
-      IntegerType *NarrowTy = Type::getIntNTy(SI.getContext(), Size * 8);
+      IntegerType *NarrowTy = Type::getIntNTy(SI.getContext(), SliceSize * 8);
        V = extractInteger(DL, IRB, V, NarrowTy, NewBeginOffset,
                           "extract");
      }
  
      if (VecTy)
-      return rewriteVectorizedStoreInst(V, SI, OldOp, NewBeginOffset,
-                                        NewEndOffset);
+      return rewriteVectorizedStoreInst(V, SI, OldOp);
      if (IntTy && V->getType()->isIntegerTy())
-      return rewriteIntegerStore(V, SI, NewBeginOffset, NewEndOffset);
+      return rewriteIntegerStore(V, SI);
  
      StoreInst *NewSI;
      if (NewBeginOffset == NewAllocaBeginOffset &&
@@ -2344,12 +2333,9 @@ private:
        NewSI = IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlignment(),
                                       SI.isVolatile());
      } else {
-      Value *NewPtr = getAdjustedAllocaPtr(IRB, NewBeginOffset,
-                                           V->getType()->getPointerTo());
-      NewSI = IRB.CreateAlignedStore(
-          V, NewPtr, getOffsetTypeAlign(V->getType(),
-                                        NewBeginOffset - NewAllocaBeginOffset),
-          SI.isVolatile());
+      Value *NewPtr = getNewAllocaSlicePtr(IRB, V->getType()->getPointerTo());
+      NewSI = IRB.CreateAlignedStore(V, NewPtr, getSliceAlign(V->getType()),
+                                     SI.isVolatile());
      }
      (void)NewSI;
      Pass.DeadInsts.insert(&SI);
@@ -2401,10 +2387,10 @@ private:
      // pointer to the new alloca.
      if (!isa<Constant>(II.getLength())) {
        assert(!IsSplit);
-      assert(BeginOffset >= NewAllocaBeginOffset);
-      II.setDest(getAdjustedAllocaPtr(IRB, BeginOffset, OldPtr->getType()));
+      assert(NewBeginOffset == BeginOffset);
+      II.setDest(getNewAllocaSlicePtr(IRB, OldPtr->getType()));
        Type *CstTy = II.getAlignmentCst()->getType();
-      II.setAlignment(ConstantInt::get(CstTy, getOffsetAlign(BeginOffset)));
+      II.setAlignment(ConstantInt::get(CstTy, getSliceAlign()));
  
        deleteIfTriviallyDead(OldPtr);
        return false;
@@ -2416,13 +2402,6 @@ private:
      Type *AllocaTy = NewAI.getAllocatedType();
      Type *ScalarTy = AllocaTy->getScalarType();
  
-    // Compute the intersecting offset range.
-    assert(BeginOffset < NewAllocaEndOffset);
-    assert(EndOffset > NewAllocaBeginOffset);
-    uint64_t NewBeginOffset = std::max(BeginOffset, NewAllocaBeginOffset);
-    uint64_t NewEndOffset = std::min(EndOffset, NewAllocaEndOffset);
-    uint64_t SliceOffset = NewBeginOffset - NewAllocaBeginOffset;
-
      // If this doesn't map cleanly onto the alloca type, and that type isn't
      // a single value type, just emit a memset.
      if (!VecTy && !IntTy &&
@@ -2434,8 +2413,8 @@ private:
        Type *SizeTy = II.getLength()->getType();
        Constant *Size = ConstantInt::get(SizeTy, NewEndOffset - NewBeginOffset);
        CallInst *New = IRB.CreateMemSet(
-          getAdjustedAllocaPtr(IRB, NewBeginOffset, OldPtr->getType()),
-          II.getValue(), Size, getOffsetAlign(SliceOffset), II.isVolatile());
+          getNewAllocaSlicePtr(IRB, OldPtr->getType()), II.getValue(), Size,
+          getSliceAlign(), II.isVolatile());
        (void)New;
        DEBUG(dbgs() << "          to: " << *New << "\n");
        return false;
@@ -2512,26 +2491,11 @@ private:
  
      DEBUG(dbgs() << "    original: " << II << "\n");
  
-    // Compute the intersecting offset range.
-    assert(BeginOffset < NewAllocaEndOffset);
-    assert(EndOffset > NewAllocaBeginOffset);
-    uint64_t NewBeginOffset = std::max(BeginOffset, NewAllocaBeginOffset);
-    uint64_t NewEndOffset = std::min(EndOffset, NewAllocaEndOffset);
-
      bool IsDest = &II.getRawDestUse() == OldUse;
      assert((IsDest && II.getRawDest() == OldPtr) ||
             (!IsDest && II.getRawSource() == OldPtr));
  
-    // Compute the relative offset within the transfer.
-    unsigned IntPtrWidth = DL.getPointerSizeInBits();
-    APInt RelOffset(IntPtrWidth, NewBeginOffset - BeginOffset);
-
-    unsigned Align = II.getAlignment();
-    uint64_t SliceOffset = NewBeginOffset - NewAllocaBeginOffset;
-    if (Align > 1)
-      Align =
-          MinAlign(RelOffset.zextOrTrunc(64).getZExtValue(),
-                   MinAlign(II.getAlignment(), getOffsetAlign(SliceOffset)));
+    unsigned SliceAlign = getSliceAlign();
  
      // For unsplit intrinsics, we simply modify the source and destination
      // pointers in place. This isn't just an optimization, it is a matter of
@@ -2541,15 +2505,17 @@ private:
      // memcpy, and so simply updating the pointers is the necessary for us to
      // update both source and dest of a single call.
      if (!IsSplittable) {
-      Value *AdjustedPtr =
-          getAdjustedAllocaPtr(IRB, BeginOffset, OldPtr->getType());
+      Value *AdjustedPtr = getNewAllocaSlicePtr(IRB, OldPtr->getType());
        if (IsDest)
          II.setDest(AdjustedPtr);
        else
          II.setSource(AdjustedPtr);
  
-      Type *CstTy = II.getAlignmentCst()->getType();
-      II.setAlignment(ConstantInt::get(CstTy, Align));
+      if (II.getAlignment() > SliceAlign) {
+        Type *CstTy = II.getAlignmentCst()->getType();
+        II.setAlignment(
+            ConstantInt::get(CstTy, MinAlign(II.getAlignment(), SliceAlign)));
+      }
  
        DEBUG(dbgs() << "          to: " << II << "\n");
        deleteIfTriviallyDead(OldPtr);
@@ -2594,33 +2560,33 @@ private:
        Pass.Worklist.insert(AI);
      }
  
-    if (EmitMemCpy) {
-      Type *OtherPtrTy = OtherPtr->getType();
+    Type *OtherPtrTy = OtherPtr->getType();
+    unsigned OtherAS = OtherPtrTy->getPointerAddressSpace();
+
+    // Compute the relative offset for the other pointer within the transfer.
+    unsigned IntPtrWidth = DL.getPointerSizeInBits(OtherAS);
+    APInt OtherOffset(IntPtrWidth, NewBeginOffset - BeginOffset);
+    unsigned OtherAlign = MinAlign(II.getAlignment() ? II.getAlignment() : 1,
+                                   OtherOffset.zextOrTrunc(64).getZExtValue());
  
+    if (EmitMemCpy) {
        // Compute the other pointer, folding as much as possible to produce
        // a single, simple GEP in most cases.
-      OtherPtr = getAdjustedPtr(IRB, DL, OtherPtr, RelOffset, OtherPtrTy,
+      OtherPtr = getAdjustedPtr(IRB, DL, OtherPtr, OtherOffset, OtherPtrTy,
                                  OtherPtr->getName() + ".");
  
-      Value *OurPtr =
-          getAdjustedAllocaPtr(IRB, NewBeginOffset, OldPtr->getType());
+      Value *OurPtr = getNewAllocaSlicePtr(IRB, OldPtr->getType());
        Type *SizeTy = II.getLength()->getType();
        Constant *Size = ConstantInt::get(SizeTy, NewEndOffset - NewBeginOffset);
  
-      CallInst *New = IRB.CreateMemCpy(IsDest ? OurPtr : OtherPtr,
-                                       IsDest ? OtherPtr : OurPtr,
-                                       Size, Align, II.isVolatile());
+      CallInst *New = IRB.CreateMemCpy(
+          IsDest ? OurPtr : OtherPtr, IsDest ? OtherPtr : OurPtr, Size,
+          MinAlign(SliceAlign, OtherAlign), II.isVolatile());
        (void)New;
        DEBUG(dbgs() << "          to: " << *New << "\n");
        return false;
      }
  
-    // Note that we clamp the alignment to 1 here as a 0 alignment for a memcpy
-    // is equivalent to 1, but that isn't true if we end up rewriting this as
-    // a load or store.
-    if (!Align)
-      Align = 1;
-
      bool IsWholeAlloca = NewBeginOffset == NewAllocaBeginOffset &&
                           NewEndOffset == NewAllocaEndOffset;
      uint64_t Size = NewEndOffset - NewBeginOffset;
@@ -2630,23 +2596,30 @@ private:
      IntegerType *SubIntTy
        = IntTy ? Type::getIntNTy(IntTy->getContext(), Size*8) : 0;
  
-    Type *OtherPtrTy = NewAI.getType();
+    // Reset the other pointer type to match the register type we're going to
+    // use, but using the address space of the original other pointer.
      if (VecTy && !IsWholeAlloca) {
        if (NumElements == 1)
          OtherPtrTy = VecTy->getElementType();
        else
          OtherPtrTy = VectorType::get(VecTy->getElementType(), NumElements);
  
-      OtherPtrTy = OtherPtrTy->getPointerTo();
+      OtherPtrTy = OtherPtrTy->getPointerTo(OtherAS);
      } else if (IntTy && !IsWholeAlloca) {
-      OtherPtrTy = SubIntTy->getPointerTo();
+      OtherPtrTy = SubIntTy->getPointerTo(OtherAS);
+    } else {
+      OtherPtrTy = NewAllocaTy->getPointerTo(OtherAS);
      }
  
-    Value *SrcPtr = getAdjustedPtr(IRB, DL, OtherPtr, RelOffset, OtherPtrTy,
+    Value *SrcPtr = getAdjustedPtr(IRB, DL, OtherPtr, OtherOffset, OtherPtrTy,
                                     OtherPtr->getName() + ".");
+    unsigned SrcAlign = OtherAlign;
      Value *DstPtr = &NewAI;
-    if (!IsDest)
+    unsigned DstAlign = SliceAlign;
+    if (!IsDest) {
        std::swap(SrcPtr, DstPtr);
+      std::swap(SrcAlign, DstAlign);
+    }
  
      Value *Src;
      if (VecTy && !IsWholeAlloca && !IsDest) {
@@ -2660,7 +2633,7 @@ private:
        uint64_t Offset = NewBeginOffset - NewAllocaBeginOffset;
        Src = extractInteger(DL, IRB, Src, SubIntTy, Offset, "extract");
      } else {
-      Src = IRB.CreateAlignedLoad(SrcPtr, Align, II.isVolatile(),
+      Src = IRB.CreateAlignedLoad(SrcPtr, SrcAlign, II.isVolatile(),
                                    "copyload");
      }
  
@@ -2678,7 +2651,7 @@ private:
      }
  
      StoreInst *Store = cast<StoreInst>(
-      IRB.CreateAlignedStore(Src, DstPtr, Align, II.isVolatile()));
+        IRB.CreateAlignedStore(Src, DstPtr, DstAlign, II.isVolatile()));
      (void)Store;
      DEBUG(dbgs() << "          to: " << *Store << "\n");
      return !II.isVolatile();
@@ -2690,19 +2663,13 @@ private:
      DEBUG(dbgs() << "    original: " << II << "\n");
      assert(II.getArgOperand(1) == OldPtr);
  
-    // Compute the intersecting offset range.
-    assert(BeginOffset < NewAllocaEndOffset);
-    assert(EndOffset > NewAllocaBeginOffset);
-    uint64_t NewBeginOffset = std::max(BeginOffset, NewAllocaBeginOffset);
-    uint64_t NewEndOffset = std::min(EndOffset, NewAllocaEndOffset);
-
      // Record this instruction for deletion.
      Pass.DeadInsts.insert(&II);
  
      ConstantInt *Size
        = ConstantInt::get(cast<IntegerType>(II.getArgOperand(0)->getType()),
                           NewEndOffset - NewBeginOffset);
-    Value *Ptr = getAdjustedAllocaPtr(IRB, NewBeginOffset, OldPtr->getType());
+    Value *Ptr = getNewAllocaSlicePtr(IRB, OldPtr->getType());
      Value *New;
      if (II.getIntrinsicID() == Intrinsic::lifetime_start)
        New = IRB.CreateLifetimeStart(Ptr, Size);
@@ -2727,8 +2694,7 @@ private:
      PtrBuilder.SetInsertPoint(OldPtr);
      PtrBuilder.SetCurrentDebugLocation(OldPtr->getDebugLoc());
  
-    Value *NewPtr =
-        getAdjustedAllocaPtr(PtrBuilder, BeginOffset, OldPtr->getType());
+    Value *NewPtr = getNewAllocaSlicePtr(PtrBuilder, OldPtr->getType());
      // Replace the operands which were using the old pointer.
      std::replace(PN.op_begin(), PN.op_end(), cast<Value>(OldPtr), NewPtr);
  
@@ -2749,7 +2715,7 @@ private:
      assert(BeginOffset >= NewAllocaBeginOffset && "Selects are unsplittable");
      assert(EndOffset <= NewAllocaEndOffset && "Selects are unsplittable");
  
-    Value *NewPtr = getAdjustedAllocaPtr(IRB, BeginOffset, OldPtr->getType());
+    Value *NewPtr = getNewAllocaSlicePtr(IRB, OldPtr->getType());
      // Replace the operands which were using the old pointer.
      if (SI.getOperand(1) == OldPtr)
        SI.setOperand(1, NewPtr);
@@ -2811,10 +2777,9 @@ private:
    /// Enqueue all the users of the given instruction for further processing.
    /// This uses a set to de-duplicate users.
    void enqueueUsers(Instruction &I) {
-    for (Value::use_iterator UI = I.use_begin(), UE = I.use_end(); UI != UE;
-         ++UI)
-      if (Visited.insert(*UI))
-        Queue.push_back(&UI.getUse());
+    for (Use &U : I.uses())
+      if (Visited.insert(U.getUser()))
+        Queue.push_back(&U);
    }
  
    // Conservative default is to not rewrite anything.
@@ -3284,18 +3249,6 @@ bool SROA::rewritePartition(AllocaInst &AI, AllocaSlices &S,
    return true;
  }
  
-namespace {
-struct IsSliceEndLessOrEqualTo {
-  uint64_t UpperBound;
-
-  IsSliceEndLessOrEqualTo(uint64_t UpperBound) : UpperBound(UpperBound) {}
-
-  bool operator()(const AllocaSlices::iterator &I) {
-    return I->endOffset() <= UpperBound;
-  }
-};
-}
-
  static void
  removeFinishedSplitUses(SmallVectorImpl<AllocaSlices::iterator> &SplitUses,
                          uint64_t &MaxSplitUseEndOffset, uint64_t Offset) {
@@ -3307,7 +3260,9 @@ removeFinishedSplitUses(SmallVectorImpl<AllocaSlices::iterator> &SplitUses,
  
    size_t SplitUsesOldSize = SplitUses.size();
    SplitUses.erase(std::remove_if(SplitUses.begin(), SplitUses.end(),
-                                 IsSliceEndLessOrEqualTo(Offset)),
+                                 [Offset](const AllocaSlices::iterator &I) {
+                    return I->endOffset() <= Offset;
+                  }),
                    SplitUses.end());
    if (SplitUsesOldSize == SplitUses.size())
      return;
@@ -3334,7 +3289,7 @@ bool SROA::splitAlloca(AllocaInst &AI, AllocaSlices &S) {
  
    uint64_t BeginOffset = S.begin()->beginOffset();
  
-  for (AllocaSlices::iterator SI = S.begin(), SJ = llvm::next(SI), SE = S.end();
+  for (AllocaSlices::iterator SI = S.begin(), SJ = std::next(SI), SE = S.end();
         SI != SE; SI = SJ) {
      uint64_t MaxEndOffset = SI->endOffset();
  
@@ -3486,9 +3441,8 @@ bool SROA::runOnAlloca(AllocaInst &AI) {
                                          DE = S.dead_user_end();
         DI != DE; ++DI) {
      // Free up everything used by this instruction.
-    for (User::op_iterator DOI = (*DI)->op_begin(), DOE = (*DI)->op_end();
-         DOI != DOE; ++DOI)
-      clobberUse(*DOI);
+    for (Use &DeadOp : (*DI)->operands())
+      clobberUse(DeadOp);
  
      // Now replace the uses of this instruction.
      (*DI)->replaceAllUsesWith(UndefValue::get((*DI)->getType()));
@@ -3537,10 +3491,10 @@ void SROA::deleteDeadInstructions(SmallPtrSet<AllocaInst*, 4> &DeletedAllocas) {
  
      I->replaceAllUsesWith(UndefValue::get(I->getType()));
  
-    for (User::op_iterator OI = I->op_begin(), E = I->op_end(); OI != E; ++OI)
-      if (Instruction *U = dyn_cast<Instruction>(*OI)) {
+    for (Use &Operand : I->operands())
+      if (Instruction *U = dyn_cast<Instruction>(Operand)) {
          // Zero out the operand and see if it becomes trivially dead.
-        *OI = 0;
+        Operand = 0;
          if (isInstructionTriviallyDead(U))
            DeadInsts.insert(U);
        }
@@ -3556,10 +3510,9 @@ void SROA::deleteDeadInstructions(SmallPtrSet<AllocaInst*, 4> &DeletedAllocas) {
  static void enqueueUsersInWorklist(Instruction &I,
                                     SmallVectorImpl<Instruction *> &Worklist,
                                     SmallPtrSet<Instruction *, 8> &Visited) {
-  for (Value::use_iterator UI = I.use_begin(), UE = I.use_end(); UI != UE;
-       ++UI)
-    if (Visited.insert(cast<Instruction>(*UI)))
-      Worklist.push_back(cast<Instruction>(*UI));
+  for (User *U : I.users())
+    if (Visited.insert(cast<Instruction>(U)))
+      Worklist.push_back(cast<Instruction>(U));
  }
  
  /// \brief Promote the allocas, using the best available technique.
@@ -3645,20 +3598,6 @@ bool SROA::promoteAllocas(Function &F) {
    return true;
  }
  
-namespace {
-  /// \brief A predicate to test whether an alloca belongs to a set.
-  class IsAllocaInSet {
-    typedef SmallPtrSet<AllocaInst *, 4> SetType;
-    const SetType &Set;
-
-  public:
-    typedef AllocaInst *argument_type;
-
-    IsAllocaInSet(const SetType &Set) : Set(Set) {}
-    bool operator()(AllocaInst *AI) const { return Set.count(AI); }
-  };
-}
-
  bool SROA::runOnFunction(Function &F) {
    if (skipOptnoneFunction(F))
      return false;
@@ -3676,7 +3615,7 @@ bool SROA::runOnFunction(Function &F) {
    DT = DTWP ? &DTWP->getDomTree() : 0;
  
    BasicBlock &EntryBB = F.getEntryBlock();
-  for (BasicBlock::iterator I = EntryBB.begin(), E = llvm::prior(EntryBB.end());
+  for (BasicBlock::iterator I = EntryBB.begin(), E = std::prev(EntryBB.end());
         I != E; ++I)
      if (AllocaInst *AI = dyn_cast<AllocaInst>(I))
        Worklist.insert(AI);
@@ -3694,11 +3633,14 @@ bool SROA::runOnFunction(Function &F) {
        // Remove the deleted allocas from various lists so that we don't try to
        // continue processing them.
        if (!DeletedAllocas.empty()) {
-        Worklist.remove_if(IsAllocaInSet(DeletedAllocas));
-        PostPromotionWorklist.remove_if(IsAllocaInSet(DeletedAllocas));
+        auto IsInSet = [&](AllocaInst *AI) {
+          return DeletedAllocas.count(AI);
+        };
+        Worklist.remove_if(IsInSet);
+        PostPromotionWorklist.remove_if(IsInSet);
          PromotableAllocas.erase(std::remove_if(PromotableAllocas.begin(),
                                                 PromotableAllocas.end(),
-                                               IsAllocaInSet(DeletedAllocas)),
+                                               IsInSet),
                                  PromotableAllocas.end());
          DeletedAllocas.clear();
        }