Teach the bottom-up pre-RA scheduler to track register pressure. Work in progress.

[oota-llvm.git] / lib / CodeGen / SelectionDAG / SelectionDAG.cpp
diff --git a/lib/CodeGen/SelectionDAG/SelectionDAG.cpp b/lib/CodeGen/SelectionDAG/SelectionDAG.cpp

index 7dea29c8c7becffca8db26c465ba83a4924365c2..27d7a829d9fcf5ffdb3c6e9b1562a1facbab5293 100644 (file)
--- a/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
+++ b/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
@@ -15,6 +15,7 @@
  #include "SDNodeOrdering.h"
  #include "SDNodeDbgValue.h"
  #include "llvm/Constants.h"
+#include "llvm/Analysis/DebugInfo.h"
  #include "llvm/Analysis/ValueTracking.h"
  #include "llvm/Function.h"
  #include "llvm/GlobalAlias.h"
@@ -32,6 +33,7 @@
  #include "llvm/Target/TargetData.h"
  #include "llvm/Target/TargetFrameInfo.h"
  #include "llvm/Target/TargetLowering.h"
+#include "llvm/Target/TargetSelectionDAGInfo.h"
  #include "llvm/Target/TargetOptions.h"
  #include "llvm/Target/TargetInstrInfo.h"
  #include "llvm/Target/TargetIntrinsicInfo.h"
@@ -304,10 +306,6 @@ ISD::CondCode ISD::getSetCCAndOperation(ISD::CondCode Op1, ISD::CondCode Op2,
    return Result;
  }
  
-const TargetMachine &SelectionDAG::getTarget() const {
-  return MF->getTarget();
-}
-
  //===----------------------------------------------------------------------===//
  //                           SDNode Profile Support
  //===----------------------------------------------------------------------===//
@@ -792,8 +790,8 @@ unsigned SelectionDAG::getEVTAlignment(EVT VT) const {
  }
  
  // EntryNode could meaningfully have debug info if we can find it...
-SelectionDAG::SelectionDAG(TargetLowering &tli, FunctionLoweringInfo &fli)
-  : TLI(tli), FLI(fli),
+SelectionDAG::SelectionDAG(const TargetMachine &tm)
+  : TM(tm), TLI(*tm.getTargetLowering()), TSI(*tm.getSelectionDAGInfo()),
      EntryNode(ISD::EntryToken, DebugLoc(), getVTList(MVT::Other)),
      Root(getEntryNode()), Ordering(0) {
    AllNodes.push_back(&EntryNode);
@@ -801,16 +799,14 @@ SelectionDAG::SelectionDAG(TargetLowering &tli, FunctionLoweringInfo &fli)
    DbgInfo = new SDDbgInfo();
  }
  
-void SelectionDAG::init(MachineFunction &mf, MachineModuleInfo *mmi) {
+void SelectionDAG::init(MachineFunction &mf) {
    MF = &mf;
-  MMI = mmi;
    Context = &mf.getFunction()->getContext();
  }
  
  SelectionDAG::~SelectionDAG() {
    allnodes_clear();
    delete Ordering;
-  DbgInfo->clear();
    delete DbgInfo;
  }
  
@@ -837,11 +833,8 @@ void SelectionDAG::clear() {
    EntryNode.UseList = 0;
    AllNodes.push_back(&EntryNode);
    Root = getEntryNode();
-  delete Ordering;
-  Ordering = new SDNodeOrdering();
+  Ordering->clear();
    DbgInfo->clear();
-  delete DbgInfo;
-  DbgInfo = new SDDbgInfo();
  }
  
  SDValue SelectionDAG::getSExtOrTrunc(SDValue Op, DebugLoc DL, EVT VT) {
@@ -968,11 +961,21 @@ SDValue SelectionDAG::getConstantFP(double Val, EVT VT, bool isTarget) {
    EVT EltVT = VT.getScalarType();
    if (EltVT==MVT::f32)
      return getConstantFP(APFloat((float)Val), VT, isTarget);
-  else
+  else if (EltVT==MVT::f64)
      return getConstantFP(APFloat(Val), VT, isTarget);
+  else if (EltVT==MVT::f80 || EltVT==MVT::f128) {
+    bool ignored;
+    APFloat apf = APFloat(Val);
+    apf.convert(*EVTToAPFloatSemantics(EltVT), APFloat::rmNearestTiesToEven,
+                &ignored);
+    return getConstantFP(apf, VT, isTarget);
+  } else {
+    assert(0 && "Unsupported type in getConstantFP");
+    return SDValue();
+  }
  }
  
-SDValue SelectionDAG::getGlobalAddress(const GlobalValue *GV,
+SDValue SelectionDAG::getGlobalAddress(const GlobalValue *GV, DebugLoc DL,
                                         EVT VT, int64_t Offset,
                                         bool isTargetGA,
                                         unsigned char TargetFlags) {
@@ -1007,7 +1010,7 @@ SDValue SelectionDAG::getGlobalAddress(const GlobalValue *GV,
    if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
      return SDValue(E, 0);
  
-  SDNode *N = new (NodeAllocator) GlobalAddressSDNode(Opc, GV, VT,
+  SDNode *N = new (NodeAllocator) GlobalAddressSDNode(Opc, DL, GV, VT,
                                                        Offset, TargetFlags);
    CSEMap.InsertNode(N, IP);
    AllNodes.push_back(N);
@@ -1049,7 +1052,7 @@ SDValue SelectionDAG::getJumpTable(int JTI, EVT VT, bool isTarget,
    return SDValue(N, 0);
  }
  
-SDValue SelectionDAG::getConstantPool(Constant *C, EVT VT,
+SDValue SelectionDAG::getConstantPool(const Constant *C, EVT VT,
                                        unsigned Alignment, int Offset,
                                        bool isTarget,
                                        unsigned char TargetFlags) {
@@ -1320,7 +1323,7 @@ SDValue SelectionDAG::getEHLabel(DebugLoc dl, SDValue Root, MCSymbol *Label) {
  }
  
  
-SDValue SelectionDAG::getBlockAddress(BlockAddress *BA, EVT VT,
+SDValue SelectionDAG::getBlockAddress(const BlockAddress *BA, EVT VT,
                                        bool isTarget,
                                        unsigned char TargetFlags) {
    unsigned Opc = isTarget ? ISD::TargetBlockAddress : ISD::BlockAddress;
@@ -1357,6 +1360,23 @@ SDValue SelectionDAG::getSrcValue(const Value *V) {
    return SDValue(N, 0);
  }
  
+/// getMDNode - Return an MDNodeSDNode which holds an MDNode.
+SDValue SelectionDAG::getMDNode(const MDNode *MD) {
+  FoldingSetNodeID ID;
+  AddNodeIDNode(ID, ISD::MDNODE_SDNODE, getVTList(MVT::Other), 0, 0);
+  ID.AddPointer(MD);
+  
+  void *IP = 0;
+  if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
+    return SDValue(E, 0);
+  
+  SDNode *N = new (NodeAllocator) MDNodeSDNode(MD);
+  CSEMap.InsertNode(N, IP);
+  AllNodes.push_back(N);
+  return SDValue(N, 0);
+}
+
+
  /// getShiftAmountOperand - Return the specified value casted to
  /// the target's desired shift amount type.
  SDValue SelectionDAG::getShiftAmountOperand(SDValue Op) {
@@ -1905,7 +1925,8 @@ void SelectionDAG::ComputeMaskedBits(SDValue Op, const APInt &Mask,
      // Output known-0 bits are known if clear or set in both the low clear bits
      // common to both LHS & RHS.  For example, 8+(X<<3) is known to have the
      // low 3 bits clear.
-    APInt Mask2 = APInt::getLowBitsSet(BitWidth, Mask.countTrailingOnes());
+    APInt Mask2 = APInt::getLowBitsSet(BitWidth,
+                                       BitWidth - Mask.countLeadingZeros());
      ComputeMaskedBits(Op.getOperand(0), Mask2, KnownZero2, KnownOne2, Depth+1);
      assert((KnownZero2 & KnownOne2) == 0 && "Bits known to be one AND zero?");
      unsigned KnownZeroOut = KnownZero2.countTrailingOnes();
@@ -2215,7 +2236,7 @@ unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, unsigned Depth) const{
  
  bool SelectionDAG::isKnownNeverNaN(SDValue Op) const {
    // If we're told that NaNs won't happen, assume they won't.
-  if (FiniteOnlyFPMath())
+  if (NoNaNsFPMath)
      return true;
  
    // If the value is a constant, we can obviously see if it is a NaN or not.
@@ -2254,10 +2275,9 @@ bool SelectionDAG::isVerifiedDebugInfoDesc(SDValue Op) const {
    GlobalAddressSDNode *GA = dyn_cast<GlobalAddressSDNode>(Op);
    if (!GA) return false;
    if (GA->getOffset() != 0) return false;
-  GlobalVariable *GV = dyn_cast<GlobalVariable>(GA->getGlobal());
+  const GlobalVariable *GV = dyn_cast<GlobalVariable>(GA->getGlobal());
    if (!GV) return false;
-  MachineModuleInfo *MMI = getMachineModuleInfo();
-  return MMI && MMI->hasDebugInfo();
+  return MF->getMMI().hasDebugInfo();
  }
  
  
@@ -2266,7 +2286,6 @@ bool SelectionDAG::isVerifiedDebugInfoDesc(SDValue Op) const {
  SDValue SelectionDAG::getShuffleScalarElt(const ShuffleVectorSDNode *N,
                                            unsigned i) {
    EVT VT = N->getValueType(0);
-  DebugLoc dl = N->getDebugLoc();
    if (N->getMaskElt(i) < 0)
      return getUNDEF(VT.getVectorElementType());
    unsigned Index = N->getMaskElt(i);
@@ -2450,9 +2469,18 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL,
              VT.getVectorNumElements() ==
              Operand.getValueType().getVectorNumElements()) &&
             "Vector element count mismatch!");
-    if (OpOpcode == ISD::ZERO_EXTEND || OpOpcode == ISD::SIGN_EXTEND)
+
+    if (OpOpcode == ISD::ZERO_EXTEND || OpOpcode == ISD::SIGN_EXTEND ||
+        OpOpcode == ISD::ANY_EXTEND)
        // (ext (zext x)) -> (zext x)  and  (ext (sext x)) -> (sext x)
        return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
+
+    // (ext (trunc x)) -> x
+    if (OpOpcode == ISD::TRUNCATE) {
+      SDValue OpOp = Operand.getNode()->getOperand(0);
+      if (OpOp.getValueType() == VT)
+        return OpOp;
+    }
      break;
    case ISD::TRUNCATE:
      assert(VT.isInteger() && Operand.getValueType().isInteger() &&
@@ -2597,12 +2625,13 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
      if (N1.getOpcode() == ISD::BUILD_VECTOR &&
          N2.getOpcode() == ISD::BUILD_VECTOR) {
        SmallVector<SDValue, 16> Elts(N1.getNode()->op_begin(), N1.getNode()->op_end());
-      Elts.insert(Elts.end(), N2.getNode()->op_begin(), N2.getNode()->op_end());
+      Elts.append(N2.getNode()->op_begin(), N2.getNode()->op_end());
        return getNode(ISD::BUILD_VECTOR, DL, VT, &Elts[0], Elts.size());
      }
      break;
    case ISD::AND:
-    assert(VT.isInteger() && N1.getValueType() == N2.getValueType() &&
+    assert(VT.isInteger() && "This operator does not apply to FP types!");
+    assert(N1.getValueType() == N2.getValueType() &&
             N1.getValueType() == VT && "Binary operator types must match!");
      // (X & 0) -> 0.  This commonly occurs when legalizing i64 values, so it's
      // worth handling here.
@@ -2615,7 +2644,8 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
    case ISD::XOR:
    case ISD::ADD:
    case ISD::SUB:
-    assert(VT.isInteger() && N1.getValueType() == N2.getValueType() &&
+    assert(VT.isInteger() && "This operator does not apply to FP types!");
+    assert(N1.getValueType() == N2.getValueType() &&
             N1.getValueType() == VT && "Binary operator types must match!");
      // (X ^|+- 0) -> X.  This commonly occurs when legalizing i64 values, so
      // it's worth handling here.
@@ -2630,7 +2660,9 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
    case ISD::SDIV:
    case ISD::SREM:
      assert(VT.isInteger() && "This operator does not apply to FP types!");
-    // fall through
+    assert(N1.getValueType() == N2.getValueType() &&
+           N1.getValueType() == VT && "Binary operator types must match!");
+    break;
    case ISD::FADD:
    case ISD::FSUB:
    case ISD::FMUL:
@@ -2653,6 +2685,7 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
              return N1;
        }
      }
+    assert(VT.isFloatingPoint() && "This operator only applies to FP types!");
      assert(N1.getValueType() == N2.getValueType() &&
             N1.getValueType() == VT && "Binary operator types must match!");
      break;
@@ -2780,14 +2813,19 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
        // If the indices are the same, return the inserted element else
        // if the indices are known different, extract the element from
        // the original vector.
-      if (N1.getOperand(2) == N2) {
-        if (VT == N1.getOperand(1).getValueType())
-          return N1.getOperand(1);
-        else
-          return getSExtOrTrunc(N1.getOperand(1), DL, VT);
-      } else if (isa<ConstantSDNode>(N1.getOperand(2)) &&
-                 isa<ConstantSDNode>(N2))
+      SDValue N1Op2 = N1.getOperand(2);
+      ConstantSDNode *N1Op2C = dyn_cast<ConstantSDNode>(N1Op2.getNode());
+
+      if (N1Op2C && N2C) {
+        if (N1Op2C->getZExtValue() == N2C->getZExtValue()) {
+          if (VT == N1.getOperand(1).getValueType())
+            return N1.getOperand(1);
+          else
+            return getSExtOrTrunc(N1.getOperand(1), DL, VT);
+        }
+
          return getNode(ISD::EXTRACT_VECTOR_ELT, DL, VT, N1.getOperand(0), N2);
+      }
      }
      break;
    case ISD::EXTRACT_ELEMENT:
@@ -2976,7 +3014,6 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
                                SDValue N1, SDValue N2, SDValue N3) {
    // Perform various simplifications.
    ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1.getNode());
-  ConstantSDNode *N2C = dyn_cast<ConstantSDNode>(N2.getNode());
    switch (Opcode) {
    case ISD::CONCAT_VECTORS:
      // A CONCAT_VECTOR with all operands BUILD_VECTOR can be simplified to
@@ -2985,8 +3022,8 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
          N2.getOpcode() == ISD::BUILD_VECTOR &&
          N3.getOpcode() == ISD::BUILD_VECTOR) {
        SmallVector<SDValue, 16> Elts(N1.getNode()->op_begin(), N1.getNode()->op_end());
-      Elts.insert(Elts.end(), N2.getNode()->op_begin(), N2.getNode()->op_end());
-      Elts.insert(Elts.end(), N3.getNode()->op_begin(), N3.getNode()->op_end());
+      Elts.append(N2.getNode()->op_begin(), N2.getNode()->op_end());
+      Elts.append(N3.getNode()->op_begin(), N3.getNode()->op_end());
        return getNode(ISD::BUILD_VECTOR, DL, VT, &Elts[0], Elts.size());
      }
      break;
@@ -3006,14 +3043,6 @@ SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
  
      if (N2 == N3) return N2;   // select C, X, X -> X
      break;
-  case ISD::BRCOND:
-    if (N2C) {
-      if (N2C->getZExtValue()) // Unconditional branch
-        return getNode(ISD::BR, DL, MVT::Other, N1, N3);
-      else
-        return N1;         // Never-taken branch
-    }
-    break;
    case ISD::VECTOR_SHUFFLE:
      llvm_unreachable("should use getVectorShuffle constructor!");
      break;
@@ -3180,7 +3209,7 @@ static bool isMemSrcFromString(SDValue Src, std::string &Str) {
    if (!G)
      return false;
  
-  GlobalVariable *GV = dyn_cast<GlobalVariable>(G->getGlobal());
+  const GlobalVariable *GV = dyn_cast<GlobalVariable>(G->getGlobal());
    if (GV && GetConstantStringInfo(GV, Str, SrcDelta, false))
      return true;
  
@@ -3195,6 +3224,7 @@ static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
                                       unsigned Limit, uint64_t Size,
                                       unsigned DstAlign, unsigned SrcAlign,
                                       bool NonScalarIntSafe,
+                                     bool MemcpyStrSrc,
                                       SelectionDAG &DAG,
                                       const TargetLowering &TLI) {
    assert((SrcAlign == 0 || SrcAlign >= DstAlign) &&
@@ -3203,16 +3233,17 @@ static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
    // the value, i.e. memset or memcpy from constant string. Otherwise, it's
    // the inferred alignment of the source. 'DstAlign', on the other hand, is the
    // specified alignment of the memory operation. If it is zero, that means
-  // it's possible to change the alignment of the destination.
+  // it's possible to change the alignment of the destination. 'MemcpyStrSrc'
+  // indicates whether the memcpy source is constant so it does not need to be
+  // loaded.
    EVT VT = TLI.getOptimalMemOpType(Size, DstAlign, SrcAlign,
-                                   NonScalarIntSafe, DAG);
+                                   NonScalarIntSafe, MemcpyStrSrc,
+                                   DAG.getMachineFunction());
  
    if (VT == MVT::Other) {
-    VT = TLI.getPointerTy();
-    const Type *Ty = VT.getTypeForEVT(*DAG.getContext());
-    if (DstAlign >= TLI.getTargetData()->getABITypeAlignment(Ty) ||
+    if (DstAlign >= TLI.getTargetData()->getPointerPrefAlignment() ||
          TLI.allowsUnalignedMemoryAccesses(VT)) {
-      VT = MVT::i64;
+      VT = TLI.getPointerTy();
      } else {
        switch (DstAlign & 7) {
        case 0:  VT = MVT::i64; break;
@@ -3230,6 +3261,15 @@ static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
      if (VT.bitsGT(LVT))
        VT = LVT;
    }
+  
+  // If we're optimizing for size, and there is a limit, bump the maximum number
+  // of operations inserted down to 4.  This is a wild guess that approximates
+  // the size of a call to memcpy or memset (3 arguments + call).
+  if (Limit != ~0U) {
+    const Function *F = DAG.getMachineFunction().getFunction();
+    if (F->hasFnAttr(Attribute::OptimizeForSize))
+      Limit = 4;
+  }
  
    unsigned NumMemOps = 0;
    while (Size != 0) {
@@ -3273,9 +3313,6 @@ static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
    // below a certain threshold.
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    std::vector<EVT> MemOps;
-  uint64_t Limit = -1ULL;
-  if (!AlwaysInline)
-    Limit = TLI.getMaxStoresPerMemcpy();
    bool DstAlignCanChange = false;
    MachineFrameInfo *MFI = DAG.getMachineFunction().getFrameInfo();
    FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
@@ -3287,9 +3324,12 @@ static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
    std::string Str;
    bool CopyFromStr = isMemSrcFromString(Src, Str);
    bool isZeroStr = CopyFromStr && Str.empty();
+  unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemcpy();
+  
    if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
                                  (DstAlignCanChange ? 0 : Align),
-                                (isZeroStr ? 0 : SrcAlign), true, DAG, TLI))
+                                (isZeroStr ? 0 : SrcAlign),
+                                true, CopyFromStr, DAG, TLI))
      return SDValue();
  
    if (DstAlignCanChange) {
@@ -3330,7 +3370,7 @@ static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
        // FIXME does the case above also need this?
        EVT NVT = TLI.getTypeToTransformTo(*DAG.getContext(), VT);
        assert(NVT.bitsGE(VT));
-      Value = DAG.getExtLoad(ISD::EXTLOAD, dl, NVT, Chain,
+      Value = DAG.getExtLoad(ISD::EXTLOAD, NVT, dl, Chain,
                               getMemBasePlusOffset(Src, SrcOff, DAG),
                               SrcSV, SrcSVOff + SrcOff, VT, isVol, false,
                               MinAlign(SrcAlign, SrcOff));
@@ -3363,9 +3403,6 @@ static SDValue getMemmoveLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
    // below a certain threshold.
    const TargetLowering &TLI = DAG.getTargetLoweringInfo();
    std::vector<EVT> MemOps;
-  uint64_t Limit = -1ULL;
-  if (!AlwaysInline)
-    Limit = TLI.getMaxStoresPerMemmove();
    bool DstAlignCanChange = false;
    MachineFrameInfo *MFI = DAG.getMachineFunction().getFrameInfo();
    FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
@@ -3374,10 +3411,11 @@ static SDValue getMemmoveLoadsAndStores(SelectionDAG &DAG, DebugLoc dl,
    unsigned SrcAlign = DAG.InferPtrAlignment(Src);
    if (Align > SrcAlign)
      SrcAlign = Align;
+  unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemmove();
  
    if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
                                  (DstAlignCanChange ? 0 : Align),
-                                SrcAlign, true, DAG, TLI))
+                                SrcAlign, true, false, DAG, TLI))
      return SDValue();
  
    if (DstAlignCanChange) {
@@ -3449,7 +3487,7 @@ static SDValue getMemsetStores(SelectionDAG &DAG, DebugLoc dl,
      isa<ConstantSDNode>(Src) && cast<ConstantSDNode>(Src)->isNullValue();
    if (!FindOptimalMemOpLowering(MemOps, TLI.getMaxStoresPerMemset(),
                                  Size, (DstAlignCanChange ? 0 : Align), 0,
-                                NonScalarIntSafe, DAG, TLI))
+                                NonScalarIntSafe, false, DAG, TLI))
      return SDValue();
  
    if (DstAlignCanChange) {
@@ -3505,7 +3543,7 @@ SDValue SelectionDAG::getMemcpy(SDValue Chain, DebugLoc dl, SDValue Dst,
    // Then check to see if we should lower the memcpy with target-specific
    // code. If the target chooses to do this, this is the next best.
    SDValue Result =
-    TLI.EmitTargetCodeForMemcpy(*this, dl, Chain, Dst, Src, Size, Align,
+    TSI.EmitTargetCodeForMemcpy(*this, dl, Chain, Dst, Src, Size, Align,
                                  isVol, AlwaysInline,
                                  DstSV, DstSVOff, SrcSV, SrcSVOff);
    if (Result.getNode())
@@ -3520,8 +3558,13 @@ SDValue SelectionDAG::getMemcpy(SDValue Chain, DebugLoc dl, SDValue Dst,
                                     true, DstSV, DstSVOff, SrcSV, SrcSVOff);
    }
  
+  // FIXME: If the memcpy is volatile (isVol), lowering it to a plain libc
+  // memcpy is not guaranteed to be safe. libc memcpys aren't required to
+  // respect volatile, so they may do things like read or write memory
+  // beyond the given memory regions. But fixing this isn't easy, and most
+  // people don't care.
+
    // Emit a library call.
-  assert(!isVol && "library memcpy does not support volatile");
    TargetLowering::ArgListTy Args;
    TargetLowering::ArgListEntry Entry;
    Entry.Ty = TLI.getTargetData()->getIntPtrType(*getContext());
@@ -3565,13 +3608,15 @@ SDValue SelectionDAG::getMemmove(SDValue Chain, DebugLoc dl, SDValue Dst,
    // Then check to see if we should lower the memmove with target-specific
    // code. If the target chooses to do this, this is the next best.
    SDValue Result =
-    TLI.EmitTargetCodeForMemmove(*this, dl, Chain, Dst, Src, Size, Align, isVol,
+    TSI.EmitTargetCodeForMemmove(*this, dl, Chain, Dst, Src, Size, Align, isVol,
                                   DstSV, DstSVOff, SrcSV, SrcSVOff);
    if (Result.getNode())
      return Result;
  
+  // FIXME: If the memmove is volatile, lowering it to plain libc memmove may
+  // not be safe.  See memcpy above for more details.
+
    // Emit a library call.
-  assert(!isVol && "library memmove does not support volatile");
    TargetLowering::ArgListTy Args;
    TargetLowering::ArgListEntry Entry;
    Entry.Ty = TLI.getTargetData()->getIntPtrType(*getContext());
@@ -3614,13 +3659,12 @@ SDValue SelectionDAG::getMemset(SDValue Chain, DebugLoc dl, SDValue Dst,
    // Then check to see if we should lower the memset with target-specific
    // code. If the target chooses to do this, this is the next best.
    SDValue Result =
-    TLI.EmitTargetCodeForMemset(*this, dl, Chain, Dst, Src, Size, Align, isVol,
+    TSI.EmitTargetCodeForMemset(*this, dl, Chain, Dst, Src, Size, Align, isVol,
                                  DstSV, DstSVOff);
    if (Result.getNode())
      return Result;
  
-  // Emit a library call.
-  assert(!isVol && "library memset does not support volatile");
+  // Emit a library call.  
    const Type *IntPtrTy = TLI.getTargetData()->getIntPtrType(*getContext());
    TargetLowering::ArgListTy Args;
    TargetLowering::ArgListEntry Entry;
@@ -3851,8 +3895,8 @@ SelectionDAG::getMemIntrinsicNode(unsigned Opcode, DebugLoc dl, SDVTList VTList,
  }
  
  SDValue
-SelectionDAG::getLoad(ISD::MemIndexedMode AM, DebugLoc dl,
-                      ISD::LoadExtType ExtType, EVT VT, SDValue Chain,
+SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType,
+                      EVT VT, DebugLoc dl, SDValue Chain,
                        SDValue Ptr, SDValue Offset,
                        const Value *SV, int SVOffset, EVT MemVT,
                        bool isVolatile, bool isNonTemporal,
@@ -3875,12 +3919,12 @@ SelectionDAG::getLoad(ISD::MemIndexedMode AM, DebugLoc dl,
    MachineMemOperand *MMO =
      MF.getMachineMemOperand(SV, Flags, SVOffset,
                              MemVT.getStoreSize(), Alignment);
-  return getLoad(AM, dl, ExtType, VT, Chain, Ptr, Offset, MemVT, MMO);
+  return getLoad(AM, ExtType, VT, dl, Chain, Ptr, Offset, MemVT, MMO);
  }
  
  SDValue
-SelectionDAG::getLoad(ISD::MemIndexedMode AM, DebugLoc dl,
-                      ISD::LoadExtType ExtType, EVT VT, SDValue Chain,
+SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType, 
+                      EVT VT, DebugLoc dl, SDValue Chain,
                        SDValue Ptr, SDValue Offset, EVT MemVT,
                        MachineMemOperand *MMO) {
    if (VT == MemVT) {
@@ -3930,18 +3974,18 @@ SDValue SelectionDAG::getLoad(EVT VT, DebugLoc dl,
                                bool isVolatile, bool isNonTemporal,
                                unsigned Alignment) {
    SDValue Undef = getUNDEF(Ptr.getValueType());
-  return getLoad(ISD::UNINDEXED, dl, ISD::NON_EXTLOAD, VT, Chain, Ptr, Undef,
+  return getLoad(ISD::UNINDEXED, ISD::NON_EXTLOAD, VT, dl, Chain, Ptr, Undef,
                   SV, SVOffset, VT, isVolatile, isNonTemporal, Alignment);
  }
  
-SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, DebugLoc dl, EVT VT,
+SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, EVT VT, DebugLoc dl,
                                   SDValue Chain, SDValue Ptr,
                                   const Value *SV,
                                   int SVOffset, EVT MemVT,
                                   bool isVolatile, bool isNonTemporal,
                                   unsigned Alignment) {
    SDValue Undef = getUNDEF(Ptr.getValueType());
-  return getLoad(ISD::UNINDEXED, dl, ExtType, VT, Chain, Ptr, Undef,
+  return getLoad(ISD::UNINDEXED, ExtType, VT, dl, Chain, Ptr, Undef,
                   SV, SVOffset, MemVT, isVolatile, isNonTemporal, Alignment);
  }
  
@@ -3951,7 +3995,7 @@ SelectionDAG::getIndexedLoad(SDValue OrigLoad, DebugLoc dl, SDValue Base,
    LoadSDNode *LD = cast<LoadSDNode>(OrigLoad);
    assert(LD->getOffset().getOpcode() == ISD::UNDEF &&
           "Load is already a indexed load!");
-  return getLoad(AM, dl, LD->getExtensionType(), OrigLoad.getValueType(),
+  return getLoad(AM, LD->getExtensionType(), OrigLoad.getValueType(), dl,
                   LD->getChain(), Base, Offset, LD->getSrcValue(),
                   LD->getSrcValueOffset(), LD->getMemoryVT(),
                   LD->isVolatile(), LD->isNonTemporal(), LD->getAlignment());
@@ -4097,9 +4141,10 @@ SelectionDAG::getIndexedStore(SDValue OrigStore, DebugLoc dl, SDValue Base,
  
  SDValue SelectionDAG::getVAArg(EVT VT, DebugLoc dl,
                                 SDValue Chain, SDValue Ptr,
-                               SDValue SV) {
-  SDValue Ops[] = { Chain, Ptr, SV };
-  return getNode(ISD::VAARG, dl, getVTList(VT, MVT::Other), Ops, 3);
+                               SDValue SV,
+                               unsigned Align) {
+  SDValue Ops[] = { Chain, Ptr, SV, getTargetConstant(Align, MVT::i32) };
+  return getNode(ISD::VAARG, dl, getVTList(VT, MVT::Other), Ops, 4);
  }
  
  SDValue SelectionDAG::getNode(unsigned Opcode, DebugLoc DL, EVT VT,
@@ -4381,17 +4426,16 @@ SDVTList SelectionDAG::getVTList(const EVT *VTs, unsigned NumVTs) {
  /// already exists.  If the resultant node does not exist in the DAG, the
  /// input node is returned.  As a degenerate case, if you specify the same
  /// input operands as the node already has, the input node is returned.
-SDValue SelectionDAG::UpdateNodeOperands(SDValue InN, SDValue Op) {
-  SDNode *N = InN.getNode();
+SDNode *SelectionDAG::UpdateNodeOperands(SDNode *N, SDValue Op) {
    assert(N->getNumOperands() == 1 && "Update with wrong number of operands");
  
    // Check to see if there is no change.
-  if (Op == N->getOperand(0)) return InN;
+  if (Op == N->getOperand(0)) return N;
  
    // See if the modified node already exists.
    void *InsertPos = 0;
    if (SDNode *Existing = FindModifiedNodeSlot(N, Op, InsertPos))
-    return SDValue(Existing, InN.getResNo());
+    return Existing;
  
    // Nope it doesn't.  Remove the node from its current place in the maps.
    if (InsertPos)
@@ -4403,22 +4447,20 @@ SDValue SelectionDAG::UpdateNodeOperands(SDValue InN, SDValue Op) {
  
    // If this gets put into a CSE map, add it.
    if (InsertPos) CSEMap.InsertNode(N, InsertPos);
-  return InN;
+  return N;
  }
  
-SDValue SelectionDAG::
-UpdateNodeOperands(SDValue InN, SDValue Op1, SDValue Op2) {
-  SDNode *N = InN.getNode();
+SDNode *SelectionDAG::UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2) {
    assert(N->getNumOperands() == 2 && "Update with wrong number of operands");
  
    // Check to see if there is no change.
    if (Op1 == N->getOperand(0) && Op2 == N->getOperand(1))
-    return InN;   // No operands changed, just return the input node.
+    return N;   // No operands changed, just return the input node.
  
    // See if the modified node already exists.
    void *InsertPos = 0;
    if (SDNode *Existing = FindModifiedNodeSlot(N, Op1, Op2, InsertPos))
-    return SDValue(Existing, InN.getResNo());
+    return Existing;
  
    // Nope it doesn't.  Remove the node from its current place in the maps.
    if (InsertPos)
@@ -4433,32 +4475,31 @@ UpdateNodeOperands(SDValue InN, SDValue Op1, SDValue Op2) {
  
    // If this gets put into a CSE map, add it.
    if (InsertPos) CSEMap.InsertNode(N, InsertPos);
-  return InN;
+  return N;
  }
  
-SDValue SelectionDAG::
-UpdateNodeOperands(SDValue N, SDValue Op1, SDValue Op2, SDValue Op3) {
+SDNode *SelectionDAG::
+UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2, SDValue Op3) {
    SDValue Ops[] = { Op1, Op2, Op3 };
    return UpdateNodeOperands(N, Ops, 3);
  }
  
-SDValue SelectionDAG::
-UpdateNodeOperands(SDValue N, SDValue Op1, SDValue Op2,
+SDNode *SelectionDAG::
+UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2,
                     SDValue Op3, SDValue Op4) {
    SDValue Ops[] = { Op1, Op2, Op3, Op4 };
    return UpdateNodeOperands(N, Ops, 4);
  }
  
-SDValue SelectionDAG::
-UpdateNodeOperands(SDValue N, SDValue Op1, SDValue Op2,
+SDNode *SelectionDAG::
+UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2,
                     SDValue Op3, SDValue Op4, SDValue Op5) {
    SDValue Ops[] = { Op1, Op2, Op3, Op4, Op5 };
    return UpdateNodeOperands(N, Ops, 5);
  }
  
-SDValue SelectionDAG::
-UpdateNodeOperands(SDValue InN, const SDValue *Ops, unsigned NumOps) {
-  SDNode *N = InN.getNode();
+SDNode *SelectionDAG::
+UpdateNodeOperands(SDNode *N, const SDValue *Ops, unsigned NumOps) {
    assert(N->getNumOperands() == NumOps &&
           "Update with wrong number of operands");
  
@@ -4472,12 +4513,12 @@ UpdateNodeOperands(SDValue InN, const SDValue *Ops, unsigned NumOps) {
    }
  
    // No operands changed, just return the input node.
-  if (!AnyChange) return InN;
+  if (!AnyChange) return N;
  
    // See if the modified node already exists.
    void *InsertPos = 0;
    if (SDNode *Existing = FindModifiedNodeSlot(N, Ops, NumOps, InsertPos))
-    return SDValue(Existing, InN.getResNo());
+    return Existing;
  
    // Nope it doesn't.  Remove the node from its current place in the maps.
    if (InsertPos)
@@ -4491,7 +4532,7 @@ UpdateNodeOperands(SDValue InN, const SDValue *Ops, unsigned NumOps) {
  
    // If this gets put into a CSE map, add it.
    if (InsertPos) CSEMap.InsertNode(N, InsertPos);
-  return InN;
+  return N;
  }
  
  /// DropOperands - Release the operands and set this node to have
@@ -4912,7 +4953,7 @@ SelectionDAG::getDbgValue(MDNode *MDPtr, SDNode *N, unsigned R, uint64_t Off,
  }
  
  SDDbgValue *
-SelectionDAG::getDbgValue(MDNode *MDPtr, Value *C, uint64_t Off,
+SelectionDAG::getDbgValue(MDNode *MDPtr, const Value *C, uint64_t Off,
                            DebugLoc DL, unsigned O) {
    return new (Allocator) SDDbgValue(MDPtr, C, Off, DL, O);
  }
@@ -5320,8 +5361,8 @@ unsigned SelectionDAG::GetOrdering(const SDNode *SD) const {
  
  /// AddDbgValue - Add a dbg_value SDNode. If SD is non-null that means the
  /// value is produced by SD.
-void SelectionDAG::AddDbgValue(SDDbgValue *DB, SDNode *SD) {
-  DbgInfo->add(DB, SD);
+void SelectionDAG::AddDbgValue(SDDbgValue *DB, SDNode *SD, bool isParameter) {
+  DbgInfo->add(DB, SD, isParameter);
    if (SD)
      SD->setHasDebugValue(true);
  }
@@ -5334,10 +5375,11 @@ HandleSDNode::~HandleSDNode() {
    DropOperands();
  }
  
-GlobalAddressSDNode::GlobalAddressSDNode(unsigned Opc, const GlobalValue *GA,
+GlobalAddressSDNode::GlobalAddressSDNode(unsigned Opc, DebugLoc DL,
+                                         const GlobalValue *GA,
                                           EVT VT, int64_t o, unsigned char TF)
-  : SDNode(Opc, DebugLoc(), getSDVTList(VT)), Offset(o), TargetFlags(TF) {
-  TheGlobal = const_cast<GlobalValue*>(GA);
+  : SDNode(Opc, DL, getSDVTList(VT)), Offset(o), TargetFlags(TF) {
+  TheGlobal = GA;
  }
  
  MemSDNode::MemSDNode(unsigned Opc, DebugLoc dl, SDVTList VTs, EVT memvt,
@@ -5391,6 +5433,8 @@ const EVT *SDNode::getValueTypeList(EVT VT) {
      sys::SmartScopedLock<true> Lock(*VTMutex);
      return &(*EVTs->insert(VT).first);
    } else {
+    assert(VT.getSimpleVT().SimpleTy < MVT::LAST_VALUETYPE &&
+           "Value type out of range!");
      return &SimpleVTArray->VTs[VT.getSimpleVT().SimpleTy];
    }
  }
@@ -5557,6 +5601,7 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::PCMARKER:      return "PCMarker";
    case ISD::READCYCLECOUNTER: return "ReadCycleCounter";
    case ISD::SRCVALUE:      return "SrcValue";
+  case ISD::MDNODE_SDNODE: return "MDNode";
    case ISD::EntryToken:    return "EntryToken";
    case ISD::TokenFactor:   return "TokenFactor";
    case ISD::AssertSext:    return "AssertSext";
@@ -5580,6 +5625,8 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::LSDAADDR: return "LSDAADDR";
    case ISD::EHSELECTION: return "EHSELECTION";
    case ISD::EH_RETURN: return "EH_RETURN";
+  case ISD::EH_SJLJ_SETJMP: return "EH_SJLJ_SETJMP";
+  case ISD::EH_SJLJ_LONGJMP: return "EH_SJLJ_LONGJMP";
    case ISD::ConstantPool:  return "ConstantPool";
    case ISD::ExternalSymbol: return "ExternalSymbol";
    case ISD::BlockAddress:  return "BlockAddress";
@@ -5620,13 +5667,16 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::FSQRT:  return "fsqrt";
    case ISD::FSIN:   return "fsin";
    case ISD::FCOS:   return "fcos";
-  case ISD::FPOWI:  return "fpowi";
-  case ISD::FPOW:   return "fpow";
    case ISD::FTRUNC: return "ftrunc";
    case ISD::FFLOOR: return "ffloor";
    case ISD::FCEIL:  return "fceil";
    case ISD::FRINT:  return "frint";
    case ISD::FNEARBYINT: return "fnearbyint";
+  case ISD::FEXP:   return "fexp";
+  case ISD::FEXP2:  return "fexp2";
+  case ISD::FLOG:   return "flog";
+  case ISD::FLOG2:  return "flog2";
+  case ISD::FLOG10: return "flog10";
  
    // Binary operators
    case ISD::ADD:    return "add";
@@ -5657,7 +5707,9 @@ std::string SDNode::getOperationName(const SelectionDAG *G) const {
    case ISD::FREM:   return "frem";
    case ISD::FCOPYSIGN: return "fcopysign";
    case ISD::FGETSIGN:  return "fgetsign";
+  case ISD::FPOW:   return "fpow";
  
+  case ISD::FPOWI:  return "fpowi";
    case ISD::SETCC:       return "setcc";
    case ISD::VSETCC:      return "vsetcc";
    case ISD::SELECT:      return "select";
@@ -5925,6 +5977,11 @@ void SDNode::print_details(raw_ostream &OS, const SelectionDAG *G) const {
        OS << "<" << M->getValue() << ">";
      else
        OS << "<null>";
+  } else if (const MDNodeSDNode *MD = dyn_cast<MDNodeSDNode>(this)) {
+    if (MD->getMD())
+      OS << "<" << MD->getMD() << ">";
+    else
+      OS << "<null>";
    } else if (const VTSDNode *N = dyn_cast<VTSDNode>(this)) {
      OS << ":" << N->getVT().getEVTString();
    }
@@ -5976,6 +6033,21 @@ void SDNode::print_details(raw_ostream &OS, const SelectionDAG *G) const {
  
    if (getNodeId() != -1)
      OS << " [ID=" << getNodeId() << ']';
+
+  DebugLoc dl = getDebugLoc();
+  if (G && !dl.isUnknown()) {
+    DIScope
+      Scope(dl.getScope(G->getMachineFunction().getFunction()->getContext()));
+    OS << " dbg:";
+    // Omit the directory, since it's usually long and uninteresting.
+    if (Scope.Verify())
+      OS << Scope.getFilename();
+    else
+      OS << "<unknown>";
+    OS << ':' << dl.getLine();
+    if (dl.getCol() != 0)
+      OS << ':' << dl.getCol();
+  }
  }
  
  void SDNode::print(raw_ostream &OS, const SelectionDAG *G) const {
@@ -6062,7 +6134,7 @@ SDValue SelectionDAG::UnrollVectorOp(SDNode *N, unsigned ResNE) {
  
    unsigned i;
    for (i= 0; i != NE; ++i) {
-    for (unsigned j = 0; j != N->getNumOperands(); ++j) {
+    for (unsigned j = 0, e = N->getNumOperands(); j != e; ++j) {
        SDValue Operand = N->getOperand(j);
        EVT OperandVT = Operand.getValueType();
        if (OperandVT.isVector()) {
@@ -6140,8 +6212,8 @@ bool SelectionDAG::isConsecutiveLoad(LoadSDNode *LD, LoadSDNode *Base,
        return true;
    }
  
-  GlobalValue *GV1 = NULL;
-  GlobalValue *GV2 = NULL;
+  const GlobalValue *GV1 = NULL;
+  const GlobalValue *GV2 = NULL;
    int64_t Offset1 = 0;
    int64_t Offset2 = 0;
    bool isGA1 = TLI.isGAPlusOffset(Loc.getNode(), GV1, Offset1);
@@ -6156,14 +6228,14 @@ bool SelectionDAG::isConsecutiveLoad(LoadSDNode *LD, LoadSDNode *Base,
  /// it cannot be inferred.
  unsigned SelectionDAG::InferPtrAlignment(SDValue Ptr) const {
    // If this is a GlobalAddress + cst, return the alignment.
-  GlobalValue *GV;
+  const GlobalValue *GV;
    int64_t GVOffset = 0;
    if (TLI.isGAPlusOffset(Ptr.getNode(), GV, GVOffset)) {
      // If GV has specified alignment, then use it. Otherwise, use the preferred
      // alignment.
      unsigned Align = GV->getAlignment();
      if (!Align) {
-      if (GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
+      if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
          if (GVar->hasInitializer()) {
            const TargetData *TD = TLI.getTargetData();
            Align = TD->getPreferredAlignment(GVar);
@@ -6191,23 +6263,6 @@ unsigned SelectionDAG::InferPtrAlignment(SDValue Ptr) const {
      const MachineFrameInfo &MFI = *getMachineFunction().getFrameInfo();
      unsigned FIInfoAlign = MinAlign(MFI.getObjectAlignment(FrameIdx),
                                      FrameOffset);
-    if (MFI.isFixedObjectIndex(FrameIdx)) {
-      int64_t ObjectOffset = MFI.getObjectOffset(FrameIdx) + FrameOffset;
-
-      // The alignment of the frame index can be determined from its offset from
-      // the incoming frame position.  If the frame object is at offset 32 and
-      // the stack is guaranteed to be 16-byte aligned, then we know that the
-      // object is 16-byte aligned.
-      unsigned StackAlign = getTarget().getFrameInfo()->getStackAlignment();
-      unsigned Align = MinAlign(ObjectOffset, StackAlign);
-
-      // Finally, the frame object itself may have a known alignment.  Factor
-      // the alignment + offset into a new alignment.  For example, if we know
-      // the FI is 8 byte aligned, but the pointer is 4 off, we really have a
-      // 4-byte alignment of the resultant pointer.  Likewise align 4 + 4-byte
-      // offset = 4-byte alignment, align 4 + 1-byte offset = align 1, etc.
-      return std::max(Align, FIInfoAlign);
-    }
      return FIInfoAlign;
    }
  
@@ -6325,8 +6380,8 @@ bool BuildVectorSDNode::isConstantSplat(APInt &SplatValue,
      if (OpVal.getOpcode() == ISD::UNDEF)
        SplatUndef |= APInt::getBitsSet(sz, BitPos, BitPos + EltBitSize);
      else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal))
-      SplatValue |= (APInt(CN->getAPIntValue()).zextOrTrunc(EltBitSize).
-                     zextOrTrunc(sz) << BitPos);
+      SplatValue |= APInt(CN->getAPIntValue()).zextOrTrunc(EltBitSize).
+                    zextOrTrunc(sz) << BitPos;
      else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal))
        SplatValue |= CN->getValueAPF().bitcastToAPInt().zextOrTrunc(sz) <<BitPos;
       else