lib/CodeGen/SelectionDAG/SelectionDAG.cpp

   1 //===-- SelectionDAG.cpp - Implement the SelectionDAG data structures -----===//
   2 //
   3 //                     The LLVM Compiler Infrastructure
   4 //
   5 // This file is distributed under the University of Illinois Open Source
   6 // License. See LICENSE.TXT for details.
   7 //
   8 //===----------------------------------------------------------------------===//
   9 //
  10 // This implements the SelectionDAG class.
  11 //
  12 //===----------------------------------------------------------------------===//
  13
  14 #include "llvm/CodeGen/SelectionDAG.h"
  15 #include "SDNodeDbgValue.h"
  16 #include "llvm/ADT/SetVector.h"
  17 #include "llvm/ADT/SmallPtrSet.h"
  18 #include "llvm/ADT/SmallSet.h"
  19 #include "llvm/ADT/SmallVector.h"
  20 #include "llvm/ADT/StringExtras.h"
  21 #include "llvm/Analysis/ValueTracking.h"
  22 #include "llvm/CodeGen/MachineBasicBlock.h"
  23 #include "llvm/CodeGen/MachineConstantPool.h"
  24 #include "llvm/CodeGen/MachineFrameInfo.h"
  25 #include "llvm/CodeGen/MachineModuleInfo.h"
  26 #include "llvm/IR/CallingConv.h"
  27 #include "llvm/IR/Constants.h"
  28 #include "llvm/IR/DataLayout.h"
  29 #include "llvm/IR/DebugInfo.h"
  30 #include "llvm/IR/DerivedTypes.h"
  31 #include "llvm/IR/Function.h"
  32 #include "llvm/IR/GlobalAlias.h"
  33 #include "llvm/IR/GlobalVariable.h"
  34 #include "llvm/IR/Intrinsics.h"
  35 #include "llvm/Support/CommandLine.h"
  36 #include "llvm/Support/Debug.h"
  37 #include "llvm/Support/ErrorHandling.h"
  38 #include "llvm/Support/ManagedStatic.h"
  39 #include "llvm/Support/MathExtras.h"
  40 #include "llvm/Support/Mutex.h"
  41 #include "llvm/Support/raw_ostream.h"
  42 #include "llvm/Target/TargetInstrInfo.h"
  43 #include "llvm/Target/TargetIntrinsicInfo.h"
  44 #include "llvm/Target/TargetLowering.h"
  45 #include "llvm/Target/TargetMachine.h"
  46 #include "llvm/Target/TargetOptions.h"
  47 #include "llvm/Target/TargetRegisterInfo.h"
  48 #include "llvm/Target/TargetSelectionDAGInfo.h"
  49 #include <algorithm>
  50 #include <cmath>
  51
  52 using namespace llvm;
  53
  54 /// makeVTList - Return an instance of the SDVTList struct initialized with the
  55 /// specified members.
  56 static SDVTList makeVTList(const EVT *VTs, unsigned NumVTs) {
  57   SDVTList Res = {VTs, NumVTs};
  58   return Res;
  59 }
  60
  61 // Default null implementations of the callbacks.
  62 void SelectionDAG::DAGUpdateListener::NodeDeleted(SDNode*, SDNode*) {}
  63 void SelectionDAG::DAGUpdateListener::NodeUpdated(SDNode*) {}
  64
  65 //===----------------------------------------------------------------------===//
  66 //                              ConstantFPSDNode Class
  67 //===----------------------------------------------------------------------===//
  68
  69 /// isExactlyValue - We don't rely on operator== working on double values, as
  70 /// it returns true for things that are clearly not equal, like -0.0 and 0.0.
  71 /// As such, this method can be used to do an exact bit-for-bit comparison of
  72 /// two floating point values.
  73 bool ConstantFPSDNode::isExactlyValue(const APFloat& V) const {
  74   return getValueAPF().bitwiseIsEqual(V);
  75 }
  76
  77 bool ConstantFPSDNode::isValueValidForType(EVT VT,
  78                                            const APFloat& Val) {
  79   assert(VT.isFloatingPoint() && "Can only convert between FP types");
  80
  81   // convert modifies in place, so make a copy.
  82   APFloat Val2 = APFloat(Val);
  83   bool losesInfo;
  84   (void) Val2.convert(SelectionDAG::EVTToAPFloatSemantics(VT),
  85                       APFloat::rmNearestTiesToEven,
  86                       &losesInfo);
  87   return !losesInfo;
  88 }
  89
  90 //===----------------------------------------------------------------------===//
  91 //                              ISD Namespace
  92 //===----------------------------------------------------------------------===//
  93
  94 /// isBuildVectorAllOnes - Return true if the specified node is a
  95 /// BUILD_VECTOR where all of the elements are ~0 or undef.
  96 bool ISD::isBuildVectorAllOnes(const SDNode *N) {
  97   // Look through a bit convert.
  98   if (N->getOpcode() == ISD::BITCAST)
  99     N = N->getOperand(0).getNode();
 100
 101   if (N->getOpcode() != ISD::BUILD_VECTOR) return false;
 102
 103   unsigned i = 0, e = N->getNumOperands();
 104
 105   // Skip over all of the undef values.
 106   while (i != e && N->getOperand(i).getOpcode() == ISD::UNDEF)
 107     ++i;
 108
 109   // Do not accept an all-undef vector.
 110   if (i == e) return false;
 111
 112   // Do not accept build_vectors that aren't all constants or which have non-~0
 113   // elements. We have to be a bit careful here, as the type of the constant
 114   // may not be the same as the type of the vector elements due to type
 115   // legalization (the elements are promoted to a legal type for the target and
 116   // a vector of a type may be legal when the base element type is not).
 117   // We only want to check enough bits to cover the vector elements, because
 118   // we care if the resultant vector is all ones, not whether the individual
 119   // constants are.
 120   SDValue NotZero = N->getOperand(i);
 121   unsigned EltSize = N->getValueType(0).getVectorElementType().getSizeInBits();
 122   if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(NotZero)) {
 123     if (CN->getAPIntValue().countTrailingOnes() < EltSize)
 124       return false;
 125   } else if (ConstantFPSDNode *CFPN = dyn_cast<ConstantFPSDNode>(NotZero)) {
 126     if (CFPN->getValueAPF().bitcastToAPInt().countTrailingOnes() < EltSize)
 127       return false;
 128   } else
 129     return false;
 130
 131   // Okay, we have at least one ~0 value, check to see if the rest match or are
 132   // undefs. Even with the above element type twiddling, this should be OK, as
 133   // the same type legalization should have applied to all the elements.
 134   for (++i; i != e; ++i)
 135     if (N->getOperand(i) != NotZero &&
 136         N->getOperand(i).getOpcode() != ISD::UNDEF)
 137       return false;
 138   return true;
 139 }
 140
 141
 142 /// isBuildVectorAllZeros - Return true if the specified node is a
 143 /// BUILD_VECTOR where all of the elements are 0 or undef.
 144 bool ISD::isBuildVectorAllZeros(const SDNode *N) {
 145   // Look through a bit convert.
 146   if (N->getOpcode() == ISD::BITCAST)
 147     N = N->getOperand(0).getNode();
 148
 149   if (N->getOpcode() != ISD::BUILD_VECTOR) return false;
 150
 151   bool IsAllUndef = true;
 152   for (unsigned i = 0, e = N->getNumOperands(); i < e; ++i) {
 153     if (N->getOperand(i).getOpcode() == ISD::UNDEF)
 154       continue;
 155     IsAllUndef = false;
 156     // Do not accept build_vectors that aren't all constants or which have non-0
 157     // elements. We have to be a bit careful here, as the type of the constant
 158     // may not be the same as the type of the vector elements due to type
 159     // legalization (the elements are promoted to a legal type for the target
 160     // and a vector of a type may be legal when the base element type is not).
 161     // We only want to check enough bits to cover the vector elements, because
 162     // we care if the resultant vector is all zeros, not whether the individual
 163     // constants are.
 164     SDValue Zero = N->getOperand(i);
 165     unsigned EltSize = N->getValueType(0).getVectorElementType().getSizeInBits();
 166     if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Zero)) {
 167       if (CN->getAPIntValue().countTrailingZeros() < EltSize)
 168         return false;
 169     } else if (ConstantFPSDNode *CFPN = dyn_cast<ConstantFPSDNode>(Zero)) {
 170       if (CFPN->getValueAPF().bitcastToAPInt().countTrailingZeros() < EltSize)
 171         return false;
 172     } else
 173       return false;
 174   }
 175
 176   // Do not accept an all-undef vector.
 177   if (IsAllUndef)
 178     return false;
 179   return true;
 180 }
 181
 182 /// \brief Return true if the specified node is a BUILD_VECTOR node of
 183 /// all ConstantSDNode or undef.
 184 bool ISD::isBuildVectorOfConstantSDNodes(const SDNode *N) {
 185   if (N->getOpcode() != ISD::BUILD_VECTOR)
 186     return false;
 187
 188   for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
 189     SDValue Op = N->getOperand(i);
 190     if (Op.getOpcode() == ISD::UNDEF)
 191       continue;
 192     if (!isa<ConstantSDNode>(Op))
 193       return false;
 194   }
 195   return true;
 196 }
 197
 198 /// isScalarToVector - Return true if the specified node is a
 199 /// ISD::SCALAR_TO_VECTOR node or a BUILD_VECTOR node where only the low
 200 /// element is not an undef.
 201 bool ISD::isScalarToVector(const SDNode *N) {
 202   if (N->getOpcode() == ISD::SCALAR_TO_VECTOR)
 203     return true;
 204
 205   if (N->getOpcode() != ISD::BUILD_VECTOR)
 206     return false;
 207   if (N->getOperand(0).getOpcode() == ISD::UNDEF)
 208     return false;
 209   unsigned NumElems = N->getNumOperands();
 210   if (NumElems == 1)
 211     return false;
 212   for (unsigned i = 1; i < NumElems; ++i) {
 213     SDValue V = N->getOperand(i);
 214     if (V.getOpcode() != ISD::UNDEF)
 215       return false;
 216   }
 217   return true;
 218 }
 219
 220 /// allOperandsUndef - Return true if the node has at least one operand
 221 /// and all operands of the specified node are ISD::UNDEF.
 222 bool ISD::allOperandsUndef(const SDNode *N) {
 223   // Return false if the node has no operands.
 224   // This is "logically inconsistent" with the definition of "all" but
 225   // is probably the desired behavior.
 226   if (N->getNumOperands() == 0)
 227     return false;
 228
 229   for (unsigned i = 0, e = N->getNumOperands(); i != e ; ++i)
 230     if (N->getOperand(i).getOpcode() != ISD::UNDEF)
 231       return false;
 232
 233   return true;
 234 }
 235
 236 ISD::NodeType ISD::getExtForLoadExtType(ISD::LoadExtType ExtType) {
 237   switch (ExtType) {
 238   case ISD::EXTLOAD:
 239     return ISD::ANY_EXTEND;
 240   case ISD::SEXTLOAD:
 241     return ISD::SIGN_EXTEND;
 242   case ISD::ZEXTLOAD:
 243     return ISD::ZERO_EXTEND;
 244   default:
 245     break;
 246   }
 247
 248   llvm_unreachable("Invalid LoadExtType");
 249 }
 250
 251 /// getSetCCSwappedOperands - Return the operation corresponding to (Y op X)
 252 /// when given the operation for (X op Y).
 253 ISD::CondCode ISD::getSetCCSwappedOperands(ISD::CondCode Operation) {
 254   // To perform this operation, we just need to swap the L and G bits of the
 255   // operation.
 256   unsigned OldL = (Operation >> 2) & 1;
 257   unsigned OldG = (Operation >> 1) & 1;
 258   return ISD::CondCode((Operation & ~6) |  // Keep the N, U, E bits
 259                        (OldL << 1) |       // New G bit
 260                        (OldG << 2));       // New L bit.
 261 }
 262
 263 /// getSetCCInverse - Return the operation corresponding to !(X op Y), where
 264 /// 'op' is a valid SetCC operation.
 265 ISD::CondCode ISD::getSetCCInverse(ISD::CondCode Op, bool isInteger) {
 266   unsigned Operation = Op;
 267   if (isInteger)
 268     Operation ^= 7;   // Flip L, G, E bits, but not U.
 269   else
 270     Operation ^= 15;  // Flip all of the condition bits.
 271
 272   if (Operation > ISD::SETTRUE2)
 273     Operation &= ~8;  // Don't let N and U bits get set.
 274
 275   return ISD::CondCode(Operation);
 276 }
 277
 278
 279 /// isSignedOp - For an integer comparison, return 1 if the comparison is a
 280 /// signed operation and 2 if the result is an unsigned comparison.  Return zero
 281 /// if the operation does not depend on the sign of the input (setne and seteq).
 282 static int isSignedOp(ISD::CondCode Opcode) {
 283   switch (Opcode) {
 284   default: llvm_unreachable("Illegal integer setcc operation!");
 285   case ISD::SETEQ:
 286   case ISD::SETNE: return 0;
 287   case ISD::SETLT:
 288   case ISD::SETLE:
 289   case ISD::SETGT:
 290   case ISD::SETGE: return 1;
 291   case ISD::SETULT:
 292   case ISD::SETULE:
 293   case ISD::SETUGT:
 294   case ISD::SETUGE: return 2;
 295   }
 296 }
 297
 298 /// getSetCCOrOperation - Return the result of a logical OR between different
 299 /// comparisons of identical values: ((X op1 Y) | (X op2 Y)).  This function
 300 /// returns SETCC_INVALID if it is not possible to represent the resultant
 301 /// comparison.
 302 ISD::CondCode ISD::getSetCCOrOperation(ISD::CondCode Op1, ISD::CondCode Op2,
 303                                        bool isInteger) {
 304   if (isInteger && (isSignedOp(Op1) | isSignedOp(Op2)) == 3)
 305     // Cannot fold a signed integer setcc with an unsigned integer setcc.
 306     return ISD::SETCC_INVALID;
 307
 308   unsigned Op = Op1 | Op2;  // Combine all of the condition bits.
 309
 310   // If the N and U bits get set then the resultant comparison DOES suddenly
 311   // care about orderedness, and is true when ordered.
 312   if (Op > ISD::SETTRUE2)
 313     Op &= ~16;     // Clear the U bit if the N bit is set.
 314
 315   // Canonicalize illegal integer setcc's.
 316   if (isInteger && Op == ISD::SETUNE)  // e.g. SETUGT | SETULT
 317     Op = ISD::SETNE;
 318
 319   return ISD::CondCode(Op);
 320 }
 321
 322 /// getSetCCAndOperation - Return the result of a logical AND between different
 323 /// comparisons of identical values: ((X op1 Y) & (X op2 Y)).  This
 324 /// function returns zero if it is not possible to represent the resultant
 325 /// comparison.
 326 ISD::CondCode ISD::getSetCCAndOperation(ISD::CondCode Op1, ISD::CondCode Op2,
 327                                         bool isInteger) {
 328   if (isInteger && (isSignedOp(Op1) | isSignedOp(Op2)) == 3)
 329     // Cannot fold a signed setcc with an unsigned setcc.
 330     return ISD::SETCC_INVALID;
 331
 332   // Combine all of the condition bits.
 333   ISD::CondCode Result = ISD::CondCode(Op1 & Op2);
 334
 335   // Canonicalize illegal integer setcc's.
 336   if (isInteger) {
 337     switch (Result) {
 338     default: break;
 339     case ISD::SETUO : Result = ISD::SETFALSE; break;  // SETUGT & SETULT
 340     case ISD::SETOEQ:                                 // SETEQ  & SETU[LG]E
 341     case ISD::SETUEQ: Result = ISD::SETEQ   ; break;  // SETUGE & SETULE
 342     case ISD::SETOLT: Result = ISD::SETULT  ; break;  // SETULT & SETNE
 343     case ISD::SETOGT: Result = ISD::SETUGT  ; break;  // SETUGT & SETNE
 344     }
 345   }
 346
 347   return Result;
 348 }
 349
 350 //===----------------------------------------------------------------------===//
 351 //                           SDNode Profile Support
 352 //===----------------------------------------------------------------------===//
 353
 354 /// AddNodeIDOpcode - Add the node opcode to the NodeID data.
 355 ///
 356 static void AddNodeIDOpcode(FoldingSetNodeID &ID, unsigned OpC)  {
 357   ID.AddInteger(OpC);
 358 }
 359
 360 /// AddNodeIDValueTypes - Value type lists are intern'd so we can represent them
 361 /// solely with their pointer.
 362 static void AddNodeIDValueTypes(FoldingSetNodeID &ID, SDVTList VTList) {
 363   ID.AddPointer(VTList.VTs);
 364 }
 365
 366 /// AddNodeIDOperands - Various routines for adding operands to the NodeID data.
 367 ///
 368 static void AddNodeIDOperands(FoldingSetNodeID &ID,
 369                               ArrayRef<SDValue> Ops) {
 370   for (auto& Op : Ops) {
 371     ID.AddPointer(Op.getNode());
 372     ID.AddInteger(Op.getResNo());
 373   }
 374 }
 375
 376 /// AddNodeIDOperands - Various routines for adding operands to the NodeID data.
 377 ///
 378 static void AddNodeIDOperands(FoldingSetNodeID &ID,
 379                               ArrayRef<SDUse> Ops) {
 380   for (auto& Op : Ops) {
 381     ID.AddPointer(Op.getNode());
 382     ID.AddInteger(Op.getResNo());
 383   }
 384 }
 385
 386 static void AddBinaryNodeIDCustom(FoldingSetNodeID &ID, bool nuw, bool nsw,
 387                                   bool exact) {
 388   ID.AddBoolean(nuw);
 389   ID.AddBoolean(nsw);
 390   ID.AddBoolean(exact);
 391 }
 392
 393 /// AddBinaryNodeIDCustom - Add BinarySDNodes special infos
 394 static void AddBinaryNodeIDCustom(FoldingSetNodeID &ID, unsigned Opcode,
 395                                   bool nuw, bool nsw, bool exact) {
 396   if (isBinOpWithFlags(Opcode))
 397     AddBinaryNodeIDCustom(ID, nuw, nsw, exact);
 398 }
 399
 400 static void AddNodeIDNode(FoldingSetNodeID &ID, unsigned short OpC,
 401                           SDVTList VTList, ArrayRef<SDValue> OpList) {
 402   AddNodeIDOpcode(ID, OpC);
 403   AddNodeIDValueTypes(ID, VTList);
 404   AddNodeIDOperands(ID, OpList);
 405 }
 406
 407 /// AddNodeIDCustom - If this is an SDNode with special info, add this info to
 408 /// the NodeID data.
 409 static void AddNodeIDCustom(FoldingSetNodeID &ID, const SDNode *N) {
 410   switch (N->getOpcode()) {
 411   case ISD::TargetExternalSymbol:
 412   case ISD::ExternalSymbol:
 413     llvm_unreachable("Should only be used on nodes with operands");
 414   default: break;  // Normal nodes don't need extra info.
 415   case ISD::TargetConstant:
 416   case ISD::Constant: {
 417     const ConstantSDNode *C = cast<ConstantSDNode>(N);
 418     ID.AddPointer(C->getConstantIntValue());
 419     ID.AddBoolean(C->isOpaque());
 420     break;
 421   }
 422   case ISD::TargetConstantFP:
 423   case ISD::ConstantFP: {
 424     ID.AddPointer(cast<ConstantFPSDNode>(N)->getConstantFPValue());
 425     break;
 426   }
 427   case ISD::TargetGlobalAddress:
 428   case ISD::GlobalAddress:
 429   case ISD::TargetGlobalTLSAddress:
 430   case ISD::GlobalTLSAddress: {
 431     const GlobalAddressSDNode *GA = cast<GlobalAddressSDNode>(N);
 432     ID.AddPointer(GA->getGlobal());
 433     ID.AddInteger(GA->getOffset());
 434     ID.AddInteger(GA->getTargetFlags());
 435     ID.AddInteger(GA->getAddressSpace());
 436     break;
 437   }
 438   case ISD::BasicBlock:
 439     ID.AddPointer(cast<BasicBlockSDNode>(N)->getBasicBlock());
 440     break;
 441   case ISD::Register:
 442     ID.AddInteger(cast<RegisterSDNode>(N)->getReg());
 443     break;
 444   case ISD::RegisterMask:
 445     ID.AddPointer(cast<RegisterMaskSDNode>(N)->getRegMask());
 446     break;
 447   case ISD::SRCVALUE:
 448     ID.AddPointer(cast<SrcValueSDNode>(N)->getValue());
 449     break;
 450   case ISD::FrameIndex:
 451   case ISD::TargetFrameIndex:
 452     ID.AddInteger(cast<FrameIndexSDNode>(N)->getIndex());
 453     break;
 454   case ISD::JumpTable:
 455   case ISD::TargetJumpTable:
 456     ID.AddInteger(cast<JumpTableSDNode>(N)->getIndex());
 457     ID.AddInteger(cast<JumpTableSDNode>(N)->getTargetFlags());
 458     break;
 459   case ISD::ConstantPool:
 460   case ISD::TargetConstantPool: {
 461     const ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(N);
 462     ID.AddInteger(CP->getAlignment());
 463     ID.AddInteger(CP->getOffset());
 464     if (CP->isMachineConstantPoolEntry())
 465       CP->getMachineCPVal()->addSelectionDAGCSEId(ID);
 466     else
 467       ID.AddPointer(CP->getConstVal());
 468     ID.AddInteger(CP->getTargetFlags());
 469     break;
 470   }
 471   case ISD::TargetIndex: {
 472     const TargetIndexSDNode *TI = cast<TargetIndexSDNode>(N);
 473     ID.AddInteger(TI->getIndex());
 474     ID.AddInteger(TI->getOffset());
 475     ID.AddInteger(TI->getTargetFlags());
 476     break;
 477   }
 478   case ISD::LOAD: {
 479     const LoadSDNode *LD = cast<LoadSDNode>(N);
 480     ID.AddInteger(LD->getMemoryVT().getRawBits());
 481     ID.AddInteger(LD->getRawSubclassData());
 482     ID.AddInteger(LD->getPointerInfo().getAddrSpace());
 483     break;
 484   }
 485   case ISD::STORE: {
 486     const StoreSDNode *ST = cast<StoreSDNode>(N);
 487     ID.AddInteger(ST->getMemoryVT().getRawBits());
 488     ID.AddInteger(ST->getRawSubclassData());
 489     ID.AddInteger(ST->getPointerInfo().getAddrSpace());
 490     break;
 491   }
 492   case ISD::SDIV:
 493   case ISD::UDIV:
 494   case ISD::SRA:
 495   case ISD::SRL:
 496   case ISD::MUL:
 497   case ISD::ADD:
 498   case ISD::SUB:
 499   case ISD::SHL: {
 500     const BinaryWithFlagsSDNode *BinNode = cast<BinaryWithFlagsSDNode>(N);
 501     AddBinaryNodeIDCustom(ID, N->getOpcode(), BinNode->hasNoUnsignedWrap(),
 502                           BinNode->hasNoSignedWrap(), BinNode->isExact());
 503     break;
 504   }
 505   case ISD::ATOMIC_CMP_SWAP:
 506   case ISD::ATOMIC_CMP_SWAP_WITH_SUCCESS:
 507   case ISD::ATOMIC_SWAP:
 508   case ISD::ATOMIC_LOAD_ADD:
 509   case ISD::ATOMIC_LOAD_SUB:
 510   case ISD::ATOMIC_LOAD_AND:
 511   case ISD::ATOMIC_LOAD_OR:
 512   case ISD::ATOMIC_LOAD_XOR:
 513   case ISD::ATOMIC_LOAD_NAND:
 514   case ISD::ATOMIC_LOAD_MIN:
 515   case ISD::ATOMIC_LOAD_MAX:
 516   case ISD::ATOMIC_LOAD_UMIN:
 517   case ISD::ATOMIC_LOAD_UMAX:
 518   case ISD::ATOMIC_LOAD:
 519   case ISD::ATOMIC_STORE: {
 520     const AtomicSDNode *AT = cast<AtomicSDNode>(N);
 521     ID.AddInteger(AT->getMemoryVT().getRawBits());
 522     ID.AddInteger(AT->getRawSubclassData());
 523     ID.AddInteger(AT->getPointerInfo().getAddrSpace());
 524     break;
 525   }
 526   case ISD::PREFETCH: {
 527     const MemSDNode *PF = cast<MemSDNode>(N);
 528     ID.AddInteger(PF->getPointerInfo().getAddrSpace());
 529     break;
 530   }
 531   case ISD::VECTOR_SHUFFLE: {
 532     const ShuffleVectorSDNode *SVN = cast<ShuffleVectorSDNode>(N);
 533     for (unsigned i = 0, e = N->getValueType(0).getVectorNumElements();
 534          i != e; ++i)
 535       ID.AddInteger(SVN->getMaskElt(i));
 536     break;
 537   }
 538   case ISD::TargetBlockAddress:
 539   case ISD::BlockAddress: {
 540     const BlockAddressSDNode *BA = cast<BlockAddressSDNode>(N);
 541     ID.AddPointer(BA->getBlockAddress());
 542     ID.AddInteger(BA->getOffset());
 543     ID.AddInteger(BA->getTargetFlags());
 544     break;
 545   }
 546   } // end switch (N->getOpcode())
 547
 548   // Target specific memory nodes could also have address spaces to check.
 549   if (N->isTargetMemoryOpcode())
 550     ID.AddInteger(cast<MemSDNode>(N)->getPointerInfo().getAddrSpace());
 551 }
 552
 553 /// AddNodeIDNode - Generic routine for adding a nodes info to the NodeID
 554 /// data.
 555 static void AddNodeIDNode(FoldingSetNodeID &ID, const SDNode *N) {
 556   AddNodeIDOpcode(ID, N->getOpcode());
 557   // Add the return value info.
 558   AddNodeIDValueTypes(ID, N->getVTList());
 559   // Add the operand info.
 560   AddNodeIDOperands(ID, N->ops());
 561
 562   // Handle SDNode leafs with special info.
 563   AddNodeIDCustom(ID, N);
 564 }
 565
 566 /// encodeMemSDNodeFlags - Generic routine for computing a value for use in
 567 /// the CSE map that carries volatility, temporalness, indexing mode, and
 568 /// extension/truncation information.
 569 ///
 570 static inline unsigned
 571 encodeMemSDNodeFlags(int ConvType, ISD::MemIndexedMode AM, bool isVolatile,
 572                      bool isNonTemporal, bool isInvariant) {
 573   assert((ConvType & 3) == ConvType &&
 574          "ConvType may not require more than 2 bits!");
 575   assert((AM & 7) == AM &&
 576          "AM may not require more than 3 bits!");
 577   return ConvType |
 578          (AM << 2) |
 579          (isVolatile << 5) |
 580          (isNonTemporal << 6) |
 581          (isInvariant << 7);
 582 }
 583
 584 //===----------------------------------------------------------------------===//
 585 //                              SelectionDAG Class
 586 //===----------------------------------------------------------------------===//
 587
 588 /// doNotCSE - Return true if CSE should not be performed for this node.
 589 static bool doNotCSE(SDNode *N) {
 590   if (N->getValueType(0) == MVT::Glue)
 591     return true; // Never CSE anything that produces a flag.
 592
 593   switch (N->getOpcode()) {
 594   default: break;
 595   case ISD::HANDLENODE:
 596   case ISD::EH_LABEL:
 597     return true;   // Never CSE these nodes.
 598   }
 599
 600   // Check that remaining values produced are not flags.
 601   for (unsigned i = 1, e = N->getNumValues(); i != e; ++i)
 602     if (N->getValueType(i) == MVT::Glue)
 603       return true; // Never CSE anything that produces a flag.
 604
 605   return false;
 606 }
 607
 608 /// RemoveDeadNodes - This method deletes all unreachable nodes in the
 609 /// SelectionDAG.
 610 void SelectionDAG::RemoveDeadNodes() {
 611   // Create a dummy node (which is not added to allnodes), that adds a reference
 612   // to the root node, preventing it from being deleted.
 613   HandleSDNode Dummy(getRoot());
 614
 615   SmallVector<SDNode*, 128> DeadNodes;
 616
 617   // Add all obviously-dead nodes to the DeadNodes worklist.
 618   for (allnodes_iterator I = allnodes_begin(), E = allnodes_end(); I != E; ++I)
 619     if (I->use_empty())
 620       DeadNodes.push_back(I);
 621
 622   RemoveDeadNodes(DeadNodes);
 623
 624   // If the root changed (e.g. it was a dead load, update the root).
 625   setRoot(Dummy.getValue());
 626 }
 627
 628 /// RemoveDeadNodes - This method deletes the unreachable nodes in the
 629 /// given list, and any nodes that become unreachable as a result.
 630 void SelectionDAG::RemoveDeadNodes(SmallVectorImpl<SDNode *> &DeadNodes) {
 631
 632   // Process the worklist, deleting the nodes and adding their uses to the
 633   // worklist.
 634   while (!DeadNodes.empty()) {
 635     SDNode *N = DeadNodes.pop_back_val();
 636
 637     for (DAGUpdateListener *DUL = UpdateListeners; DUL; DUL = DUL->Next)
 638       DUL->NodeDeleted(N, nullptr);
 639
 640     // Take the node out of the appropriate CSE map.
 641     RemoveNodeFromCSEMaps(N);
 642
 643     // Next, brutally remove the operand list.  This is safe to do, as there are
 644     // no cycles in the graph.
 645     for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ) {
 646       SDUse &Use = *I++;
 647       SDNode *Operand = Use.getNode();
 648       Use.set(SDValue());
 649
 650       // Now that we removed this operand, see if there are no uses of it left.
 651       if (Operand->use_empty())
 652         DeadNodes.push_back(Operand);
 653     }
 654
 655     DeallocateNode(N);
 656   }
 657 }
 658
 659 void SelectionDAG::RemoveDeadNode(SDNode *N){
 660   SmallVector<SDNode*, 16> DeadNodes(1, N);
 661
 662   // Create a dummy node that adds a reference to the root node, preventing
 663   // it from being deleted.  (This matters if the root is an operand of the
 664   // dead node.)
 665   HandleSDNode Dummy(getRoot());
 666
 667   RemoveDeadNodes(DeadNodes);
 668 }
 669
 670 void SelectionDAG::DeleteNode(SDNode *N) {
 671   // First take this out of the appropriate CSE map.
 672   RemoveNodeFromCSEMaps(N);
 673
 674   // Finally, remove uses due to operands of this node, remove from the
 675   // AllNodes list, and delete the node.
 676   DeleteNodeNotInCSEMaps(N);
 677 }
 678
 679 void SelectionDAG::DeleteNodeNotInCSEMaps(SDNode *N) {
 680   assert(N != AllNodes.begin() && "Cannot delete the entry node!");
 681   assert(N->use_empty() && "Cannot delete a node that is not dead!");
 682
 683   // Drop all of the operands and decrement used node's use counts.
 684   N->DropOperands();
 685
 686   DeallocateNode(N);
 687 }
 688
 689 void SelectionDAG::DeallocateNode(SDNode *N) {
 690   if (N->OperandsNeedDelete)
 691     delete[] N->OperandList;
 692
 693   // Set the opcode to DELETED_NODE to help catch bugs when node
 694   // memory is reallocated.
 695   N->NodeType = ISD::DELETED_NODE;
 696
 697   NodeAllocator.Deallocate(AllNodes.remove(N));
 698
 699   // If any of the SDDbgValue nodes refer to this SDNode, invalidate them.
 700   ArrayRef<SDDbgValue*> DbgVals = DbgInfo->getSDDbgValues(N);
 701   for (unsigned i = 0, e = DbgVals.size(); i != e; ++i)
 702     DbgVals[i]->setIsInvalidated();
 703 }
 704
 705 /// RemoveNodeFromCSEMaps - Take the specified node out of the CSE map that
 706 /// correspond to it.  This is useful when we're about to delete or repurpose
 707 /// the node.  We don't want future request for structurally identical nodes
 708 /// to return N anymore.
 709 bool SelectionDAG::RemoveNodeFromCSEMaps(SDNode *N) {
 710   bool Erased = false;
 711   switch (N->getOpcode()) {
 712   case ISD::HANDLENODE: return false;  // noop.
 713   case ISD::CONDCODE:
 714     assert(CondCodeNodes[cast<CondCodeSDNode>(N)->get()] &&
 715            "Cond code doesn't exist!");
 716     Erased = CondCodeNodes[cast<CondCodeSDNode>(N)->get()] != nullptr;
 717     CondCodeNodes[cast<CondCodeSDNode>(N)->get()] = nullptr;
 718     break;
 719   case ISD::ExternalSymbol:
 720     Erased = ExternalSymbols.erase(cast<ExternalSymbolSDNode>(N)->getSymbol());
 721     break;
 722   case ISD::TargetExternalSymbol: {
 723     ExternalSymbolSDNode *ESN = cast<ExternalSymbolSDNode>(N);
 724     Erased = TargetExternalSymbols.erase(
 725                std::pair<std::string,unsigned char>(ESN->getSymbol(),
 726                                                     ESN->getTargetFlags()));
 727     break;
 728   }
 729   case ISD::VALUETYPE: {
 730     EVT VT = cast<VTSDNode>(N)->getVT();
 731     if (VT.isExtended()) {
 732       Erased = ExtendedValueTypeNodes.erase(VT);
 733     } else {
 734       Erased = ValueTypeNodes[VT.getSimpleVT().SimpleTy] != nullptr;
 735       ValueTypeNodes[VT.getSimpleVT().SimpleTy] = nullptr;
 736     }
 737     break;
 738   }
 739   default:
 740     // Remove it from the CSE Map.
 741     assert(N->getOpcode() != ISD::DELETED_NODE && "DELETED_NODE in CSEMap!");
 742     assert(N->getOpcode() != ISD::EntryToken && "EntryToken in CSEMap!");
 743     Erased = CSEMap.RemoveNode(N);
 744     break;
 745   }
 746 #ifndef NDEBUG
 747   // Verify that the node was actually in one of the CSE maps, unless it has a
 748   // flag result (which cannot be CSE'd) or is one of the special cases that are
 749   // not subject to CSE.
 750   if (!Erased && N->getValueType(N->getNumValues()-1) != MVT::Glue &&
 751       !N->isMachineOpcode() && !doNotCSE(N)) {
 752     N->dump(this);
 753     dbgs() << "\n";
 754     llvm_unreachable("Node is not in map!");
 755   }
 756 #endif
 757   return Erased;
 758 }
 759
 760 /// AddModifiedNodeToCSEMaps - The specified node has been removed from the CSE
 761 /// maps and modified in place. Add it back to the CSE maps, unless an identical
 762 /// node already exists, in which case transfer all its users to the existing
 763 /// node. This transfer can potentially trigger recursive merging.
 764 ///
 765 void
 766 SelectionDAG::AddModifiedNodeToCSEMaps(SDNode *N) {
 767   // For node types that aren't CSE'd, just act as if no identical node
 768   // already exists.
 769   if (!doNotCSE(N)) {
 770     SDNode *Existing = CSEMap.GetOrInsertNode(N);
 771     if (Existing != N) {
 772       // If there was already an existing matching node, use ReplaceAllUsesWith
 773       // to replace the dead one with the existing one.  This can cause
 774       // recursive merging of other unrelated nodes down the line.
 775       ReplaceAllUsesWith(N, Existing);
 776
 777       // N is now dead. Inform the listeners and delete it.
 778       for (DAGUpdateListener *DUL = UpdateListeners; DUL; DUL = DUL->Next)
 779         DUL->NodeDeleted(N, Existing);
 780       DeleteNodeNotInCSEMaps(N);
 781       return;
 782     }
 783   }
 784
 785   // If the node doesn't already exist, we updated it.  Inform listeners.
 786   for (DAGUpdateListener *DUL = UpdateListeners; DUL; DUL = DUL->Next)
 787     DUL->NodeUpdated(N);
 788 }
 789
 790 /// FindModifiedNodeSlot - Find a slot for the specified node if its operands
 791 /// were replaced with those specified.  If this node is never memoized,
 792 /// return null, otherwise return a pointer to the slot it would take.  If a
 793 /// node already exists with these operands, the slot will be non-null.
 794 SDNode *SelectionDAG::FindModifiedNodeSlot(SDNode *N, SDValue Op,
 795                                            void *&InsertPos) {
 796   if (doNotCSE(N))
 797     return nullptr;
 798
 799   SDValue Ops[] = { Op };
 800   FoldingSetNodeID ID;
 801   AddNodeIDNode(ID, N->getOpcode(), N->getVTList(), Ops);
 802   AddNodeIDCustom(ID, N);
 803   SDNode *Node = CSEMap.FindNodeOrInsertPos(ID, InsertPos);
 804   return Node;
 805 }
 806
 807 /// FindModifiedNodeSlot - Find a slot for the specified node if its operands
 808 /// were replaced with those specified.  If this node is never memoized,
 809 /// return null, otherwise return a pointer to the slot it would take.  If a
 810 /// node already exists with these operands, the slot will be non-null.
 811 SDNode *SelectionDAG::FindModifiedNodeSlot(SDNode *N,
 812                                            SDValue Op1, SDValue Op2,
 813                                            void *&InsertPos) {
 814   if (doNotCSE(N))
 815     return nullptr;
 816
 817   SDValue Ops[] = { Op1, Op2 };
 818   FoldingSetNodeID ID;
 819   AddNodeIDNode(ID, N->getOpcode(), N->getVTList(), Ops);
 820   AddNodeIDCustom(ID, N);
 821   SDNode *Node = CSEMap.FindNodeOrInsertPos(ID, InsertPos);
 822   return Node;
 823 }
 824
 825
 826 /// FindModifiedNodeSlot - Find a slot for the specified node if its operands
 827 /// were replaced with those specified.  If this node is never memoized,
 828 /// return null, otherwise return a pointer to the slot it would take.  If a
 829 /// node already exists with these operands, the slot will be non-null.
 830 SDNode *SelectionDAG::FindModifiedNodeSlot(SDNode *N, ArrayRef<SDValue> Ops,
 831                                            void *&InsertPos) {
 832   if (doNotCSE(N))
 833     return nullptr;
 834
 835   FoldingSetNodeID ID;
 836   AddNodeIDNode(ID, N->getOpcode(), N->getVTList(), Ops);
 837   AddNodeIDCustom(ID, N);
 838   SDNode *Node = CSEMap.FindNodeOrInsertPos(ID, InsertPos);
 839   return Node;
 840 }
 841
 842 #ifndef NDEBUG
 843 /// VerifyNodeCommon - Sanity check the given node.  Aborts if it is invalid.
 844 static void VerifyNodeCommon(SDNode *N) {
 845   switch (N->getOpcode()) {
 846   default:
 847     break;
 848   case ISD::BUILD_PAIR: {
 849     EVT VT = N->getValueType(0);
 850     assert(N->getNumValues() == 1 && "Too many results!");
 851     assert(!VT.isVector() && (VT.isInteger() || VT.isFloatingPoint()) &&
 852            "Wrong return type!");
 853     assert(N->getNumOperands() == 2 && "Wrong number of operands!");
 854     assert(N->getOperand(0).getValueType() == N->getOperand(1).getValueType() &&
 855            "Mismatched operand types!");
 856     assert(N->getOperand(0).getValueType().isInteger() == VT.isInteger() &&
 857            "Wrong operand type!");
 858     assert(VT.getSizeInBits() == 2 * N->getOperand(0).getValueSizeInBits() &&
 859            "Wrong return type size");
 860     break;
 861   }
 862   case ISD::BUILD_VECTOR: {
 863     assert(N->getNumValues() == 1 && "Too many results!");
 864     assert(N->getValueType(0).isVector() && "Wrong return type!");
 865     assert(N->getNumOperands() == N->getValueType(0).getVectorNumElements() &&
 866            "Wrong number of operands!");
 867     EVT EltVT = N->getValueType(0).getVectorElementType();
 868     for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ++I) {
 869       assert((I->getValueType() == EltVT ||
 870              (EltVT.isInteger() && I->getValueType().isInteger() &&
 871               EltVT.bitsLE(I->getValueType()))) &&
 872             "Wrong operand type!");
 873       assert(I->getValueType() == N->getOperand(0).getValueType() &&
 874              "Operands must all have the same type");
 875     }
 876     break;
 877   }
 878   }
 879 }
 880
 881 /// VerifySDNode - Sanity check the given SDNode.  Aborts if it is invalid.
 882 static void VerifySDNode(SDNode *N) {
 883   // The SDNode allocators cannot be used to allocate nodes with fields that are
 884   // not present in an SDNode!
 885   assert(!isa<MemSDNode>(N) && "Bad MemSDNode!");
 886   assert(!isa<ShuffleVectorSDNode>(N) && "Bad ShuffleVectorSDNode!");
 887   assert(!isa<ConstantSDNode>(N) && "Bad ConstantSDNode!");
 888   assert(!isa<ConstantFPSDNode>(N) && "Bad ConstantFPSDNode!");
 889   assert(!isa<GlobalAddressSDNode>(N) && "Bad GlobalAddressSDNode!");
 890   assert(!isa<FrameIndexSDNode>(N) && "Bad FrameIndexSDNode!");
 891   assert(!isa<JumpTableSDNode>(N) && "Bad JumpTableSDNode!");
 892   assert(!isa<ConstantPoolSDNode>(N) && "Bad ConstantPoolSDNode!");
 893   assert(!isa<BasicBlockSDNode>(N) && "Bad BasicBlockSDNode!");
 894   assert(!isa<SrcValueSDNode>(N) && "Bad SrcValueSDNode!");
 895   assert(!isa<MDNodeSDNode>(N) && "Bad MDNodeSDNode!");
 896   assert(!isa<RegisterSDNode>(N) && "Bad RegisterSDNode!");
 897   assert(!isa<BlockAddressSDNode>(N) && "Bad BlockAddressSDNode!");
 898   assert(!isa<EHLabelSDNode>(N) && "Bad EHLabelSDNode!");
 899   assert(!isa<ExternalSymbolSDNode>(N) && "Bad ExternalSymbolSDNode!");
 900   assert(!isa<CondCodeSDNode>(N) && "Bad CondCodeSDNode!");
 901   assert(!isa<CvtRndSatSDNode>(N) && "Bad CvtRndSatSDNode!");
 902   assert(!isa<VTSDNode>(N) && "Bad VTSDNode!");
 903   assert(!isa<MachineSDNode>(N) && "Bad MachineSDNode!");
 904
 905   VerifyNodeCommon(N);
 906 }
 907
 908 /// VerifyMachineNode - Sanity check the given MachineNode.  Aborts if it is
 909 /// invalid.
 910 static void VerifyMachineNode(SDNode *N) {
 911   // The MachineNode allocators cannot be used to allocate nodes with fields
 912   // that are not present in a MachineNode!
 913   // Currently there are no such nodes.
 914
 915   VerifyNodeCommon(N);
 916 }
 917 #endif // NDEBUG
 918
 919 /// getEVTAlignment - Compute the default alignment value for the
 920 /// given type.
 921 ///
 922 unsigned SelectionDAG::getEVTAlignment(EVT VT) const {
 923   Type *Ty = VT == MVT::iPTR ?
 924                    PointerType::get(Type::getInt8Ty(*getContext()), 0) :
 925                    VT.getTypeForEVT(*getContext());
 926
 927   return TM.getTargetLowering()->getDataLayout()->getABITypeAlignment(Ty);
 928 }
 929
 930 // EntryNode could meaningfully have debug info if we can find it...
 931 SelectionDAG::SelectionDAG(const TargetMachine &tm, CodeGenOpt::Level OL)
 932   : TM(tm), TSI(*tm.getSelectionDAGInfo()), TLI(nullptr), OptLevel(OL),
 933     EntryNode(ISD::EntryToken, 0, DebugLoc(), getVTList(MVT::Other)),
 934     Root(getEntryNode()), NewNodesMustHaveLegalTypes(false),
 935     UpdateListeners(nullptr) {
 936   AllNodes.push_back(&EntryNode);
 937   DbgInfo = new SDDbgInfo();
 938 }
 939
 940 void SelectionDAG::init(MachineFunction &mf, const TargetLowering *tli) {
 941   MF = &mf;
 942   TLI = tli;
 943   Context = &mf.getFunction()->getContext();
 944 }
 945
 946 SelectionDAG::~SelectionDAG() {
 947   assert(!UpdateListeners && "Dangling registered DAGUpdateListeners");
 948   allnodes_clear();
 949   delete DbgInfo;
 950 }
 951
 952 void SelectionDAG::allnodes_clear() {
 953   assert(&*AllNodes.begin() == &EntryNode);
 954   AllNodes.remove(AllNodes.begin());
 955   while (!AllNodes.empty())
 956     DeallocateNode(AllNodes.begin());
 957 }
 958
 959 BinarySDNode *SelectionDAG::GetBinarySDNode(unsigned Opcode, SDLoc DL,
 960                                             SDVTList VTs, SDValue N1,
 961                                             SDValue N2, bool nuw, bool nsw,
 962                                             bool exact) {
 963   if (isBinOpWithFlags(Opcode)) {
 964     BinaryWithFlagsSDNode *FN = new (NodeAllocator) BinaryWithFlagsSDNode(
 965         Opcode, DL.getIROrder(), DL.getDebugLoc(), VTs, N1, N2);
 966     FN->setHasNoUnsignedWrap(nuw);
 967     FN->setHasNoSignedWrap(nsw);
 968     FN->setIsExact(exact);
 969
 970     return FN;
 971   }
 972
 973   BinarySDNode *N = new (NodeAllocator)
 974       BinarySDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(), VTs, N1, N2);
 975   return N;
 976 }
 977
 978 void SelectionDAG::clear() {
 979   allnodes_clear();
 980   OperandAllocator.Reset();
 981   CSEMap.clear();
 982
 983   ExtendedValueTypeNodes.clear();
 984   ExternalSymbols.clear();
 985   TargetExternalSymbols.clear();
 986   std::fill(CondCodeNodes.begin(), CondCodeNodes.end(),
 987             static_cast<CondCodeSDNode*>(nullptr));
 988   std::fill(ValueTypeNodes.begin(), ValueTypeNodes.end(),
 989             static_cast<SDNode*>(nullptr));
 990
 991   EntryNode.UseList = nullptr;
 992   AllNodes.push_back(&EntryNode);
 993   Root = getEntryNode();
 994   DbgInfo->clear();
 995 }
 996
 997 SDValue SelectionDAG::getAnyExtOrTrunc(SDValue Op, SDLoc DL, EVT VT) {
 998   return VT.bitsGT(Op.getValueType()) ?
 999     getNode(ISD::ANY_EXTEND, DL, VT, Op) :
1000     getNode(ISD::TRUNCATE, DL, VT, Op);
1001 }
1002
1003 SDValue SelectionDAG::getSExtOrTrunc(SDValue Op, SDLoc DL, EVT VT) {
1004   return VT.bitsGT(Op.getValueType()) ?
1005     getNode(ISD::SIGN_EXTEND, DL, VT, Op) :
1006     getNode(ISD::TRUNCATE, DL, VT, Op);
1007 }
1008
1009 SDValue SelectionDAG::getZExtOrTrunc(SDValue Op, SDLoc DL, EVT VT) {
1010   return VT.bitsGT(Op.getValueType()) ?
1011     getNode(ISD::ZERO_EXTEND, DL, VT, Op) :
1012     getNode(ISD::TRUNCATE, DL, VT, Op);
1013 }
1014
1015 SDValue SelectionDAG::getBoolExtOrTrunc(SDValue Op, SDLoc SL, EVT VT,
1016                                         EVT OpVT) {
1017   if (VT.bitsLE(Op.getValueType()))
1018     return getNode(ISD::TRUNCATE, SL, VT, Op);
1019
1020   TargetLowering::BooleanContent BType = TLI->getBooleanContents(OpVT);
1021   return getNode(TLI->getExtendForContent(BType), SL, VT, Op);
1022 }
1023
1024 SDValue SelectionDAG::getZeroExtendInReg(SDValue Op, SDLoc DL, EVT VT) {
1025   assert(!VT.isVector() &&
1026          "getZeroExtendInReg should use the vector element type instead of "
1027          "the vector type!");
1028   if (Op.getValueType() == VT) return Op;
1029   unsigned BitWidth = Op.getValueType().getScalarType().getSizeInBits();
1030   APInt Imm = APInt::getLowBitsSet(BitWidth,
1031                                    VT.getSizeInBits());
1032   return getNode(ISD::AND, DL, Op.getValueType(), Op,
1033                  getConstant(Imm, Op.getValueType()));
1034 }
1035
1036 SDValue SelectionDAG::getAnyExtendVectorInReg(SDValue Op, SDLoc DL, EVT VT) {
1037   assert(VT.isVector() && "This DAG node is restricted to vector types.");
1038   assert(VT.getSizeInBits() == Op.getValueType().getSizeInBits() &&
1039          "The sizes of the input and result must match in order to perform the "
1040          "extend in-register.");
1041   assert(VT.getVectorNumElements() < Op.getValueType().getVectorNumElements() &&
1042          "The destination vector type must have fewer lanes than the input.");
1043   return getNode(ISD::ANY_EXTEND_VECTOR_INREG, DL, VT, Op);
1044 }
1045
1046 SDValue SelectionDAG::getSignExtendVectorInReg(SDValue Op, SDLoc DL, EVT VT) {
1047   assert(VT.isVector() && "This DAG node is restricted to vector types.");
1048   assert(VT.getSizeInBits() == Op.getValueType().getSizeInBits() &&
1049          "The sizes of the input and result must match in order to perform the "
1050          "extend in-register.");
1051   assert(VT.getVectorNumElements() < Op.getValueType().getVectorNumElements() &&
1052          "The destination vector type must have fewer lanes than the input.");
1053   return getNode(ISD::SIGN_EXTEND_VECTOR_INREG, DL, VT, Op);
1054 }
1055
1056 SDValue SelectionDAG::getZeroExtendVectorInReg(SDValue Op, SDLoc DL, EVT VT) {
1057   assert(VT.isVector() && "This DAG node is restricted to vector types.");
1058   assert(VT.getSizeInBits() == Op.getValueType().getSizeInBits() &&
1059          "The sizes of the input and result must match in order to perform the "
1060          "extend in-register.");
1061   assert(VT.getVectorNumElements() < Op.getValueType().getVectorNumElements() &&
1062          "The destination vector type must have fewer lanes than the input.");
1063   return getNode(ISD::ZERO_EXTEND_VECTOR_INREG, DL, VT, Op);
1064 }
1065
1066 /// getNOT - Create a bitwise NOT operation as (XOR Val, -1).
1067 ///
1068 SDValue SelectionDAG::getNOT(SDLoc DL, SDValue Val, EVT VT) {
1069   EVT EltVT = VT.getScalarType();
1070   SDValue NegOne =
1071     getConstant(APInt::getAllOnesValue(EltVT.getSizeInBits()), VT);
1072   return getNode(ISD::XOR, DL, VT, Val, NegOne);
1073 }
1074
1075 SDValue SelectionDAG::getLogicalNOT(SDLoc DL, SDValue Val, EVT VT) {
1076   EVT EltVT = VT.getScalarType();
1077   SDValue TrueValue;
1078   switch (TLI->getBooleanContents(VT)) {
1079     case TargetLowering::ZeroOrOneBooleanContent:
1080     case TargetLowering::UndefinedBooleanContent:
1081       TrueValue = getConstant(1, VT);
1082       break;
1083     case TargetLowering::ZeroOrNegativeOneBooleanContent:
1084       TrueValue = getConstant(APInt::getAllOnesValue(EltVT.getSizeInBits()),
1085                               VT);
1086       break;
1087   }
1088   return getNode(ISD::XOR, DL, VT, Val, TrueValue);
1089 }
1090
1091 SDValue SelectionDAG::getConstant(uint64_t Val, EVT VT, bool isT, bool isO) {
1092   EVT EltVT = VT.getScalarType();
1093   assert((EltVT.getSizeInBits() >= 64 ||
1094          (uint64_t)((int64_t)Val >> EltVT.getSizeInBits()) + 1 < 2) &&
1095          "getConstant with a uint64_t value that doesn't fit in the type!");
1096   return getConstant(APInt(EltVT.getSizeInBits(), Val), VT, isT, isO);
1097 }
1098
1099 SDValue SelectionDAG::getConstant(const APInt &Val, EVT VT, bool isT, bool isO)
1100 {
1101   return getConstant(*ConstantInt::get(*Context, Val), VT, isT, isO);
1102 }
1103
1104 SDValue SelectionDAG::getConstant(const ConstantInt &Val, EVT VT, bool isT,
1105                                   bool isO) {
1106   assert(VT.isInteger() && "Cannot create FP integer constant!");
1107
1108   EVT EltVT = VT.getScalarType();
1109   const ConstantInt *Elt = &Val;
1110
1111   const TargetLowering *TLI = TM.getTargetLowering();
1112
1113   // In some cases the vector type is legal but the element type is illegal and
1114   // needs to be promoted, for example v8i8 on ARM.  In this case, promote the
1115   // inserted value (the type does not need to match the vector element type).
1116   // Any extra bits introduced will be truncated away.
1117   if (VT.isVector() && TLI->getTypeAction(*getContext(), EltVT) ==
1118       TargetLowering::TypePromoteInteger) {
1119    EltVT = TLI->getTypeToTransformTo(*getContext(), EltVT);
1120    APInt NewVal = Elt->getValue().zext(EltVT.getSizeInBits());
1121    Elt = ConstantInt::get(*getContext(), NewVal);
1122   }
1123   // In other cases the element type is illegal and needs to be expanded, for
1124   // example v2i64 on MIPS32. In this case, find the nearest legal type, split
1125   // the value into n parts and use a vector type with n-times the elements.
1126   // Then bitcast to the type requested.
1127   // Legalizing constants too early makes the DAGCombiner's job harder so we
1128   // only legalize if the DAG tells us we must produce legal types.
1129   else if (NewNodesMustHaveLegalTypes && VT.isVector() &&
1130            TLI->getTypeAction(*getContext(), EltVT) ==
1131            TargetLowering::TypeExpandInteger) {
1132     APInt NewVal = Elt->getValue();
1133     EVT ViaEltVT = TLI->getTypeToTransformTo(*getContext(), EltVT);
1134     unsigned ViaEltSizeInBits = ViaEltVT.getSizeInBits();
1135     unsigned ViaVecNumElts = VT.getSizeInBits() / ViaEltSizeInBits;
1136     EVT ViaVecVT = EVT::getVectorVT(*getContext(), ViaEltVT, ViaVecNumElts);
1137
1138     // Check the temporary vector is the correct size. If this fails then
1139     // getTypeToTransformTo() probably returned a type whose size (in bits)
1140     // isn't a power-of-2 factor of the requested type size.
1141     assert(ViaVecVT.getSizeInBits() == VT.getSizeInBits());
1142
1143     SmallVector<SDValue, 2> EltParts;
1144     for (unsigned i = 0; i < ViaVecNumElts / VT.getVectorNumElements(); ++i) {
1145       EltParts.push_back(getConstant(NewVal.lshr(i * ViaEltSizeInBits)
1146                                            .trunc(ViaEltSizeInBits),
1147                                      ViaEltVT, isT, isO));
1148     }
1149
1150     // EltParts is currently in little endian order. If we actually want
1151     // big-endian order then reverse it now.
1152     if (TLI->isBigEndian())
1153       std::reverse(EltParts.begin(), EltParts.end());
1154
1155     // The elements must be reversed when the element order is different
1156     // to the endianness of the elements (because the BITCAST is itself a
1157     // vector shuffle in this situation). However, we do not need any code to
1158     // perform this reversal because getConstant() is producing a vector
1159     // splat.
1160     // This situation occurs in MIPS MSA.
1161
1162     SmallVector<SDValue, 8> Ops;
1163     for (unsigned i = 0; i < VT.getVectorNumElements(); ++i)
1164       Ops.insert(Ops.end(), EltParts.begin(), EltParts.end());
1165
1166     SDValue Result = getNode(ISD::BITCAST, SDLoc(), VT,
1167                              getNode(ISD::BUILD_VECTOR, SDLoc(), ViaVecVT,
1168                                      Ops));
1169     return Result;
1170   }
1171
1172   assert(Elt->getBitWidth() == EltVT.getSizeInBits() &&
1173          "APInt size does not match type size!");
1174   unsigned Opc = isT ? ISD::TargetConstant : ISD::Constant;
1175   FoldingSetNodeID ID;
1176   AddNodeIDNode(ID, Opc, getVTList(EltVT), None);
1177   ID.AddPointer(Elt);
1178   ID.AddBoolean(isO);
1179   void *IP = nullptr;
1180   SDNode *N = nullptr;
1181   if ((N = CSEMap.FindNodeOrInsertPos(ID, IP)))
1182     if (!VT.isVector())
1183       return SDValue(N, 0);
1184
1185   if (!N) {
1186     N = new (NodeAllocator) ConstantSDNode(isT, isO, Elt, EltVT);
1187     CSEMap.InsertNode(N, IP);
1188     AllNodes.push_back(N);
1189   }
1190
1191   SDValue Result(N, 0);
1192   if (VT.isVector()) {
1193     SmallVector<SDValue, 8> Ops;
1194     Ops.assign(VT.getVectorNumElements(), Result);
1195     Result = getNode(ISD::BUILD_VECTOR, SDLoc(), VT, Ops);
1196   }
1197   return Result;
1198 }
1199
1200 SDValue SelectionDAG::getIntPtrConstant(uint64_t Val, bool isTarget) {
1201   return getConstant(Val, TM.getTargetLowering()->getPointerTy(), isTarget);
1202 }
1203
1204
1205 SDValue SelectionDAG::getConstantFP(const APFloat& V, EVT VT, bool isTarget) {
1206   return getConstantFP(*ConstantFP::get(*getContext(), V), VT, isTarget);
1207 }
1208
1209 SDValue SelectionDAG::getConstantFP(const ConstantFP& V, EVT VT, bool isTarget){
1210   assert(VT.isFloatingPoint() && "Cannot create integer FP constant!");
1211
1212   EVT EltVT = VT.getScalarType();
1213
1214   // Do the map lookup using the actual bit pattern for the floating point
1215   // value, so that we don't have problems with 0.0 comparing equal to -0.0, and
1216   // we don't have issues with SNANs.
1217   unsigned Opc = isTarget ? ISD::TargetConstantFP : ISD::ConstantFP;
1218   FoldingSetNodeID ID;
1219   AddNodeIDNode(ID, Opc, getVTList(EltVT), None);
1220   ID.AddPointer(&V);
1221   void *IP = nullptr;
1222   SDNode *N = nullptr;
1223   if ((N = CSEMap.FindNodeOrInsertPos(ID, IP)))
1224     if (!VT.isVector())
1225       return SDValue(N, 0);
1226
1227   if (!N) {
1228     N = new (NodeAllocator) ConstantFPSDNode(isTarget, &V, EltVT);
1229     CSEMap.InsertNode(N, IP);
1230     AllNodes.push_back(N);
1231   }
1232
1233   SDValue Result(N, 0);
1234   if (VT.isVector()) {
1235     SmallVector<SDValue, 8> Ops;
1236     Ops.assign(VT.getVectorNumElements(), Result);
1237     // FIXME SDLoc info might be appropriate here
1238     Result = getNode(ISD::BUILD_VECTOR, SDLoc(), VT, Ops);
1239   }
1240   return Result;
1241 }
1242
1243 SDValue SelectionDAG::getConstantFP(double Val, EVT VT, bool isTarget) {
1244   EVT EltVT = VT.getScalarType();
1245   if (EltVT==MVT::f32)
1246     return getConstantFP(APFloat((float)Val), VT, isTarget);
1247   else if (EltVT==MVT::f64)
1248     return getConstantFP(APFloat(Val), VT, isTarget);
1249   else if (EltVT==MVT::f80 || EltVT==MVT::f128 || EltVT==MVT::ppcf128 ||
1250            EltVT==MVT::f16) {
1251     bool ignored;
1252     APFloat apf = APFloat(Val);
1253     apf.convert(EVTToAPFloatSemantics(EltVT), APFloat::rmNearestTiesToEven,
1254                 &ignored);
1255     return getConstantFP(apf, VT, isTarget);
1256   } else
1257     llvm_unreachable("Unsupported type in getConstantFP");
1258 }
1259
1260 SDValue SelectionDAG::getGlobalAddress(const GlobalValue *GV, SDLoc DL,
1261                                        EVT VT, int64_t Offset,
1262                                        bool isTargetGA,
1263                                        unsigned char TargetFlags) {
1264   assert((TargetFlags == 0 || isTargetGA) &&
1265          "Cannot set target flags on target-independent globals");
1266   const TargetLowering *TLI = TM.getTargetLowering();
1267
1268   // Truncate (with sign-extension) the offset value to the pointer size.
1269   unsigned BitWidth = TLI->getPointerTypeSizeInBits(GV->getType());
1270   if (BitWidth < 64)
1271     Offset = SignExtend64(Offset, BitWidth);
1272
1273   unsigned Opc;
1274   if (GV->isThreadLocal())
1275     Opc = isTargetGA ? ISD::TargetGlobalTLSAddress : ISD::GlobalTLSAddress;
1276   else
1277     Opc = isTargetGA ? ISD::TargetGlobalAddress : ISD::GlobalAddress;
1278
1279   FoldingSetNodeID ID;
1280   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1281   ID.AddPointer(GV);
1282   ID.AddInteger(Offset);
1283   ID.AddInteger(TargetFlags);
1284   ID.AddInteger(GV->getType()->getAddressSpace());
1285   void *IP = nullptr;
1286   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1287     return SDValue(E, 0);
1288
1289   SDNode *N = new (NodeAllocator) GlobalAddressSDNode(Opc, DL.getIROrder(),
1290                                                       DL.getDebugLoc(), GV, VT,
1291                                                       Offset, TargetFlags);
1292   CSEMap.InsertNode(N, IP);
1293   AllNodes.push_back(N);
1294   return SDValue(N, 0);
1295 }
1296
1297 SDValue SelectionDAG::getFrameIndex(int FI, EVT VT, bool isTarget) {
1298   unsigned Opc = isTarget ? ISD::TargetFrameIndex : ISD::FrameIndex;
1299   FoldingSetNodeID ID;
1300   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1301   ID.AddInteger(FI);
1302   void *IP = nullptr;
1303   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1304     return SDValue(E, 0);
1305
1306   SDNode *N = new (NodeAllocator) FrameIndexSDNode(FI, VT, isTarget);
1307   CSEMap.InsertNode(N, IP);
1308   AllNodes.push_back(N);
1309   return SDValue(N, 0);
1310 }
1311
1312 SDValue SelectionDAG::getJumpTable(int JTI, EVT VT, bool isTarget,
1313                                    unsigned char TargetFlags) {
1314   assert((TargetFlags == 0 || isTarget) &&
1315          "Cannot set target flags on target-independent jump tables");
1316   unsigned Opc = isTarget ? ISD::TargetJumpTable : ISD::JumpTable;
1317   FoldingSetNodeID ID;
1318   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1319   ID.AddInteger(JTI);
1320   ID.AddInteger(TargetFlags);
1321   void *IP = nullptr;
1322   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1323     return SDValue(E, 0);
1324
1325   SDNode *N = new (NodeAllocator) JumpTableSDNode(JTI, VT, isTarget,
1326                                                   TargetFlags);
1327   CSEMap.InsertNode(N, IP);
1328   AllNodes.push_back(N);
1329   return SDValue(N, 0);
1330 }
1331
1332 SDValue SelectionDAG::getConstantPool(const Constant *C, EVT VT,
1333                                       unsigned Alignment, int Offset,
1334                                       bool isTarget,
1335                                       unsigned char TargetFlags) {
1336   assert((TargetFlags == 0 || isTarget) &&
1337          "Cannot set target flags on target-independent globals");
1338   if (Alignment == 0)
1339     Alignment =
1340     TM.getTargetLowering()->getDataLayout()->getPrefTypeAlignment(C->getType());
1341   unsigned Opc = isTarget ? ISD::TargetConstantPool : ISD::ConstantPool;
1342   FoldingSetNodeID ID;
1343   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1344   ID.AddInteger(Alignment);
1345   ID.AddInteger(Offset);
1346   ID.AddPointer(C);
1347   ID.AddInteger(TargetFlags);
1348   void *IP = nullptr;
1349   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1350     return SDValue(E, 0);
1351
1352   SDNode *N = new (NodeAllocator) ConstantPoolSDNode(isTarget, C, VT, Offset,
1353                                                      Alignment, TargetFlags);
1354   CSEMap.InsertNode(N, IP);
1355   AllNodes.push_back(N);
1356   return SDValue(N, 0);
1357 }
1358
1359
1360 SDValue SelectionDAG::getConstantPool(MachineConstantPoolValue *C, EVT VT,
1361                                       unsigned Alignment, int Offset,
1362                                       bool isTarget,
1363                                       unsigned char TargetFlags) {
1364   assert((TargetFlags == 0 || isTarget) &&
1365          "Cannot set target flags on target-independent globals");
1366   if (Alignment == 0)
1367     Alignment =
1368     TM.getTargetLowering()->getDataLayout()->getPrefTypeAlignment(C->getType());
1369   unsigned Opc = isTarget ? ISD::TargetConstantPool : ISD::ConstantPool;
1370   FoldingSetNodeID ID;
1371   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1372   ID.AddInteger(Alignment);
1373   ID.AddInteger(Offset);
1374   C->addSelectionDAGCSEId(ID);
1375   ID.AddInteger(TargetFlags);
1376   void *IP = nullptr;
1377   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1378     return SDValue(E, 0);
1379
1380   SDNode *N = new (NodeAllocator) ConstantPoolSDNode(isTarget, C, VT, Offset,
1381                                                      Alignment, TargetFlags);
1382   CSEMap.InsertNode(N, IP);
1383   AllNodes.push_back(N);
1384   return SDValue(N, 0);
1385 }
1386
1387 SDValue SelectionDAG::getTargetIndex(int Index, EVT VT, int64_t Offset,
1388                                      unsigned char TargetFlags) {
1389   FoldingSetNodeID ID;
1390   AddNodeIDNode(ID, ISD::TargetIndex, getVTList(VT), None);
1391   ID.AddInteger(Index);
1392   ID.AddInteger(Offset);
1393   ID.AddInteger(TargetFlags);
1394   void *IP = nullptr;
1395   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1396     return SDValue(E, 0);
1397
1398   SDNode *N = new (NodeAllocator) TargetIndexSDNode(Index, VT, Offset,
1399                                                     TargetFlags);
1400   CSEMap.InsertNode(N, IP);
1401   AllNodes.push_back(N);
1402   return SDValue(N, 0);
1403 }
1404
1405 SDValue SelectionDAG::getBasicBlock(MachineBasicBlock *MBB) {
1406   FoldingSetNodeID ID;
1407   AddNodeIDNode(ID, ISD::BasicBlock, getVTList(MVT::Other), None);
1408   ID.AddPointer(MBB);
1409   void *IP = nullptr;
1410   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1411     return SDValue(E, 0);
1412
1413   SDNode *N = new (NodeAllocator) BasicBlockSDNode(MBB);
1414   CSEMap.InsertNode(N, IP);
1415   AllNodes.push_back(N);
1416   return SDValue(N, 0);
1417 }
1418
1419 SDValue SelectionDAG::getValueType(EVT VT) {
1420   if (VT.isSimple() && (unsigned)VT.getSimpleVT().SimpleTy >=
1421       ValueTypeNodes.size())
1422     ValueTypeNodes.resize(VT.getSimpleVT().SimpleTy+1);
1423
1424   SDNode *&N = VT.isExtended() ?
1425     ExtendedValueTypeNodes[VT] : ValueTypeNodes[VT.getSimpleVT().SimpleTy];
1426
1427   if (N) return SDValue(N, 0);
1428   N = new (NodeAllocator) VTSDNode(VT);
1429   AllNodes.push_back(N);
1430   return SDValue(N, 0);
1431 }
1432
1433 SDValue SelectionDAG::getExternalSymbol(const char *Sym, EVT VT) {
1434   SDNode *&N = ExternalSymbols[Sym];
1435   if (N) return SDValue(N, 0);
1436   N = new (NodeAllocator) ExternalSymbolSDNode(false, Sym, 0, VT);
1437   AllNodes.push_back(N);
1438   return SDValue(N, 0);
1439 }
1440
1441 SDValue SelectionDAG::getTargetExternalSymbol(const char *Sym, EVT VT,
1442                                               unsigned char TargetFlags) {
1443   SDNode *&N =
1444     TargetExternalSymbols[std::pair<std::string,unsigned char>(Sym,
1445                                                                TargetFlags)];
1446   if (N) return SDValue(N, 0);
1447   N = new (NodeAllocator) ExternalSymbolSDNode(true, Sym, TargetFlags, VT);
1448   AllNodes.push_back(N);
1449   return SDValue(N, 0);
1450 }
1451
1452 SDValue SelectionDAG::getCondCode(ISD::CondCode Cond) {
1453   if ((unsigned)Cond >= CondCodeNodes.size())
1454     CondCodeNodes.resize(Cond+1);
1455
1456   if (!CondCodeNodes[Cond]) {
1457     CondCodeSDNode *N = new (NodeAllocator) CondCodeSDNode(Cond);
1458     CondCodeNodes[Cond] = N;
1459     AllNodes.push_back(N);
1460   }
1461
1462   return SDValue(CondCodeNodes[Cond], 0);
1463 }
1464
1465 // commuteShuffle - swaps the values of N1 and N2, and swaps all indices in
1466 // the shuffle mask M that point at N1 to point at N2, and indices that point
1467 // N2 to point at N1.
1468 static void commuteShuffle(SDValue &N1, SDValue &N2, SmallVectorImpl<int> &M) {
1469   std::swap(N1, N2);
1470   int NElts = M.size();
1471   for (int i = 0; i != NElts; ++i) {
1472     if (M[i] >= NElts)
1473       M[i] -= NElts;
1474     else if (M[i] >= 0)
1475       M[i] += NElts;
1476   }
1477 }
1478
1479 SDValue SelectionDAG::getVectorShuffle(EVT VT, SDLoc dl, SDValue N1,
1480                                        SDValue N2, const int *Mask) {
1481   assert(VT == N1.getValueType() && VT == N2.getValueType() &&
1482          "Invalid VECTOR_SHUFFLE");
1483
1484   // Canonicalize shuffle undef, undef -> undef
1485   if (N1.getOpcode() == ISD::UNDEF && N2.getOpcode() == ISD::UNDEF)
1486     return getUNDEF(VT);
1487
1488   // Validate that all indices in Mask are within the range of the elements
1489   // input to the shuffle.
1490   unsigned NElts = VT.getVectorNumElements();
1491   SmallVector<int, 8> MaskVec;
1492   for (unsigned i = 0; i != NElts; ++i) {
1493     assert(Mask[i] < (int)(NElts * 2) && "Index out of range");
1494     MaskVec.push_back(Mask[i]);
1495   }
1496
1497   // Canonicalize shuffle v, v -> v, undef
1498   if (N1 == N2) {
1499     N2 = getUNDEF(VT);
1500     for (unsigned i = 0; i != NElts; ++i)
1501       if (MaskVec[i] >= (int)NElts) MaskVec[i] -= NElts;
1502   }
1503
1504   // Canonicalize shuffle undef, v -> v, undef.  Commute the shuffle mask.
1505   if (N1.getOpcode() == ISD::UNDEF)
1506     commuteShuffle(N1, N2, MaskVec);
1507
1508   // Canonicalize all index into lhs, -> shuffle lhs, undef
1509   // Canonicalize all index into rhs, -> shuffle rhs, undef
1510   bool AllLHS = true, AllRHS = true;
1511   bool N2Undef = N2.getOpcode() == ISD::UNDEF;
1512   for (unsigned i = 0; i != NElts; ++i) {
1513     if (MaskVec[i] >= (int)NElts) {
1514       if (N2Undef)
1515         MaskVec[i] = -1;
1516       else
1517         AllLHS = false;
1518     } else if (MaskVec[i] >= 0) {
1519       AllRHS = false;
1520     }
1521   }
1522   if (AllLHS && AllRHS)
1523     return getUNDEF(VT);
1524   if (AllLHS && !N2Undef)
1525     N2 = getUNDEF(VT);
1526   if (AllRHS) {
1527     N1 = getUNDEF(VT);
1528     commuteShuffle(N1, N2, MaskVec);
1529   }
1530   // Reset our undef status after accounting for the mask.
1531   N2Undef = N2.getOpcode() == ISD::UNDEF;
1532   // Re-check whether both sides ended up undef.
1533   if (N1.getOpcode() == ISD::UNDEF && N2Undef)
1534     return getUNDEF(VT);
1535
1536   // If Identity shuffle return that node.
1537   bool Identity = true;
1538   for (unsigned i = 0; i != NElts; ++i) {
1539     if (MaskVec[i] >= 0 && MaskVec[i] != (int)i) Identity = false;
1540   }
1541   if (Identity && NElts)
1542     return N1;
1543
1544   // Shuffling a constant splat doesn't change the result.
1545   if (N2Undef) {
1546     SDValue V = N1;
1547
1548     // Look through any bitcasts. We check that these don't change the number
1549     // (and size) of elements and just changes their types.
1550     while (V.getOpcode() == ISD::BITCAST)
1551       V = V->getOperand(0);
1552
1553     // A splat should always show up as a build vector node.
1554     if (auto *BV = dyn_cast<BuildVectorSDNode>(V)) {
1555       BitVector UndefElements;
1556       SDValue Splat = BV->getSplatValue(&UndefElements);
1557       // If this is a splat of an undef, shuffling it is also undef.
1558       if (Splat && Splat.getOpcode() == ISD::UNDEF)
1559         return getUNDEF(VT);
1560
1561       // We only have a splat which can skip shuffles if there is a splatted
1562       // value and no undef lanes rearranged by the shuffle.
1563       if (Splat && UndefElements.none()) {
1564         // Splat of <x, x, ..., x>, return <x, x, ..., x>, provided that the
1565         // number of elements match or the value splatted is a zero constant.
1566         if (V.getValueType().getVectorNumElements() ==
1567             VT.getVectorNumElements())
1568           return N1;
1569         if (auto *C = dyn_cast<ConstantSDNode>(Splat))
1570           if (C->isNullValue())
1571             return N1;
1572       }
1573     }
1574   }
1575
1576   FoldingSetNodeID ID;
1577   SDValue Ops[2] = { N1, N2 };
1578   AddNodeIDNode(ID, ISD::VECTOR_SHUFFLE, getVTList(VT), Ops);
1579   for (unsigned i = 0; i != NElts; ++i)
1580     ID.AddInteger(MaskVec[i]);
1581
1582   void* IP = nullptr;
1583   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1584     return SDValue(E, 0);
1585
1586   // Allocate the mask array for the node out of the BumpPtrAllocator, since
1587   // SDNode doesn't have access to it.  This memory will be "leaked" when
1588   // the node is deallocated, but recovered when the NodeAllocator is released.
1589   int *MaskAlloc = OperandAllocator.Allocate<int>(NElts);
1590   memcpy(MaskAlloc, &MaskVec[0], NElts * sizeof(int));
1591
1592   ShuffleVectorSDNode *N =
1593     new (NodeAllocator) ShuffleVectorSDNode(VT, dl.getIROrder(),
1594                                             dl.getDebugLoc(), N1, N2,
1595                                             MaskAlloc);
1596   CSEMap.InsertNode(N, IP);
1597   AllNodes.push_back(N);
1598   return SDValue(N, 0);
1599 }
1600
1601 SDValue SelectionDAG::getConvertRndSat(EVT VT, SDLoc dl,
1602                                        SDValue Val, SDValue DTy,
1603                                        SDValue STy, SDValue Rnd, SDValue Sat,
1604                                        ISD::CvtCode Code) {
1605   // If the src and dest types are the same and the conversion is between
1606   // integer types of the same sign or two floats, no conversion is necessary.
1607   if (DTy == STy &&
1608       (Code == ISD::CVT_UU || Code == ISD::CVT_SS || Code == ISD::CVT_FF))
1609     return Val;
1610
1611   FoldingSetNodeID ID;
1612   SDValue Ops[] = { Val, DTy, STy, Rnd, Sat };
1613   AddNodeIDNode(ID, ISD::CONVERT_RNDSAT, getVTList(VT), Ops);
1614   void* IP = nullptr;
1615   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1616     return SDValue(E, 0);
1617
1618   CvtRndSatSDNode *N = new (NodeAllocator) CvtRndSatSDNode(VT, dl.getIROrder(),
1619                                                            dl.getDebugLoc(),
1620                                                            Ops, Code);
1621   CSEMap.InsertNode(N, IP);
1622   AllNodes.push_back(N);
1623   return SDValue(N, 0);
1624 }
1625
1626 SDValue SelectionDAG::getRegister(unsigned RegNo, EVT VT) {
1627   FoldingSetNodeID ID;
1628   AddNodeIDNode(ID, ISD::Register, getVTList(VT), None);
1629   ID.AddInteger(RegNo);
1630   void *IP = nullptr;
1631   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1632     return SDValue(E, 0);
1633
1634   SDNode *N = new (NodeAllocator) RegisterSDNode(RegNo, VT);
1635   CSEMap.InsertNode(N, IP);
1636   AllNodes.push_back(N);
1637   return SDValue(N, 0);
1638 }
1639
1640 SDValue SelectionDAG::getRegisterMask(const uint32_t *RegMask) {
1641   FoldingSetNodeID ID;
1642   AddNodeIDNode(ID, ISD::RegisterMask, getVTList(MVT::Untyped), None);
1643   ID.AddPointer(RegMask);
1644   void *IP = nullptr;
1645   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1646     return SDValue(E, 0);
1647
1648   SDNode *N = new (NodeAllocator) RegisterMaskSDNode(RegMask);
1649   CSEMap.InsertNode(N, IP);
1650   AllNodes.push_back(N);
1651   return SDValue(N, 0);
1652 }
1653
1654 SDValue SelectionDAG::getEHLabel(SDLoc dl, SDValue Root, MCSymbol *Label) {
1655   FoldingSetNodeID ID;
1656   SDValue Ops[] = { Root };
1657   AddNodeIDNode(ID, ISD::EH_LABEL, getVTList(MVT::Other), Ops);
1658   ID.AddPointer(Label);
1659   void *IP = nullptr;
1660   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1661     return SDValue(E, 0);
1662
1663   SDNode *N = new (NodeAllocator) EHLabelSDNode(dl.getIROrder(),
1664                                                 dl.getDebugLoc(), Root, Label);
1665   CSEMap.InsertNode(N, IP);
1666   AllNodes.push_back(N);
1667   return SDValue(N, 0);
1668 }
1669
1670
1671 SDValue SelectionDAG::getBlockAddress(const BlockAddress *BA, EVT VT,
1672                                       int64_t Offset,
1673                                       bool isTarget,
1674                                       unsigned char TargetFlags) {
1675   unsigned Opc = isTarget ? ISD::TargetBlockAddress : ISD::BlockAddress;
1676
1677   FoldingSetNodeID ID;
1678   AddNodeIDNode(ID, Opc, getVTList(VT), None);
1679   ID.AddPointer(BA);
1680   ID.AddInteger(Offset);
1681   ID.AddInteger(TargetFlags);
1682   void *IP = nullptr;
1683   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1684     return SDValue(E, 0);
1685
1686   SDNode *N = new (NodeAllocator) BlockAddressSDNode(Opc, VT, BA, Offset,
1687                                                      TargetFlags);
1688   CSEMap.InsertNode(N, IP);
1689   AllNodes.push_back(N);
1690   return SDValue(N, 0);
1691 }
1692
1693 SDValue SelectionDAG::getSrcValue(const Value *V) {
1694   assert((!V || V->getType()->isPointerTy()) &&
1695          "SrcValue is not a pointer?");
1696
1697   FoldingSetNodeID ID;
1698   AddNodeIDNode(ID, ISD::SRCVALUE, getVTList(MVT::Other), None);
1699   ID.AddPointer(V);
1700
1701   void *IP = nullptr;
1702   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1703     return SDValue(E, 0);
1704
1705   SDNode *N = new (NodeAllocator) SrcValueSDNode(V);
1706   CSEMap.InsertNode(N, IP);
1707   AllNodes.push_back(N);
1708   return SDValue(N, 0);
1709 }
1710
1711 /// getMDNode - Return an MDNodeSDNode which holds an MDNode.
1712 SDValue SelectionDAG::getMDNode(const MDNode *MD) {
1713   FoldingSetNodeID ID;
1714   AddNodeIDNode(ID, ISD::MDNODE_SDNODE, getVTList(MVT::Other), None);
1715   ID.AddPointer(MD);
1716
1717   void *IP = nullptr;
1718   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1719     return SDValue(E, 0);
1720
1721   SDNode *N = new (NodeAllocator) MDNodeSDNode(MD);
1722   CSEMap.InsertNode(N, IP);
1723   AllNodes.push_back(N);
1724   return SDValue(N, 0);
1725 }
1726
1727 /// getAddrSpaceCast - Return an AddrSpaceCastSDNode.
1728 SDValue SelectionDAG::getAddrSpaceCast(SDLoc dl, EVT VT, SDValue Ptr,
1729                                        unsigned SrcAS, unsigned DestAS) {
1730   SDValue Ops[] = {Ptr};
1731   FoldingSetNodeID ID;
1732   AddNodeIDNode(ID, ISD::ADDRSPACECAST, getVTList(VT), Ops);
1733   ID.AddInteger(SrcAS);
1734   ID.AddInteger(DestAS);
1735
1736   void *IP = nullptr;
1737   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
1738     return SDValue(E, 0);
1739
1740   SDNode *N = new (NodeAllocator) AddrSpaceCastSDNode(dl.getIROrder(),
1741                                                       dl.getDebugLoc(),
1742                                                       VT, Ptr, SrcAS, DestAS);
1743   CSEMap.InsertNode(N, IP);
1744   AllNodes.push_back(N);
1745   return SDValue(N, 0);
1746 }
1747
1748 /// getShiftAmountOperand - Return the specified value casted to
1749 /// the target's desired shift amount type.
1750 SDValue SelectionDAG::getShiftAmountOperand(EVT LHSTy, SDValue Op) {
1751   EVT OpTy = Op.getValueType();
1752   EVT ShTy = TM.getTargetLowering()->getShiftAmountTy(LHSTy);
1753   if (OpTy == ShTy || OpTy.isVector()) return Op;
1754
1755   ISD::NodeType Opcode = OpTy.bitsGT(ShTy) ?  ISD::TRUNCATE : ISD::ZERO_EXTEND;
1756   return getNode(Opcode, SDLoc(Op), ShTy, Op);
1757 }
1758
1759 /// CreateStackTemporary - Create a stack temporary, suitable for holding the
1760 /// specified value type.
1761 SDValue SelectionDAG::CreateStackTemporary(EVT VT, unsigned minAlign) {
1762   MachineFrameInfo *FrameInfo = getMachineFunction().getFrameInfo();
1763   unsigned ByteSize = VT.getStoreSize();
1764   Type *Ty = VT.getTypeForEVT(*getContext());
1765   const TargetLowering *TLI = TM.getTargetLowering();
1766   unsigned StackAlign =
1767   std::max((unsigned)TLI->getDataLayout()->getPrefTypeAlignment(Ty), minAlign);
1768
1769   int FrameIdx = FrameInfo->CreateStackObject(ByteSize, StackAlign, false);
1770   return getFrameIndex(FrameIdx, TLI->getPointerTy());
1771 }
1772
1773 /// CreateStackTemporary - Create a stack temporary suitable for holding
1774 /// either of the specified value types.
1775 SDValue SelectionDAG::CreateStackTemporary(EVT VT1, EVT VT2) {
1776   unsigned Bytes = std::max(VT1.getStoreSizeInBits(),
1777                             VT2.getStoreSizeInBits())/8;
1778   Type *Ty1 = VT1.getTypeForEVT(*getContext());
1779   Type *Ty2 = VT2.getTypeForEVT(*getContext());
1780   const TargetLowering *TLI = TM.getTargetLowering();
1781   const DataLayout *TD = TLI->getDataLayout();
1782   unsigned Align = std::max(TD->getPrefTypeAlignment(Ty1),
1783                             TD->getPrefTypeAlignment(Ty2));
1784
1785   MachineFrameInfo *FrameInfo = getMachineFunction().getFrameInfo();
1786   int FrameIdx = FrameInfo->CreateStackObject(Bytes, Align, false);
1787   return getFrameIndex(FrameIdx, TLI->getPointerTy());
1788 }
1789
1790 SDValue SelectionDAG::FoldSetCC(EVT VT, SDValue N1,
1791                                 SDValue N2, ISD::CondCode Cond, SDLoc dl) {
1792   // These setcc operations always fold.
1793   switch (Cond) {
1794   default: break;
1795   case ISD::SETFALSE:
1796   case ISD::SETFALSE2: return getConstant(0, VT);
1797   case ISD::SETTRUE:
1798   case ISD::SETTRUE2: {
1799     const TargetLowering *TLI = TM.getTargetLowering();
1800     TargetLowering::BooleanContent Cnt =
1801         TLI->getBooleanContents(N1->getValueType(0));
1802     return getConstant(
1803         Cnt == TargetLowering::ZeroOrNegativeOneBooleanContent ? -1ULL : 1, VT);
1804   }
1805
1806   case ISD::SETOEQ:
1807   case ISD::SETOGT:
1808   case ISD::SETOGE:
1809   case ISD::SETOLT:
1810   case ISD::SETOLE:
1811   case ISD::SETONE:
1812   case ISD::SETO:
1813   case ISD::SETUO:
1814   case ISD::SETUEQ:
1815   case ISD::SETUNE:
1816     assert(!N1.getValueType().isInteger() && "Illegal setcc for integer!");
1817     break;
1818   }
1819
1820   if (ConstantSDNode *N2C = dyn_cast<ConstantSDNode>(N2.getNode())) {
1821     const APInt &C2 = N2C->getAPIntValue();
1822     if (ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1.getNode())) {
1823       const APInt &C1 = N1C->getAPIntValue();
1824
1825       switch (Cond) {
1826       default: llvm_unreachable("Unknown integer setcc!");
1827       case ISD::SETEQ:  return getConstant(C1 == C2, VT);
1828       case ISD::SETNE:  return getConstant(C1 != C2, VT);
1829       case ISD::SETULT: return getConstant(C1.ult(C2), VT);
1830       case ISD::SETUGT: return getConstant(C1.ugt(C2), VT);
1831       case ISD::SETULE: return getConstant(C1.ule(C2), VT);
1832       case ISD::SETUGE: return getConstant(C1.uge(C2), VT);
1833       case ISD::SETLT:  return getConstant(C1.slt(C2), VT);
1834       case ISD::SETGT:  return getConstant(C1.sgt(C2), VT);
1835       case ISD::SETLE:  return getConstant(C1.sle(C2), VT);
1836       case ISD::SETGE:  return getConstant(C1.sge(C2), VT);
1837       }
1838     }
1839   }
1840   if (ConstantFPSDNode *N1C = dyn_cast<ConstantFPSDNode>(N1.getNode())) {
1841     if (ConstantFPSDNode *N2C = dyn_cast<ConstantFPSDNode>(N2.getNode())) {
1842       APFloat::cmpResult R = N1C->getValueAPF().compare(N2C->getValueAPF());
1843       switch (Cond) {
1844       default: break;
1845       case ISD::SETEQ:  if (R==APFloat::cmpUnordered)
1846                           return getUNDEF(VT);
1847                         // fall through
1848       case ISD::SETOEQ: return getConstant(R==APFloat::cmpEqual, VT);
1849       case ISD::SETNE:  if (R==APFloat::cmpUnordered)
1850                           return getUNDEF(VT);
1851                         // fall through
1852       case ISD::SETONE: return getConstant(R==APFloat::cmpGreaterThan ||
1853                                            R==APFloat::cmpLessThan, VT);
1854       case ISD::SETLT:  if (R==APFloat::cmpUnordered)
1855                           return getUNDEF(VT);
1856                         // fall through
1857       case ISD::SETOLT: return getConstant(R==APFloat::cmpLessThan, VT);
1858       case ISD::SETGT:  if (R==APFloat::cmpUnordered)
1859                           return getUNDEF(VT);
1860                         // fall through
1861       case ISD::SETOGT: return getConstant(R==APFloat::cmpGreaterThan, VT);
1862       case ISD::SETLE:  if (R==APFloat::cmpUnordered)
1863                           return getUNDEF(VT);
1864                         // fall through
1865       case ISD::SETOLE: return getConstant(R==APFloat::cmpLessThan ||
1866                                            R==APFloat::cmpEqual, VT);
1867       case ISD::SETGE:  if (R==APFloat::cmpUnordered)
1868                           return getUNDEF(VT);
1869                         // fall through
1870       case ISD::SETOGE: return getConstant(R==APFloat::cmpGreaterThan ||
1871                                            R==APFloat::cmpEqual, VT);
1872       case ISD::SETO:   return getConstant(R!=APFloat::cmpUnordered, VT);
1873       case ISD::SETUO:  return getConstant(R==APFloat::cmpUnordered, VT);
1874       case ISD::SETUEQ: return getConstant(R==APFloat::cmpUnordered ||
1875                                            R==APFloat::cmpEqual, VT);
1876       case ISD::SETUNE: return getConstant(R!=APFloat::cmpEqual, VT);
1877       case ISD::SETULT: return getConstant(R==APFloat::cmpUnordered ||
1878                                            R==APFloat::cmpLessThan, VT);
1879       case ISD::SETUGT: return getConstant(R==APFloat::cmpGreaterThan ||
1880                                            R==APFloat::cmpUnordered, VT);
1881       case ISD::SETULE: return getConstant(R!=APFloat::cmpGreaterThan, VT);
1882       case ISD::SETUGE: return getConstant(R!=APFloat::cmpLessThan, VT);
1883       }
1884     } else {
1885       // Ensure that the constant occurs on the RHS.
1886       ISD::CondCode SwappedCond = ISD::getSetCCSwappedOperands(Cond);
1887       MVT CompVT = N1.getValueType().getSimpleVT();
1888       if (!TM.getTargetLowering()->isCondCodeLegal(SwappedCond, CompVT))
1889         return SDValue();
1890
1891       return getSetCC(dl, VT, N2, N1, SwappedCond);
1892     }
1893   }
1894
1895   // Could not fold it.
1896   return SDValue();
1897 }
1898
1899 /// SignBitIsZero - Return true if the sign bit of Op is known to be zero.  We
1900 /// use this predicate to simplify operations downstream.
1901 bool SelectionDAG::SignBitIsZero(SDValue Op, unsigned Depth) const {
1902   // This predicate is not safe for vector operations.
1903   if (Op.getValueType().isVector())
1904     return false;
1905
1906   unsigned BitWidth = Op.getValueType().getScalarType().getSizeInBits();
1907   return MaskedValueIsZero(Op, APInt::getSignBit(BitWidth), Depth);
1908 }
1909
1910 /// MaskedValueIsZero - Return true if 'V & Mask' is known to be zero.  We use
1911 /// this predicate to simplify operations downstream.  Mask is known to be zero
1912 /// for bits that V cannot have.
1913 bool SelectionDAG::MaskedValueIsZero(SDValue Op, const APInt &Mask,
1914                                      unsigned Depth) const {
1915   APInt KnownZero, KnownOne;
1916   computeKnownBits(Op, KnownZero, KnownOne, Depth);
1917   return (KnownZero & Mask) == Mask;
1918 }
1919
1920 /// Determine which bits of Op are known to be either zero or one and return
1921 /// them in the KnownZero/KnownOne bitsets.
1922 void SelectionDAG::computeKnownBits(SDValue Op, APInt &KnownZero,
1923                                     APInt &KnownOne, unsigned Depth) const {
1924   const TargetLowering *TLI = TM.getTargetLowering();
1925   unsigned BitWidth = Op.getValueType().getScalarType().getSizeInBits();
1926
1927   KnownZero = KnownOne = APInt(BitWidth, 0);   // Don't know anything.
1928   if (Depth == 6)
1929     return;  // Limit search depth.
1930
1931   APInt KnownZero2, KnownOne2;
1932
1933   switch (Op.getOpcode()) {
1934   case ISD::Constant:
1935     // We know all of the bits for a constant!
1936     KnownOne = cast<ConstantSDNode>(Op)->getAPIntValue();
1937     KnownZero = ~KnownOne;
1938     break;
1939   case ISD::AND:
1940     // If either the LHS or the RHS are Zero, the result is zero.
1941     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
1942     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
1943
1944     // Output known-1 bits are only known if set in both the LHS & RHS.
1945     KnownOne &= KnownOne2;
1946     // Output known-0 are known to be clear if zero in either the LHS | RHS.
1947     KnownZero |= KnownZero2;
1948     break;
1949   case ISD::OR:
1950     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
1951     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
1952
1953     // Output known-0 bits are only known if clear in both the LHS & RHS.
1954     KnownZero &= KnownZero2;
1955     // Output known-1 are known to be set if set in either the LHS | RHS.
1956     KnownOne |= KnownOne2;
1957     break;
1958   case ISD::XOR: {
1959     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
1960     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
1961
1962     // Output known-0 bits are known if clear or set in both the LHS & RHS.
1963     APInt KnownZeroOut = (KnownZero & KnownZero2) | (KnownOne & KnownOne2);
1964     // Output known-1 are known to be set if set in only one of the LHS, RHS.
1965     KnownOne = (KnownZero & KnownOne2) | (KnownOne & KnownZero2);
1966     KnownZero = KnownZeroOut;
1967     break;
1968   }
1969   case ISD::MUL: {
1970     computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
1971     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
1972
1973     // If low bits are zero in either operand, output low known-0 bits.
1974     // Also compute a conserative estimate for high known-0 bits.
1975     // More trickiness is possible, but this is sufficient for the
1976     // interesting case of alignment computation.
1977     KnownOne.clearAllBits();
1978     unsigned TrailZ = KnownZero.countTrailingOnes() +
1979                       KnownZero2.countTrailingOnes();
1980     unsigned LeadZ =  std::max(KnownZero.countLeadingOnes() +
1981                                KnownZero2.countLeadingOnes(),
1982                                BitWidth) - BitWidth;
1983
1984     TrailZ = std::min(TrailZ, BitWidth);
1985     LeadZ = std::min(LeadZ, BitWidth);
1986     KnownZero = APInt::getLowBitsSet(BitWidth, TrailZ) |
1987                 APInt::getHighBitsSet(BitWidth, LeadZ);
1988     break;
1989   }
1990   case ISD::UDIV: {
1991     // For the purposes of computing leading zeros we can conservatively
1992     // treat a udiv as a logical right shift by the power of 2 known to
1993     // be less than the denominator.
1994     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
1995     unsigned LeadZ = KnownZero2.countLeadingOnes();
1996
1997     KnownOne2.clearAllBits();
1998     KnownZero2.clearAllBits();
1999     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2000     unsigned RHSUnknownLeadingOnes = KnownOne2.countLeadingZeros();
2001     if (RHSUnknownLeadingOnes != BitWidth)
2002       LeadZ = std::min(BitWidth,
2003                        LeadZ + BitWidth - RHSUnknownLeadingOnes - 1);
2004
2005     KnownZero = APInt::getHighBitsSet(BitWidth, LeadZ);
2006     break;
2007   }
2008   case ISD::SELECT:
2009     computeKnownBits(Op.getOperand(2), KnownZero, KnownOne, Depth+1);
2010     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2011
2012     // Only known if known in both the LHS and RHS.
2013     KnownOne &= KnownOne2;
2014     KnownZero &= KnownZero2;
2015     break;
2016   case ISD::SELECT_CC:
2017     computeKnownBits(Op.getOperand(3), KnownZero, KnownOne, Depth+1);
2018     computeKnownBits(Op.getOperand(2), KnownZero2, KnownOne2, Depth+1);
2019
2020     // Only known if known in both the LHS and RHS.
2021     KnownOne &= KnownOne2;
2022     KnownZero &= KnownZero2;
2023     break;
2024   case ISD::SADDO:
2025   case ISD::UADDO:
2026   case ISD::SSUBO:
2027   case ISD::USUBO:
2028   case ISD::SMULO:
2029   case ISD::UMULO:
2030     if (Op.getResNo() != 1)
2031       break;
2032     // The boolean result conforms to getBooleanContents.
2033     // If we know the result of a setcc has the top bits zero, use this info.
2034     // We know that we have an integer-based boolean since these operations
2035     // are only available for integer.
2036     if (TLI->getBooleanContents(Op.getValueType().isVector(), false) ==
2037             TargetLowering::ZeroOrOneBooleanContent &&
2038         BitWidth > 1)
2039       KnownZero |= APInt::getHighBitsSet(BitWidth, BitWidth - 1);
2040     break;
2041   case ISD::SETCC:
2042     // If we know the result of a setcc has the top bits zero, use this info.
2043     if (TLI->getBooleanContents(Op.getOperand(0).getValueType()) ==
2044             TargetLowering::ZeroOrOneBooleanContent &&
2045         BitWidth > 1)
2046       KnownZero |= APInt::getHighBitsSet(BitWidth, BitWidth - 1);
2047     break;
2048   case ISD::SHL:
2049     // (shl X, C1) & C2 == 0   iff   (X & C2 >>u C1) == 0
2050     if (ConstantSDNode *SA = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2051       unsigned ShAmt = SA->getZExtValue();
2052
2053       // If the shift count is an invalid immediate, don't do anything.
2054       if (ShAmt >= BitWidth)
2055         break;
2056
2057       computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2058       KnownZero <<= ShAmt;
2059       KnownOne  <<= ShAmt;
2060       // low bits known zero.
2061       KnownZero |= APInt::getLowBitsSet(BitWidth, ShAmt);
2062     }
2063     break;
2064   case ISD::SRL:
2065     // (ushr X, C1) & C2 == 0   iff  (-1 >> C1) & C2 == 0
2066     if (ConstantSDNode *SA = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2067       unsigned ShAmt = SA->getZExtValue();
2068
2069       // If the shift count is an invalid immediate, don't do anything.
2070       if (ShAmt >= BitWidth)
2071         break;
2072
2073       computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2074       KnownZero = KnownZero.lshr(ShAmt);
2075       KnownOne  = KnownOne.lshr(ShAmt);
2076
2077       APInt HighBits = APInt::getHighBitsSet(BitWidth, ShAmt);
2078       KnownZero |= HighBits;  // High bits known zero.
2079     }
2080     break;
2081   case ISD::SRA:
2082     if (ConstantSDNode *SA = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2083       unsigned ShAmt = SA->getZExtValue();
2084
2085       // If the shift count is an invalid immediate, don't do anything.
2086       if (ShAmt >= BitWidth)
2087         break;
2088
2089       // If any of the demanded bits are produced by the sign extension, we also
2090       // demand the input sign bit.
2091       APInt HighBits = APInt::getHighBitsSet(BitWidth, ShAmt);
2092
2093       computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2094       KnownZero = KnownZero.lshr(ShAmt);
2095       KnownOne  = KnownOne.lshr(ShAmt);
2096
2097       // Handle the sign bits.
2098       APInt SignBit = APInt::getSignBit(BitWidth);
2099       SignBit = SignBit.lshr(ShAmt);  // Adjust to where it is now in the mask.
2100
2101       if (KnownZero.intersects(SignBit)) {
2102         KnownZero |= HighBits;  // New bits are known zero.
2103       } else if (KnownOne.intersects(SignBit)) {
2104         KnownOne  |= HighBits;  // New bits are known one.
2105       }
2106     }
2107     break;
2108   case ISD::SIGN_EXTEND_INREG: {
2109     EVT EVT = cast<VTSDNode>(Op.getOperand(1))->getVT();
2110     unsigned EBits = EVT.getScalarType().getSizeInBits();
2111
2112     // Sign extension.  Compute the demanded bits in the result that are not
2113     // present in the input.
2114     APInt NewBits = APInt::getHighBitsSet(BitWidth, BitWidth - EBits);
2115
2116     APInt InSignBit = APInt::getSignBit(EBits);
2117     APInt InputDemandedBits = APInt::getLowBitsSet(BitWidth, EBits);
2118
2119     // If the sign extended bits are demanded, we know that the sign
2120     // bit is demanded.
2121     InSignBit = InSignBit.zext(BitWidth);
2122     if (NewBits.getBoolValue())
2123       InputDemandedBits |= InSignBit;
2124
2125     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2126     KnownOne &= InputDemandedBits;
2127     KnownZero &= InputDemandedBits;
2128
2129     // If the sign bit of the input is known set or clear, then we know the
2130     // top bits of the result.
2131     if (KnownZero.intersects(InSignBit)) {         // Input sign bit known clear
2132       KnownZero |= NewBits;
2133       KnownOne  &= ~NewBits;
2134     } else if (KnownOne.intersects(InSignBit)) {   // Input sign bit known set
2135       KnownOne  |= NewBits;
2136       KnownZero &= ~NewBits;
2137     } else {                              // Input sign bit unknown
2138       KnownZero &= ~NewBits;
2139       KnownOne  &= ~NewBits;
2140     }
2141     break;
2142   }
2143   case ISD::CTTZ:
2144   case ISD::CTTZ_ZERO_UNDEF:
2145   case ISD::CTLZ:
2146   case ISD::CTLZ_ZERO_UNDEF:
2147   case ISD::CTPOP: {
2148     unsigned LowBits = Log2_32(BitWidth)+1;
2149     KnownZero = APInt::getHighBitsSet(BitWidth, BitWidth - LowBits);
2150     KnownOne.clearAllBits();
2151     break;
2152   }
2153   case ISD::LOAD: {
2154     LoadSDNode *LD = cast<LoadSDNode>(Op);
2155     // If this is a ZEXTLoad and we are looking at the loaded value.
2156     if (ISD::isZEXTLoad(Op.getNode()) && Op.getResNo() == 0) {
2157       EVT VT = LD->getMemoryVT();
2158       unsigned MemBits = VT.getScalarType().getSizeInBits();
2159       KnownZero |= APInt::getHighBitsSet(BitWidth, BitWidth - MemBits);
2160     } else if (const MDNode *Ranges = LD->getRanges()) {
2161       computeKnownBitsFromRangeMetadata(*Ranges, KnownZero);
2162     }
2163     break;
2164   }
2165   case ISD::ZERO_EXTEND: {
2166     EVT InVT = Op.getOperand(0).getValueType();
2167     unsigned InBits = InVT.getScalarType().getSizeInBits();
2168     APInt NewBits   = APInt::getHighBitsSet(BitWidth, BitWidth - InBits);
2169     KnownZero = KnownZero.trunc(InBits);
2170     KnownOne = KnownOne.trunc(InBits);
2171     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2172     KnownZero = KnownZero.zext(BitWidth);
2173     KnownOne = KnownOne.zext(BitWidth);
2174     KnownZero |= NewBits;
2175     break;
2176   }
2177   case ISD::SIGN_EXTEND: {
2178     EVT InVT = Op.getOperand(0).getValueType();
2179     unsigned InBits = InVT.getScalarType().getSizeInBits();
2180     APInt NewBits   = APInt::getHighBitsSet(BitWidth, BitWidth - InBits);
2181
2182     KnownZero = KnownZero.trunc(InBits);
2183     KnownOne = KnownOne.trunc(InBits);
2184     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2185
2186     // Note if the sign bit is known to be zero or one.
2187     bool SignBitKnownZero = KnownZero.isNegative();
2188     bool SignBitKnownOne  = KnownOne.isNegative();
2189
2190     KnownZero = KnownZero.zext(BitWidth);
2191     KnownOne = KnownOne.zext(BitWidth);
2192
2193     // If the sign bit is known zero or one, the top bits match.
2194     if (SignBitKnownZero)
2195       KnownZero |= NewBits;
2196     else if (SignBitKnownOne)
2197       KnownOne  |= NewBits;
2198     break;
2199   }
2200   case ISD::ANY_EXTEND: {
2201     EVT InVT = Op.getOperand(0).getValueType();
2202     unsigned InBits = InVT.getScalarType().getSizeInBits();
2203     KnownZero = KnownZero.trunc(InBits);
2204     KnownOne = KnownOne.trunc(InBits);
2205     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2206     KnownZero = KnownZero.zext(BitWidth);
2207     KnownOne = KnownOne.zext(BitWidth);
2208     break;
2209   }
2210   case ISD::TRUNCATE: {
2211     EVT InVT = Op.getOperand(0).getValueType();
2212     unsigned InBits = InVT.getScalarType().getSizeInBits();
2213     KnownZero = KnownZero.zext(InBits);
2214     KnownOne = KnownOne.zext(InBits);
2215     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2216     KnownZero = KnownZero.trunc(BitWidth);
2217     KnownOne = KnownOne.trunc(BitWidth);
2218     break;
2219   }
2220   case ISD::AssertZext: {
2221     EVT VT = cast<VTSDNode>(Op.getOperand(1))->getVT();
2222     APInt InMask = APInt::getLowBitsSet(BitWidth, VT.getSizeInBits());
2223     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2224     KnownZero |= (~InMask);
2225     KnownOne  &= (~KnownZero);
2226     break;
2227   }
2228   case ISD::FGETSIGN:
2229     // All bits are zero except the low bit.
2230     KnownZero = APInt::getHighBitsSet(BitWidth, BitWidth - 1);
2231     break;
2232
2233   case ISD::SUB: {
2234     if (ConstantSDNode *CLHS = dyn_cast<ConstantSDNode>(Op.getOperand(0))) {
2235       // We know that the top bits of C-X are clear if X contains less bits
2236       // than C (i.e. no wrap-around can happen).  For example, 20-X is
2237       // positive if we can prove that X is >= 0 and < 16.
2238       if (CLHS->getAPIntValue().isNonNegative()) {
2239         unsigned NLZ = (CLHS->getAPIntValue()+1).countLeadingZeros();
2240         // NLZ can't be BitWidth with no sign bit
2241         APInt MaskV = APInt::getHighBitsSet(BitWidth, NLZ+1);
2242         computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2243
2244         // If all of the MaskV bits are known to be zero, then we know the
2245         // output top bits are zero, because we now know that the output is
2246         // from [0-C].
2247         if ((KnownZero2 & MaskV) == MaskV) {
2248           unsigned NLZ2 = CLHS->getAPIntValue().countLeadingZeros();
2249           // Top bits known zero.
2250           KnownZero = APInt::getHighBitsSet(BitWidth, NLZ2);
2251         }
2252       }
2253     }
2254   }
2255   // fall through
2256   case ISD::ADD:
2257   case ISD::ADDE: {
2258     // Output known-0 bits are known if clear or set in both the low clear bits
2259     // common to both LHS & RHS.  For example, 8+(X<<3) is known to have the
2260     // low 3 bits clear.
2261     computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth+1);
2262     unsigned KnownZeroOut = KnownZero2.countTrailingOnes();
2263
2264     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2265     KnownZeroOut = std::min(KnownZeroOut,
2266                             KnownZero2.countTrailingOnes());
2267
2268     if (Op.getOpcode() == ISD::ADD) {
2269       KnownZero |= APInt::getLowBitsSet(BitWidth, KnownZeroOut);
2270       break;
2271     }
2272
2273     // With ADDE, a carry bit may be added in, so we can only use this
2274     // information if we know (at least) that the low two bits are clear.  We
2275     // then return to the caller that the low bit is unknown but that other bits
2276     // are known zero.
2277     if (KnownZeroOut >= 2) // ADDE
2278       KnownZero |= APInt::getBitsSet(BitWidth, 1, KnownZeroOut);
2279     break;
2280   }
2281   case ISD::SREM:
2282     if (ConstantSDNode *Rem = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2283       const APInt &RA = Rem->getAPIntValue().abs();
2284       if (RA.isPowerOf2()) {
2285         APInt LowBits = RA - 1;
2286         computeKnownBits(Op.getOperand(0), KnownZero2,KnownOne2,Depth+1);
2287
2288         // The low bits of the first operand are unchanged by the srem.
2289         KnownZero = KnownZero2 & LowBits;
2290         KnownOne = KnownOne2 & LowBits;
2291
2292         // If the first operand is non-negative or has all low bits zero, then
2293         // the upper bits are all zero.
2294         if (KnownZero2[BitWidth-1] || ((KnownZero2 & LowBits) == LowBits))
2295           KnownZero |= ~LowBits;
2296
2297         // If the first operand is negative and not all low bits are zero, then
2298         // the upper bits are all one.
2299         if (KnownOne2[BitWidth-1] && ((KnownOne2 & LowBits) != 0))
2300           KnownOne |= ~LowBits;
2301         assert((KnownZero & KnownOne) == 0&&"Bits known to be one AND zero?");
2302       }
2303     }
2304     break;
2305   case ISD::UREM: {
2306     if (ConstantSDNode *Rem = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2307       const APInt &RA = Rem->getAPIntValue();
2308       if (RA.isPowerOf2()) {
2309         APInt LowBits = (RA - 1);
2310         computeKnownBits(Op.getOperand(0), KnownZero2, KnownOne2, Depth + 1);
2311
2312         // The upper bits are all zero, the lower ones are unchanged.
2313         KnownZero = KnownZero2 | ~LowBits;
2314         KnownOne = KnownOne2 & LowBits;
2315         break;
2316       }
2317     }
2318
2319     // Since the result is less than or equal to either operand, any leading
2320     // zero bits in either operand must also exist in the result.
2321     computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2322     computeKnownBits(Op.getOperand(1), KnownZero2, KnownOne2, Depth+1);
2323
2324     uint32_t Leaders = std::max(KnownZero.countLeadingOnes(),
2325                                 KnownZero2.countLeadingOnes());
2326     KnownOne.clearAllBits();
2327     KnownZero = APInt::getHighBitsSet(BitWidth, Leaders);
2328     break;
2329   }
2330   case ISD::FrameIndex:
2331   case ISD::TargetFrameIndex:
2332     if (unsigned Align = InferPtrAlignment(Op)) {
2333       // The low bits are known zero if the pointer is aligned.
2334       KnownZero = APInt::getLowBitsSet(BitWidth, Log2_32(Align));
2335       break;
2336     }
2337     break;
2338
2339   default:
2340     if (Op.getOpcode() < ISD::BUILTIN_OP_END)
2341       break;
2342     // Fallthrough
2343   case ISD::INTRINSIC_WO_CHAIN:
2344   case ISD::INTRINSIC_W_CHAIN:
2345   case ISD::INTRINSIC_VOID:
2346     // Allow the target to implement this method for its nodes.
2347     TLI->computeKnownBitsForTargetNode(Op, KnownZero, KnownOne, *this, Depth);
2348     break;
2349   }
2350
2351   assert((KnownZero & KnownOne) == 0 && "Bits known to be one AND zero?");
2352 }
2353
2354 /// ComputeNumSignBits - Return the number of times the sign bit of the
2355 /// register is replicated into the other bits.  We know that at least 1 bit
2356 /// is always equal to the sign bit (itself), but other cases can give us
2357 /// information.  For example, immediately after an "SRA X, 2", we know that
2358 /// the top 3 bits are all equal to each other, so we return 3.
2359 unsigned SelectionDAG::ComputeNumSignBits(SDValue Op, unsigned Depth) const{
2360   const TargetLowering *TLI = TM.getTargetLowering();
2361   EVT VT = Op.getValueType();
2362   assert(VT.isInteger() && "Invalid VT!");
2363   unsigned VTBits = VT.getScalarType().getSizeInBits();
2364   unsigned Tmp, Tmp2;
2365   unsigned FirstAnswer = 1;
2366
2367   if (Depth == 6)
2368     return 1;  // Limit search depth.
2369
2370   switch (Op.getOpcode()) {
2371   default: break;
2372   case ISD::AssertSext:
2373     Tmp = cast<VTSDNode>(Op.getOperand(1))->getVT().getSizeInBits();
2374     return VTBits-Tmp+1;
2375   case ISD::AssertZext:
2376     Tmp = cast<VTSDNode>(Op.getOperand(1))->getVT().getSizeInBits();
2377     return VTBits-Tmp;
2378
2379   case ISD::Constant: {
2380     const APInt &Val = cast<ConstantSDNode>(Op)->getAPIntValue();
2381     return Val.getNumSignBits();
2382   }
2383
2384   case ISD::SIGN_EXTEND:
2385     Tmp =
2386         VTBits-Op.getOperand(0).getValueType().getScalarType().getSizeInBits();
2387     return ComputeNumSignBits(Op.getOperand(0), Depth+1) + Tmp;
2388
2389   case ISD::SIGN_EXTEND_INREG:
2390     // Max of the input and what this extends.
2391     Tmp =
2392       cast<VTSDNode>(Op.getOperand(1))->getVT().getScalarType().getSizeInBits();
2393     Tmp = VTBits-Tmp+1;
2394
2395     Tmp2 = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2396     return std::max(Tmp, Tmp2);
2397
2398   case ISD::SRA:
2399     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2400     // SRA X, C   -> adds C sign bits.
2401     if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2402       Tmp += C->getZExtValue();
2403       if (Tmp > VTBits) Tmp = VTBits;
2404     }
2405     return Tmp;
2406   case ISD::SHL:
2407     if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2408       // shl destroys sign bits.
2409       Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2410       if (C->getZExtValue() >= VTBits ||      // Bad shift.
2411           C->getZExtValue() >= Tmp) break;    // Shifted all sign bits out.
2412       return Tmp - C->getZExtValue();
2413     }
2414     break;
2415   case ISD::AND:
2416   case ISD::OR:
2417   case ISD::XOR:    // NOT is handled here.
2418     // Logical binary ops preserve the number of sign bits at the worst.
2419     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2420     if (Tmp != 1) {
2421       Tmp2 = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2422       FirstAnswer = std::min(Tmp, Tmp2);
2423       // We computed what we know about the sign bits as our first
2424       // answer. Now proceed to the generic code that uses
2425       // computeKnownBits, and pick whichever answer is better.
2426     }
2427     break;
2428
2429   case ISD::SELECT:
2430     Tmp = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2431     if (Tmp == 1) return 1;  // Early out.
2432     Tmp2 = ComputeNumSignBits(Op.getOperand(2), Depth+1);
2433     return std::min(Tmp, Tmp2);
2434
2435   case ISD::SADDO:
2436   case ISD::UADDO:
2437   case ISD::SSUBO:
2438   case ISD::USUBO:
2439   case ISD::SMULO:
2440   case ISD::UMULO:
2441     if (Op.getResNo() != 1)
2442       break;
2443     // The boolean result conforms to getBooleanContents.  Fall through.
2444     // If setcc returns 0/-1, all bits are sign bits.
2445     // We know that we have an integer-based boolean since these operations
2446     // are only available for integer.
2447     if (TLI->getBooleanContents(Op.getValueType().isVector(), false) ==
2448         TargetLowering::ZeroOrNegativeOneBooleanContent)
2449       return VTBits;
2450     break;
2451   case ISD::SETCC:
2452     // If setcc returns 0/-1, all bits are sign bits.
2453     if (TLI->getBooleanContents(Op.getOperand(0).getValueType()) ==
2454         TargetLowering::ZeroOrNegativeOneBooleanContent)
2455       return VTBits;
2456     break;
2457   case ISD::ROTL:
2458   case ISD::ROTR:
2459     if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
2460       unsigned RotAmt = C->getZExtValue() & (VTBits-1);
2461
2462       // Handle rotate right by N like a rotate left by 32-N.
2463       if (Op.getOpcode() == ISD::ROTR)
2464         RotAmt = (VTBits-RotAmt) & (VTBits-1);
2465
2466       // If we aren't rotating out all of the known-in sign bits, return the
2467       // number that are left.  This handles rotl(sext(x), 1) for example.
2468       Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2469       if (Tmp > RotAmt+1) return Tmp-RotAmt;
2470     }
2471     break;
2472   case ISD::ADD:
2473     // Add can have at most one carry bit.  Thus we know that the output
2474     // is, at worst, one more bit than the inputs.
2475     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2476     if (Tmp == 1) return 1;  // Early out.
2477
2478     // Special case decrementing a value (ADD X, -1):
2479     if (ConstantSDNode *CRHS = dyn_cast<ConstantSDNode>(Op.getOperand(1)))
2480       if (CRHS->isAllOnesValue()) {
2481         APInt KnownZero, KnownOne;
2482         computeKnownBits(Op.getOperand(0), KnownZero, KnownOne, Depth+1);
2483
2484         // If the input is known to be 0 or 1, the output is 0/-1, which is all
2485         // sign bits set.
2486         if ((KnownZero | APInt(VTBits, 1)).isAllOnesValue())
2487           return VTBits;
2488
2489         // If we are subtracting one from a positive number, there is no carry
2490         // out of the result.
2491         if (KnownZero.isNegative())
2492           return Tmp;
2493       }
2494
2495     Tmp2 = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2496     if (Tmp2 == 1) return 1;
2497     return std::min(Tmp, Tmp2)-1;
2498
2499   case ISD::SUB:
2500     Tmp2 = ComputeNumSignBits(Op.getOperand(1), Depth+1);
2501     if (Tmp2 == 1) return 1;
2502
2503     // Handle NEG.
2504     if (ConstantSDNode *CLHS = dyn_cast<ConstantSDNode>(Op.getOperand(0)))
2505       if (CLHS->isNullValue()) {
2506         APInt KnownZero, KnownOne;
2507         computeKnownBits(Op.getOperand(1), KnownZero, KnownOne, Depth+1);
2508         // If the input is known to be 0 or 1, the output is 0/-1, which is all
2509         // sign bits set.
2510         if ((KnownZero | APInt(VTBits, 1)).isAllOnesValue())
2511           return VTBits;
2512
2513         // If the input is known to be positive (the sign bit is known clear),
2514         // the output of the NEG has the same number of sign bits as the input.
2515         if (KnownZero.isNegative())
2516           return Tmp2;
2517
2518         // Otherwise, we treat this like a SUB.
2519       }
2520
2521     // Sub can have at most one carry bit.  Thus we know that the output
2522     // is, at worst, one more bit than the inputs.
2523     Tmp = ComputeNumSignBits(Op.getOperand(0), Depth+1);
2524     if (Tmp == 1) return 1;  // Early out.
2525     return std::min(Tmp, Tmp2)-1;
2526   case ISD::TRUNCATE:
2527     // FIXME: it's tricky to do anything useful for this, but it is an important
2528     // case for targets like X86.
2529     break;
2530   }
2531
2532   // If we are looking at the loaded value of the SDNode.
2533   if (Op.getResNo() == 0) {
2534     // Handle LOADX separately here. EXTLOAD case will fallthrough.
2535     if (LoadSDNode *LD = dyn_cast<LoadSDNode>(Op)) {
2536       unsigned ExtType = LD->getExtensionType();
2537       switch (ExtType) {
2538         default: break;
2539         case ISD::SEXTLOAD:    // '17' bits known
2540           Tmp = LD->getMemoryVT().getScalarType().getSizeInBits();
2541           return VTBits-Tmp+1;
2542         case ISD::ZEXTLOAD:    // '16' bits known
2543           Tmp = LD->getMemoryVT().getScalarType().getSizeInBits();
2544           return VTBits-Tmp;
2545       }
2546     }
2547   }
2548
2549   // Allow the target to implement this method for its nodes.
2550   if (Op.getOpcode() >= ISD::BUILTIN_OP_END ||
2551       Op.getOpcode() == ISD::INTRINSIC_WO_CHAIN ||
2552       Op.getOpcode() == ISD::INTRINSIC_W_CHAIN ||
2553       Op.getOpcode() == ISD::INTRINSIC_VOID) {
2554     unsigned NumBits = TLI->ComputeNumSignBitsForTargetNode(Op, *this, Depth);
2555     if (NumBits > 1) FirstAnswer = std::max(FirstAnswer, NumBits);
2556   }
2557
2558   // Finally, if we can prove that the top bits of the result are 0's or 1's,
2559   // use this information.
2560   APInt KnownZero, KnownOne;
2561   computeKnownBits(Op, KnownZero, KnownOne, Depth);
2562
2563   APInt Mask;
2564   if (KnownZero.isNegative()) {        // sign bit is 0
2565     Mask = KnownZero;
2566   } else if (KnownOne.isNegative()) {  // sign bit is 1;
2567     Mask = KnownOne;
2568   } else {
2569     // Nothing known.
2570     return FirstAnswer;
2571   }
2572
2573   // Okay, we know that the sign bit in Mask is set.  Use CLZ to determine
2574   // the number of identical bits in the top of the input value.
2575   Mask = ~Mask;
2576   Mask <<= Mask.getBitWidth()-VTBits;
2577   // Return # leading zeros.  We use 'min' here in case Val was zero before
2578   // shifting.  We don't want to return '64' as for an i32 "0".
2579   return std::max(FirstAnswer, std::min(VTBits, Mask.countLeadingZeros()));
2580 }
2581
2582 /// isBaseWithConstantOffset - Return true if the specified operand is an
2583 /// ISD::ADD with a ConstantSDNode on the right-hand side, or if it is an
2584 /// ISD::OR with a ConstantSDNode that is guaranteed to have the same
2585 /// semantics as an ADD.  This handles the equivalence:
2586 ///     X|Cst == X+Cst iff X&Cst = 0.
2587 bool SelectionDAG::isBaseWithConstantOffset(SDValue Op) const {
2588   if ((Op.getOpcode() != ISD::ADD && Op.getOpcode() != ISD::OR) ||
2589       !isa<ConstantSDNode>(Op.getOperand(1)))
2590     return false;
2591
2592   if (Op.getOpcode() == ISD::OR &&
2593       !MaskedValueIsZero(Op.getOperand(0),
2594                      cast<ConstantSDNode>(Op.getOperand(1))->getAPIntValue()))
2595     return false;
2596
2597   return true;
2598 }
2599
2600
2601 bool SelectionDAG::isKnownNeverNaN(SDValue Op) const {
2602   // If we're told that NaNs won't happen, assume they won't.
2603   if (getTarget().Options.NoNaNsFPMath)
2604     return true;
2605
2606   // If the value is a constant, we can obviously see if it is a NaN or not.
2607   if (const ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Op))
2608     return !C->getValueAPF().isNaN();
2609
2610   // TODO: Recognize more cases here.
2611
2612   return false;
2613 }
2614
2615 bool SelectionDAG::isKnownNeverZero(SDValue Op) const {
2616   // If the value is a constant, we can obviously see if it is a zero or not.
2617   if (const ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Op))
2618     return !C->isZero();
2619
2620   // TODO: Recognize more cases here.
2621   switch (Op.getOpcode()) {
2622   default: break;
2623   case ISD::OR:
2624     if (const ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1)))
2625       return !C->isNullValue();
2626     break;
2627   }
2628
2629   return false;
2630 }
2631
2632 bool SelectionDAG::isEqualTo(SDValue A, SDValue B) const {
2633   // Check the obvious case.
2634   if (A == B) return true;
2635
2636   // For for negative and positive zero.
2637   if (const ConstantFPSDNode *CA = dyn_cast<ConstantFPSDNode>(A))
2638     if (const ConstantFPSDNode *CB = dyn_cast<ConstantFPSDNode>(B))
2639       if (CA->isZero() && CB->isZero()) return true;
2640
2641   // Otherwise they may not be equal.
2642   return false;
2643 }
2644
2645 /// getNode - Gets or creates the specified node.
2646 ///
2647 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT) {
2648   FoldingSetNodeID ID;
2649   AddNodeIDNode(ID, Opcode, getVTList(VT), None);
2650   void *IP = nullptr;
2651   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
2652     return SDValue(E, 0);
2653
2654   SDNode *N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(),
2655                                          DL.getDebugLoc(), getVTList(VT));
2656   CSEMap.InsertNode(N, IP);
2657
2658   AllNodes.push_back(N);
2659 #ifndef NDEBUG
2660   VerifySDNode(N);
2661 #endif
2662   return SDValue(N, 0);
2663 }
2664
2665 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL,
2666                               EVT VT, SDValue Operand) {
2667   // Constant fold unary operations with an integer constant operand. Even
2668   // opaque constant will be folded, because the folding of unary operations
2669   // doesn't create new constants with different values. Nevertheless, the
2670   // opaque flag is preserved during folding to prevent future folding with
2671   // other constants.
2672   if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Operand.getNode())) {
2673     const APInt &Val = C->getAPIntValue();
2674     switch (Opcode) {
2675     default: break;
2676     case ISD::SIGN_EXTEND:
2677       return getConstant(Val.sextOrTrunc(VT.getSizeInBits()), VT,
2678                          C->isTargetOpcode(), C->isOpaque());
2679     case ISD::ANY_EXTEND:
2680     case ISD::ZERO_EXTEND:
2681     case ISD::TRUNCATE:
2682       return getConstant(Val.zextOrTrunc(VT.getSizeInBits()), VT,
2683                          C->isTargetOpcode(), C->isOpaque());
2684     case ISD::UINT_TO_FP:
2685     case ISD::SINT_TO_FP: {
2686       APFloat apf(EVTToAPFloatSemantics(VT),
2687                   APInt::getNullValue(VT.getSizeInBits()));
2688       (void)apf.convertFromAPInt(Val,
2689                                  Opcode==ISD::SINT_TO_FP,
2690                                  APFloat::rmNearestTiesToEven);
2691       return getConstantFP(apf, VT);
2692     }
2693     case ISD::BITCAST:
2694       if (VT == MVT::f32 && C->getValueType(0) == MVT::i32)
2695         return getConstantFP(APFloat(APFloat::IEEEsingle, Val), VT);
2696       else if (VT == MVT::f64 && C->getValueType(0) == MVT::i64)
2697         return getConstantFP(APFloat(APFloat::IEEEdouble, Val), VT);
2698       break;
2699     case ISD::BSWAP:
2700       return getConstant(Val.byteSwap(), VT, C->isTargetOpcode(),
2701                          C->isOpaque());
2702     case ISD::CTPOP:
2703       return getConstant(Val.countPopulation(), VT, C->isTargetOpcode(),
2704                          C->isOpaque());
2705     case ISD::CTLZ:
2706     case ISD::CTLZ_ZERO_UNDEF:
2707       return getConstant(Val.countLeadingZeros(), VT, C->isTargetOpcode(),
2708                          C->isOpaque());
2709     case ISD::CTTZ:
2710     case ISD::CTTZ_ZERO_UNDEF:
2711       return getConstant(Val.countTrailingZeros(), VT, C->isTargetOpcode(),
2712                          C->isOpaque());
2713     }
2714   }
2715
2716   // Constant fold unary operations with a floating point constant operand.
2717   if (ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Operand.getNode())) {
2718     APFloat V = C->getValueAPF();    // make copy
2719     switch (Opcode) {
2720     case ISD::FNEG:
2721       V.changeSign();
2722       return getConstantFP(V, VT);
2723     case ISD::FABS:
2724       V.clearSign();
2725       return getConstantFP(V, VT);
2726     case ISD::FCEIL: {
2727       APFloat::opStatus fs = V.roundToIntegral(APFloat::rmTowardPositive);
2728       if (fs == APFloat::opOK || fs == APFloat::opInexact)
2729         return getConstantFP(V, VT);
2730       break;
2731     }
2732     case ISD::FTRUNC: {
2733       APFloat::opStatus fs = V.roundToIntegral(APFloat::rmTowardZero);
2734       if (fs == APFloat::opOK || fs == APFloat::opInexact)
2735         return getConstantFP(V, VT);
2736       break;
2737     }
2738     case ISD::FFLOOR: {
2739       APFloat::opStatus fs = V.roundToIntegral(APFloat::rmTowardNegative);
2740       if (fs == APFloat::opOK || fs == APFloat::opInexact)
2741         return getConstantFP(V, VT);
2742       break;
2743     }
2744     case ISD::FP_EXTEND: {
2745       bool ignored;
2746       // This can return overflow, underflow, or inexact; we don't care.
2747       // FIXME need to be more flexible about rounding mode.
2748       (void)V.convert(EVTToAPFloatSemantics(VT),
2749                       APFloat::rmNearestTiesToEven, &ignored);
2750       return getConstantFP(V, VT);
2751     }
2752     case ISD::FP_TO_SINT:
2753     case ISD::FP_TO_UINT: {
2754       integerPart x[2];
2755       bool ignored;
2756       assert(integerPartWidth >= 64);
2757       // FIXME need to be more flexible about rounding mode.
2758       APFloat::opStatus s = V.convertToInteger(x, VT.getSizeInBits(),
2759                             Opcode==ISD::FP_TO_SINT,
2760                             APFloat::rmTowardZero, &ignored);
2761       if (s==APFloat::opInvalidOp)     // inexact is OK, in fact usual
2762         break;
2763       APInt api(VT.getSizeInBits(), x);
2764       return getConstant(api, VT);
2765     }
2766     case ISD::BITCAST:
2767       if (VT == MVT::i32 && C->getValueType(0) == MVT::f32)
2768         return getConstant((uint32_t)V.bitcastToAPInt().getZExtValue(), VT);
2769       else if (VT == MVT::i64 && C->getValueType(0) == MVT::f64)
2770         return getConstant(V.bitcastToAPInt().getZExtValue(), VT);
2771       break;
2772     }
2773   }
2774
2775   unsigned OpOpcode = Operand.getNode()->getOpcode();
2776   switch (Opcode) {
2777   case ISD::TokenFactor:
2778   case ISD::MERGE_VALUES:
2779   case ISD::CONCAT_VECTORS:
2780     return Operand;         // Factor, merge or concat of one node?  No need.
2781   case ISD::FP_ROUND: llvm_unreachable("Invalid method to make FP_ROUND node");
2782   case ISD::FP_EXTEND:
2783     assert(VT.isFloatingPoint() &&
2784            Operand.getValueType().isFloatingPoint() && "Invalid FP cast!");
2785     if (Operand.getValueType() == VT) return Operand;  // noop conversion.
2786     assert((!VT.isVector() ||
2787             VT.getVectorNumElements() ==
2788             Operand.getValueType().getVectorNumElements()) &&
2789            "Vector element count mismatch!");
2790     if (Operand.getOpcode() == ISD::UNDEF)
2791       return getUNDEF(VT);
2792     break;
2793   case ISD::SIGN_EXTEND:
2794     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
2795            "Invalid SIGN_EXTEND!");
2796     if (Operand.getValueType() == VT) return Operand;   // noop extension
2797     assert(Operand.getValueType().getScalarType().bitsLT(VT.getScalarType()) &&
2798            "Invalid sext node, dst < src!");
2799     assert((!VT.isVector() ||
2800             VT.getVectorNumElements() ==
2801             Operand.getValueType().getVectorNumElements()) &&
2802            "Vector element count mismatch!");
2803     if (OpOpcode == ISD::SIGN_EXTEND || OpOpcode == ISD::ZERO_EXTEND)
2804       return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
2805     else if (OpOpcode == ISD::UNDEF)
2806       // sext(undef) = 0, because the top bits will all be the same.
2807       return getConstant(0, VT);
2808     break;
2809   case ISD::ZERO_EXTEND:
2810     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
2811            "Invalid ZERO_EXTEND!");
2812     if (Operand.getValueType() == VT) return Operand;   // noop extension
2813     assert(Operand.getValueType().getScalarType().bitsLT(VT.getScalarType()) &&
2814            "Invalid zext node, dst < src!");
2815     assert((!VT.isVector() ||
2816             VT.getVectorNumElements() ==
2817             Operand.getValueType().getVectorNumElements()) &&
2818            "Vector element count mismatch!");
2819     if (OpOpcode == ISD::ZERO_EXTEND)   // (zext (zext x)) -> (zext x)
2820       return getNode(ISD::ZERO_EXTEND, DL, VT,
2821                      Operand.getNode()->getOperand(0));
2822     else if (OpOpcode == ISD::UNDEF)
2823       // zext(undef) = 0, because the top bits will be zero.
2824       return getConstant(0, VT);
2825     break;
2826   case ISD::ANY_EXTEND:
2827     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
2828            "Invalid ANY_EXTEND!");
2829     if (Operand.getValueType() == VT) return Operand;   // noop extension
2830     assert(Operand.getValueType().getScalarType().bitsLT(VT.getScalarType()) &&
2831            "Invalid anyext node, dst < src!");
2832     assert((!VT.isVector() ||
2833             VT.getVectorNumElements() ==
2834             Operand.getValueType().getVectorNumElements()) &&
2835            "Vector element count mismatch!");
2836
2837     if (OpOpcode == ISD::ZERO_EXTEND || OpOpcode == ISD::SIGN_EXTEND ||
2838         OpOpcode == ISD::ANY_EXTEND)
2839       // (ext (zext x)) -> (zext x)  and  (ext (sext x)) -> (sext x)
2840       return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
2841     else if (OpOpcode == ISD::UNDEF)
2842       return getUNDEF(VT);
2843
2844     // (ext (trunx x)) -> x
2845     if (OpOpcode == ISD::TRUNCATE) {
2846       SDValue OpOp = Operand.getNode()->getOperand(0);
2847       if (OpOp.getValueType() == VT)
2848         return OpOp;
2849     }
2850     break;
2851   case ISD::TRUNCATE:
2852     assert(VT.isInteger() && Operand.getValueType().isInteger() &&
2853            "Invalid TRUNCATE!");
2854     if (Operand.getValueType() == VT) return Operand;   // noop truncate
2855     assert(Operand.getValueType().getScalarType().bitsGT(VT.getScalarType()) &&
2856            "Invalid truncate node, src < dst!");
2857     assert((!VT.isVector() ||
2858             VT.getVectorNumElements() ==
2859             Operand.getValueType().getVectorNumElements()) &&
2860            "Vector element count mismatch!");
2861     if (OpOpcode == ISD::TRUNCATE)
2862       return getNode(ISD::TRUNCATE, DL, VT, Operand.getNode()->getOperand(0));
2863     if (OpOpcode == ISD::ZERO_EXTEND || OpOpcode == ISD::SIGN_EXTEND ||
2864         OpOpcode == ISD::ANY_EXTEND) {
2865       // If the source is smaller than the dest, we still need an extend.
2866       if (Operand.getNode()->getOperand(0).getValueType().getScalarType()
2867             .bitsLT(VT.getScalarType()))
2868         return getNode(OpOpcode, DL, VT, Operand.getNode()->getOperand(0));
2869       if (Operand.getNode()->getOperand(0).getValueType().bitsGT(VT))
2870         return getNode(ISD::TRUNCATE, DL, VT, Operand.getNode()->getOperand(0));
2871       return Operand.getNode()->getOperand(0);
2872     }
2873     if (OpOpcode == ISD::UNDEF)
2874       return getUNDEF(VT);
2875     break;
2876   case ISD::BITCAST:
2877     // Basic sanity checking.
2878     assert(VT.getSizeInBits() == Operand.getValueType().getSizeInBits()
2879            && "Cannot BITCAST between types of different sizes!");
2880     if (VT == Operand.getValueType()) return Operand;  // noop conversion.
2881     if (OpOpcode == ISD::BITCAST)  // bitconv(bitconv(x)) -> bitconv(x)
2882       return getNode(ISD::BITCAST, DL, VT, Operand.getOperand(0));
2883     if (OpOpcode == ISD::UNDEF)
2884       return getUNDEF(VT);
2885     break;
2886   case ISD::SCALAR_TO_VECTOR:
2887     assert(VT.isVector() && !Operand.getValueType().isVector() &&
2888            (VT.getVectorElementType() == Operand.getValueType() ||
2889             (VT.getVectorElementType().isInteger() &&
2890              Operand.getValueType().isInteger() &&
2891              VT.getVectorElementType().bitsLE(Operand.getValueType()))) &&
2892            "Illegal SCALAR_TO_VECTOR node!");
2893     if (OpOpcode == ISD::UNDEF)
2894       return getUNDEF(VT);
2895     // scalar_to_vector(extract_vector_elt V, 0) -> V, top bits are undefined.
2896     if (OpOpcode == ISD::EXTRACT_VECTOR_ELT &&
2897         isa<ConstantSDNode>(Operand.getOperand(1)) &&
2898         Operand.getConstantOperandVal(1) == 0 &&
2899         Operand.getOperand(0).getValueType() == VT)
2900       return Operand.getOperand(0);
2901     break;
2902   case ISD::FNEG:
2903     // -(X-Y) -> (Y-X) is unsafe because when X==Y, -0.0 != +0.0
2904     if (getTarget().Options.UnsafeFPMath && OpOpcode == ISD::FSUB)
2905       return getNode(ISD::FSUB, DL, VT, Operand.getNode()->getOperand(1),
2906                      Operand.getNode()->getOperand(0));
2907     if (OpOpcode == ISD::FNEG)  // --X -> X
2908       return Operand.getNode()->getOperand(0);
2909     break;
2910   case ISD::FABS:
2911     if (OpOpcode == ISD::FNEG)  // abs(-X) -> abs(X)
2912       return getNode(ISD::FABS, DL, VT, Operand.getNode()->getOperand(0));
2913     break;
2914   }
2915
2916   SDNode *N;
2917   SDVTList VTs = getVTList(VT);
2918   if (VT != MVT::Glue) { // Don't CSE flag producing nodes
2919     FoldingSetNodeID ID;
2920     SDValue Ops[1] = { Operand };
2921     AddNodeIDNode(ID, Opcode, VTs, Ops);
2922     void *IP = nullptr;
2923     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
2924       return SDValue(E, 0);
2925
2926     N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
2927                                         DL.getDebugLoc(), VTs, Operand);
2928     CSEMap.InsertNode(N, IP);
2929   } else {
2930     N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
2931                                         DL.getDebugLoc(), VTs, Operand);
2932   }
2933
2934   AllNodes.push_back(N);
2935 #ifndef NDEBUG
2936   VerifySDNode(N);
2937 #endif
2938   return SDValue(N, 0);
2939 }
2940
2941 SDValue SelectionDAG::FoldConstantArithmetic(unsigned Opcode, EVT VT,
2942                                              SDNode *Cst1, SDNode *Cst2) {
2943   // If the opcode is a target-specific ISD node, there's nothing we can
2944   // do here and the operand rules may not line up with the below, so
2945   // bail early.
2946   if (Opcode >= ISD::BUILTIN_OP_END)
2947     return SDValue();
2948
2949   SmallVector<std::pair<ConstantSDNode *, ConstantSDNode *>, 4> Inputs;
2950   SmallVector<SDValue, 4> Outputs;
2951   EVT SVT = VT.getScalarType();
2952
2953   ConstantSDNode *Scalar1 = dyn_cast<ConstantSDNode>(Cst1);
2954   ConstantSDNode *Scalar2 = dyn_cast<ConstantSDNode>(Cst2);
2955   if (Scalar1 && Scalar2 && (Scalar1->isOpaque() || Scalar2->isOpaque()))
2956     return SDValue();
2957
2958   if (Scalar1 && Scalar2)
2959     // Scalar instruction.
2960     Inputs.push_back(std::make_pair(Scalar1, Scalar2));
2961   else {
2962     // For vectors extract each constant element into Inputs so we can constant
2963     // fold them individually.
2964     BuildVectorSDNode *BV1 = dyn_cast<BuildVectorSDNode>(Cst1);
2965     BuildVectorSDNode *BV2 = dyn_cast<BuildVectorSDNode>(Cst2);
2966     if (!BV1 || !BV2)
2967       return SDValue();
2968
2969     assert(BV1->getNumOperands() == BV2->getNumOperands() && "Out of sync!");
2970
2971     for (unsigned I = 0, E = BV1->getNumOperands(); I != E; ++I) {
2972       ConstantSDNode *V1 = dyn_cast<ConstantSDNode>(BV1->getOperand(I));
2973       ConstantSDNode *V2 = dyn_cast<ConstantSDNode>(BV2->getOperand(I));
2974       if (!V1 || !V2) // Not a constant, bail.
2975         return SDValue();
2976
2977       if (V1->isOpaque() || V2->isOpaque())
2978         return SDValue();
2979
2980       // Avoid BUILD_VECTOR nodes that perform implicit truncation.
2981       // FIXME: This is valid and could be handled by truncating the APInts.
2982       if (V1->getValueType(0) != SVT || V2->getValueType(0) != SVT)
2983         return SDValue();
2984
2985       Inputs.push_back(std::make_pair(V1, V2));
2986     }
2987   }
2988
2989   // We have a number of constant values, constant fold them element by element.
2990   for (unsigned I = 0, E = Inputs.size(); I != E; ++I) {
2991     const APInt &C1 = Inputs[I].first->getAPIntValue();
2992     const APInt &C2 = Inputs[I].second->getAPIntValue();
2993
2994     switch (Opcode) {
2995     case ISD::ADD:
2996       Outputs.push_back(getConstant(C1 + C2, SVT));
2997       break;
2998     case ISD::SUB:
2999       Outputs.push_back(getConstant(C1 - C2, SVT));
3000       break;
3001     case ISD::MUL:
3002       Outputs.push_back(getConstant(C1 * C2, SVT));
3003       break;
3004     case ISD::UDIV:
3005       if (!C2.getBoolValue())
3006         return SDValue();
3007       Outputs.push_back(getConstant(C1.udiv(C2), SVT));
3008       break;
3009     case ISD::UREM:
3010       if (!C2.getBoolValue())
3011         return SDValue();
3012       Outputs.push_back(getConstant(C1.urem(C2), SVT));
3013       break;
3014     case ISD::SDIV:
3015       if (!C2.getBoolValue())
3016         return SDValue();
3017       Outputs.push_back(getConstant(C1.sdiv(C2), SVT));
3018       break;
3019     case ISD::SREM:
3020       if (!C2.getBoolValue())
3021         return SDValue();
3022       Outputs.push_back(getConstant(C1.srem(C2), SVT));
3023       break;
3024     case ISD::AND:
3025       Outputs.push_back(getConstant(C1 & C2, SVT));
3026       break;
3027     case ISD::OR:
3028       Outputs.push_back(getConstant(C1 | C2, SVT));
3029       break;
3030     case ISD::XOR:
3031       Outputs.push_back(getConstant(C1 ^ C2, SVT));
3032       break;
3033     case ISD::SHL:
3034       Outputs.push_back(getConstant(C1 << C2, SVT));
3035       break;
3036     case ISD::SRL:
3037       Outputs.push_back(getConstant(C1.lshr(C2), SVT));
3038       break;
3039     case ISD::SRA:
3040       Outputs.push_back(getConstant(C1.ashr(C2), SVT));
3041       break;
3042     case ISD::ROTL:
3043       Outputs.push_back(getConstant(C1.rotl(C2), SVT));
3044       break;
3045     case ISD::ROTR:
3046       Outputs.push_back(getConstant(C1.rotr(C2), SVT));
3047       break;
3048     default:
3049       return SDValue();
3050     }
3051   }
3052
3053   assert((Scalar1 && Scalar2) || (VT.getVectorNumElements() == Outputs.size() &&
3054                                   "Expected a scalar or vector!"));
3055
3056   // Handle the scalar case first.
3057   if (!VT.isVector())
3058     return Outputs.back();
3059
3060   // We may have a vector type but a scalar result. Create a splat.
3061   Outputs.resize(VT.getVectorNumElements(), Outputs.back());
3062
3063   // Build a big vector out of the scalar elements we generated.
3064   return getNode(ISD::BUILD_VECTOR, SDLoc(), VT, Outputs);
3065 }
3066
3067 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT, SDValue N1,
3068                               SDValue N2, bool nuw, bool nsw, bool exact) {
3069   ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1.getNode());
3070   ConstantSDNode *N2C = dyn_cast<ConstantSDNode>(N2.getNode());
3071   switch (Opcode) {
3072   default: break;
3073   case ISD::TokenFactor:
3074     assert(VT == MVT::Other && N1.getValueType() == MVT::Other &&
3075            N2.getValueType() == MVT::Other && "Invalid token factor!");
3076     // Fold trivial token factors.
3077     if (N1.getOpcode() == ISD::EntryToken) return N2;
3078     if (N2.getOpcode() == ISD::EntryToken) return N1;
3079     if (N1 == N2) return N1;
3080     break;
3081   case ISD::CONCAT_VECTORS:
3082     // Concat of UNDEFs is UNDEF.
3083     if (N1.getOpcode() == ISD::UNDEF &&
3084         N2.getOpcode() == ISD::UNDEF)
3085       return getUNDEF(VT);
3086
3087     // A CONCAT_VECTOR with all operands BUILD_VECTOR can be simplified to
3088     // one big BUILD_VECTOR.
3089     if (N1.getOpcode() == ISD::BUILD_VECTOR &&
3090         N2.getOpcode() == ISD::BUILD_VECTOR) {
3091       SmallVector<SDValue, 16> Elts(N1.getNode()->op_begin(),
3092                                     N1.getNode()->op_end());
3093       Elts.append(N2.getNode()->op_begin(), N2.getNode()->op_end());
3094       return getNode(ISD::BUILD_VECTOR, DL, VT, Elts);
3095     }
3096     break;
3097   case ISD::AND:
3098     assert(VT.isInteger() && "This operator does not apply to FP types!");
3099     assert(N1.getValueType() == N2.getValueType() &&
3100            N1.getValueType() == VT && "Binary operator types must match!");
3101     // (X & 0) -> 0.  This commonly occurs when legalizing i64 values, so it's
3102     // worth handling here.
3103     if (N2C && N2C->isNullValue())
3104       return N2;
3105     if (N2C && N2C->isAllOnesValue())  // X & -1 -> X
3106       return N1;
3107     break;
3108   case ISD::OR:
3109   case ISD::XOR:
3110   case ISD::ADD:
3111   case ISD::SUB:
3112     assert(VT.isInteger() && "This operator does not apply to FP types!");
3113     assert(N1.getValueType() == N2.getValueType() &&
3114            N1.getValueType() == VT && "Binary operator types must match!");
3115     // (X ^|+- 0) -> X.  This commonly occurs when legalizing i64 values, so
3116     // it's worth handling here.
3117     if (N2C && N2C->isNullValue())
3118       return N1;
3119     break;
3120   case ISD::UDIV:
3121   case ISD::UREM:
3122   case ISD::MULHU:
3123   case ISD::MULHS:
3124   case ISD::MUL:
3125   case ISD::SDIV:
3126   case ISD::SREM:
3127     assert(VT.isInteger() && "This operator does not apply to FP types!");
3128     assert(N1.getValueType() == N2.getValueType() &&
3129            N1.getValueType() == VT && "Binary operator types must match!");
3130     break;
3131   case ISD::FADD:
3132   case ISD::FSUB:
3133   case ISD::FMUL:
3134   case ISD::FDIV:
3135   case ISD::FREM:
3136     if (getTarget().Options.UnsafeFPMath) {
3137       if (Opcode == ISD::FADD) {
3138         // 0+x --> x
3139         if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N1))
3140           if (CFP->getValueAPF().isZero())
3141             return N2;
3142         // x+0 --> x
3143         if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N2))
3144           if (CFP->getValueAPF().isZero())
3145             return N1;
3146       } else if (Opcode == ISD::FSUB) {
3147         // x-0 --> x
3148         if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N2))
3149           if (CFP->getValueAPF().isZero())
3150             return N1;
3151       } else if (Opcode == ISD::FMUL) {
3152         ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N1);
3153         SDValue V = N2;
3154
3155         // If the first operand isn't the constant, try the second
3156         if (!CFP) {
3157           CFP = dyn_cast<ConstantFPSDNode>(N2);
3158           V = N1;
3159         }
3160
3161         if (CFP) {
3162           // 0*x --> 0
3163           if (CFP->isZero())
3164             return SDValue(CFP,0);
3165           // 1*x --> x
3166           if (CFP->isExactlyValue(1.0))
3167             return V;
3168         }
3169       }
3170     }
3171     assert(VT.isFloatingPoint() && "This operator only applies to FP types!");
3172     assert(N1.getValueType() == N2.getValueType() &&
3173            N1.getValueType() == VT && "Binary operator types must match!");
3174     break;
3175   case ISD::FCOPYSIGN:   // N1 and result must match.  N1/N2 need not match.
3176     assert(N1.getValueType() == VT &&
3177            N1.getValueType().isFloatingPoint() &&
3178            N2.getValueType().isFloatingPoint() &&
3179            "Invalid FCOPYSIGN!");
3180     break;
3181   case ISD::SHL:
3182   case ISD::SRA:
3183   case ISD::SRL:
3184   case ISD::ROTL:
3185   case ISD::ROTR:
3186     assert(VT == N1.getValueType() &&
3187            "Shift operators return type must be the same as their first arg");
3188     assert(VT.isInteger() && N2.getValueType().isInteger() &&
3189            "Shifts only work on integers");
3190     assert((!VT.isVector() || VT == N2.getValueType()) &&
3191            "Vector shift amounts must be in the same as their first arg");
3192     // Verify that the shift amount VT is bit enough to hold valid shift
3193     // amounts.  This catches things like trying to shift an i1024 value by an
3194     // i8, which is easy to fall into in generic code that uses
3195     // TLI.getShiftAmount().
3196     assert(N2.getValueType().getSizeInBits() >=
3197                    Log2_32_Ceil(N1.getValueType().getSizeInBits()) &&
3198            "Invalid use of small shift amount with oversized value!");
3199
3200     // Always fold shifts of i1 values so the code generator doesn't need to
3201     // handle them.  Since we know the size of the shift has to be less than the
3202     // size of the value, the shift/rotate count is guaranteed to be zero.
3203     if (VT == MVT::i1)
3204       return N1;
3205     if (N2C && N2C->isNullValue())
3206       return N1;
3207     break;
3208   case ISD::FP_ROUND_INREG: {
3209     EVT EVT = cast<VTSDNode>(N2)->getVT();
3210     assert(VT == N1.getValueType() && "Not an inreg round!");
3211     assert(VT.isFloatingPoint() && EVT.isFloatingPoint() &&
3212            "Cannot FP_ROUND_INREG integer types");
3213     assert(EVT.isVector() == VT.isVector() &&
3214            "FP_ROUND_INREG type should be vector iff the operand "
3215            "type is vector!");
3216     assert((!EVT.isVector() ||
3217             EVT.getVectorNumElements() == VT.getVectorNumElements()) &&
3218            "Vector element counts must match in FP_ROUND_INREG");
3219     assert(EVT.bitsLE(VT) && "Not rounding down!");
3220     (void)EVT;
3221     if (cast<VTSDNode>(N2)->getVT() == VT) return N1;  // Not actually rounding.
3222     break;
3223   }
3224   case ISD::FP_ROUND:
3225     assert(VT.isFloatingPoint() &&
3226            N1.getValueType().isFloatingPoint() &&
3227            VT.bitsLE(N1.getValueType()) &&
3228            isa<ConstantSDNode>(N2) && "Invalid FP_ROUND!");
3229     if (N1.getValueType() == VT) return N1;  // noop conversion.
3230     break;
3231   case ISD::AssertSext:
3232   case ISD::AssertZext: {
3233     EVT EVT = cast<VTSDNode>(N2)->getVT();
3234     assert(VT == N1.getValueType() && "Not an inreg extend!");
3235     assert(VT.isInteger() && EVT.isInteger() &&
3236            "Cannot *_EXTEND_INREG FP types");
3237     assert(!EVT.isVector() &&
3238            "AssertSExt/AssertZExt type should be the vector element type "
3239            "rather than the vector type!");
3240     assert(EVT.bitsLE(VT) && "Not extending!");
3241     if (VT == EVT) return N1; // noop assertion.
3242     break;
3243   }
3244   case ISD::SIGN_EXTEND_INREG: {
3245     EVT EVT = cast<VTSDNode>(N2)->getVT();
3246     assert(VT == N1.getValueType() && "Not an inreg extend!");
3247     assert(VT.isInteger() && EVT.isInteger() &&
3248            "Cannot *_EXTEND_INREG FP types");
3249     assert(EVT.isVector() == VT.isVector() &&
3250            "SIGN_EXTEND_INREG type should be vector iff the operand "
3251            "type is vector!");
3252     assert((!EVT.isVector() ||
3253             EVT.getVectorNumElements() == VT.getVectorNumElements()) &&
3254            "Vector element counts must match in SIGN_EXTEND_INREG");
3255     assert(EVT.bitsLE(VT) && "Not extending!");
3256     if (EVT == VT) return N1;  // Not actually extending
3257
3258     if (N1C) {
3259       APInt Val = N1C->getAPIntValue();
3260       unsigned FromBits = EVT.getScalarType().getSizeInBits();
3261       Val <<= Val.getBitWidth()-FromBits;
3262       Val = Val.ashr(Val.getBitWidth()-FromBits);
3263       return getConstant(Val, VT);
3264     }
3265     break;
3266   }
3267   case ISD::EXTRACT_VECTOR_ELT:
3268     // EXTRACT_VECTOR_ELT of an UNDEF is an UNDEF.
3269     if (N1.getOpcode() == ISD::UNDEF)
3270       return getUNDEF(VT);
3271
3272     // EXTRACT_VECTOR_ELT of CONCAT_VECTORS is often formed while lowering is
3273     // expanding copies of large vectors from registers.
3274     if (N2C &&
3275         N1.getOpcode() == ISD::CONCAT_VECTORS &&
3276         N1.getNumOperands() > 0) {
3277       unsigned Factor =
3278         N1.getOperand(0).getValueType().getVectorNumElements();
3279       return getNode(ISD::EXTRACT_VECTOR_ELT, DL, VT,
3280                      N1.getOperand(N2C->getZExtValue() / Factor),
3281                      getConstant(N2C->getZExtValue() % Factor,
3282                                  N2.getValueType()));
3283     }
3284
3285     // EXTRACT_VECTOR_ELT of BUILD_VECTOR is often formed while lowering is
3286     // expanding large vector constants.
3287     if (N2C && N1.getOpcode() == ISD::BUILD_VECTOR) {
3288       SDValue Elt = N1.getOperand(N2C->getZExtValue());
3289
3290       if (VT != Elt.getValueType())
3291         // If the vector element type is not legal, the BUILD_VECTOR operands
3292         // are promoted and implicitly truncated, and the result implicitly
3293         // extended. Make that explicit here.
3294         Elt = getAnyExtOrTrunc(Elt, DL, VT);
3295
3296       return Elt;
3297     }
3298
3299     // EXTRACT_VECTOR_ELT of INSERT_VECTOR_ELT is often formed when vector
3300     // operations are lowered to scalars.
3301     if (N1.getOpcode() == ISD::INSERT_VECTOR_ELT) {
3302       // If the indices are the same, return the inserted element else
3303       // if the indices are known different, extract the element from
3304       // the original vector.
3305       SDValue N1Op2 = N1.getOperand(2);
3306       ConstantSDNode *N1Op2C = dyn_cast<ConstantSDNode>(N1Op2.getNode());
3307
3308       if (N1Op2C && N2C) {
3309         if (N1Op2C->getZExtValue() == N2C->getZExtValue()) {
3310           if (VT == N1.getOperand(1).getValueType())
3311             return N1.getOperand(1);
3312           else
3313             return getSExtOrTrunc(N1.getOperand(1), DL, VT);
3314         }
3315
3316         return getNode(ISD::EXTRACT_VECTOR_ELT, DL, VT, N1.getOperand(0), N2);
3317       }
3318     }
3319     break;
3320   case ISD::EXTRACT_ELEMENT:
3321     assert(N2C && (unsigned)N2C->getZExtValue() < 2 && "Bad EXTRACT_ELEMENT!");
3322     assert(!N1.getValueType().isVector() && !VT.isVector() &&
3323            (N1.getValueType().isInteger() == VT.isInteger()) &&
3324            N1.getValueType() != VT &&
3325            "Wrong types for EXTRACT_ELEMENT!");
3326
3327     // EXTRACT_ELEMENT of BUILD_PAIR is often formed while legalize is expanding
3328     // 64-bit integers into 32-bit parts.  Instead of building the extract of
3329     // the BUILD_PAIR, only to have legalize rip it apart, just do it now.
3330     if (N1.getOpcode() == ISD::BUILD_PAIR)
3331       return N1.getOperand(N2C->getZExtValue());
3332
3333     // EXTRACT_ELEMENT of a constant int is also very common.
3334     if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(N1)) {
3335       unsigned ElementSize = VT.getSizeInBits();
3336       unsigned Shift = ElementSize * N2C->getZExtValue();
3337       APInt ShiftedVal = C->getAPIntValue().lshr(Shift);
3338       return getConstant(ShiftedVal.trunc(ElementSize), VT);
3339     }
3340     break;
3341   case ISD::EXTRACT_SUBVECTOR: {
3342     SDValue Index = N2;
3343     if (VT.isSimple() && N1.getValueType().isSimple()) {
3344       assert(VT.isVector() && N1.getValueType().isVector() &&
3345              "Extract subvector VTs must be a vectors!");
3346       assert(VT.getVectorElementType() ==
3347              N1.getValueType().getVectorElementType() &&
3348              "Extract subvector VTs must have the same element type!");
3349       assert(VT.getSimpleVT() <= N1.getSimpleValueType() &&
3350              "Extract subvector must be from larger vector to smaller vector!");
3351
3352       if (isa<ConstantSDNode>(Index.getNode())) {
3353         assert((VT.getVectorNumElements() +
3354                 cast<ConstantSDNode>(Index.getNode())->getZExtValue()
3355                 <= N1.getValueType().getVectorNumElements())
3356                && "Extract subvector overflow!");
3357       }
3358
3359       // Trivial extraction.
3360       if (VT.getSimpleVT() == N1.getSimpleValueType())
3361         return N1;
3362     }
3363     break;
3364   }
3365   }
3366
3367   // Perform trivial constant folding.
3368   SDValue SV = FoldConstantArithmetic(Opcode, VT, N1.getNode(), N2.getNode());
3369   if (SV.getNode()) return SV;
3370
3371   // Canonicalize constant to RHS if commutative.
3372   if (N1C && !N2C && isCommutativeBinOp(Opcode)) {
3373     std::swap(N1C, N2C);
3374     std::swap(N1, N2);
3375   }
3376
3377   // Constant fold FP operations.
3378   ConstantFPSDNode *N1CFP = dyn_cast<ConstantFPSDNode>(N1.getNode());
3379   ConstantFPSDNode *N2CFP = dyn_cast<ConstantFPSDNode>(N2.getNode());
3380   if (N1CFP) {
3381     if (!N2CFP && isCommutativeBinOp(Opcode)) {
3382       // Canonicalize constant to RHS if commutative.
3383       std::swap(N1CFP, N2CFP);
3384       std::swap(N1, N2);
3385     } else if (N2CFP) {
3386       APFloat V1 = N1CFP->getValueAPF(), V2 = N2CFP->getValueAPF();
3387       APFloat::opStatus s;
3388       switch (Opcode) {
3389       case ISD::FADD:
3390         s = V1.add(V2, APFloat::rmNearestTiesToEven);
3391         if (s != APFloat::opInvalidOp)
3392           return getConstantFP(V1, VT);
3393         break;
3394       case ISD::FSUB:
3395         s = V1.subtract(V2, APFloat::rmNearestTiesToEven);
3396         if (s!=APFloat::opInvalidOp)
3397           return getConstantFP(V1, VT);
3398         break;
3399       case ISD::FMUL:
3400         s = V1.multiply(V2, APFloat::rmNearestTiesToEven);
3401         if (s!=APFloat::opInvalidOp)
3402           return getConstantFP(V1, VT);
3403         break;
3404       case ISD::FDIV:
3405         s = V1.divide(V2, APFloat::rmNearestTiesToEven);
3406         if (s!=APFloat::opInvalidOp && s!=APFloat::opDivByZero)
3407           return getConstantFP(V1, VT);
3408         break;
3409       case ISD::FREM :
3410         s = V1.mod(V2, APFloat::rmNearestTiesToEven);
3411         if (s!=APFloat::opInvalidOp && s!=APFloat::opDivByZero)
3412           return getConstantFP(V1, VT);
3413         break;
3414       case ISD::FCOPYSIGN:
3415         V1.copySign(V2);
3416         return getConstantFP(V1, VT);
3417       default: break;
3418       }
3419     }
3420
3421     if (Opcode == ISD::FP_ROUND) {
3422       APFloat V = N1CFP->getValueAPF();    // make copy
3423       bool ignored;
3424       // This can return overflow, underflow, or inexact; we don't care.
3425       // FIXME need to be more flexible about rounding mode.
3426       (void)V.convert(EVTToAPFloatSemantics(VT),
3427                       APFloat::rmNearestTiesToEven, &ignored);
3428       return getConstantFP(V, VT);
3429     }
3430   }
3431
3432   // Canonicalize an UNDEF to the RHS, even over a constant.
3433   if (N1.getOpcode() == ISD::UNDEF) {
3434     if (isCommutativeBinOp(Opcode)) {
3435       std::swap(N1, N2);
3436     } else {
3437       switch (Opcode) {
3438       case ISD::FP_ROUND_INREG:
3439       case ISD::SIGN_EXTEND_INREG:
3440       case ISD::SUB:
3441       case ISD::FSUB:
3442       case ISD::FDIV:
3443       case ISD::FREM:
3444       case ISD::SRA:
3445         return N1;     // fold op(undef, arg2) -> undef
3446       case ISD::UDIV:
3447       case ISD::SDIV:
3448       case ISD::UREM:
3449       case ISD::SREM:
3450       case ISD::SRL:
3451       case ISD::SHL:
3452         if (!VT.isVector())
3453           return getConstant(0, VT);    // fold op(undef, arg2) -> 0
3454         // For vectors, we can't easily build an all zero vector, just return
3455         // the LHS.
3456         return N2;
3457       }
3458     }
3459   }
3460
3461   // Fold a bunch of operators when the RHS is undef.
3462   if (N2.getOpcode() == ISD::UNDEF) {
3463     switch (Opcode) {
3464     case ISD::XOR:
3465       if (N1.getOpcode() == ISD::UNDEF)
3466         // Handle undef ^ undef -> 0 special case. This is a common
3467         // idiom (misuse).
3468         return getConstant(0, VT);
3469       // fallthrough
3470     case ISD::ADD:
3471     case ISD::ADDC:
3472     case ISD::ADDE:
3473     case ISD::SUB:
3474     case ISD::UDIV:
3475     case ISD::SDIV:
3476     case ISD::UREM:
3477     case ISD::SREM:
3478       return N2;       // fold op(arg1, undef) -> undef
3479     case ISD::FADD:
3480     case ISD::FSUB:
3481     case ISD::FMUL:
3482     case ISD::FDIV:
3483     case ISD::FREM:
3484       if (getTarget().Options.UnsafeFPMath)
3485         return N2;
3486       break;
3487     case ISD::MUL:
3488     case ISD::AND:
3489     case ISD::SRL:
3490     case ISD::SHL:
3491       if (!VT.isVector())
3492         return getConstant(0, VT);  // fold op(arg1, undef) -> 0
3493       // For vectors, we can't easily build an all zero vector, just return
3494       // the LHS.
3495       return N1;
3496     case ISD::OR:
3497       if (!VT.isVector())
3498         return getConstant(APInt::getAllOnesValue(VT.getSizeInBits()), VT);
3499       // For vectors, we can't easily build an all one vector, just return
3500       // the LHS.
3501       return N1;
3502     case ISD::SRA:
3503       return N1;
3504     }
3505   }
3506
3507   // Memoize this node if possible.
3508   BinarySDNode *N;
3509   SDVTList VTs = getVTList(VT);
3510   const bool BinOpHasFlags = isBinOpWithFlags(Opcode);
3511   if (VT != MVT::Glue) {
3512     SDValue Ops[] = {N1, N2};
3513     FoldingSetNodeID ID;
3514     AddNodeIDNode(ID, Opcode, VTs, Ops);
3515     if (BinOpHasFlags)
3516       AddBinaryNodeIDCustom(ID, Opcode, nuw, nsw, exact);
3517     void *IP = nullptr;
3518     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
3519       return SDValue(E, 0);
3520
3521     N = GetBinarySDNode(Opcode, DL, VTs, N1, N2, nuw, nsw, exact);
3522
3523     CSEMap.InsertNode(N, IP);
3524   } else {
3525
3526     N = GetBinarySDNode(Opcode, DL, VTs, N1, N2, nuw, nsw, exact);
3527   }
3528
3529   AllNodes.push_back(N);
3530 #ifndef NDEBUG
3531   VerifySDNode(N);
3532 #endif
3533   return SDValue(N, 0);
3534 }
3535
3536 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
3537                               SDValue N1, SDValue N2, SDValue N3) {
3538   // Perform various simplifications.
3539   ConstantSDNode *N1C = dyn_cast<ConstantSDNode>(N1.getNode());
3540   switch (Opcode) {
3541   case ISD::FMA: {
3542     ConstantFPSDNode *N1CFP = dyn_cast<ConstantFPSDNode>(N1);
3543     ConstantFPSDNode *N2CFP = dyn_cast<ConstantFPSDNode>(N2);
3544     ConstantFPSDNode *N3CFP = dyn_cast<ConstantFPSDNode>(N3);
3545     if (N1CFP && N2CFP && N3CFP) {
3546       APFloat  V1 = N1CFP->getValueAPF();
3547       const APFloat &V2 = N2CFP->getValueAPF();
3548       const APFloat &V3 = N3CFP->getValueAPF();
3549       APFloat::opStatus s =
3550         V1.fusedMultiplyAdd(V2, V3, APFloat::rmNearestTiesToEven);
3551       if (s != APFloat::opInvalidOp)
3552         return getConstantFP(V1, VT);
3553     }
3554     break;
3555   }
3556   case ISD::CONCAT_VECTORS:
3557     // A CONCAT_VECTOR with all operands BUILD_VECTOR can be simplified to
3558     // one big BUILD_VECTOR.
3559     if (N1.getOpcode() == ISD::BUILD_VECTOR &&
3560         N2.getOpcode() == ISD::BUILD_VECTOR &&
3561         N3.getOpcode() == ISD::BUILD_VECTOR) {
3562       SmallVector<SDValue, 16> Elts(N1.getNode()->op_begin(),
3563                                     N1.getNode()->op_end());
3564       Elts.append(N2.getNode()->op_begin(), N2.getNode()->op_end());
3565       Elts.append(N3.getNode()->op_begin(), N3.getNode()->op_end());
3566       return getNode(ISD::BUILD_VECTOR, DL, VT, Elts);
3567     }
3568     break;
3569   case ISD::SETCC: {
3570     // Use FoldSetCC to simplify SETCC's.
3571     SDValue Simp = FoldSetCC(VT, N1, N2, cast<CondCodeSDNode>(N3)->get(), DL);
3572     if (Simp.getNode()) return Simp;
3573     break;
3574   }
3575   case ISD::SELECT:
3576     if (N1C) {
3577      if (N1C->getZExtValue())
3578        return N2;             // select true, X, Y -> X
3579      return N3;             // select false, X, Y -> Y
3580     }
3581
3582     if (N2 == N3) return N2;   // select C, X, X -> X
3583     break;
3584   case ISD::VECTOR_SHUFFLE:
3585     llvm_unreachable("should use getVectorShuffle constructor!");
3586   case ISD::INSERT_SUBVECTOR: {
3587     SDValue Index = N3;
3588     if (VT.isSimple() && N1.getValueType().isSimple()
3589         && N2.getValueType().isSimple()) {
3590       assert(VT.isVector() && N1.getValueType().isVector() &&
3591              N2.getValueType().isVector() &&
3592              "Insert subvector VTs must be a vectors");
3593       assert(VT == N1.getValueType() &&
3594              "Dest and insert subvector source types must match!");
3595       assert(N2.getSimpleValueType() <= N1.getSimpleValueType() &&
3596              "Insert subvector must be from smaller vector to larger vector!");
3597       if (isa<ConstantSDNode>(Index.getNode())) {
3598         assert((N2.getValueType().getVectorNumElements() +
3599                 cast<ConstantSDNode>(Index.getNode())->getZExtValue()
3600                 <= VT.getVectorNumElements())
3601                && "Insert subvector overflow!");
3602       }
3603
3604       // Trivial insertion.
3605       if (VT.getSimpleVT() == N2.getSimpleValueType())
3606         return N2;
3607     }
3608     break;
3609   }
3610   case ISD::BITCAST:
3611     // Fold bit_convert nodes from a type to themselves.
3612     if (N1.getValueType() == VT)
3613       return N1;
3614     break;
3615   }
3616
3617   // Memoize node if it doesn't produce a flag.
3618   SDNode *N;
3619   SDVTList VTs = getVTList(VT);
3620   if (VT != MVT::Glue) {
3621     SDValue Ops[] = { N1, N2, N3 };
3622     FoldingSetNodeID ID;
3623     AddNodeIDNode(ID, Opcode, VTs, Ops);
3624     void *IP = nullptr;
3625     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
3626       return SDValue(E, 0);
3627
3628     N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
3629                                           DL.getDebugLoc(), VTs, N1, N2, N3);
3630     CSEMap.InsertNode(N, IP);
3631   } else {
3632     N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
3633                                           DL.getDebugLoc(), VTs, N1, N2, N3);
3634   }
3635
3636   AllNodes.push_back(N);
3637 #ifndef NDEBUG
3638   VerifySDNode(N);
3639 #endif
3640   return SDValue(N, 0);
3641 }
3642
3643 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
3644                               SDValue N1, SDValue N2, SDValue N3,
3645                               SDValue N4) {
3646   SDValue Ops[] = { N1, N2, N3, N4 };
3647   return getNode(Opcode, DL, VT, Ops);
3648 }
3649
3650 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
3651                               SDValue N1, SDValue N2, SDValue N3,
3652                               SDValue N4, SDValue N5) {
3653   SDValue Ops[] = { N1, N2, N3, N4, N5 };
3654   return getNode(Opcode, DL, VT, Ops);
3655 }
3656
3657 /// getStackArgumentTokenFactor - Compute a TokenFactor to force all
3658 /// the incoming stack arguments to be loaded from the stack.
3659 SDValue SelectionDAG::getStackArgumentTokenFactor(SDValue Chain) {
3660   SmallVector<SDValue, 8> ArgChains;
3661
3662   // Include the original chain at the beginning of the list. When this is
3663   // used by target LowerCall hooks, this helps legalize find the
3664   // CALLSEQ_BEGIN node.
3665   ArgChains.push_back(Chain);
3666
3667   // Add a chain value for each stack argument.
3668   for (SDNode::use_iterator U = getEntryNode().getNode()->use_begin(),
3669        UE = getEntryNode().getNode()->use_end(); U != UE; ++U)
3670     if (LoadSDNode *L = dyn_cast<LoadSDNode>(*U))
3671       if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(L->getBasePtr()))
3672         if (FI->getIndex() < 0)
3673           ArgChains.push_back(SDValue(L, 1));
3674
3675   // Build a tokenfactor for all the chains.
3676   return getNode(ISD::TokenFactor, SDLoc(Chain), MVT::Other, ArgChains);
3677 }
3678
3679 /// getMemsetValue - Vectorized representation of the memset value
3680 /// operand.
3681 static SDValue getMemsetValue(SDValue Value, EVT VT, SelectionDAG &DAG,
3682                               SDLoc dl) {
3683   assert(Value.getOpcode() != ISD::UNDEF);
3684
3685   unsigned NumBits = VT.getScalarType().getSizeInBits();
3686   if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Value)) {
3687     assert(C->getAPIntValue().getBitWidth() == 8);
3688     APInt Val = APInt::getSplat(NumBits, C->getAPIntValue());
3689     if (VT.isInteger())
3690       return DAG.getConstant(Val, VT);
3691     return DAG.getConstantFP(APFloat(DAG.EVTToAPFloatSemantics(VT), Val), VT);
3692   }
3693
3694   Value = DAG.getNode(ISD::ZERO_EXTEND, dl, VT, Value);
3695   if (NumBits > 8) {
3696     // Use a multiplication with 0x010101... to extend the input to the
3697     // required length.
3698     APInt Magic = APInt::getSplat(NumBits, APInt(8, 0x01));
3699     Value = DAG.getNode(ISD::MUL, dl, VT, Value, DAG.getConstant(Magic, VT));
3700   }
3701
3702   return Value;
3703 }
3704
3705 /// getMemsetStringVal - Similar to getMemsetValue. Except this is only
3706 /// used when a memcpy is turned into a memset when the source is a constant
3707 /// string ptr.
3708 static SDValue getMemsetStringVal(EVT VT, SDLoc dl, SelectionDAG &DAG,
3709                                   const TargetLowering &TLI, StringRef Str) {
3710   // Handle vector with all elements zero.
3711   if (Str.empty()) {
3712     if (VT.isInteger())
3713       return DAG.getConstant(0, VT);
3714     else if (VT == MVT::f32 || VT == MVT::f64 || VT == MVT::f128)
3715       return DAG.getConstantFP(0.0, VT);
3716     else if (VT.isVector()) {
3717       unsigned NumElts = VT.getVectorNumElements();
3718       MVT EltVT = (VT.getVectorElementType() == MVT::f32) ? MVT::i32 : MVT::i64;
3719       return DAG.getNode(ISD::BITCAST, dl, VT,
3720                          DAG.getConstant(0, EVT::getVectorVT(*DAG.getContext(),
3721                                                              EltVT, NumElts)));
3722     } else
3723       llvm_unreachable("Expected type!");
3724   }
3725
3726   assert(!VT.isVector() && "Can't handle vector type here!");
3727   unsigned NumVTBits = VT.getSizeInBits();
3728   unsigned NumVTBytes = NumVTBits / 8;
3729   unsigned NumBytes = std::min(NumVTBytes, unsigned(Str.size()));
3730
3731   APInt Val(NumVTBits, 0);
3732   if (TLI.isLittleEndian()) {
3733     for (unsigned i = 0; i != NumBytes; ++i)
3734       Val |= (uint64_t)(unsigned char)Str[i] << i*8;
3735   } else {
3736     for (unsigned i = 0; i != NumBytes; ++i)
3737       Val |= (uint64_t)(unsigned char)Str[i] << (NumVTBytes-i-1)*8;
3738   }
3739
3740   // If the "cost" of materializing the integer immediate is less than the cost
3741   // of a load, then it is cost effective to turn the load into the immediate.
3742   Type *Ty = VT.getTypeForEVT(*DAG.getContext());
3743   if (TLI.shouldConvertConstantLoadToIntImm(Val, Ty))
3744     return DAG.getConstant(Val, VT);
3745   return SDValue(nullptr, 0);
3746 }
3747
3748 /// getMemBasePlusOffset - Returns base and offset node for the
3749 ///
3750 static SDValue getMemBasePlusOffset(SDValue Base, unsigned Offset, SDLoc dl,
3751                                       SelectionDAG &DAG) {
3752   EVT VT = Base.getValueType();
3753   return DAG.getNode(ISD::ADD, dl,
3754                      VT, Base, DAG.getConstant(Offset, VT));
3755 }
3756
3757 /// isMemSrcFromString - Returns true if memcpy source is a string constant.
3758 ///
3759 static bool isMemSrcFromString(SDValue Src, StringRef &Str) {
3760   unsigned SrcDelta = 0;
3761   GlobalAddressSDNode *G = nullptr;
3762   if (Src.getOpcode() == ISD::GlobalAddress)
3763     G = cast<GlobalAddressSDNode>(Src);
3764   else if (Src.getOpcode() == ISD::ADD &&
3765            Src.getOperand(0).getOpcode() == ISD::GlobalAddress &&
3766            Src.getOperand(1).getOpcode() == ISD::Constant) {
3767     G = cast<GlobalAddressSDNode>(Src.getOperand(0));
3768     SrcDelta = cast<ConstantSDNode>(Src.getOperand(1))->getZExtValue();
3769   }
3770   if (!G)
3771     return false;
3772
3773   return getConstantStringInfo(G->getGlobal(), Str, SrcDelta, false);
3774 }
3775
3776 /// FindOptimalMemOpLowering - Determines the optimial series memory ops
3777 /// to replace the memset / memcpy. Return true if the number of memory ops
3778 /// is below the threshold. It returns the types of the sequence of
3779 /// memory ops to perform memset / memcpy by reference.
3780 static bool FindOptimalMemOpLowering(std::vector<EVT> &MemOps,
3781                                      unsigned Limit, uint64_t Size,
3782                                      unsigned DstAlign, unsigned SrcAlign,
3783                                      bool IsMemset,
3784                                      bool ZeroMemset,
3785                                      bool MemcpyStrSrc,
3786                                      bool AllowOverlap,
3787                                      SelectionDAG &DAG,
3788                                      const TargetLowering &TLI) {
3789   assert((SrcAlign == 0 || SrcAlign >= DstAlign) &&
3790          "Expecting memcpy / memset source to meet alignment requirement!");
3791   // If 'SrcAlign' is zero, that means the memory operation does not need to
3792   // load the value, i.e. memset or memcpy from constant string. Otherwise,
3793   // it's the inferred alignment of the source. 'DstAlign', on the other hand,
3794   // is the specified alignment of the memory operation. If it is zero, that
3795   // means it's possible to change the alignment of the destination.
3796   // 'MemcpyStrSrc' indicates whether the memcpy source is constant so it does
3797   // not need to be loaded.
3798   EVT VT = TLI.getOptimalMemOpType(Size, DstAlign, SrcAlign,
3799                                    IsMemset, ZeroMemset, MemcpyStrSrc,
3800                                    DAG.getMachineFunction());
3801
3802   if (VT == MVT::Other) {
3803     unsigned AS = 0;
3804     if (DstAlign >= TLI.getDataLayout()->getPointerPrefAlignment(AS) ||
3805         TLI.allowsUnalignedMemoryAccesses(VT, AS)) {
3806       VT = TLI.getPointerTy();
3807     } else {
3808       switch (DstAlign & 7) {
3809       case 0:  VT = MVT::i64; break;
3810       case 4:  VT = MVT::i32; break;
3811       case 2:  VT = MVT::i16; break;
3812       default: VT = MVT::i8;  break;
3813       }
3814     }
3815
3816     MVT LVT = MVT::i64;
3817     while (!TLI.isTypeLegal(LVT))
3818       LVT = (MVT::SimpleValueType)(LVT.SimpleTy - 1);
3819     assert(LVT.isInteger());
3820
3821     if (VT.bitsGT(LVT))
3822       VT = LVT;
3823   }
3824
3825   unsigned NumMemOps = 0;
3826   while (Size != 0) {
3827     unsigned VTSize = VT.getSizeInBits() / 8;
3828     while (VTSize > Size) {
3829       // For now, only use non-vector load / store's for the left-over pieces.
3830       EVT NewVT = VT;
3831       unsigned NewVTSize;
3832
3833       bool Found = false;
3834       if (VT.isVector() || VT.isFloatingPoint()) {
3835         NewVT = (VT.getSizeInBits() > 64) ? MVT::i64 : MVT::i32;
3836         if (TLI.isOperationLegalOrCustom(ISD::STORE, NewVT) &&
3837             TLI.isSafeMemOpType(NewVT.getSimpleVT()))
3838           Found = true;
3839         else if (NewVT == MVT::i64 &&
3840                  TLI.isOperationLegalOrCustom(ISD::STORE, MVT::f64) &&
3841                  TLI.isSafeMemOpType(MVT::f64)) {
3842           // i64 is usually not legal on 32-bit targets, but f64 may be.
3843           NewVT = MVT::f64;
3844           Found = true;
3845         }
3846       }
3847
3848       if (!Found) {
3849         do {
3850           NewVT = (MVT::SimpleValueType)(NewVT.getSimpleVT().SimpleTy - 1);
3851           if (NewVT == MVT::i8)
3852             break;
3853         } while (!TLI.isSafeMemOpType(NewVT.getSimpleVT()));
3854       }
3855       NewVTSize = NewVT.getSizeInBits() / 8;
3856
3857       // If the new VT cannot cover all of the remaining bits, then consider
3858       // issuing a (or a pair of) unaligned and overlapping load / store.
3859       // FIXME: Only does this for 64-bit or more since we don't have proper
3860       // cost model for unaligned load / store.
3861       bool Fast;
3862       unsigned AS = 0;
3863       if (NumMemOps && AllowOverlap &&
3864           VTSize >= 8 && NewVTSize < Size &&
3865           TLI.allowsUnalignedMemoryAccesses(VT, AS, &Fast) && Fast)
3866         VTSize = Size;
3867       else {
3868         VT = NewVT;
3869         VTSize = NewVTSize;
3870       }
3871     }
3872
3873     if (++NumMemOps > Limit)
3874       return false;
3875
3876     MemOps.push_back(VT);
3877     Size -= VTSize;
3878   }
3879
3880   return true;
3881 }
3882
3883 static SDValue getMemcpyLoadsAndStores(SelectionDAG &DAG, SDLoc dl,
3884                                        SDValue Chain, SDValue Dst,
3885                                        SDValue Src, uint64_t Size,
3886                                        unsigned Align, bool isVol,
3887                                        bool AlwaysInline,
3888                                        MachinePointerInfo DstPtrInfo,
3889                                        MachinePointerInfo SrcPtrInfo) {
3890   // Turn a memcpy of undef to nop.
3891   if (Src.getOpcode() == ISD::UNDEF)
3892     return Chain;
3893
3894   // Expand memcpy to a series of load and store ops if the size operand falls
3895   // below a certain threshold.
3896   // TODO: In the AlwaysInline case, if the size is big then generate a loop
3897   // rather than maybe a humongous number of loads and stores.
3898   const TargetLowering &TLI = DAG.getTargetLoweringInfo();
3899   std::vector<EVT> MemOps;
3900   bool DstAlignCanChange = false;
3901   MachineFunction &MF = DAG.getMachineFunction();
3902   MachineFrameInfo *MFI = MF.getFrameInfo();
3903   bool OptSize =
3904     MF.getFunction()->getAttributes().
3905       hasAttribute(AttributeSet::FunctionIndex, Attribute::OptimizeForSize);
3906   FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
3907   if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
3908     DstAlignCanChange = true;
3909   unsigned SrcAlign = DAG.InferPtrAlignment(Src);
3910   if (Align > SrcAlign)
3911     SrcAlign = Align;
3912   StringRef Str;
3913   bool CopyFromStr = isMemSrcFromString(Src, Str);
3914   bool isZeroStr = CopyFromStr && Str.empty();
3915   unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemcpy(OptSize);
3916
3917   if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
3918                                 (DstAlignCanChange ? 0 : Align),
3919                                 (isZeroStr ? 0 : SrcAlign),
3920                                 false, false, CopyFromStr, true, DAG, TLI))
3921     return SDValue();
3922
3923   if (DstAlignCanChange) {
3924     Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
3925     unsigned NewAlign = (unsigned) TLI.getDataLayout()->getABITypeAlignment(Ty);
3926
3927     // Don't promote to an alignment that would require dynamic stack
3928     // realignment.
3929     const TargetRegisterInfo *TRI = MF.getTarget().getRegisterInfo();
3930     if (!TRI->needsStackRealignment(MF))
3931        while (NewAlign > Align &&
3932              TLI.getDataLayout()->exceedsNaturalStackAlignment(NewAlign))
3933           NewAlign /= 2;
3934
3935     if (NewAlign > Align) {
3936       // Give the stack frame object a larger alignment if needed.
3937       if (MFI->getObjectAlignment(FI->getIndex()) < NewAlign)
3938         MFI->setObjectAlignment(FI->getIndex(), NewAlign);
3939       Align = NewAlign;
3940     }
3941   }
3942
3943   SmallVector<SDValue, 8> OutChains;
3944   unsigned NumMemOps = MemOps.size();
3945   uint64_t SrcOff = 0, DstOff = 0;
3946   for (unsigned i = 0; i != NumMemOps; ++i) {
3947     EVT VT = MemOps[i];
3948     unsigned VTSize = VT.getSizeInBits() / 8;
3949     SDValue Value, Store;
3950
3951     if (VTSize > Size) {
3952       // Issuing an unaligned load / store pair  that overlaps with the previous
3953       // pair. Adjust the offset accordingly.
3954       assert(i == NumMemOps-1 && i != 0);
3955       SrcOff -= VTSize - Size;
3956       DstOff -= VTSize - Size;
3957     }
3958
3959     if (CopyFromStr &&
3960         (isZeroStr || (VT.isInteger() && !VT.isVector()))) {
3961       // It's unlikely a store of a vector immediate can be done in a single
3962       // instruction. It would require a load from a constantpool first.
3963       // We only handle zero vectors here.
3964       // FIXME: Handle other cases where store of vector immediate is done in
3965       // a single instruction.
3966       Value = getMemsetStringVal(VT, dl, DAG, TLI, Str.substr(SrcOff));
3967       if (Value.getNode())
3968         Store = DAG.getStore(Chain, dl, Value,
3969                              getMemBasePlusOffset(Dst, DstOff, dl, DAG),
3970                              DstPtrInfo.getWithOffset(DstOff), isVol,
3971                              false, Align);
3972     }
3973
3974     if (!Store.getNode()) {
3975       // The type might not be legal for the target.  This should only happen
3976       // if the type is smaller than a legal type, as on PPC, so the right
3977       // thing to do is generate a LoadExt/StoreTrunc pair.  These simplify
3978       // to Load/Store if NVT==VT.
3979       // FIXME does the case above also need this?
3980       EVT NVT = TLI.getTypeToTransformTo(*DAG.getContext(), VT);
3981       assert(NVT.bitsGE(VT));
3982       Value = DAG.getExtLoad(ISD::EXTLOAD, dl, NVT, Chain,
3983                              getMemBasePlusOffset(Src, SrcOff, dl, DAG),
3984                              SrcPtrInfo.getWithOffset(SrcOff), VT, isVol, false,
3985                              MinAlign(SrcAlign, SrcOff));
3986       Store = DAG.getTruncStore(Chain, dl, Value,
3987                                 getMemBasePlusOffset(Dst, DstOff, dl, DAG),
3988                                 DstPtrInfo.getWithOffset(DstOff), VT, isVol,
3989                                 false, Align);
3990     }
3991     OutChains.push_back(Store);
3992     SrcOff += VTSize;
3993     DstOff += VTSize;
3994     Size -= VTSize;
3995   }
3996
3997   return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OutChains);
3998 }
3999
4000 static SDValue getMemmoveLoadsAndStores(SelectionDAG &DAG, SDLoc dl,
4001                                         SDValue Chain, SDValue Dst,
4002                                         SDValue Src, uint64_t Size,
4003                                         unsigned Align,  bool isVol,
4004                                         bool AlwaysInline,
4005                                         MachinePointerInfo DstPtrInfo,
4006                                         MachinePointerInfo SrcPtrInfo) {
4007   // Turn a memmove of undef to nop.
4008   if (Src.getOpcode() == ISD::UNDEF)
4009     return Chain;
4010
4011   // Expand memmove to a series of load and store ops if the size operand falls
4012   // below a certain threshold.
4013   const TargetLowering &TLI = DAG.getTargetLoweringInfo();
4014   std::vector<EVT> MemOps;
4015   bool DstAlignCanChange = false;
4016   MachineFunction &MF = DAG.getMachineFunction();
4017   MachineFrameInfo *MFI = MF.getFrameInfo();
4018   bool OptSize = MF.getFunction()->getAttributes().
4019     hasAttribute(AttributeSet::FunctionIndex, Attribute::OptimizeForSize);
4020   FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
4021   if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
4022     DstAlignCanChange = true;
4023   unsigned SrcAlign = DAG.InferPtrAlignment(Src);
4024   if (Align > SrcAlign)
4025     SrcAlign = Align;
4026   unsigned Limit = AlwaysInline ? ~0U : TLI.getMaxStoresPerMemmove(OptSize);
4027
4028   if (!FindOptimalMemOpLowering(MemOps, Limit, Size,
4029                                 (DstAlignCanChange ? 0 : Align), SrcAlign,
4030                                 false, false, false, false, DAG, TLI))
4031     return SDValue();
4032
4033   if (DstAlignCanChange) {
4034     Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
4035     unsigned NewAlign = (unsigned) TLI.getDataLayout()->getABITypeAlignment(Ty);
4036     if (NewAlign > Align) {
4037       // Give the stack frame object a larger alignment if needed.
4038       if (MFI->getObjectAlignment(FI->getIndex()) < NewAlign)
4039         MFI->setObjectAlignment(FI->getIndex(), NewAlign);
4040       Align = NewAlign;
4041     }
4042   }
4043
4044   uint64_t SrcOff = 0, DstOff = 0;
4045   SmallVector<SDValue, 8> LoadValues;
4046   SmallVector<SDValue, 8> LoadChains;
4047   SmallVector<SDValue, 8> OutChains;
4048   unsigned NumMemOps = MemOps.size();
4049   for (unsigned i = 0; i < NumMemOps; i++) {
4050     EVT VT = MemOps[i];
4051     unsigned VTSize = VT.getSizeInBits() / 8;
4052     SDValue Value;
4053
4054     Value = DAG.getLoad(VT, dl, Chain,
4055                         getMemBasePlusOffset(Src, SrcOff, dl, DAG),
4056                         SrcPtrInfo.getWithOffset(SrcOff), isVol,
4057                         false, false, SrcAlign);
4058     LoadValues.push_back(Value);
4059     LoadChains.push_back(Value.getValue(1));
4060     SrcOff += VTSize;
4061   }
4062   Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, LoadChains);
4063   OutChains.clear();
4064   for (unsigned i = 0; i < NumMemOps; i++) {
4065     EVT VT = MemOps[i];
4066     unsigned VTSize = VT.getSizeInBits() / 8;
4067     SDValue Store;
4068
4069     Store = DAG.getStore(Chain, dl, LoadValues[i],
4070                          getMemBasePlusOffset(Dst, DstOff, dl, DAG),
4071                          DstPtrInfo.getWithOffset(DstOff), isVol, false, Align);
4072     OutChains.push_back(Store);
4073     DstOff += VTSize;
4074   }
4075
4076   return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OutChains);
4077 }
4078
4079 /// \brief Lower the call to 'memset' intrinsic function into a series of store
4080 /// operations.
4081 ///
4082 /// \param DAG Selection DAG where lowered code is placed.
4083 /// \param dl Link to corresponding IR location.
4084 /// \param Chain Control flow dependency.
4085 /// \param Dst Pointer to destination memory location.
4086 /// \param Src Value of byte to write into the memory.
4087 /// \param Size Number of bytes to write.
4088 /// \param Align Alignment of the destination in bytes.
4089 /// \param isVol True if destination is volatile.
4090 /// \param DstPtrInfo IR information on the memory pointer.
4091 /// \returns New head in the control flow, if lowering was successful, empty
4092 /// SDValue otherwise.
4093 ///
4094 /// The function tries to replace 'llvm.memset' intrinsic with several store
4095 /// operations and value calculation code. This is usually profitable for small
4096 /// memory size.
4097 static SDValue getMemsetStores(SelectionDAG &DAG, SDLoc dl,
4098                                SDValue Chain, SDValue Dst,
4099                                SDValue Src, uint64_t Size,
4100                                unsigned Align, bool isVol,
4101                                MachinePointerInfo DstPtrInfo) {
4102   // Turn a memset of undef to nop.
4103   if (Src.getOpcode() == ISD::UNDEF)
4104     return Chain;
4105
4106   // Expand memset to a series of load/store ops if the size operand
4107   // falls below a certain threshold.
4108   const TargetLowering &TLI = DAG.getTargetLoweringInfo();
4109   std::vector<EVT> MemOps;
4110   bool DstAlignCanChange = false;
4111   MachineFunction &MF = DAG.getMachineFunction();
4112   MachineFrameInfo *MFI = MF.getFrameInfo();
4113   bool OptSize = MF.getFunction()->getAttributes().
4114     hasAttribute(AttributeSet::FunctionIndex, Attribute::OptimizeForSize);
4115   FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Dst);
4116   if (FI && !MFI->isFixedObjectIndex(FI->getIndex()))
4117     DstAlignCanChange = true;
4118   bool IsZeroVal =
4119     isa<ConstantSDNode>(Src) && cast<ConstantSDNode>(Src)->isNullValue();
4120   if (!FindOptimalMemOpLowering(MemOps, TLI.getMaxStoresPerMemset(OptSize),
4121                                 Size, (DstAlignCanChange ? 0 : Align), 0,
4122                                 true, IsZeroVal, false, true, DAG, TLI))
4123     return SDValue();
4124
4125   if (DstAlignCanChange) {
4126     Type *Ty = MemOps[0].getTypeForEVT(*DAG.getContext());
4127     unsigned NewAlign = (unsigned) TLI.getDataLayout()->getABITypeAlignment(Ty);
4128     if (NewAlign > Align) {
4129       // Give the stack frame object a larger alignment if needed.
4130       if (MFI->getObjectAlignment(FI->getIndex()) < NewAlign)
4131         MFI->setObjectAlignment(FI->getIndex(), NewAlign);
4132       Align = NewAlign;
4133     }
4134   }
4135
4136   SmallVector<SDValue, 8> OutChains;
4137   uint64_t DstOff = 0;
4138   unsigned NumMemOps = MemOps.size();
4139
4140   // Find the largest store and generate the bit pattern for it.
4141   EVT LargestVT = MemOps[0];
4142   for (unsigned i = 1; i < NumMemOps; i++)
4143     if (MemOps[i].bitsGT(LargestVT))
4144       LargestVT = MemOps[i];
4145   SDValue MemSetValue = getMemsetValue(Src, LargestVT, DAG, dl);
4146
4147   for (unsigned i = 0; i < NumMemOps; i++) {
4148     EVT VT = MemOps[i];
4149     unsigned VTSize = VT.getSizeInBits() / 8;
4150     if (VTSize > Size) {
4151       // Issuing an unaligned load / store pair  that overlaps with the previous
4152       // pair. Adjust the offset accordingly.
4153       assert(i == NumMemOps-1 && i != 0);
4154       DstOff -= VTSize - Size;
4155     }
4156
4157     // If this store is smaller than the largest store see whether we can get
4158     // the smaller value for free with a truncate.
4159     SDValue Value = MemSetValue;
4160     if (VT.bitsLT(LargestVT)) {
4161       if (!LargestVT.isVector() && !VT.isVector() &&
4162           TLI.isTruncateFree(LargestVT, VT))
4163         Value = DAG.getNode(ISD::TRUNCATE, dl, VT, MemSetValue);
4164       else
4165         Value = getMemsetValue(Src, VT, DAG, dl);
4166     }
4167     assert(Value.getValueType() == VT && "Value with wrong type.");
4168     SDValue Store = DAG.getStore(Chain, dl, Value,
4169                                  getMemBasePlusOffset(Dst, DstOff, dl, DAG),
4170                                  DstPtrInfo.getWithOffset(DstOff),
4171                                  isVol, false, Align);
4172     OutChains.push_back(Store);
4173     DstOff += VT.getSizeInBits() / 8;
4174     Size -= VTSize;
4175   }
4176
4177   return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OutChains);
4178 }
4179
4180 SDValue SelectionDAG::getMemcpy(SDValue Chain, SDLoc dl, SDValue Dst,
4181                                 SDValue Src, SDValue Size,
4182                                 unsigned Align, bool isVol, bool AlwaysInline,
4183                                 MachinePointerInfo DstPtrInfo,
4184                                 MachinePointerInfo SrcPtrInfo) {
4185   assert(Align && "The SDAG layer expects explicit alignment and reserves 0");
4186
4187   // Check to see if we should lower the memcpy to loads and stores first.
4188   // For cases within the target-specified limits, this is the best choice.
4189   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
4190   if (ConstantSize) {
4191     // Memcpy with size zero? Just return the original chain.
4192     if (ConstantSize->isNullValue())
4193       return Chain;
4194
4195     SDValue Result = getMemcpyLoadsAndStores(*this, dl, Chain, Dst, Src,
4196                                              ConstantSize->getZExtValue(),Align,
4197                                 isVol, false, DstPtrInfo, SrcPtrInfo);
4198     if (Result.getNode())
4199       return Result;
4200   }
4201
4202   // Then check to see if we should lower the memcpy with target-specific
4203   // code. If the target chooses to do this, this is the next best.
4204   SDValue Result =
4205     TSI.EmitTargetCodeForMemcpy(*this, dl, Chain, Dst, Src, Size, Align,
4206                                 isVol, AlwaysInline,
4207                                 DstPtrInfo, SrcPtrInfo);
4208   if (Result.getNode())
4209     return Result;
4210
4211   // If we really need inline code and the target declined to provide it,
4212   // use a (potentially long) sequence of loads and stores.
4213   if (AlwaysInline) {
4214     assert(ConstantSize && "AlwaysInline requires a constant size!");
4215     return getMemcpyLoadsAndStores(*this, dl, Chain, Dst, Src,
4216                                    ConstantSize->getZExtValue(), Align, isVol,
4217                                    true, DstPtrInfo, SrcPtrInfo);
4218   }
4219
4220   // FIXME: If the memcpy is volatile (isVol), lowering it to a plain libc
4221   // memcpy is not guaranteed to be safe. libc memcpys aren't required to
4222   // respect volatile, so they may do things like read or write memory
4223   // beyond the given memory regions. But fixing this isn't easy, and most
4224   // people don't care.
4225
4226   const TargetLowering *TLI = TM.getTargetLowering();
4227
4228   // Emit a library call.
4229   TargetLowering::ArgListTy Args;
4230   TargetLowering::ArgListEntry Entry;
4231   Entry.Ty = TLI->getDataLayout()->getIntPtrType(*getContext());
4232   Entry.Node = Dst; Args.push_back(Entry);
4233   Entry.Node = Src; Args.push_back(Entry);
4234   Entry.Node = Size; Args.push_back(Entry);
4235   // FIXME: pass in SDLoc
4236   TargetLowering::CallLoweringInfo CLI(*this);
4237   CLI.setDebugLoc(dl).setChain(Chain)
4238     .setCallee(TLI->getLibcallCallingConv(RTLIB::MEMCPY),
4239                Type::getVoidTy(*getContext()),
4240                getExternalSymbol(TLI->getLibcallName(RTLIB::MEMCPY),
4241                                  TLI->getPointerTy()), std::move(Args), 0)
4242     .setDiscardResult();
4243   std::pair<SDValue,SDValue> CallResult = TLI->LowerCallTo(CLI);
4244
4245   return CallResult.second;
4246 }
4247
4248 SDValue SelectionDAG::getMemmove(SDValue Chain, SDLoc dl, SDValue Dst,
4249                                  SDValue Src, SDValue Size,
4250                                  unsigned Align, bool isVol,
4251                                  MachinePointerInfo DstPtrInfo,
4252                                  MachinePointerInfo SrcPtrInfo) {
4253   assert(Align && "The SDAG layer expects explicit alignment and reserves 0");
4254
4255   // Check to see if we should lower the memmove to loads and stores first.
4256   // For cases within the target-specified limits, this is the best choice.
4257   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
4258   if (ConstantSize) {
4259     // Memmove with size zero? Just return the original chain.
4260     if (ConstantSize->isNullValue())
4261       return Chain;
4262
4263     SDValue Result =
4264       getMemmoveLoadsAndStores(*this, dl, Chain, Dst, Src,
4265                                ConstantSize->getZExtValue(), Align, isVol,
4266                                false, DstPtrInfo, SrcPtrInfo);
4267     if (Result.getNode())
4268       return Result;
4269   }
4270
4271   // Then check to see if we should lower the memmove with target-specific
4272   // code. If the target chooses to do this, this is the next best.
4273   SDValue Result =
4274     TSI.EmitTargetCodeForMemmove(*this, dl, Chain, Dst, Src, Size, Align, isVol,
4275                                  DstPtrInfo, SrcPtrInfo);
4276   if (Result.getNode())
4277     return Result;
4278
4279   // FIXME: If the memmove is volatile, lowering it to plain libc memmove may
4280   // not be safe.  See memcpy above for more details.
4281
4282   const TargetLowering *TLI = TM.getTargetLowering();
4283
4284   // Emit a library call.
4285   TargetLowering::ArgListTy Args;
4286   TargetLowering::ArgListEntry Entry;
4287   Entry.Ty = TLI->getDataLayout()->getIntPtrType(*getContext());
4288   Entry.Node = Dst; Args.push_back(Entry);
4289   Entry.Node = Src; Args.push_back(Entry);
4290   Entry.Node = Size; Args.push_back(Entry);
4291   // FIXME:  pass in SDLoc
4292   TargetLowering::CallLoweringInfo CLI(*this);
4293   CLI.setDebugLoc(dl).setChain(Chain)
4294     .setCallee(TLI->getLibcallCallingConv(RTLIB::MEMMOVE),
4295                Type::getVoidTy(*getContext()),
4296                getExternalSymbol(TLI->getLibcallName(RTLIB::MEMMOVE),
4297                                  TLI->getPointerTy()), std::move(Args), 0)
4298     .setDiscardResult();
4299   std::pair<SDValue,SDValue> CallResult = TLI->LowerCallTo(CLI);
4300
4301   return CallResult.second;
4302 }
4303
4304 SDValue SelectionDAG::getMemset(SDValue Chain, SDLoc dl, SDValue Dst,
4305                                 SDValue Src, SDValue Size,
4306                                 unsigned Align, bool isVol,
4307                                 MachinePointerInfo DstPtrInfo) {
4308   assert(Align && "The SDAG layer expects explicit alignment and reserves 0");
4309
4310   // Check to see if we should lower the memset to stores first.
4311   // For cases within the target-specified limits, this is the best choice.
4312   ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
4313   if (ConstantSize) {
4314     // Memset with size zero? Just return the original chain.
4315     if (ConstantSize->isNullValue())
4316       return Chain;
4317
4318     SDValue Result =
4319       getMemsetStores(*this, dl, Chain, Dst, Src, ConstantSize->getZExtValue(),
4320                       Align, isVol, DstPtrInfo);
4321
4322     if (Result.getNode())
4323       return Result;
4324   }
4325
4326   // Then check to see if we should lower the memset with target-specific
4327   // code. If the target chooses to do this, this is the next best.
4328   SDValue Result =
4329     TSI.EmitTargetCodeForMemset(*this, dl, Chain, Dst, Src, Size, Align, isVol,
4330                                 DstPtrInfo);
4331   if (Result.getNode())
4332     return Result;
4333
4334   // Emit a library call.
4335   const TargetLowering *TLI = TM.getTargetLowering();
4336   Type *IntPtrTy = TLI->getDataLayout()->getIntPtrType(*getContext());
4337   TargetLowering::ArgListTy Args;
4338   TargetLowering::ArgListEntry Entry;
4339   Entry.Node = Dst; Entry.Ty = IntPtrTy;
4340   Args.push_back(Entry);
4341   // Extend or truncate the argument to be an i32 value for the call.
4342   if (Src.getValueType().bitsGT(MVT::i32))
4343     Src = getNode(ISD::TRUNCATE, dl, MVT::i32, Src);
4344   else
4345     Src = getNode(ISD::ZERO_EXTEND, dl, MVT::i32, Src);
4346   Entry.Node = Src;
4347   Entry.Ty = Type::getInt32Ty(*getContext());
4348   Entry.isSExt = true;
4349   Args.push_back(Entry);
4350   Entry.Node = Size;
4351   Entry.Ty = IntPtrTy;
4352   Entry.isSExt = false;
4353   Args.push_back(Entry);
4354
4355   // FIXME: pass in SDLoc
4356   TargetLowering::CallLoweringInfo CLI(*this);
4357   CLI.setDebugLoc(dl).setChain(Chain)
4358     .setCallee(TLI->getLibcallCallingConv(RTLIB::MEMSET),
4359                Type::getVoidTy(*getContext()),
4360                getExternalSymbol(TLI->getLibcallName(RTLIB::MEMSET),
4361                                  TLI->getPointerTy()), std::move(Args), 0)
4362     .setDiscardResult();
4363
4364   std::pair<SDValue,SDValue> CallResult = TLI->LowerCallTo(CLI);
4365   return CallResult.second;
4366 }
4367
4368 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4369                                 SDVTList VTList, ArrayRef<SDValue> Ops,
4370                                 MachineMemOperand *MMO,
4371                                 AtomicOrdering SuccessOrdering,
4372                                 AtomicOrdering FailureOrdering,
4373                                 SynchronizationScope SynchScope) {
4374   FoldingSetNodeID ID;
4375   ID.AddInteger(MemVT.getRawBits());
4376   AddNodeIDNode(ID, Opcode, VTList, Ops);
4377   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
4378   void* IP = nullptr;
4379   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
4380     cast<AtomicSDNode>(E)->refineAlignment(MMO);
4381     return SDValue(E, 0);
4382   }
4383
4384   // Allocate the operands array for the node out of the BumpPtrAllocator, since
4385   // SDNode doesn't have access to it.  This memory will be "leaked" when
4386   // the node is deallocated, but recovered when the allocator is released.
4387   // If the number of operands is less than 5 we use AtomicSDNode's internal
4388   // storage.
4389   unsigned NumOps = Ops.size();
4390   SDUse *DynOps = NumOps > 4 ? OperandAllocator.Allocate<SDUse>(NumOps)
4391                              : nullptr;
4392
4393   SDNode *N = new (NodeAllocator) AtomicSDNode(Opcode, dl.getIROrder(),
4394                                                dl.getDebugLoc(), VTList, MemVT,
4395                                                Ops.data(), DynOps, NumOps, MMO,
4396                                                SuccessOrdering, FailureOrdering,
4397                                                SynchScope);
4398   CSEMap.InsertNode(N, IP);
4399   AllNodes.push_back(N);
4400   return SDValue(N, 0);
4401 }
4402
4403 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4404                                 SDVTList VTList, ArrayRef<SDValue> Ops,
4405                                 MachineMemOperand *MMO,
4406                                 AtomicOrdering Ordering,
4407                                 SynchronizationScope SynchScope) {
4408   return getAtomic(Opcode, dl, MemVT, VTList, Ops, MMO, Ordering,
4409                    Ordering, SynchScope);
4410 }
4411
4412 SDValue SelectionDAG::getAtomicCmpSwap(
4413     unsigned Opcode, SDLoc dl, EVT MemVT, SDVTList VTs, SDValue Chain,
4414     SDValue Ptr, SDValue Cmp, SDValue Swp, MachinePointerInfo PtrInfo,
4415     unsigned Alignment, AtomicOrdering SuccessOrdering,
4416     AtomicOrdering FailureOrdering, SynchronizationScope SynchScope) {
4417   assert(Opcode == ISD::ATOMIC_CMP_SWAP ||
4418          Opcode == ISD::ATOMIC_CMP_SWAP_WITH_SUCCESS);
4419   assert(Cmp.getValueType() == Swp.getValueType() && "Invalid Atomic Op Types");
4420
4421   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
4422     Alignment = getEVTAlignment(MemVT);
4423
4424   MachineFunction &MF = getMachineFunction();
4425
4426   // FIXME: Volatile isn't really correct; we should keep track of atomic
4427   // orderings in the memoperand.
4428   unsigned Flags = MachineMemOperand::MOVolatile;
4429   Flags |= MachineMemOperand::MOLoad;
4430   Flags |= MachineMemOperand::MOStore;
4431
4432   MachineMemOperand *MMO =
4433     MF.getMachineMemOperand(PtrInfo, Flags, MemVT.getStoreSize(), Alignment);
4434
4435   return getAtomicCmpSwap(Opcode, dl, MemVT, VTs, Chain, Ptr, Cmp, Swp, MMO,
4436                           SuccessOrdering, FailureOrdering, SynchScope);
4437 }
4438
4439 SDValue SelectionDAG::getAtomicCmpSwap(unsigned Opcode, SDLoc dl, EVT MemVT,
4440                                        SDVTList VTs, SDValue Chain, SDValue Ptr,
4441                                        SDValue Cmp, SDValue Swp,
4442                                        MachineMemOperand *MMO,
4443                                        AtomicOrdering SuccessOrdering,
4444                                        AtomicOrdering FailureOrdering,
4445                                        SynchronizationScope SynchScope) {
4446   assert(Opcode == ISD::ATOMIC_CMP_SWAP ||
4447          Opcode == ISD::ATOMIC_CMP_SWAP_WITH_SUCCESS);
4448   assert(Cmp.getValueType() == Swp.getValueType() && "Invalid Atomic Op Types");
4449
4450   SDValue Ops[] = {Chain, Ptr, Cmp, Swp};
4451   return getAtomic(Opcode, dl, MemVT, VTs, Ops, MMO,
4452                    SuccessOrdering, FailureOrdering, SynchScope);
4453 }
4454
4455 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4456                                 SDValue Chain,
4457                                 SDValue Ptr, SDValue Val,
4458                                 const Value* PtrVal,
4459                                 unsigned Alignment,
4460                                 AtomicOrdering Ordering,
4461                                 SynchronizationScope SynchScope) {
4462   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
4463     Alignment = getEVTAlignment(MemVT);
4464
4465   MachineFunction &MF = getMachineFunction();
4466   // An atomic store does not load. An atomic load does not store.
4467   // (An atomicrmw obviously both loads and stores.)
4468   // For now, atomics are considered to be volatile always, and they are
4469   // chained as such.
4470   // FIXME: Volatile isn't really correct; we should keep track of atomic
4471   // orderings in the memoperand.
4472   unsigned Flags = MachineMemOperand::MOVolatile;
4473   if (Opcode != ISD::ATOMIC_STORE)
4474     Flags |= MachineMemOperand::MOLoad;
4475   if (Opcode != ISD::ATOMIC_LOAD)
4476     Flags |= MachineMemOperand::MOStore;
4477
4478   MachineMemOperand *MMO =
4479     MF.getMachineMemOperand(MachinePointerInfo(PtrVal), Flags,
4480                             MemVT.getStoreSize(), Alignment);
4481
4482   return getAtomic(Opcode, dl, MemVT, Chain, Ptr, Val, MMO,
4483                    Ordering, SynchScope);
4484 }
4485
4486 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4487                                 SDValue Chain,
4488                                 SDValue Ptr, SDValue Val,
4489                                 MachineMemOperand *MMO,
4490                                 AtomicOrdering Ordering,
4491                                 SynchronizationScope SynchScope) {
4492   assert((Opcode == ISD::ATOMIC_LOAD_ADD ||
4493           Opcode == ISD::ATOMIC_LOAD_SUB ||
4494           Opcode == ISD::ATOMIC_LOAD_AND ||
4495           Opcode == ISD::ATOMIC_LOAD_OR ||
4496           Opcode == ISD::ATOMIC_LOAD_XOR ||
4497           Opcode == ISD::ATOMIC_LOAD_NAND ||
4498           Opcode == ISD::ATOMIC_LOAD_MIN ||
4499           Opcode == ISD::ATOMIC_LOAD_MAX ||
4500           Opcode == ISD::ATOMIC_LOAD_UMIN ||
4501           Opcode == ISD::ATOMIC_LOAD_UMAX ||
4502           Opcode == ISD::ATOMIC_SWAP ||
4503           Opcode == ISD::ATOMIC_STORE) &&
4504          "Invalid Atomic Op");
4505
4506   EVT VT = Val.getValueType();
4507
4508   SDVTList VTs = Opcode == ISD::ATOMIC_STORE ? getVTList(MVT::Other) :
4509                                                getVTList(VT, MVT::Other);
4510   SDValue Ops[] = {Chain, Ptr, Val};
4511   return getAtomic(Opcode, dl, MemVT, VTs, Ops, MMO, Ordering, SynchScope);
4512 }
4513
4514 SDValue SelectionDAG::getAtomic(unsigned Opcode, SDLoc dl, EVT MemVT,
4515                                 EVT VT, SDValue Chain,
4516                                 SDValue Ptr,
4517                                 MachineMemOperand *MMO,
4518                                 AtomicOrdering Ordering,
4519                                 SynchronizationScope SynchScope) {
4520   assert(Opcode == ISD::ATOMIC_LOAD && "Invalid Atomic Op");
4521
4522   SDVTList VTs = getVTList(VT, MVT::Other);
4523   SDValue Ops[] = {Chain, Ptr};
4524   return getAtomic(Opcode, dl, MemVT, VTs, Ops, MMO, Ordering, SynchScope);
4525 }
4526
4527 /// getMergeValues - Create a MERGE_VALUES node from the given operands.
4528 SDValue SelectionDAG::getMergeValues(ArrayRef<SDValue> Ops, SDLoc dl) {
4529   if (Ops.size() == 1)
4530     return Ops[0];
4531
4532   SmallVector<EVT, 4> VTs;
4533   VTs.reserve(Ops.size());
4534   for (unsigned i = 0; i < Ops.size(); ++i)
4535     VTs.push_back(Ops[i].getValueType());
4536   return getNode(ISD::MERGE_VALUES, dl, getVTList(VTs), Ops);
4537 }
4538
4539 SDValue
4540 SelectionDAG::getMemIntrinsicNode(unsigned Opcode, SDLoc dl, SDVTList VTList,
4541                                   ArrayRef<SDValue> Ops,
4542                                   EVT MemVT, MachinePointerInfo PtrInfo,
4543                                   unsigned Align, bool Vol,
4544                                   bool ReadMem, bool WriteMem) {
4545   if (Align == 0)  // Ensure that codegen never sees alignment 0
4546     Align = getEVTAlignment(MemVT);
4547
4548   MachineFunction &MF = getMachineFunction();
4549   unsigned Flags = 0;
4550   if (WriteMem)
4551     Flags |= MachineMemOperand::MOStore;
4552   if (ReadMem)
4553     Flags |= MachineMemOperand::MOLoad;
4554   if (Vol)
4555     Flags |= MachineMemOperand::MOVolatile;
4556   MachineMemOperand *MMO =
4557     MF.getMachineMemOperand(PtrInfo, Flags, MemVT.getStoreSize(), Align);
4558
4559   return getMemIntrinsicNode(Opcode, dl, VTList, Ops, MemVT, MMO);
4560 }
4561
4562 SDValue
4563 SelectionDAG::getMemIntrinsicNode(unsigned Opcode, SDLoc dl, SDVTList VTList,
4564                                   ArrayRef<SDValue> Ops, EVT MemVT,
4565                                   MachineMemOperand *MMO) {
4566   assert((Opcode == ISD::INTRINSIC_VOID ||
4567           Opcode == ISD::INTRINSIC_W_CHAIN ||
4568           Opcode == ISD::PREFETCH ||
4569           Opcode == ISD::LIFETIME_START ||
4570           Opcode == ISD::LIFETIME_END ||
4571           (Opcode <= INT_MAX &&
4572            (int)Opcode >= ISD::FIRST_TARGET_MEMORY_OPCODE)) &&
4573          "Opcode is not a memory-accessing opcode!");
4574
4575   // Memoize the node unless it returns a flag.
4576   MemIntrinsicSDNode *N;
4577   if (VTList.VTs[VTList.NumVTs-1] != MVT::Glue) {
4578     FoldingSetNodeID ID;
4579     AddNodeIDNode(ID, Opcode, VTList, Ops);
4580     ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
4581     void *IP = nullptr;
4582     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
4583       cast<MemIntrinsicSDNode>(E)->refineAlignment(MMO);
4584       return SDValue(E, 0);
4585     }
4586
4587     N = new (NodeAllocator) MemIntrinsicSDNode(Opcode, dl.getIROrder(),
4588                                                dl.getDebugLoc(), VTList, Ops,
4589                                                MemVT, MMO);
4590     CSEMap.InsertNode(N, IP);
4591   } else {
4592     N = new (NodeAllocator) MemIntrinsicSDNode(Opcode, dl.getIROrder(),
4593                                                dl.getDebugLoc(), VTList, Ops,
4594                                                MemVT, MMO);
4595   }
4596   AllNodes.push_back(N);
4597   return SDValue(N, 0);
4598 }
4599
4600 /// InferPointerInfo - If the specified ptr/offset is a frame index, infer a
4601 /// MachinePointerInfo record from it.  This is particularly useful because the
4602 /// code generator has many cases where it doesn't bother passing in a
4603 /// MachinePointerInfo to getLoad or getStore when it has "FI+Cst".
4604 static MachinePointerInfo InferPointerInfo(SDValue Ptr, int64_t Offset = 0) {
4605   // If this is FI+Offset, we can model it.
4606   if (const FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Ptr))
4607     return MachinePointerInfo::getFixedStack(FI->getIndex(), Offset);
4608
4609   // If this is (FI+Offset1)+Offset2, we can model it.
4610   if (Ptr.getOpcode() != ISD::ADD ||
4611       !isa<ConstantSDNode>(Ptr.getOperand(1)) ||
4612       !isa<FrameIndexSDNode>(Ptr.getOperand(0)))
4613     return MachinePointerInfo();
4614
4615   int FI = cast<FrameIndexSDNode>(Ptr.getOperand(0))->getIndex();
4616   return MachinePointerInfo::getFixedStack(FI, Offset+
4617                        cast<ConstantSDNode>(Ptr.getOperand(1))->getSExtValue());
4618 }
4619
4620 /// InferPointerInfo - If the specified ptr/offset is a frame index, infer a
4621 /// MachinePointerInfo record from it.  This is particularly useful because the
4622 /// code generator has many cases where it doesn't bother passing in a
4623 /// MachinePointerInfo to getLoad or getStore when it has "FI+Cst".
4624 static MachinePointerInfo InferPointerInfo(SDValue Ptr, SDValue OffsetOp) {
4625   // If the 'Offset' value isn't a constant, we can't handle this.
4626   if (ConstantSDNode *OffsetNode = dyn_cast<ConstantSDNode>(OffsetOp))
4627     return InferPointerInfo(Ptr, OffsetNode->getSExtValue());
4628   if (OffsetOp.getOpcode() == ISD::UNDEF)
4629     return InferPointerInfo(Ptr);
4630   return MachinePointerInfo();
4631 }
4632
4633
4634 SDValue
4635 SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType,
4636                       EVT VT, SDLoc dl, SDValue Chain,
4637                       SDValue Ptr, SDValue Offset,
4638                       MachinePointerInfo PtrInfo, EVT MemVT,
4639                       bool isVolatile, bool isNonTemporal, bool isInvariant,
4640                       unsigned Alignment, const MDNode *TBAAInfo,
4641                       const MDNode *Ranges) {
4642   assert(Chain.getValueType() == MVT::Other &&
4643         "Invalid chain type");
4644   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
4645     Alignment = getEVTAlignment(VT);
4646
4647   unsigned Flags = MachineMemOperand::MOLoad;
4648   if (isVolatile)
4649     Flags |= MachineMemOperand::MOVolatile;
4650   if (isNonTemporal)
4651     Flags |= MachineMemOperand::MONonTemporal;
4652   if (isInvariant)
4653     Flags |= MachineMemOperand::MOInvariant;
4654
4655   // If we don't have a PtrInfo, infer the trivial frame index case to simplify
4656   // clients.
4657   if (PtrInfo.V.isNull())
4658     PtrInfo = InferPointerInfo(Ptr, Offset);
4659
4660   MachineFunction &MF = getMachineFunction();
4661   MachineMemOperand *MMO =
4662     MF.getMachineMemOperand(PtrInfo, Flags, MemVT.getStoreSize(), Alignment,
4663                             TBAAInfo, Ranges);
4664   return getLoad(AM, ExtType, VT, dl, Chain, Ptr, Offset, MemVT, MMO);
4665 }
4666
4667 SDValue
4668 SelectionDAG::getLoad(ISD::MemIndexedMode AM, ISD::LoadExtType ExtType,
4669                       EVT VT, SDLoc dl, SDValue Chain,
4670                       SDValue Ptr, SDValue Offset, EVT MemVT,
4671                       MachineMemOperand *MMO) {
4672   if (VT == MemVT) {
4673     ExtType = ISD::NON_EXTLOAD;
4674   } else if (ExtType == ISD::NON_EXTLOAD) {
4675     assert(VT == MemVT && "Non-extending load from different memory type!");
4676   } else {
4677     // Extending load.
4678     assert(MemVT.getScalarType().bitsLT(VT.getScalarType()) &&
4679            "Should only be an extending load, not truncating!");
4680     assert(VT.isInteger() == MemVT.isInteger() &&
4681            "Cannot convert from FP to Int or Int -> FP!");
4682     assert(VT.isVector() == MemVT.isVector() &&
4683            "Cannot use trunc store to convert to or from a vector!");
4684     assert((!VT.isVector() ||
4685             VT.getVectorNumElements() == MemVT.getVectorNumElements()) &&
4686            "Cannot use trunc store to change the number of vector elements!");
4687   }
4688
4689   bool Indexed = AM != ISD::UNINDEXED;
4690   assert((Indexed || Offset.getOpcode() == ISD::UNDEF) &&
4691          "Unindexed load with an offset!");
4692
4693   SDVTList VTs = Indexed ?
4694     getVTList(VT, Ptr.getValueType(), MVT::Other) : getVTList(VT, MVT::Other);
4695   SDValue Ops[] = { Chain, Ptr, Offset };
4696   FoldingSetNodeID ID;
4697   AddNodeIDNode(ID, ISD::LOAD, VTs, Ops);
4698   ID.AddInteger(MemVT.getRawBits());
4699   ID.AddInteger(encodeMemSDNodeFlags(ExtType, AM, MMO->isVolatile(),
4700                                      MMO->isNonTemporal(),
4701                                      MMO->isInvariant()));
4702   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
4703   void *IP = nullptr;
4704   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
4705     cast<LoadSDNode>(E)->refineAlignment(MMO);
4706     return SDValue(E, 0);
4707   }
4708   SDNode *N = new (NodeAllocator) LoadSDNode(Ops, dl.getIROrder(),
4709                                              dl.getDebugLoc(), VTs, AM, ExtType,
4710                                              MemVT, MMO);
4711   CSEMap.InsertNode(N, IP);
4712   AllNodes.push_back(N);
4713   return SDValue(N, 0);
4714 }
4715
4716 SDValue SelectionDAG::getLoad(EVT VT, SDLoc dl,
4717                               SDValue Chain, SDValue Ptr,
4718                               MachinePointerInfo PtrInfo,
4719                               bool isVolatile, bool isNonTemporal,
4720                               bool isInvariant, unsigned Alignment,
4721                               const MDNode *TBAAInfo,
4722                               const MDNode *Ranges) {
4723   SDValue Undef = getUNDEF(Ptr.getValueType());
4724   return getLoad(ISD::UNINDEXED, ISD::NON_EXTLOAD, VT, dl, Chain, Ptr, Undef,
4725                  PtrInfo, VT, isVolatile, isNonTemporal, isInvariant, Alignment,
4726                  TBAAInfo, Ranges);
4727 }
4728
4729 SDValue SelectionDAG::getLoad(EVT VT, SDLoc dl,
4730                               SDValue Chain, SDValue Ptr,
4731                               MachineMemOperand *MMO) {
4732   SDValue Undef = getUNDEF(Ptr.getValueType());
4733   return getLoad(ISD::UNINDEXED, ISD::NON_EXTLOAD, VT, dl, Chain, Ptr, Undef,
4734                  VT, MMO);
4735 }
4736
4737 SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, SDLoc dl, EVT VT,
4738                                  SDValue Chain, SDValue Ptr,
4739                                  MachinePointerInfo PtrInfo, EVT MemVT,
4740                                  bool isVolatile, bool isNonTemporal,
4741                                  unsigned Alignment, const MDNode *TBAAInfo) {
4742   SDValue Undef = getUNDEF(Ptr.getValueType());
4743   return getLoad(ISD::UNINDEXED, ExtType, VT, dl, Chain, Ptr, Undef,
4744                  PtrInfo, MemVT, isVolatile, isNonTemporal, false, Alignment,
4745                  TBAAInfo);
4746 }
4747
4748
4749 SDValue SelectionDAG::getExtLoad(ISD::LoadExtType ExtType, SDLoc dl, EVT VT,
4750                                  SDValue Chain, SDValue Ptr, EVT MemVT,
4751                                  MachineMemOperand *MMO) {
4752   SDValue Undef = getUNDEF(Ptr.getValueType());
4753   return getLoad(ISD::UNINDEXED, ExtType, VT, dl, Chain, Ptr, Undef,
4754                  MemVT, MMO);
4755 }
4756
4757 SDValue
4758 SelectionDAG::getIndexedLoad(SDValue OrigLoad, SDLoc dl, SDValue Base,
4759                              SDValue Offset, ISD::MemIndexedMode AM) {
4760   LoadSDNode *LD = cast<LoadSDNode>(OrigLoad);
4761   assert(LD->getOffset().getOpcode() == ISD::UNDEF &&
4762          "Load is already a indexed load!");
4763   return getLoad(AM, LD->getExtensionType(), OrigLoad.getValueType(), dl,
4764                  LD->getChain(), Base, Offset, LD->getPointerInfo(),
4765                  LD->getMemoryVT(), LD->isVolatile(), LD->isNonTemporal(),
4766                  false, LD->getAlignment());
4767 }
4768
4769 SDValue SelectionDAG::getStore(SDValue Chain, SDLoc dl, SDValue Val,
4770                                SDValue Ptr, MachinePointerInfo PtrInfo,
4771                                bool isVolatile, bool isNonTemporal,
4772                                unsigned Alignment, const MDNode *TBAAInfo) {
4773   assert(Chain.getValueType() == MVT::Other &&
4774         "Invalid chain type");
4775   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
4776     Alignment = getEVTAlignment(Val.getValueType());
4777
4778   unsigned Flags = MachineMemOperand::MOStore;
4779   if (isVolatile)
4780     Flags |= MachineMemOperand::MOVolatile;
4781   if (isNonTemporal)
4782     Flags |= MachineMemOperand::MONonTemporal;
4783
4784   if (PtrInfo.V.isNull())
4785     PtrInfo = InferPointerInfo(Ptr);
4786
4787   MachineFunction &MF = getMachineFunction();
4788   MachineMemOperand *MMO =
4789     MF.getMachineMemOperand(PtrInfo, Flags,
4790                             Val.getValueType().getStoreSize(), Alignment,
4791                             TBAAInfo);
4792
4793   return getStore(Chain, dl, Val, Ptr, MMO);
4794 }
4795
4796 SDValue SelectionDAG::getStore(SDValue Chain, SDLoc dl, SDValue Val,
4797                                SDValue Ptr, MachineMemOperand *MMO) {
4798   assert(Chain.getValueType() == MVT::Other &&
4799         "Invalid chain type");
4800   EVT VT = Val.getValueType();
4801   SDVTList VTs = getVTList(MVT::Other);
4802   SDValue Undef = getUNDEF(Ptr.getValueType());
4803   SDValue Ops[] = { Chain, Val, Ptr, Undef };
4804   FoldingSetNodeID ID;
4805   AddNodeIDNode(ID, ISD::STORE, VTs, Ops);
4806   ID.AddInteger(VT.getRawBits());
4807   ID.AddInteger(encodeMemSDNodeFlags(false, ISD::UNINDEXED, MMO->isVolatile(),
4808                                      MMO->isNonTemporal(), MMO->isInvariant()));
4809   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
4810   void *IP = nullptr;
4811   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
4812     cast<StoreSDNode>(E)->refineAlignment(MMO);
4813     return SDValue(E, 0);
4814   }
4815   SDNode *N = new (NodeAllocator) StoreSDNode(Ops, dl.getIROrder(),
4816                                               dl.getDebugLoc(), VTs,
4817                                               ISD::UNINDEXED, false, VT, MMO);
4818   CSEMap.InsertNode(N, IP);
4819   AllNodes.push_back(N);
4820   return SDValue(N, 0);
4821 }
4822
4823 SDValue SelectionDAG::getTruncStore(SDValue Chain, SDLoc dl, SDValue Val,
4824                                     SDValue Ptr, MachinePointerInfo PtrInfo,
4825                                     EVT SVT,bool isVolatile, bool isNonTemporal,
4826                                     unsigned Alignment,
4827                                     const MDNode *TBAAInfo) {
4828   assert(Chain.getValueType() == MVT::Other &&
4829         "Invalid chain type");
4830   if (Alignment == 0)  // Ensure that codegen never sees alignment 0
4831     Alignment = getEVTAlignment(SVT);
4832
4833   unsigned Flags = MachineMemOperand::MOStore;
4834   if (isVolatile)
4835     Flags |= MachineMemOperand::MOVolatile;
4836   if (isNonTemporal)
4837     Flags |= MachineMemOperand::MONonTemporal;
4838
4839   if (PtrInfo.V.isNull())
4840     PtrInfo = InferPointerInfo(Ptr);
4841
4842   MachineFunction &MF = getMachineFunction();
4843   MachineMemOperand *MMO =
4844     MF.getMachineMemOperand(PtrInfo, Flags, SVT.getStoreSize(), Alignment,
4845                             TBAAInfo);
4846
4847   return getTruncStore(Chain, dl, Val, Ptr, SVT, MMO);
4848 }
4849
4850 SDValue SelectionDAG::getTruncStore(SDValue Chain, SDLoc dl, SDValue Val,
4851                                     SDValue Ptr, EVT SVT,
4852                                     MachineMemOperand *MMO) {
4853   EVT VT = Val.getValueType();
4854
4855   assert(Chain.getValueType() == MVT::Other &&
4856         "Invalid chain type");
4857   if (VT == SVT)
4858     return getStore(Chain, dl, Val, Ptr, MMO);
4859
4860   assert(SVT.getScalarType().bitsLT(VT.getScalarType()) &&
4861          "Should only be a truncating store, not extending!");
4862   assert(VT.isInteger() == SVT.isInteger() &&
4863          "Can't do FP-INT conversion!");
4864   assert(VT.isVector() == SVT.isVector() &&
4865          "Cannot use trunc store to convert to or from a vector!");
4866   assert((!VT.isVector() ||
4867           VT.getVectorNumElements() == SVT.getVectorNumElements()) &&
4868          "Cannot use trunc store to change the number of vector elements!");
4869
4870   SDVTList VTs = getVTList(MVT::Other);
4871   SDValue Undef = getUNDEF(Ptr.getValueType());
4872   SDValue Ops[] = { Chain, Val, Ptr, Undef };
4873   FoldingSetNodeID ID;
4874   AddNodeIDNode(ID, ISD::STORE, VTs, Ops);
4875   ID.AddInteger(SVT.getRawBits());
4876   ID.AddInteger(encodeMemSDNodeFlags(true, ISD::UNINDEXED, MMO->isVolatile(),
4877                                      MMO->isNonTemporal(), MMO->isInvariant()));
4878   ID.AddInteger(MMO->getPointerInfo().getAddrSpace());
4879   void *IP = nullptr;
4880   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
4881     cast<StoreSDNode>(E)->refineAlignment(MMO);
4882     return SDValue(E, 0);
4883   }
4884   SDNode *N = new (NodeAllocator) StoreSDNode(Ops, dl.getIROrder(),
4885                                               dl.getDebugLoc(), VTs,
4886                                               ISD::UNINDEXED, true, SVT, MMO);
4887   CSEMap.InsertNode(N, IP);
4888   AllNodes.push_back(N);
4889   return SDValue(N, 0);
4890 }
4891
4892 SDValue
4893 SelectionDAG::getIndexedStore(SDValue OrigStore, SDLoc dl, SDValue Base,
4894                               SDValue Offset, ISD::MemIndexedMode AM) {
4895   StoreSDNode *ST = cast<StoreSDNode>(OrigStore);
4896   assert(ST->getOffset().getOpcode() == ISD::UNDEF &&
4897          "Store is already a indexed store!");
4898   SDVTList VTs = getVTList(Base.getValueType(), MVT::Other);
4899   SDValue Ops[] = { ST->getChain(), ST->getValue(), Base, Offset };
4900   FoldingSetNodeID ID;
4901   AddNodeIDNode(ID, ISD::STORE, VTs, Ops);
4902   ID.AddInteger(ST->getMemoryVT().getRawBits());
4903   ID.AddInteger(ST->getRawSubclassData());
4904   ID.AddInteger(ST->getPointerInfo().getAddrSpace());
4905   void *IP = nullptr;
4906   if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
4907     return SDValue(E, 0);
4908
4909   SDNode *N = new (NodeAllocator) StoreSDNode(Ops, dl.getIROrder(),
4910                                               dl.getDebugLoc(), VTs, AM,
4911                                               ST->isTruncatingStore(),
4912                                               ST->getMemoryVT(),
4913                                               ST->getMemOperand());
4914   CSEMap.InsertNode(N, IP);
4915   AllNodes.push_back(N);
4916   return SDValue(N, 0);
4917 }
4918
4919 SDValue SelectionDAG::getVAArg(EVT VT, SDLoc dl,
4920                                SDValue Chain, SDValue Ptr,
4921                                SDValue SV,
4922                                unsigned Align) {
4923   SDValue Ops[] = { Chain, Ptr, SV, getTargetConstant(Align, MVT::i32) };
4924   return getNode(ISD::VAARG, dl, getVTList(VT, MVT::Other), Ops);
4925 }
4926
4927 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
4928                               ArrayRef<SDUse> Ops) {
4929   switch (Ops.size()) {
4930   case 0: return getNode(Opcode, DL, VT);
4931   case 1: return getNode(Opcode, DL, VT, static_cast<const SDValue>(Ops[0]));
4932   case 2: return getNode(Opcode, DL, VT, Ops[0], Ops[1]);
4933   case 3: return getNode(Opcode, DL, VT, Ops[0], Ops[1], Ops[2]);
4934   default: break;
4935   }
4936
4937   // Copy from an SDUse array into an SDValue array for use with
4938   // the regular getNode logic.
4939   SmallVector<SDValue, 8> NewOps(Ops.begin(), Ops.end());
4940   return getNode(Opcode, DL, VT, NewOps);
4941 }
4942
4943 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, EVT VT,
4944                               ArrayRef<SDValue> Ops) {
4945   unsigned NumOps = Ops.size();
4946   switch (NumOps) {
4947   case 0: return getNode(Opcode, DL, VT);
4948   case 1: return getNode(Opcode, DL, VT, Ops[0]);
4949   case 2: return getNode(Opcode, DL, VT, Ops[0], Ops[1]);
4950   case 3: return getNode(Opcode, DL, VT, Ops[0], Ops[1], Ops[2]);
4951   default: break;
4952   }
4953
4954   switch (Opcode) {
4955   default: break;
4956   case ISD::SELECT_CC: {
4957     assert(NumOps == 5 && "SELECT_CC takes 5 operands!");
4958     assert(Ops[0].getValueType() == Ops[1].getValueType() &&
4959            "LHS and RHS of condition must have same type!");
4960     assert(Ops[2].getValueType() == Ops[3].getValueType() &&
4961            "True and False arms of SelectCC must have same type!");
4962     assert(Ops[2].getValueType() == VT &&
4963            "select_cc node must be of same type as true and false value!");
4964     break;
4965   }
4966   case ISD::BR_CC: {
4967     assert(NumOps == 5 && "BR_CC takes 5 operands!");
4968     assert(Ops[2].getValueType() == Ops[3].getValueType() &&
4969            "LHS/RHS of comparison should match types!");
4970     break;
4971   }
4972   }
4973
4974   // Memoize nodes.
4975   SDNode *N;
4976   SDVTList VTs = getVTList(VT);
4977
4978   if (VT != MVT::Glue) {
4979     FoldingSetNodeID ID;
4980     AddNodeIDNode(ID, Opcode, VTs, Ops);
4981     void *IP = nullptr;
4982
4983     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
4984       return SDValue(E, 0);
4985
4986     N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
4987                                    VTs, Ops);
4988     CSEMap.InsertNode(N, IP);
4989   } else {
4990     N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
4991                                    VTs, Ops);
4992   }
4993
4994   AllNodes.push_back(N);
4995 #ifndef NDEBUG
4996   VerifySDNode(N);
4997 #endif
4998   return SDValue(N, 0);
4999 }
5000
5001 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL,
5002                               ArrayRef<EVT> ResultTys, ArrayRef<SDValue> Ops) {
5003   return getNode(Opcode, DL, getVTList(ResultTys), Ops);
5004 }
5005
5006 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5007                               ArrayRef<SDValue> Ops) {
5008   if (VTList.NumVTs == 1)
5009     return getNode(Opcode, DL, VTList.VTs[0], Ops);
5010
5011 #if 0
5012   switch (Opcode) {
5013   // FIXME: figure out how to safely handle things like
5014   // int foo(int x) { return 1 << (x & 255); }
5015   // int bar() { return foo(256); }
5016   case ISD::SRA_PARTS:
5017   case ISD::SRL_PARTS:
5018   case ISD::SHL_PARTS:
5019     if (N3.getOpcode() == ISD::SIGN_EXTEND_INREG &&
5020         cast<VTSDNode>(N3.getOperand(1))->getVT() != MVT::i1)
5021       return getNode(Opcode, DL, VT, N1, N2, N3.getOperand(0));
5022     else if (N3.getOpcode() == ISD::AND)
5023       if (ConstantSDNode *AndRHS = dyn_cast<ConstantSDNode>(N3.getOperand(1))) {
5024         // If the and is only masking out bits that cannot effect the shift,
5025         // eliminate the and.
5026         unsigned NumBits = VT.getScalarType().getSizeInBits()*2;
5027         if ((AndRHS->getValue() & (NumBits-1)) == NumBits-1)
5028           return getNode(Opcode, DL, VT, N1, N2, N3.getOperand(0));
5029       }
5030     break;
5031   }
5032 #endif
5033
5034   // Memoize the node unless it returns a flag.
5035   SDNode *N;
5036   unsigned NumOps = Ops.size();
5037   if (VTList.VTs[VTList.NumVTs-1] != MVT::Glue) {
5038     FoldingSetNodeID ID;
5039     AddNodeIDNode(ID, Opcode, VTList, Ops);
5040     void *IP = nullptr;
5041     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
5042       return SDValue(E, 0);
5043
5044     if (NumOps == 1) {
5045       N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
5046                                           DL.getDebugLoc(), VTList, Ops[0]);
5047     } else if (NumOps == 2) {
5048       N = new (NodeAllocator) BinarySDNode(Opcode, DL.getIROrder(),
5049                                            DL.getDebugLoc(), VTList, Ops[0],
5050                                            Ops[1]);
5051     } else if (NumOps == 3) {
5052       N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
5053                                             DL.getDebugLoc(), VTList, Ops[0],
5054                                             Ops[1], Ops[2]);
5055     } else {
5056       N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
5057                                      VTList, Ops);
5058     }
5059     CSEMap.InsertNode(N, IP);
5060   } else {
5061     if (NumOps == 1) {
5062       N = new (NodeAllocator) UnarySDNode(Opcode, DL.getIROrder(),
5063                                           DL.getDebugLoc(), VTList, Ops[0]);
5064     } else if (NumOps == 2) {
5065       N = new (NodeAllocator) BinarySDNode(Opcode, DL.getIROrder(),
5066                                            DL.getDebugLoc(), VTList, Ops[0],
5067                                            Ops[1]);
5068     } else if (NumOps == 3) {
5069       N = new (NodeAllocator) TernarySDNode(Opcode, DL.getIROrder(),
5070                                             DL.getDebugLoc(), VTList, Ops[0],
5071                                             Ops[1], Ops[2]);
5072     } else {
5073       N = new (NodeAllocator) SDNode(Opcode, DL.getIROrder(), DL.getDebugLoc(),
5074                                      VTList, Ops);
5075     }
5076   }
5077   AllNodes.push_back(N);
5078 #ifndef NDEBUG
5079   VerifySDNode(N);
5080 #endif
5081   return SDValue(N, 0);
5082 }
5083
5084 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList) {
5085   return getNode(Opcode, DL, VTList, ArrayRef<SDValue>());
5086 }
5087
5088 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5089                               SDValue N1) {
5090   SDValue Ops[] = { N1 };
5091   return getNode(Opcode, DL, VTList, Ops);
5092 }
5093
5094 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5095                               SDValue N1, SDValue N2) {
5096   SDValue Ops[] = { N1, N2 };
5097   return getNode(Opcode, DL, VTList, Ops);
5098 }
5099
5100 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5101                               SDValue N1, SDValue N2, SDValue N3) {
5102   SDValue Ops[] = { N1, N2, N3 };
5103   return getNode(Opcode, DL, VTList, Ops);
5104 }
5105
5106 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5107                               SDValue N1, SDValue N2, SDValue N3,
5108                               SDValue N4) {
5109   SDValue Ops[] = { N1, N2, N3, N4 };
5110   return getNode(Opcode, DL, VTList, Ops);
5111 }
5112
5113 SDValue SelectionDAG::getNode(unsigned Opcode, SDLoc DL, SDVTList VTList,
5114                               SDValue N1, SDValue N2, SDValue N3,
5115                               SDValue N4, SDValue N5) {
5116   SDValue Ops[] = { N1, N2, N3, N4, N5 };
5117   return getNode(Opcode, DL, VTList, Ops);
5118 }
5119
5120 SDVTList SelectionDAG::getVTList(EVT VT) {
5121   return makeVTList(SDNode::getValueTypeList(VT), 1);
5122 }
5123
5124 SDVTList SelectionDAG::getVTList(EVT VT1, EVT VT2) {
5125   FoldingSetNodeID ID;
5126   ID.AddInteger(2U);
5127   ID.AddInteger(VT1.getRawBits());
5128   ID.AddInteger(VT2.getRawBits());
5129
5130   void *IP = nullptr;
5131   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5132   if (!Result) {
5133     EVT *Array = Allocator.Allocate<EVT>(2);
5134     Array[0] = VT1;
5135     Array[1] = VT2;
5136     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, 2);
5137     VTListMap.InsertNode(Result, IP);
5138   }
5139   return Result->getSDVTList();
5140 }
5141
5142 SDVTList SelectionDAG::getVTList(EVT VT1, EVT VT2, EVT VT3) {
5143   FoldingSetNodeID ID;
5144   ID.AddInteger(3U);
5145   ID.AddInteger(VT1.getRawBits());
5146   ID.AddInteger(VT2.getRawBits());
5147   ID.AddInteger(VT3.getRawBits());
5148
5149   void *IP = nullptr;
5150   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5151   if (!Result) {
5152     EVT *Array = Allocator.Allocate<EVT>(3);
5153     Array[0] = VT1;
5154     Array[1] = VT2;
5155     Array[2] = VT3;
5156     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, 3);
5157     VTListMap.InsertNode(Result, IP);
5158   }
5159   return Result->getSDVTList();
5160 }
5161
5162 SDVTList SelectionDAG::getVTList(EVT VT1, EVT VT2, EVT VT3, EVT VT4) {
5163   FoldingSetNodeID ID;
5164   ID.AddInteger(4U);
5165   ID.AddInteger(VT1.getRawBits());
5166   ID.AddInteger(VT2.getRawBits());
5167   ID.AddInteger(VT3.getRawBits());
5168   ID.AddInteger(VT4.getRawBits());
5169
5170   void *IP = nullptr;
5171   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5172   if (!Result) {
5173     EVT *Array = Allocator.Allocate<EVT>(4);
5174     Array[0] = VT1;
5175     Array[1] = VT2;
5176     Array[2] = VT3;
5177     Array[3] = VT4;
5178     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, 4);
5179     VTListMap.InsertNode(Result, IP);
5180   }
5181   return Result->getSDVTList();
5182 }
5183
5184 SDVTList SelectionDAG::getVTList(ArrayRef<EVT> VTs) {
5185   unsigned NumVTs = VTs.size();
5186   FoldingSetNodeID ID;
5187   ID.AddInteger(NumVTs);
5188   for (unsigned index = 0; index < NumVTs; index++) {
5189     ID.AddInteger(VTs[index].getRawBits());
5190   }
5191
5192   void *IP = nullptr;
5193   SDVTListNode *Result = VTListMap.FindNodeOrInsertPos(ID, IP);
5194   if (!Result) {
5195     EVT *Array = Allocator.Allocate<EVT>(NumVTs);
5196     std::copy(VTs.begin(), VTs.end(), Array);
5197     Result = new (Allocator) SDVTListNode(ID.Intern(Allocator), Array, NumVTs);
5198     VTListMap.InsertNode(Result, IP);
5199   }
5200   return Result->getSDVTList();
5201 }
5202
5203
5204 /// UpdateNodeOperands - *Mutate* the specified node in-place to have the
5205 /// specified operands.  If the resultant node already exists in the DAG,
5206 /// this does not modify the specified node, instead it returns the node that
5207 /// already exists.  If the resultant node does not exist in the DAG, the
5208 /// input node is returned.  As a degenerate case, if you specify the same
5209 /// input operands as the node already has, the input node is returned.
5210 SDNode *SelectionDAG::UpdateNodeOperands(SDNode *N, SDValue Op) {
5211   assert(N->getNumOperands() == 1 && "Update with wrong number of operands");
5212
5213   // Check to see if there is no change.
5214   if (Op == N->getOperand(0)) return N;
5215
5216   // See if the modified node already exists.
5217   void *InsertPos = nullptr;
5218   if (SDNode *Existing = FindModifiedNodeSlot(N, Op, InsertPos))
5219     return Existing;
5220
5221   // Nope it doesn't.  Remove the node from its current place in the maps.
5222   if (InsertPos)
5223     if (!RemoveNodeFromCSEMaps(N))
5224       InsertPos = nullptr;
5225
5226   // Now we update the operands.
5227   N->OperandList[0].set(Op);
5228
5229   // If this gets put into a CSE map, add it.
5230   if (InsertPos) CSEMap.InsertNode(N, InsertPos);
5231   return N;
5232 }
5233
5234 SDNode *SelectionDAG::UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2) {
5235   assert(N->getNumOperands() == 2 && "Update with wrong number of operands");
5236
5237   // Check to see if there is no change.
5238   if (Op1 == N->getOperand(0) && Op2 == N->getOperand(1))
5239     return N;   // No operands changed, just return the input node.
5240
5241   // See if the modified node already exists.
5242   void *InsertPos = nullptr;
5243   if (SDNode *Existing = FindModifiedNodeSlot(N, Op1, Op2, InsertPos))
5244     return Existing;
5245
5246   // Nope it doesn't.  Remove the node from its current place in the maps.
5247   if (InsertPos)
5248     if (!RemoveNodeFromCSEMaps(N))
5249       InsertPos = nullptr;
5250
5251   // Now we update the operands.
5252   if (N->OperandList[0] != Op1)
5253     N->OperandList[0].set(Op1);
5254   if (N->OperandList[1] != Op2)
5255     N->OperandList[1].set(Op2);
5256
5257   // If this gets put into a CSE map, add it.
5258   if (InsertPos) CSEMap.InsertNode(N, InsertPos);
5259   return N;
5260 }
5261
5262 SDNode *SelectionDAG::
5263 UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2, SDValue Op3) {
5264   SDValue Ops[] = { Op1, Op2, Op3 };
5265   return UpdateNodeOperands(N, Ops);
5266 }
5267
5268 SDNode *SelectionDAG::
5269 UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2,
5270                    SDValue Op3, SDValue Op4) {
5271   SDValue Ops[] = { Op1, Op2, Op3, Op4 };
5272   return UpdateNodeOperands(N, Ops);
5273 }
5274
5275 SDNode *SelectionDAG::
5276 UpdateNodeOperands(SDNode *N, SDValue Op1, SDValue Op2,
5277                    SDValue Op3, SDValue Op4, SDValue Op5) {
5278   SDValue Ops[] = { Op1, Op2, Op3, Op4, Op5 };
5279   return UpdateNodeOperands(N, Ops);
5280 }
5281
5282 SDNode *SelectionDAG::
5283 UpdateNodeOperands(SDNode *N, ArrayRef<SDValue> Ops) {
5284   unsigned NumOps = Ops.size();
5285   assert(N->getNumOperands() == NumOps &&
5286          "Update with wrong number of operands");
5287
5288   // Check to see if there is no change.
5289   bool AnyChange = false;
5290   for (unsigned i = 0; i != NumOps; ++i) {
5291     if (Ops[i] != N->getOperand(i)) {
5292       AnyChange = true;
5293       break;
5294     }
5295   }
5296
5297   // No operands changed, just return the input node.
5298   if (!AnyChange) return N;
5299
5300   // See if the modified node already exists.
5301   void *InsertPos = nullptr;
5302   if (SDNode *Existing = FindModifiedNodeSlot(N, Ops, InsertPos))
5303     return Existing;
5304
5305   // Nope it doesn't.  Remove the node from its current place in the maps.
5306   if (InsertPos)
5307     if (!RemoveNodeFromCSEMaps(N))
5308       InsertPos = nullptr;
5309
5310   // Now we update the operands.
5311   for (unsigned i = 0; i != NumOps; ++i)
5312     if (N->OperandList[i] != Ops[i])
5313       N->OperandList[i].set(Ops[i]);
5314
5315   // If this gets put into a CSE map, add it.
5316   if (InsertPos) CSEMap.InsertNode(N, InsertPos);
5317   return N;
5318 }
5319
5320 /// DropOperands - Release the operands and set this node to have
5321 /// zero operands.
5322 void SDNode::DropOperands() {
5323   // Unlike the code in MorphNodeTo that does this, we don't need to
5324   // watch for dead nodes here.
5325   for (op_iterator I = op_begin(), E = op_end(); I != E; ) {
5326     SDUse &Use = *I++;
5327     Use.set(SDValue());
5328   }
5329 }
5330
5331 /// SelectNodeTo - These are wrappers around MorphNodeTo that accept a
5332 /// machine opcode.
5333 ///
5334 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5335                                    EVT VT) {
5336   SDVTList VTs = getVTList(VT);
5337   return SelectNodeTo(N, MachineOpc, VTs, None);
5338 }
5339
5340 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5341                                    EVT VT, SDValue Op1) {
5342   SDVTList VTs = getVTList(VT);
5343   SDValue Ops[] = { Op1 };
5344   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5345 }
5346
5347 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5348                                    EVT VT, SDValue Op1,
5349                                    SDValue Op2) {
5350   SDVTList VTs = getVTList(VT);
5351   SDValue Ops[] = { Op1, Op2 };
5352   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5353 }
5354
5355 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5356                                    EVT VT, SDValue Op1,
5357                                    SDValue Op2, SDValue Op3) {
5358   SDVTList VTs = getVTList(VT);
5359   SDValue Ops[] = { Op1, Op2, Op3 };
5360   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5361 }
5362
5363 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5364                                    EVT VT, ArrayRef<SDValue> Ops) {
5365   SDVTList VTs = getVTList(VT);
5366   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5367 }
5368
5369 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5370                                    EVT VT1, EVT VT2, ArrayRef<SDValue> Ops) {
5371   SDVTList VTs = getVTList(VT1, VT2);
5372   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5373 }
5374
5375 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5376                                    EVT VT1, EVT VT2) {
5377   SDVTList VTs = getVTList(VT1, VT2);
5378   return SelectNodeTo(N, MachineOpc, VTs, None);
5379 }
5380
5381 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5382                                    EVT VT1, EVT VT2, EVT VT3,
5383                                    ArrayRef<SDValue> Ops) {
5384   SDVTList VTs = getVTList(VT1, VT2, VT3);
5385   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5386 }
5387
5388 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5389                                    EVT VT1, EVT VT2, EVT VT3, EVT VT4,
5390                                    ArrayRef<SDValue> Ops) {
5391   SDVTList VTs = getVTList(VT1, VT2, VT3, VT4);
5392   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5393 }
5394
5395 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5396                                    EVT VT1, EVT VT2,
5397                                    SDValue Op1) {
5398   SDVTList VTs = getVTList(VT1, VT2);
5399   SDValue Ops[] = { Op1 };
5400   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5401 }
5402
5403 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5404                                    EVT VT1, EVT VT2,
5405                                    SDValue Op1, SDValue Op2) {
5406   SDVTList VTs = getVTList(VT1, VT2);
5407   SDValue Ops[] = { Op1, Op2 };
5408   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5409 }
5410
5411 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5412                                    EVT VT1, EVT VT2,
5413                                    SDValue Op1, SDValue Op2,
5414                                    SDValue Op3) {
5415   SDVTList VTs = getVTList(VT1, VT2);
5416   SDValue Ops[] = { Op1, Op2, Op3 };
5417   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5418 }
5419
5420 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5421                                    EVT VT1, EVT VT2, EVT VT3,
5422                                    SDValue Op1, SDValue Op2,
5423                                    SDValue Op3) {
5424   SDVTList VTs = getVTList(VT1, VT2, VT3);
5425   SDValue Ops[] = { Op1, Op2, Op3 };
5426   return SelectNodeTo(N, MachineOpc, VTs, Ops);
5427 }
5428
5429 SDNode *SelectionDAG::SelectNodeTo(SDNode *N, unsigned MachineOpc,
5430                                    SDVTList VTs,ArrayRef<SDValue> Ops) {
5431   N = MorphNodeTo(N, ~MachineOpc, VTs, Ops);
5432   // Reset the NodeID to -1.
5433   N->setNodeId(-1);
5434   return N;
5435 }
5436
5437 /// UpdadeSDLocOnMergedSDNode - If the opt level is -O0 then it throws away
5438 /// the line number information on the merged node since it is not possible to
5439 /// preserve the information that operation is associated with multiple lines.
5440 /// This will make the debugger working better at -O0, were there is a higher
5441 /// probability having other instructions associated with that line.
5442 ///
5443 /// For IROrder, we keep the smaller of the two
5444 SDNode *SelectionDAG::UpdadeSDLocOnMergedSDNode(SDNode *N, SDLoc OLoc) {
5445   DebugLoc NLoc = N->getDebugLoc();
5446   if (!(NLoc.isUnknown()) && (OptLevel == CodeGenOpt::None) &&
5447     (OLoc.getDebugLoc() != NLoc)) {
5448     N->setDebugLoc(DebugLoc());
5449   }
5450   unsigned Order = std::min(N->getIROrder(), OLoc.getIROrder());
5451   N->setIROrder(Order);
5452   return N;
5453 }
5454
5455 /// MorphNodeTo - This *mutates* the specified node to have the specified
5456 /// return type, opcode, and operands.
5457 ///
5458 /// Note that MorphNodeTo returns the resultant node.  If there is already a
5459 /// node of the specified opcode and operands, it returns that node instead of
5460 /// the current one.  Note that the SDLoc need not be the same.
5461 ///
5462 /// Using MorphNodeTo is faster than creating a new node and swapping it in
5463 /// with ReplaceAllUsesWith both because it often avoids allocating a new
5464 /// node, and because it doesn't require CSE recalculation for any of
5465 /// the node's users.
5466 ///
5467 SDNode *SelectionDAG::MorphNodeTo(SDNode *N, unsigned Opc,
5468                                   SDVTList VTs, ArrayRef<SDValue> Ops) {
5469   unsigned NumOps = Ops.size();
5470   // If an identical node already exists, use it.
5471   void *IP = nullptr;
5472   if (VTs.VTs[VTs.NumVTs-1] != MVT::Glue) {
5473     FoldingSetNodeID ID;
5474     AddNodeIDNode(ID, Opc, VTs, Ops);
5475     if (SDNode *ON = CSEMap.FindNodeOrInsertPos(ID, IP))
5476       return UpdadeSDLocOnMergedSDNode(ON, SDLoc(N));
5477   }
5478
5479   if (!RemoveNodeFromCSEMaps(N))
5480     IP = nullptr;
5481
5482   // Start the morphing.
5483   N->NodeType = Opc;
5484   N->ValueList = VTs.VTs;
5485   N->NumValues = VTs.NumVTs;
5486
5487   // Clear the operands list, updating used nodes to remove this from their
5488   // use list.  Keep track of any operands that become dead as a result.
5489   SmallPtrSet<SDNode*, 16> DeadNodeSet;
5490   for (SDNode::op_iterator I = N->op_begin(), E = N->op_end(); I != E; ) {
5491     SDUse &Use = *I++;
5492     SDNode *Used = Use.getNode();
5493     Use.set(SDValue());
5494     if (Used->use_empty())
5495       DeadNodeSet.insert(Used);
5496   }
5497
5498   if (MachineSDNode *MN = dyn_cast<MachineSDNode>(N)) {
5499     // Initialize the memory references information.
5500     MN->setMemRefs(nullptr, nullptr);
5501     // If NumOps is larger than the # of operands we can have in a
5502     // MachineSDNode, reallocate the operand list.
5503     if (NumOps > MN->NumOperands || !MN->OperandsNeedDelete) {
5504       if (MN->OperandsNeedDelete)
5505         delete[] MN->OperandList;
5506       if (NumOps > array_lengthof(MN->LocalOperands))
5507         // We're creating a final node that will live unmorphed for the
5508         // remainder of the current SelectionDAG iteration, so we can allocate
5509         // the operands directly out of a pool with no recycling metadata.
5510         MN->InitOperands(OperandAllocator.Allocate<SDUse>(NumOps),
5511                          Ops.data(), NumOps);
5512       else
5513         MN->InitOperands(MN->LocalOperands, Ops.data(), NumOps);
5514       MN->OperandsNeedDelete = false;
5515     } else
5516       MN->InitOperands(MN->OperandList, Ops.data(), NumOps);
5517   } else {
5518     // If NumOps is larger than the # of operands we currently have, reallocate
5519     // the operand list.
5520     if (NumOps > N->NumOperands) {
5521       if (N->OperandsNeedDelete)
5522         delete[] N->OperandList;
5523       N->InitOperands(new SDUse[NumOps], Ops.data(), NumOps);
5524       N->OperandsNeedDelete = true;
5525     } else
5526       N->InitOperands(N->OperandList, Ops.data(), NumOps);
5527   }
5528
5529   // Delete any nodes that are still dead after adding the uses for the
5530   // new operands.
5531   if (!DeadNodeSet.empty()) {
5532     SmallVector<SDNode *, 16> DeadNodes;
5533     for (SmallPtrSet<SDNode *, 16>::iterator I = DeadNodeSet.begin(),
5534          E = DeadNodeSet.end(); I != E; ++I)
5535       if ((*I)->use_empty())
5536         DeadNodes.push_back(*I);
5537     RemoveDeadNodes(DeadNodes);
5538   }
5539
5540   if (IP)
5541     CSEMap.InsertNode(N, IP);   // Memoize the new node.
5542   return N;
5543 }
5544
5545
5546 /// getMachineNode - These are used for target selectors to create a new node
5547 /// with specified return type(s), MachineInstr opcode, and operands.
5548 ///
5549 /// Note that getMachineNode returns the resultant node.  If there is already a
5550 /// node of the specified opcode and operands, it returns that node instead of
5551 /// the current one.
5552 MachineSDNode *
5553 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT) {
5554   SDVTList VTs = getVTList(VT);
5555   return getMachineNode(Opcode, dl, VTs, None);
5556 }
5557
5558 MachineSDNode *
5559 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT, SDValue Op1) {
5560   SDVTList VTs = getVTList(VT);
5561   SDValue Ops[] = { Op1 };
5562   return getMachineNode(Opcode, dl, VTs, Ops);
5563 }
5564
5565 MachineSDNode *
5566 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT,
5567                              SDValue Op1, SDValue Op2) {
5568   SDVTList VTs = getVTList(VT);
5569   SDValue Ops[] = { Op1, Op2 };
5570   return getMachineNode(Opcode, dl, VTs, Ops);
5571 }
5572
5573 MachineSDNode *
5574 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT,
5575                              SDValue Op1, SDValue Op2, SDValue Op3) {
5576   SDVTList VTs = getVTList(VT);
5577   SDValue Ops[] = { Op1, Op2, Op3 };
5578   return getMachineNode(Opcode, dl, VTs, Ops);
5579 }
5580
5581 MachineSDNode *
5582 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT,
5583                              ArrayRef<SDValue> Ops) {
5584   SDVTList VTs = getVTList(VT);
5585   return getMachineNode(Opcode, dl, VTs, Ops);
5586 }
5587
5588 MachineSDNode *
5589 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT1, EVT VT2) {
5590   SDVTList VTs = getVTList(VT1, VT2);
5591   return getMachineNode(Opcode, dl, VTs, None);
5592 }
5593
5594 MachineSDNode *
5595 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5596                              EVT VT1, EVT VT2, SDValue Op1) {
5597   SDVTList VTs = getVTList(VT1, VT2);
5598   SDValue Ops[] = { Op1 };
5599   return getMachineNode(Opcode, dl, VTs, Ops);
5600 }
5601
5602 MachineSDNode *
5603 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5604                              EVT VT1, EVT VT2, SDValue Op1, SDValue Op2) {
5605   SDVTList VTs = getVTList(VT1, VT2);
5606   SDValue Ops[] = { Op1, Op2 };
5607   return getMachineNode(Opcode, dl, VTs, Ops);
5608 }
5609
5610 MachineSDNode *
5611 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5612                              EVT VT1, EVT VT2, SDValue Op1,
5613                              SDValue Op2, SDValue Op3) {
5614   SDVTList VTs = getVTList(VT1, VT2);
5615   SDValue Ops[] = { Op1, Op2, Op3 };
5616   return getMachineNode(Opcode, dl, VTs, Ops);
5617 }
5618
5619 MachineSDNode *
5620 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5621                              EVT VT1, EVT VT2,
5622                              ArrayRef<SDValue> Ops) {
5623   SDVTList VTs = getVTList(VT1, VT2);
5624   return getMachineNode(Opcode, dl, VTs, Ops);
5625 }
5626
5627 MachineSDNode *
5628 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5629                              EVT VT1, EVT VT2, EVT VT3,
5630                              SDValue Op1, SDValue Op2) {
5631   SDVTList VTs = getVTList(VT1, VT2, VT3);
5632   SDValue Ops[] = { Op1, Op2 };
5633   return getMachineNode(Opcode, dl, VTs, Ops);
5634 }
5635
5636 MachineSDNode *
5637 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5638                              EVT VT1, EVT VT2, EVT VT3,
5639                              SDValue Op1, SDValue Op2, SDValue Op3) {
5640   SDVTList VTs = getVTList(VT1, VT2, VT3);
5641   SDValue Ops[] = { Op1, Op2, Op3 };
5642   return getMachineNode(Opcode, dl, VTs, Ops);
5643 }
5644
5645 MachineSDNode *
5646 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5647                              EVT VT1, EVT VT2, EVT VT3,
5648                              ArrayRef<SDValue> Ops) {
5649   SDVTList VTs = getVTList(VT1, VT2, VT3);
5650   return getMachineNode(Opcode, dl, VTs, Ops);
5651 }
5652
5653 MachineSDNode *
5654 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl, EVT VT1,
5655                              EVT VT2, EVT VT3, EVT VT4,
5656                              ArrayRef<SDValue> Ops) {
5657   SDVTList VTs = getVTList(VT1, VT2, VT3, VT4);
5658   return getMachineNode(Opcode, dl, VTs, Ops);
5659 }
5660
5661 MachineSDNode *
5662 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc dl,
5663                              ArrayRef<EVT> ResultTys,
5664                              ArrayRef<SDValue> Ops) {
5665   SDVTList VTs = getVTList(ResultTys);
5666   return getMachineNode(Opcode, dl, VTs, Ops);
5667 }
5668
5669 MachineSDNode *
5670 SelectionDAG::getMachineNode(unsigned Opcode, SDLoc DL, SDVTList VTs,
5671                              ArrayRef<SDValue> OpsArray) {
5672   bool DoCSE = VTs.VTs[VTs.NumVTs-1] != MVT::Glue;
5673   MachineSDNode *N;
5674   void *IP = nullptr;
5675   const SDValue *Ops = OpsArray.data();
5676   unsigned NumOps = OpsArray.size();
5677
5678   if (DoCSE) {
5679     FoldingSetNodeID ID;
5680     AddNodeIDNode(ID, ~Opcode, VTs, OpsArray);
5681     IP = nullptr;
5682     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP)) {
5683       return cast<MachineSDNode>(UpdadeSDLocOnMergedSDNode(E, DL));
5684     }
5685   }
5686
5687   // Allocate a new MachineSDNode.
5688   N = new (NodeAllocator) MachineSDNode(~Opcode, DL.getIROrder(),
5689                                         DL.getDebugLoc(), VTs);
5690
5691   // Initialize the operands list.
5692   if (NumOps > array_lengthof(N->LocalOperands))
5693     // We're creating a final node that will live unmorphed for the
5694     // remainder of the current SelectionDAG iteration, so we can allocate
5695     // the operands directly out of a pool with no recycling metadata.
5696     N->InitOperands(OperandAllocator.Allocate<SDUse>(NumOps),
5697                     Ops, NumOps);
5698   else
5699     N->InitOperands(N->LocalOperands, Ops, NumOps);
5700   N->OperandsNeedDelete = false;
5701
5702   if (DoCSE)
5703     CSEMap.InsertNode(N, IP);
5704
5705   AllNodes.push_back(N);
5706 #ifndef NDEBUG
5707   VerifyMachineNode(N);
5708 #endif
5709   return N;
5710 }
5711
5712 /// getTargetExtractSubreg - A convenience function for creating
5713 /// TargetOpcode::EXTRACT_SUBREG nodes.
5714 SDValue
5715 SelectionDAG::getTargetExtractSubreg(int SRIdx, SDLoc DL, EVT VT,
5716                                      SDValue Operand) {
5717   SDValue SRIdxVal = getTargetConstant(SRIdx, MVT::i32);
5718   SDNode *Subreg = getMachineNode(TargetOpcode::EXTRACT_SUBREG, DL,
5719                                   VT, Operand, SRIdxVal);
5720   return SDValue(Subreg, 0);
5721 }
5722
5723 /// getTargetInsertSubreg - A convenience function for creating
5724 /// TargetOpcode::INSERT_SUBREG nodes.
5725 SDValue
5726 SelectionDAG::getTargetInsertSubreg(int SRIdx, SDLoc DL, EVT VT,
5727                                     SDValue Operand, SDValue Subreg) {
5728   SDValue SRIdxVal = getTargetConstant(SRIdx, MVT::i32);
5729   SDNode *Result = getMachineNode(TargetOpcode::INSERT_SUBREG, DL,
5730                                   VT, Operand, Subreg, SRIdxVal);
5731   return SDValue(Result, 0);
5732 }
5733
5734 /// getNodeIfExists - Get the specified node if it's already available, or
5735 /// else return NULL.
5736 SDNode *SelectionDAG::getNodeIfExists(unsigned Opcode, SDVTList VTList,
5737                                       ArrayRef<SDValue> Ops, bool nuw, bool nsw,
5738                                       bool exact) {
5739   if (VTList.VTs[VTList.NumVTs - 1] != MVT::Glue) {
5740     FoldingSetNodeID ID;
5741     AddNodeIDNode(ID, Opcode, VTList, Ops);
5742     if (isBinOpWithFlags(Opcode))
5743       AddBinaryNodeIDCustom(ID, nuw, nsw, exact);
5744     void *IP = nullptr;
5745     if (SDNode *E = CSEMap.FindNodeOrInsertPos(ID, IP))
5746       return E;
5747   }
5748   return nullptr;
5749 }
5750
5751 /// getDbgValue - Creates a SDDbgValue node.
5752 ///
5753 /// SDNode
5754 SDDbgValue *
5755 SelectionDAG::getDbgValue(MDNode *MDPtr, SDNode *N, unsigned R,
5756                           bool IsIndirect, uint64_t Off,
5757                           DebugLoc DL, unsigned O) {
5758   return new (Allocator) SDDbgValue(MDPtr, N, R, IsIndirect, Off, DL, O);
5759 }
5760
5761 /// Constant
5762 SDDbgValue *
5763 SelectionDAG::getConstantDbgValue(MDNode *MDPtr, const Value *C,
5764                                   uint64_t Off,
5765                                   DebugLoc DL, unsigned O) {
5766   return new (Allocator) SDDbgValue(MDPtr, C, Off, DL, O);
5767 }
5768
5769 /// FrameIndex
5770 SDDbgValue *
5771 SelectionDAG::getFrameIndexDbgValue(MDNode *MDPtr, unsigned FI, uint64_t Off,
5772                                     DebugLoc DL, unsigned O) {
5773   return new (Allocator) SDDbgValue(MDPtr, FI, Off, DL, O);
5774 }
5775
5776 namespace {
5777
5778 /// RAUWUpdateListener - Helper for ReplaceAllUsesWith - When the node
5779 /// pointed to by a use iterator is deleted, increment the use iterator
5780 /// so that it doesn't dangle.
5781 ///
5782 class RAUWUpdateListener : public SelectionDAG::DAGUpdateListener {
5783   SDNode::use_iterator &UI;
5784   SDNode::use_iterator &UE;
5785
5786   void NodeDeleted(SDNode *N, SDNode *E) override {
5787     // Increment the iterator as needed.
5788     while (UI != UE && N == *UI)
5789       ++UI;
5790   }
5791
5792 public:
5793   RAUWUpdateListener(SelectionDAG &d,
5794                      SDNode::use_iterator &ui,
5795                      SDNode::use_iterator &ue)
5796     : SelectionDAG::DAGUpdateListener(d), UI(ui), UE(ue) {}
5797 };
5798
5799 }
5800
5801 /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
5802 /// This can cause recursive merging of nodes in the DAG.
5803 ///
5804 /// This version assumes From has a single result value.
5805 ///
5806 void SelectionDAG::ReplaceAllUsesWith(SDValue FromN, SDValue To) {
5807   SDNode *From = FromN.getNode();
5808   assert(From->getNumValues() == 1 && FromN.getResNo() == 0 &&
5809          "Cannot replace with this method!");
5810   assert(From != To.getNode() && "Cannot replace uses of with self");
5811
5812   // Iterate over all the existing uses of From. New uses will be added
5813   // to the beginning of the use list, which we avoid visiting.
5814   // This specifically avoids visiting uses of From that arise while the
5815   // replacement is happening, because any such uses would be the result
5816   // of CSE: If an existing node looks like From after one of its operands
5817   // is replaced by To, we don't want to replace of all its users with To
5818   // too. See PR3018 for more info.
5819   SDNode::use_iterator UI = From->use_begin(), UE = From->use_end();
5820   RAUWUpdateListener Listener(*this, UI, UE);
5821   while (UI != UE) {
5822     SDNode *User = *UI;
5823
5824     // This node is about to morph, remove its old self from the CSE maps.
5825     RemoveNodeFromCSEMaps(User);
5826
5827     // A user can appear in a use list multiple times, and when this
5828     // happens the uses are usually next to each other in the list.
5829     // To help reduce the number of CSE recomputations, process all
5830     // the uses of this user that we can find this way.
5831     do {
5832       SDUse &Use = UI.getUse();
5833       ++UI;
5834       Use.set(To);
5835     } while (UI != UE && *UI == User);
5836
5837     // Now that we have modified User, add it back to the CSE maps.  If it
5838     // already exists there, recursively merge the results together.
5839     AddModifiedNodeToCSEMaps(User);
5840   }
5841
5842   // If we just RAUW'd the root, take note.
5843   if (FromN == getRoot())
5844     setRoot(To);
5845 }
5846
5847 /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
5848 /// This can cause recursive merging of nodes in the DAG.
5849 ///
5850 /// This version assumes that for each value of From, there is a
5851 /// corresponding value in To in the same position with the same type.
5852 ///
5853 void SelectionDAG::ReplaceAllUsesWith(SDNode *From, SDNode *To) {
5854 #ifndef NDEBUG
5855   for (unsigned i = 0, e = From->getNumValues(); i != e; ++i)
5856     assert((!From->hasAnyUseOfValue(i) ||
5857             From->getValueType(i) == To->getValueType(i)) &&
5858            "Cannot use this version of ReplaceAllUsesWith!");
5859 #endif
5860
5861   // Handle the trivial case.
5862   if (From == To)
5863     return;
5864
5865   // Iterate over just the existing users of From. See the comments in
5866   // the ReplaceAllUsesWith above.
5867   SDNode::use_iterator UI = From->use_begin(), UE = From->use_end();
5868   RAUWUpdateListener Listener(*this, UI, UE);
5869   while (UI != UE) {
5870     SDNode *User = *UI;
5871
5872     // This node is about to morph, remove its old self from the CSE maps.
5873     RemoveNodeFromCSEMaps(User);
5874
5875     // A user can appear in a use list multiple times, and when this
5876     // happens the uses are usually next to each other in the list.
5877     // To help reduce the number of CSE recomputations, process all
5878     // the uses of this user that we can find this way.
5879     do {
5880       SDUse &Use = UI.getUse();
5881       ++UI;
5882       Use.setNode(To);
5883     } while (UI != UE && *UI == User);
5884
5885     // Now that we have modified User, add it back to the CSE maps.  If it
5886     // already exists there, recursively merge the results together.
5887     AddModifiedNodeToCSEMaps(User);
5888   }
5889
5890   // If we just RAUW'd the root, take note.
5891   if (From == getRoot().getNode())
5892     setRoot(SDValue(To, getRoot().getResNo()));
5893 }
5894
5895 /// ReplaceAllUsesWith - Modify anything using 'From' to use 'To' instead.
5896 /// This can cause recursive merging of nodes in the DAG.
5897 ///
5898 /// This version can replace From with any result values.  To must match the
5899 /// number and types of values returned by From.
5900 void SelectionDAG::ReplaceAllUsesWith(SDNode *From, const SDValue *To) {
5901   if (From->getNumValues() == 1)  // Handle the simple case efficiently.
5902     return ReplaceAllUsesWith(SDValue(From, 0), To[0]);
5903
5904   // Iterate over just the existing users of From. See the comments in
5905   // the ReplaceAllUsesWith above.
5906   SDNode::use_iterator UI = From->use_begin(), UE = From->use_end();
5907   RAUWUpdateListener Listener(*this, UI, UE);
5908   while (UI != UE) {
5909     SDNode *User = *UI;
5910
5911     // This node is about to morph, remove its old self from the CSE maps.
5912     RemoveNodeFromCSEMaps(User);
5913
5914     // A user can appear in a use list multiple times, and when this
5915     // happens the uses are usually next to each other in the list.
5916     // To help reduce the number of CSE recomputations, process all
5917     // the uses of this user that we can find this way.
5918     do {
5919       SDUse &Use = UI.getUse();
5920       const SDValue &ToOp = To[Use.getResNo()];
5921       ++UI;
5922       Use.set(ToOp);
5923     } while (UI != UE && *UI == User);
5924
5925     // Now that we have modified User, add it back to the CSE maps.  If it
5926     // already exists there, recursively merge the results together.
5927     AddModifiedNodeToCSEMaps(User);
5928   }
5929
5930   // If we just RAUW'd the root, take note.
5931   if (From == getRoot().getNode())
5932     setRoot(SDValue(To[getRoot().getResNo()]));
5933 }
5934
5935 /// ReplaceAllUsesOfValueWith - Replace any uses of From with To, leaving
5936 /// uses of other values produced by From.getNode() alone.  The Deleted
5937 /// vector is handled the same way as for ReplaceAllUsesWith.
5938 void SelectionDAG::ReplaceAllUsesOfValueWith(SDValue From, SDValue To){
5939   // Handle the really simple, really trivial case efficiently.
5940   if (From == To) return;
5941
5942   // Handle the simple, trivial, case efficiently.
5943   if (From.getNode()->getNumValues() == 1) {
5944     ReplaceAllUsesWith(From, To);
5945     return;
5946   }
5947
5948   // Iterate over just the existing users of From. See the comments in
5949   // the ReplaceAllUsesWith above.
5950   SDNode::use_iterator UI = From.getNode()->use_begin(),
5951                        UE = From.getNode()->use_end();
5952   RAUWUpdateListener Listener(*this, UI, UE);
5953   while (UI != UE) {
5954     SDNode *User = *UI;
5955     bool UserRemovedFromCSEMaps = false;
5956
5957     // A user can appear in a use list multiple times, and when this
5958     // happens the uses are usually next to each other in the list.
5959     // To help reduce the number of CSE recomputations, process all
5960     // the uses of this user that we can find this way.
5961     do {
5962       SDUse &Use = UI.getUse();
5963
5964       // Skip uses of different values from the same node.
5965       if (Use.getResNo() != From.getResNo()) {
5966         ++UI;
5967         continue;
5968       }
5969
5970       // If this node hasn't been modified yet, it's still in the CSE maps,
5971       // so remove its old self from the CSE maps.
5972       if (!UserRemovedFromCSEMaps) {
5973         RemoveNodeFromCSEMaps(User);
5974         UserRemovedFromCSEMaps = true;
5975       }
5976
5977       ++UI;
5978       Use.set(To);
5979     } while (UI != UE && *UI == User);
5980
5981     // We are iterating over all uses of the From node, so if a use
5982     // doesn't use the specific value, no changes are made.
5983     if (!UserRemovedFromCSEMaps)
5984       continue;
5985
5986     // Now that we have modified User, add it back to the CSE maps.  If it
5987     // already exists there, recursively merge the results together.
5988     AddModifiedNodeToCSEMaps(User);
5989   }
5990
5991   // If we just RAUW'd the root, take note.
5992   if (From == getRoot())
5993     setRoot(To);
5994 }
5995
5996 namespace {
5997   /// UseMemo - This class is used by SelectionDAG::ReplaceAllUsesOfValuesWith
5998   /// to record information about a use.
5999   struct UseMemo {
6000     SDNode *User;
6001     unsigned Index;
6002     SDUse *Use;
6003   };
6004
6005   /// operator< - Sort Memos by User.
6006   bool operator<(const UseMemo &L, const UseMemo &R) {
6007     return (intptr_t)L.User < (intptr_t)R.User;
6008   }
6009 }
6010
6011 /// ReplaceAllUsesOfValuesWith - Replace any uses of From with To, leaving
6012 /// uses of other values produced by From.getNode() alone.  The same value
6013 /// may appear in both the From and To list.  The Deleted vector is
6014 /// handled the same way as for ReplaceAllUsesWith.
6015 void SelectionDAG::ReplaceAllUsesOfValuesWith(const SDValue *From,
6016                                               const SDValue *To,
6017                                               unsigned Num){
6018   // Handle the simple, trivial case efficiently.
6019   if (Num == 1)
6020     return ReplaceAllUsesOfValueWith(*From, *To);
6021
6022   // Read up all the uses and make records of them. This helps
6023   // processing new uses that are introduced during the
6024   // replacement process.
6025   SmallVector<UseMemo, 4> Uses;
6026   for (unsigned i = 0; i != Num; ++i) {
6027     unsigned FromResNo = From[i].getResNo();
6028     SDNode *FromNode = From[i].getNode();
6029     for (SDNode::use_iterator UI = FromNode->use_begin(),
6030          E = FromNode->use_end(); UI != E; ++UI) {
6031       SDUse &Use = UI.getUse();
6032       if (Use.getResNo() == FromResNo) {
6033         UseMemo Memo = { *UI, i, &Use };
6034         Uses.push_back(Memo);
6035       }
6036     }
6037   }
6038
6039   // Sort the uses, so that all the uses from a given User are together.
6040   std::sort(Uses.begin(), Uses.end());
6041
6042   for (unsigned UseIndex = 0, UseIndexEnd = Uses.size();
6043        UseIndex != UseIndexEnd; ) {
6044     // We know that this user uses some value of From.  If it is the right
6045     // value, update it.
6046     SDNode *User = Uses[UseIndex].User;
6047
6048     // This node is about to morph, remove its old self from the CSE maps.
6049     RemoveNodeFromCSEMaps(User);
6050
6051     // The Uses array is sorted, so all the uses for a given User
6052     // are next to each other in the list.
6053     // To help reduce the number of CSE recomputations, process all
6054     // the uses of this user that we can find this way.
6055     do {
6056       unsigned i = Uses[UseIndex].Index;
6057       SDUse &Use = *Uses[UseIndex].Use;
6058       ++UseIndex;
6059
6060       Use.set(To[i]);
6061     } while (UseIndex != UseIndexEnd && Uses[UseIndex].User == User);
6062
6063     // Now that we have modified User, add it back to the CSE maps.  If it
6064     // already exists there, recursively merge the results together.
6065     AddModifiedNodeToCSEMaps(User);
6066   }
6067 }
6068
6069 /// AssignTopologicalOrder - Assign a unique node id for each node in the DAG
6070 /// based on their topological order. It returns the maximum id and a vector
6071 /// of the SDNodes* in assigned order by reference.
6072 unsigned SelectionDAG::AssignTopologicalOrder() {
6073
6074   unsigned DAGSize = 0;
6075
6076   // SortedPos tracks the progress of the algorithm. Nodes before it are
6077   // sorted, nodes after it are unsorted. When the algorithm completes
6078   // it is at the end of the list.
6079   allnodes_iterator SortedPos = allnodes_begin();
6080
6081   // Visit all the nodes. Move nodes with no operands to the front of
6082   // the list immediately. Annotate nodes that do have operands with their
6083   // operand count. Before we do this, the Node Id fields of the nodes
6084   // may contain arbitrary values. After, the Node Id fields for nodes
6085   // before SortedPos will contain the topological sort index, and the
6086   // Node Id fields for nodes At SortedPos and after will contain the
6087   // count of outstanding operands.
6088   for (allnodes_iterator I = allnodes_begin(),E = allnodes_end(); I != E; ) {
6089     SDNode *N = I++;
6090     checkForCycles(N, this);
6091     unsigned Degree = N->getNumOperands();
6092     if (Degree == 0) {
6093       // A node with no uses, add it to the result array immediately.
6094       N->setNodeId(DAGSize++);
6095       allnodes_iterator Q = N;
6096       if (Q != SortedPos)
6097         SortedPos = AllNodes.insert(SortedPos, AllNodes.remove(Q));
6098       assert(SortedPos != AllNodes.end() && "Overran node list");
6099       ++SortedPos;
6100     } else {
6101       // Temporarily use the Node Id as scratch space for the degree count.
6102       N->setNodeId(Degree);
6103     }
6104   }
6105
6106   // Visit all the nodes. As we iterate, move nodes into sorted order,
6107   // such that by the time the end is reached all nodes will be sorted.
6108   for (allnodes_iterator I = allnodes_begin(),E = allnodes_end(); I != E; ++I) {
6109     SDNode *N = I;
6110     checkForCycles(N, this);
6111     // N is in sorted position, so all its uses have one less operand
6112     // that needs to be sorted.
6113     for (SDNode::use_iterator UI = N->use_begin(), UE = N->use_end();
6114          UI != UE; ++UI) {
6115       SDNode *P = *UI;
6116       unsigned Degree = P->getNodeId();
6117       assert(Degree != 0 && "Invalid node degree");
6118       --Degree;
6119       if (Degree == 0) {
6120         // All of P's operands are sorted, so P may sorted now.
6121         P->setNodeId(DAGSize++);
6122         if (P != SortedPos)
6123           SortedPos = AllNodes.insert(SortedPos, AllNodes.remove(P));
6124         assert(SortedPos != AllNodes.end() && "Overran node list");
6125         ++SortedPos;
6126       } else {
6127         // Update P's outstanding operand count.
6128         P->setNodeId(Degree);
6129       }
6130     }
6131     if (I == SortedPos) {
6132 #ifndef NDEBUG
6133       SDNode *S = ++I;
6134       dbgs() << "Overran sorted position:\n";
6135       S->dumprFull(this); dbgs() << "\n";
6136       dbgs() << "Checking if this is due to cycles\n";
6137       checkForCycles(this, true);
6138 #endif
6139       llvm_unreachable(nullptr);
6140     }
6141   }
6142
6143   assert(SortedPos == AllNodes.end() &&
6144          "Topological sort incomplete!");
6145   assert(AllNodes.front().getOpcode() == ISD::EntryToken &&
6146          "First node in topological sort is not the entry token!");
6147   assert(AllNodes.front().getNodeId() == 0 &&
6148          "First node in topological sort has non-zero id!");
6149   assert(AllNodes.front().getNumOperands() == 0 &&
6150          "First node in topological sort has operands!");
6151   assert(AllNodes.back().getNodeId() == (int)DAGSize-1 &&
6152          "Last node in topologic sort has unexpected id!");
6153   assert(AllNodes.back().use_empty() &&
6154          "Last node in topologic sort has users!");
6155   assert(DAGSize == allnodes_size() && "Node count mismatch!");
6156   return DAGSize;
6157 }
6158
6159 /// AddDbgValue - Add a dbg_value SDNode. If SD is non-null that means the
6160 /// value is produced by SD.
6161 void SelectionDAG::AddDbgValue(SDDbgValue *DB, SDNode *SD, bool isParameter) {
6162   DbgInfo->add(DB, SD, isParameter);
6163   if (SD)
6164     SD->setHasDebugValue(true);
6165 }
6166
6167 /// TransferDbgValues - Transfer SDDbgValues.
6168 void SelectionDAG::TransferDbgValues(SDValue From, SDValue To) {
6169   if (From == To || !From.getNode()->getHasDebugValue())
6170     return;
6171   SDNode *FromNode = From.getNode();
6172   SDNode *ToNode = To.getNode();
6173   ArrayRef<SDDbgValue *> DVs = GetDbgValues(FromNode);
6174   SmallVector<SDDbgValue *, 2> ClonedDVs;
6175   for (ArrayRef<SDDbgValue *>::iterator I = DVs.begin(), E = DVs.end();
6176        I != E; ++I) {
6177     SDDbgValue *Dbg = *I;
6178     if (Dbg->getKind() == SDDbgValue::SDNODE) {
6179       SDDbgValue *Clone = getDbgValue(Dbg->getMDPtr(), ToNode, To.getResNo(),
6180                                       Dbg->isIndirect(),
6181                                       Dbg->getOffset(), Dbg->getDebugLoc(),
6182                                       Dbg->getOrder());
6183       ClonedDVs.push_back(Clone);
6184     }
6185   }
6186   for (SmallVectorImpl<SDDbgValue *>::iterator I = ClonedDVs.begin(),
6187          E = ClonedDVs.end(); I != E; ++I)
6188     AddDbgValue(*I, ToNode, false);
6189 }
6190
6191 //===----------------------------------------------------------------------===//
6192 //                              SDNode Class
6193 //===----------------------------------------------------------------------===//
6194
6195 HandleSDNode::~HandleSDNode() {
6196   DropOperands();
6197 }
6198
6199 GlobalAddressSDNode::GlobalAddressSDNode(unsigned Opc, unsigned Order,
6200                                          DebugLoc DL, const GlobalValue *GA,
6201                                          EVT VT, int64_t o, unsigned char TF)
6202   : SDNode(Opc, Order, DL, getSDVTList(VT)), Offset(o), TargetFlags(TF) {
6203   TheGlobal = GA;
6204 }
6205
6206 AddrSpaceCastSDNode::AddrSpaceCastSDNode(unsigned Order, DebugLoc dl, EVT VT,
6207                                          SDValue X, unsigned SrcAS,
6208                                          unsigned DestAS)
6209  : UnarySDNode(ISD::ADDRSPACECAST, Order, dl, getSDVTList(VT), X),
6210    SrcAddrSpace(SrcAS), DestAddrSpace(DestAS) {}
6211
6212 MemSDNode::MemSDNode(unsigned Opc, unsigned Order, DebugLoc dl, SDVTList VTs,
6213                      EVT memvt, MachineMemOperand *mmo)
6214  : SDNode(Opc, Order, dl, VTs), MemoryVT(memvt), MMO(mmo) {
6215   SubclassData = encodeMemSDNodeFlags(0, ISD::UNINDEXED, MMO->isVolatile(),
6216                                       MMO->isNonTemporal(), MMO->isInvariant());
6217   assert(isVolatile() == MMO->isVolatile() && "Volatile encoding error!");
6218   assert(isNonTemporal() == MMO->isNonTemporal() &&
6219          "Non-temporal encoding error!");
6220   assert(memvt.getStoreSize() == MMO->getSize() && "Size mismatch!");
6221 }
6222
6223 MemSDNode::MemSDNode(unsigned Opc, unsigned Order, DebugLoc dl, SDVTList VTs,
6224                      ArrayRef<SDValue> Ops, EVT memvt, MachineMemOperand *mmo)
6225    : SDNode(Opc, Order, dl, VTs, Ops),
6226      MemoryVT(memvt), MMO(mmo) {
6227   SubclassData = encodeMemSDNodeFlags(0, ISD::UNINDEXED, MMO->isVolatile(),
6228                                       MMO->isNonTemporal(), MMO->isInvariant());
6229   assert(isVolatile() == MMO->isVolatile() && "Volatile encoding error!");
6230   assert(memvt.getStoreSize() == MMO->getSize() && "Size mismatch!");
6231 }
6232
6233 /// Profile - Gather unique data for the node.
6234 ///
6235 void SDNode::Profile(FoldingSetNodeID &ID) const {
6236   AddNodeIDNode(ID, this);
6237 }
6238
6239 namespace {
6240   struct EVTArray {
6241     std::vector<EVT> VTs;
6242
6243     EVTArray() {
6244       VTs.reserve(MVT::LAST_VALUETYPE);
6245       for (unsigned i = 0; i < MVT::LAST_VALUETYPE; ++i)
6246         VTs.push_back(MVT((MVT::SimpleValueType)i));
6247     }
6248   };
6249 }
6250
6251 static ManagedStatic<std::set<EVT, EVT::compareRawBits> > EVTs;
6252 static ManagedStatic<EVTArray> SimpleVTArray;
6253 static ManagedStatic<sys::SmartMutex<true> > VTMutex;
6254
6255 /// getValueTypeList - Return a pointer to the specified value type.
6256 ///
6257 const EVT *SDNode::getValueTypeList(EVT VT) {
6258   if (VT.isExtended()) {
6259     sys::SmartScopedLock<true> Lock(*VTMutex);
6260     return &(*EVTs->insert(VT).first);
6261   } else {
6262     assert(VT.getSimpleVT() < MVT::LAST_VALUETYPE &&
6263            "Value type out of range!");
6264     return &SimpleVTArray->VTs[VT.getSimpleVT().SimpleTy];
6265   }
6266 }
6267
6268 /// hasNUsesOfValue - Return true if there are exactly NUSES uses of the
6269 /// indicated value.  This method ignores uses of other values defined by this
6270 /// operation.
6271 bool SDNode::hasNUsesOfValue(unsigned NUses, unsigned Value) const {
6272   assert(Value < getNumValues() && "Bad value!");
6273
6274   // TODO: Only iterate over uses of a given value of the node
6275   for (SDNode::use_iterator UI = use_begin(), E = use_end(); UI != E; ++UI) {
6276     if (UI.getUse().getResNo() == Value) {
6277       if (NUses == 0)
6278         return false;
6279       --NUses;
6280     }
6281   }
6282
6283   // Found exactly the right number of uses?
6284   return NUses == 0;
6285 }
6286
6287
6288 /// hasAnyUseOfValue - Return true if there are any use of the indicated
6289 /// value. This method ignores uses of other values defined by this operation.
6290 bool SDNode::hasAnyUseOfValue(unsigned Value) const {
6291   assert(Value < getNumValues() && "Bad value!");
6292
6293   for (SDNode::use_iterator UI = use_begin(), E = use_end(); UI != E; ++UI)
6294     if (UI.getUse().getResNo() == Value)
6295       return true;
6296
6297   return false;
6298 }
6299
6300
6301 /// isOnlyUserOf - Return true if this node is the only use of N.
6302 ///
6303 bool SDNode::isOnlyUserOf(SDNode *N) const {
6304   bool Seen = false;
6305   for (SDNode::use_iterator I = N->use_begin(), E = N->use_end(); I != E; ++I) {
6306     SDNode *User = *I;
6307     if (User == this)
6308       Seen = true;
6309     else
6310       return false;
6311   }
6312
6313   return Seen;
6314 }
6315
6316 /// isOperand - Return true if this node is an operand of N.
6317 ///
6318 bool SDValue::isOperandOf(SDNode *N) const {
6319   for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i)
6320     if (*this == N->getOperand(i))
6321       return true;
6322   return false;
6323 }
6324
6325 bool SDNode::isOperandOf(SDNode *N) const {
6326   for (unsigned i = 0, e = N->NumOperands; i != e; ++i)
6327     if (this == N->OperandList[i].getNode())
6328       return true;
6329   return false;
6330 }
6331
6332 /// reachesChainWithoutSideEffects - Return true if this operand (which must
6333 /// be a chain) reaches the specified operand without crossing any
6334 /// side-effecting instructions on any chain path.  In practice, this looks
6335 /// through token factors and non-volatile loads.  In order to remain efficient,
6336 /// this only looks a couple of nodes in, it does not do an exhaustive search.
6337 bool SDValue::reachesChainWithoutSideEffects(SDValue Dest,
6338                                                unsigned Depth) const {
6339   if (*this == Dest) return true;
6340
6341   // Don't search too deeply, we just want to be able to see through
6342   // TokenFactor's etc.
6343   if (Depth == 0) return false;
6344
6345   // If this is a token factor, all inputs to the TF happen in parallel.  If any
6346   // of the operands of the TF does not reach dest, then we cannot do the xform.
6347   if (getOpcode() == ISD::TokenFactor) {
6348     for (unsigned i = 0, e = getNumOperands(); i != e; ++i)
6349       if (!getOperand(i).reachesChainWithoutSideEffects(Dest, Depth-1))
6350         return false;
6351     return true;
6352   }
6353
6354   // Loads don't have side effects, look through them.
6355   if (LoadSDNode *Ld = dyn_cast<LoadSDNode>(*this)) {
6356     if (!Ld->isVolatile())
6357       return Ld->getChain().reachesChainWithoutSideEffects(Dest, Depth-1);
6358   }
6359   return false;
6360 }
6361
6362 /// hasPredecessor - Return true if N is a predecessor of this node.
6363 /// N is either an operand of this node, or can be reached by recursively
6364 /// traversing up the operands.
6365 /// NOTE: This is an expensive method. Use it carefully.
6366 bool SDNode::hasPredecessor(const SDNode *N) const {
6367   SmallPtrSet<const SDNode *, 32> Visited;
6368   SmallVector<const SDNode *, 16> Worklist;
6369   return hasPredecessorHelper(N, Visited, Worklist);
6370 }
6371
6372 bool
6373 SDNode::hasPredecessorHelper(const SDNode *N,
6374                              SmallPtrSet<const SDNode *, 32> &Visited,
6375                              SmallVectorImpl<const SDNode *> &Worklist) const {
6376   if (Visited.empty()) {
6377     Worklist.push_back(this);
6378   } else {
6379     // Take a look in the visited set. If we've already encountered this node
6380     // we needn't search further.
6381     if (Visited.count(N))
6382       return true;
6383   }
6384
6385   // Haven't visited N yet. Continue the search.
6386   while (!Worklist.empty()) {
6387     const SDNode *M = Worklist.pop_back_val();
6388     for (unsigned i = 0, e = M->getNumOperands(); i != e; ++i) {
6389       SDNode *Op = M->getOperand(i).getNode();
6390       if (Visited.insert(Op))
6391         Worklist.push_back(Op);
6392       if (Op == N)
6393         return true;
6394     }
6395   }
6396
6397   return false;
6398 }
6399
6400 uint64_t SDNode::getConstantOperandVal(unsigned Num) const {
6401   assert(Num < NumOperands && "Invalid child # of SDNode!");
6402   return cast<ConstantSDNode>(OperandList[Num])->getZExtValue();
6403 }
6404
6405 SDValue SelectionDAG::UnrollVectorOp(SDNode *N, unsigned ResNE) {
6406   assert(N->getNumValues() == 1 &&
6407          "Can't unroll a vector with multiple results!");
6408
6409   EVT VT = N->getValueType(0);
6410   unsigned NE = VT.getVectorNumElements();
6411   EVT EltVT = VT.getVectorElementType();
6412   SDLoc dl(N);
6413
6414   SmallVector<SDValue, 8> Scalars;
6415   SmallVector<SDValue, 4> Operands(N->getNumOperands());
6416
6417   // If ResNE is 0, fully unroll the vector op.
6418   if (ResNE == 0)
6419     ResNE = NE;
6420   else if (NE > ResNE)
6421     NE = ResNE;
6422
6423   unsigned i;
6424   for (i= 0; i != NE; ++i) {
6425     for (unsigned j = 0, e = N->getNumOperands(); j != e; ++j) {
6426       SDValue Operand = N->getOperand(j);
6427       EVT OperandVT = Operand.getValueType();
6428       if (OperandVT.isVector()) {
6429         // A vector operand; extract a single element.
6430         const TargetLowering *TLI = TM.getTargetLowering();
6431         EVT OperandEltVT = OperandVT.getVectorElementType();
6432         Operands[j] = getNode(ISD::EXTRACT_VECTOR_ELT, dl,
6433                               OperandEltVT,
6434                               Operand,
6435                               getConstant(i, TLI->getVectorIdxTy()));
6436       } else {
6437         // A scalar operand; just use it as is.
6438         Operands[j] = Operand;
6439       }
6440     }
6441
6442     switch (N->getOpcode()) {
6443     default:
6444       Scalars.push_back(getNode(N->getOpcode(), dl, EltVT, Operands));
6445       break;
6446     case ISD::VSELECT:
6447       Scalars.push_back(getNode(ISD::SELECT, dl, EltVT, Operands));
6448       break;
6449     case ISD::SHL:
6450     case ISD::SRA:
6451     case ISD::SRL:
6452     case ISD::ROTL:
6453     case ISD::ROTR:
6454       Scalars.push_back(getNode(N->getOpcode(), dl, EltVT, Operands[0],
6455                                getShiftAmountOperand(Operands[0].getValueType(),
6456                                                      Operands[1])));
6457       break;
6458     case ISD::SIGN_EXTEND_INREG:
6459     case ISD::FP_ROUND_INREG: {
6460       EVT ExtVT = cast<VTSDNode>(Operands[1])->getVT().getVectorElementType();
6461       Scalars.push_back(getNode(N->getOpcode(), dl, EltVT,
6462                                 Operands[0],
6463                                 getValueType(ExtVT)));
6464     }
6465     }
6466   }
6467
6468   for (; i < ResNE; ++i)
6469     Scalars.push_back(getUNDEF(EltVT));
6470
6471   return getNode(ISD::BUILD_VECTOR, dl,
6472                  EVT::getVectorVT(*getContext(), EltVT, ResNE), Scalars);
6473 }
6474
6475
6476 /// isConsecutiveLoad - Return true if LD is loading 'Bytes' bytes from a
6477 /// location that is 'Dist' units away from the location that the 'Base' load
6478 /// is loading from.
6479 bool SelectionDAG::isConsecutiveLoad(LoadSDNode *LD, LoadSDNode *Base,
6480                                      unsigned Bytes, int Dist) const {
6481   if (LD->getChain() != Base->getChain())
6482     return false;
6483   EVT VT = LD->getValueType(0);
6484   if (VT.getSizeInBits() / 8 != Bytes)
6485     return false;
6486
6487   SDValue Loc = LD->getOperand(1);
6488   SDValue BaseLoc = Base->getOperand(1);
6489   if (Loc.getOpcode() == ISD::FrameIndex) {
6490     if (BaseLoc.getOpcode() != ISD::FrameIndex)
6491       return false;
6492     const MachineFrameInfo *MFI = getMachineFunction().getFrameInfo();
6493     int FI  = cast<FrameIndexSDNode>(Loc)->getIndex();
6494     int BFI = cast<FrameIndexSDNode>(BaseLoc)->getIndex();
6495     int FS  = MFI->getObjectSize(FI);
6496     int BFS = MFI->getObjectSize(BFI);
6497     if (FS != BFS || FS != (int)Bytes) return false;
6498     return MFI->getObjectOffset(FI) == (MFI->getObjectOffset(BFI) + Dist*Bytes);
6499   }
6500
6501   // Handle X+C
6502   if (isBaseWithConstantOffset(Loc) && Loc.getOperand(0) == BaseLoc &&
6503       cast<ConstantSDNode>(Loc.getOperand(1))->getSExtValue() == Dist*Bytes)
6504     return true;
6505
6506   const GlobalValue *GV1 = nullptr;
6507   const GlobalValue *GV2 = nullptr;
6508   int64_t Offset1 = 0;
6509   int64_t Offset2 = 0;
6510   const TargetLowering *TLI = TM.getTargetLowering();
6511   bool isGA1 = TLI->isGAPlusOffset(Loc.getNode(), GV1, Offset1);
6512   bool isGA2 = TLI->isGAPlusOffset(BaseLoc.getNode(), GV2, Offset2);
6513   if (isGA1 && isGA2 && GV1 == GV2)
6514     return Offset1 == (Offset2 + Dist*Bytes);
6515   return false;
6516 }
6517
6518
6519 /// InferPtrAlignment - Infer alignment of a load / store address. Return 0 if
6520 /// it cannot be inferred.
6521 unsigned SelectionDAG::InferPtrAlignment(SDValue Ptr) const {
6522   // If this is a GlobalAddress + cst, return the alignment.
6523   const GlobalValue *GV;
6524   int64_t GVOffset = 0;
6525   const TargetLowering *TLI = TM.getTargetLowering();
6526   if (TLI->isGAPlusOffset(Ptr.getNode(), GV, GVOffset)) {
6527     unsigned PtrWidth = TLI->getPointerTypeSizeInBits(GV->getType());
6528     APInt KnownZero(PtrWidth, 0), KnownOne(PtrWidth, 0);
6529     llvm::computeKnownBits(const_cast<GlobalValue*>(GV), KnownZero, KnownOne,
6530                            TLI->getDataLayout());
6531     unsigned AlignBits = KnownZero.countTrailingOnes();
6532     unsigned Align = AlignBits ? 1 << std::min(31U, AlignBits) : 0;
6533     if (Align)
6534       return MinAlign(Align, GVOffset);
6535   }
6536
6537   // If this is a direct reference to a stack slot, use information about the
6538   // stack slot's alignment.
6539   int FrameIdx = 1 << 31;
6540   int64_t FrameOffset = 0;
6541   if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(Ptr)) {
6542     FrameIdx = FI->getIndex();
6543   } else if (isBaseWithConstantOffset(Ptr) &&
6544              isa<FrameIndexSDNode>(Ptr.getOperand(0))) {
6545     // Handle FI+Cst
6546     FrameIdx = cast<FrameIndexSDNode>(Ptr.getOperand(0))->getIndex();
6547     FrameOffset = Ptr.getConstantOperandVal(1);
6548   }
6549
6550   if (FrameIdx != (1 << 31)) {
6551     const MachineFrameInfo &MFI = *getMachineFunction().getFrameInfo();
6552     unsigned FIInfoAlign = MinAlign(MFI.getObjectAlignment(FrameIdx),
6553                                     FrameOffset);
6554     return FIInfoAlign;
6555   }
6556
6557   return 0;
6558 }
6559
6560 /// GetSplitDestVTs - Compute the VTs needed for the low/hi parts of a type
6561 /// which is split (or expanded) into two not necessarily identical pieces.
6562 std::pair<EVT, EVT> SelectionDAG::GetSplitDestVTs(const EVT &VT) const {
6563   // Currently all types are split in half.
6564   EVT LoVT, HiVT;
6565   if (!VT.isVector()) {
6566     LoVT = HiVT = TLI->getTypeToTransformTo(*getContext(), VT);
6567   } else {
6568     unsigned NumElements = VT.getVectorNumElements();
6569     assert(!(NumElements & 1) && "Splitting vector, but not in half!");
6570     LoVT = HiVT = EVT::getVectorVT(*getContext(), VT.getVectorElementType(),
6571                                    NumElements/2);
6572   }
6573   return std::make_pair(LoVT, HiVT);
6574 }
6575
6576 /// SplitVector - Split the vector with EXTRACT_SUBVECTOR and return the
6577 /// low/high part.
6578 std::pair<SDValue, SDValue>
6579 SelectionDAG::SplitVector(const SDValue &N, const SDLoc &DL, const EVT &LoVT,
6580                           const EVT &HiVT) {
6581   assert(LoVT.getVectorNumElements() + HiVT.getVectorNumElements() <=
6582          N.getValueType().getVectorNumElements() &&
6583          "More vector elements requested than available!");
6584   SDValue Lo, Hi;
6585   Lo = getNode(ISD::EXTRACT_SUBVECTOR, DL, LoVT, N,
6586                getConstant(0, TLI->getVectorIdxTy()));
6587   Hi = getNode(ISD::EXTRACT_SUBVECTOR, DL, HiVT, N,
6588                getConstant(LoVT.getVectorNumElements(), TLI->getVectorIdxTy()));
6589   return std::make_pair(Lo, Hi);
6590 }
6591
6592 void SelectionDAG::ExtractVectorElements(SDValue Op,
6593                                          SmallVectorImpl<SDValue> &Args,
6594                                          unsigned Start, unsigned Count) {
6595   EVT VT = Op.getValueType();
6596   if (Count == 0)
6597     Count = VT.getVectorNumElements();
6598
6599   EVT EltVT = VT.getVectorElementType();
6600   EVT IdxTy = TLI->getVectorIdxTy();
6601   SDLoc SL(Op);
6602   for (unsigned i = Start, e = Start + Count; i != e; ++i) {
6603     Args.push_back(getNode(ISD::EXTRACT_VECTOR_ELT, SL, EltVT,
6604                            Op, getConstant(i, IdxTy)));
6605   }
6606 }
6607
6608 // getAddressSpace - Return the address space this GlobalAddress belongs to.
6609 unsigned GlobalAddressSDNode::getAddressSpace() const {
6610   return getGlobal()->getType()->getAddressSpace();
6611 }
6612
6613
6614 Type *ConstantPoolSDNode::getType() const {
6615   if (isMachineConstantPoolEntry())
6616     return Val.MachineCPVal->getType();
6617   return Val.ConstVal->getType();
6618 }
6619
6620 bool BuildVectorSDNode::isConstantSplat(APInt &SplatValue,
6621                                         APInt &SplatUndef,
6622                                         unsigned &SplatBitSize,
6623                                         bool &HasAnyUndefs,
6624                                         unsigned MinSplatBits,
6625                                         bool isBigEndian) const {
6626   EVT VT = getValueType(0);
6627   assert(VT.isVector() && "Expected a vector type");
6628   unsigned sz = VT.getSizeInBits();
6629   if (MinSplatBits > sz)
6630     return false;
6631
6632   SplatValue = APInt(sz, 0);
6633   SplatUndef = APInt(sz, 0);
6634
6635   // Get the bits.  Bits with undefined values (when the corresponding element
6636   // of the vector is an ISD::UNDEF value) are set in SplatUndef and cleared
6637   // in SplatValue.  If any of the values are not constant, give up and return
6638   // false.
6639   unsigned int nOps = getNumOperands();
6640   assert(nOps > 0 && "isConstantSplat has 0-size build vector");
6641   unsigned EltBitSize = VT.getVectorElementType().getSizeInBits();
6642
6643   for (unsigned j = 0; j < nOps; ++j) {
6644     unsigned i = isBigEndian ? nOps-1-j : j;
6645     SDValue OpVal = getOperand(i);
6646     unsigned BitPos = j * EltBitSize;
6647
6648     if (OpVal.getOpcode() == ISD::UNDEF)
6649       SplatUndef |= APInt::getBitsSet(sz, BitPos, BitPos + EltBitSize);
6650     else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal))
6651       SplatValue |= CN->getAPIntValue().zextOrTrunc(EltBitSize).
6652                     zextOrTrunc(sz) << BitPos;
6653     else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal))
6654       SplatValue |= CN->getValueAPF().bitcastToAPInt().zextOrTrunc(sz) <<BitPos;
6655      else
6656       return false;
6657   }
6658
6659   // The build_vector is all constants or undefs.  Find the smallest element
6660   // size that splats the vector.
6661
6662   HasAnyUndefs = (SplatUndef != 0);
6663   while (sz > 8) {
6664
6665     unsigned HalfSize = sz / 2;
6666     APInt HighValue = SplatValue.lshr(HalfSize).trunc(HalfSize);
6667     APInt LowValue = SplatValue.trunc(HalfSize);
6668     APInt HighUndef = SplatUndef.lshr(HalfSize).trunc(HalfSize);
6669     APInt LowUndef = SplatUndef.trunc(HalfSize);
6670
6671     // If the two halves do not match (ignoring undef bits), stop here.
6672     if ((HighValue & ~LowUndef) != (LowValue & ~HighUndef) ||
6673         MinSplatBits > HalfSize)
6674       break;
6675
6676     SplatValue = HighValue | LowValue;
6677     SplatUndef = HighUndef & LowUndef;
6678
6679     sz = HalfSize;
6680   }
6681
6682   SplatBitSize = sz;
6683   return true;
6684 }
6685
6686 SDValue BuildVectorSDNode::getSplatValue(BitVector *UndefElements) const {
6687   if (UndefElements) {
6688     UndefElements->clear();
6689     UndefElements->resize(getNumOperands());
6690   }
6691   SDValue Splatted;
6692   for (unsigned i = 0, e = getNumOperands(); i != e; ++i) {
6693     SDValue Op = getOperand(i);
6694     if (Op.getOpcode() == ISD::UNDEF) {
6695       if (UndefElements)
6696         (*UndefElements)[i] = true;
6697     } else if (!Splatted) {
6698       Splatted = Op;
6699     } else if (Splatted != Op) {
6700       return SDValue();
6701     }
6702   }
6703
6704   if (!Splatted) {
6705     assert(getOperand(0).getOpcode() == ISD::UNDEF &&
6706            "Can only have a splat without a constant for all undefs.");
6707     return getOperand(0);
6708   }
6709
6710   return Splatted;
6711 }
6712
6713 ConstantSDNode *
6714 BuildVectorSDNode::getConstantSplatNode(BitVector *UndefElements) const {
6715   return dyn_cast_or_null<ConstantSDNode>(
6716       getSplatValue(UndefElements).getNode());
6717 }
6718
6719 ConstantFPSDNode *
6720 BuildVectorSDNode::getConstantFPSplatNode(BitVector *UndefElements) const {
6721   return dyn_cast_or_null<ConstantFPSDNode>(
6722       getSplatValue(UndefElements).getNode());
6723 }
6724
6725 bool BuildVectorSDNode::isConstant() const {
6726   for (unsigned i = 0, e = getNumOperands(); i != e; ++i) {
6727     unsigned Opc = getOperand(i).getOpcode();
6728     if (Opc != ISD::UNDEF && Opc != ISD::Constant && Opc != ISD::ConstantFP)
6729       return false;
6730   }
6731   return true;
6732 }
6733
6734 bool ShuffleVectorSDNode::isSplatMask(const int *Mask, EVT VT) {
6735   // Find the first non-undef value in the shuffle mask.
6736   unsigned i, e;
6737   for (i = 0, e = VT.getVectorNumElements(); i != e && Mask[i] < 0; ++i)
6738     /* search */;
6739
6740   assert(i != e && "VECTOR_SHUFFLE node with all undef indices!");
6741
6742   // Make sure all remaining elements are either undef or the same as the first
6743   // non-undef value.
6744   for (int Idx = Mask[i]; i != e; ++i)
6745     if (Mask[i] >= 0 && Mask[i] != Idx)
6746       return false;
6747   return true;
6748 }
6749
6750 #ifndef NDEBUG
6751 static void checkForCyclesHelper(const SDNode *N,
6752                                  SmallPtrSet<const SDNode*, 32> &Visited,
6753                                  SmallPtrSet<const SDNode*, 32> &Checked,
6754                                  const llvm::SelectionDAG *DAG) {
6755   // If this node has already been checked, don't check it again.
6756   if (Checked.count(N))
6757     return;
6758
6759   // If a node has already been visited on this depth-first walk, reject it as
6760   // a cycle.
6761   if (!Visited.insert(N)) {
6762     errs() << "Detected cycle in SelectionDAG\n";
6763     dbgs() << "Offending node:\n";
6764     N->dumprFull(DAG); dbgs() << "\n";
6765     abort();
6766   }
6767
6768   for(unsigned i = 0, e = N->getNumOperands(); i != e; ++i)
6769     checkForCyclesHelper(N->getOperand(i).getNode(), Visited, Checked, DAG);
6770
6771   Checked.insert(N);
6772   Visited.erase(N);
6773 }
6774 #endif
6775
6776 void llvm::checkForCycles(const llvm::SDNode *N,
6777                           const llvm::SelectionDAG *DAG,
6778                           bool force) {
6779 #ifndef NDEBUG
6780   bool check = force;
6781 #ifdef XDEBUG
6782   check = true;
6783 #endif  // XDEBUG
6784   if (check) {
6785     assert(N && "Checking nonexistent SDNode");
6786     SmallPtrSet<const SDNode*, 32> visited;
6787     SmallPtrSet<const SDNode*, 32> checked;
6788     checkForCyclesHelper(N, visited, checked, DAG);
6789   }
6790 #endif  // !NDEBUG
6791 }
6792
6793 void llvm::checkForCycles(const llvm::SelectionDAG *DAG, bool force) {
6794   checkForCycles(DAG->getRoot().getNode(), DAG, force);
6795 }