Add in support for expansion of all of the comparison operations to the absolute...

[oota-llvm.git] / lib / CodeGen / SelectionDAG / LegalizeIntegerTypes.cpp
diff --git a/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp b/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp

index 1c02c4f21c856886a0231970cfdbe145a27e5113..a370faeb2399f83f44539a9eb591cb251a3b7185 100644 (file)
--- a/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp
+++ b/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp
@@ -212,9 +212,6 @@ SDValue DAGTypeLegalizer::PromoteIntRes_BITCAST(SDNode *N) {
    DebugLoc dl = N->getDebugLoc();
  
    switch (getTypeAction(InVT)) {
-  default:
-    assert(false && "Unknown type action!");
-    break;
    case TargetLowering::TypeLegal:
      break;
    case TargetLowering::TypePromoteInteger:
@@ -252,9 +249,11 @@ SDValue DAGTypeLegalizer::PromoteIntRes_BITCAST(SDNode *N) {
      return DAG.getNode(ISD::BITCAST, dl, NOutVT, InOp);
    }
    case TargetLowering::TypeWidenVector:
-    if (OutVT.bitsEq(NInVT))
-      // The input is widened to the same size.  Convert to the widened value.
-      return DAG.getNode(ISD::BITCAST, dl, OutVT, GetWidenedVector(InOp));
+    // The input is widened to the same size. Convert to the widened value.
+    // Make sure that the outgoing value is not a vector, because this would
+    // make us bitcast between two vectors which are legalized in different ways.
+    if (NOutVT.bitsEq(NInVT) && !NOutVT.isVector())
+      return DAG.getNode(ISD::BITCAST, dl, NOutVT, GetWidenedVector(InOp));
    }
  
    return DAG.getNode(ISD::ANY_EXTEND, dl, NOutVT,
@@ -489,7 +488,11 @@ SDValue DAGTypeLegalizer::PromoteIntRes_SELECT(SDNode *N) {
  }
  
  SDValue DAGTypeLegalizer::PromoteIntRes_VSELECT(SDNode *N) {
-  SDValue Mask = GetPromotedInteger(N->getOperand(0));
+  SDValue Mask = N->getOperand(0);
+  EVT OpTy = N->getOperand(1).getValueType();
+
+  // Promote all the way up to the canonical SetCC type.
+  Mask = PromoteTargetBoolean(Mask, TLI.getSetCCResultType(OpTy));
    SDValue LHS = GetPromotedInteger(N->getOperand(1));
    SDValue RHS = GetPromotedInteger(N->getOperand(2));
    return DAG.getNode(ISD::VSELECT, N->getDebugLoc(),
@@ -585,18 +588,14 @@ SDValue DAGTypeLegalizer::PromoteIntRes_TRUNCATE(SDNode *N) {
      unsigned NumElts = InVT.getVectorNumElements();
      assert(NumElts == NVT.getVectorNumElements() &&
             "Dst and Src must have the same number of elements");
-    EVT EltVT = InVT.getScalarType();
      assert(isPowerOf2_32(NumElts) &&
             "Promoted vector type must be a power of two");
  
-    EVT HalfVT = EVT::getVectorVT(*DAG.getContext(), EltVT, NumElts/2);
+    SDValue EOp1, EOp2;
+    GetSplitVector(InOp, EOp1, EOp2);
+
      EVT HalfNVT = EVT::getVectorVT(*DAG.getContext(), NVT.getScalarType(),
                                     NumElts/2);
-
-    SDValue EOp1 = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, HalfVT, InOp,
-                               DAG.getIntPtrConstant(0));
-    SDValue EOp2 = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, HalfVT, InOp,
-                               DAG.getIntPtrConstant(NumElts/2));
      EOp1 = DAG.getNode(ISD::TRUNCATE, dl, HalfNVT, EOp1);
      EOp2 = DAG.getNode(ISD::TRUNCATE, dl, HalfNVT, EOp2);
  
@@ -645,8 +644,9 @@ SDValue DAGTypeLegalizer::PromoteIntRes_XMULO(SDNode *N, unsigned ResNo) {
    EVT SmallVT = LHS.getValueType();
  
    // To determine if the result overflowed in a larger type, we extend the
-  // input to the larger type, do the multiply, then check the high bits of
-  // the result to see if the overflow happened.
+  // input to the larger type, do the multiply (checking if it overflows),
+  // then also check the high bits of the result to see if overflow happened
+  // there.
    if (N->getOpcode() == ISD::SMULO) {
      LHS = SExtPromotedInteger(LHS);
      RHS = SExtPromotedInteger(RHS);
@@ -654,24 +654,31 @@ SDValue DAGTypeLegalizer::PromoteIntRes_XMULO(SDNode *N, unsigned ResNo) {
      LHS = ZExtPromotedInteger(LHS);
      RHS = ZExtPromotedInteger(RHS);
    }
-  SDValue Mul = DAG.getNode(ISD::MUL, DL, LHS.getValueType(), LHS, RHS);
+  SDVTList VTs = DAG.getVTList(LHS.getValueType(), N->getValueType(1));
+  SDValue Mul = DAG.getNode(N->getOpcode(), DL, VTs, LHS, RHS);
  
-  // Overflow occurred iff the high part of the result does not
-  // zero/sign-extend the low part.
+  // Overflow occurred if it occurred in the larger type, or if the high part
+  // of the result does not zero/sign-extend the low part.  Check this second
+  // possibility first.
    SDValue Overflow;
    if (N->getOpcode() == ISD::UMULO) {
-    // Unsigned overflow occurred iff the high part is non-zero.
+    // Unsigned overflow occurred if the high part is non-zero.
      SDValue Hi = DAG.getNode(ISD::SRL, DL, Mul.getValueType(), Mul,
                               DAG.getIntPtrConstant(SmallVT.getSizeInBits()));
      Overflow = DAG.getSetCC(DL, N->getValueType(1), Hi,
                              DAG.getConstant(0, Hi.getValueType()), ISD::SETNE);
    } else {
-    // Signed overflow occurred iff the high part does not sign extend the low.
+    // Signed overflow occurred if the high part does not sign extend the low.
      SDValue SExt = DAG.getNode(ISD::SIGN_EXTEND_INREG, DL, Mul.getValueType(),
                                 Mul, DAG.getValueType(SmallVT));
      Overflow = DAG.getSetCC(DL, N->getValueType(1), SExt, Mul, ISD::SETNE);
    }
  
+  // The only other way for overflow to occur is if the multiplication in the
+  // larger type itself overflowed.
+  Overflow = DAG.getNode(ISD::OR, DL, N->getValueType(1), Overflow,
+                         SDValue(Mul.getNode(), 1));
+
    // Use the calculated overflow everywhere.
    ReplaceValueWith(SDValue(N, 1), Overflow);
    return Mul;
@@ -1176,7 +1183,6 @@ std::pair <SDValue, SDValue> DAGTypeLegalizer::ExpandAtomic(SDNode *Node) {
    switch (Opc) {
    default:
      llvm_unreachable("Unhandled atomic intrinsic Expand!");
-    break;
    case ISD::ATOMIC_SWAP:
      switch (VT.SimpleTy) {
      default: llvm_unreachable("Unexpected value type for atomic!");
@@ -1360,7 +1366,7 @@ ExpandShiftWithKnownAmountBit(SDNode *N, SDValue &Lo, SDValue &Hi) {
  
    APInt HighBitMask = APInt::getHighBitsSet(ShBits, ShBits - Log2_32(NVTBits));
    APInt KnownZero, KnownOne;
-  DAG.ComputeMaskedBits(N->getOperand(1), HighBitMask, KnownZero, KnownOne);
+  DAG.ComputeMaskedBits(N->getOperand(1), KnownZero, KnownOne);
  
    // If we don't know anything about the high bits, exit.
    if (((KnownZero|KnownOne) & HighBitMask) == 0)
@@ -1395,15 +1401,15 @@ ExpandShiftWithKnownAmountBit(SDNode *N, SDValue &Lo, SDValue &Hi) {
      }
    }
  
-#if 0
-  // FIXME: This code is broken for shifts with a zero amount!
    // If we know that all of the high bits of the shift amount are zero, then we
    // can do this as a couple of simple shifts.
    if ((KnownZero & HighBitMask) == HighBitMask) {
-    // Compute 32-amt.
-    SDValue Amt2 = DAG.getNode(ISD::SUB, ShTy,
-                                 DAG.getConstant(NVTBits, ShTy),
-                                 Amt);
+    // Calculate 31-x. 31 is used instead of 32 to avoid creating an undefined
+    // shift if x is zero.  We can use XOR here because x is known to be smaller
+    // than 32.
+    SDValue Amt2 = DAG.getNode(ISD::XOR, dl, ShTy, Amt,
+                               DAG.getConstant(NVTBits-1, ShTy));
+
      unsigned Op1, Op2;
      switch (N->getOpcode()) {
      default: llvm_unreachable("Unknown shift");
@@ -1412,13 +1418,23 @@ ExpandShiftWithKnownAmountBit(SDNode *N, SDValue &Lo, SDValue &Hi) {
      case ISD::SRA:  Op1 = ISD::SRL; Op2 = ISD::SHL; break;
      }
  
-    Lo = DAG.getNode(N->getOpcode(), NVT, InL, Amt);
-    Hi = DAG.getNode(ISD::OR, NVT,
-                     DAG.getNode(Op1, NVT, InH, Amt),
-                     DAG.getNode(Op2, NVT, InL, Amt2));
+    // When shifting right the arithmetic for Lo and Hi is swapped.
+    if (N->getOpcode() != ISD::SHL)
+      std::swap(InL, InH);
+
+    // Use a little trick to get the bits that move from Lo to Hi. First
+    // shift by one bit.
+    SDValue Sh1 = DAG.getNode(Op2, dl, NVT, InL, DAG.getConstant(1, ShTy));
+    // Then compute the remaining shift with amount-1.
+    SDValue Sh2 = DAG.getNode(Op2, dl, NVT, Sh1, Amt2);
+
+    Lo = DAG.getNode(N->getOpcode(), dl, NVT, InL, Amt);
+    Hi = DAG.getNode(ISD::OR, dl, NVT, DAG.getNode(Op1, dl, NVT, InH, Amt),Sh2);
+
+    if (N->getOpcode() != ISD::SHL)
+      std::swap(Hi, Lo);
      return true;
    }
-#endif
  
    return false;
  }
@@ -1498,8 +1514,6 @@ ExpandShiftWithUnknownAmountBit(SDNode *N, SDValue &Lo, SDValue &Hi) {
      Hi = DAG.getNode(ISD::SELECT, dl, NVT, isShort, HiS, HiL);
      return true;
    }
-
-  return false;
  }
  
  void DAGTypeLegalizer::ExpandIntRes_ADDSUB(SDNode *N,
@@ -2247,32 +2261,35 @@ void DAGTypeLegalizer::ExpandIntRes_UADDSUBO(SDNode *N,
  void DAGTypeLegalizer::ExpandIntRes_XMULO(SDNode *N,
                                            SDValue &Lo, SDValue &Hi) {
    EVT VT = N->getValueType(0);
-  Type *RetTy = VT.getTypeForEVT(*DAG.getContext());
-  EVT PtrVT = TLI.getPointerTy();
-  Type *PtrTy = PtrVT.getTypeForEVT(*DAG.getContext());
    DebugLoc dl = N->getDebugLoc();
  
    // A divide for UMULO should be faster than a function call.
    if (N->getOpcode() == ISD::UMULO) {
      SDValue LHS = N->getOperand(0), RHS = N->getOperand(1);
-    DebugLoc DL = N->getDebugLoc();
  
-    SDValue MUL = DAG.getNode(ISD::MUL, DL, LHS.getValueType(), LHS, RHS);
+    SDValue MUL = DAG.getNode(ISD::MUL, dl, LHS.getValueType(), LHS, RHS);
      SplitInteger(MUL, Lo, Hi);
  
      // A divide for UMULO will be faster than a function call. Select to
      // make sure we aren't using 0.
      SDValue isZero = DAG.getSetCC(dl, TLI.getSetCCResultType(VT),
-                                 RHS, DAG.getConstant(0, VT), ISD::SETNE);
+                                  RHS, DAG.getConstant(0, VT), ISD::SETEQ);
      SDValue NotZero = DAG.getNode(ISD::SELECT, dl, VT, isZero,
-                                 DAG.getConstant(1, VT), RHS);
-    SDValue DIV = DAG.getNode(ISD::UDIV, DL, LHS.getValueType(), MUL, NotZero);
-    SDValue Overflow;
-    Overflow = DAG.getSetCC(DL, N->getValueType(1), DIV, LHS, ISD::SETNE);
+                                  DAG.getConstant(1, VT), RHS);
+    SDValue DIV = DAG.getNode(ISD::UDIV, dl, VT, MUL, NotZero);
+    SDValue Overflow = DAG.getSetCC(dl, N->getValueType(1), DIV, LHS,
+                                    ISD::SETNE);
+    Overflow = DAG.getNode(ISD::SELECT, dl, N->getValueType(1), isZero,
+                           DAG.getConstant(0, N->getValueType(1)),
+                           Overflow);
      ReplaceValueWith(SDValue(N, 1), Overflow);
      return;
    }
  
+  Type *RetTy = VT.getTypeForEVT(*DAG.getContext());
+  EVT PtrVT = TLI.getPointerTy();
+  Type *PtrTy = PtrVT.getTypeForEVT(*DAG.getContext());
+  
    // Replace this with a libcall that will check overflow.
    RTLIB::Libcall LC = RTLIB::UNKNOWN_LIBCALL;
    if (VT == MVT::i32)
@@ -2286,8 +2303,8 @@ void DAGTypeLegalizer::ExpandIntRes_XMULO(SDNode *N,
    SDValue Temp = DAG.CreateStackTemporary(PtrVT);
    // Temporary for the overflow value, default it to zero.
    SDValue Chain = DAG.getStore(DAG.getEntryNode(), dl,
-                              DAG.getConstant(0, PtrVT), Temp,
-                              MachinePointerInfo(), false, false, 0);
+                               DAG.getConstant(0, PtrVT), Temp,
+                               MachinePointerInfo(), false, false, 0);
  
    TargetLowering::ArgListTy Args;
    TargetLowering::ArgListEntry Entry;
@@ -2309,14 +2326,17 @@ void DAGTypeLegalizer::ExpandIntRes_XMULO(SDNode *N,
    Args.push_back(Entry);
  
    SDValue Func = DAG.getExternalSymbol(TLI.getLibcallName(LC), PtrVT);
-  std::pair<SDValue, SDValue> CallInfo =
-    TLI.LowerCallTo(Chain, RetTy, true, false, false, false,
-                   0, TLI.getLibcallCallingConv(LC), false,
-                   true, Func, Args, DAG, dl);
+  TargetLowering::
+  CallLoweringInfo CLI(Chain, RetTy, true, false, false, false,
+                       0, TLI.getLibcallCallingConv(LC),
+                       /*isTailCall=*/false,
+                       /*doesNotReturn=*/false, /*isReturnValueUsed=*/true,
+                       Func, Args, DAG, dl);
+  std::pair<SDValue, SDValue> CallInfo = TLI.LowerCallTo(CLI);
  
    SplitInteger(CallInfo.first, Lo, Hi);
    SDValue Temp2 = DAG.getLoad(PtrVT, dl, CallInfo.second, Temp,
-                             MachinePointerInfo(), false, false, false, 0);
+                              MachinePointerInfo(), false, false, false, 0);
    SDValue Ofl = DAG.getSetCC(dl, N->getValueType(1), Temp2,
                               DAG.getConstant(0, PtrVT),
                               ISD::SETNE);
@@ -2787,7 +2807,7 @@ SDValue DAGTypeLegalizer::ExpandIntOp_UINT_TO_FP(SDNode *N) {
      else if (SrcVT == MVT::i128)
        FF = APInt(32, F32TwoE128);
      else
-      assert(false && "Unsupported UINT_TO_FP!");
+      llvm_unreachable("Unsupported UINT_TO_FP!");
  
      // Check whether the sign bit is set.
      SDValue Lo, Hi;