When a load operand is promoted to an extload, replace other uses with uses of extloa...

[oota-llvm.git] / lib / CodeGen / SelectionDAG / TargetLowering.cpp
diff --git a/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/lib/CodeGen/SelectionDAG/TargetLowering.cpp

index f923927c43ec92ba54d80bdf955a28e523ee6aa8..33c8d1a36ff06cac66665f261cce64c44cbe1e93 100644 (file)
--- a/lib/CodeGen/SelectionDAG/TargetLowering.cpp
+++ b/lib/CodeGen/SelectionDAG/TargetLowering.cpp
@@ -174,17 +174,25 @@ static void InitLibcallNames(const char **Names) {
    Names[RTLIB::FLOOR_F64] = "floor";
    Names[RTLIB::FLOOR_F80] = "floorl";
    Names[RTLIB::FLOOR_PPCF128] = "floorl";
+  Names[RTLIB::COPYSIGN_F32] = "copysignf";
+  Names[RTLIB::COPYSIGN_F64] = "copysign";
+  Names[RTLIB::COPYSIGN_F80] = "copysignl";
+  Names[RTLIB::COPYSIGN_PPCF128] = "copysignl";
    Names[RTLIB::FPEXT_F32_F64] = "__extendsfdf2";
+  Names[RTLIB::FPEXT_F16_F32] = "__gnu_h2f_ieee";
+  Names[RTLIB::FPROUND_F32_F16] = "__gnu_f2h_ieee";
    Names[RTLIB::FPROUND_F64_F32] = "__truncdfsf2";
    Names[RTLIB::FPROUND_F80_F32] = "__truncxfsf2";
    Names[RTLIB::FPROUND_PPCF128_F32] = "__trunctfsf2";
    Names[RTLIB::FPROUND_F80_F64] = "__truncxfdf2";
    Names[RTLIB::FPROUND_PPCF128_F64] = "__trunctfdf2";
-  Names[RTLIB::FPTOSINT_F32_I8] = "__fixsfi8";
-  Names[RTLIB::FPTOSINT_F32_I16] = "__fixsfi16";
+  Names[RTLIB::FPTOSINT_F32_I8] = "__fixsfqi";
+  Names[RTLIB::FPTOSINT_F32_I16] = "__fixsfhi";
    Names[RTLIB::FPTOSINT_F32_I32] = "__fixsfsi";
    Names[RTLIB::FPTOSINT_F32_I64] = "__fixsfdi";
    Names[RTLIB::FPTOSINT_F32_I128] = "__fixsfti";
+  Names[RTLIB::FPTOSINT_F64_I8] = "__fixdfqi";
+  Names[RTLIB::FPTOSINT_F64_I16] = "__fixdfhi";
    Names[RTLIB::FPTOSINT_F64_I32] = "__fixdfsi";
    Names[RTLIB::FPTOSINT_F64_I64] = "__fixdfdi";
    Names[RTLIB::FPTOSINT_F64_I128] = "__fixdfti";
@@ -194,11 +202,13 @@ static void InitLibcallNames(const char **Names) {
    Names[RTLIB::FPTOSINT_PPCF128_I32] = "__fixtfsi";
    Names[RTLIB::FPTOSINT_PPCF128_I64] = "__fixtfdi";
    Names[RTLIB::FPTOSINT_PPCF128_I128] = "__fixtfti";
-  Names[RTLIB::FPTOUINT_F32_I8] = "__fixunssfi8";
-  Names[RTLIB::FPTOUINT_F32_I16] = "__fixunssfi16";
+  Names[RTLIB::FPTOUINT_F32_I8] = "__fixunssfqi";
+  Names[RTLIB::FPTOUINT_F32_I16] = "__fixunssfhi";
    Names[RTLIB::FPTOUINT_F32_I32] = "__fixunssfsi";
    Names[RTLIB::FPTOUINT_F32_I64] = "__fixunssfdi";
    Names[RTLIB::FPTOUINT_F32_I128] = "__fixunssfti";
+  Names[RTLIB::FPTOUINT_F64_I8] = "__fixunsdfqi";
+  Names[RTLIB::FPTOUINT_F64_I16] = "__fixunsdfhi";
    Names[RTLIB::FPTOUINT_F64_I32] = "__fixunsdfsi";
    Names[RTLIB::FPTOUINT_F64_I64] = "__fixunsdfdi";
    Names[RTLIB::FPTOUINT_F64_I128] = "__fixunsdfti";
@@ -269,6 +279,7 @@ RTLIB::Libcall RTLIB::getFPEXT(EVT OpVT, EVT RetVT) {
      if (RetVT == MVT::f64)
        return FPEXT_F32_F64;
    }
+
    return UNKNOWN_LIBCALL;
  }
  
@@ -288,6 +299,7 @@ RTLIB::Libcall RTLIB::getFPROUND(EVT OpVT, EVT RetVT) {
      if (OpVT == MVT::ppcf128)
        return FPROUND_PPCF128_F64;
    }
+
    return UNKNOWN_LIBCALL;
  }
  
@@ -306,6 +318,10 @@ RTLIB::Libcall RTLIB::getFPTOSINT(EVT OpVT, EVT RetVT) {
      if (RetVT == MVT::i128)
        return FPTOSINT_F32_I128;
    } else if (OpVT == MVT::f64) {
+    if (RetVT == MVT::i8)
+      return FPTOSINT_F64_I8;
+    if (RetVT == MVT::i16)
+      return FPTOSINT_F64_I16;
      if (RetVT == MVT::i32)
        return FPTOSINT_F64_I32;
      if (RetVT == MVT::i64)
@@ -345,6 +361,10 @@ RTLIB::Libcall RTLIB::getFPTOUINT(EVT OpVT, EVT RetVT) {
      if (RetVT == MVT::i128)
        return FPTOUINT_F32_I128;
    } else if (OpVT == MVT::f64) {
+    if (RetVT == MVT::i8)
+      return FPTOUINT_F64_I8;
+    if (RetVT == MVT::i16)
+      return FPTOUINT_F64_I16;
      if (RetVT == MVT::i32)
        return FPTOUINT_F64_I32;
      if (RetVT == MVT::i64)
@@ -460,14 +480,14 @@ static void InitCmpLibcallCCs(ISD::CondCode *CCs) {
  }
  
  /// NOTE: The constructor takes ownership of TLOF.
-TargetLowering::TargetLowering(TargetMachine &tm,TargetLoweringObjectFile *tlof)
+TargetLowering::TargetLowering(const TargetMachine &tm,
+                               const TargetLoweringObjectFile *tlof)
    : TM(tm), TD(TM.getTargetData()), TLOF(*tlof) {
    // All operations default to being supported.
    memset(OpActions, 0, sizeof(OpActions));
    memset(LoadExtActions, 0, sizeof(LoadExtActions));
    memset(TruncStoreActions, 0, sizeof(TruncStoreActions));
    memset(IndexedModeActions, 0, sizeof(IndexedModeActions));
-  memset(ConvertActions, 0, sizeof(ConvertActions));
    memset(CondCodeActions, 0, sizeof(CondCodeActions));
  
    // Set default actions for various operations.
@@ -540,6 +560,24 @@ TargetLowering::~TargetLowering() {
    delete &TLOF;
  }
  
+/// canOpTrap - Returns true if the operation can trap for the value type.
+/// VT must be a legal type (asserted); the answer here depends only on Op.
+bool TargetLowering::canOpTrap(unsigned Op, EVT VT) const {
+  assert(isTypeLegal(VT));
+  switch (Op) {
+  default:  // Any opcode not listed below is reported as non-trapping.
+    return false;
+  case ISD::FDIV:  // The div/rem opcodes below all report true.
+  case ISD::FREM:
+  case ISD::SDIV:
+  case ISD::UDIV:
+  case ISD::SREM:
+  case ISD::UREM:
+    return true;
+  }
+}
+
+
  static unsigned getVectorTypeBreakdownMVT(MVT VT, MVT &IntermediateVT,
                                         unsigned &NumIntermediates,
                                         EVT &RegisterVT,
@@ -683,7 +721,7 @@ void TargetLowering::computeRegisterProperties() {
        unsigned NElts = VT.getVectorNumElements();
        for (unsigned nVT = i+1; nVT <= MVT::LAST_VECTOR_VALUETYPE; ++nVT) {
          EVT SVT = (MVT::SimpleValueType)nVT;
-        if (isTypeLegal(SVT) && SVT.getVectorElementType() == EltVT &&
+        if (isTypeSynthesizable(SVT) && SVT.getVectorElementType() == EltVT &&
              SVT.getVectorNumElements() > NElts && NElts != 1) {
            TransformToType[i] = SVT;
            ValueTypeActions.setTypeAction(VT, Promote);
@@ -774,20 +812,6 @@ unsigned TargetLowering::getVectorTypeBreakdown(LLVMContext &Context, EVT VT,
    return 1;
  }
  
-/// getWidenVectorType: given a vector type, returns the type to widen to
-/// (e.g., v7i8 to v8i8). If the vector type is legal, it returns itself.
-/// If there is no vector type that we want to widen to, returns MVT::Other
-/// When and where to widen is target dependent based on the cost of
-/// scalarizing vs using the wider vector type.
-EVT TargetLowering::getWidenVectorType(EVT VT) const {
-  assert(VT.isVector());
-  if (isTypeLegal(VT))
-    return VT;
- 
-  // Default is not to widen until moved to LegalizeTypes
-  return MVT::Other;
-}
-
  /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
  /// function arguments in the caller parameter area.  This is the actual
  /// alignment, not its logarithm.
@@ -1256,8 +1280,9 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      // variable.  The low bit of the shift cannot be an input sign bit unless
      // the shift amount is >= the size of the datatype, which is undefined.
      if (DemandedMask == 1)
-      return TLO.CombineTo(Op, TLO.DAG.getNode(ISD::SRL, dl, Op.getValueType(),
-                                               Op.getOperand(0), Op.getOperand(1)));
+      return TLO.CombineTo(Op,
+                           TLO.DAG.getNode(ISD::SRL, dl, Op.getValueType(),
+                                           Op.getOperand(0), Op.getOperand(1)));
  
      if (ConstantSDNode *SA = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
        EVT VT = Op.getValueType();
@@ -1423,8 +1448,10 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
    case ISD::TRUNCATE: {
      // Simplify the input, using demanded bit information, and compute the known
      // zero/one bits live out.
+    unsigned OperandBitWidth =
+      Op.getOperand(0).getValueType().getScalarType().getSizeInBits();
      APInt TruncMask = NewMask;
-    TruncMask.zext(Op.getOperand(0).getValueSizeInBits());
+    TruncMask.zext(OperandBitWidth);
      if (SimplifyDemandedBits(Op.getOperand(0), TruncMask,
                               KnownZero, KnownOne, TLO, Depth+1))
        return true;
@@ -1435,29 +1462,34 @@ bool TargetLowering::SimplifyDemandedBits(SDValue Op,
      // on the known demanded bits.
      if (Op.getOperand(0).getNode()->hasOneUse()) {
        SDValue In = Op.getOperand(0);
-      unsigned InBitWidth = In.getValueSizeInBits();
        switch (In.getOpcode()) {
        default: break;
        case ISD::SRL:
          // Shrink SRL by a constant if none of the high bits shifted in are
          // demanded.
-        if (ConstantSDNode *ShAmt = dyn_cast<ConstantSDNode>(In.getOperand(1))){
-          APInt HighBits = APInt::getHighBitsSet(InBitWidth,
-                                                 InBitWidth - BitWidth);
-          HighBits = HighBits.lshr(ShAmt->getZExtValue());
-          HighBits.trunc(BitWidth);
-          
-          if (ShAmt->getZExtValue() < BitWidth && !(HighBits & NewMask)) {
-            // None of the shifted in bits are needed.  Add a truncate of the
-            // shift input, then shift it.
-            SDValue NewTrunc = TLO.DAG.getNode(ISD::TRUNCATE, dl,
-                                                 Op.getValueType(), 
-                                                 In.getOperand(0));
-            return TLO.CombineTo(Op, TLO.DAG.getNode(ISD::SRL, dl,
-                                                     Op.getValueType(),
-                                                     NewTrunc, 
-                                                     In.getOperand(1)));
-          }
+        if (TLO.LegalTypes() &&
+            !isTypeDesirableForOp(ISD::SRL, Op.getValueType()))
+          // Do not turn (vt1 truncate (vt2 srl)) into (vt1 srl) if vt1 is
+          // undesirable.
+          break;
+        ConstantSDNode *ShAmt = dyn_cast<ConstantSDNode>(In.getOperand(1));
+        if (!ShAmt)
+          break;
+        APInt HighBits = APInt::getHighBitsSet(OperandBitWidth,
+                                               OperandBitWidth - BitWidth);
+        HighBits = HighBits.lshr(ShAmt->getZExtValue());
+        HighBits.trunc(BitWidth);
+
+        if (ShAmt->getZExtValue() < BitWidth && !(HighBits & NewMask)) {
+          // None of the shifted in bits are needed.  Add a truncate of the
+          // shift input, then shift it.
+          SDValue NewTrunc = TLO.DAG.getNode(ISD::TRUNCATE, dl,
+                                             Op.getValueType(), 
+                                             In.getOperand(0));
+          return TLO.CombineTo(Op, TLO.DAG.getNode(ISD::SRL, dl,
+                                                   Op.getValueType(),
+                                                   NewTrunc, 
+                                                   In.getOperand(1)));
          }
          break;
        }
@@ -1589,7 +1621,7 @@ static bool ValueHasExactlyOneBitSet(SDValue Val, const SelectionDAG &DAG) {
  
    // Fall back to ComputeMaskedBits to catch other known cases.
    EVT OpVT = Val.getValueType();
-  unsigned BitWidth = OpVT.getSizeInBits();
+  unsigned BitWidth = OpVT.getScalarType().getSizeInBits();
    APInt Mask = APInt::getAllOnesValue(BitWidth);
    APInt KnownZero, KnownOne;
    DAG.ComputeMaskedBits(Val, Mask, KnownZero, KnownOne);
@@ -1698,7 +1730,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
            SDValue NewLoad = DAG.getLoad(newVT, dl, Lod->getChain(), Ptr,
                                          Lod->getSrcValue(), 
                                          Lod->getSrcValueOffset() + bestOffset,
-                                        false, NewAlign);
+                                        false, false, NewAlign);
            return DAG.getSetCC(dl, VT, 
                                DAG.getNode(ISD::AND, dl, newVT, NewLoad,
                                        DAG.getConstant(bestMask.trunc(bestWidth),
@@ -1757,7 +1789,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
          break;   // todo, be more careful with signed comparisons
        }
      } else if (N0.getOpcode() == ISD::SIGN_EXTEND_INREG &&
-                (Cond == ISD::SETEQ || Cond == ISD::SETNE)) {
+               (Cond == ISD::SETEQ || Cond == ISD::SETNE)) {
        EVT ExtSrcTy = cast<VTSDNode>(N0.getOperand(1))->getVT();
        unsigned ExtSrcTyBits = ExtSrcTy.getSizeInBits();
        EVT ExtDstTy = N0.getValueType();
@@ -1791,22 +1823,21 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
                            Cond);
      } else if ((N1C->isNullValue() || N1C->getAPIntValue() == 1) &&
                  (Cond == ISD::SETEQ || Cond == ISD::SETNE)) {
-      
        // SETCC (SETCC), [0|1], [EQ|NE]  -> SETCC
-      if (N0.getOpcode() == ISD::SETCC) {
+      if (N0.getOpcode() == ISD::SETCC &&
+          isTypeLegal(VT) && VT.bitsLE(N0.getValueType())) {
          bool TrueWhenTrue = (Cond == ISD::SETEQ) ^ (N1C->getAPIntValue() != 1);
          if (TrueWhenTrue)
-          return N0;
-        
+          return DAG.getNode(ISD::TRUNCATE, dl, VT, N0);        
          // Invert the condition.
          ISD::CondCode CC = cast<CondCodeSDNode>(N0.getOperand(2))->get();
          CC = ISD::getSetCCInverse(CC, 
                                    N0.getOperand(0).getValueType().isInteger());
          return DAG.getSetCC(dl, VT, N0.getOperand(0), N0.getOperand(1), CC);
        }
-      
+
        if ((N0.getOpcode() == ISD::XOR ||
-            (N0.getOpcode() == ISD::AND && 
+           (N0.getOpcode() == ISD::AND && 
              N0.getOperand(0).getOpcode() == ISD::XOR &&
              N0.getOperand(1) == N0.getOperand(0).getOperand(1))) &&
            isa<ConstantSDNode>(N0.getOperand(1)) &&
@@ -1829,9 +1860,36 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
                                N0.getOperand(0).getOperand(0),
                                N0.getOperand(1));
            }
+
            return DAG.getSetCC(dl, VT, Val, N1,
                                Cond == ISD::SETEQ ? ISD::SETNE : ISD::SETEQ);
          }
+      } else if (N1C->getAPIntValue() == 1 &&
+                 (VT == MVT::i1 ||
+                  getBooleanContents() == ZeroOrOneBooleanContent)) {
+        SDValue Op0 = N0;
+        if (Op0.getOpcode() == ISD::TRUNCATE)
+          Op0 = Op0.getOperand(0);
+
+        if ((Op0.getOpcode() == ISD::XOR) &&
+            Op0.getOperand(0).getOpcode() == ISD::SETCC &&
+            Op0.getOperand(1).getOpcode() == ISD::SETCC) {
+          // (xor (setcc), (setcc)) == / != 1 -> (setcc) != / == (setcc)
+          Cond = (Cond == ISD::SETEQ) ? ISD::SETNE : ISD::SETEQ;
+          return DAG.getSetCC(dl, VT, Op0.getOperand(0), Op0.getOperand(1),
+                              Cond);
+        } else if (Op0.getOpcode() == ISD::AND &&
+                isa<ConstantSDNode>(Op0.getOperand(1)) &&
+                cast<ConstantSDNode>(Op0.getOperand(1))->getAPIntValue() == 1) {
+          // If this is (X&1) == / != 1, normalize it to (X&1) != / == 0.
+          if (Op0.getValueType() != VT)
+            Op0 = DAG.getNode(ISD::AND, dl, VT,
+                          DAG.getNode(ISD::TRUNCATE, dl, VT, Op0.getOperand(0)),
+                          DAG.getConstant(1, VT));
+          return DAG.getSetCC(dl, VT, Op0,
+                              DAG.getConstant(0, Op0.getValueType()),
+                              Cond == ISD::SETEQ ? ISD::SETNE : ISD::SETEQ);
+        }
        }
      }
      
@@ -2195,7 +2253,7 @@ TargetLowering::SimplifySetCC(EVT VT, SDValue N0, SDValue N1,
  
  /// isGAPlusOffset - Returns true (and the GlobalValue and the offset) if the
  /// node is a GlobalAddress + offset.
-bool TargetLowering::isGAPlusOffset(SDNode *N, GlobalValue* &GA,
+bool TargetLowering::isGAPlusOffset(SDNode *N, const GlobalValue* &GA,
                                      int64_t &Offset) const {
    if (isa<GlobalAddressSDNode>(N)) {
      GlobalAddressSDNode *GASD = cast<GlobalAddressSDNode>(N);
@@ -2366,7 +2424,7 @@ getRegForInlineAsmConstraint(const std::string &Constraint,
         E = RI->regclass_end(); RCI != E; ++RCI) {
      const TargetRegisterClass *RC = *RCI;
      
-    // If none of the the value types for this register class are valid, we 
+    // If none of the value types for this register class are valid, we 
      // can't use it.  For example, 64-bit reg classes on 32-bit targets.
      bool isLegal = false;
      for (TargetRegisterClass::vt_iterator I = RC->vt_begin(), E = RC->vt_end();