Change:

[oota-llvm.git] / lib / CodeGen / SelectionDAG / LegalizeVectorOps.cpp
diff --git a/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp b/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp

index df9af2147ca5b7627a2cd7348826c66d2d1ff91c..80b4c6053a68da9689d38f2750c16280eed6c9c2 100644 (file)
--- a/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp
+++ b/lib/CodeGen/SelectionDAG/LegalizeVectorOps.cpp
@@ -20,8 +20,8 @@
  // type i8 which must be promoted.
  //
  // This does not legalize vector manipulations like ISD::BUILD_VECTOR,
-// or operations that happen to take a vector which are custom-lowered like
-// ISD::CALL; the legalization for such operations never produces nodes
+// or operations that happen to take a vector which are custom-lowered;
+// the legalization for such operations never produces nodes
  // with illegal types, so it's okay to put off legalizing them until
  // SelectionDAG::Legalize runs.
  //
@@ -34,7 +34,7 @@ using namespace llvm;
  namespace {
  class VectorLegalizer {
    SelectionDAG& DAG;
-  TargetLowering& TLI;
+  const TargetLowering &TLI;
    bool Changed; // Keep track of whether anything changed
  
    /// LegalizedNodes - For nodes that are of legal width, and that have more
@@ -54,13 +54,16 @@ class VectorLegalizer {
    SDValue LegalizeOp(SDValue Op);
    // Assuming the node is legal, "legalize" the results
    SDValue TranslateLegalizeResults(SDValue Op, SDValue Result);
-  // Implements unrolling a generic vector operation, i.e. turning it into
-  // scalar operations.
-  SDValue UnrollVectorOp(SDValue Op);
    // Implements unrolling a VSETCC.
    SDValue UnrollVSETCC(SDValue Op);
    // Implements expansion for FNEG; falls back to UnrollVectorOp if FSUB
    // isn't legal.
+  // Implements expansion for UINT_TO_FLOAT; falls back to UnrollVectorOp if
+  // SINT_TO_FLOAT and SHR on vectors isn't legal.
+  SDValue ExpandUINT_TO_FLOAT(SDValue Op);
+  // Implement vselect in terms of XOR, AND, OR when blend is not supported
+  // by the target.
+  SDValue ExpandVSELECT(SDValue Op);
    SDValue ExpandFNEG(SDValue Op);
    // Implements vector promotion; this is essentially just bitcasting the
    // operands to a different type and bitcasting the result back to the
@@ -82,7 +85,7 @@ bool VectorLegalizer::Run() {
    // node is only legalized after all of its operands are legalized.
    DAG.AssignTopologicalOrder();
    for (SelectionDAG::allnodes_iterator I = DAG.allnodes_begin(),
-       E = prior(DAG.allnodes_end()); I != next(E); ++I)
+       E = prior(DAG.allnodes_end()); I != llvm::next(E); ++I)
      LegalizeOp(SDValue(I, 0));
  
    // Finally, it's possible the root changed.  Get the new root.
@@ -119,7 +122,7 @@ SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
      Ops.push_back(LegalizeOp(Node->getOperand(i)));
  
    SDValue Result =
-      DAG.UpdateNodeOperands(Op.getValue(0), Ops.data(), Ops.size());
+    SDValue(DAG.UpdateNodeOperands(Op.getNode(), Ops.data(), Ops.size()), 0);
  
    bool HasVectorValue = false;
    for (SDNode::value_iterator J = Node->value_begin(), E = Node->value_end();
@@ -129,6 +132,7 @@ SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
    if (!HasVectorValue)
      return TranslateLegalizeResults(Op, Result);
  
+  EVT QueryType;
    switch (Op.getOpcode()) {
    default:
      return TranslateLegalizeResults(Op, Result);
@@ -156,14 +160,13 @@ SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
    case ISD::CTLZ:
    case ISD::CTPOP:
    case ISD::SELECT:
+  case ISD::VSELECT:
    case ISD::SELECT_CC:
-  case ISD::VSETCC:
+  case ISD::SETCC:
    case ISD::ZERO_EXTEND:
    case ISD::ANY_EXTEND:
    case ISD::TRUNCATE:
    case ISD::SIGN_EXTEND:
-  case ISD::SINT_TO_FP:
-  case ISD::UINT_TO_FP:
    case ISD::FP_TO_SINT:
    case ISD::FP_TO_UINT:
    case ISD::FNEG:
@@ -183,10 +186,19 @@ SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
    case ISD::FRINT:
    case ISD::FNEARBYINT:
    case ISD::FFLOOR:
+  case ISD::SIGN_EXTEND_INREG:
+    QueryType = Node->getValueType(0);
+    break;
+  case ISD::FP_ROUND_INREG:
+    QueryType = cast<VTSDNode>(Node->getOperand(1))->getVT();
+    break;
+  case ISD::SINT_TO_FP:
+  case ISD::UINT_TO_FP:
+    QueryType = Node->getOperand(0).getValueType();
      break;
    }
  
-  switch (TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0))) {
+  switch (TLI.getOperationAction(Node->getOpcode(), QueryType)) {
    case TargetLowering::Promote:
      // "Promote" the operation by bitcasting
      Result = PromoteVectorOp(Op);
@@ -202,12 +214,16 @@ SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
      // FALL THROUGH
    }
    case TargetLowering::Expand:
-    if (Node->getOpcode() == ISD::FNEG)
+    if (Node->getOpcode() == ISD::VSELECT)
+      Result = ExpandVSELECT(Op);
+    else if (Node->getOpcode() == ISD::UINT_TO_FP)
+      Result = ExpandUINT_TO_FLOAT(Op);
+    else if (Node->getOpcode() == ISD::FNEG)
        Result = ExpandFNEG(Op);
-    else if (Node->getOpcode() == ISD::VSETCC)
+    else if (Node->getOpcode() == ISD::SETCC)
        Result = UnrollVSETCC(Op);
      else
-      Result = UnrollVectorOp(Op);
+      Result = DAG.UnrollVectorOp(Op.getNode());
      break;
    }
  
@@ -227,40 +243,114 @@ SDValue VectorLegalizer::PromoteVectorOp(SDValue Op) {
    // Vector "promotion" is basically just bitcasting and doing the operation
    // in a different type.  For example, x86 promotes ISD::AND on v2i32 to
    // v1i64.
-  MVT VT = Op.getValueType();
+  EVT VT = Op.getValueType();
    assert(Op.getNode()->getNumValues() == 1 &&
           "Can't promote a vector with multiple results!");
-  MVT NVT = TLI.getTypeToPromoteTo(Op.getOpcode(), VT);
+  EVT NVT = TLI.getTypeToPromoteTo(Op.getOpcode(), VT);
    DebugLoc dl = Op.getDebugLoc();
    SmallVector<SDValue, 4> Operands(Op.getNumOperands());
  
    for (unsigned j = 0; j != Op.getNumOperands(); ++j) {
      if (Op.getOperand(j).getValueType().isVector())
-      Operands[j] = DAG.getNode(ISD::BIT_CONVERT, dl, NVT, Op.getOperand(j));
+      Operands[j] = DAG.getNode(ISD::BITCAST, dl, NVT, Op.getOperand(j));
      else
        Operands[j] = Op.getOperand(j);
    }
  
    Op = DAG.getNode(Op.getOpcode(), dl, NVT, &Operands[0], Operands.size());
  
-  return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Op);
+  return DAG.getNode(ISD::BITCAST, dl, VT, Op);
+}
+
+/// ExpandVSELECT - Expand VSELECT as (Op1 & Mask) | (Op2 & ~Mask), computed in
+/// the mask's vector type and bitcast back to the result type.  Unrolls to
+/// scalar operations if vector AND, XOR or OR is unavailable for that type.
+SDValue VectorLegalizer::ExpandVSELECT(SDValue Op) {
+  SDValue Mask = Op.getOperand(0);
+  SDValue Op1 = Op.getOperand(1);
+  SDValue Op2 = Op.getOperand(2);
+  EVT VT = Mask.getValueType();
+  DebugLoc DL = Op.getDebugLoc();
+
+  // If we can't even use the basic vector operations of
+  // AND,OR,XOR, we will have to scalarize the op.
+  if (!TLI.isOperationLegalOrCustom(ISD::AND, VT) ||
+      !TLI.isOperationLegalOrCustom(ISD::XOR, VT) ||
+      !TLI.isOperationLegalOrCustom(ISD::OR, VT))
+    return DAG.UnrollVectorOp(Op.getNode());
+
+  assert(VT.getSizeInBits() == Op1.getValueType().getSizeInBits() &&
+         "Invalid mask size");
+  // Bitcast the operands to be the same type as the mask.  This is needed when
+  // we select between FP types because the mask is a vector of integers.
+  Op1 = DAG.getNode(ISD::BITCAST, DL, VT, Op1);
+  Op2 = DAG.getNode(ISD::BITCAST, DL, VT, Op2);
+
+  SDValue AllOnes = DAG.getConstant(
+    APInt::getAllOnesValue(VT.getScalarType().getSizeInBits()), VT);
+  SDValue NotMask = DAG.getNode(ISD::XOR, DL, VT, Mask, AllOnes);
+  Op1 = DAG.getNode(ISD::AND, DL, VT, Op1, Mask);
+  Op2 = DAG.getNode(ISD::AND, DL, VT, Op2, NotMask);
+  SDValue Val = DAG.getNode(ISD::OR, DL, VT, Op1, Op2);
+  // The blend was computed in the mask type; return the node's own type.
+  return DAG.getNode(ISD::BITCAST, DL, Op.getValueType(), Val);
+}
+
+/// ExpandUINT_TO_FLOAT - Expand a vector UINT_TO_FP by converting the high and
+/// low halves of each element with SINT_TO_FP and recombining them as
+/// fHI * 2^(BW/2) + fLO.  Unrolls if vector SINT_TO_FP or SRL is unavailable.
+SDValue VectorLegalizer::ExpandUINT_TO_FLOAT(SDValue Op) {
+  EVT VT = Op.getOperand(0).getValueType();
+  DebugLoc DL = Op.getDebugLoc();
+
+  // Make sure that the SINT_TO_FP and SRL instructions are available.
+  if (!TLI.isOperationLegalOrCustom(ISD::SINT_TO_FP, VT) ||
+      !TLI.isOperationLegalOrCustom(ISD::SRL, VT))
+    return DAG.UnrollVectorOp(Op.getNode());
+
+  unsigned BW = VT.getScalarType().getSizeInBits();
+  assert((BW == 64 || BW == 32) &&
+         "Elements in vector-UINT_TO_FP must be 32 or 64 bits wide");
+  SDValue HalfWord = DAG.getConstant(BW/2, VT);
+
+  // Constants to clear the upper part of the word.  Notice that we can also
+  // use SHL+SHR, but using a constant is slightly faster on x86.
+  uint64_t HWMask = (BW == 64) ? 0x00000000FFFFFFFF : 0x0000FFFF;
+  SDValue HalfWordMask = DAG.getConstant(HWMask, VT);
+
+  // Two to the power of half-word-size.  Shift a 64-bit one: BW/2 is 32 for
+  // 64-bit elements, and shifting a plain int that far is undefined.
+  SDValue TWOHW = DAG.getConstantFP(static_cast<double>(1ULL << (BW/2)),
+                                    Op.getValueType());
+
+  // Clear upper part of LO, lower HI
+  SDValue HI = DAG.getNode(ISD::SRL, DL, VT, Op.getOperand(0), HalfWord);
+  SDValue LO = DAG.getNode(ISD::AND, DL, VT, Op.getOperand(0), HalfWordMask);
+
+  // Convert hi and lo to floats, then scale the hi part back up.
+  SDValue fHI = DAG.getNode(ISD::SINT_TO_FP, DL, Op.getValueType(), HI);
+          fHI = DAG.getNode(ISD::FMUL, DL, Op.getValueType(), fHI, TWOHW);
+  SDValue fLO = DAG.getNode(ISD::SINT_TO_FP, DL, Op.getValueType(), LO);
+  // Add the two halves
+  return DAG.getNode(ISD::FADD, DL, Op.getValueType(), fHI, fLO);
  }
  
+
  SDValue VectorLegalizer::ExpandFNEG(SDValue Op) {
    if (TLI.isOperationLegalOrCustom(ISD::FSUB, Op.getValueType())) {
      SDValue Zero = DAG.getConstantFP(-0.0, Op.getValueType());
      return DAG.getNode(ISD::FSUB, Op.getDebugLoc(), Op.getValueType(),
                         Zero, Op.getOperand(0));
    }
-  return UnrollVectorOp(Op);
+  return DAG.UnrollVectorOp(Op.getNode());
  }
  
  SDValue VectorLegalizer::UnrollVSETCC(SDValue Op) {
-  MVT VT = Op.getValueType();
+  EVT VT = Op.getValueType();
    unsigned NumElems = VT.getVectorNumElements();
-  MVT EltVT = VT.getVectorElementType();
+  EVT EltVT = VT.getVectorElementType();
    SDValue LHS = Op.getOperand(0), RHS = Op.getOperand(1), CC = Op.getOperand(2);
-  MVT TmpEltVT = LHS.getValueType().getVectorElementType();
+  EVT TmpEltVT = LHS.getValueType().getVectorElementType();
    DebugLoc dl = Op.getDebugLoc();
    SmallVector<SDValue, 8> Ops(NumElems);
    for (unsigned i = 0; i < NumElems; ++i) {
@@ -278,56 +368,6 @@ SDValue VectorLegalizer::UnrollVSETCC(SDValue Op) {
    return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, &Ops[0], NumElems);
  }
  
-/// UnrollVectorOp - We know that the given vector has a legal type, however
-/// the operation it performs is not legal, and the target has requested that
-/// the operation be expanded.  "Unroll" the vector, splitting out the scalars
-/// and operating on each element individually.
-SDValue VectorLegalizer::UnrollVectorOp(SDValue Op) {
-  MVT VT = Op.getValueType();
-  assert(Op.getNode()->getNumValues() == 1 &&
-         "Can't unroll a vector with multiple results!");
-  unsigned NE = VT.getVectorNumElements();
-  MVT EltVT = VT.getVectorElementType();
-  DebugLoc dl = Op.getDebugLoc();
-
-  SmallVector<SDValue, 8> Scalars;
-  SmallVector<SDValue, 4> Operands(Op.getNumOperands());
-  for (unsigned i = 0; i != NE; ++i) {
-    for (unsigned j = 0; j != Op.getNumOperands(); ++j) {
-      SDValue Operand = Op.getOperand(j);
-      MVT OperandVT = Operand.getValueType();
-      if (OperandVT.isVector()) {
-        // A vector operand; extract a single element.
-        MVT OperandEltVT = OperandVT.getVectorElementType();
-        Operands[j] = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl,
-                                  OperandEltVT,
-                                  Operand,
-                                  DAG.getConstant(i, MVT::i32));
-      } else {
-        // A scalar operand; just use it as is.
-        Operands[j] = Operand;
-      }
-    }
-
-    switch (Op.getOpcode()) {
-    default:
-      Scalars.push_back(DAG.getNode(Op.getOpcode(), dl, EltVT,
-                                    &Operands[0], Operands.size()));
-      break;
-    case ISD::SHL:
-    case ISD::SRA:
-    case ISD::SRL:
-    case ISD::ROTL:
-    case ISD::ROTR:
-      Scalars.push_back(DAG.getNode(Op.getOpcode(), dl, EltVT, Operands[0],
-                                    DAG.getShiftAmountOperand(Operands[1])));
-      break;
-    }
-  }
-
-  return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, &Scalars[0], Scalars.size());
-}
-
  }
  
  bool SelectionDAG::LegalizeVectors() {