Cosmetic changes.

[oota-llvm.git] / lib / Target / ARM / ARMISelDAGToDAG.cpp
diff --git a/lib/Target/ARM/ARMISelDAGToDAG.cpp b/lib/Target/ARM/ARMISelDAGToDAG.cpp

index 7b378e66b6fbd7d53fa2ecdcf6e7620cbd3068c8..57a12f09e046888210a8ca38ef7f6eba173e2299 100644 (file)
--- a/lib/Target/ARM/ARMISelDAGToDAG.cpp
+++ b/lib/Target/ARM/ARMISelDAGToDAG.cpp
@@ -13,7 +13,6 @@
  
  #include "ARM.h"
  #include "ARMAddressingModes.h"
-#include "ARMISelLowering.h"
  #include "ARMTargetMachine.h"
  #include "llvm/CallingConv.h"
  #include "llvm/Constants.h"
@@ -28,6 +27,7 @@
  #include "llvm/CodeGen/SelectionDAGISel.h"
  #include "llvm/Target/TargetLowering.h"
  #include "llvm/Target/TargetOptions.h"
+#include "llvm/Support/CommandLine.h"
  #include "llvm/Support/Compiler.h"
  #include "llvm/Support/Debug.h"
  #include "llvm/Support/ErrorHandling.h"
@@ -35,6 +35,10 @@
  
  using namespace llvm;
  
+static cl::opt<bool>
+UseRegSeq("neon-reg-sequence", cl::Hidden,
+          cl::desc("Use reg_sequence to model ld / st of multiple neon regs"));
+
  //===--------------------------------------------------------------------===//
  /// ARMDAGToDAGISel - ARM specific code to select ARM machine
  /// instructions for SelectionDAG operations.
@@ -143,7 +147,7 @@ private:
                            unsigned *QOpcodes1);
  
    /// SelectV6T2BitfieldExtractOp - Select SBFX/UBFX instructions for ARM.
-  SDNode *SelectV6T2BitfieldExtractOp(SDNode *N, unsigned Opc);
+  SDNode *SelectV6T2BitfieldExtractOp(SDNode *N, bool isSigned);
  
    /// SelectCMOVOp - Select CMOV instructions for ARM.
    SDNode *SelectCMOVOp(SDNode *N);
@@ -160,6 +164,8 @@ private:
                                 ARMCC::CondCodes CCVal, SDValue CCR,
                                 SDValue InFlag);
  
+  SDNode *SelectConcatVector(SDNode *N);
+
    /// SelectInlineAsmMemoryOperand - Implement addressing mode selection for
    /// inline asm expressions.
    virtual bool SelectInlineAsmMemoryOperand(const SDValue &Op,
@@ -940,10 +946,14 @@ SDNode *ARMDAGToDAGISel::SelectT2IndexedLoad(SDNode *N) {
  /// form a quad register.
  SDNode *ARMDAGToDAGISel::PairDRegs(EVT VT, SDValue V0, SDValue V1) {
    DebugLoc dl = V0.getNode()->getDebugLoc();
-  SDValue Undef =
-    SDValue(CurDAG->getMachineNode(TargetOpcode::IMPLICIT_DEF, dl, VT), 0);
    SDValue SubReg0 = CurDAG->getTargetConstant(ARM::DSUBREG_0, MVT::i32);
    SDValue SubReg1 = CurDAG->getTargetConstant(ARM::DSUBREG_1, MVT::i32);
+  if (llvm::ModelWithRegSequence()) {
+    const SDValue Ops[] = { V0, SubReg0, V1, SubReg1 };
+    return CurDAG->getMachineNode(TargetOpcode::REG_SEQUENCE, dl, VT, Ops, 4);
+  }
+  SDValue Undef =
+    SDValue(CurDAG->getMachineNode(TargetOpcode::IMPLICIT_DEF, dl, VT), 0);
    SDNode *Pair = CurDAG->getMachineNode(TargetOpcode::INSERT_SUBREG, dl,
                                          VT, Undef, V0, SubReg0);
    return CurDAG->getMachineNode(TargetOpcode::INSERT_SUBREG, dl,
@@ -1249,10 +1259,42 @@ SDNode *ARMDAGToDAGISel::SelectVLDSTLane(SDNode *N, bool IsLoad,
  }
  
  SDNode *ARMDAGToDAGISel::SelectV6T2BitfieldExtractOp(SDNode *N,
-                                                     unsigned Opc) {
+                                                     bool isSigned) {
    if (!Subtarget->hasV6T2Ops())
      return NULL;
  
+  unsigned Opc = isSigned ? (Subtarget->isThumb() ? ARM::t2SBFX : ARM::SBFX)
+    : (Subtarget->isThumb() ? ARM::t2UBFX : ARM::UBFX);
+
+
+  // For unsigned extracts, check for a shift right and mask
+  unsigned And_imm = 0;
+  if (N->getOpcode() == ISD::AND) {
+    if (isOpcWithIntImmediate(N, ISD::AND, And_imm)) {
+
+      // The immediate is a mask of the low bits iff imm & (imm+1) == 0
+      if (And_imm & (And_imm + 1))
+        return NULL;
+
+      unsigned Srl_imm = 0;
+      if (isOpcWithIntImmediate(N->getOperand(0).getNode(), ISD::SRL,
+                                Srl_imm)) {
+        assert(Srl_imm > 0 && Srl_imm < 32 && "bad amount in shift node!");
+
+        unsigned Width = CountTrailingOnes_32(And_imm);
+        unsigned LSB = Srl_imm;
+        SDValue Reg0 = CurDAG->getRegister(0, MVT::i32);
+        SDValue Ops[] = { N->getOperand(0).getOperand(0),
+                          CurDAG->getTargetConstant(LSB, MVT::i32),
+                          CurDAG->getTargetConstant(Width, MVT::i32),
+          getAL(CurDAG), Reg0 };
+        return CurDAG->SelectNodeTo(N, Opc, MVT::i32, Ops, 5);
+      }
+    }
+    return NULL;
+  }
+
+  // Otherwise, we're looking for a shift of a shift
    unsigned Shl_imm = 0;
    if (isOpcWithIntImmediate(N->getOperand(0).getNode(), ISD::SHL, Shl_imm)) {
      assert(Shl_imm > 0 && Shl_imm < 32 && "bad amount in shift node!");
@@ -1441,6 +1483,21 @@ SDNode *ARMDAGToDAGISel::SelectCMOVOp(SDNode *N) {
    return CurDAG->SelectNodeTo(N, Opc, VT, Ops, 5);
  }
  
+SDNode *ARMDAGToDAGISel::SelectConcatVector(SDNode *N) {
+  // The only time a CONCAT_VECTORS operation can have legal types is when
+  // two 64-bit vectors form a 128-bit vector; emit that as a REG_SEQUENCE.
+  EVT VT = N->getValueType(0);
+  if (!VT.is128BitVector() || N->getNumOperands() != 2)
+    llvm_unreachable("unexpected CONCAT_VECTORS");
+  DebugLoc dl = N->getDebugLoc();
+  SDValue V0 = N->getOperand(0);
+  SDValue V1 = N->getOperand(1);
+  SDValue SubReg0 = CurDAG->getTargetConstant(ARM::DSUBREG_0, MVT::i32);
+  SDValue SubReg1 = CurDAG->getTargetConstant(ARM::DSUBREG_1, MVT::i32);
+  const SDValue Ops[] = { V0, SubReg0, V1, SubReg1 };
+  return CurDAG->getMachineNode(TargetOpcode::REG_SEQUENCE, dl, VT, Ops, 4);
+}
+
  SDNode *ARMDAGToDAGISel::Select(SDNode *N) {
    DebugLoc dl = N->getDebugLoc();
  
@@ -1516,13 +1573,11 @@ SDNode *ARMDAGToDAGISel::Select(SDNode *N) {
      }
    }
    case ISD::SRL:
-    if (SDNode *I = SelectV6T2BitfieldExtractOp(N,
-                      Subtarget->isThumb() ? ARM::t2UBFX : ARM::UBFX))
+    if (SDNode *I = SelectV6T2BitfieldExtractOp(N, false))
        return I;
      break;
    case ISD::SRA:
-    if (SDNode *I = SelectV6T2BitfieldExtractOp(N,
-                      Subtarget->isThumb() ? ARM::t2SBFX : ARM::SBFX))
+    if (SDNode *I = SelectV6T2BitfieldExtractOp(N, true))
        return I;
      break;
    case ISD::MUL:
@@ -1566,6 +1621,10 @@ SDNode *ARMDAGToDAGISel::Select(SDNode *N) {
      }
      break;
    case ISD::AND: {
+    // Check for unsigned bitfield extract
+    if (SDNode *I = SelectV6T2BitfieldExtractOp(N, false))
+      return I;
+
      // (and (or x, c2), c1) and top 16-bits of c1 and c2 match, lower 16-bits
      // of c1 are 0xffff, and lower 16-bit of c2 are 0. That is, the top 16-bits
      // are entirely contributed by c2 and lower 16-bits are entirely contributed
@@ -1930,6 +1989,10 @@ SDNode *ARMDAGToDAGISel::Select(SDNode *N) {
      }
      }
    }
+
+  case ISD::CONCAT_VECTORS: {
+    return SelectConcatVector(N);
+  }
    }
  
    return SelectCode(N);
@@ -1953,3 +2016,9 @@ FunctionPass *llvm::createARMISelDag(ARMBaseTargetMachine &TM,
                                       CodeGenOpt::Level OptLevel) {
    return new ARMDAGToDAGISel(TM, OptLevel);
  }
+
+/// ModelWithRegSequence - Return true if isel should use REG_SEQUENCE to model
+/// operations involving sub-registers (the hidden -neon-reg-sequence flag).
+bool llvm::ModelWithRegSequence() {
+  return UseRegSeq;
+}