Covert VORRIMM to be produced via early target-specific DAG combining, rather than...

author Owen Anderson <resistor@mac.com>

Wed, 3 Nov 2010 23:15:26 +0000 (23:15 +0000)

committer Owen Anderson <resistor@mac.com>

Wed, 3 Nov 2010 23:15:26 +0000 (23:15 +0000)
author Owen Anderson <resistor@mac.com>
Wed, 3 Nov 2010 23:15:26 +0000 (23:15 +0000)
committer Owen Anderson <resistor@mac.com>
Wed, 3 Nov 2010 23:15:26 +0000 (23:15 +0000)
diff --git a/lib/Target/ARM/ARMISelLowering.cpp b/lib/Target/ARM/ARMISelLowering.cpp

index 7a3a747f50c2946fa25daf74a5e533c1a9d371fa..0cc6f2298bfbb03eb7b519338bb428f5fe508397 100644 (file)
--- a/lib/Target/ARM/ARMISelLowering.cpp
+++ b/lib/Target/ARM/ARMISelLowering.cpp
@@ -101,7 +101,6 @@ void ARMTargetLowering::addTypeForNEON(EVT VT, EVT PromotedLdStVT,
      setOperationAction(ISD::SHL, VT.getSimpleVT(), Custom);
      setOperationAction(ISD::SRA, VT.getSimpleVT(), Custom);
      setOperationAction(ISD::SRL, VT.getSimpleVT(), Custom);
-    setOperationAction(ISD::OR, VT.getSimpleVT(), Custom);
      setLoadExtAction(ISD::SEXTLOAD, VT.getSimpleVT(), Expand);
      setLoadExtAction(ISD::ZEXTLOAD, VT.getSimpleVT(), Expand);
      for (unsigned InnerVT = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
@@ -3433,32 +3432,6 @@ static SDValue IsSingleInstrConstant(SDValue N, SelectionDAG &DAG,
    return SDValue();
  }
  
-static SDValue LowerOR(SDValue Op, SelectionDAG &DAG) {
-  SDValue Op1 = Op.getOperand(1);
-  while (Op1.getOpcode() == ISD::BIT_CONVERT && Op1.getOperand(0) != Op1)
-    Op1 = Op1.getOperand(0);
-  if (Op1.getOpcode() != ARMISD::VMOVIMM) return Op;
-  
-  ConstantSDNode* TargetConstant = cast<ConstantSDNode>(Op1.getOperand(0));
-  uint32_t ConstVal = TargetConstant->getZExtValue();
-
-  // FIXME: VORRIMM only supports immediate encodings of 16 and 32 bit size.
-  // In theory for VMOVIMMs whose value is already encoded as with an
-  // 8 bit encoding, we could re-encode it as a 16 or 32 bit immediate.
-  EVT VorrVT = Op1.getValueType();
-  EVT EltVT = VorrVT.getVectorElementType();
-  if (EltVT != MVT::i16 && EltVT != MVT::i32) return Op;
-  
-  ConstVal |= 0x0100;
-  SDValue OrConst = DAG.getTargetConstant(ConstVal, MVT::i32);
-  
-  DebugLoc dl = Op.getDebugLoc();
-  EVT VT = Op.getValueType();
-  SDValue toTy = DAG.getNode(ISD::BIT_CONVERT, dl, VorrVT, Op.getOperand(0));
-  SDValue Vorr = DAG.getNode(ARMISD::VORRIMM, dl, VorrVT, toTy, OrConst);
-  return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Vorr);
-}
-
  // If this is a case we can't handle, return null and let the default
  // expansion code take care of it.
  static SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG,
@@ -3927,7 +3900,6 @@ SDValue ARMTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) const {
    case ISD::CONCAT_VECTORS: return LowerCONCAT_VECTORS(Op, DAG);
    case ISD::FLT_ROUNDS_:   return LowerFLT_ROUNDS_(Op, DAG);
    case ISD::MUL:           return LowerMUL(Op, DAG);
-  case ISD::OR:            return LowerOR(Op, DAG);
    }
    return SDValue();
  }
@@ -4474,6 +4446,31 @@ static SDValue PerformMULCombine(SDNode *N,
  static SDValue PerformORCombine(SDNode *N,
                                  TargetLowering::DAGCombinerInfo &DCI,
                                  const ARMSubtarget *Subtarget) {
+  // Attempt to use immediate-form VORR
+  BuildVectorSDNode *BVN = dyn_cast<BuildVectorSDNode>(N->getOperand(1));
+  DebugLoc dl = N->getDebugLoc();
+  EVT VT = N->getValueType(0);
+  SelectionDAG &DAG = DCI.DAG;
+  
+  APInt SplatBits, SplatUndef;
+  unsigned SplatBitSize;
+  bool HasAnyUndefs;
+  if (BVN && Subtarget->hasNEON() &&
+      BVN->isConstantSplat(SplatBits, SplatUndef, SplatBitSize, HasAnyUndefs)) {
+    if (SplatBitSize <= 64) {
+      EVT VorrVT;
+      SDValue Val = isNEONModifiedImm(SplatBits.getZExtValue(),
+                                      SplatUndef.getZExtValue(), SplatBitSize,
+                                      DAG, VorrVT, VT.is128BitVector(), false);
+      if (Val.getNode()) {
+        SDValue Input =
+          DAG.getNode(ISD::BIT_CONVERT, dl, VorrVT, N->getOperand(0));
+        SDValue Vorr = DAG.getNode(ARMISD::VORRIMM, dl, VorrVT, Input, Val);
+        return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Vorr);
+      }
+    }
+  }
+
    // Try to use the ARM/Thumb2 BFI (bitfield insert) instruction when
    // reasonable.
  
@@ -4481,7 +4478,6 @@ static SDValue PerformORCombine(SDNode *N,
    if (Subtarget->isThumb1Only() || !Subtarget->hasV6T2Ops())
      return SDValue();
  
-  SelectionDAG &DAG = DCI.DAG;
    SDValue N0 = N->getOperand(0), N1 = N->getOperand(1);
    DebugLoc DL = N->getDebugLoc();
    // 1) or (and A, mask), val => ARMbfi A, val, mask
@@ -4496,7 +4492,6 @@ static SDValue PerformORCombine(SDNode *N,
    if (N0.getOpcode() != ISD::AND)
      return SDValue();
  
-  EVT VT = N->getValueType(0);
    if (VT != MVT::i32)
      return SDValue();
  
@@ -4565,7 +4560,7 @@ static SDValue PerformORCombine(SDNode *N,
        DCI.CombineTo(N, Res, false);
      }
    }
-
+  
    return SDValue();
  }
  
diff --git a/test/CodeGen/ARM/vbits.ll b/test/CodeGen/ARM/vbits.ll

index 352608b0d4226c435bf137e151bbecfb0811d005..b6077c05ec30839edaeb1cd8bbc1e33a7c69e3bf 100644 (file)
--- a/test/CodeGen/ARM/vbits.ll
+++ b/test/CodeGen/ARM/vbits.ll
@@ -1,4 +1,4 @@
-; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
+; RUN: llc < %s -march=arm -mattr=+neon -mcpu=cortex-a8 | FileCheck %s
  
  define <8 x i8> @v_andi8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
  ;CHECK: v_andi8:
diff --git a/test/MC/ARM/neon-bitwise-encoding.s b/test/MC/ARM/neon-bitwise-encoding.s

index 345b6bb2d268a9c7f0ac89613bc4e74e950bc5e2..43a73ff12805dde3b133ae971d4fc96c28e6f04b 100644 (file)
--- a/test/MC/ARM/neon-bitwise-encoding.s
+++ b/test/MC/ARM/neon-bitwise-encoding.s
@@ -19,6 +19,8 @@
    vorr.i32     d16, #0x1000000
  @ CHECK: vorr.i32      q8, #0x1000000  @ encoding: [0x51,0x07,0xc0,0xf2]
    vorr.i32     q8, #0x1000000
+@ CHECK: vorr.i32      q8, #0x0        @ encoding: [0x50,0x01,0xc0,0xf2]
+  vorr.i32     q8, #0x0
  
  @ CHECK: vbic  d16, d17, d16           @ encoding: [0xb0,0x01,0x51,0xf2]
         vbic    d16, d17, d16
author	Owen Anderson <resistor@mac.com>
	Wed, 3 Nov 2010 23:15:26 +0000 (23:15 +0000)
committer	Owen Anderson <resistor@mac.com>
	Wed, 3 Nov 2010 23:15:26 +0000 (23:15 +0000)
lib/Target/ARM/ARMISelLowering.cpp		patch \| blob \| history
test/CodeGen/ARM/vbits.ll		patch \| blob \| history
test/MC/ARM/neon-bitwise-encoding.s		patch \| blob \| history