Prevents PerformShuffleCombine from creating a node with an illegal type after legali...

author Mon P Wang <wangmp@apple.com>

Sun, 19 Dec 2010 23:55:53 +0000 (23:55 +0000)

committer Mon P Wang <wangmp@apple.com>

Sun, 19 Dec 2010 23:55:53 +0000 (23:55 +0000)
author Mon P Wang <wangmp@apple.com>
Sun, 19 Dec 2010 23:55:53 +0000 (23:55 +0000)
committer Mon P Wang <wangmp@apple.com>
Sun, 19 Dec 2010 23:55:53 +0000 (23:55 +0000)
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index 48e418d57ceaa5d5f454b8c10828efd723015e10..3e3ab691bceb0ab14e37af450411699291fca5c8 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -10372,13 +10372,18 @@ bool X86TargetLowering::isGAPlusOffset(SDNode *N,
  /// if the load addresses are consecutive, non-overlapping, and in the right
  /// order.
  static SDValue PerformShuffleCombine(SDNode *N, SelectionDAG &DAG,
-                                     const TargetLowering &TLI) {
+                                     TargetLowering::DAGCombinerInfo &DCI) {
    DebugLoc dl = N->getDebugLoc();
    EVT VT = N->getValueType(0);
  
    if (VT.getSizeInBits() != 128)
      return SDValue();
  
+  // Don't create instructions with illegal types after legalize types has run.
+  const TargetLowering &TLI = DAG.getTargetLoweringInfo();
+  if (!DCI.isBeforeLegalize() && !TLI.isTypeLegal(VT.getVectorElementType()))
+    return SDValue();
+
    SmallVector<SDValue, 16> Elts;
    for (unsigned i = 0, e = VT.getVectorNumElements(); i != e; ++i)
      Elts.push_back(getShuffleScalarElt(N, i, DAG, 0));
@@ -11485,7 +11490,7 @@ SDValue X86TargetLowering::PerformDAGCombine(SDNode *N,
    case X86ISD::PSHUFLW:
    case X86ISD::MOVSS:
    case X86ISD::MOVSD:
-  case ISD::VECTOR_SHUFFLE: return PerformShuffleCombine(N, DAG, *this);
+  case ISD::VECTOR_SHUFFLE: return PerformShuffleCombine(N, DAG, DCI);
    }
  
    return SDValue();
diff --git a/test/CodeGen/X86/vec_shuffle-27.ll b/test/CodeGen/X86/vec_shuffle-27.ll

index d700ccbf530324223716cb59ed4970f3a68de9dd..0556284d0ce608e7e2350f6c57609a50d473b70a 100644 (file)
--- a/test/CodeGen/X86/vec_shuffle-27.ll
+++ b/test/CodeGen/X86/vec_shuffle-27.ll
@@ -1,7 +1,4 @@
-; RUN: llc < %s -march=x86 -mattr=sse41 -o %t
-; RUN: grep addps %t | count 2
-; RUN: grep mulps %t | count 2
-; RUN: grep subps %t | count 2
+; RUN: llc < %s -march=x86 -mattr=sse41 | FileCheck %s
  
  ; ModuleID = 'vec_shuffle-27.bc'
  target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:64:64-v128:128:128-a0:0:64-f80:32:32"
@@ -9,9 +6,32 @@ target triple = "i686-apple-cl.1.0"
  
  define <8 x float> @my2filter4_1d(<4 x float> %a, <8 x float> %T0, <8 x float> %T1) nounwind readnone {
  entry:
+; CHECK: subps
+; CHECK: mulps
+; CHECK: addps
+; CHECK: subps
+; CHECK: mulps
+; CHECK: addps
         %tmp7 = shufflevector <4 x float> %a, <4 x float> undef, <8 x i32> < i32 0, i32 1, i32 2, i32 3, i32 0, i32 1, i32 2, i32 3 >           ; <<8 x float>> [#uses=1]
         %sub = fsub <8 x float> %T1, %T0                ; <<8 x float>> [#uses=1]
         %mul = fmul <8 x float> %sub, %tmp7             ; <<8 x float>> [#uses=1]
         %add = fadd <8 x float> %mul, %T0               ; <<8 x float>> [#uses=1]
         ret <8 x float> %add
  }
+
+
+define void @test2(<4 x i64>* %ap, <4 x i64>* %bp) nounwind {
+entry:
+  %a = load <4 x i64> * %ap
+  %b = load <4 x i64> * %bp
+  %mulaa = mul <4 x i64> %a, %a
+  %mulbb = mul <4 x i64> %b, %b
+  %mulab = mul <4 x i64> %a, %b
+  %vect1271 = shufflevector <4 x i64> %mulaa, <4 x i64> %mulbb, <4 x i32> <i32 0, i32 4, i32 undef, i32 undef>
+  %vect1272 = shufflevector <4 x i64> %mulaa, <4 x i64> %mulbb, <4 x i32> <i32 1, i32 5, i32 undef, i32 undef>
+  %vect1487 = shufflevector <4 x i64> %vect1271, <4 x i64> %mulab, <4 x i32> <i32 0, i32 1, i32 2, i32 4>
+  %vect1488 = shufflevector <4 x i64> %vect1272, <4 x i64> %mulab, <4 x i32> <i32 0, i32 1, i32 2, i32 5>
+  store <4 x i64> %vect1487, <4 x i64>* %ap
+  store <4 x i64> %vect1488, <4 x i64>* %bp
+  ret void;
+}
+\ No newline at end of file
author	Mon P Wang <wangmp@apple.com>
	Sun, 19 Dec 2010 23:55:53 +0000 (23:55 +0000)
committer	Mon P Wang <wangmp@apple.com>
	Sun, 19 Dec 2010 23:55:53 +0000 (23:55 +0000)
lib/Target/X86/X86ISelLowering.cpp		patch \| blob \| history
test/CodeGen/X86/vec_shuffle-27.ll		patch \| blob \| history