Improve code generation for vselect on SSE2: the test now expects a pandn/pand/por sequence instead of scalarized code.

[oota-llvm.git] / test / CodeGen / X86 / sse2-blend.ll
diff --git a/test/CodeGen/X86/sse2-blend.ll b/test/CodeGen/X86/sse2-blend.ll

index 56b099ec42e6aa6f8a04b288d01a18949d50b60e..0007cab0961f1adab2c59039e75dfc81156eca43 100644 (file)
--- a/test/CodeGen/X86/sse2-blend.ll
+++ b/test/CodeGen/X86/sse2-blend.ll
@@ -1,8 +1,10 @@
-; RUN: llc < %s -march=x86 -mcpu=yonah -promote-elements -mattr=+sse2,-sse41 | FileCheck %s
-
-
-; currently (xor v4i32) is defined as illegal, so we scalarize the code.
+; RUN: llc < %s -march=x86 -mcpu=yonah -mattr=+sse2,-sse41 | FileCheck %s
  
+; CHECK: vsel_float
+; CHECK: pandn
+; CHECK: pand
+; CHECK: por
+; CHECK: ret
  define void@vsel_float(<4 x float>* %v1, <4 x float>* %v2) {
    %A = load <4 x float>* %v1
    %B = load <4 x float>* %v2
@@ -11,8 +13,11 @@ define void@vsel_float(<4 x float>* %v1, <4 x float>* %v2) {
    ret void
  }
  
-; currently (xor v4i32) is defined as illegal, so we scalarize the code.
-
+; CHECK: vsel_i32
+; CHECK: pandn
+; CHECK: pand
+; CHECK: por
+; CHECK: ret
  define void@vsel_i32(<4 x i32>* %v1, <4 x i32>* %v2) {
    %A = load <4 x i32>* %v1
    %B = load <4 x i32>* %v2