Use movq to move low half of XMM register and zero-extend the rest.

author Evan Cheng <evan.cheng@apple.com>

Thu, 8 May 2008 22:35:02 +0000 (22:35 +0000)

committer Evan Cheng <evan.cheng@apple.com>

Thu, 8 May 2008 22:35:02 +0000 (22:35 +0000)
author Evan Cheng <evan.cheng@apple.com>
Thu, 8 May 2008 22:35:02 +0000 (22:35 +0000)
committer Evan Cheng <evan.cheng@apple.com>
Thu, 8 May 2008 22:35:02 +0000 (22:35 +0000)
diff --git a/lib/Target/X86/X86InstrSSE.td b/lib/Target/X86/X86InstrSSE.td

index 375d0add62a2124d6fc5177f409f07772e30196a..c56d4c59e06c17d6823ad73447db8493564ff139 100644 (file)
--- a/lib/Target/X86/X86InstrSSE.td
+++ b/lib/Target/X86/X86InstrSSE.td
@@ -2916,7 +2916,8 @@ let AddedComplexity = 15 in
  def : Pat<(v2f64 (vector_shuffle immAllZerosV_bc, VR128:$src,
             MOVL_shuffle_mask)),
            (MOVZPQILo2PQIrr VR128:$src)>, Requires<[HasSSE2]>;
-
+def : Pat<(v2f64 (X86zvmovl (v2f64 VR128:$src))),
+          (MOVZPQILo2PQIrr VR128:$src)>, Requires<[HasSSE2]>;
  
  // FIXME: Temporary workaround since 2-wide shuffle is broken.
  def : Pat<(int_x86_sse2_movs_d  VR128:$src1, VR128:$src2),
diff --git a/test/CodeGen/X86/vec_set-E.ll b/test/CodeGen/X86/vec_set-E.ll

new file mode 100644 (file)

index 0000000..9dc1932
--- /dev/null
+++ b/test/CodeGen/X86/vec_set-E.ll
@@ -0,0 +1,10 @@
+; RUN: llvm-as < %s | llc -march=x86 -mattr=+sse2 | grep movq
+
+define i32 @t(float %X) nounwind  {
+       %tmp11 = insertelement <4 x float> undef, float %X, i32 0
+       %tmp12 = insertelement <4 x float> %tmp11, float %X, i32 1
+       %tmp27 = insertelement <4 x float> %tmp12, float 0.000000e+00, i32 2
+       %tmp28 = insertelement <4 x float> %tmp27, float 0.000000e+00, i32 3
+       store <4 x float> %tmp28, <4 x float>* null, align 16
+       ret i32 0
+}
author	Evan Cheng <evan.cheng@apple.com>
	Thu, 8 May 2008 22:35:02 +0000 (22:35 +0000)
committer	Evan Cheng <evan.cheng@apple.com>
	Thu, 8 May 2008 22:35:02 +0000 (22:35 +0000)
lib/Target/X86/X86InstrSSE.td		patch \| blob \| history
test/CodeGen/X86/vec_set-E.ll	[new file with mode: 0644]	patch \| blob