Explicitly zero out parts of a vector which are required to be zero by the algorithm...

author Eli Friedman <eli.friedman@gmail.com>

Mon, 29 Aug 2011 21:15:46 +0000 (21:15 +0000)

committer Eli Friedman <eli.friedman@gmail.com>

Mon, 29 Aug 2011 21:15:46 +0000 (21:15 +0000)
author Eli Friedman <eli.friedman@gmail.com>
Mon, 29 Aug 2011 21:15:46 +0000 (21:15 +0000)
committer Eli Friedman <eli.friedman@gmail.com>
Mon, 29 Aug 2011 21:15:46 +0000 (21:15 +0000)
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index 9c940c49ca34e0ecb1db6fc62a7e540b0ef88265..bd89bf999d0accc5bb391ae10162d3596fd430e3 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -7713,6 +7713,9 @@ SDValue X86TargetLowering::LowerUINT_TO_FP_i32(SDValue Op,
    SDValue Load = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, MVT::v4i32,
                               Op.getOperand(0));
  
+  // Zero out the upper parts of the register.
+  Load = getShuffleVectorZeroOrUndef(Load, 0, true, Subtarget->hasSSE2(), DAG);
+
    Load = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::f64,
                       DAG.getNode(ISD::BITCAST, dl, MVT::v2f64, Load),
                       DAG.getIntPtrConstant(0));
diff --git a/test/CodeGen/X86/uint_to_fp-2.ll b/test/CodeGen/X86/uint_to_fp-2.ll

index da5105d8a4eac887c502b3e6967261067de7589c..7536fb8f52c40c4e3f47765f808190421318703f 100644 (file)
--- a/test/CodeGen/X86/uint_to_fp-2.ll
+++ b/test/CodeGen/X86/uint_to_fp-2.ll
@@ -1,8 +1,33 @@
-; RUN: llc < %s -march=x86 -mattr=+sse2 | grep movsd | count 1
-; rdar://6504833
+; RUN: llc < %s -march=x86 -mattr=+sse2 | FileCheck %s
  
-define float @f(i32 %x) nounwind readnone {
+; rdar://6504833
+define float @test1(i32 %x) nounwind readnone {
+; CHECK: test1
+; CHECK: movd
+; CHECK: orpd
+; CHECK: subsd
+; CHECK: cvtsd2ss
+; CHECK: movss
+; CHECK: flds
+; CHECK: ret
  entry:
         %0 = uitofp i32 %x to float
         ret float %0
  }
+
+; PR10802
+define float @test2(<4 x i32> %x) nounwind readnone ssp {
+; CHECK: test2
+; CHECK: xorps [[ZERO:%xmm[0-9]+]]
+; CHECK: movss {{.*}}, [[ZERO]]
+; CHECK: orps
+; CHECK: subsd
+; CHECK: cvtsd2ss
+; CHECK: movss
+; CHECK: flds
+; CHECK: ret
+entry:
+  %vecext = extractelement <4 x i32> %x, i32 0
+  %conv = uitofp i32 %vecext to float
+  ret float %conv
+}
author	Eli Friedman <eli.friedman@gmail.com>
	Mon, 29 Aug 2011 21:15:46 +0000 (21:15 +0000)
committer	Eli Friedman <eli.friedman@gmail.com>
	Mon, 29 Aug 2011 21:15:46 +0000 (21:15 +0000)
lib/Target/X86/X86ISelLowering.cpp		patch | blob | history
test/CodeGen/X86/uint_to_fp-2.ll		patch | blob | history