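Fix a regression from r147481: for a v4i64 X86vzload, select the aligned load (VMOVAPS) only when the address is at least 16-byte aligned, and fall back to the unaligned load (VMOVUPS) otherwise.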

author Chad Rosier <mcrosier@apple.com>

Fri, 9 Mar 2012 02:00:48 +0000 (02:00 +0000)

committer Chad Rosier <mcrosier@apple.com>

Fri, 9 Mar 2012 02:00:48 +0000 (02:00 +0000)
author Chad Rosier <mcrosier@apple.com>
Fri, 9 Mar 2012 02:00:48 +0000 (02:00 +0000)
committer Chad Rosier <mcrosier@apple.com>
Fri, 9 Mar 2012 02:00:48 +0000 (02:00 +0000)
diff --git a/lib/Target/X86/X86InstrFragmentsSIMD.td b/lib/Target/X86/X86InstrFragmentsSIMD.td

index 4f9f089d5d4c2e0cbe91fd5ad6c4fc17e784630a..ae3ed1bcb32d044a80bbcc792627d23994e1a979 100644 (file)
--- a/lib/Target/X86/X86InstrFragmentsSIMD.td
+++ b/lib/Target/X86/X86InstrFragmentsSIMD.td
@@ -218,6 +218,11 @@ def alignedload : PatFrag<(ops node:$ptr), (load node:$ptr), [{
    return cast<LoadSDNode>(N)->getAlignment() >= 16;
  }]>;
  
+// Like 'X86vzload', but always requires 128-bit vector alignment.
+def alignedX86vzload : PatFrag<(ops node:$ptr), (X86vzload node:$ptr), [{
+  return cast<MemSDNode>(N)->getAlignment() >= 16;
+}]>;
+
  // Like 'load', but always requires 256-bit vector alignment.
  def alignedload256 : PatFrag<(ops node:$ptr), (load node:$ptr), [{
    return cast<LoadSDNode>(N)->getAlignment() >= 32;
diff --git a/lib/Target/X86/X86InstrSSE.td b/lib/Target/X86/X86InstrSSE.td

index c6d1d192cfe119045c457cd739898dfedd338568..36526ad7a58faa3d004e4220e2e7cc8cf561d435 100644 (file)
--- a/lib/Target/X86/X86InstrSSE.td
+++ b/lib/Target/X86/X86InstrSSE.td
@@ -4820,8 +4820,10 @@ let Predicates = [HasSSE2], AddedComplexity = 20 in {
  }
  
  let Predicates = [HasAVX] in {
-def : Pat<(v4i64 (X86vzload addr:$src)),
+def : Pat<(v4i64 (alignedX86vzload addr:$src)),
            (SUBREG_TO_REG (i32 0), (VMOVAPSrm addr:$src), sub_xmm)>;
+def : Pat<(v4i64 (X86vzload addr:$src)),
+          (SUBREG_TO_REG (i32 0), (VMOVUPSrm addr:$src), sub_xmm)>;
  }
  
  //===---------------------------------------------------------------------===//
diff --git a/test/CodeGen/X86/avx-shuffle.ll b/test/CodeGen/X86/avx-shuffle.ll

index 947d79f9e4c066e172b761d79afbb872241a1f9d..54f01e966d5c03de21e06e8d69fb1ace8ac90344 100644 (file)
--- a/test/CodeGen/X86/avx-shuffle.ll
+++ b/test/CodeGen/X86/avx-shuffle.ll
@@ -135,3 +135,15 @@ define <4 x i32> @test15(<2 x i32>%x) nounwind readnone {
    ret <4 x i32>%x1
  }
  
+; rdar://10974078
+define <8 x float> @test16(float* nocapture %f) nounwind uwtable readonly ssp {
+entry:
+  %0 = bitcast float* %f to <4 x float>*
+  %1 = load <4 x float>* %0, align 8
+; CHECK: test16
+; CHECK: vmovups
+; CHECK-NOT: vxorps
+; CHECK-NOT: vinsertf128
+  %shuffle.i = shufflevector <4 x float> %1, <4 x float> <float 0.000000e+00, float undef, float undef, float undef>, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 4, i32 4, i32 4>
+  ret <8 x float> %shuffle.i
+}
author	Chad Rosier <mcrosier@apple.com>
	Fri, 9 Mar 2012 02:00:48 +0000 (02:00 +0000)
committer	Chad Rosier <mcrosier@apple.com>
	Fri, 9 Mar 2012 02:00:48 +0000 (02:00 +0000)
lib/Target/X86/X86InstrFragmentsSIMD.td		patch | blob | history
lib/Target/X86/X86InstrSSE.td		patch | blob | history
test/CodeGen/X86/avx-shuffle.ll		patch | blob | history