break;
}
- // Peek through any bitcast (only useful for loads).
- SDValue BC = V;
- while (BC.getOpcode() == ISD::BITCAST)
- BC = BC.getOperand(0);
-
// Check if this is a broadcast of a scalar. We special case lowering
// for scalars so that we can more effectively fold with loads.
// If the scalar isn't a load, we can't broadcast from it in AVX1.
// Only AVX2 has register broadcasts.
if (!Subtarget->hasAVX2() && !isShuffleFoldableLoad(V))
return SDValue();
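// (AVX1 provides only the memory-operand forms of VBROADCASTSS/VBROADCASTSD;
// the register forms arrived with AVX2, which is what the bail-out above is
// checking for.)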
- } else if (MayFoldLoad(BC) && !cast<LoadSDNode>(BC)->isVolatile()) {
+ } else if (MayFoldLoad(V) && !cast<LoadSDNode>(V)->isVolatile()) {
// If we are broadcasting a load that is only used by the shuffle
// then we can reduce the vector load to the broadcasted scalar load.
- LoadSDNode *Ld = cast<LoadSDNode>(BC);
+ LoadSDNode *Ld = cast<LoadSDNode>(V);
SDValue BaseAddr = Ld->getOperand(1);
EVT AddrVT = BaseAddr.getValueType();
EVT SVT = VT.getScalarType();
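// The hunk ends mid-function. For context, this version of
// lowerVectorShuffleAsBroadcast then builds the narrowed scalar load roughly
// as sketched below; MayFoldLoad itself is essentially a check that the value
// is a normal (non-extending, non-indexed) load with a single use. Treat the
// exact DAG calls as a reconstruction, not verbatim tree code; BroadcastIdx,
// DAG, and DL come from the surrounding function.
unsigned Offset = BroadcastIdx * SVT.getStoreSize();
SDValue NewAddr = DAG.getNode(ISD::ADD, DL, AddrVT, BaseAddr,
                              DAG.getConstant(Offset, AddrVT));
V = DAG.getLoad(SVT, DL, Ld->getChain(), NewAddr,
                DAG.getMachineFunction().getMachineMemOperand(
                    Ld->getMemOperand(), Offset, SVT.getStoreSize()));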
define void @endless_loop() {
; CHECK-LABEL: endless_loop:
; CHECK-NEXT: # BB#0:
-; CHECK-NEXT: vbroadcastss (%eax), %ymm0
+; CHECK-NEXT: vmovaps (%eax), %ymm0
+; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm0
+; CHECK-NEXT: vmovsldup {{.*#+}} xmm0 = xmm0[0,0,2,2]
; CHECK-NEXT: vmovddup {{.*#+}} xmm1 = xmm0[0,0]
; CHECK-NEXT: vinsertf128 $1, %xmm1, %ymm0, %ymm1
; CHECK-NEXT: vxorps %xmm2, %xmm2, %xmm2
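; Without a register broadcast, AVX1 splats in two steps: duplicate the
; element within a 128-bit half (vmovsldup/vmovddup/vpermilps) and then
; vinsertf128 the result into both halves of the ymm register, as in the
; expectations above and below.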
define <8 x i32> @load_splat_8i32_8i32_55555555(<8 x i32>* %ptr) nounwind uwtable readnone ssp {
; CHECK-LABEL: load_splat_8i32_8i32_55555555:
; CHECK: ## BB#0: ## %entry
-; CHECK-NEXT: vbroadcastss 20(%rdi), %ymm0
+; CHECK-NEXT: vmovaps (%rdi), %ymm0
+; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm0
+; CHECK-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[1,1,1,1]
+; CHECK-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0
; CHECK-NEXT: retq
entry:
%ld = load <8 x i32>, <8 x i32>* %ptr
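; Lane 5 of <8 x i32> sits at byte offset 5 * 4 = 20, which is exactly the
; folded 'vbroadcastss 20(%rdi)' in the old expectation. Without the fold,
; lane 5 is element 1 of the upper 128-bit half, hence the vextractf128
; followed by vpermilps with the [1,1,1,1] splat mask.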
define <4 x i64> @load_splat_4i64_4i64_2222(<4 x i64>* %ptr) nounwind uwtable readnone ssp {
; CHECK-LABEL: load_splat_4i64_4i64_2222:
; CHECK: ## BB#0: ## %entry
-; CHECK-NEXT: vbroadcastsd 16(%rdi), %ymm0
+; CHECK-NEXT: vmovapd (%rdi), %ymm0
+; CHECK-NEXT: vextractf128 $1, %ymm0, %xmm0
+; CHECK-NEXT: vmovddup {{.*#+}} xmm0 = xmm0[0,0]
+; CHECK-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0
; CHECK-NEXT: retq
entry:
%ld = load <4 x i64>, <4 x i64>* %ptr
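; Same arithmetic here: lane 2 of <4 x i64> is at byte offset 2 * 8 = 16
; ('vbroadcastsd 16(%rdi)' when folded), and it is element 0 of the upper
; 128-bit half, hence the vextractf128 followed by vmovddup's [0,0] splat.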