CodeGen peephole: fold redundant phys reg copies

[oota-llvm.git] / test / CodeGen / X86 / narrow-shl-load.ll
diff --git a/test/CodeGen/X86/narrow-shl-load.ll b/test/CodeGen/X86/narrow-shl-load.ll

index d67a6a5a2f5f9753ca8bb17d9def3793f5378f23..9dc0d749cb238b0622d704c3c0a7120f7a169ab7 100644 (file)
--- a/test/CodeGen/X86/narrow-shl-load.ll
+++ b/test/CodeGen/X86/narrow-shl-load.ll
@@ -1,18 +1,17 @@
-; RUN: llc -march=x86-64 < %s
-
-; DAGCombiner should fold this code in finite time.
-
-; rdar://8606584
+; RUN: llc -march=x86-64 < %s | FileCheck %s
  
  target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
  target triple = "x86_64-pc-linux-gnu"
  
-define void @D() nounwind readnone {
+; DAGCombiner should fold this code in finite time.
+; rdar://8606584
+
+define void @test1() nounwind readnone {
  bb.nph:
    br label %while.cond
  
  while.cond:                                       ; preds = %while.cond, %bb.nph
-  %tmp6 = load i32* undef, align 4
+  %tmp6 = load i32, i32* undef, align 4
    %and = or i64 undef, undef
    %conv11 = zext i32 undef to i64
    %conv14 = zext i32 %tmp6 to i64
@@ -21,7 +20,7 @@ while.cond:                                       ; preds = %while.cond, %bb.nph
    %and17 = or i64 %shl15.masked, %conv11
    %add = add i64 %and17, 1
    %xor = xor i64 %add, %and
-  %tmp20 = load i64* undef, align 8
+  %tmp20 = load i64, i64* undef, align 8
    %add21 = add i64 %xor, %tmp20
    %conv22 = trunc i64 %add21 to i32
    store i32 %conv22, i32* undef, align 4
@@ -30,3 +29,21 @@ while.cond:                                       ; preds = %while.cond, %bb.nph
  while.end:                                        ; preds = %while.cond
    ret void
  }
+
+; DAG Combiner can't fold this into a load of the 1'th byte.
+; PR8757
+define i32 @test3(i32 *%P) nounwind ssp {
+  store volatile i32 128, i32* %P
+  %tmp4.pre = load i32, i32* %P
+  %phitmp = trunc i32 %tmp4.pre to i16
+  %phitmp13 = shl i16 %phitmp, 8
+  %phitmp14 = ashr i16 %phitmp13, 8
+  %phitmp15 = lshr i16 %phitmp14, 8
+  %phitmp16 = zext i16 %phitmp15 to i32
+  ret i32 %phitmp16
+  
+; CHECK: movl  $128, (%rdi)
+; CHECK-NEXT: movsbl   (%rdi), %eax
+; CHECK-NEXT: movzbl   %ah, %eax
+; CHECK-NEXT: ret
+}