Let the inline asm 'q' constraint match float, and on 64-bit double too.

[oota-llvm.git] / test / CodeGen / X86 / h-registers-0.ll
diff --git a/test/CodeGen/X86/h-registers-0.ll b/test/CodeGen/X86/h-registers-0.ll

index 2777be9cc3e0a799d2a15da0af642140d4e26918..cdc75af92e4304bad494d97d86c6cd0fa09dc6a8 100644 (file)
--- a/test/CodeGen/X86/h-registers-0.ll
+++ b/test/CodeGen/X86/h-registers-0.ll
@@ -1,12 +1,23 @@
-; RUN: llvm-as < %s | llc -march=x86-64 | grep {movzbl %\[abcd\]h,} | count 4
-; RUN: llvm-as < %s | llc -march=x86    > %t
-; RUN: grep {incb      %ah} %t | count 3
-; RUN: grep {movzbl    %ah,} %t | count 3
+; RUN: llc < %s -mtriple=x86_64-linux | FileCheck %s -check-prefix=X86-64
+; RUN: llc < %s -mtriple=x86_64-win32 | FileCheck %s -check-prefix=WIN64
+; RUN: llc < %s -march=x86    | FileCheck %s -check-prefix=X86-32
  
  ; Use h registers. On x86-64, codegen doesn't support general allocation
  ; of h registers yet, due to x86 encoding complications.
  
  define void @bar64(i64 inreg %x, i8* inreg %p) nounwind {
+; X86-64: bar64:
+; X86-64: shrq $8, %rdi
+; X86-64: incb %dil
+
+; See the FIXME on regclass GR8.
+; Optimally this could be transformed to: incb %ch; movb %ch, (%rdx)
+; WIN64:  bar64:
+; WIN64:  shrq $8, %rcx
+; WIN64:  incb %cl
+
+; X86-32: bar64:
+; X86-32: incb %ah
    %t0 = lshr i64 %x, 8
    %t1 = trunc i64 %t0 to i8
    %t2 = add i8 %t1, 1
@@ -15,6 +26,16 @@ define void @bar64(i64 inreg %x, i8* inreg %p) nounwind {
  }
  
  define void @bar32(i32 inreg %x, i8* inreg %p) nounwind {
+; X86-64: bar32:
+; X86-64: shrl $8, %edi
+; X86-64: incb %dil
+
+; WIN64:  bar32:
+; WIN64:  shrl $8, %ecx
+; WIN64:  incb %cl
+
+; X86-32: bar32:
+; X86-32: incb %ah
    %t0 = lshr i32 %x, 8
    %t1 = trunc i32 %t0 to i8
    %t2 = add i8 %t1, 1
@@ -23,6 +44,16 @@ define void @bar32(i32 inreg %x, i8* inreg %p) nounwind {
  }
  
  define void @bar16(i16 inreg %x, i8* inreg %p) nounwind {
+; X86-64: bar16:
+; X86-64: shrl $8, %edi
+; X86-64: incb %dil
+
+; WIN64:  bar16:
+; WIN64:  shrl $8, %ecx
+; WIN64:  incb %cl
+
+; X86-32: bar16:
+; X86-32: incb %ah
    %t0 = lshr i16 %x, 8
    %t1 = trunc i16 %t0 to i8
    %t2 = add i8 %t1, 1
@@ -31,18 +62,45 @@ define void @bar16(i16 inreg %x, i8* inreg %p) nounwind {
  }
  
  define i64 @qux64(i64 inreg %x) nounwind {
+; X86-64: qux64:
+; X86-64: movq %rdi, %rax
+; X86-64: movzbl %ah, %eax
+
+; WIN64:  qux64:
+; WIN64:  movzbl %ch, %eax
+
+; X86-32: qux64:
+; X86-32: movzbl %ah, %eax
    %t0 = lshr i64 %x, 8
    %t1 = and i64 %t0, 255
    ret i64 %t1
  }
  
  define i32 @qux32(i32 inreg %x) nounwind {
+; X86-64: qux32:
+; X86-64: movl %edi, %eax
+; X86-64: movzbl %ah, %eax
+
+; WIN64:  qux32:
+; WIN64:  movzbl %ch, %eax
+
+; X86-32: qux32:
+; X86-32: movzbl %ah, %eax
    %t0 = lshr i32 %x, 8
    %t1 = and i32 %t0, 255
    ret i32 %t1
  }
  
  define i16 @qux16(i16 inreg %x) nounwind {
+; X86-64: qux16:
+; X86-64: movl %edi, %eax
+; X86-64: movzbl %ah, %eax
+
+; WIN64:  qux16:
+; WIN64:  movzbl %ch, %eax
+
+; X86-32: qux16:
+; X86-32: movzbl %ah, %eax
    %t0 = lshr i16 %x, 8
    ret i16 %t0
  }