ARM:

[oota-llvm.git] / test / CodeGen / ARM / vector-extend-narrow.ll
diff --git a/test/CodeGen/ARM/vector-extend-narrow.ll b/test/CodeGen/ARM/vector-extend-narrow.ll

index 1ec36da38f77d910ba908ae77d60c0abe08a6222..22af7976212802accc8386fbf99a9273e44206ff 100644 (file)
--- a/test/CodeGen/ARM/vector-extend-narrow.ll
+++ b/test/CodeGen/ARM/vector-extend-narrow.ll
@@ -20,7 +20,9 @@ define float @f(<4 x i16>* nocapture %in) {
  
  ; CHECK: g:
  define float @g(<4 x i8>* nocapture %in) {
-  ; CHECK: vldr
+; Note: expecting vld1 (NEON) rather than vldr here is reasonably important.
+; Mixing VFP and NEON instructions is bad on some cores.
+  ; CHECK: vld1
    ; CHECK: vmovl.u8
    ; CHECK: vmovl.u16
    %1 = load <4 x i8>* %in
@@ -47,7 +49,9 @@ define <4 x i8> @h(<4 x float> %v) {
  
  ; CHECK: i:
  define <4 x i8> @i(<4 x i8>* %x) {
-  ; CHECK: vldr
+; Note: expecting vld1 (NEON) rather than vldr here is reasonably important.
+; Mixing VFP and NEON instructions is bad on some cores.
+  ; CHECK: vld1
    ; CHECK: vmovl.s8
    ; CHECK: vmovl.s16
    ; CHECK: vrecpe
@@ -58,3 +62,14 @@ define <4 x i8> @i(<4 x i8>* %x) {
    %2 = sdiv <4 x i8> zeroinitializer, %1
    ret <4 x i8> %2
  }
+; Test j: zext of a loaded <4 x i8> to <4 x i32>. The directives below expect
+; a vld1 load widened via vmovl.u8 and vmovl.u16, and no vand after them.
+; CHECK: j:
+define <4 x i32> @j(<4 x i8>* %in) nounwind {
+  ; CHECK: vld1
+  ; CHECK: vmovl.u8
+  ; CHECK: vmovl.u16
+  ; CHECK-NOT: vand
+  %1 = load <4 x i8>* %in, align 4
+  %2 = zext <4 x i8> %1 to <4 x i32>
+  ret <4 x i32> %2
+}
+