+++ /dev/null
-; Test that vectors are scalarized/lowered correctly
-; (with both legalization methods).
-; RUN: llc -march=x86 -promote-elements < %s
-; RUN: llc -march=x86 < %s
-
-; A simple test to check copyToParts and copyFromParts.
-
-define <4 x i64> @test_param_0(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- ret <4 x i64> %A
-}
-
-define <2 x i32> @test_param_1(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- ret <2 x i32> %B
-}
-
-define <4 x i8> @test_param_2(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- ret <4 x i8> %C
-}
-
-; Simple tests to check arithmetic and vector operations on types which need to
-; be legalized (no loads/stores to/from memory here).
-
-define <4 x i64> @test_arith_0(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- %K = add <4 x i64> %A, <i64 0, i64 1, i64 3, i64 9>
- ret <4 x i64> %K
-}
-
-define <2 x i32> @test_arith_1(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- %K = add <2 x i32> %B, <i32 0, i32 1>
- ret <2 x i32> %K
-}
-
-define <4 x i8> @test_arith_2(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- %K = add <4 x i8> %C, <i8 0, i8 1, i8 3, i8 9>
- ret <4 x i8> %K
-}
-
-define i8 @test_arith_3(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- %K = add <4 x i8> %C, <i8 0, i8 1, i8 3, i8 9>
- %Y = extractelement <4 x i8> %K, i32 1
- ret i8 %Y
-}
-
-define <4 x i8> @test_arith_4(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
- %Y = insertelement <4 x i8> %C, i8 1, i32 0
- ret <4 x i8> %Y
-}
-
-define <4 x i32> @test_arith_5(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
- %Y = insertelement <4 x i32> %C, i32 1, i32 0
- ret <4 x i32> %Y
-}
-
-define <4 x i32> @test_arith_6(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
- %F = extractelement <2 x i32> %B, i32 1
- %Y = insertelement <4 x i32> %C, i32 %F, i32 0
- ret <4 x i32> %Y
-}
-
-define <4 x i64> @test_arith_7(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
- %F = extractelement <2 x i32> %B, i32 1
- %W = zext i32 %F to i64
- %Y = insertelement <4 x i64> %A, i64 %W, i32 0
- ret <4 x i64> %Y
-}
-
-define i64 @test_arith_8(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
- %F = extractelement <2 x i32> %B, i32 1
- %W = zext i32 %F to i64
- %T = add i64 %W , 11
- ret i64 %T
-}
-
-define <4 x i64> @test_arith_9(<4 x i64> %A, <2 x i32> %B, <4 x i16> %C) {
- %T = add <4 x i16> %C, %C
- %F0 = extractelement <4 x i16> %T, i32 0
- %F1 = extractelement <4 x i16> %T, i32 1
- %W0 = zext i16 %F0 to i64
- %W1 = zext i16 %F1 to i64
- %Y0 = insertelement <4 x i64> %A, i64 %W0, i32 0
- %Y1 = insertelement <4 x i64> %Y0, i64 %W1, i32 2
- ret <4 x i64> %Y1
-}
-
-
-define <4 x i16> @test_arith_10(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
- %F = bitcast <2 x i32> %B to <4 x i16>
- %T = add <4 x i16> %F , <i16 0, i16 1, i16 2, i16 3>
- ret <4 x i16> %T
-}
-
--- /dev/null
+; Test that vectors are scalarized/lowered correctly
+; (with both legalization methods).
+; RUN: llc -march=x86 -promote-elements < %s
+; RUN: llc -march=x86 < %s
+
+; A simple test to check copyToParts and copyFromParts.
+
+; Returns the first argument, the <4 x i64> vector %A, unchanged.
+; %B and %C are accepted but never used.
+define <4 x i64> @test_param_0(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ ret <4 x i64> %A
+}
+
+; Returns the second argument, the <2 x i32> vector %B, unchanged.
+; %A and %C are accepted but never used.
+define <2 x i32> @test_param_1(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ ret <2 x i32> %B
+}
+
+; Returns the third argument, the <4 x i8> vector %C, unchanged.
+; %A and %B are accepted but never used.
+define <4 x i8> @test_param_2(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ ret <4 x i8> %C
+}
+
+; Simple tests to check arithmetic and vector operations on types which need to
+; be legalized (no loads/stores to/from memory here).
+
+; Element-wise add of the constant vector <0, 1, 3, 9> to the <4 x i64>
+; argument %A; the sum is returned. %B and %C are unused.
+define <4 x i64> @test_arith_0(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ %sum = add <4 x i64> %A, <i64 0, i64 1, i64 3, i64 9>
+ ret <4 x i64> %sum
+}
+
+; Element-wise add of the constant vector <0, 1> to the <2 x i32>
+; argument %B; the sum is returned. %A and %C are unused.
+define <2 x i32> @test_arith_1(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ %sum = add <2 x i32> %B, <i32 0, i32 1>
+ ret <2 x i32> %sum
+}
+
+; Element-wise add of the constant vector <0, 1, 3, 9> to the <4 x i8>
+; argument %C; the sum is returned. %A and %B are unused.
+define <4 x i8> @test_arith_2(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ %sum = add <4 x i8> %C, <i8 0, i8 1, i8 3, i8 9>
+ ret <4 x i8> %sum
+}
+
+; Adds <0, 1, 3, 9> to the <4 x i8> argument %C, then returns element 1 of
+; the result as a scalar i8. %A and %B are unused.
+define i8 @test_arith_3(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ %sum = add <4 x i8> %C, <i8 0, i8 1, i8 3, i8 9>
+ %lane1 = extractelement <4 x i8> %sum, i32 1
+ ret i8 %lane1
+}
+
+; Returns the <4 x i8> argument %C with element 0 replaced by the constant 1.
+; %A and %B are unused.
+define <4 x i8> @test_arith_4(<4 x i64> %A, <2 x i32> %B, <4 x i8> %C) {
+ %patched = insertelement <4 x i8> %C, i8 1, i32 0
+ ret <4 x i8> %patched
+}
+
+; Returns the <4 x i32> argument %C with element 0 replaced by the constant 1.
+; %A and %B are unused.
+define <4 x i32> @test_arith_5(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
+ %patched = insertelement <4 x i32> %C, i32 1, i32 0
+ ret <4 x i32> %patched
+}
+
+; Moves a scalar between two vectors of different width: element 1 of the
+; <2 x i32> argument %B is written into element 0 of the <4 x i32> argument
+; %C, and the updated %C is returned. %A is unused.
+define <4 x i32> @test_arith_6(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
+ %b1 = extractelement <2 x i32> %B, i32 1
+ %patched = insertelement <4 x i32> %C, i32 %b1, i32 0
+ ret <4 x i32> %patched
+}
+
+; Takes element 1 of the <2 x i32> argument %B, zero-extends it to i64 and
+; writes it into element 0 of the <4 x i64> argument %A; the updated %A is
+; returned. %C is unused.
+define <4 x i64> @test_arith_7(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
+ %b1 = extractelement <2 x i32> %B, i32 1
+ %b1.wide = zext i32 %b1 to i64
+ %patched = insertelement <4 x i64> %A, i64 %b1.wide, i32 0
+ ret <4 x i64> %patched
+}
+
+; Takes element 1 of the <2 x i32> argument %B, zero-extends it to i64, adds
+; the constant 11 and returns the scalar i64 result. %A and %C are unused.
+define i64 @test_arith_8(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
+ %b1 = extractelement <2 x i32> %B, i32 1
+ %b1.wide = zext i32 %b1 to i64
+ %biased = add i64 %b1.wide, 11
+ ret i64 %biased
+}
+
+; Doubles the <4 x i16> argument %C (adds it to itself), then zero-extends
+; elements 0 and 1 of that sum to i64 and writes them into elements 0 and 2
+; of the <4 x i64> argument %A. The updated %A is returned. %B is unused.
+define <4 x i64> @test_arith_9(<4 x i64> %A, <2 x i32> %B, <4 x i16> %C) {
+ %dbl = add <4 x i16> %C, %C
+ ; Element 0 of the doubled vector, widened to i64.
+ %lo = extractelement <4 x i16> %dbl, i32 0
+ %lo.wide = zext i16 %lo to i64
+ ; Element 1 of the doubled vector, widened to i64.
+ %hi = extractelement <4 x i16> %dbl, i32 1
+ %hi.wide = zext i16 %hi to i64
+ ; Destination elements are 0 and 2 (not 0 and 1).
+ %step0 = insertelement <4 x i64> %A, i64 %lo.wide, i32 0
+ %step1 = insertelement <4 x i64> %step0, i64 %hi.wide, i32 2
+ ret <4 x i64> %step1
+}
+
+; Reinterprets the <2 x i32> argument %B as <4 x i16> via bitcast, adds the
+; constant vector <0, 1, 2, 3> and returns the sum. %A and %C are unused.
+define <4 x i16> @test_arith_10(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
+ %halves = bitcast <2 x i32> %B to <4 x i16>
+ %sum = add <4 x i16> %halves, <i16 0, i16 1, i16 2, i16 3>
+ ret <4 x i16> %sum
+}
+
+
+; Simple tests to check saving/loading from memory
+; Bitcasts the <2 x i32> argument %B to <4 x i16>, adds the constant vector
+; <0, 1, 2, 3> and returns the sum. %A and %C are unused.
+; NOTE(review): despite the function name and the "saving/loading from memory"
+; heading, this body contains no load or store; it is instruction-for-
+; instruction the same as test_arith_10. TODO: confirm whether a round-trip
+; through memory was intended here.
+define <4 x i16> @test_mem_0(<4 x i64> %A, <2 x i32> %B, <4 x i32> %C) {
+ %F = bitcast <2 x i32> %B to <4 x i16>
+ %T = add <4 x i16> %F , <i16 0, i16 1, i16 2, i16 3>
+ ret <4 x i16> %T
+}
+