1 ; RUN: llc -mcpu=pwr7 -mattr=+vsx < %s | FileCheck %s
2 target datalayout = "E-m:e-i64:64-n32:64"
3 target triple = "powerpc64-unknown-linux-gnu"
; test1: scalar double-precision multiply. With VSX enabled by the llc
; invocation at the top of the file, the fmul is expected to select xsmuldp.
5 define double @test1(double %a, double %b) {
7 %v = fmul double %a, %b
11 ; CHECK: xsmuldp 1, 1, 2
; test2: scalar double-precision divide; the fdiv is expected to select
; the VSX instruction xsdivdp.
15 define double @test2(double %a, double %b) {
17 %v = fdiv double %a, %b
21 ; CHECK: xsdivdp 1, 1, 2
; test3: scalar double-precision add; the fadd is expected to select
; the VSX instruction xsadddp.
25 define double @test3(double %a, double %b) {
27 %v = fadd double %a, %b
31 ; CHECK: xsadddp 1, 1, 2
; test4: two-lane double vector add; the fadd on <2 x double> is expected
; to select the vector form xvadddp.
35 define <2 x double> @test4(<2 x double> %a, <2 x double> %b) {
37 %v = fadd <2 x double> %a, %b
41 ; CHECK: xvadddp 34, 34, 35
; test5: bitwise xor on <4 x i32>; expected to select xxlxor.
45 define <4 x i32> @test5(<4 x i32> %a, <4 x i32> %b) {
47 %v = xor <4 x i32> %a, %b
51 ; CHECK: xxlxor 34, 34, 35
; test6: bitwise xor on <8 x i16>; the same xxlxor as the <4 x i32> case
; (test5) is expected.
55 define <8 x i16> @test6(<8 x i16> %a, <8 x i16> %b) {
57 %v = xor <8 x i16> %a, %b
61 ; CHECK: xxlxor 34, 34, 35
; test7: bitwise xor on <16 x i8>; the same xxlxor as the wider-element
; cases (test5, test6) is expected.
65 define <16 x i8> @test7(<16 x i8> %a, <16 x i8> %b) {
67 %v = xor <16 x i8> %a, %b
71 ; CHECK: xxlxor 34, 34, 35
; test8: bitwise or on <4 x i32>; expected to select xxlor.
75 define <4 x i32> @test8(<4 x i32> %a, <4 x i32> %b) {
77 %v = or <4 x i32> %a, %b
81 ; CHECK: xxlor 34, 34, 35
; test9: bitwise or on <8 x i16>; the same xxlor as the <4 x i32> case
; (test8) is expected.
85 define <8 x i16> @test9(<8 x i16> %a, <8 x i16> %b) {
87 %v = or <8 x i16> %a, %b
91 ; CHECK: xxlor 34, 34, 35
; test10: bitwise or on <16 x i8>; expected to select xxlor, matched after
; the label directive for this function.
95 define <16 x i8> @test10(<16 x i8> %a, <16 x i8> %b) {
97 %v = or <16 x i8> %a, %b
100 ; CHECK-LABEL: @test10
101 ; CHECK: xxlor 34, 34, 35
; test11: bitwise and on <4 x i32>; expected to select xxland.
105 define <4 x i32> @test11(<4 x i32> %a, <4 x i32> %b) {
107 %v = and <4 x i32> %a, %b
110 ; CHECK-LABEL: @test11
111 ; CHECK: xxland 34, 34, 35
; test12: bitwise and on <8 x i16>; the same xxland as the <4 x i32> case
; (test11) is expected.
115 define <8 x i16> @test12(<8 x i16> %a, <8 x i16> %b) {
117 %v = and <8 x i16> %a, %b
120 ; CHECK-LABEL: @test12
121 ; CHECK: xxland 34, 34, 35
; test13: bitwise and on <16 x i8>; the same xxland as the wider-element
; cases (test11, test12) is expected.
125 define <16 x i8> @test13(<16 x i8> %a, <16 x i8> %b) {
127 %v = and <16 x i8> %a, %b
130 ; CHECK-LABEL: @test13
131 ; CHECK: xxland 34, 34, 35
; test14: or followed by xor with an all-ones vector (i.e. a bitwise NOR)
; on <4 x i32>; the pair is expected to fold into a single xxlnor.
135 define <4 x i32> @test14(<4 x i32> %a, <4 x i32> %b) {
137 %v = or <4 x i32> %a, %b
138 %w = xor <4 x i32> %v, <i32 -1, i32 -1, i32 -1, i32 -1>
141 ; CHECK-LABEL: @test14
142 ; CHECK: xxlnor 34, 34, 35
; test15: or followed by xor with an all-ones vector (bitwise NOR) on
; <8 x i16>; expected to fold into a single xxlnor.
146 define <8 x i16> @test15(<8 x i16> %a, <8 x i16> %b) {
148 %v = or <8 x i16> %a, %b
149 %w = xor <8 x i16> %v, <i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1>
152 ; CHECK-LABEL: @test15
153 ; CHECK: xxlnor 34, 34, 35
; test16: or followed by xor with an all-ones vector (bitwise NOR) on
; <16 x i8>; expected to fold into a single xxlnor.
157 define <16 x i8> @test16(<16 x i8> %a, <16 x i8> %b) {
159 %v = or <16 x i8> %a, %b
160 %w = xor <16 x i8> %v, <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
163 ; CHECK-LABEL: @test16
164 ; CHECK: xxlnor 34, 34, 35
; test17: %b is complemented (xor with all-ones) and then and-ed with %a on
; <4 x i32>; the pair is expected to fold into a single xxlandc.
168 define <4 x i32> @test17(<4 x i32> %a, <4 x i32> %b) {
170 %w = xor <4 x i32> %b, <i32 -1, i32 -1, i32 -1, i32 -1>
171 %v = and <4 x i32> %a, %w
174 ; CHECK-LABEL: @test17
175 ; CHECK: xxlandc 34, 34, 35
; test18: and of %a with the complement of %b on <8 x i16>; expected to
; fold into a single xxlandc.
179 define <8 x i16> @test18(<8 x i16> %a, <8 x i16> %b) {
181 %w = xor <8 x i16> %b, <i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1, i16 -1>
182 %v = and <8 x i16> %a, %w
185 ; CHECK-LABEL: @test18
186 ; CHECK: xxlandc 34, 34, 35
; test19: and of %a with the complement of %b on <16 x i8>; expected to
; fold into a single xxlandc.
190 define <16 x i8> @test19(<16 x i8> %a, <16 x i8> %b) {
192 %w = xor <16 x i8> %b, <i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1, i8 -1>
193 %v = and <16 x i8> %a, %w
196 ; CHECK-LABEL: @test19
197 ; CHECK: xxlandc 34, 34, 35
; test20: integer equality compare of %c and %d used as the mask of a
; <4 x i32> select between %a and %b. A vcmpequw producing the mask (any
; destination register) followed by an xxsel consuming it is expected.
201 define <4 x i32> @test20(<4 x i32> %a, <4 x i32> %b, <4 x i32> %c, <4 x i32> %d) {
203 %m = icmp eq <4 x i32> %c, %d
204 %v = select <4 x i1> %m, <4 x i32> %a, <4 x i32> %b
207 ; CHECK-LABEL: @test20
208 ; CHECK: vcmpequw {{[0-9]+}}, 4, 5
209 ; CHECK: xxsel 34, 35, 34, {{[0-9]+}}
; test21: ordered-equal float compare of %c and %d used as the mask of a
; <4 x float> select. The destination register of xvcmpeqsp is captured as
; V1 and must be the mask operand of the following xxsel.
213 define <4 x float> @test21(<4 x float> %a, <4 x float> %b, <4 x float> %c, <4 x float> %d) {
215 %m = fcmp oeq <4 x float> %c, %d
216 %v = select <4 x i1> %m, <4 x float> %a, <4 x float> %b
219 ; CHECK-LABEL: @test21
220 ; CHECK: xvcmpeqsp [[V1:[0-9]+]], 36, 37
221 ; CHECK: xxsel 34, 35, 34, [[V1]]
; test22: unordered-or-equal (ueq) float compare used as the mask of a
; <4 x float> select. Three xvcmpeqsp compares are expected in any relative
; order (DAG-style checks); two of them compare an operand with itself,
; presumably to detect NaN lanes for the unordered part -- TODO confirm.
; An xxsel consuming the combined mask must follow.
225 define <4 x float> @test22(<4 x float> %a, <4 x float> %b, <4 x float> %c, <4 x float> %d) {
227 %m = fcmp ueq <4 x float> %c, %d
228 %v = select <4 x i1> %m, <4 x float> %a, <4 x float> %b
231 ; CHECK-LABEL: @test22
232 ; CHECK-DAG: xvcmpeqsp {{[0-9]+}}, 37, 37
233 ; CHECK-DAG: xvcmpeqsp {{[0-9]+}}, 36, 36
234 ; CHECK-DAG: xvcmpeqsp {{[0-9]+}}, 36, 37
239 ; CHECK: xxsel 34, 35, 34, {{[0-9]+}}
; test23: integer equality compare used as the mask of a <8 x i16> select;
; a halfword compare vcmpequh followed by an xxsel is expected.
243 define <8 x i16> @test23(<8 x i16> %a, <8 x i16> %b, <8 x i16> %c, <8 x i16> %d) {
245 %m = icmp eq <8 x i16> %c, %d
246 %v = select <8 x i1> %m, <8 x i16> %a, <8 x i16> %b
249 ; CHECK-LABEL: @test23
250 ; CHECK: vcmpequh {{[0-9]+}}, 4, 5
251 ; CHECK: xxsel 34, 35, 34, {{[0-9]+}}
; test24: integer equality compare used as the mask of a <16 x i8> select;
; a byte compare vcmpequb followed by an xxsel is expected.
255 define <16 x i8> @test24(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c, <16 x i8> %d) {
257 %m = icmp eq <16 x i8> %c, %d
258 %v = select <16 x i1> %m, <16 x i8> %a, <16 x i8> %b
261 ; CHECK-LABEL: @test24
262 ; CHECK: vcmpequb {{[0-9]+}}, 4, 5
263 ; CHECK: xxsel 34, 35, 34, {{[0-9]+}}
; test25: ordered-equal double compare used as the mask of a <2 x double>
; select. The destination register of xvcmpeqdp is captured as V1 and must
; be the mask operand of the following xxsel.
267 define <2 x double> @test25(<2 x double> %a, <2 x double> %b, <2 x double> %c, <2 x double> %d) {
269 %m = fcmp oeq <2 x double> %c, %d
270 %v = select <2 x i1> %m, <2 x double> %a, <2 x double> %b
273 ; CHECK-LABEL: @test25
274 ; CHECK: xvcmpeqdp [[V1:[0-9]+]], 36, 37
275 ; CHECK: xxsel 34, 35, 34, [[V1]]
; test26: integer add on <2 x i64>. Only the function label and a note about
; poor code quality are visible here; no specific instruction is pinned in
; this view.
279 define <2 x i64> @test26(<2 x i64> %a, <2 x i64> %b) {
280 %v = add <2 x i64> %a, %b
283 ; CHECK-LABEL: @test26
284 ; FIXME: The code quality here is not good; just make sure we do something for now.
; test27: bitwise and on <2 x i64>; expected to select xxland, as for the
; narrower-element vector types.
290 define <2 x i64> @test27(<2 x i64> %a, <2 x i64> %b) {
291 %v = and <2 x i64> %a, %b
294 ; CHECK-LABEL: @test27
295 ; CHECK: xxland 34, 34, 35
; test28: 16-byte-aligned load of <2 x double> through pointer %a; expected
; to select the indexed vector load lxvd2x.
299 define <2 x double> @test28(<2 x double>* %a) {
300 %v = load <2 x double>* %a, align 16
303 ; CHECK-LABEL: @test28
304 ; CHECK: lxvd2x 34, 0, 3
; test29: 16-byte-aligned store of <2 x double> %b through pointer %a;
; expected to select the indexed vector store stxvd2x.
308 define void @test29(<2 x double>* %a, <2 x double> %b) {
309 store <2 x double> %b, <2 x double>* %a, align 16
312 ; CHECK-LABEL: @test29
313 ; CHECK: stxvd2x 34, 0, 3
; test28u: variant of test28 with the load aligned to 8 bytes instead of 16;
; the same lxvd2x is still expected.
317 define <2 x double> @test28u(<2 x double>* %a) {
318 %v = load <2 x double>* %a, align 8
321 ; CHECK-LABEL: @test28u
322 ; CHECK: lxvd2x 34, 0, 3
; test29u: variant of test29 with the store aligned to 8 bytes instead of 16;
; the same stxvd2x is still expected.
326 define void @test29u(<2 x double>* %a, <2 x double> %b) {
327 store <2 x double> %b, <2 x double>* %a, align 8
330 ; CHECK-LABEL: @test29u
331 ; CHECK: stxvd2x 34, 0, 3
; test30: 16-byte-aligned load of <2 x i64>; expected to use the same
; lxvd2x as the <2 x double> load in test28.
335 define <2 x i64> @test30(<2 x i64>* %a) {
336 %v = load <2 x i64>* %a, align 16
339 ; CHECK-LABEL: @test30
340 ; CHECK: lxvd2x 34, 0, 3
; test31: 16-byte-aligned store of <2 x i64>; expected to use the same
; stxvd2x as the <2 x double> store in test29.
344 define void @test31(<2 x i64>* %a, <2 x i64> %b) {
345 store <2 x i64> %b, <2 x i64>* %a, align 16
348 ; CHECK-LABEL: @test31
349 ; CHECK: stxvd2x 34, 0, 3
; test40: unsigned <2 x i64> to <2 x double> conversion; expected to select
; xvcvuxddp.
353 define <2 x double> @test40(<2 x i64> %a) {
354 %v = uitofp <2 x i64> %a to <2 x double>
357 ; CHECK-LABEL: @test40
358 ; CHECK: xvcvuxddp 34, 34
; test41: signed <2 x i64> to <2 x double> conversion; expected to select
; xvcvsxddp.
362 define <2 x double> @test41(<2 x i64> %a) {
363 %v = sitofp <2 x i64> %a to <2 x double>
366 ; CHECK-LABEL: @test41
367 ; CHECK: xvcvsxddp 34, 34
; test42: <2 x double> to unsigned <2 x i64> conversion; expected to select
; xvcvdpuxds.
371 define <2 x i64> @test42(<2 x double> %a) {
372 %v = fptoui <2 x double> %a to <2 x i64>
375 ; CHECK-LABEL: @test42
376 ; CHECK: xvcvdpuxds 34, 34
; test43: <2 x double> to signed <2 x i64> conversion; expected to select
; xvcvdpsxds.
380 define <2 x i64> @test43(<2 x double> %a) {
381 %v = fptosi <2 x double> %a to <2 x i64>
384 ; CHECK-LABEL: @test43
385 ; CHECK: xvcvdpsxds 34, 34
; test44: unsigned <2 x i64> to <2 x float> conversion. Only the function
; label and a code-quality note are visible here; no specific instruction is
; pinned in this view.
389 define <2 x float> @test44(<2 x i64> %a) {
390 %v = uitofp <2 x i64> %a to <2 x float>
393 ; CHECK-LABEL: @test44
394 ; FIXME: The code quality here looks pretty bad.
; test45: signed <2 x i64> to <2 x float> conversion. Only the function
; label and a code-quality note are visible here; no specific instruction is
; pinned in this view.
398 define <2 x float> @test45(<2 x i64> %a) {
399 %v = sitofp <2 x i64> %a to <2 x float>
402 ; CHECK-LABEL: @test45
403 ; FIXME: The code quality here looks pretty bad.
; test46: <2 x float> to unsigned <2 x i64> conversion. Only the function
; label and a code-quality note are visible here; no specific instruction is
; pinned in this view.
407 define <2 x i64> @test46(<2 x float> %a) {
408 %v = fptoui <2 x float> %a to <2 x i64>
411 ; CHECK-LABEL: @test46
412 ; FIXME: The code quality here looks pretty bad.
; test47: <2 x float> to signed <2 x i64> conversion. Only the function
; label and a code-quality note are visible here; no specific instruction is
; pinned in this view.
416 define <2 x i64> @test47(<2 x float> %a) {
417 %v = fptosi <2 x float> %a to <2 x i64>
420 ; CHECK-LABEL: @test47
421 ; FIXME: The code quality here looks pretty bad.
; test50: a double is loaded from %a and inserted into both lanes of a
; <2 x double> (a splat of the loaded value); the load plus the two inserts
; are expected to become a single lxvdsx.
425 define <2 x double> @test50(double* %a) {
426 %v = load double* %a, align 8
427 %w = insertelement <2 x double> undef, double %v, i32 0
428 %x = insertelement <2 x double> %w, double %v, i32 1
431 ; CHECK-LABEL: @test50
432 ; CHECK: lxvdsx 34, 0, 3
; test51: shuffle with mask <0, 0> (lane 0 of %a in both result lanes);
; expected to select xxpermdi with %a's register as both sources and
; immediate 0.
436 define <2 x double> @test51(<2 x double> %a, <2 x double> %b) {
437 %v = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 0, i32 0>
440 ; CHECK-LABEL: @test51
441 ; CHECK: xxpermdi 34, 34, 34, 0
; test52: shuffle with mask <0, 2> (lane 0 of %a, then lane 0 of %b);
; expected to select xxpermdi with immediate 0.
445 define <2 x double> @test52(<2 x double> %a, <2 x double> %b) {
446 %v = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 0, i32 2>
449 ; CHECK-LABEL: @test52
450 ; CHECK: xxpermdi 34, 34, 35, 0
; test53: shuffle with mask <2, 0> (lane 0 of %b, then lane 0 of %a);
; expected to select xxpermdi with the source operands swapped relative to
; test52 and immediate 0.
454 define <2 x double> @test53(<2 x double> %a, <2 x double> %b) {
455 %v = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 2, i32 0>
458 ; CHECK-LABEL: @test53
459 ; CHECK: xxpermdi 34, 35, 34, 0
; test54: shuffle with mask <1, 2> (lane 1 of %a, then lane 0 of %b);
; expected to select xxpermdi with immediate 2.
463 define <2 x double> @test54(<2 x double> %a, <2 x double> %b) {
464 %v = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 1, i32 2>
467 ; CHECK-LABEL: @test54
468 ; CHECK: xxpermdi 34, 34, 35, 2
; test55: shuffle with mask <1, 3> (lane 1 of %a, then lane 1 of %b);
; expected to select xxpermdi with immediate 3.
472 define <2 x double> @test55(<2 x double> %a, <2 x double> %b) {
473 %v = shufflevector <2 x double> %a, <2 x double> %b, <2 x i32> <i32 1, i32 3>
476 ; CHECK-LABEL: @test55
477 ; CHECK: xxpermdi 34, 34, 35, 3
; test56: the same <1, 3> shuffle as test55 but on <2 x i64>; the same
; xxpermdi with immediate 3 is expected.
481 define <2 x i64> @test56(<2 x i64> %a, <2 x i64> %b) {
482 %v = shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 1, i32 3>
485 ; CHECK-LABEL: @test56
486 ; CHECK: xxpermdi 34, 34, 35, 3
; test60: per-lane shift left on <2 x i64>. Only the function label and a
; note that the operation should scalarize are visible here; no specific
; instruction is pinned in this view.
490 define <2 x i64> @test60(<2 x i64> %a, <2 x i64> %b) {
491 %v = shl <2 x i64> %a, %b
494 ; CHECK-LABEL: @test60
495 ; This should scalarize, and the current code quality is not good.
; test61: per-lane logical shift right on <2 x i64>. Only the function label
; and a note that the operation should scalarize are visible here; no
; specific instruction is pinned in this view.
504 define <2 x i64> @test61(<2 x i64> %a, <2 x i64> %b) {
505 %v = lshr <2 x i64> %a, %b
508 ; CHECK-LABEL: @test61
509 ; This should scalarize, and the current code quality is not good.
; test62: per-lane arithmetic shift right on <2 x i64>. Only the function
; label and a note that the operation should scalarize are visible here; no
; specific instruction is pinned in this view.
518 define <2 x i64> @test62(<2 x i64> %a, <2 x i64> %b) {
519 %v = ashr <2 x i64> %a, %b
522 ; CHECK-LABEL: @test62
523 ; This should scalarize, and the current code quality is not good.
; test63: extract lane 0 of a <2 x double>; expected to be an xxlor whose
; two source operands are the same register (the input vector), writing the
; scalar result register.
532 define double @test63(<2 x double> %a) {
533 %v = extractelement <2 x double> %a, i32 0
536 ; CHECK-LABEL: @test63
537 ; CHECK: xxlor 1, 34, 34
; test64: extract lane 1 of a <2 x double>; expected to be an xxpermdi of
; the input vector with itself and immediate 2, writing the scalar result
; register.
541 define double @test64(<2 x double> %a) {
542 %v = extractelement <2 x double> %a, i32 1
545 ; CHECK-LABEL: @test64
546 ; CHECK: xxpermdi 1, 34, 34, 2
; test65: equality compare on <2 x i64> returning <2 x i1>; the check line
; expects the word-element compare vcmpequw on the two inputs.
550 define <2 x i1> @test65(<2 x i64> %a, <2 x i64> %b) {
551 %w = icmp eq <2 x i64> %a, %b
554 ; CHECK-LABEL: @test65
555 ; CHECK: vcmpequw 2, 2, 3
; test66: inequality compare on <2 x i64> returning <2 x i1>; expected to be
; an equality compare (vcmpequw, any destination register) followed by an
; xxlnor that produces the inverted result.
559 define <2 x i1> @test66(<2 x i64> %a, <2 x i64> %b) {
560 %w = icmp ne <2 x i64> %a, %b
563 ; CHECK-LABEL: @test66
564 ; CHECK: vcmpequw {{[0-9]+}}, 2, 3
565 ; CHECK: xxlnor 34, {{[0-9]+}}, {{[0-9]+}}
; test67: unsigned less-than compare on <2 x i64> returning <2 x i1>. Only
; the function label and a note that the operation should scalarize are
; visible here; no specific instruction is pinned in this view.
569 define <2 x i1> @test67(<2 x i64> %a, <2 x i64> %b) {
570 %w = icmp ult <2 x i64> %a, %b
573 ; CHECK-LABEL: @test67
574 ; This should scalarize, and the current code quality is not good.