1 ; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu -mcpu=corei7 | FileCheck %s
3 ; Test that we correctly fold a shuffle that performs a swizzle of another
4 ; shuffle node according to the rule
5 ; shuffle (shuffle (x, undef, M0), undef, M1) -> shuffle(x, undef, M2)
7 ; We only do this if the resulting mask is legal to avoid introducing an
8 ; illegal shuffle that is expanded into a sub-optimal sequence of instructions
9 ; during lowering stage.
12 define <4 x i32> @swizzle_1(<4 x i32> %v) {
13 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 2, i32 0, i32 1>
14 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 2, i32 0, i32 1>
17 ; CHECK-LABEL: swizzle_1
24 define <4 x i32> @swizzle_2(<4 x i32> %v) {
25 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
26 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
29 ; CHECK-LABEL: swizzle_2
36 define <4 x i32> @swizzle_3(<4 x i32> %v) {
37 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 3, i32 1, i32 0>
38 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 3, i32 1, i32 0>
41 ; CHECK-LABEL: swizzle_3
48 define <4 x i32> @swizzle_4(<4 x i32> %v) {
49 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
50 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
53 ; CHECK-LABEL: swizzle_4
60 define <4 x i32> @swizzle_5(<4 x i32> %v) {
61 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
62 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
65 ; CHECK-LABEL: swizzle_5
72 define <4 x i32> @swizzle_6(<4 x i32> %v) {
73 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
74 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
77 ; CHECK-LABEL: swizzle_6
84 define <4 x i32> @swizzle_7(<4 x i32> %v) {
85 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
86 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
89 ; CHECK-LABEL: swizzle_7
96 define <4 x i32> @swizzle_8(<4 x i32> %v) {
97 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
98 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
101 ; CHECK-LABEL: swizzle_8
108 define <4 x i32> @swizzle_9(<4 x i32> %v) {
109 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
110 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
113 ; CHECK-LABEL: swizzle_9
120 define <4 x i32> @swizzle_10(<4 x i32> %v) {
121 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
122 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
125 ; CHECK-LABEL: swizzle_10
132 define <4 x i32> @swizzle_11(<4 x i32> %v) {
133 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
134 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
137 ; CHECK-LABEL: swizzle_11
144 define <4 x i32> @swizzle_12(<4 x i32> %v) {
145 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
146 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
149 ; CHECK-LABEL: swizzle_12
151 ; CHECK: pshufd $-100
156 define <4 x i32> @swizzle_13(<4 x i32> %v) {
157 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
158 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
161 ; CHECK-LABEL: swizzle_13
168 define <4 x i32> @swizzle_14(<4 x i32> %v) {
169 %1 = shufflevector <4 x i32> %v, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
170 %2 = shufflevector <4 x i32> %1, <4 x i32> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
173 ; CHECK-LABEL: swizzle_14
180 define <4 x float> @swizzle_15(<4 x float> %v) {
181 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 2, i32 0, i32 1>
182 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 2, i32 0, i32 1>
185 ; CHECK-LABEL: swizzle_15
192 define <4 x float> @swizzle_16(<4 x float> %v) {
193 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
194 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 1, i32 0, i32 2>
197 ; CHECK-LABEL: swizzle_16
204 define <4 x float> @swizzle_17(<4 x float> %v) {
205 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 3, i32 1, i32 0>
206 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 3, i32 1, i32 0>
209 ; CHECK-LABEL: swizzle_17
216 define <4 x float> @swizzle_18(<4 x float> %v) {
217 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
218 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 1, i32 3, i32 0>
221 ; CHECK-LABEL: swizzle_18
223 ; CHECK: pshufd $-121
228 define <4 x float> @swizzle_19(<4 x float> %v) {
229 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
230 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 0>
233 ; CHECK-LABEL: swizzle_19
240 define <4 x float> @swizzle_20(<4 x float> %v) {
241 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
242 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 2, i32 0, i32 3>
245 ; CHECK-LABEL: swizzle_20
252 define <4 x float> @swizzle_21(<4 x float> %v) {
253 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
254 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 0, i32 3, i32 1, i32 2>
257 ; CHECK-LABEL: swizzle_21
264 define <4 x float> @swizzle_22(<4 x float> %v) {
265 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
266 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 2, i32 1>
269 ; CHECK-LABEL: swizzle_22
276 define <4 x float> @swizzle_23(<4 x float> %v) {
277 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
278 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 3, i32 0, i32 1, i32 2>
281 ; CHECK-LABEL: swizzle_23
288 define <4 x float> @swizzle_24(<4 x float> %v) {
289 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
290 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 1, i32 3>
293 ; CHECK-LABEL: swizzle_24
300 define <4 x float> @swizzle_25(<4 x float> %v) {
301 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
302 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 2, i32 0, i32 3, i32 1>
305 ; CHECK-LABEL: swizzle_25
312 define <4 x float> @swizzle_26(<4 x float> %v) {
313 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
314 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 0, i32 2, i32 3, i32 1>
317 ; CHECK-LABEL: swizzle_26
319 ; CHECK: pshufd $-100
324 define <4 x float> @swizzle_27(<4 x float> %v) {
325 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
326 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 0, i32 2>
329 ; CHECK-LABEL: swizzle_27
336 define <4 x float> @swizzle_28(<4 x float> %v) {
337 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
338 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 3, i32 2, i32 0>
341 ; CHECK-LABEL: swizzle_28
348 define <4 x float> @swizzle_29(<4 x float> %v) {
349 %1 = shufflevector <4 x float> %v, <4 x float> undef, <4 x i32> <i32 3, i32 1, i32 2, i32 0>
350 %2 = shufflevector <4 x float> %1, <4 x float> undef, <4 x i32> <i32 1, i32 0, i32 2, i32 3>
353 ; CHECK-LABEL: swizzle_29
359 ; Make sure that we combine the shuffles from each function below into a single
360 ; legal shuffle (either pshuflw or pshufb depending on the masks).
362 define <8 x i16> @swizzle_30(<8 x i16> %v) {
363 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 3, i32 1, i32 2, i32 0, i32 7, i32 5, i32 6, i32 4>
364 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 2, i32 3, i32 7, i32 5, i32 6, i32 4>
367 ; CHECK-LABEL: swizzle_30
368 ; Mask: [1,3,2,0,5,7,6,4]
374 define <8 x i16> @swizzle_31(<8 x i16> %v) {
375 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 3, i32 0, i32 2, i32 1, i32 7, i32 5, i32 6, i32 4>
376 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 3, i32 0, i32 2, i32 1, i32 7, i32 5, i32 6, i32 4>
379 ; CHECK-LABEL: swizzle_31
380 ; Mask: [1,3,2,0,4,5,6,7]
386 define <8 x i16> @swizzle_32(<8 x i16> %v) {
387 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 1, i32 2, i32 3, i32 0, i32 7, i32 5, i32 6, i32 4>
388 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 1, i32 2, i32 3, i32 0, i32 7, i32 5, i32 6, i32 4>
391 ; CHECK-LABEL: swizzle_32
392 ; Mask: [2,3,0,1,4,5,6,7] --> equivalent to pshufd mask [1,0,2,3]
397 define <8 x i16> @swizzle_33(<8 x i16> %v) {
398 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 5, i32 7, i32 2, i32 3, i32 1, i32 0>
399 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 5, i32 7, i32 2, i32 3, i32 1, i32 0>
402 ; CHECK-LABEL: swizzle_33
409 define <8 x i16> @swizzle_34(<8 x i16> %v) {
410 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 7, i32 6, i32 5, i32 1, i32 2, i32 0, i32 3>
411 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 7, i32 6, i32 5, i32 1, i32 2, i32 0, i32 3>
414 ; CHECK-LABEL: swizzle_34
421 define <8 x i16> @swizzle_35(<8 x i16> %v) {
422 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 7, i32 4, i32 6, i32 5, i32 1, i32 3, i32 0, i32 2>
423 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 7, i32 4, i32 6, i32 5, i32 1, i32 3, i32 0, i32 2>
426 ; CHECK-LABEL: swizzle_35
432 define <8 x i16> @swizzle_36(<8 x i16> %v) {
433 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 7, i32 5, i32 0, i32 1, i32 3, i32 2>
434 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 4, i32 6, i32 7, i32 5, i32 0, i32 1, i32 3, i32 2>
437 ; CHECK-LABEL: swizzle_36
444 define <8 x i16> @swizzle_37(<8 x i16> %v) {
445 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 7, i32 5, i32 6, i32 4>
446 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 7, i32 4, i32 6, i32 5>
449 ; CHECK-LABEL: swizzle_37
450 ; Mask: [0,1,2,3,4,7,6,5]
451 ; CHECK: pshufhw $108
456 define <8 x i16> @swizzle_38(<8 x i16> %v) {
457 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 5, i32 6, i32 4, i32 7, i32 0, i32 2, i32 1, i32 3>
458 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 5, i32 6, i32 4, i32 7, i32 0, i32 2, i32 1, i32 3>
461 ; CHECK-LABEL: swizzle_38
468 define <8 x i16> @swizzle_39(<8 x i16> %v) {
469 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 5, i32 4, i32 6, i32 7, i32 3, i32 2, i32 1, i32 0>
470 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 5, i32 4, i32 6, i32 7, i32 3, i32 2, i32 1, i32 0>
473 ; CHECK-LABEL: swizzle_39
480 define <8 x i16> @swizzle_40(<8 x i16> %v) {
481 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 6, i32 4, i32 7, i32 5, i32 1, i32 0, i32 3, i32 2>
482 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 6, i32 4, i32 7, i32 5, i32 1, i32 0, i32 3, i32 2>
485 ; CHECK-LABEL: swizzle_40
492 define <8 x i16> @swizzle_41(<8 x i16> %v) {
493 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 6, i32 7, i32 5, i32 4, i32 0, i32 1, i32 3, i32 2>
494 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 6, i32 7, i32 5, i32 4, i32 0, i32 1, i32 3, i32 2>
497 ; CHECK-LABEL: swizzle_41
504 define <8 x i16> @swizzle_42(<8 x i16> %v) {
505 %1 = shufflevector <8 x i16> %v, <8 x i16> undef, <8 x i32> <i32 0, i32 1, i32 3, i32 2, i32 7, i32 6, i32 4, i32 5>
506 %2 = shufflevector <8 x i16> %1, <8 x i16> undef, <8 x i32> <i32 0, i32 1, i32 3, i32 2, i32 7, i32 6, i32 4, i32 5>
509 ; CHECK-LABEL: swizzle_42
510 ; Mask: [0,1,2,3,5,4,7,6]
511 ; CHECK: pshufhw $-79