@@ -1553,12 +1553,19 @@ define <8 x i32> @shuffle_v8i32_08991abb(<8 x i32> %a, <8 x i32> %b) {
1553
1553
; AVX2-NEXT: vpblendd {{.*#+}} ymm0 = ymm0[0],ymm1[1,2,3],ymm0[4],ymm1[5,6,7]
1554
1554
; AVX2-NEXT: retq
1555
1555
;
1556
- ; AVX512VL-LABEL: shuffle_v8i32_08991abb:
1557
- ; AVX512VL: # %bb.0:
1558
- ; AVX512VL-NEXT: vpmovzxdq {{.*#+}} xmm2 = xmm0[0],zero,xmm0[1],zero
1559
- ; AVX512VL-NEXT: vmovdqa {{.*#+}} ymm0 = [8,0,1,1,10,2,3,3]
1560
- ; AVX512VL-NEXT: vpermi2d %ymm2, %ymm1, %ymm0
1561
- ; AVX512VL-NEXT: retq
1556
+ ; AVX512VL-SLOW-LABEL: shuffle_v8i32_08991abb:
1557
+ ; AVX512VL-SLOW: # %bb.0:
1558
+ ; AVX512VL-SLOW-NEXT: vpmovzxdq {{.*#+}} xmm2 = xmm0[0],zero,xmm0[1],zero
1559
+ ; AVX512VL-SLOW-NEXT: vmovdqa {{.*#+}} ymm0 = [8,0,1,1,10,2,3,3]
1560
+ ; AVX512VL-SLOW-NEXT: vpermi2d %ymm2, %ymm1, %ymm0
1561
+ ; AVX512VL-SLOW-NEXT: retq
1562
+ ;
1563
+ ; AVX512VL-FAST-LABEL: shuffle_v8i32_08991abb:
1564
+ ; AVX512VL-FAST: # %bb.0:
1565
+ ; AVX512VL-FAST-NEXT: vmovdqa {{.*#+}} ymm2 = [8,0,1,1,9,2,3,3]
1566
+ ; AVX512VL-FAST-NEXT: vpermi2d %ymm0, %ymm1, %ymm2
1567
+ ; AVX512VL-FAST-NEXT: vmovdqa %ymm2, %ymm0
1568
+ ; AVX512VL-FAST-NEXT: retq
1562
1569
%shuffle = shufflevector <8 x i32> %a, <8 x i32> %b, <8 x i32> <i32 0, i32 8, i32 9, i32 9, i32 1, i32 10, i32 11, i32 11>
1563
1570
ret <8 x i32 > %shuffle
1564
1571
}
@@ -1605,9 +1612,9 @@ define <8 x i32> @shuffle_v8i32_09ab1def(<8 x i32> %a, <8 x i32> %b) {
1605
1612
;
1606
1613
; AVX512VL-FAST-LABEL: shuffle_v8i32_09ab1def:
1607
1614
; AVX512VL-FAST: # %bb.0:
1608
- ; AVX512VL-FAST-NEXT: vpmovzxdq {{.*#+}} xmm2 = xmm0[0],zero,xmm0[1],zero
1609
- ; AVX512VL-FAST-NEXT: vmovdqa {{.*#+}} ymm0 = [8,1,2,3,10,5,6,7]
1610
- ; AVX512VL-FAST-NEXT: vpermi2d %ymm2, %ymm1, %ymm0
1615
+ ; AVX512VL-FAST-NEXT: vmovdqa {{.*#+}} ymm2 = [8,1,2,3,9,5,6,7]
1616
+ ; AVX512VL-FAST-NEXT: vpermi2d %ymm0, %ymm1, %ymm2
1617
+ ; AVX512VL-FAST-NEXT: vmovdqa %ymm2, %ymm0
1611
1618
; AVX512VL-FAST-NEXT: retq
1612
1619
%shuffle = shufflevector <8 x i32> %a, <8 x i32> %b, <8 x i32> <i32 0, i32 9, i32 10, i32 11, i32 1, i32 13, i32 14, i32 15>
1613
1620
ret <8 x i32 > %shuffle
0 commit comments