define <32 x i8> @foo(<48 x i8>* %x0, <16 x i32> %x1, <16 x i32> %x2) {
; CHECK-LABEL: foo:
; CHECK: # BB#0:
-; CHECK-NEXT: vmovdqu 32(%rdi), %xmm0
-; CHECK-NEXT: vmovdqu (%rdi), %ymm1
-; CHECK-NEXT: vextracti128 $1, %ymm1, %xmm2
-; CHECK-NEXT: vpextrb $0, %xmm2, %eax
-; CHECK-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[0,1,3,4,6,7,9,10,12,13,15],zero,zero,zero,zero,zero
-; CHECK-NEXT: vpinsrb $11, %eax, %xmm1, %xmm1
-; CHECK-NEXT: vpextrb $2, %xmm2, %eax
-; CHECK-NEXT: vpinsrb $12, %eax, %xmm1, %xmm1
-; CHECK-NEXT: vpextrb $3, %xmm2, %eax
-; CHECK-NEXT: vpinsrb $13, %eax, %xmm1, %xmm1
-; CHECK-NEXT: vpextrb $5, %xmm2, %eax
-; CHECK-NEXT: vpinsrb $14, %eax, %xmm1, %xmm1
-; CHECK-NEXT: vpextrb $6, %xmm2, %eax
-; CHECK-NEXT: vpinsrb $15, %eax, %xmm1, %xmm1
-; CHECK-NEXT: vpextrb $1, %xmm0, %eax
-; CHECK-NEXT: vpshufb {{.*#+}} xmm2 = xmm2[8,9,11,12,14,15],zero,zero,zero,zero,zero,zero,zero,zero,zero,zero
-; CHECK-NEXT: vpinsrb $6, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $2, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $7, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $4, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $8, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $5, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $9, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $7, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $10, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $8, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $11, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $10, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $12, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $11, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $13, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $13, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $14, %eax, %xmm2, %xmm2
-; CHECK-NEXT: vpextrb $14, %xmm0, %eax
-; CHECK-NEXT: vpinsrb $15, %eax, %xmm2, %xmm0
-; CHECK-NEXT: vinserti128 $1, %xmm0, %ymm1, %ymm0
+; CHECK-NEXT: vmovdqu (%rdi), %ymm0
+; CHECK-NEXT: vmovdqu 32(%rdi), %xmm1
+; CHECK-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[u,u,u,u,u,u,1,2,4,5,7,8,10,11,13,14]
+; CHECK-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm1
+; CHECK-NEXT: vextracti128 $1, %ymm0, %xmm2
+; CHECK-NEXT: vpshufb {{.*#+}} xmm3 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm2[0,2,3,5,6]
+; CHECK-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,1,3,4,6,7,9,10,12,13,15],zero,zero,zero,zero,zero
+; CHECK-NEXT: vpor %xmm3, %xmm0, %xmm0
+; CHECK-NEXT: vpshufb {{.*#+}} xmm2 = xmm2[8,9,11,12,14,15,u,u,u,u,u,u,u,u,u,u]
+; CHECK-NEXT: vinserti128 $1, %xmm2, %ymm0, %ymm0
+; CHECK-NEXT: vmovdqa {{.*#+}} ymm2 = [255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,255,0,0,0,0,0,0,0,0,0,0]
+; CHECK-NEXT: vpblendvb %ymm2, %ymm0, %ymm1, %ymm0
; CHECK-NEXT: retq
  %1 = load <48 x i8>, <48 x i8>* %x0, align 1
  %2 = shufflevector <48 x i8> %1, <48 x i8> undef, <32 x i32> <i32 0, i32 1, i32 3, i32 4, i32 6, i32 7, i32 9, i32 10, i32 12, i32 13, i32 15, i32 16, i32 18, i32 19, i32 21, i32 22, i32 24, i32 25, i32 27, i32 28, i32 30, i32 31, i32 33, i32 34, i32 36, i32 37, i32 39, i32 40, i32 42, i32 43, i32 45, i32 46>