|
1 | 1 | ; RUN: llc -march=amdgcn -mcpu=gfx901 -mattr=-flat-for-global -verify-machineinstrs < %s | FileCheck -check-prefix=GFX9 -check-prefix=GCN %s
|
2 |
| -; RUN: llc -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -verify-machineinstrs < %s | FileCheck -check-prefix=VI -check-prefix=GCN %s |
| 2 | +; RUN: llc -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=VI %s |
3 | 3 |
|
4 | 4 | ; FIXME: Need to handle the non-uniform case for the function below (a load without a getelementptr).
|
5 | 5 | ; GCN-LABEL: {{^}}v_test_add_v2i16:
|
6 | 6 | ; GFX9: v_pk_add_u16 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}}
|
7 | 7 |
|
8 |
| -; VI: v_add_u16_e32 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}} |
| 8 | +; VI: v_add_u16_sdwa v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}} |
9 | 9 | ; VI: v_add_u16_e32 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}}
|
10 | 10 | define amdgpu_kernel void @v_test_add_v2i16(<2 x i16> addrspace(1)* %out, <2 x i16> addrspace(1)* %in0, <2 x i16> addrspace(1)* %in1) #1 {
|
11 | 11 | %tid = call i32 @llvm.amdgcn.workitem.id.x()
|
@@ -53,7 +53,7 @@ define amdgpu_kernel void @s_test_add_self_v2i16(<2 x i16> addrspace(1)* %out, <
|
53 | 53 | ; GFX9: v_pk_add_u16 v{{[0-9]+}}, v{{[0-9]+}}, s{{[0-9]+}}
|
54 | 54 |
|
55 | 55 | ; VI: v_add_i32
|
56 |
| -; VI: v_add_i32 |
| 56 | +; VI: v_add_i32_sdwa |
57 | 57 | define amdgpu_kernel void @s_test_add_v2i16_kernarg(<2 x i16> addrspace(1)* %out, <2 x i16> %a, <2 x i16> %b) #1 {
|
58 | 58 | %add = add <2 x i16> %a, %b
|
59 | 59 | store <2 x i16> %add, <2 x i16> addrspace(1)* %out
|
@@ -257,7 +257,7 @@ define amdgpu_kernel void @v_test_add_v2i16_sext_to_v2i32(<2 x i32> addrspace(1)
|
257 | 257 | ; GFX9: v_pk_add_u16
|
258 | 258 | ; GFX9: v_lshrrev_b32_e32 v{{[0-9]+}}, 16, v{{[0-9]+}}
|
259 | 259 |
|
260 |
| -; VI: v_add_u16_e32 |
| 260 | +; VI: v_add_u16_sdwa |
261 | 261 | ; VI: v_add_u16_e32
|
262 | 262 |
|
263 | 263 | ; GCN: v_bfe_i32 v{{[0-9]+}}, v{{[0-9]+}}, 0, 16
|
|
0 commit comments