diff --git a/llvm/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp b/llvm/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp --- a/llvm/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp +++ b/llvm/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp @@ -251,9 +251,9 @@ STM, KernelName, getAmdhsaKernelDescriptor(*MF, CurrentProgramInfo), CurrentProgramInfo.NumVGPRsForWavesPerEU, CurrentProgramInfo.NumSGPRsForWavesPerEU - - IsaInfo::getNumExtraSGPRs(&STM, - CurrentProgramInfo.VCCUsed, - CurrentProgramInfo.FlatUsed), + IsaInfo::getNumExtraSGPRs( + &STM, CurrentProgramInfo.VCCUsed, CurrentProgramInfo.FlatUsed, + getTargetStreamer()->getTargetID()->isXnackOnOrAny()), CurrentProgramInfo.VCCUsed, CurrentProgramInfo.FlatUsed, CodeObjectVersion); @@ -721,7 +721,8 @@ // duplicated in part in AMDGPUAsmParser::calculateGPRBlocks, and could be // unified. unsigned ExtraSGPRs = IsaInfo::getNumExtraSGPRs( - &STM, ProgInfo.VCCUsed, ProgInfo.FlatUsed); + &STM, ProgInfo.VCCUsed, ProgInfo.FlatUsed, + getTargetStreamer()->getTargetID()->isXnackOnOrAny()); // Check the addressable register limit before we add ExtraSGPRs. if (STM.getGeneration() >= AMDGPUSubtarget::VOLCANIC_ISLANDS && diff --git a/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-any.ll b/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-any.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-any.ll @@ -0,0 +1,22 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a < %s | FileCheck --check-prefixes=ASM %s +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a --filetype=obj < %s | llvm-objdump -s -j .rodata - | FileCheck --check-prefixes=OBJ %s + +define amdgpu_kernel void @kern() { +; ASM-LABEL: kern: +; ASM: .amdhsa_next_free_sgpr 5 +; ASM: .amdhsa_reserve_xnack_mask 1 + +; Verify that an extra SGPR block is reserved with XNACK "any" tid setting. +; OBJ: Contents of section .rodata: +; OBJ-NEXT: 0000 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0010 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0020 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0030 4000af00 88000000 01000000 00000000 @............... +entry: + tail call void asm sideeffect "", "~{s[0:4]}"() + ret void +} + +!llvm.module.flags = !{!0} +!0 = !{i32 1, !"amdgpu_code_object_version", i32 400} diff --git a/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-off.ll b/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-off.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-off.ll @@ -0,0 +1,22 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -mattr=-xnack < %s | FileCheck --check-prefixes=ASM %s +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -mattr=-xnack --filetype=obj < %s | llvm-objdump -s -j .rodata - | FileCheck --check-prefixes=OBJ %s + +define amdgpu_kernel void @kern() { +; ASM-LABEL: kern: +; ASM: .amdhsa_next_free_sgpr 5 +; ASM: .amdhsa_reserve_xnack_mask 0 + +; Verify that an extra SGPR block is not reserved with XNACK "off" tid setting. +; OBJ: Contents of section .rodata: +; OBJ-NEXT: 0000 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0010 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0020 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0030 0000af00 88000000 01000000 00000000 ................ +entry: + tail call void asm sideeffect "", "~{s[0:4]}"() + ret void +} + +!llvm.module.flags = !{!0} +!0 = !{i32 1, !"amdgpu_code_object_version", i32 400} diff --git a/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-on.ll b/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-on.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/AMDGPU/tid-kd-xnack-on.ll @@ -0,0 +1,22 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -mattr=+xnack < %s | FileCheck --check-prefixes=ASM %s +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -mattr=+xnack --filetype=obj < %s | llvm-objdump -s -j .rodata - | FileCheck --check-prefixes=OBJ %s + +define amdgpu_kernel void @kern() { +; ASM-LABEL: kern: +; ASM: .amdhsa_next_free_sgpr 5 +; ASM: .amdhsa_reserve_xnack_mask 1 + +; Verify that an extra SGPR block is reserved with XNACK "on" tid setting. +; OBJ: Contents of section .rodata: +; OBJ-NEXT: 0000 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0010 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0020 00000000 00000000 00000000 00000000 ................ +; OBJ-NEXT: 0030 4000af00 88000000 01000000 00000000 @............... +entry: + tail call void asm sideeffect "", "~{s[0:4]}"() + ret void +} + +!llvm.module.flags = !{!0} +!0 = !{i32 1, !"amdgpu_code_object_version", i32 400}