Index: lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp =================================================================== --- lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp +++ lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp @@ -251,7 +251,7 @@ const AMDGPUSubtarget &STM = MF.getSubtarget(); MCContext &Context = getObjFileLowering().getContext(); - if (!STM.isAmdHsaOS()) { + if (!STM.isAmdHsaOS() && !STM.isAmdPalOS()) { MCSectionELF *ConfigSection = Context.getELFSection(".AMDGPU.config", ELF::SHT_PROGBITS, 0); OutStreamer->SwitchSection(ConfigSection); @@ -270,7 +270,7 @@ if (STM.isAmdPalOS()) EmitPalMetadata(MF, CurrentProgramInfo); - if (!STM.isAmdHsaOS()) { + else if (!STM.isAmdHsaOS()) { EmitProgramInfoSI(MF, CurrentProgramInfo); } } else { @@ -935,26 +935,21 @@ OutStreamer->EmitIntValue(RsrcReg, 4); OutStreamer->EmitIntValue(S_00B028_VGPRS(CurrentProgramInfo.VGPRBlocks) | S_00B028_SGPRS(CurrentProgramInfo.SGPRBlocks), 4); - unsigned Rsrc2Val = 0; if (STM.isVGPRSpillingEnabled(*MF.getFunction())) { OutStreamer->EmitIntValue(R_0286E8_SPI_TMPRING_SIZE, 4); OutStreamer->EmitIntValue(S_0286E8_WAVESIZE(CurrentProgramInfo.ScratchBlocks), 4); - if (TM.getTargetTriple().getOS() == Triple::AMDPAL) - Rsrc2Val = S_00B84C_SCRATCH_EN(CurrentProgramInfo.ScratchBlocks > 0); - } - if (MF.getFunction()->getCallingConv() == CallingConv::AMDGPU_PS) { - OutStreamer->EmitIntValue(R_0286CC_SPI_PS_INPUT_ENA, 4); - OutStreamer->EmitIntValue(MFI->getPSInputEnable(), 4); - OutStreamer->EmitIntValue(R_0286D0_SPI_PS_INPUT_ADDR, 4); - OutStreamer->EmitIntValue(MFI->getPSInputAddr(), 4); - Rsrc2Val |= S_00B02C_EXTRA_LDS_SIZE(CurrentProgramInfo.LDSBlocks); - } - if (Rsrc2Val) { - OutStreamer->EmitIntValue(RsrcReg + 4 /*rsrc2*/, 4); - OutStreamer->EmitIntValue(Rsrc2Val, 4); } } + if (MF.getFunction()->getCallingConv() == CallingConv::AMDGPU_PS) { + OutStreamer->EmitIntValue(R_00B02C_SPI_SHADER_PGM_RSRC2_PS, 4); + OutStreamer->EmitIntValue(S_00B02C_EXTRA_LDS_SIZE(CurrentProgramInfo.LDSBlocks), 4); + OutStreamer->EmitIntValue(R_0286CC_SPI_PS_INPUT_ENA, 4); + OutStreamer->EmitIntValue(MFI->getPSInputEnable(), 4); + OutStreamer->EmitIntValue(R_0286D0_SPI_PS_INPUT_ADDR, 4); + OutStreamer->EmitIntValue(MFI->getPSInputAddr(), 4); + } + OutStreamer->EmitIntValue(R_SPILLED_SGPRS, 4); OutStreamer->EmitIntValue(MFI->getNumSpilledSGPRs(), 4); OutStreamer->EmitIntValue(R_SPILLED_VGPRS, 4); Index: test/CodeGen/AMDGPU/amdpal.ll =================================================================== --- test/CodeGen/AMDGPU/amdpal.ll +++ test/CodeGen/AMDGPU/amdpal.ll @@ -1,7 +1,7 @@ ; RUN: llc < %s -mtriple=amdgcn--amdpal -mcpu=tahiti | FileCheck --check-prefix=PAL --enable-var-scope %s -; PAL: .AMDGPU.config - +; PAL-NOT: .AMDGPU.config +; PAL-LABEL: {{^}}simple: define amdgpu_kernel void @simple(i32 addrspace(1)* %out) { entry: store i32 0, i32 addrspace(1)* %out