Diff 497384

llvm/lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

//===- AMDGPUAsmParser.cpp - Parse SI asm to MCInst instructions ----------===//		//===- AMDGPUAsmParser.cpp - Parse SI asm to MCInst instructions ----------===//
//		//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.		// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "AMDKernelCodeT.h"		#include "AMDKernelCodeT.h"
#include "MCTargetDesc/AMDGPUMCTargetDesc.h"		#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
		foadUnsubmitted Not Done Reply Inline Actions I think the idea is that the assembler should not include any of the "codegen" parts of the backend. If getNSAMaxSize needs to be shared by codegen and the assembler, it should be moved into AMDGPUBaseInfo - that is why AMDGPUBaseInfo exists. foad: I think the idea is that the assembler should not include any of the "codegen" parts of the…
		mbrkusaninAuthorUnsubmitted Done Reply Inline Actions Moved to AMDGPUBaseInfo. mbrkusanin: Moved to AMDGPUBaseInfo.
#include "MCTargetDesc/AMDGPUTargetStreamer.h"		#include "MCTargetDesc/AMDGPUTargetStreamer.h"
#include "SIDefines.h"		#include "SIDefines.h"
#include "SIInstrInfo.h"		#include "SIInstrInfo.h"
#include "SIRegisterInfo.h"		#include "SIRegisterInfo.h"
#include "TargetInfo/AMDGPUTargetInfo.h"		#include "TargetInfo/AMDGPUTargetInfo.h"
#include "Utils/AMDGPUAsmUtils.h"		#include "Utils/AMDGPUAsmUtils.h"
#include "Utils/AMDGPUBaseInfo.h"		#include "Utils/AMDGPUBaseInfo.h"
#include "Utils/AMDKernelCodeTUtils.h"		#include "Utils/AMDKernelCodeTUtils.h"
▲ Show 20 Lines • Show All 3,659 Lines • ▼ Show 20 Lines	bool AMDGPUAsmParser::validateMIMGAddrSize(const MCInst &Inst) {
unsigned ActualAddrSize =		unsigned ActualAddrSize =
IsNSA ? SrsrcIdx - VAddr0Idx		IsNSA ? SrsrcIdx - VAddr0Idx
: AMDGPU::getRegOperandSize(getMRI(), Desc, VAddr0Idx) / 4;		: AMDGPU::getRegOperandSize(getMRI(), Desc, VAddr0Idx) / 4;
bool IsA16 = (A16Idx != -1 && Inst.getOperand(A16Idx).getImm());		bool IsA16 = (A16Idx != -1 && Inst.getOperand(A16Idx).getImm());

unsigned ExpectedAddrSize =		unsigned ExpectedAddrSize =
AMDGPU::getAddrSizeMIMGOp(BaseOpcode, DimInfo, IsA16, hasG16());		AMDGPU::getAddrSizeMIMGOp(BaseOpcode, DimInfo, IsA16, hasG16());

if (!IsNSA) {		if (IsNSA) {
		if (isGFX11() && ExpectedAddrSize > 5) { // PartialNSA
		arsenmUnsubmitted Not Done Reply Inline Actions Should try to avoid raw generation checks and have some feature for this arsenm: Should try to avoid raw generation checks and have some feature for this
		int VAddrLastIdx =
		AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::vaddr4);
		unsigned VAddrLastSize =
		AMDGPU::getRegOperandSize(getMRI(), Desc, VAddrLastIdx) / 4;

		return VAddrLastIdx - VAddr0Idx + VAddrLastSize == ExpectedAddrSize;
		}
		} else {
if (ExpectedAddrSize > 12)		if (ExpectedAddrSize > 12)
ExpectedAddrSize = 16;		ExpectedAddrSize = 16;

// Allow oversized 8 VGPR vaddr when only 5/6/7 VGPRs are required.		// Allow oversized 8 VGPR vaddr when only 5/6/7 VGPRs are required.
// This provides backward compatibility for assembly created		// This provides backward compatibility for assembly created
// before 160b/192b/224b types were directly supported.		// before 160b/192b/224b types were directly supported.
if (ActualAddrSize == 8 && (ExpectedAddrSize >= 5 && ExpectedAddrSize <= 7))		if (ActualAddrSize == 8 && (ExpectedAddrSize >= 5 && ExpectedAddrSize <= 7))
return true;		return true;
▲ Show 20 Lines • Show All 5,571 Lines • Show Last 20 Lines

llvm/lib/Target/AMDGPU/Disassembler/AMDGPUDisassembler.cpp

Show First 20 Lines • Show All 877 Lines • ▼ Show 20 Lines if (BaseOpcode->BVH) {

if (AMDGPU::hasNamedOperand(MI.getOpcode(), AMDGPU::OpName::a16)) if (AMDGPU::hasNamedOperand(MI.getOpcode(), AMDGPU::OpName::a16))

addOperand(MI, MCOperand::createImm(1)); addOperand(MI, MCOperand::createImm(1));

return MCDisassembler::Success; return MCDisassembler::Success;

} }

bool IsAtomic = (VDstIdx != -1); bool IsAtomic = (VDstIdx != -1);

bool IsGather4 = MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::Gather4; bool IsGather4 = MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::Gather4;

bool IsNSA = false; bool IsNSA = false;

bool PartialNSA = false;

unsigned AddrSize = Info->VAddrDwords; unsigned AddrSize = Info->VAddrDwords;

if (isGFX10Plus()) { if (isGFX10Plus()) {

unsigned DimIdx = unsigned DimIdx =

AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::dim); AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::dim);

int A16Idx = int A16Idx =

AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::a16); AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::a16);

const AMDGPU::MIMGDimInfo *Dim = const AMDGPU::MIMGDimInfo *Dim =

AMDGPU::getMIMGDimInfoByEncoding(MI.getOperand(DimIdx).getImm()); AMDGPU::getMIMGDimInfoByEncoding(MI.getOperand(DimIdx).getImm());

const bool IsA16 = (A16Idx != -1 && MI.getOperand(A16Idx).getImm()); const bool IsA16 = (A16Idx != -1 && MI.getOperand(A16Idx).getImm());

AddrSize = AddrSize =

AMDGPU::getAddrSizeMIMGOp(BaseOpcode, Dim, IsA16, AMDGPU::hasG16(STI)); AMDGPU::getAddrSizeMIMGOp(BaseOpcode, Dim, IsA16, AMDGPU::hasG16(STI));

IsNSA = Info->MIMGEncoding == AMDGPU::MIMGEncGfx10NSA || IsNSA = Info->MIMGEncoding == AMDGPU::MIMGEncGfx10NSA ||

Info->MIMGEncoding == AMDGPU::MIMGEncGfx11NSA; Info->MIMGEncoding == AMDGPU::MIMGEncGfx11NSA;

if (!IsNSA) { if (!IsNSA) {

if (AddrSize > 12) if (AddrSize > 12)

AddrSize = 16; AddrSize = 16;

} else { } else {

if (AddrSize > Info->VAddrDwords) { if (AddrSize > Info->VAddrDwords) {

// The NSA encoding does not contain enough operands for the combination if (isGFX11Plus())

// of base opcode / dimension. Should this be an error? PartialNSA = true;

else

// The NSA encoding does not contain enough operands for the

// combination of base opcode / dimension. Should this be an error?

return MCDisassembler::Success; return MCDisassembler::Success;

foadUnsubmitted

Not Done

if (AddrSize > Info->VAddrDwords) {

- if (isGFX11Plus())

- PartialNSA = true;

- else

+ if (!isGFX11Plus()) {

// The NSA encoding does not contain enough operands for the

// combination of base opcode / dimension. Should this be an error?

return MCDisassembler::Success;

- }

+ }

+ PartialNSA = true;

+ }

}

foad:

foadUnsubmitted

Not Done

This should check !hasPartialNSAEncoding?

foad: This should check `!hasPartialNSAEncoding`?

mbrkusaninAuthorUnsubmitted

Done

Sure, it can.
Also changed isGFX10Plus() to STI.hasFeature(AMDGPU::FeatureNSAEncoding) below.

mbrkusanin: Sure, it can. Also changed isGFX10Plus() to STI.hasFeature(AMDGPU::FeatureNSAEncoding) below.

} }

unsigned DMask = MI.getOperand(DMaskIdx).getImm() & 0xf; unsigned DMask = MI.getOperand(DMaskIdx).getImm() & 0xf;

unsigned DstSize = IsGather4 ? 4 : std::max(llvm::popcount(DMask), 1); unsigned DstSize = IsGather4 ? 4 : std::max(llvm::popcount(DMask), 1);

bool D16 = D16Idx >= 0 && MI.getOperand(D16Idx).getImm(); bool D16 = D16Idx >= 0 && MI.getOperand(D16Idx).getImm();

Show All 26 Lines NewVdata = MRI.getMatchingSuperReg(Vdata0, AMDGPU::sub0,

&MRI.getRegClass(DataRCID)); &MRI.getRegClass(DataRCID));

if (NewVdata == AMDGPU::NoRegister) { if (NewVdata == AMDGPU::NoRegister) {

// It's possible to encode this such that the low register + enabled // It's possible to encode this such that the low register + enabled

// components exceeds the register count. // components exceeds the register count.

return MCDisassembler::Success; return MCDisassembler::Success;

} }

// If not using NSA on GFX10+, widen address register to correct size. // For GFX11 vaddr4 provides all additional components in sequential VGPRs if

unsigned NewVAddr0 = AMDGPU::NoRegister; // more than 5 vaddrs are needed.

foadUnsubmitted

Not Done

"more than"

foad: "more th**a**n"

if (isGFX10Plus() && !IsNSA && AddrSize != Info->VAddrDwords) { int16_t VAddrSAOp =

unsigned VAddr0 = MI.getOperand(VAddr0Idx).getReg(); (isGFX11() && PartialNSA) ? AMDGPU::OpName::vaddr4 : AMDGPU::OpName::vaddr0;

unsigned VAddrSub0 = MRI.getSubReg(VAddr0, AMDGPU::sub0); int VAddrSAIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), VAddrSAOp);

VAddr0 = (VAddrSub0 != 0) ? VAddrSub0 : VAddr0;

// If not using NSA on GFX10, widen vaddr0 address register to

// correct size. On GFX11+ widen last address register for partial NSA.

unsigned NewVAddrSA = AMDGPU::NoRegister;

if (isGFX10Plus() && (!IsNSA || PartialNSA) &&

AddrSize != Info->VAddrDwords) {

unsigned VAddrSA = MI.getOperand(VAddrSAIdx).getReg();

unsigned VAddrSubSA = MRI.getSubReg(VAddrSA, AMDGPU::sub0);

VAddrSA = (VAddrSubSA != 0) ? VAddrSubSA : VAddrSA;

auto AddrRCID = MCII->get(NewOpcode).operands()[VAddr0Idx].RegClass; auto AddrRCID = MCII->get(NewOpcode).operands()[VAddrSAIdx].RegClass;

NewVAddr0 = MRI.getMatchingSuperReg(VAddr0, AMDGPU::sub0, NewVAddrSA = MRI.getMatchingSuperReg(VAddrSA, AMDGPU::sub0,

&MRI.getRegClass(AddrRCID)); &MRI.getRegClass(AddrRCID));

if (NewVAddr0 == AMDGPU::NoRegister) if (NewVAddrSA == AMDGPU::NoRegister)

foadUnsubmitted

Not Done

&MRI.getRegClass(AddrRCID));

- if (NewVAddrSA == AMDGPU::NoRegister)

+ if (!NewVAddrSA)

return MCDisassembler::Success;

foad:

return MCDisassembler::Success; return MCDisassembler::Success;

} }

MI.setOpcode(NewOpcode); MI.setOpcode(NewOpcode);

if (NewVdata != AMDGPU::NoRegister) { if (NewVdata != AMDGPU::NoRegister) {

MI.getOperand(VDataIdx) = MCOperand::createReg(NewVdata); MI.getOperand(VDataIdx) = MCOperand::createReg(NewVdata);

if (IsAtomic) { if (IsAtomic) {

// Atomic operations have an additional operand (a copy of data) // Atomic operations have an additional operand (a copy of data)

MI.getOperand(VDstIdx) = MCOperand::createReg(NewVdata); MI.getOperand(VDstIdx) = MCOperand::createReg(NewVdata);

} }

if (NewVAddr0 != AMDGPU::NoRegister) { if (NewVAddrSA != AMDGPU::NoRegister) {

foadUnsubmitted

Not Done

}

- if (NewVAddrSA != AMDGPU::NoRegister) {

+ if (NewVAddrSA) {

MI.getOperand(VAddrSAIdx) = MCOperand::createReg(NewVAddrSA);

foad:

MI.getOperand(VAddr0Idx) = MCOperand::createReg(NewVAddr0); MI.getOperand(VAddrSAIdx) = MCOperand::createReg(NewVAddrSA);

} else if (IsNSA) { } else if (IsNSA) {

assert(AddrSize <= Info->VAddrDwords); assert(AddrSize <= Info->VAddrDwords);

MI.erase(MI.begin() + VAddr0Idx + AddrSize, MI.erase(MI.begin() + VAddr0Idx + AddrSize,

MI.begin() + VAddr0Idx + Info->VAddrDwords); MI.begin() + VAddr0Idx + Info->VAddrDwords);

} }

return MCDisassembler::Success; return MCDisassembler::Success;

} }

▲ Show 20 Lines • Show All 1,066 Lines • Show Last 20 Lines

llvm/lib/Target/AMDGPU/MIMGInstructions.td

Show First 20 Lines • Show All 229 Lines • ▼ Show 20 Lines	def MIMGInfoTable : GenericTable {
let PrimaryKeyName = "getMIMGOpcodeHelper";		let PrimaryKeyName = "getMIMGOpcodeHelper";
}		}

def getMIMGInfo : SearchIndex {		def getMIMGInfo : SearchIndex {
let Table = MIMGInfoTable;		let Table = MIMGInfoTable;
let Key = ["Opcode"];		let Key = ["Opcode"];
}		}

		class NSAHelper {
		dag AddrIns;
		string AddrAsm;
		int NSA;
		}

// This class used to use !foldl to memoize the AddrAsmNames list.		// This class used to use !foldl to memoize the AddrAsmNames list.
// It turned out that that was much slower than using !filter.		// It turned out that that was much slower than using !filter.
class MIMGNSAHelper<int num_addrs,		class MIMGNSAHelper<int num_addrs,
list<RegisterClass> addr_types=!listsplat(VGPR_32, num_addrs)> {		list<RegisterClass> addr_types=!listsplat(VGPR_32, num_addrs)>
		: NSAHelper<> {
list<string> AddrAsmNames =		list<string> AddrAsmNames =
!foreach(i, !filter(i, [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11],		!foreach(i, !filter(i, [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11],
!lt(i, num_addrs)), "vaddr" # i);		!lt(i, num_addrs)), "vaddr" # i);
dag AddrIns = !dag(ins, addr_types, AddrAsmNames);		let AddrIns = !dag(ins, addr_types, AddrAsmNames);
string AddrAsm = "[$" # !interleave(AddrAsmNames, ", $") # "]";		let AddrAsm = "[$" # !interleave(AddrAsmNames, ", $") # "]";

int NSA = !if(!le(num_addrs, 1), ?,		let NSA = !if(!le(num_addrs, 1), ?,
!if(!le(num_addrs, 5), 1,		!if(!le(num_addrs, 5), 1,
!if(!le(num_addrs, 9), 2,		!if(!le(num_addrs, 9), 2,
!if(!le(num_addrs, 13), 3, ?))));		!if(!le(num_addrs, 13), 3, ?))));
}		}

		class PartialNSAHelper<int num_addrs, int max_addr, RegisterClass LastAddrRC>
		: NSAHelper<> {

		list<RegisterClass> addr_types =
		!if(!ge(num_addrs, max_addr),
		!listconcat(!listsplat(VGPR_32, !sub(max_addr, 1)), [LastAddrRC]),
		!listsplat(VGPR_32, num_addrs));

		int VAddrCount = !if(!gt(num_addrs, max_addr), max_addr, num_addrs);
		list<string> AddrAsmNames =
		!foreach(i, !filter(i, [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11],
		!lt(i, VAddrCount)), "vaddr" # i);

		let AddrIns = !dag(ins, addr_types, AddrAsmNames);
		let AddrAsm = "[$" # !interleave(AddrAsmNames, ", $") # "]";
		let NSA = 1;
		}

// Base class of all pre-gfx10 MIMG instructions.		// Base class of all pre-gfx10 MIMG instructions.
class MIMG_gfx6789<bits<8> op, dag outs, string dns = "">		class MIMG_gfx6789<bits<8> op, dag outs, string dns = "">
: MIMG<outs, dns>, MIMGe_gfx6789<op> {		: MIMG<outs, dns>, MIMGe_gfx6789<op> {
let SubtargetPredicate = isGFX6GFX7GFX8GFX9NotGFX90A;		let SubtargetPredicate = isGFX6GFX7GFX8GFX9NotGFX90A;
let AssemblerPredicate = isGFX6GFX7GFX8GFX9NotGFX90A;		let AssemblerPredicate = isGFX6GFX7GFX8GFX9NotGFX90A;

let MIMGEncoding = MIMGEncGfx6;		let MIMGEncoding = MIMGEncGfx6;
let VAddrOperands = 1;		let VAddrOperands = 1;
▲ Show 20 Lines • Show All 54 Lines • ▼ Show 20 Lines	class MIMG_gfx11<int op, dag outs, string dns = "">

let d16 = !if(BaseOpcode.HasD16, ?, 0);		let d16 = !if(BaseOpcode.HasD16, ?, 0);
let nsa = 0;		let nsa = 0;
}		}

// Base class for all NSA MIMG instructions.		// Base class for all NSA MIMG instructions.
// Note that 1-dword addresses always use non-NSA variants.		// Note that 1-dword addresses always use non-NSA variants.
class MIMG_nsa_gfx11<int op, dag outs, int num_addrs, string dns="",		class MIMG_nsa_gfx11<int op, dag outs, int num_addrs, string dns="",
list<RegisterClass> addr_types=[]>		list<RegisterClass> addr_types=[],
		RegisterClass LastAddrRC = VGPR_32>
: MIMG<outs, dns>, MIMGe_gfx11<op> {		: MIMG<outs, dns>, MIMGe_gfx11<op> {
let SubtargetPredicate = isGFX11Plus;		let SubtargetPredicate = isGFX11Plus;
let AssemblerPredicate = isGFX11Plus;		let AssemblerPredicate = isGFX11Plus;

let MIMGEncoding = MIMGEncGfx11NSA;		let MIMGEncoding = MIMGEncGfx11NSA;
let VAddrOperands = num_addrs;		let VAddrOperands = num_addrs;

MIMGNSAHelper nsah = !if(!empty(addr_types),		NSAHelper nsah = !if(!empty(addr_types),
MIMGNSAHelper<num_addrs>,		PartialNSAHelper<num_addrs, 5, LastAddrRC>,
MIMGNSAHelper<num_addrs, addr_types>);		MIMGNSAHelper<num_addrs, addr_types>);
dag AddrIns = nsah.AddrIns;		dag AddrIns = nsah.AddrIns;
string AddrAsm = nsah.AddrAsm;		string AddrAsm = nsah.AddrAsm;

let d16 = !if(BaseOpcode.HasD16, ?, 0);		let d16 = !if(BaseOpcode.HasD16, ?, 0);
let nsa = nsah.NSA;		let nsa = nsah.NSA;
}		}

class MIMG_NoSampler_Helper <mimgopc op, string asm,		class MIMG_NoSampler_Helper <mimgopc op, string asm,
▲ Show 20 Lines • Show All 586 Lines • ▼ Show 20 Lines	let InOperandList = !con((ins AddrRC:$vaddr0, SReg_256:$srsrc, SReg_128:$ssamp,
!if(BaseOpcode.HasD16, (ins D16:$d16), (ins)));		!if(BaseOpcode.HasD16, (ins D16:$d16), (ins)));
let AsmString = opcode#" $vdata, $vaddr0, $srsrc, $ssamp$dmask$dim$unorm"		let AsmString = opcode#" $vdata, $vaddr0, $srsrc, $ssamp$dmask$dim$unorm"
#"$cpol$r128$a16$tfe$lwe"		#"$cpol$r128$a16$tfe$lwe"
#!if(BaseOpcode.HasD16, "$d16", "");		#!if(BaseOpcode.HasD16, "$d16", "");
}		}

class MIMG_Sampler_nsa_gfx11<mimgopc op, string opcode,		class MIMG_Sampler_nsa_gfx11<mimgopc op, string opcode,
RegisterClass DataRC, int num_addrs,		RegisterClass DataRC, int num_addrs,
string dns="">		RegisterClass LastVAddrSize, string dns="">
: MIMG_nsa_gfx11<op.GFX11, (outs DataRC:$vdata), num_addrs, dns> {		: MIMG_nsa_gfx11<op.GFX11, (outs DataRC:$vdata), num_addrs, dns, [],
		LastVAddrSize> {
let InOperandList = !con(AddrIns,		let InOperandList = !con(AddrIns,
(ins SReg_256:$srsrc, SReg_128:$ssamp, DMask:$dmask,		(ins SReg_256:$srsrc, SReg_128:$ssamp, DMask:$dmask,
Dim:$dim, UNorm:$unorm, CPol:$cpol,		Dim:$dim, UNorm:$unorm, CPol:$cpol,
R128A16:$r128, A16:$a16, TFE:$tfe, LWE:$lwe),		R128A16:$r128, A16:$a16, TFE:$tfe, LWE:$lwe),
!if(BaseOpcode.HasD16, (ins D16:$d16), (ins)));		!if(BaseOpcode.HasD16, (ins D16:$d16), (ins)));
let AsmString = opcode#" $vdata, "#AddrAsm#", $srsrc, $ssamp$dmask$dim$unorm"		let AsmString = opcode#" $vdata, "#AddrAsm#", $srsrc, $ssamp$dmask$dim$unorm"
#"$cpol$r128$a16$tfe$lwe"		#"$cpol$r128$a16$tfe$lwe"
#!if(BaseOpcode.HasD16, "$d16", "");		#!if(BaseOpcode.HasD16, "$d16", "");
}		}

class MIMGAddrSize<int dw, bit enable_disasm> {		class MIMGAddrSize<int dw, bit enable_disasm, int AddrDW = dw> {
int NumWords = dw;		int NumWords = dw;

RegisterClass RegClass = !if(!le(NumWords, 0), ?,		RegisterClass RegClass = !if(!le(AddrDW, 0), ?,
!if(!eq(NumWords, 1), VGPR_32,		!if(!eq(AddrDW, 1), VGPR_32,
!if(!eq(NumWords, 2), VReg_64,		!if(!eq(AddrDW, 2), VReg_64,
!if(!eq(NumWords, 3), VReg_96,		!if(!eq(AddrDW, 3), VReg_96,
!if(!eq(NumWords, 4), VReg_128,		!if(!eq(AddrDW, 4), VReg_128,
!if(!eq(NumWords, 5), VReg_160,		!if(!eq(AddrDW, 5), VReg_160,
!if(!eq(NumWords, 6), VReg_192,		!if(!eq(AddrDW, 6), VReg_192,
!if(!eq(NumWords, 7), VReg_224,		!if(!eq(AddrDW, 7), VReg_224,
!if(!le(NumWords, 8), VReg_256,		!if(!eq(AddrDW, 8), VReg_256,
!if(!le(NumWords, 9), VReg_288,		!if(!eq(AddrDW, 9), VReg_288,
!if(!le(NumWords, 10), VReg_320,		!if(!eq(AddrDW, 10), VReg_320,
!if(!le(NumWords, 11), VReg_352,		!if(!eq(AddrDW, 11), VReg_352,
!if(!le(NumWords, 12), VReg_384,		!if(!eq(AddrDW, 12), VReg_384,
!if(!le(NumWords, 16), VReg_512, ?))))))))))))));		!if(!le(AddrDW, 16), VReg_512, ?))))))))))))));

// Whether the instruction variant with this vaddr size should be enabled for		// Whether the instruction variant with this vaddr size should be enabled for
// the auto-generated disassembler.		// the auto-generated disassembler.
bit Disassemble = enable_disasm;		bit Disassemble = enable_disasm;
}		}

		// Returns the MIMGAddrSize with the size of last VAddr for PartialNSA
		class LastVAddrSize <int dw, int max_idx, bit enable_disasm>
		: MIMGAddrSize<dw, enable_disasm,
		!if(!gt(dw, max_idx), !sub(dw, max_idx), 0)>;

// Return whether x is in lst.		// Return whether x is in lst.
class isIntInList<int x, list<int> lst> {		class isIntInList<int x, list<int> lst> {
bit ret = !foldl(0, lst, lhs, y, !or(lhs, !eq(x, y)));		bit ret = !foldl(0, lst, lhs, y, !or(lhs, !eq(x, y)));
}		}

// Return whether a value inside the range [min, max] (endpoints inclusive)		// Return whether a value inside the range [min, max] (endpoints inclusive)
// is in the given list.		// is in the given list.
class isRangeInList<int min, int max, list<int> lst> {		class isRangeInList<int min, int max, list<int> lst> {
bit ret = !foldl(0, lst, lhs, y, !or(lhs, !and(!le(min, y), !le(y, max))));		bit ret = !foldl(0, lst, lhs, y, !or(lhs, !and(!le(min, y), !le(y, max))));
}		}

class MIMGAddrSizes_dw_range<list<int> range> {		class MIMGAddrSizes_dw_range<list<int> range> {
int Min = !head(range);		int Min = !head(range);
int Max = !if(!empty(!tail(range)), Min, !head(!tail(range)));		int Max = !if(!empty(!tail(range)), Min, !head(!tail(range)));
}		}

class MIMG_Sampler_AddrSizes<AMDGPUSampleVariant sample, bit isG16> {		class MIMG_Sampler_AddrSizes<AMDGPUSampleVariant sample, bit isG16,
		int nsa_max_addr = 5> {
// List of all possible numbers of address words, taking all combinations of		// List of all possible numbers of address words, taking all combinations of
// A16 and image dimension into account (note: no MSAA, since this is for		// A16 and image dimension into account (note: no MSAA, since this is for
// sample/gather ops).		// sample/gather ops).
list<int> AllNumAddrWords =		list<int> AllNumAddrWords =
!foreach(dw, !if(sample.Gradients,		!foreach(dw, !if(sample.Gradients,
!if(isG16,		!if(isG16,
!if(!eq(sample.LodOrClamp, ""),		!if(!eq(sample.LodOrClamp, ""),
[2, 3, 4, 5, 6, 7],		[2, 3, 4, 5, 6, 7],
Show All 29 Lines	class MIMG_Sampler_AddrSizes<AMDGPUSampleVariant sample, bit isG16,
// the exact variant based on the sample variant and the image dimension.		// the exact variant based on the sample variant and the image dimension.
list<MIMGAddrSize> NSAInstrs =		list<MIMGAddrSize> NSAInstrs =
!foldl([]<MIMGAddrSize>, [[12, 11, 10], [9, 8, 7, 6], [5, 4, 3, 2]], prev, nsa_group,		!foldl([]<MIMGAddrSize>, [[12, 11, 10], [9, 8, 7, 6], [5, 4, 3, 2]], prev, nsa_group,
!listconcat(prev,		!listconcat(prev,
!foldl([]<MIMGAddrSize>, nsa_group, lhs, dw,		!foldl([]<MIMGAddrSize>, nsa_group, lhs, dw,
!if(isIntInList<dw, AllNumAddrWords>.ret,		!if(isIntInList<dw, AllNumAddrWords>.ret,
!listconcat(lhs, [MIMGAddrSize<dw, !empty(lhs)>]),		!listconcat(lhs, [MIMGAddrSize<dw, !empty(lhs)>]),
lhs))));		lhs))));

		// In NSA format if there is a requirement for more VGPRs than the format
		foadUnsubmitted Done Reply Inline Actions "... more VGPRs than ..." foad: "... more VGPRs than ..."
		// supports, then the rest are sequential after the last one. Generate
		// machine instructions for all possible number of words. The disassembler
		// defaults to the largest number of arguments but no larger than max nsa
		// size. List is generated with the register class needed for last vaddr since
		// it is the only one that could have a register other than VGPR32.
		int EnableDisasmNum = !foldl(!head(AllNumAddrWords), !tail(AllNumAddrWords),
		acc, var, !if(!le(var, nsa_max_addr), var, acc));
		list<LastVAddrSize> PartialNSAInstrs =
		!foldl([]<LastVAddrSize>, [12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2], lhs, dw,
		!if(isIntInList<dw, AllNumAddrWords>.ret,
		!listconcat(lhs, [LastVAddrSize<dw, !sub(nsa_max_addr, 1),
		!eq(dw, EnableDisasmNum)>]),
		lhs));
}		}

multiclass MIMG_Sampler_Src_Helper <mimgopc op, string asm,		multiclass MIMG_Sampler_Src_Helper <mimgopc op, string asm,
AMDGPUSampleVariant sample, RegisterClass dst_rc,		AMDGPUSampleVariant sample, RegisterClass dst_rc,
bit enableDisasm = 0,		bit enableDisasm = 0,
bit ExtendedImageInst = 1, bit isG16 = 0> {		bit ExtendedImageInst = 1, bit isG16 = 0> {
foreach addr = MIMG_Sampler_AddrSizes<sample, isG16>.MachineInstrs in {		foreach addr = MIMG_Sampler_AddrSizes<sample, isG16>.MachineInstrs in {
let VAddrDwords = addr.NumWords in {		let VAddrDwords = addr.NumWords in {
Show All 19 Lines	multiclass MIMG_Sampler_Src_Helper <mimgopc op, string asm,

foreach addr = MIMG_Sampler_AddrSizes<sample, isG16>.NSAInstrs in {		foreach addr = MIMG_Sampler_AddrSizes<sample, isG16>.NSAInstrs in {
let VAddrDwords = addr.NumWords in {		let VAddrDwords = addr.NumWords in {
if op.HAS_GFX10M then {		if op.HAS_GFX10M then {
def _V # addr.NumWords # _nsa_gfx10		def _V # addr.NumWords # _nsa_gfx10
: MIMG_Sampler_nsa_gfx10<op, asm, dst_rc, addr.NumWords,		: MIMG_Sampler_nsa_gfx10<op, asm, dst_rc, addr.NumWords,
!if(!and(enableDisasm, addr.Disassemble), "AMDGPU", "")>;		!if(!and(enableDisasm, addr.Disassemble), "AMDGPU", "")>;
}		}
if !and(op.HAS_GFX11, !le(addr.NumWords, 5)) then {		}
		}

		foreach addr = MIMG_Sampler_AddrSizes<sample, isG16, 5/*MaxNSASize*/>.PartialNSAInstrs in {
		let VAddrDwords = addr.NumWords in {
		if op.HAS_GFX11 then {
def _V # addr.NumWords # _nsa_gfx11		def _V # addr.NumWords # _nsa_gfx11
: MIMG_Sampler_nsa_gfx11<op, asm, dst_rc, addr.NumWords,		: MIMG_Sampler_nsa_gfx11<op, asm, dst_rc, addr.NumWords, addr.RegClass,
!if(!and(enableDisasm, addr.Disassemble), "AMDGPU", "")>;		!if(!and(enableDisasm, addr.Disassemble), "AMDGPU", "")>;
}		}
}		}
}		}
}		}

class MIMG_Sampler_BaseOpcode<AMDGPUSampleVariant sample>		class MIMG_Sampler_BaseOpcode<AMDGPUSampleVariant sample>
: MIMGBaseOpcode {		: MIMGBaseOpcode {
▲ Show 20 Lines • Show All 464 Lines • Show Last 20 Lines

llvm/test/MC/AMDGPU/gfx11_asm_mimg_features.s

	Show First 20 Lines • Show All 211 Lines • ▼ Show 20 Lines
	// GFX11: image_sample_l_o v[64:66], [v32, v16, v0, v2, v1], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x07,0x9c,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x01]			// GFX11: image_sample_l_o v[64:66], [v32, v16, v0, v2, v1], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x07,0x9c,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x01]

	image_sample_lz_o v[64:66], [v32, v16, v0, v2], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D			image_sample_lz_o v[64:66], [v32, v16, v0, v2], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D
	// GFX11: image_sample_lz_o v[64:66], [v32, v16, v0, v2], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x07,0xa4,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x00]			// GFX11: image_sample_lz_o v[64:66], [v32, v16, v0, v2], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x07,0xa4,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x00]

	image_sample_c_lz_o v[64:66], [v32, v0, v16], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_1D			image_sample_c_lz_o v[64:66], [v32, v0, v16], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_1D
	// GFX11: image_sample_c_lz_o v[64:66], [v32, v0, v16], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_1D ; encoding: [0x01,0x07,0xb8,0xf0,0x20,0x40,0x01,0x64,0x00,0x10,0x00,0x00]			// GFX11: image_sample_c_lz_o v[64:66], [v32, v0, v16], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_1D ; encoding: [0x01,0x07,0xb8,0xf0,0x20,0x40,0x01,0x64,0x00,0x10,0x00,0x00]

				image_sample_d v64, [v32, v16, v8, v0, v[36:37]], s[4:11], s[4:7] dmask:0x8 dim:SQ_RSRC_IMG_2D
				// GFX11: image_sample_d v64, [v32, v16, v8, v0, v[36:37]], s[4:11], s[4:7] dmask:0x8 dim:SQ_RSRC_IMG_2D ; encoding: [0x05,0x08,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_d v[64:65], [v32, v16, v8, v0, v[36:38]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE
				// GFX11: image_sample_d v[64:65], [v32, v16, v8, v0, v[36:38]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_d_o v[64:65], [v32, v16, v8, v0, v[36:39]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE
				// GFX11: image_sample_d_o v[64:65], [v32, v16, v8, v0, v[36:39]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0x98,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_d v[64:65], [v32, v16, v8, v0, v[36:40]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D
				// GFX11: image_sample_d v[64:65], [v32, v16, v8, v0, v[36:40]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_d_o v[64:65], [v32, v16, v8, v0, v[36:41]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D
				// GFX11: image_sample_d_o v[64:65], [v32, v16, v8, v0, v[36:41]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0x98,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_c_d_o v[64:65], [v32, v16, v8, v0, v[36:42]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D
				// GFX11: image_sample_c_d_o v[64:65], [v32, v16, v8, v0, v[36:42]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0xac,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_c_d_cl_o v[64:65], [v32, v16, v8, v0, v[36:43]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D
				// GFX11: image_sample_c_d_cl_o v[64:65], [v32, v16, v8, v0, v[36:43]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0x28,0xf1,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_d_o_g16 v[64:66], [v32, v16, v8, v0, v36], s[4:11], s[4:7] dmask:0xb dim:SQ_RSRC_IMG_1D_ARRAY
				// GFX11: image_sample_d_o_g16 v[64:66], [v32, v16, v8, v0, v36], s[4:11], s[4:7] dmask:0xb dim:SQ_RSRC_IMG_1D_ARRAY ; encoding: [0x11,0x0b,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:37]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE
				// GFX11: image_sample_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:37]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_c_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:38]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE
				// GFX11: image_sample_c_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:38]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0xf0,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:39]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D
				// GFX11: image_sample_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:39]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

				image_sample_c_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:40]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D
				// GFX11: image_sample_c_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:40]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0xf0,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]

	image_gather4 v[64:67], v32, s[4:11], s[100:103] dmask:0x1 dim:SQ_RSRC_IMG_1D			image_gather4 v[64:67], v32, s[4:11], s[100:103] dmask:0x1 dim:SQ_RSRC_IMG_1D
	// GFX11: image_gather4 v[64:67], v32, s[4:11], s[100:103] dmask:0x1 dim:SQ_RSRC_IMG_1D ; encoding: [0x00,0x01,0xbc,0xf0,0x20,0x40,0x01,0x64]			// GFX11: image_gather4 v[64:67], v32, s[4:11], s[100:103] dmask:0x1 dim:SQ_RSRC_IMG_1D ; encoding: [0x00,0x01,0xbc,0xf0,0x20,0x40,0x01,0x64]

	image_gather4_cl v[64:67], v[32:35], s[4:11], s[100:103] dmask:0x2 dim:SQ_RSRC_IMG_CUBE			image_gather4_cl v[64:67], v[32:35], s[4:11], s[100:103] dmask:0x2 dim:SQ_RSRC_IMG_CUBE
	// GFX11: image_gather4_cl v[64:67], v[32:35], s[4:11], s[100:103] dmask:0x2 dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0c,0x02,0x80,0xf1,0x20,0x40,0x01,0x64]			// GFX11: image_gather4_cl v[64:67], v[32:35], s[4:11], s[100:103] dmask:0x2 dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0c,0x02,0x80,0xf1,0x20,0x40,0x01,0x64]

	image_gather4_l v[64:67], [v32, v0, v4], s[4:11], s[100:103] dmask:0x4 dim:SQ_RSRC_IMG_1D_ARRAY			image_gather4_l v[64:67], [v32, v0, v4], s[4:11], s[100:103] dmask:0x4 dim:SQ_RSRC_IMG_1D_ARRAY
	// GFX11: image_gather4_l v[64:67], [v32, v0, v4], s[4:11], s[100:103] dmask:0x4 dim:SQ_RSRC_IMG_1D_ARRAY ; encoding: [0x11,0x04,0xc0,0xf0,0x20,0x40,0x01,0x64,0x00,0x04,0x00,0x00]			// GFX11: image_gather4_l v[64:67], [v32, v0, v4], s[4:11], s[100:103] dmask:0x4 dim:SQ_RSRC_IMG_1D_ARRAY ; encoding: [0x11,0x04,0xc0,0xf0,0x20,0x40,0x01,0x64,0x00,0x04,0x00,0x00]
	▲ Show 20 Lines • Show All 84 Lines • Show Last 20 Lines

llvm/test/MC/Disassembler/AMDGPU/gfx11_dasm_mimg_features.txt

	Show First 20 Lines • Show All 210 Lines • ▼ Show 20 Lines
	0x09,0x07,0x9c,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x01			0x09,0x07,0x9c,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x01

	# GFX11: image_sample_lz_o v[64:66], [v32, v16, v0, v2], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x07,0xa4,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x00]			# GFX11: image_sample_lz_o v[64:66], [v32, v16, v0, v2], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x07,0xa4,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x00]
	0x09,0x07,0xa4,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x00			0x09,0x07,0xa4,0xf0,0x20,0x40,0x01,0x64,0x10,0x00,0x02,0x00

	# GFX11: image_sample_c_lz_o v[64:66], [v32, v0, v16], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_1D ; encoding: [0x01,0x07,0xb8,0xf0,0x20,0x40,0x01,0x64,0x00,0x10,0x00,0x00]			# GFX11: image_sample_c_lz_o v[64:66], [v32, v0, v16], s[4:11], s[100:103] dmask:0x7 dim:SQ_RSRC_IMG_1D ; encoding: [0x01,0x07,0xb8,0xf0,0x20,0x40,0x01,0x64,0x00,0x10,0x00,0x00]
	0x01,0x07,0xb8,0xf0,0x20,0x40,0x01,0x64,0x00,0x10,0x00,0x00			0x01,0x07,0xb8,0xf0,0x20,0x40,0x01,0x64,0x00,0x10,0x00,0x00

				# GFX11: image_sample_d v64, [v32, v16, v8, v0, v[36:37]], s[4:11], s[4:7] dmask:0x8 dim:SQ_RSRC_IMG_2D ; encoding: [0x05,0x08,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x05,0x08,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_d v[64:65], [v32, v16, v8, v0, v[36:38]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x0d,0x0c,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_d_o v[64:65], [v32, v16, v8, v0, v[36:39]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0x98,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x0d,0x0c,0x98,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_d v[64:65], [v32, v16, v8, v0, v[36:40]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x09,0x03,0x70,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_d_o v[64:65], [v32, v16, v8, v0, v[36:41]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0x98,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x09,0x03,0x98,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_c_d_o v[64:65], [v32, v16, v8, v0, v[36:42]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0xac,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x09,0x03,0xac,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_c_d_cl_o v[64:65], [v32, v16, v8, v0, v[36:43]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0x28,0xf1,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x09,0x03,0x28,0xf1,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_d_o_g16 v[64:66], [v32, v16, v8, v0, v36], s[4:11], s[4:7] dmask:0xb dim:SQ_RSRC_IMG_1D_ARRAY ; encoding: [0x11,0x0b,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x11,0x0b,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:37]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x0d,0x0c,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_c_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:38]], s[4:11], s[4:7] dmask:0xc dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0d,0x0c,0xf0,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x0d,0x0c,0xf0,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:39]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x09,0x03,0xec,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

				# GFX11: image_sample_c_d_o_g16 v[64:65], [v32, v16, v8, v0, v[36:40]], s[4:11], s[4:7] dmask:0x3 dim:SQ_RSRC_IMG_3D ; encoding: [0x09,0x03,0xf0,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24]
				0x09,0x03,0xf0,0xf0,0x20,0x40,0x01,0x04,0x10,0x08,0x00,0x24

	# GFX11: image_gather4 v[64:67], v32, s[4:11], s[100:103] dmask:0x1 dim:SQ_RSRC_IMG_1D ; encoding: [0x00,0x01,0xbc,0xf0,0x20,0x40,0x01,0x64]			# GFX11: image_gather4 v[64:67], v32, s[4:11], s[100:103] dmask:0x1 dim:SQ_RSRC_IMG_1D ; encoding: [0x00,0x01,0xbc,0xf0,0x20,0x40,0x01,0x64]
	0x00,0x01,0xbc,0xf0,0x20,0x40,0x01,0x64			0x00,0x01,0xbc,0xf0,0x20,0x40,0x01,0x64

	# GFX11: image_gather4_cl v[64:67], v[32:35], s[4:11], s[100:103] dmask:0x2 dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0c,0x02,0x80,0xf1,0x20,0x40,0x01,0x64]			# GFX11: image_gather4_cl v[64:67], v[32:35], s[4:11], s[100:103] dmask:0x2 dim:SQ_RSRC_IMG_CUBE ; encoding: [0x0c,0x02,0x80,0xf1,0x20,0x40,0x01,0x64]
	0x0c,0x02,0x80,0xf1,0x20,0x40,0x01,0x64			0x0c,0x02,0x80,0xf1,0x20,0x40,0x01,0x64

	# GFX11: image_gather4_l v[64:67], [v32, v0, v4], s[4:11], s[100:103] dmask:0x4 dim:SQ_RSRC_IMG_1D_ARRAY ; encoding: [0x11,0x04,0xc0,0xf0,0x20,0x40,0x01,0x64,0x00,0x04,0x00,0x00]			# GFX11: image_gather4_l v[64:67], [v32, v0, v4], s[4:11], s[100:103] dmask:0x4 dim:SQ_RSRC_IMG_1D_ARRAY ; encoding: [0x11,0x04,0xc0,0xf0,0x20,0x40,0x01,0x64,0x00,0x04,0x00,0x00]
	0x11,0x04,0xc0,0xf0,0x20,0x40,0x01,0x64,0x00,0x04,0x00,0x00			0x11,0x04,0xc0,0xf0,0x20,0x40,0x01,0x64,0x00,0x04,0x00,0x00
	▲ Show 20 Lines • Show All 81 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU][MC][GFX11] Add partial NSA format for image sample instructions
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 497384

llvm/lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp

llvm/lib/Target/AMDGPU/Disassembler/AMDGPUDisassembler.cpp

llvm/lib/Target/AMDGPU/MIMGInstructions.td

llvm/test/MC/AMDGPU/gfx11_asm_mimg_features.s

llvm/test/MC/Disassembler/AMDGPU/gfx11_dasm_mimg_features.txt

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU][MC][GFX11] Add partial NSA format for image sample instructions
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 497384

llvm/lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp

llvm/lib/Target/AMDGPU/Disassembler/AMDGPUDisassembler.cpp

llvm/lib/Target/AMDGPU/MIMGInstructions.td

llvm/test/MC/AMDGPU/gfx11_asm_mimg_features.s

llvm/test/MC/Disassembler/AMDGPU/gfx11_dasm_mimg_features.txt

[AMDGPU][MC][GFX11] Add partial NSA format for image sample instructions
ClosedPublic