This is an archive of the discontinued LLVM Phabricator instance.

AMDGPU: Process SDWA block at a time
ClosedPublic

Authored by arsenm on Feb 8 2018, 12:21 PM.

Download Raw Diff

Details

Reviewers

rampitec
kzhuravl
cfang

Summary

Right now the pass loops over the entire function every time there
is a change, which is not very efficient. There's no practical
reason to track matches at function scope, since the code motion optimization
passes should be sinking instructions with single uses, and
the pass currently will not fold operands that have multiple uses.

Diff Detail

Event Timeline

arsenm created this revision. Feb 8 2018, 12:21 PM

Herald added subscribers: t-tye, tpr, dstuttard and 3 others. · View Herald Transcript · Feb 8 2018, 12:21 PM

I agree theoretically. Anyway, are there any regressions?

In D43085#1002316, @rampitec wrote:

I agree theoretically. Anyway, are there any regressions?

None of the tests regressed. I tried a few small samples with multiple blocks, and they all sank and were handled by the pass.

LGTM

This revision is now accepted and ready to land. Feb 8 2018, 12:52 PM

r324667

Revision Contents

Path

Size

lib/

Target/

AMDGPU/

SIPeepholeSDWA.cpp

63 lines

Diff 133468

lib/Target/AMDGPU/SIPeepholeSDWA.cpp

Show First 20 Lines • Show All 80 Lines • ▼ Show 20 Lines
public:		public:
static char ID;		static char ID;

SIPeepholeSDWA() : MachineFunctionPass(ID) {		SIPeepholeSDWA() : MachineFunctionPass(ID) {
initializeSIPeepholeSDWAPass(*PassRegistry::getPassRegistry());		initializeSIPeepholeSDWAPass(*PassRegistry::getPassRegistry());
}		}

bool runOnMachineFunction(MachineFunction &MF) override;		bool runOnMachineFunction(MachineFunction &MF) override;
void matchSDWAOperands(MachineFunction &MF);		void matchSDWAOperands(MachineBasicBlock &MF);
std::unique_ptr<SDWAOperand> matchSDWAOperand(MachineInstr &MI);		std::unique_ptr<SDWAOperand> matchSDWAOperand(MachineInstr &MI);
bool isConvertibleToSDWA(const MachineInstr &MI, const SISubtarget &ST) const;		bool isConvertibleToSDWA(const MachineInstr &MI, const SISubtarget &ST) const;
bool convertToSDWA(MachineInstr &MI, const SDWAOperandsVector &SDWAOperands);		bool convertToSDWA(MachineInstr &MI, const SDWAOperandsVector &SDWAOperands);
void legalizeScalarOperands(MachineInstr &MI, const SISubtarget &ST) const;		void legalizeScalarOperands(MachineInstr &MI, const SISubtarget &ST) const;

StringRef getPassName() const override { return "SI Peephole SDWA"; }		StringRef getPassName() const override { return "SI Peephole SDWA"; }

void getAnalysisUsage(AnalysisUsage &AU) const override {		void getAnalysisUsage(AnalysisUsage &AU) const override {
▲ Show 20 Lines • Show All 701 Lines • ▼ Show 20 Lines	return make_unique<SDWADstPreserveOperand>(
OrDst, OrSDWADef, OrOtherDef, DstSel);		OrDst, OrSDWADef, OrOtherDef, DstSel);

}		}
}		}

return std::unique_ptr<SDWAOperand>(nullptr);		return std::unique_ptr<SDWAOperand>(nullptr);
}		}

void SIPeepholeSDWA::matchSDWAOperands(MachineFunction &MF) {		void SIPeepholeSDWA::matchSDWAOperands(MachineBasicBlock &MBB) {
for (MachineBasicBlock &MBB : MF) {
for (MachineInstr &MI : MBB) {		for (MachineInstr &MI : MBB) {
if (auto Operand = matchSDWAOperand(MI)) {		if (auto Operand = matchSDWAOperand(MI)) {
DEBUG(dbgs() << "Match: " << MI << "To: " << *Operand << '\n');		DEBUG(dbgs() << "Match: " << MI << "To: " << *Operand << '\n');
SDWAOperands[&MI] = std::move(Operand);		SDWAOperands[&MI] = std::move(Operand);
++NumSDWAPatternsFound;		++NumSDWAPatternsFound;
}		}
}		}
}		}
}

bool SIPeepholeSDWA::isConvertibleToSDWA(const MachineInstr &MI,		bool SIPeepholeSDWA::isConvertibleToSDWA(const MachineInstr &MI,
const SISubtarget &ST) const {		const SISubtarget &ST) const {
// Check if this is already an SDWA instruction		// Check if this is already an SDWA instruction
unsigned Opc = MI.getOpcode();		unsigned Opc = MI.getOpcode();
if (TII->isSDWA(Opc))		if (TII->isSDWA(Opc))
return true;		return true;

▲ Show 20 Lines • Show All 228 Lines • ▼ Show 20 Lines	bool SIPeepholeSDWA::runOnMachineFunction(MachineFunction &MF) {
if (!ST.hasSDWA() \|\| skipFunction(MF.getFunction()))		if (!ST.hasSDWA() \|\| skipFunction(MF.getFunction()))
return false;		return false;

MRI = &MF.getRegInfo();		MRI = &MF.getRegInfo();
TRI = ST.getRegisterInfo();		TRI = ST.getRegisterInfo();
TII = ST.getInstrInfo();		TII = ST.getInstrInfo();

// Find all SDWA operands in MF.		// Find all SDWA operands in MF.
bool Changed = false;
bool Ret = false;		bool Ret = false;
		for (MachineBasicBlock &MBB : MF) {
		bool Changed = false;
do {		do {
matchSDWAOperands(MF);		matchSDWAOperands(MBB);

for (const auto &OperandPair : SDWAOperands) {		for (const auto &OperandPair : SDWAOperands) {
const auto &Operand = OperandPair.second;		const auto &Operand = OperandPair.second;
MachineInstr *PotentialMI = Operand->potentialToConvert(TII);		MachineInstr *PotentialMI = Operand->potentialToConvert(TII);
if (PotentialMI && isConvertibleToSDWA(*PotentialMI, ST)) {		if (PotentialMI && isConvertibleToSDWA(*PotentialMI, ST)) {
PotentialMatches[PotentialMI].push_back(Operand.get());		PotentialMatches[PotentialMI].push_back(Operand.get());
}		}
}		}

for (auto &PotentialPair : PotentialMatches) {		for (auto &PotentialPair : PotentialMatches) {
MachineInstr &PotentialMI = *PotentialPair.first;		MachineInstr &PotentialMI = *PotentialPair.first;
convertToSDWA(PotentialMI, PotentialPair.second);		convertToSDWA(PotentialMI, PotentialPair.second);
}		}

PotentialMatches.clear();		PotentialMatches.clear();
SDWAOperands.clear();		SDWAOperands.clear();

Changed = !ConvertedInstructions.empty();		Changed = !ConvertedInstructions.empty();

if (Changed)		if (Changed)
Ret = true;		Ret = true;

while (!ConvertedInstructions.empty())		while (!ConvertedInstructions.empty())
legalizeScalarOperands(*ConvertedInstructions.pop_back_val(), ST);		legalizeScalarOperands(*ConvertedInstructions.pop_back_val(), ST);
} while (Changed);		} while (Changed);
		}

return Ret;		return Ret;
}		}