This is an archive of the discontinued LLVM Phabricator instance.

Differential D119549

[SDAG] clean up scalarizing load transform
ClosedPublic

Authored by spatel on Feb 11 2022, 7:55 AM.

Download Raw Diff

Details

Reviewers

lebedev.ri
efriedma
craig.topper
RKSimon

Commits

rG96b7e0b5a0c6: [SDAG] clean up scalarizing load transform

Summary

I have not found a way to expose a difference for this patch in a test because it only triggers for a one-use load, but this is the code that was adapted into D118376 and caused miscompiles. The new code pattern is the same as what we do in narrowExtractedVectorLoad() (reduces load width for a subvector extract).

This removes seemingly unnecessary manual worklist management and fixes the chain updating via:

/// Give a newly created memory operation the same chain position as an
/// existing one, so users of the old output chain are ordered after both.
///
/// \param OldChain      The output chain value of the memory operation that is
///                      being replaced.
/// \param NewMemOpChain The output chain value of the new memory operation;
///                      asserted to belong to a MemSDNode and to have type
///                      MVT::Other.
/// \returns NewMemOpChain unchanged when it is the same value as OldChain or
///          when OldChain has no uses; otherwise a new TokenFactor joining
///          OldChain and NewMemOpChain, after all uses of OldChain have been
///          redirected to that TokenFactor.
SDValue SelectionDAG::makeEquivalentMemoryOrdering(SDValue OldChain,
                                                   SDValue NewMemOpChain) {
  assert(isa<MemSDNode>(NewMemOpChain) && "Expected a memop node");
  assert(NewMemOpChain.getValueType() == MVT::Other && "Expected a token VT");
  // The new memory operation must have the same position as the old load in
  // terms of memory dependency. Create a TokenFactor for the old load and new
  // memory operation and update uses of the old load's output chain to use that
  // TokenFactor.
  // Nothing to merge: either both chains are the same value, or nobody depends
  // on the old chain, so the new chain can be used directly.
  if (OldChain == NewMemOpChain || OldChain.use_empty())
    return NewMemOpChain;

  SDValue TokenFactor = getNode(ISD::TokenFactor, SDLoc(OldChain), MVT::Other,
                                OldChain, NewMemOpChain);
  ReplaceAllUsesOfValueWith(OldChain, TokenFactor);
  // NOTE(review): the replacement above presumably also rewrites the
  // TokenFactor's own OldChain operand (it is itself a user of OldChain), so
  // its operands are explicitly set back to (OldChain, NewMemOpChain) here.
  // Keep these two calls in this order.
  UpdateNodeOperands(TokenFactor.getNode(), OldChain, NewMemOpChain);
  return TokenFactor;
}

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

spatel created this revision. · Feb 11 2022, 7:55 AM

Herald added subscribers: ecnelises, hiraditya, mcrosier. · View Herald Transcript · Feb 11 2022, 7:55 AM

spatel requested review of this revision. · Feb 11 2022, 7:55 AM

Herald added a project: Restricted Project. · View Herald Transcript · Feb 11 2022, 7:55 AM

Herald added a subscriber: llvm-commits. · View Herald Transcript

Harbormaster completed remote builds in B148986: Diff 407880. · Feb 11 2022, 8:52 AM

spatel mentioned this in D118376: [x86] try harder to scalarize a vector load with extracted integer op uses. · Feb 11 2022, 9:36 AM

Sure, LGTM

This revision is now accepted and ready to land. · Feb 11 2022, 10:31 AM

This revision was landed with ongoing or failed builds. · Feb 12 2022, 8:45 AM

Closed by commit rG96b7e0b5a0c6: [SDAG] clean up scalarizing load transform (authored by spatel). · Explain Why

This revision was automatically updated to reflect the committed changes.

spatel added a commit: rG96b7e0b5a0c6: [SDAG] clean up scalarizing load transform.

Revision Contents

Path

Size

llvm/

lib/

CodeGen/

SelectionDAG/

DAGCombiner.cpp

25 lines

Diff 408185

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 19,189 Lines • ▼ Show 20 Lines	if (!TLI.allowsMemoryAccess(*DAG.getContext(), DAG.getDataLayout(), VecEltVT,
OriginalLoad->getMemOperand()->getFlags(),		OriginalLoad->getMemOperand()->getFlags(),
&IsFast) \|\|		&IsFast) \|\|
!IsFast)		!IsFast)
return SDValue();		return SDValue();

SDValue NewPtr = TLI.getVectorElementPointer(DAG, OriginalLoad->getBasePtr(),		SDValue NewPtr = TLI.getVectorElementPointer(DAG, OriginalLoad->getBasePtr(),
InVecVT, EltNo);		InVecVT, EltNo);

// The replacement we need to do here is a little tricky: we need to		// We are replacing a vector load with a scalar load. The new load must have
// replace an extractelement of a load with a load.		// identical memory op ordering to the original.
// Use ReplaceAllUsesOfValuesWith to do the replacement.
// Note that this replacement assumes that the extractvalue is the only
// use of the load; that's okay because we don't want to perform this
// transformation in other cases anyway.
SDValue Load;		SDValue Load;
SDValue Chain;
if (ResultVT.bitsGT(VecEltVT)) {		if (ResultVT.bitsGT(VecEltVT)) {
// If the result type of vextract is wider than the load, then issue an		// If the result type of vextract is wider than the load, then issue an
// extending load instead.		// extending load instead.
ISD::LoadExtType ExtType =		ISD::LoadExtType ExtType =
TLI.isLoadExtLegal(ISD::ZEXTLOAD, ResultVT, VecEltVT) ? ISD::ZEXTLOAD		TLI.isLoadExtLegal(ISD::ZEXTLOAD, ResultVT, VecEltVT) ? ISD::ZEXTLOAD
: ISD::EXTLOAD;		: ISD::EXTLOAD;
Load = DAG.getExtLoad(ExtType, DL, ResultVT, OriginalLoad->getChain(),		Load = DAG.getExtLoad(ExtType, DL, ResultVT, OriginalLoad->getChain(),
NewPtr, MPI, VecEltVT, Alignment,		NewPtr, MPI, VecEltVT, Alignment,
OriginalLoad->getMemOperand()->getFlags(),		OriginalLoad->getMemOperand()->getFlags(),
OriginalLoad->getAAInfo());		OriginalLoad->getAAInfo());
Chain = Load.getValue(1);		DAG.makeEquivalentMemoryOrdering(OriginalLoad, Load);
} else {		} else {
		// The result type is narrower or the same width as the vector element
Load = DAG.getLoad(VecEltVT, DL, OriginalLoad->getChain(), NewPtr, MPI,		Load = DAG.getLoad(VecEltVT, DL, OriginalLoad->getChain(), NewPtr, MPI,
Alignment, OriginalLoad->getMemOperand()->getFlags(),		Alignment, OriginalLoad->getMemOperand()->getFlags(),
OriginalLoad->getAAInfo());		OriginalLoad->getAAInfo());
Chain = Load.getValue(1);		DAG.makeEquivalentMemoryOrdering(OriginalLoad, Load);
if (ResultVT.bitsLT(VecEltVT))		if (ResultVT.bitsLT(VecEltVT))
Load = DAG.getNode(ISD::TRUNCATE, DL, ResultVT, Load);		Load = DAG.getNode(ISD::TRUNCATE, DL, ResultVT, Load);
else		else
Load = DAG.getBitcast(ResultVT, Load);		Load = DAG.getBitcast(ResultVT, Load);
}		}
WorklistRemover DeadNodes(*this);
SDValue From[] = {SDValue(EVE, 0), SDValue(OriginalLoad, 1)};
SDValue To[] = {Load, Chain};
DAG.ReplaceAllUsesOfValuesWith(From, To, 2);
// Make sure to revisit this node to clean it up; it will usually be dead.
AddToWorklist(EVE);
// Since we're explicitly calling ReplaceAllUses, add the new node to the
// worklist explicitly as well.
AddToWorklistWithUsers(Load.getNode());
++OpsNarrowed;		++OpsNarrowed;
return SDValue(EVE, 0);		return Load;
}		}

/// Transform a vector binary operation into a scalar binary operation by moving		/// Transform a vector binary operation into a scalar binary operation by moving
/// the math/logic after an extract element of a vector.		/// the math/logic after an extract element of a vector.
static SDValue scalarizeExtractedBinop(SDNode *ExtElt, SelectionDAG &DAG,		static SDValue scalarizeExtractedBinop(SDNode *ExtElt, SelectionDAG &DAG,
bool LegalOperations) {		bool LegalOperations) {
const TargetLowering &TLI = DAG.getTargetLoweringInfo();		const TargetLowering &TLI = DAG.getTargetLoweringInfo();
SDValue Vec = ExtElt->getOperand(0);		SDValue Vec = ExtElt->getOperand(0);
▲ Show 20 Lines • Show All 5,090 Lines • Show Last 20 Lines