Diff 488130

llvm/include/llvm/Analysis/CFGPrinter.h

Show All 20 Lines
#include "llvm/Analysis/BlockFrequencyInfo.h"		#include "llvm/Analysis/BlockFrequencyInfo.h"
#include "llvm/Analysis/BranchProbabilityInfo.h"		#include "llvm/Analysis/BranchProbabilityInfo.h"
#include "llvm/Analysis/HeatUtils.h"		#include "llvm/Analysis/HeatUtils.h"
#include "llvm/IR/CFG.h"		#include "llvm/IR/CFG.h"
#include "llvm/IR/Constants.h"		#include "llvm/IR/Constants.h"
#include "llvm/IR/Function.h"		#include "llvm/IR/Function.h"
#include "llvm/IR/Instructions.h"		#include "llvm/IR/Instructions.h"
#include "llvm/IR/PassManager.h"		#include "llvm/IR/PassManager.h"
		#include "llvm/IR/ProfDataUtils.h"
#include "llvm/Support/DOTGraphTraits.h"		#include "llvm/Support/DOTGraphTraits.h"
#include "llvm/Support/FormatVariadic.h"		#include "llvm/Support/FormatVariadic.h"

namespace llvm {		namespace llvm {
template <class GraphType> struct GraphTraits;		template <class GraphType> struct GraphTraits;
class CFGViewerPass : public PassInfoMixin<CFGViewerPass> {		class CFGViewerPass : public PassInfoMixin<CFGViewerPass> {
public:		public:
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);		PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM);
▲ Show 20 Lines • Show All 234 Lines • ▼ Show 20 Lines	std::string getEdgeAttributes(const BasicBlock *Node, const_succ_iterator I,
// profile count (due to scaling).		// profile count (due to scaling).

uint64_t Freq = CFGInfo->getFreq(Node);		uint64_t Freq = CFGInfo->getFreq(Node);
std::string Attrs = formatv("label=\"W:{0}\" penwidth={1}",		std::string Attrs = formatv("label=\"W:{0}\" penwidth={1}",
(uint64_t)(Freq * WeightPercent), Width);		(uint64_t)(Freq * WeightPercent), Width);
if (Attrs.size())		if (Attrs.size())
return Attrs;		return Attrs;

MDNode *WeightsNode = TI->getMetadata(LLVMContext::MD_prof);		MDNode *WeightsNode = getBranchWeightMDNode(*TI);
if (!WeightsNode)		if (!WeightsNode)
return "";		return "";

MDString *MDName = cast<MDString>(WeightsNode->getOperand(0));
if (MDName->getString() != "branch_weights")
return "";

OpNo = I.getSuccessorIndex() + 1;		OpNo = I.getSuccessorIndex() + 1;
if (OpNo >= WeightsNode->getNumOperands())		if (OpNo >= WeightsNode->getNumOperands())
return "";		return "";
ConstantInt *Weight =		ConstantInt *Weight =
mdconst::dyn_extract<ConstantInt>(WeightsNode->getOperand(OpNo));		mdconst::dyn_extract<ConstantInt>(WeightsNode->getOperand(OpNo));
if (!Weight)		if (!Weight)
return "";		return "";
return ("label=\"W:" + std::to_string(Weight->getZExtValue()) +		return ("label=\"W:" + std::to_string(Weight->getZExtValue()) +
Show All 30 Lines

llvm/include/llvm/IR/Instructions.h

	Show First 20 Lines • Show All 3,614 Lines • ▼ Show 20 Lines
	/// A wrapper class to simplify modification of SwitchInst cases along with			/// A wrapper class to simplify modification of SwitchInst cases along with
	/// their prof branch_weights metadata.			/// their prof branch_weights metadata.
	class SwitchInstProfUpdateWrapper {			class SwitchInstProfUpdateWrapper {
	SwitchInst &SI;			SwitchInst &SI;
	std::optional<SmallVector<uint32_t, 8>> Weights;			std::optional<SmallVector<uint32_t, 8>> Weights;
	bool Changed = false;			bool Changed = false;

	protected:			protected:
	static MDNode *getProfBranchWeightsMD(const SwitchInst &SI);

	MDNode *buildProfBranchWeightsMD();			MDNode *buildProfBranchWeightsMD();

	void init();			void init();

	public:			public:
	using CaseWeightOpt = std::optional<uint32_t>;			using CaseWeightOpt = std::optional<uint32_t>;
	SwitchInst *operator->() { return &SI; }			SwitchInst *operator->() { return &SI; }
	SwitchInst &operator*() { return SI; }			SwitchInst &operator*() { return SI; }
	▲ Show 20 Lines • Show All 1,827 Lines • Show Last 20 Lines

llvm/include/llvm/IR/ProfDataUtils.h

	Show All 28 Lines

	/// Checks if an instruction has Branch Weight Metadata			/// Checks if an instruction has Branch Weight Metadata
	///			///
	/// \param I The instruction to check			/// \param I The instruction to check
	/// \returns True if I has an MD_prof node containing Branch Weights. False			/// \returns True if I has an MD_prof node containing Branch Weights. False
	/// otherwise.			/// otherwise.
	bool hasBranchWeightMD(const Instruction &I);			bool hasBranchWeightMD(const Instruction &I);

				/// Checks if an instruction has valid Branch Weight Metadata
				///
				/// \param I The instruction to check
				/// \returns True if I has an MD_prof node containing valid Branch Weights,
				/// i.e., one weight for each successor. False otherwise.
				bool hasValidBranchWeightMD(const Instruction &I);

				/// Get the branch weights metadata node
				///
				/// \param I The Instruction to get the weights from.
				/// \returns A pointer to I's branch weights metadata node, if it exists.
				/// Nullptr otherwise.
				MDNode *getBranchWeightMDNode(const Instruction &I);

				/// Get the valid branch weights metadata node
				///
				/// \param I The Instruction to get the weights from.
				/// \returns A pointer to I's valid branch weights metadata node, if it exists.
				/// Nullptr otherwise.
				MDNode *getValidBranchWeightMDNode(const Instruction &I);

	/// Extract branch weights from MD_prof metadata			/// Extract branch weights from MD_prof metadata
	///			///
	/// \param ProfileData A pointer to an MDNode.			/// \param ProfileData A pointer to an MDNode.
	/// \param [out] Weights An output vector to fill with branch weights			/// \param [out] Weights An output vector to fill with branch weights
	/// \returns True if weights were extracted, False otherwise. When false Weights			/// \returns True if weights were extracted, False otherwise. When false Weights
	/// will be cleared.			/// will be cleared.
	bool extractBranchWeights(const MDNode *ProfileData,			bool extractBranchWeights(const MDNode *ProfileData,
	SmallVectorImpl<uint32_t> &Weights);			SmallVectorImpl<uint32_t> &Weights);

	/// Extract branch weights attached to an Instruction			/// Extract branch weights attached to an Instruction
	///			///
	/// \param I The Instruction to extract weights from.			/// \param I The Instruction to extract weights from.
	/// \param [out] Weights An output vector to fill with branch weights			/// \param [out] Weights An output vector to fill with branch weights
	/// \returns True if weights were extracted, False otherwise. When false Weights			/// \returns True if weights were extracted, False otherwise. When false Weights
	/// will be cleared.			/// will be cleared.
	bool extractBranchWeights(const Instruction &I,			bool extractBranchWeights(const Instruction &I,
	SmallVectorImpl<uint32_t> &Weights);			SmallVectorImpl<uint32_t> &Weights);

	/// Extract branch weights from a conditional branch or select Instruction.			/// Extract branch weights from a conditional branch or select Instruction.
				paulkirthUnsubmitted Done Reply Inline Actions This is incorrect. This overload is specifically for branch/select instructions where the number of successors is 2. There is a more general version that uses weights vector for all instruction types, including switches. If this API isn't needed anywhere/in the code base anymore, then it can be removed IMO, but this comment shouldn't change. paulkirth: This is incorrect. This overload is specifically for branch/select instructions where the…
	///			///
	/// \param I The instruction to extract branch weights from.			/// \param I The instruction to extract branch weights from.
	/// \param [out] TrueVal will contain the branch weight for the True branch			/// \param [out] TrueVal will contain the branch weight for the True branch
	/// \param [out] FalseVal will contain the branch weight for the False branch			/// \param [out] FalseVal will contain the branch weight for the False branch
	/// \returns True on success with profile weights filled in. False if no			/// \returns True on success with profile weights filled in. False if no
	/// metadata or invalid metadata was found.			/// metadata or invalid metadata was found.
	bool extractBranchWeights(const Instruction &I, uint64_t &TrueVal,			bool extractBranchWeights(const Instruction &I, uint64_t &TrueVal,
	uint64_t &FalseVal);			uint64_t &FalseVal);

	/// Retrieve the total of all weights from MD_prof data.			/// Retrieve the total of all weights from MD_prof data.
	///			///
	/// \param ProfileData The profile data to extract the total weight from			/// \param ProfileData The profile data to extract the total weight from
	/// \param [out] TotalWeights input variable to fill with total weights			/// \param [out] TotalWeights input variable to fill with total weights
	/// \returns True on success with profile total weights filled in. False if no			/// \returns True on success with profile total weights filled in. False if no
	/// metadata was found.			/// metadata was found.
	bool extractProfTotalWeight(const MDNode *ProfileData, uint64_t &TotalWeights);			bool extractProfTotalWeight(const MDNode *ProfileData, uint64_t &TotalWeights);

				/// Retrieve the total of all weights from an instruction.
				///
				/// \param I The instruction to extract the total weight from
				/// \param [out] TotalWeights input variable to fill with total weights
				/// \returns True on success with profile total weights filled in. False if no
				/// metadata was found.
				bool extractProfTotalWeight(const Instruction &I, uint64_t &TotalWeights);

	} // namespace llvm			} // namespace llvm
	#endif			#endif

llvm/lib/Analysis/BranchProbabilityInfo.cpp

	Show First 20 Lines • Show All 377 Lines • ▼ Show 20 Lines
	// set to min of metadata and unreachable heuristic.			// set to min of metadata and unreachable heuristic.
	bool BranchProbabilityInfo::calcMetadataWeights(const BasicBlock *BB) {			bool BranchProbabilityInfo::calcMetadataWeights(const BasicBlock *BB) {
	const Instruction *TI = BB->getTerminator();			const Instruction *TI = BB->getTerminator();
	assert(TI->getNumSuccessors() > 1 && "expected more than one successor!");			assert(TI->getNumSuccessors() > 1 && "expected more than one successor!");
	if (!(isa<BranchInst>(TI) \|\| isa<SwitchInst>(TI) \|\| isa<IndirectBrInst>(TI) \|\|			if (!(isa<BranchInst>(TI) \|\| isa<SwitchInst>(TI) \|\| isa<IndirectBrInst>(TI) \|\|
	isa<InvokeInst>(TI) \|\| isa<CallBrInst>(TI)))			isa<InvokeInst>(TI) \|\| isa<CallBrInst>(TI)))
	return false;			return false;

	MDNode *WeightsNode = TI->getMetadata(LLVMContext::MD_prof);			MDNode *WeightsNode = getValidBranchWeightMDNode(*TI);
	if (!WeightsNode)			if (!WeightsNode)
	return false;			return false;

	// Check that the number of successors is manageable.			// Check that the number of successors is manageable.
	assert(TI->getNumSuccessors() < UINT32_MAX && "Too many successors");			assert(TI->getNumSuccessors() < UINT32_MAX && "Too many successors");

	// Ensure there are weights for all of the successors. Note that the first
	// operand to the metadata node is a name, not a weight.
	if (WeightsNode->getNumOperands() != TI->getNumSuccessors() + 1)
	return false;

	// Build up the final weights that will be used in a temporary buffer.			// Build up the final weights that will be used in a temporary buffer.
	// Compute the sum of all weights to later decide whether they need to			// Compute the sum of all weights to later decide whether they need to
	// be scaled to fit in 32 bits.			// be scaled to fit in 32 bits.
	uint64_t WeightSum = 0;			uint64_t WeightSum = 0;
	SmallVector<uint32_t, 2> Weights;			SmallVector<uint32_t, 2> Weights;
	SmallVector<unsigned, 2> UnreachableIdxs;			SmallVector<unsigned, 2> UnreachableIdxs;
	SmallVector<unsigned, 2> ReachableIdxs;			SmallVector<unsigned, 2> ReachableIdxs;

	extractBranchWeights(*TI, Weights);			extractBranchWeights(WeightsNode, Weights);
	for (unsigned I = 0, E = Weights.size(); I != E; ++I) {			for (unsigned I = 0, E = Weights.size(); I != E; ++I) {
	WeightSum += Weights[I];			WeightSum += Weights[I];
	const LoopBlock SrcLoopBB = getLoopBlock(BB);			const LoopBlock SrcLoopBB = getLoopBlock(BB);
	const LoopBlock DstLoopBB = getLoopBlock(TI->getSuccessor(I));			const LoopBlock DstLoopBB = getLoopBlock(TI->getSuccessor(I));
	auto EstimatedWeight = getEstimatedEdgeWeight({SrcLoopBB, DstLoopBB});			auto EstimatedWeight = getEstimatedEdgeWeight({SrcLoopBB, DstLoopBB});
	if (EstimatedWeight &&			if (EstimatedWeight &&
	*EstimatedWeight <= static_cast<uint32_t>(BlockExecWeight::UNREACHABLE))			*EstimatedWeight <= static_cast<uint32_t>(BlockExecWeight::UNREACHABLE))
	UnreachableIdxs.push_back(I);			UnreachableIdxs.push_back(I);
	▲ Show 20 Lines • Show All 912 Lines • Show Last 20 Lines

llvm/lib/IR/Instruction.cpp

Show All 11 Lines

#include "llvm/IR/Instruction.h"		#include "llvm/IR/Instruction.h"
#include "llvm/ADT/DenseSet.h"		#include "llvm/ADT/DenseSet.h"
#include "llvm/IR/Constants.h"		#include "llvm/IR/Constants.h"
#include "llvm/IR/Instructions.h"		#include "llvm/IR/Instructions.h"
#include "llvm/IR/IntrinsicInst.h"		#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Intrinsics.h"		#include "llvm/IR/Intrinsics.h"
#include "llvm/IR/Operator.h"		#include "llvm/IR/Operator.h"
		#include "llvm/IR/ProfDataUtils.h"
#include "llvm/IR/Type.h"		#include "llvm/IR/Type.h"
using namespace llvm;		using namespace llvm;

Instruction::Instruction(Type *ty, unsigned it, Use *Ops, unsigned NumOps,		Instruction::Instruction(Type *ty, unsigned it, Use *Ops, unsigned NumOps,
Instruction *InsertBefore)		Instruction *InsertBefore)
: User(ty, Value::InstructionVal + it, Ops, NumOps), Parent(nullptr) {		: User(ty, Value::InstructionVal + it, Ops, NumOps), Parent(nullptr) {

// If requested, insert this instruction into a basic block...		// If requested, insert this instruction into a basic block...
▲ Show 20 Lines • Show All 822 Lines • ▼ Show 20 Lines	if (getSuccessor(Idx) == OldBB)
setSuccessor(Idx, NewBB);		setSuccessor(Idx, NewBB);
}		}

Instruction *Instruction::cloneImpl() const {		Instruction *Instruction::cloneImpl() const {
llvm_unreachable("Subclass of Instruction failed to implement cloneImpl");		llvm_unreachable("Subclass of Instruction failed to implement cloneImpl");
}		}

void Instruction::swapProfMetadata() {		void Instruction::swapProfMetadata() {
MDNode *ProfileData = getMetadata(LLVMContext::MD_prof);		MDNode *ProfileData = getBranchWeightMDNode(*this);
if (!ProfileData \|\| ProfileData->getNumOperands() != 3 \|\|		if (!ProfileData \|\| ProfileData->getNumOperands() != 3)
!isa<MDString>(ProfileData->getOperand(0)))
return;

MDString *MDName = cast<MDString>(ProfileData->getOperand(0));
if (MDName->getString() != "branch_weights")
return;		return;

// The first operand is the name. Fetch them backwards and build a new one.		// The first operand is the name. Fetch them backwards and build a new one.
Metadata *Ops[] = {ProfileData->getOperand(0), ProfileData->getOperand(2),		Metadata *Ops[] = {ProfileData->getOperand(0), ProfileData->getOperand(2),
ProfileData->getOperand(1)};		ProfileData->getOperand(1)};
setMetadata(LLVMContext::MD_prof,		setMetadata(LLVMContext::MD_prof,
MDNode::get(ProfileData->getContext(), Ops));		MDNode::get(ProfileData->getContext(), Ops));
}		}
Show All 39 Lines

llvm/lib/IR/Instructions.cpp

Show All 25 Lines
#include "llvm/IR/InstrTypes.h"		#include "llvm/IR/InstrTypes.h"
#include "llvm/IR/Instruction.h"		#include "llvm/IR/Instruction.h"
#include "llvm/IR/Intrinsics.h"		#include "llvm/IR/Intrinsics.h"
#include "llvm/IR/LLVMContext.h"		#include "llvm/IR/LLVMContext.h"
#include "llvm/IR/MDBuilder.h"		#include "llvm/IR/MDBuilder.h"
#include "llvm/IR/Metadata.h"		#include "llvm/IR/Metadata.h"
#include "llvm/IR/Module.h"		#include "llvm/IR/Module.h"
#include "llvm/IR/Operator.h"		#include "llvm/IR/Operator.h"
		#include "llvm/IR/ProfDataUtils.h"
#include "llvm/IR/Type.h"		#include "llvm/IR/Type.h"
#include "llvm/IR/Value.h"		#include "llvm/IR/Value.h"
#include "llvm/Support/AtomicOrdering.h"		#include "llvm/Support/AtomicOrdering.h"
#include "llvm/Support/Casting.h"		#include "llvm/Support/Casting.h"
#include "llvm/Support/ErrorHandling.h"		#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/MathExtras.h"		#include "llvm/Support/MathExtras.h"
#include "llvm/Support/ModRef.h"		#include "llvm/Support/ModRef.h"
#include "llvm/Support/TypeSize.h"		#include "llvm/Support/TypeSize.h"
▲ Show 20 Lines • Show All 4,525 Lines • ▼ Show 20 Lines
void SwitchInst::growOperands() {		void SwitchInst::growOperands() {
unsigned e = getNumOperands();		unsigned e = getNumOperands();
unsigned NumOps = e*3;		unsigned NumOps = e*3;

ReservedSpace = NumOps;		ReservedSpace = NumOps;
growHungoffUses(ReservedSpace);		growHungoffUses(ReservedSpace);
}		}

MDNode *
SwitchInstProfUpdateWrapper::getProfBranchWeightsMD(const SwitchInst &SI) {
if (MDNode *ProfileData = SI.getMetadata(LLVMContext::MD_prof))
if (auto *MDName = dyn_cast<MDString>(ProfileData->getOperand(0)))
if (MDName->getString() == "branch_weights")
return ProfileData;
return nullptr;
}

MDNode *SwitchInstProfUpdateWrapper::buildProfBranchWeightsMD() {		MDNode *SwitchInstProfUpdateWrapper::buildProfBranchWeightsMD() {
assert(Changed && "called only if metadata has changed");		assert(Changed && "called only if metadata has changed");

if (!Weights)		if (!Weights)
return nullptr;		return nullptr;

assert(SI.getNumSuccessors() == Weights->size() &&		assert(SI.getNumSuccessors() == Weights->size() &&
"num of prof branch_weights must accord with num of successors");		"num of prof branch_weights must accord with num of successors");

bool AllZeroes = all_of(*Weights, [](uint32_t W) { return W == 0; });		bool AllZeroes = all_of(*Weights, [](uint32_t W) { return W == 0; });

if (AllZeroes \|\| Weights->size() < 2)		if (AllZeroes \|\| Weights->size() < 2)
return nullptr;		return nullptr;

return MDBuilder(SI.getParent()->getContext()).createBranchWeights(*Weights);		return MDBuilder(SI.getParent()->getContext()).createBranchWeights(*Weights);
}		}

void SwitchInstProfUpdateWrapper::init() {		void SwitchInstProfUpdateWrapper::init() {
MDNode *ProfileData = getProfBranchWeightsMD(SI);		MDNode *ProfileData = getBranchWeightMDNode(SI);
if (!ProfileData)		if (!ProfileData)
return;		return;

if (ProfileData->getNumOperands() != SI.getNumSuccessors() + 1) {		if (ProfileData->getNumOperands() != SI.getNumSuccessors() + 1) {
llvm_unreachable("number of prof branch_weights metadata operands does "		llvm_unreachable("number of prof branch_weights metadata operands does "
"not correspond to number of succesors");		"not correspond to number of succesors");
}		}
paulkirthUnsubmitted Done Reply Inline Actions I don't think we do this check in ProfDataUtils, so we probably shouldn't remove it, should we? I know I've tripped this assert before when modifying some passes, so I think it's a good one to keep. paulkirth: I don't think we do this check in ProfDataUtils, so we probably shouldn't remove it, should we?
DinistroAuthorUnsubmitted Done Reply Inline Actions I changed this back to have the `llvm_unreachable`. The newly added `getValidBranchWeightMDNode` could be used here but that would not cause an assertion violation. Dinistro: I changed this back to have the `llvm_unreachable`. The newly added…

SmallVector<uint32_t, 8> Weights;		SmallVector<uint32_t, 8> Weights;
for (unsigned CI = 1, CE = SI.getNumSuccessors(); CI <= CE; ++CI) {		if (!extractBranchWeights(ProfileData, Weights))
ConstantInt *C = mdconst::extract<ConstantInt>(ProfileData->getOperand(CI));		return;
uint32_t CW = C->getValue().getZExtValue();
Weights.push_back(CW);
}
this->Weights = std::move(Weights);		this->Weights = std::move(Weights);
}		}

SwitchInst::CaseIt		SwitchInst::CaseIt
SwitchInstProfUpdateWrapper::removeCase(SwitchInst::CaseIt I) {		SwitchInstProfUpdateWrapper::removeCase(SwitchInst::CaseIt I) {
if (Weights) {		if (Weights) {
assert(SI.getNumSuccessors() == Weights->size() &&		assert(SI.getNumSuccessors() == Weights->size() &&
"num of prof branch_weights must accord with num of successors");		"num of prof branch_weights must accord with num of successors");
▲ Show 20 Lines • Show All 56 Lines • ▼ Show 20 Lines	if (*W != OldW) {
OldW = *W;		OldW = *W;
}		}
}		}
}		}

SwitchInstProfUpdateWrapper::CaseWeightOpt		SwitchInstProfUpdateWrapper::CaseWeightOpt
SwitchInstProfUpdateWrapper::getSuccessorWeight(const SwitchInst &SI,		SwitchInstProfUpdateWrapper::getSuccessorWeight(const SwitchInst &SI,
unsigned idx) {		unsigned idx) {
if (MDNode *ProfileData = getProfBranchWeightsMD(SI))		if (MDNode *ProfileData = getBranchWeightMDNode(SI))
if (ProfileData->getNumOperands() == SI.getNumSuccessors() + 1)		if (ProfileData->getNumOperands() == SI.getNumSuccessors() + 1)
return mdconst::extract<ConstantInt>(ProfileData->getOperand(idx + 1))		return mdconst::extract<ConstantInt>(ProfileData->getOperand(idx + 1))
->getValue()		->getValue()
.getZExtValue();		.getZExtValue();

return std::nullopt;		return std::nullopt;
}		}

▲ Show 20 Lines • Show All 311 Lines • Show Last 20 Lines

llvm/lib/IR/Metadata.cpp

	Show First 20 Lines • Show All 1,538 Lines • ▼ Show 20 Lines
	bool Instruction::extractProfTotalWeight(uint64_t &TotalVal) const {			bool Instruction::extractProfTotalWeight(uint64_t &TotalVal) const {
	assert(			assert(
	(getOpcode() == Instruction::Br \|\| getOpcode() == Instruction::Select \|\|			(getOpcode() == Instruction::Br \|\| getOpcode() == Instruction::Select \|\|
	getOpcode() == Instruction::Call \|\| getOpcode() == Instruction::Invoke \|\|			getOpcode() == Instruction::Call \|\| getOpcode() == Instruction::Invoke \|\|
	getOpcode() == Instruction::IndirectBr \|\|			getOpcode() == Instruction::IndirectBr \|\|
	getOpcode() == Instruction::Switch) &&			getOpcode() == Instruction::Switch) &&
	"Looking for branch weights on something besides branch");			"Looking for branch weights on something besides branch");

	return ::extractProfTotalWeight(getMetadata(LLVMContext::MD_prof), TotalVal);			return ::extractProfTotalWeight(*this, TotalVal);
	}			}

	void GlobalObject::copyMetadata(const GlobalObject *Other, unsigned Offset) {			void GlobalObject::copyMetadata(const GlobalObject *Other, unsigned Offset) {
	SmallVector<std::pair<unsigned, MDNode *>, 8> MDs;			SmallVector<std::pair<unsigned, MDNode *>, 8> MDs;
	Other->getAllMetadata(MDs);			Other->getAllMetadata(MDs);
	for (auto &MD : MDs) {			for (auto &MD : MDs) {
	// We need to adjust the type metadata offset.			// We need to adjust the type metadata offset.
	if (Offset != 0 && MD.first == LLVMContext::MD_type) {			if (Offset != 0 && MD.first == LLVMContext::MD_type) {
	▲ Show 20 Lines • Show All 93 Lines • Show Last 20 Lines

llvm/lib/IR/ProfDataUtils.cpp

Show All 37 Lines

// //

// We maintain some constants here to ensure that we access the branch weights // We maintain some constants here to ensure that we access the branch weights

// correctly, and can change the behavior in the future if the layout changes // correctly, and can change the behavior in the future if the layout changes

// The index at which the weights vector starts // The index at which the weights vector starts

constexpr unsigned WeightsIdx = 1; constexpr unsigned WeightsIdx = 1;

// the minimum number of operands for MD_prof nodes with branch weights // the minimum number of operands for MD_prof nodes with branch weights

constexpr unsigned MinBWOps = 3; constexpr unsigned MinBWOps = 3;

paulkirthUnsubmitted

Done

This constant is used to check the validity of branch weight metadata. Changing this to 2 implies that an MD_prof node with only the "branch_weights" moniker and a single weight is valid. I don't think that's true, so I don't think this should change unless we change how MD_prof is laid out as a whole.

paulkirth: This constant is used to check the validity of branch weight metadata. Changing this to 2…

davidxlUnsubmitted

Done

agree. What is the reason to change it to 2?

davidxl: agree. What is the reason to change it to 2?

DinistroAuthorUnsubmitted

Done

I changed this because calls can also have branch weights: https://llvm.org/docs/BranchWeightMetadata.html#callinst
It turns out that branch weights of calls differ from other branch weights and therefore cannot be handled by this utility in its current state anyway, so I reverted this part.

Dinistro: I changed this because calls can also have branch weights: https://llvm.

bool extractWeights(const MDNode *ProfileData, bool extractWeights(const MDNode *ProfileData,

SmallVectorImpl<uint32_t> &Weights) { SmallVectorImpl<uint32_t> &Weights) {

// Assume preconditions are already met (i.e. this is valid metadata) // Assume preconditions are already met (i.e. this is valid metadata)

assert(ProfileData && "ProfileData was nullptr in extractWeights"); assert(ProfileData && "ProfileData was nullptr in extractWeights");

unsigned NOps = ProfileData->getNumOperands(); unsigned NOps = ProfileData->getNumOperands();

assert(WeightsIdx < NOps && "Weights Index must be less than NOps."); assert(WeightsIdx < NOps && "Weights Index must be less than NOps.");

▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines bool isBranchWeightMD(const MDNode *ProfileData) {

return isTargetMD(ProfileData, "branch_weights", MinBWOps); return isTargetMD(ProfileData, "branch_weights", MinBWOps);

} }

bool hasBranchWeightMD(const Instruction &I) { bool hasBranchWeightMD(const Instruction &I) {

auto *ProfileData = I.getMetadata(LLVMContext::MD_prof); auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);

return isBranchWeightMD(ProfileData); return isBranchWeightMD(ProfileData);

} }

/// Reports whether \p I carries branch weight metadata whose operand count
/// matches its successor count.
///
/// The MD_prof node must pass isBranchWeightMD and have exactly one operand
/// more than \p I has successors.
///
/// \param I The instruction to inspect.
/// \returns True if both conditions hold, false otherwise.
bool hasValidBranchWeightMD(const Instruction &I) {
  auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);
  // Evaluation order matches the step-by-step form: branch-weight check
  // first, then the null guard, then the operand-count comparison.
  return isBranchWeightMD(ProfileData) && ProfileData &&
         ProfileData->getNumOperands() == 1 + I.getNumSuccessors();
}

/// Fetches the MD_prof node attached to \p I when it is branch weight
/// metadata.
///
/// \param I The instruction to read the metadata from.
/// \returns The MD_prof node if isBranchWeightMD accepts it, nullptr
/// otherwise.
MDNode *getBranchWeightMDNode(const Instruction &I) {
  auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);
  return isBranchWeightMD(ProfileData) ? ProfileData : nullptr;
}

/// Fetches the MD_prof node attached to \p I when hasValidBranchWeightMD
/// accepts the instruction.
///
/// \param I The instruction to read the metadata from.
/// \returns The MD_prof node if \p I has valid branch weights, nullptr
/// otherwise.
MDNode *getValidBranchWeightMDNode(const Instruction &I) {
  return hasValidBranchWeightMD(I) ? I.getMetadata(LLVMContext::MD_prof)
                                   : nullptr;
}

paulkirthUnsubmitted

Done

return isBranchWeightMD(ProfileData);

}

bool hasValidBranchWeightMD(const Instruction &I) {

- auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);

- if (!isBranchWeightMD(ProfileData))

- return false;

- if (ProfileData && ProfileData->getNumOperands() == 1 + I.getNumSuccessors())

- return true;

- return false;

+ return getValidBranchWeightMDNode(I);

}

MDNode *getBranchWeightMDNode(const Instruction &I) {

auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);

if (!isBranchWeightMD(ProfileData))

return nullptr;

return ProfileData;

}

MDNode *getValidBranchWeightMDNode(const Instruction &I) {

- if (!hasValidBranchWeightMD(I))

- return nullptr;

- return I.getMetadata(LLVMContext::MD_prof);

+ auto *ProfileData = getBranchWeightMDNode(I);

+ if (ProfileData && ProfileData->getNumOperands() == 1 + I.getNumSuccessors())

+ return ProfileData;

+ return nullptr;

}

bool extractBranchWeights(const MDNode *ProfileData,

I'd consider inverting the logic between getValidBranchWeightMDNode() and hasValidBranchWeightMD()

paulkirth: I'd consider inverting the logic between `getValidBranchWeightMDNode()` and…

bool extractBranchWeights(const MDNode *ProfileData, bool extractBranchWeights(const MDNode *ProfileData,

SmallVectorImpl<uint32_t> &Weights) { SmallVectorImpl<uint32_t> &Weights) {

if (!isBranchWeightMD(ProfileData)) if (!isBranchWeightMD(ProfileData))

return false; return false;

return extractWeights(ProfileData, Weights); return extractWeights(ProfileData, Weights);

} }

bool extractBranchWeights(const Instruction &I, bool extractBranchWeights(const Instruction &I,

SmallVectorImpl<uint32_t> &Weights) { SmallVectorImpl<uint32_t> &Weights) {

auto *ProfileData = I.getMetadata(LLVMContext::MD_prof); auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);

return extractBranchWeights(ProfileData, Weights); return extractBranchWeights(ProfileData, Weights);

} }

bool extractBranchWeights(const Instruction &I, uint64_t &TrueVal, bool extractBranchWeights(const Instruction &I, uint64_t &TrueVal,

uint64_t &FalseVal) { uint64_t &FalseVal) {

assert((I.getOpcode() == Instruction::Br || assert((I.getOpcode() == Instruction::Br ||

I.getOpcode() == Instruction::Select) && I.getOpcode() == Instruction::Select) &&

"Looking for branch weights on something besides branch or select"); "Looking for branch weights on something besides branch, select, or "

"switch");

paulkirthUnsubmitted

Done

This is wrong. You can't include a switch here. The overload above that takes a SmallVectorImpl is the only appropriate API when dealing with a switch, since it can have an arbitrary number of arms.

The assertion here is to prevent API misuse. If used on a switch, this will always return false, so I don't think that's the right choice here. You get some utility by being able to use this in more places, but I think this will make it easy to introduce subtle bugs. For instance, if a switch happens to only have 2 arms this will work when it arguably shouldn't.

My preference would be that everything settle on the SmallVectorImpl API, since that can correctly handle all cases. It isn't as ergonomic in some of the code uses though, IIRC.

paulkirth: This is wrong. you can't include a switch here. The overload above takes a `SmallVectorImpl` is…

davidxlUnsubmitted

Done

Agree.

davidxl: Agree.

SmallVector<uint32_t, 2> Weights; SmallVector<uint32_t, 2> Weights;

auto *ProfileData = I.getMetadata(LLVMContext::MD_prof); auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);

if (!extractBranchWeights(ProfileData, Weights)) if (!extractBranchWeights(ProfileData, Weights))

return false; return false;

if (Weights.size() > 2) if (Weights.size() > 2)

return false; return false;

Show All 26 Lines if (ProfDataName->getString().equals("VP") &&

TotalVal = mdconst::dyn_extract<ConstantInt>(ProfileData->getOperand(2)) TotalVal = mdconst::dyn_extract<ConstantInt>(ProfileData->getOperand(2))

->getValue() ->getValue()

.getZExtValue(); .getZExtValue();

return true; return true;

} }

return false; return false;

} }

/// Retrieves the total profile weight from the MD_prof node attached to \p I.
///
/// Forwards to the MDNode-based extractProfTotalWeight overload.
///
/// \param I The instruction whose MD_prof metadata is read.
/// \param [out] TotalVal Passed through to the MDNode overload.
/// \returns Whatever the MDNode overload returns for the attached metadata.
bool extractProfTotalWeight(const Instruction &I, uint64_t &TotalVal) {
  auto *ProfileData = I.getMetadata(LLVMContext::MD_prof);
  return extractProfTotalWeight(ProfileData, TotalVal);
}

} // namespace llvm } // namespace llvm

llvm/lib/Transforms/IPO/PartialInlining.cpp

Show First 20 Lines • Show All 710 Lines • ▼ Show 20 Lines

static bool hasProfileData(const Function &F, const FunctionOutliningInfo &OI) {

if (F.hasProfileData())

return true;

// Now check if any of the entry block has MD_prof data:

for (auto *E : OI.Entries) {

BranchInst *BR = dyn_cast<BranchInst>(E->getTerminator());

if (!BR || BR->isUnconditional())

continue;

uint64_t T, F;

if (hasBranchWeightMD(*BR))

paulkirthUnsubmitted

Done

continue;

- if (getBranchWeightMDNode(*BR))

+ if (hasBranchWeightMD(*BR))

return true;

paulkirth:

if (extractBranchWeights(*BR, T, F))

return true;

}

return false;

}

BranchProbability PartialInlinerImpl::getOutliningCallBBRelativeFreq(

FunctionCloner &Cloner) const {

BasicBlock *OutliningCallBB = Cloner.OutlinedFunctions.back().second;

▲ Show 20 Lines • Show All 819 Lines • Show Last 20 Lines

llvm/lib/Transforms/Instrumentation/ControlHeightReduction.cpp

Show All 23 Lines
#include "llvm/Analysis/RegionIterator.h"		#include "llvm/Analysis/RegionIterator.h"
#include "llvm/Analysis/ValueTracking.h"		#include "llvm/Analysis/ValueTracking.h"
#include "llvm/IR/CFG.h"		#include "llvm/IR/CFG.h"
#include "llvm/IR/Dominators.h"		#include "llvm/IR/Dominators.h"
#include "llvm/IR/IRBuilder.h"		#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/IntrinsicInst.h"		#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/MDBuilder.h"		#include "llvm/IR/MDBuilder.h"
#include "llvm/IR/PassManager.h"		#include "llvm/IR/PassManager.h"
		#include "llvm/IR/ProfDataUtils.h"
#include "llvm/InitializePasses.h"		#include "llvm/InitializePasses.h"
#include "llvm/Support/BranchProbability.h"		#include "llvm/Support/BranchProbability.h"
#include "llvm/Support/CommandLine.h"		#include "llvm/Support/CommandLine.h"
#include "llvm/Support/MemoryBuffer.h"		#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Transforms/Utils.h"		#include "llvm/Transforms/Utils.h"
#include "llvm/Transforms/Utils/BasicBlockUtils.h"		#include "llvm/Transforms/Utils/BasicBlockUtils.h"
#include "llvm/Transforms/Utils/Cloning.h"		#include "llvm/Transforms/Utils/Cloning.h"
#include "llvm/Transforms/Utils/ValueMapper.h"		#include "llvm/Transforms/Utils/ValueMapper.h"
▲ Show 20 Lines • Show All 529 Lines • ▼ Show 20 Lines	if (isHoistable(I, DT)) {
}		}
}		}
Visited[I] = false;		Visited[I] = false;
return false;		return false;
}		}
// Non-instructions are considered hoistable.		// Non-instructions are considered hoistable.
return true;		return true;
}		}

// Returns true and sets the true probability and false probability of an		// Constructs the true and false branch probabilities if the instruction has
		paulkirthUnsubmitted Done Reply Inline Actions Oh, this is a good change. The API use is much better at call sites. Since the validation is basically done in ProfDataUtils, maybe rename this API to something more self descriptive? paulkirth: Oh, this is a good change. The API use is much better at call sites. Since the validation is…
// MD_prof metadata if it's well-formed.		// valid branch weights. Returns true when this was successful, false otherwise.
static bool checkMDProf(MDNode *MD, BranchProbability &TrueProb,		static bool extractBranchProbabilities(Instruction *I,
		BranchProbability &TrueProb,
BranchProbability &FalseProb) {		BranchProbability &FalseProb) {
if (!MD) return false;		uint64_t TrueWeight;
MDString *MDName = cast<MDString>(MD->getOperand(0));		uint64_t FalseWeight;
if (MDName->getString() != "branch_weights" \|\|		if (!extractBranchWeights(*I, TrueWeight, FalseWeight))
MD->getNumOperands() != 3)
return false;		return false;
ConstantInt *TrueWeight = mdconst::extract<ConstantInt>(MD->getOperand(1));		uint64_t SumWeight = TrueWeight + FalseWeight;
		paulkirthUnsubmitted Done Reply Inline Actions nit: if we're changing the variable names, let's be consistent. I'd leave them as they were to limit the change, but if we're changing some, we should change them uniformly. paulkirth: nit: if we're changing the variable names, let's be consistent. I'd leave them as they were to…
ConstantInt *FalseWeight = mdconst::extract<ConstantInt>(MD->getOperand(2));
if (!TrueWeight \|\| !FalseWeight)
return false;
uint64_t TrueWt = TrueWeight->getValue().getZExtValue();
uint64_t FalseWt = FalseWeight->getValue().getZExtValue();
uint64_t SumWt = TrueWt + FalseWt;

assert(SumWt >= TrueWt && SumWt >= FalseWt &&		assert(SumWeight >= TrueWeight && SumWeight >= FalseWeight &&
"Overflow calculating branch probabilities.");		"Overflow calculating branch probabilities.");

// Guard against 0-to-0 branch weights to avoid a division-by-zero crash.		// Guard against 0-to-0 branch weights to avoid a division-by-zero crash.
if (SumWt == 0)		if (SumWeight == 0)
return false;		return false;

TrueProb = BranchProbability::getBranchProbability(TrueWt, SumWt);		TrueProb = BranchProbability::getBranchProbability(TrueWeight, SumWeight);
FalseProb = BranchProbability::getBranchProbability(FalseWt, SumWt);		FalseProb = BranchProbability::getBranchProbability(FalseWeight, SumWeight);
return true;		return true;
}		}

static BranchProbability getCHRBiasThreshold() {		static BranchProbability getCHRBiasThreshold() {
return BranchProbability::getBranchProbability(		return BranchProbability::getBranchProbability(
static_cast<uint64_t>(CHRBiasThreshold * 1000000), 1000000);		static_cast<uint64_t>(CHRBiasThreshold * 1000000), 1000000);
}		}

Show All 22 Lines
// branch of the region is biased.		// branch of the region is biased.
static bool checkBiasedBranch(BranchInst BI, Region R,		static bool checkBiasedBranch(BranchInst BI, Region R,
DenseSet<Region *> &TrueBiasedRegionsGlobal,		DenseSet<Region *> &TrueBiasedRegionsGlobal,
DenseSet<Region *> &FalseBiasedRegionsGlobal,		DenseSet<Region *> &FalseBiasedRegionsGlobal,
DenseMap<Region *, BranchProbability> &BranchBiasMap) {		DenseMap<Region *, BranchProbability> &BranchBiasMap) {
if (!BI->isConditional())		if (!BI->isConditional())
return false;		return false;
BranchProbability ThenProb, ElseProb;		BranchProbability ThenProb, ElseProb;
if (!checkMDProf(BI->getMetadata(LLVMContext::MD_prof),		if (!extractBranchProbabilities(BI, ThenProb, ElseProb))
ThenProb, ElseProb))
return false;		return false;
BasicBlock *IfThen = BI->getSuccessor(0);		BasicBlock *IfThen = BI->getSuccessor(0);
BasicBlock *IfElse = BI->getSuccessor(1);		BasicBlock *IfElse = BI->getSuccessor(1);
assert((IfThen == R->getExit() \|\| IfElse == R->getExit()) &&		assert((IfThen == R->getExit() \|\| IfElse == R->getExit()) &&
IfThen != IfElse &&		IfThen != IfElse &&
"Invariant from findScopes");		"Invariant from findScopes");
if (IfThen == R->getExit()) {		if (IfThen == R->getExit()) {
// Swap them so that IfThen/ThenProb means going into the conditional code		// Swap them so that IfThen/ThenProb means going into the conditional code
Show All 12 Lines
// Returns true and insert a select into the right biased set and the map if the		// Returns true and insert a select into the right biased set and the map if the
// select is biased.		// select is biased.
static bool checkBiasedSelect(		static bool checkBiasedSelect(
SelectInst SI, Region R,		SelectInst SI, Region R,
DenseSet<SelectInst *> &TrueBiasedSelectsGlobal,		DenseSet<SelectInst *> &TrueBiasedSelectsGlobal,
DenseSet<SelectInst *> &FalseBiasedSelectsGlobal,		DenseSet<SelectInst *> &FalseBiasedSelectsGlobal,
DenseMap<SelectInst *, BranchProbability> &SelectBiasMap) {		DenseMap<SelectInst *, BranchProbability> &SelectBiasMap) {
BranchProbability TrueProb, FalseProb;		BranchProbability TrueProb, FalseProb;
if (!checkMDProf(SI->getMetadata(LLVMContext::MD_prof),		if (!extractBranchProbabilities(SI, TrueProb, FalseProb))
TrueProb, FalseProb))
return false;		return false;
CHR_DEBUG(dbgs() << "SI " << *SI << " ");		CHR_DEBUG(dbgs() << "SI " << *SI << " ");
CHR_DEBUG(dbgs() << "TrueProb " << TrueProb << " ");		CHR_DEBUG(dbgs() << "TrueProb " << TrueProb << " ");
CHR_DEBUG(dbgs() << "FalseProb " << FalseProb << "\n");		CHR_DEBUG(dbgs() << "FalseProb " << FalseProb << "\n");
return checkBias(SI, TrueProb, FalseProb,		return checkBias(SI, TrueProb, FalseProb,
TrueBiasedSelectsGlobal, FalseBiasedSelectsGlobal,		TrueBiasedSelectsGlobal, FalseBiasedSelectsGlobal,
SelectBiasMap);		SelectBiasMap);
}		}
▲ Show 20 Lines • Show All 1,421 Lines • Show Last 20 Lines

llvm/lib/Transforms/Scalar/JumpThreading.cpp

Show First 20 Lines • Show All 2,515 Lines • ▼ Show 20 Lines	BasicBlock JumpThreadingPass::splitBlockPreds(BasicBlock BB,
}		}

DTU->applyUpdatesPermissive(Updates);		DTU->applyUpdatesPermissive(Updates);
return NewBBs[0];		return NewBBs[0];
}		}

bool JumpThreadingPass::doesBlockHaveProfileData(BasicBlock *BB) {		bool JumpThreadingPass::doesBlockHaveProfileData(BasicBlock *BB) {
const Instruction *TI = BB->getTerminator();		const Instruction *TI = BB->getTerminator();
assert(TI->getNumSuccessors() > 1 && "not a split");		assert(TI->getNumSuccessors() > 1 && "not a split");
		return hasValidBranchWeightMD(*TI);
		paulkirthUnsubmitted Done Reply Inline Actions I think we discourage `auto` in cases like this, don't we? See: https://llvm.org/docs/CodingStandards.html#use-auto-type-deduction-to-make-code-more-readable paulkirth: I think we discourage `auto` in cases like this, don't we? See: https://llvm.
MDNode *WeightsNode = TI->getMetadata(LLVMContext::MD_prof);
if (!WeightsNode)
return false;

MDString *MDName = cast<MDString>(WeightsNode->getOperand(0));
if (MDName->getString() != "branch_weights")
return false;

// Ensure there are weights for all of the successors. Note that the first
// operand to the metadata node is a name, not a weight.
return WeightsNode->getNumOperands() == TI->getNumSuccessors() + 1;
}		}

/// Update the block frequency of BB and branch weight and the metadata on the		/// Update the block frequency of BB and branch weight and the metadata on the
/// edge BB->SuccBB. This is done by scaling the weight of BB->SuccBB by 1 -		/// edge BB->SuccBB. This is done by scaling the weight of BB->SuccBB by 1 -
/// Freq(PredBB->BB) / Freq(BB->SuccBB).		/// Freq(PredBB->BB) / Freq(BB->SuccBB).
void JumpThreadingPass::updateBlockFreqAndEdgeWeight(BasicBlock *PredBB,		void JumpThreadingPass::updateBlockFreqAndEdgeWeight(BasicBlock *PredBB,
BasicBlock *BB,		BasicBlock *BB,
BasicBlock *NewBB,		BasicBlock *NewBB,
▲ Show 20 Lines • Show All 563 Lines • Show Last 20 Lines

llvm/lib/Transforms/Scalar/LoopPredication.cpp

Show First 20 Lines • Show All 185 Lines • ▼ Show 20 Lines
#include "llvm/Analysis/MemorySSA.h"		#include "llvm/Analysis/MemorySSA.h"
#include "llvm/Analysis/MemorySSAUpdater.h"		#include "llvm/Analysis/MemorySSAUpdater.h"
#include "llvm/Analysis/ScalarEvolution.h"		#include "llvm/Analysis/ScalarEvolution.h"
#include "llvm/Analysis/ScalarEvolutionExpressions.h"		#include "llvm/Analysis/ScalarEvolutionExpressions.h"
#include "llvm/IR/Function.h"		#include "llvm/IR/Function.h"
#include "llvm/IR/IntrinsicInst.h"		#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Module.h"		#include "llvm/IR/Module.h"
#include "llvm/IR/PatternMatch.h"		#include "llvm/IR/PatternMatch.h"
		#include "llvm/IR/ProfDataUtils.h"
#include "llvm/InitializePasses.h"		#include "llvm/InitializePasses.h"
#include "llvm/Pass.h"		#include "llvm/Pass.h"
#include "llvm/Support/CommandLine.h"		#include "llvm/Support/CommandLine.h"
#include "llvm/Support/Debug.h"		#include "llvm/Support/Debug.h"
#include "llvm/Transforms/Scalar.h"		#include "llvm/Transforms/Scalar.h"
#include "llvm/Transforms/Utils/GuardUtils.h"		#include "llvm/Transforms/Utils/GuardUtils.h"
#include "llvm/Transforms/Utils/Local.h"		#include "llvm/Transforms/Utils/Local.h"
#include "llvm/Transforms/Utils/LoopUtils.h"		#include "llvm/Transforms/Utils/LoopUtils.h"
▲ Show 20 Lines • Show All 766 Lines • ▼ Show 20 Lines	bool LoopPredication::isLoopProfitableToPredicate() {
// being complete for an entire function.		// being complete for an entire function.

// If the latch exits into a deoptimize or an unreachable block, do not		// If the latch exits into a deoptimize or an unreachable block, do not
// predicate on that latch check.		// predicate on that latch check.
auto *LatchExitBlock = LatchTerm->getSuccessor(LatchBrExitIdx);		auto *LatchExitBlock = LatchTerm->getSuccessor(LatchBrExitIdx);
if (isa<UnreachableInst>(LatchTerm) \|\|		if (isa<UnreachableInst>(LatchTerm) \|\|
LatchExitBlock->getTerminatingDeoptimizeCall())		LatchExitBlock->getTerminatingDeoptimizeCall())
return false;		return false;

auto IsValidProfileData = [](MDNode ProfileData, const Instruction Term) {
if (!ProfileData \|\| !ProfileData->getOperand(0))
return false;
if (MDString *MDS = dyn_cast<MDString>(ProfileData->getOperand(0)))
if (!MDS->getString().equals("branch_weights"))
return false;
if (ProfileData->getNumOperands() != 1 + Term->getNumSuccessors())
return false;
return true;
};
MDNode *LatchProfileData = LatchTerm->getMetadata(LLVMContext::MD_prof);
// Latch terminator has no valid profile data, so nothing to check		// Latch terminator has no valid profile data, so nothing to check
		paulkirthUnsubmitted Done Reply Inline Actions Should we also provide this API in `ProfDataUtils`? It's a validity check for branch weight nodes, and we already encapsulate most of it ... paulkirth: Should we also provide this API in `ProfDataUtils`? It's a validity check for branch weight…
// profitability on.		// profitability on.
if (!IsValidProfileData(LatchProfileData, LatchTerm))		if (!hasValidBranchWeightMD(*LatchTerm))
return true;		return true;

auto ComputeBranchProbability =		auto ComputeBranchProbability =
[&](const BasicBlock *ExitingBlock,		[&](const BasicBlock *ExitingBlock,
const BasicBlock *ExitBlock) -> BranchProbability {		const BasicBlock *ExitBlock) -> BranchProbability {
auto *Term = ExitingBlock->getTerminator();		auto *Term = ExitingBlock->getTerminator();
MDNode *ProfileData = Term->getMetadata(LLVMContext::MD_prof);
unsigned NumSucc = Term->getNumSuccessors();		unsigned NumSucc = Term->getNumSuccessors();
if (IsValidProfileData(ProfileData, Term)) {		if (MDNode ProfileData = getValidBranchWeightMDNode(Term)) {
uint64_t Numerator = 0, Denominator = 0, ProfVal = 0;		SmallVector<uint32_t> Weights;
for (unsigned i = 0; i < NumSucc; i++) {		extractBranchWeights(ProfileData, Weights);
ConstantInt *CI =		uint64_t Numerator = 0, Denominator = 0;
mdconst::extract<ConstantInt>(ProfileData->getOperand(i + 1));		for (auto [i, Weight] : llvm::enumerate(Weights)) {
		paulkirthUnsubmitted Done Reply Inline Actions I always forget the `enumerate` API exists ... what a massive improvement to readability. paulkirth: I always forget the `enumerate` API exists ... what a massive improvement to readability.
ProfVal = CI->getValue().getZExtValue();
if (Term->getSuccessor(i) == ExitBlock)		if (Term->getSuccessor(i) == ExitBlock)
Numerator += ProfVal;		Numerator += Weight;
Denominator += ProfVal;		Denominator += Weight;
}		}
return BranchProbability::getBranchProbability(Numerator, Denominator);		return BranchProbability::getBranchProbability(Numerator, Denominator);
} else {		} else {
assert(LatchBlock != ExitingBlock &&		assert(LatchBlock != ExitingBlock &&
"Latch term should always have profile data!");		"Latch term should always have profile data!");
// No profile data, so we choose the weight as 1/num_of_succ(Src)		// No profile data, so we choose the weight as 1/num_of_succ(Src)
return BranchProbability::getBranchProbability(1, NumSucc);		return BranchProbability::getBranchProbability(1, NumSucc);
}		}
▲ Show 20 Lines • Show All 321 Lines • Show Last 20 Lines

llvm/lib/Transforms/Utils/Local.cpp

Show First 20 Lines • Show All 56 Lines • ▼ Show 20 Lines

#include "llvm/IR/IntrinsicInst.h" #include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h" #include "llvm/IR/Intrinsics.h"

#include "llvm/IR/IntrinsicsWebAssembly.h" #include "llvm/IR/IntrinsicsWebAssembly.h"

#include "llvm/IR/LLVMContext.h" #include "llvm/IR/LLVMContext.h"

#include "llvm/IR/MDBuilder.h" #include "llvm/IR/MDBuilder.h"

#include "llvm/IR/Metadata.h" #include "llvm/IR/Metadata.h"

#include "llvm/IR/Module.h" #include "llvm/IR/Module.h"

#include "llvm/IR/PatternMatch.h" #include "llvm/IR/PatternMatch.h"

#include "llvm/IR/ProfDataUtils.h"

#include "llvm/IR/Type.h" #include "llvm/IR/Type.h"

#include "llvm/IR/Use.h" #include "llvm/IR/Use.h"

#include "llvm/IR/User.h" #include "llvm/IR/User.h"

#include "llvm/IR/Value.h" #include "llvm/IR/Value.h"

#include "llvm/IR/ValueHandle.h" #include "llvm/IR/ValueHandle.h"

#include "llvm/Support/Casting.h" #include "llvm/Support/Casting.h"

#include "llvm/Support/Debug.h" #include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h" #include "llvm/Support/ErrorHandling.h"

▲ Show 20 Lines • Show All 132 Lines • ▼ Show 20 Lines for (auto i = SI->case_begin(), e = SI->case_end(); i != e;) {

if (i->getCaseValue() == CI) { if (i->getCaseValue() == CI) {

TheOnlyDest = i->getCaseSuccessor(); TheOnlyDest = i->getCaseSuccessor();

break; break;

} }

// Check to see if this branch is going to the same place as the default // Check to see if this branch is going to the same place as the default

// dest. If so, eliminate it as an explicit compare. // dest. If so, eliminate it as an explicit compare.

if (i->getCaseSuccessor() == DefaultDest) { if (i->getCaseSuccessor() == DefaultDest) {

MDNode *MD = SI->getMetadata(LLVMContext::MD_prof); MDNode *MD = getBranchWeightMDNode(*SI);

unsigned NCases = SI->getNumCases(); unsigned NCases = SI->getNumCases();

// Fold the case metadata into the default if there will be any branches // Fold the case metadata into the default if there will be any branches

// left, unless the metadata doesn't match the switch. // left, unless the metadata doesn't match the switch.

if (NCases > 1 && MD && MD->getNumOperands() == 2 + NCases) { if (NCases > 1 && MD && MD->getNumOperands() == 2 + NCases) {

// Collect branch weights into a vector. // Collect branch weights into a vector.

SmallVector<uint32_t, 8> Weights; SmallVector<uint32_t, 8> Weights;

for (unsigned MD_i = 1, MD_e = MD->getNumOperands(); MD_i < MD_e; extractBranchWeights(MD, Weights);

++MD_i) {

paulkirthUnsubmitted

Done

SmallVector<uint32_t, 8> Weights;

- extractBranchWeights(*SI, Weights);

+ extractBranchWeights(MD, Weights);

// Merge weight of this case to the default weight.

paulkirth:

auto *CI = mdconst::extract<ConstantInt>(MD->getOperand(MD_i));

Weights.push_back(CI->getValue().getZExtValue());

}

// Merge weight of this case to the default weight. // Merge weight of this case to the default weight.

unsigned idx = i->getCaseIndex(); unsigned idx = i->getCaseIndex();

// TODO: no overflow check

paulkirthUnsubmitted

Done

Should we track this improvement w/ an issue? If you don't want to that's fine, but I always lose track of these TODOs unless I file something in a bug tracker and ref it from my code. Totally up to you though.

paulkirth: Should we track this improvement w/ an issue? If you don't want to that's fine, but I always…

DinistroAuthorUnsubmitted

Done

Good idea, I tracked this and another problem with the subsequent swap in here: https://github.com/llvm/llvm-project/issues/59956

Dinistro: Good idea, I tracked this and another problem with the subsequent swap in here: https://github.

Weights[0] += Weights[idx+1]; Weights[0] += Weights[idx+1];

// TODO: that's incorrect, no?

// Remove weight for this case. // Remove weight for this case.

std::swap(Weights[idx+1], Weights.back()); std::swap(Weights[idx+1], Weights.back());

Weights.pop_back(); Weights.pop_back();

SI->setMetadata(LLVMContext::MD_prof, SI->setMetadata(LLVMContext::MD_prof,

MDBuilder(BB->getContext()). MDBuilder(BB->getContext()).

createBranchWeights(Weights)); createBranchWeights(Weights));

} }

// Remove this entry. // Remove this entry.

▲ Show 20 Lines • Show All 72 Lines • ▼ Show 20 Lines if (SI->getNumCases() == 1) {

auto FirstCase = *SI->case_begin(); auto FirstCase = *SI->case_begin();

Value *Cond = Builder.CreateICmpEQ(SI->getCondition(), Value *Cond = Builder.CreateICmpEQ(SI->getCondition(),

FirstCase.getCaseValue(), "cond"); FirstCase.getCaseValue(), "cond");

// Insert the new branch. // Insert the new branch.

BranchInst *NewBr = Builder.CreateCondBr(Cond, BranchInst *NewBr = Builder.CreateCondBr(Cond,

FirstCase.getCaseSuccessor(), FirstCase.getCaseSuccessor(),

SI->getDefaultDest()); SI->getDefaultDest());

MDNode *MD = SI->getMetadata(LLVMContext::MD_prof); SmallVector<uint32_t> Weights;

if (MD && MD->getNumOperands() == 3) { if (extractBranchWeights(*SI, Weights) && Weights.size() == 2) {

ConstantInt *SICase = uint64_t DefWeight = Weights[0];

mdconst::dyn_extract<ConstantInt>(MD->getOperand(2)); uint64_t CaseWeight = Weights[1];

paulkirthUnsubmitted

Done

uint64_t, maybe? I can never remember what is guaranteed to run before we scale down to 32-bit weights, but the size should at least be the same between the weights vector and DefWeight/CaseWeight, right?

paulkirth: `uint64_t`, maybe? I can never remember what is guaranteed to run before we scale down to 32…

DinistroAuthorUnsubmitted

Done

The extractBranchWeights function expects a SmallVectorImpl<uint32_t>, so I now changed the Weight variables to uint32_t as well.

Dinistro: The `extractBranchWeights` function expects a `SmallVectorImpl<uint32_t>`, so I now changed the…

paulkirthUnsubmitted

Not Done

I think this is fine but we may want to double check that this only gets called after scaling down to 32-bit. Otherwise, maybe we should have a uint64_t version too, or make this a templated function in the .h, so that you can choose at the callsite. That can be a separate change though, as long as 32-bit is safe.

@davidxl do you know if this gets called after scaling down to 32-bit?

paulkirth: I think this is fine but we may want to double check that this only gets called after scaling…

davidxlUnsubmitted

Not Done

IRPGO scales the count before setting the edge weights. Frontend based instrumentation does the same. Static branch weights have small values so they are fine too.

davidxl: IRPGO scales the count before setting the edge weights. Frontend based instrumentation does…

ConstantInt *SIDef =

mdconst::dyn_extract<ConstantInt>(MD->getOperand(1));

assert(SICase && SIDef);

// The TrueWeight should be the weight for the single case of SI. // The TrueWeight should be the weight for the single case of SI.

paulkirthUnsubmitted

Done

SI->getDefaultDest());

- uint64_t DefWeight;

- uint64_t CaseWeight;

- if (extractBranchWeights(*SI, DefWeight, CaseWeight)) {

+ SmallVector<uint64_t,2> Weights;

+ if (extractBranchWeights(MD, DefWeight, CaseWeight)) {

// The TrueWeight should be the weight for the single case of SI.

The overload will just get the MD node again anyway before calling the other API, so I'd suggest just using the MD node directly. Would you mind changing these and any others in this patch that use getBranchWeightMDNode prior to extractBranchWeights?

paulkirth: The overload will just get the MD node again anyway before calling the other API, so I'd…

NewBr->setMetadata(LLVMContext::MD_prof, NewBr->setMetadata(LLVMContext::MD_prof,

MDBuilder(BB->getContext()). MDBuilder(BB->getContext())

createBranchWeights(SICase->getValue().getZExtValue(), .createBranchWeights(CaseWeight, DefWeight));

SIDef->getValue().getZExtValue()));

} }

// Update make.implicit metadata to the newly-created conditional branch. // Update make.implicit metadata to the newly-created conditional branch.

MDNode *MakeImplicitMD = SI->getMetadata(LLVMContext::MD_make_implicit); MDNode *MakeImplicitMD = SI->getMetadata(LLVMContext::MD_make_implicit);

if (MakeImplicitMD) if (MakeImplicitMD)

NewBr->setMetadata(LLVMContext::MD_make_implicit, MakeImplicitMD); NewBr->setMetadata(LLVMContext::MD_make_implicit, MakeImplicitMD);

// Delete the old switch. // Delete the old switch.

▲ Show 20 Lines • Show All 3,183 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[llvm][ir] Purge MD_prof custom accessors
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 488130

llvm/include/llvm/Analysis/CFGPrinter.h

llvm/include/llvm/IR/Instructions.h

llvm/include/llvm/IR/ProfDataUtils.h

llvm/lib/Analysis/BranchProbabilityInfo.cpp

llvm/lib/IR/Instruction.cpp

llvm/lib/IR/Instructions.cpp

llvm/lib/IR/Metadata.cpp

llvm/lib/IR/ProfDataUtils.cpp

llvm/lib/Transforms/IPO/PartialInlining.cpp

llvm/lib/Transforms/Instrumentation/ControlHeightReduction.cpp

llvm/lib/Transforms/Scalar/JumpThreading.cpp

llvm/lib/Transforms/Scalar/LoopPredication.cpp

llvm/lib/Transforms/Utils/Local.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[llvm][ir] Purge MD_prof custom accessorsClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 488130

llvm/include/llvm/Analysis/CFGPrinter.h

llvm/include/llvm/IR/Instructions.h

llvm/include/llvm/IR/ProfDataUtils.h

llvm/lib/Analysis/BranchProbabilityInfo.cpp

llvm/lib/IR/Instruction.cpp

llvm/lib/IR/Instructions.cpp

llvm/lib/IR/Metadata.cpp

llvm/lib/IR/ProfDataUtils.cpp

llvm/lib/Transforms/IPO/PartialInlining.cpp

llvm/lib/Transforms/Instrumentation/ControlHeightReduction.cpp

llvm/lib/Transforms/Scalar/JumpThreading.cpp

llvm/lib/Transforms/Scalar/LoopPredication.cpp

llvm/lib/Transforms/Utils/Local.cpp

[llvm][ir] Purge MD_prof custom accessors
ClosedPublic