This is an archive of the discontinued LLVM Phabricator instance.

Provide an interface normalizeSuccWeights in MachineBasicBlock to normalize its successors' weights and use it in other places.
ClosedPublic

Authored by congh on Jul 22 2015, 5:56 PM.

Details

Summary

The implementation of the new function is borrowed from MachineBranchProbabilityInfo::getSumForBlock. The type of the weight list is a template parameter so that we can pass weights as either uint32_t or uint64_t.

This function can be useful when we need to normalize a list of edge weights.
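
As a rough illustration only (not the exact code in the patch; the function name and scaling policy are assumptions), such a helper might look like this:

  #include <algorithm>
  #include <cstdint>

  template <typename WeightListTy>
  static void normalizeEdgeWeightsSketch(WeightListTy &Weights) {
    // Accumulate in 64 bits so that uint32_t inputs cannot overflow the sum.
    uint64_t Sum = 0;
    for (auto W : Weights)
      Sum += W;
    if (Sum <= UINT32_MAX)
      return; // The sum already fits in uint32_t; nothing to do.
    // Scale every weight down by the same factor so that the new sum fits.
    uint64_t Scale = Sum / UINT32_MAX + 1;
    for (auto &W : Weights)
      W = std::max<uint64_t>(W / Scale, 1); // Avoid producing zero weights.
  }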

Diff Detail

Event Timeline

congh updated this revision to Diff 30436.Jul 22 2015, 5:56 PM
congh retitled this revision from to Create a utility function normalizeEdgeWeights() in BranchProbabilityInfo that is used to normalize a list of weights so that the sum of them does not exceed UINT32_MAX..
congh updated this object.
congh added a reviewer: dexonsmith.
congh added subscribers: llvm-commits, davidxl.
davidxl added inline comments.Jul 23 2015, 12:30 PM
include/llvm/Analysis/BranchProbabilityInfo.h
165 ↗(On Diff #30436)

Why not do the normalization unconditionally, to avoid the precision loss introduced by incremental updates (for small weights)?

congh added inline comments.Jul 23 2015, 1:38 PM
include/llvm/Analysis/BranchProbabilityInfo.h
165 ↗(On Diff #30436)

The incremental update itself can deal with precision loss; this function can then be called to guarantee that the sum of weights won't exceed UINT32_MAX.

If we decide to normalize all edge weights by scaling up, we would need to call this normalization function every time we set or update an edge weight. Have we decided on this?

davidxl added inline comments.Jul 23 2015, 2:01 PM
include/llvm/Analysis/BranchProbabilityInfo.h
165 ↗(On Diff #30436)

You will need this for precision-preservation purposes, so this interface needs to take an extra argument that decides whether up-scaling should be done -- it can be off by default.

congh added inline comments.Jul 23 2015, 2:13 PM
include/llvm/Analysis/BranchProbabilityInfo.h
165 ↗(On Diff #30436)

OK. But I am wondering how to tell whether the returned scale is for scaling up or for scaling down. This is the difficult part...

congh updated this revision to Diff 30953.Jul 29 2015, 3:16 PM
congh retitled this revision from Create a utility function normalizeEdgeWeights() in BranchProbabilityInfo that is used to normalize a list of weights so that the sum of them does not exceed UINT32_MAX. to Provide an interface normalizeSuccWeights in MachineBasicBlock to normalize its successors' weights and use it in other places..
congh added a reviewer: chandlerc.

Several updates:

  1. Move normalizeEdgeWeights() from BranchProbabilityInfo to MachineBranchProbabilityInfo.
  2. Provide an interface in MachineBasicBlock to normalize its successors' weights (a rough sketch follows this list).
  3. Add a flag in MachineBasicBlock that tracks whether its successors' weights are normalized.
  4. Provide an overload of getSumForBlock that accepts a non-const pointer to an MBB so that it can force normalization of that MBB's successors' weights.
  5. Update several uses of getSumForBlock(), eliminating the previously needed weight scale.
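
A rough sketch of what items 2 and 3 might look like; the class shown here is a stand-in, not the real MachineBasicBlock, and the member names are assumptions:

  #include <cstdint>
  #include <vector>

  class MachineBasicBlockSketch {
    int Number = -1;                    // Block number.
    bool SuccWeightsNormalized = false; // Next to Number so it can reuse padding.
    std::vector<uint32_t> Weights;      // One weight per successor edge.

  public:
    // Scale all successor weights so that their sum fits in uint32_t, and
    // remember that this has been done so repeated calls are cheap. Real code
    // would clear the flag whenever a successor weight is added or changed.
    void normalizeSuccWeights() {
      if (SuccWeightsNormalized)
        return;
      uint64_t Sum = 0;
      for (uint32_t W : Weights)
        Sum += W;
      if (Sum > UINT32_MAX) {
        uint64_t Scale = Sum / UINT32_MAX + 1;
        for (uint32_t &W : Weights)
          W /= Scale;
      }
      SuccWeightsNormalized = true;
    }
  };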
davidxl added inline comments.Jul 29 2015, 3:24 PM
include/llvm/CodeGen/MachineBasicBlock.h
87

Put this field after the int Number field so that the padding space can be used (on 64-bit targets).
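
For context, a hedged illustration of the layout point (these are not the actual MachineBasicBlock fields; sizes assume a typical 64-bit ABI):

  struct BoolAtEnd {    // bool placed after a pointer member:
    void *Ptr;          // 8 bytes
    int Number;         // 4 bytes + 4 bytes padding
    void *Ptr2;         // 8 bytes
    bool Flag;          // 1 byte + 7 bytes padding  -> sizeof == 32
  };

  struct BoolAfterInt { // bool placed right after the int:
    void *Ptr;          // 8 bytes
    int Number;         // 4 bytes
    bool Flag;          // 1 byte + 3 bytes padding  -> sizeof == 24
    void *Ptr2;         // 8 bytes
  };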

congh marked an inline comment as done.Jul 29 2015, 3:28 PM
congh added inline comments.
include/llvm/CodeGen/MachineBasicBlock.h
87

OK. Updated.

congh updated this revision to Diff 30958.Jul 29 2015, 3:29 PM
congh marked an inline comment as done.

Reduce the size of MachineBasicBlock by relocating SuccWeightsNormalized, which is a boolean.

In general, I find doing normalization like this error prone. Once the weights get normalized, a new weight added later may become meaningless, and there is no good way to check against it.

I suggest using this opportunity to make the edge weight a fixed-point representation of the branch probability (aka a scaled probability). We can pick a large scale factor such as 100000. It has the nice property that the sum of all 'weights' is guaranteed to always be '100000'. Another nice side effect is that the computation of getEdgeProbability becomes super fast -- there is no need to keep the getSumWeight interface any more.

The addSuccessor interface will also need to be modified so that instead of passing a raw 'weight', it passes in BranchProbability(N,M).

In the longer term, we should remove uses of the getEdgeWeight interface completely and replace them with getEdgeProbability instead (as it is already efficient). Weight will simply be an implementation detail that does not need to be exposed to users.
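
For illustration only, a minimal sketch of the scaled-probability idea; the class and method names are hypothetical, and a real implementation would have to fix up rounding so the entries keep summing to the scale factor:

  #include <cassert>
  #include <cstdint>
  #include <vector>

  class ScaledSuccProbs {
    static constexpr uint32_t Scale = 100000; // Fixed denominator for all edges.
    std::vector<uint32_t> Probs;              // Each entry is probability * Scale.

  public:
    // addSuccessor-style update: the new edge takes N/M of the block's
    // probability mass and existing edges shrink proportionally, so the total
    // stays near Scale (assuming the first successor is added with N == M).
    void addSuccessor(uint32_t N, uint32_t M) {
      assert(M != 0 && N <= M && "probability must lie in [0, 1]");
      uint64_t NewProb = (uint64_t)Scale * N / M;
      for (uint32_t &P : Probs)
        P = (uint64_t)P * (Scale - NewProb) / Scale;
      Probs.push_back((uint32_t)NewProb);
    }

    // getEdgeProbability becomes a constant-time read: no sum over successors.
    double getEdgeProbability(unsigned SuccIdx) const {
      return (double)Probs[SuccIdx] / Scale;
    }
  };

For example, adding the first successor with probability 1/1 and a second with probability 1/2 leaves both entries at 50000, i.e. a 50%/50% split, without ever computing a sum of weights.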

lib/CodeGen/IfConversion.cpp
1245

Why not move this before getEdgeWeight so that the explicit call to normalize the weights is not needed?

> In general, I find doing normalization like this error prone. Once the weights get normalized, a new weight added later may become meaningless, and there is no good way to check against it.

Yes, but this depends on when the normalization is applied. If the user calls it explicitly, they should be aware that the edge weights have already been changed, so the newly added one needs to be adjusted accordingly. Otherwise, the user still needs to check the current normalized weights to determine the new successor's weight (how else would one assign a weight to a new successor?). But this design can still lead to potential errors.

> I suggest using this opportunity to make the edge weight a fixed-point representation of the branch probability (aka a scaled probability). We can pick a large scale factor such as 100000. It has the nice property that the sum of all 'weights' is guaranteed to always be '100000'. Another nice side effect is that the computation of getEdgeProbability becomes super fast -- there is no need to keep the getSumWeight interface any more.

I agree with this design: the only use of weights is to compute edge probabilities. We should adjust the edge "weight" in terms of probabilities instead of absolute weights. This is a more flexible representation.

> The addSuccessor interface will also need to be modified so that instead of passing a raw 'weight', it passes in BranchProbability(N,M).

So the probabilities of old successors can be adjusted accordingly.

> In the longer term, we should remove uses of the getEdgeWeight interface completely and replace them with getEdgeProbability instead (as it is already efficient). Weight will simply be an implementation detail that does not need to be exposed to users.

congh added inline comments.Jul 30 2015, 10:57 AM
lib/CodeGen/IfConversion.cpp
1245

This is to state explicitly that we should normalize the edge weights and then get them. I am afraid that if we simply put getSumForBlock() before getEdgeWeight(), someone who is not aware that getSumForBlock() normalizes the weights might swap them later by mistake.

This revision was automatically updated to reflect the committed changes.
congh updated this revision to Diff 31882.Aug 11 2015, 4:43 PM
congh removed rL LLVM as the repository for this revision.

Update the patch by turning zero edge weights into one in BPI so that we no longer get zero weights from BPI.

davidxl added inline comments.Aug 20 2015, 12:27 PM
test/Transforms/SampleProfile/branch.ll
41

BFI always ignores zero weights, which leads to inconsistency (before this fix, BPI did not ignore zero weights; only BFI did).

If the test case really intends to test a highly biased branch here, I think it should be modified to not use a zero weight after this fix (since a zero weight will now be completely ignored). Changing the results to 50% may violate what the test intends.

congh added inline comments.Aug 20 2015, 2:56 PM
test/Transforms/SampleProfile/branch.ll
41

I did an investigation on this. The weights 0 and 1 are not specified in this test case but are read from a sample profile file, in which most lines have zero weights except for two lines with large weights. Where does the 1 come from? When a zero weight is read from the sample profile, it is converted to 1 (see include/llvm/ProfileData/SampleProf.h:175). The comment there says that the weight is set to 0 if the profile data is missing. If the profile data exists but the number of samples is zero, the weight is converted to 1 to differentiate the two cases. However, this can result in two edges from the same block having weights 0 and 1 (0 for a missing profile and 1 for zero samples): how should we interpret them? I think converting 0 to 1 in BPI is a good idea for this case. For the original test case, the probabilities 0% and 100% are quite wrong; the 50%/50% split in the updated test case is more reasonable.
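
A hedged paraphrase of the behavior described above (this is not the actual SampleProf.h code, and the function name is made up):

  #include <cstdint>

  // Weight 0 means "no profile data for this line"; a line that has profile
  // data but zero samples is bumped to 1 so the two cases stay distinguishable.
  static uint32_t lineWeightFromSamples(bool HasProfileData, uint64_t NumSamples) {
    if (!HasProfileData)
      return 0;
    if (NumSamples == 0)
      return 1;
    return NumSamples > UINT32_MAX ? UINT32_MAX : (uint32_t)NumSamples;
  }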

davidxl added inline comments.Aug 21 2015, 3:13 PM
test/Transforms/SampleProfile/branch.ll
41

In AutoFDO, lines with generated instructions but without any samples are annotated with 0 counts -- they should not actually be converted to 1, as 0 counts are a strong signal of coldness.

On the other hand, lines that do not have any associated instructions (due to CSE, PRE, IVOPT, etc.) do not have any counts either, but they should not be marked with 0 counts and should be handled specially. It seems the current implementation tries to overload the zero weight again to represent this state, which is wrong because the zero weight does not do what it thinks it does.

At this point, I think this test does not matter that much (Dehao and Diego are working to overhaul SampleFDO support anyway) -- so I am OK with this change.

Duncan, WDYT?